diff --git "a/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" "b/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" --- "a/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" +++ "b/wandb/run-20220318_085757-9419yrth/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 0.5145, "train/learning_rate": 7.6270783847981e-05, "train/epoch": 5.61, "train/global_step": 5000, "_runtime": 31656, "_timestamp": 1647625533, "_step": 5001, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 9.0, 12.0, 13.0, 34.0, 81.0, 154.0, 297.0, 204.0, 101.0, 50.0, 29.0, 9.0, 6.0, 9.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.6256103515625, -130.96363830566406, -127.30166625976562, -123.63969421386719, -119.97772216796875, -116.31575012207031, -112.65377807617188, -108.99180603027344, -105.329833984375, -101.66786193847656, -98.00588989257812, -94.34391784667969, -90.68194580078125, -87.01997375488281, -83.35800170898438, -79.69602966308594, -76.0340576171875, -72.37208557128906, -68.71011352539062, -65.04814147949219, -61.38616943359375, -57.72419738769531, -54.062225341796875, -50.40025329589844, -46.73828887939453, -43.076316833496094, -39.414344787597656, -35.75237274169922, -32.09040069580078, -28.428430557250977, -24.76645851135254, -21.1044864654541, -17.44251251220703, -13.780540466308594, -10.118568420410156, -6.456597328186035, -2.7946252822875977, 0.8673458099365234, 4.529317855834961, 8.191289901733398, 11.853261947631836, 15.515233993530273, 19.17720603942871, 22.839176177978516, 26.501148223876953, 30.16312026977539, 33.82509231567383, 37.487064361572266, 41.1490364074707, 44.81100845336914, 48.47298049926758, 52.134952545166016, 55.79692459106445, 59.458892822265625, 63.12086486816406, 66.7828369140625, 70.44480895996094, 74.10678100585938, 77.76875305175781, 81.43072509765625, 85.09269714355469, 88.75466918945312, 92.41664123535156, 96.07861328125, 99.74058532714844]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 3.0, 4.0, 9.0, 5.0, 12.0, 17.0, 16.0, 13.0, 28.0, 32.0, 31.0, 46.0, 40.0, 37.0, 42.0, 61.0, 44.0, 63.0, 88.0, 54.0, 42.0, 38.0, 39.0, 34.0, 41.0, 29.0, 24.0, 23.0, 16.0, 17.0, 8.0, 8.0, 7.0, 9.0, 6.0, 5.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-134.67343139648438, -130.7504425048828, -126.82745361328125, -122.90446472167969, -118.98147583007812, -115.05848693847656, -111.135498046875, -107.21250915527344, -103.28952026367188, -99.36653137207031, -95.44354248046875, -91.52055358886719, -87.59756469726562, -83.67457580566406, -79.7515869140625, -75.82859802246094, -71.9056167602539, -67.98262786865234, -64.05963897705078, -60.13665008544922, -56.213661193847656, -52.290672302246094, -48.3676872253418, -44.444698333740234, -40.52170944213867, -36.59872055053711, -32.67573165893555, -28.752744674682617, -24.829755783081055, -20.906766891479492, -16.983779907226562, -13.060791015625, -9.137809753417969, -5.2148213386535645, -1.2918329238891602, 2.631155014038086, 6.554143905639648, 10.477132797241211, 14.40011978149414, 18.323108673095703, 22.246097564697266, 26.169086456298828, 30.09207534790039, 34.01506042480469, 37.93804931640625, 41.86103820800781, 45.784027099609375, 49.70701599121094, 53.6300048828125, 57.55299377441406, 61.475982666015625, 65.39897155761719, 69.32196044921875, 73.24494934082031, 77.16793823242188, 81.09092712402344, 85.013916015625, 88.93690490722656, 92.85989379882812, 96.78288269042969, 100.70587158203125, 104.62886047363281, 108.55184936523438, 112.47483825683594, 116.39781951904297]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 11.0, 5.0, 9.0, 11.0, 14.0, 7.0, 20.0, 18.0, 34.0, 33.0, 36.0, 42.0, 29.0, 52.0, 54.0, 70.0, 51.0, 68.0, 63.0, 47.0, 58.0, 42.0, 37.0, 25.0, 29.0, 26.0, 18.0, 22.0, 14.0, 13.0, 10.0, 2.0, 6.0, 6.0, 5.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.529296875, -3.425628662109375, -3.32196044921875, -3.218292236328125, -3.1146240234375, -3.010955810546875, -2.90728759765625, -2.803619384765625, -2.699951171875, -2.596282958984375, -2.49261474609375, -2.388946533203125, -2.2852783203125, -2.181610107421875, -2.07794189453125, -1.974273681640625, -1.87060546875, -1.766937255859375, -1.66326904296875, -1.559600830078125, -1.4559326171875, -1.352264404296875, -1.24859619140625, -1.144927978515625, -1.041259765625, -0.937591552734375, -0.83392333984375, -0.730255126953125, -0.6265869140625, -0.522918701171875, -0.41925048828125, -0.315582275390625, -0.2119140625, -0.108245849609375, -0.00457763671875, 0.099090576171875, 0.2027587890625, 0.306427001953125, 0.41009521484375, 0.513763427734375, 0.617431640625, 0.721099853515625, 0.82476806640625, 0.928436279296875, 1.0321044921875, 1.135772705078125, 1.23944091796875, 1.343109130859375, 1.44677734375, 1.550445556640625, 1.65411376953125, 1.757781982421875, 1.8614501953125, 1.965118408203125, 2.06878662109375, 2.172454833984375, 2.276123046875, 2.379791259765625, 2.48345947265625, 2.587127685546875, 2.6907958984375, 2.794464111328125, 2.89813232421875, 3.001800537109375, 3.10546875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 8.0, 4.0, 9.0, 8.0, 18.0, 18.0, 23.0, 23.0, 34.0, 49.0, 89.0, 110.0, 179.0, 246.0, 370.0, 528.0, 841.0, 1371.0, 2516.0, 4512.0, 9200.0, 21314.0, 62283.0, 1164393.0, 2802842.0, 75340.0, 24402.0, 10775.0, 5321.0, 2896.0, 1649.0, 974.0, 631.0, 401.0, 260.0, 205.0, 112.0, 88.0, 69.0, 46.0, 40.0, 18.0, 27.0, 12.0, 12.0, 5.0, 8.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.40625, -24.68212890625, -23.9580078125, -23.23388671875, -22.509765625, -21.78564453125, -21.0615234375, -20.33740234375, -19.61328125, -18.88916015625, -18.1650390625, -17.44091796875, -16.716796875, -15.99267578125, -15.2685546875, -14.54443359375, -13.8203125, -13.09619140625, -12.3720703125, -11.64794921875, -10.923828125, -10.19970703125, -9.4755859375, -8.75146484375, -8.02734375, -7.30322265625, -6.5791015625, -5.85498046875, -5.130859375, -4.40673828125, -3.6826171875, -2.95849609375, -2.234375, -1.51025390625, -0.7861328125, -0.06201171875, 0.662109375, 1.38623046875, 2.1103515625, 2.83447265625, 3.55859375, 4.28271484375, 5.0068359375, 5.73095703125, 6.455078125, 7.17919921875, 7.9033203125, 8.62744140625, 9.3515625, 10.07568359375, 10.7998046875, 11.52392578125, 12.248046875, 12.97216796875, 13.6962890625, 14.42041015625, 15.14453125, 15.86865234375, 16.5927734375, 17.31689453125, 18.041015625, 18.76513671875, 19.4892578125, 20.21337890625, 20.9375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 12.0, 18.0, 18.0, 27.0, 17.0, 31.0, 35.0, 40.0, 57.0, 103.0, 149.0, 209.0, 400.0, 693.0, 834.0, 520.0, 279.0, 149.0, 115.0, 72.0, 61.0, 34.0, 38.0, 29.0, 20.0, 23.0, 16.0, 15.0, 8.0, 7.0, 11.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.25, -13.8336181640625, -13.417236328125, -13.0008544921875, -12.58447265625, -12.1680908203125, -11.751708984375, -11.3353271484375, -10.9189453125, -10.5025634765625, -10.086181640625, -9.6697998046875, -9.25341796875, -8.8370361328125, -8.420654296875, -8.0042724609375, -7.587890625, -7.1715087890625, -6.755126953125, -6.3387451171875, -5.92236328125, -5.5059814453125, -5.089599609375, -4.6732177734375, -4.2568359375, -3.8404541015625, -3.424072265625, -3.0076904296875, -2.59130859375, -2.1749267578125, -1.758544921875, -1.3421630859375, -0.92578125, -0.5093994140625, -0.093017578125, 0.3233642578125, 0.73974609375, 1.1561279296875, 1.572509765625, 1.9888916015625, 2.4052734375, 2.8216552734375, 3.238037109375, 3.6544189453125, 4.07080078125, 4.4871826171875, 4.903564453125, 5.3199462890625, 5.736328125, 6.1527099609375, 6.569091796875, 6.9854736328125, 7.40185546875, 7.8182373046875, 8.234619140625, 8.6510009765625, 9.0673828125, 9.4837646484375, 9.900146484375, 10.3165283203125, 10.73291015625, 11.1492919921875, 11.565673828125, 11.9820556640625, 12.3984375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 9.0, 5.0, 6.0, 14.0, 13.0, 23.0, 29.0, 40.0, 60.0, 63.0, 98.0, 144.0, 207.0, 370.0, 764.0, 2016.0, 6092.0, 24410.0, 165253.0, 3648778.0, 299772.0, 33649.0, 7830.0, 2491.0, 926.0, 425.0, 244.0, 147.0, 114.0, 76.0, 51.0, 51.0, 26.0, 21.0, 15.0, 10.0, 10.0, 11.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-45.65625, -44.29736328125, -42.9384765625, -41.57958984375, -40.220703125, -38.86181640625, -37.5029296875, -36.14404296875, -34.78515625, -33.42626953125, -32.0673828125, -30.70849609375, -29.349609375, -27.99072265625, -26.6318359375, -25.27294921875, -23.9140625, -22.55517578125, -21.1962890625, -19.83740234375, -18.478515625, -17.11962890625, -15.7607421875, -14.40185546875, -13.04296875, -11.68408203125, -10.3251953125, -8.96630859375, -7.607421875, -6.24853515625, -4.8896484375, -3.53076171875, -2.171875, -0.81298828125, 0.5458984375, 1.90478515625, 3.263671875, 4.62255859375, 5.9814453125, 7.34033203125, 8.69921875, 10.05810546875, 11.4169921875, 12.77587890625, 14.134765625, 15.49365234375, 16.8525390625, 18.21142578125, 19.5703125, 20.92919921875, 22.2880859375, 23.64697265625, 25.005859375, 26.36474609375, 27.7236328125, 29.08251953125, 30.44140625, 31.80029296875, 33.1591796875, 34.51806640625, 35.876953125, 37.23583984375, 38.5947265625, 39.95361328125, 41.3125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 11.0, 24.0, 41.0, 95.0, 226.0, 310.0, 174.0, 62.0, 37.0, 18.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.96576499938965, -25.505510330200195, -22.045255661010742, -18.584999084472656, -15.12474536895752, -11.66448974609375, -8.204235076904297, -4.743980407714844, -1.2837257385253906, 2.1765291690826416, 5.636784076690674, 9.097039222717285, 12.557293891906738, 16.017549514770508, 19.47780418395996, 22.938058853149414, 26.398313522338867, 29.85856819152832, 33.318824768066406, 36.77907943725586, 40.23933410644531, 43.699588775634766, 47.15984344482422, 50.62009811401367, 54.080352783203125, 57.54060745239258, 61.00086212158203, 64.46112060546875, 67.92137145996094, 71.38162994384766, 74.84188079833984, 78.30213928222656, 81.76239776611328, 85.22265625, 88.68290710449219, 92.1431655883789, 95.6034164428711, 99.06367492675781, 102.52392578125, 105.98418426513672, 109.4444351196289, 112.90469360351562, 116.36494445800781, 119.82520294189453, 123.28545379638672, 126.74571228027344, 130.20596313476562, 133.6662139892578, 137.12648010253906, 140.58673095703125, 144.0469970703125, 147.5072479248047, 150.96749877929688, 154.42774963378906, 157.8880157470703, 161.3482666015625, 164.8085174560547, 168.26876831054688, 171.72903442382812, 175.1892852783203, 178.6495361328125, 182.1097869873047, 185.57005310058594, 189.03030395507812, 192.4905548095703]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 2.0, 4.0, 4.0, 5.0, 10.0, 12.0, 17.0, 15.0, 16.0, 18.0, 23.0, 18.0, 26.0, 33.0, 29.0, 35.0, 38.0, 40.0, 35.0, 47.0, 34.0, 48.0, 36.0, 40.0, 48.0, 33.0, 42.0, 21.0, 28.0, 43.0, 28.0, 31.0, 27.0, 18.0, 13.0, 11.0, 15.0, 14.0, 7.0, 7.0, 7.0, 6.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-43.81364059448242, -42.432498931884766, -41.051353454589844, -39.67021179199219, -38.28907012939453, -36.907928466796875, -35.52678298950195, -34.1456413269043, -32.764495849609375, -31.383352279663086, -30.00221061706543, -28.62106704711914, -27.239925384521484, -25.858781814575195, -24.477638244628906, -23.09649658203125, -21.715354919433594, -20.334211349487305, -18.95306968688965, -17.57192611694336, -16.190784454345703, -14.809640884399414, -13.428497314453125, -12.047354698181152, -10.66621208190918, -9.285069465637207, -7.903926372528076, -6.522783279418945, -5.141640663146973, -3.760498046875, -2.379354476928711, -0.9982118606567383, 0.3829307556152344, 1.7640736103057861, 3.145216464996338, 4.526359558105469, 5.907502174377441, 7.288644790649414, 8.669788360595703, 10.050930976867676, 11.432073593139648, 12.813216209411621, 14.194358825683594, 15.575502395629883, 16.956645965576172, 18.337787628173828, 19.718931198120117, 21.100074768066406, 22.481216430664062, 23.86236000061035, 25.243501663208008, 26.624645233154297, 28.005786895751953, 29.386930465698242, 30.76807403564453, 32.14921569824219, 33.530357360839844, 34.9114990234375, 36.29264450073242, 37.67378616333008, 39.054927825927734, 40.436073303222656, 41.81721496582031, 43.19835662841797, 44.57950210571289]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 7.0, 7.0, 9.0, 13.0, 7.0, 19.0, 24.0, 21.0, 31.0, 30.0, 45.0, 36.0, 33.0, 60.0, 69.0, 53.0, 60.0, 71.0, 55.0, 44.0, 54.0, 57.0, 28.0, 20.0, 21.0, 25.0, 19.0, 22.0, 9.0, 9.0, 10.0, 5.0, 6.0, 8.0, 7.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.8203125, -3.709442138671875, -3.59857177734375, -3.487701416015625, -3.3768310546875, -3.265960693359375, -3.15509033203125, -3.044219970703125, -2.933349609375, -2.822479248046875, -2.71160888671875, -2.600738525390625, -2.4898681640625, -2.378997802734375, -2.26812744140625, -2.157257080078125, -2.04638671875, -1.935516357421875, -1.82464599609375, -1.713775634765625, -1.6029052734375, -1.492034912109375, -1.38116455078125, -1.270294189453125, -1.159423828125, -1.048553466796875, -0.93768310546875, -0.826812744140625, -0.7159423828125, -0.605072021484375, -0.49420166015625, -0.383331298828125, -0.2724609375, -0.161590576171875, -0.05072021484375, 0.060150146484375, 0.1710205078125, 0.281890869140625, 0.39276123046875, 0.503631591796875, 0.614501953125, 0.725372314453125, 0.83624267578125, 0.947113037109375, 1.0579833984375, 1.168853759765625, 1.27972412109375, 1.390594482421875, 1.50146484375, 1.612335205078125, 1.72320556640625, 1.834075927734375, 1.9449462890625, 2.055816650390625, 2.16668701171875, 2.277557373046875, 2.388427734375, 2.499298095703125, 2.61016845703125, 2.721038818359375, 2.8319091796875, 2.942779541015625, 3.05364990234375, 3.164520263671875, 3.275390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 16.0, 19.0, 25.0, 53.0, 91.0, 131.0, 259.0, 357.0, 655.0, 965.0, 1704.0, 2910.0, 4806.0, 8137.0, 14190.0, 25990.0, 51845.0, 121291.0, 319349.0, 285994.0, 106975.0, 46857.0, 23892.0, 13246.0, 7554.0, 4501.0, 2704.0, 1512.0, 961.0, 641.0, 355.0, 221.0, 140.0, 94.0, 40.0, 22.0, 18.0, 12.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9765625, -2.880340576171875, -2.78411865234375, -2.687896728515625, -2.5916748046875, -2.495452880859375, -2.39923095703125, -2.303009033203125, -2.206787109375, -2.110565185546875, -2.01434326171875, -1.918121337890625, -1.8218994140625, -1.725677490234375, -1.62945556640625, -1.533233642578125, -1.43701171875, -1.340789794921875, -1.24456787109375, -1.148345947265625, -1.0521240234375, -0.955902099609375, -0.85968017578125, -0.763458251953125, -0.667236328125, -0.571014404296875, -0.47479248046875, -0.378570556640625, -0.2823486328125, -0.186126708984375, -0.08990478515625, 0.006317138671875, 0.1025390625, 0.198760986328125, 0.29498291015625, 0.391204833984375, 0.4874267578125, 0.583648681640625, 0.67987060546875, 0.776092529296875, 0.872314453125, 0.968536376953125, 1.06475830078125, 1.160980224609375, 1.2572021484375, 1.353424072265625, 1.44964599609375, 1.545867919921875, 1.64208984375, 1.738311767578125, 1.83453369140625, 1.930755615234375, 2.0269775390625, 2.123199462890625, 2.21942138671875, 2.315643310546875, 2.411865234375, 2.508087158203125, 2.60430908203125, 2.700531005859375, 2.7967529296875, 2.892974853515625, 2.98919677734375, 3.085418701171875, 3.181640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 10.0, 8.0, 10.0, 14.0, 11.0, 17.0, 21.0, 17.0, 24.0, 26.0, 25.0, 31.0, 39.0, 32.0, 26.0, 40.0, 37.0, 46.0, 1065.0, 42.0, 39.0, 40.0, 39.0, 33.0, 34.0, 40.0, 28.0, 22.0, 31.0, 28.0, 26.0, 17.0, 14.0, 12.0, 15.0, 12.0, 13.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0], "bins": [-3.55078125, -3.448822021484375, -3.34686279296875, -3.244903564453125, -3.1429443359375, -3.040985107421875, -2.93902587890625, -2.837066650390625, -2.735107421875, -2.633148193359375, -2.53118896484375, -2.429229736328125, -2.3272705078125, -2.225311279296875, -2.12335205078125, -2.021392822265625, -1.91943359375, -1.817474365234375, -1.71551513671875, -1.613555908203125, -1.5115966796875, -1.409637451171875, -1.30767822265625, -1.205718994140625, -1.103759765625, -1.001800537109375, -0.89984130859375, -0.797882080078125, -0.6959228515625, -0.593963623046875, -0.49200439453125, -0.390045166015625, -0.2880859375, -0.186126708984375, -0.08416748046875, 0.017791748046875, 0.1197509765625, 0.221710205078125, 0.32366943359375, 0.425628662109375, 0.527587890625, 0.629547119140625, 0.73150634765625, 0.833465576171875, 0.9354248046875, 1.037384033203125, 1.13934326171875, 1.241302490234375, 1.34326171875, 1.445220947265625, 1.54718017578125, 1.649139404296875, 1.7510986328125, 1.853057861328125, 1.95501708984375, 2.056976318359375, 2.158935546875, 2.260894775390625, 2.36285400390625, 2.464813232421875, 2.5667724609375, 2.668731689453125, 2.77069091796875, 2.872650146484375, 2.974609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 8.0, 5.0, 11.0, 15.0, 16.0, 23.0, 38.0, 54.0, 66.0, 110.0, 148.0, 215.0, 289.0, 384.0, 690.0, 1031.0, 1695.0, 3008.0, 5950.0, 13588.0, 37723.0, 152734.0, 1286331.0, 465231.0, 82841.0, 24399.0, 9757.0, 4465.0, 2402.0, 1344.0, 792.0, 558.0, 357.0, 265.0, 179.0, 103.0, 84.0, 55.0, 57.0, 28.0, 30.0, 17.0, 16.0, 7.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-2.771484375, -2.689483642578125, -2.60748291015625, -2.525482177734375, -2.4434814453125, -2.361480712890625, -2.27947998046875, -2.197479248046875, -2.115478515625, -2.033477783203125, -1.95147705078125, -1.869476318359375, -1.7874755859375, -1.705474853515625, -1.62347412109375, -1.541473388671875, -1.45947265625, -1.377471923828125, -1.29547119140625, -1.213470458984375, -1.1314697265625, -1.049468994140625, -0.96746826171875, -0.885467529296875, -0.803466796875, -0.721466064453125, -0.63946533203125, -0.557464599609375, -0.4754638671875, -0.393463134765625, -0.31146240234375, -0.229461669921875, -0.1474609375, -0.065460205078125, 0.01654052734375, 0.098541259765625, 0.1805419921875, 0.262542724609375, 0.34454345703125, 0.426544189453125, 0.508544921875, 0.590545654296875, 0.67254638671875, 0.754547119140625, 0.8365478515625, 0.918548583984375, 1.00054931640625, 1.082550048828125, 1.16455078125, 1.246551513671875, 1.32855224609375, 1.410552978515625, 1.4925537109375, 1.574554443359375, 1.65655517578125, 1.738555908203125, 1.820556640625, 1.902557373046875, 1.98455810546875, 2.066558837890625, 2.1485595703125, 2.230560302734375, 2.31256103515625, 2.394561767578125, 2.4765625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 14.0, 11.0, 5.0, 25.0, 54.0, 73.0, 314.0, 300.0, 75.0, 44.0, 23.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3203125, -2.24542236328125, -2.1705322265625, -2.09564208984375, -2.020751953125, -1.94586181640625, -1.8709716796875, -1.79608154296875, -1.72119140625, -1.64630126953125, -1.5714111328125, -1.49652099609375, -1.421630859375, -1.34674072265625, -1.2718505859375, -1.19696044921875, -1.1220703125, -1.04718017578125, -0.9722900390625, -0.89739990234375, -0.822509765625, -0.74761962890625, -0.6727294921875, -0.59783935546875, -0.52294921875, -0.44805908203125, -0.3731689453125, -0.29827880859375, -0.223388671875, -0.14849853515625, -0.0736083984375, 0.00128173828125, 0.076171875, 0.15106201171875, 0.2259521484375, 0.30084228515625, 0.375732421875, 0.45062255859375, 0.5255126953125, 0.60040283203125, 0.67529296875, 0.75018310546875, 0.8250732421875, 0.89996337890625, 0.974853515625, 1.04974365234375, 1.1246337890625, 1.19952392578125, 1.2744140625, 1.34930419921875, 1.4241943359375, 1.49908447265625, 1.573974609375, 1.64886474609375, 1.7237548828125, 1.79864501953125, 1.87353515625, 1.94842529296875, 2.0233154296875, 2.09820556640625, 2.173095703125, 2.24798583984375, 2.3228759765625, 2.39776611328125, 2.47265625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 7.0, 6.0, 9.0, 10.0, 17.0, 18.0, 39.0, 44.0, 62.0, 198.0, 2453.0, 1019026.0, 25621.0, 675.0, 116.0, 49.0, 38.0, 31.0, 15.0, 16.0, 11.0, 9.0, 7.0, 7.0, 6.0, 6.0, 5.0, 0.0, 7.0, 5.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.1875, -41.78515625, -40.3828125, -38.98046875, -37.578125, -36.17578125, -34.7734375, -33.37109375, -31.96875, -30.56640625, -29.1640625, -27.76171875, -26.359375, -24.95703125, -23.5546875, -22.15234375, -20.75, -19.34765625, -17.9453125, -16.54296875, -15.140625, -13.73828125, -12.3359375, -10.93359375, -9.53125, -8.12890625, -6.7265625, -5.32421875, -3.921875, -2.51953125, -1.1171875, 0.28515625, 1.6875, 3.08984375, 4.4921875, 5.89453125, 7.296875, 8.69921875, 10.1015625, 11.50390625, 12.90625, 14.30859375, 15.7109375, 17.11328125, 18.515625, 19.91796875, 21.3203125, 22.72265625, 24.125, 25.52734375, 26.9296875, 28.33203125, 29.734375, 31.13671875, 32.5390625, 33.94140625, 35.34375, 36.74609375, 38.1484375, 39.55078125, 40.953125, 42.35546875, 43.7578125, 45.16015625, 46.5625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 8.0, 29.0, 79.0, 305.0, 434.0, 114.0, 23.0, 11.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.780243873596191, -11.50096607208252, -11.221687316894531, -10.94240951538086, -10.663131713867188, -10.3838529586792, -10.104575157165527, -9.825297355651855, -9.546018600463867, -9.266740798950195, -8.987462043762207, -8.708184242248535, -8.428906440734863, -8.149627685546875, -7.870349884033203, -7.591071605682373, -7.311793804168701, -7.032515525817871, -6.753237724304199, -6.473959445953369, -6.194681167602539, -5.915403366088867, -5.636125087738037, -5.356846809387207, -5.077569007873535, -4.798290729522705, -4.519012928009033, -4.239734649658203, -3.960456371307373, -3.681178331375122, -3.401900291442871, -3.122622013092041, -2.8433432579040527, -2.5640652179718018, -2.2847869396209717, -2.0055088996887207, -1.7262307405471802, -1.4469525814056396, -1.1676745414733887, -0.8883963823318481, -0.6091182231903076, -0.3298400938510895, -0.05056196451187134, 0.22871613502502441, 0.5079942941665649, 0.7872724533081055, 1.0665504932403564, 1.345828652381897, 1.6251068115234375, 1.904384970664978, 2.1836631298065186, 2.4629411697387695, 2.7422194480895996, 3.0214974880218506, 3.3007755279541016, 3.5800538063049316, 3.8593318462371826, 4.138609886169434, 4.417888164520264, 4.697166442871094, 4.976444244384766, 5.255722522735596, 5.535000801086426, 5.814278602600098, 6.093556880950928]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 7.0, 3.0, 7.0, 5.0, 7.0, 13.0, 13.0, 14.0, 23.0, 22.0, 24.0, 22.0, 24.0, 32.0, 32.0, 31.0, 35.0, 48.0, 36.0, 38.0, 39.0, 40.0, 44.0, 45.0, 45.0, 30.0, 34.0, 28.0, 29.0, 29.0, 16.0, 29.0, 20.0, 17.0, 24.0, 23.0, 16.0, 8.0, 9.0, 6.0, 4.0, 6.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.7098567485809326, -1.6552585363388062, -1.6006604433059692, -1.5460622310638428, -1.4914641380310059, -1.4368659257888794, -1.382267713546753, -1.327669620513916, -1.2730714082717896, -1.218473196029663, -1.1638751029968262, -1.1092768907546997, -1.0546786785125732, -1.0000805854797363, -0.9454823732376099, -0.8908842206001282, -0.8362860679626465, -0.7816879153251648, -0.7270897626876831, -0.6724915504455566, -0.617893397808075, -0.5632952451705933, -0.5086970329284668, -0.4540988802909851, -0.3995007276535034, -0.34490257501602173, -0.29030439257621765, -0.23570622503757477, -0.18110805749893188, -0.1265099048614502, -0.07191172242164612, -0.01731353998184204, 0.03728461265563965, 0.09188278019428253, 0.14648094773292542, 0.2010791152715683, 0.2556772828102112, 0.31027543544769287, 0.36487361788749695, 0.419471800327301, 0.4740699529647827, 0.5286681056022644, 0.5832662582397461, 0.6378644704818726, 0.6924626231193542, 0.7470607757568359, 0.8016589879989624, 0.8562571406364441, 0.9108552932739258, 0.9654534459114075, 1.0200515985488892, 1.0746498107910156, 1.1292479038238525, 1.183846116065979, 1.2384443283081055, 1.2930424213409424, 1.3476406335830688, 1.4022388458251953, 1.4568369388580322, 1.5114351511001587, 1.5660333633422852, 1.620631456375122, 1.6752296686172485, 1.729827880859375, 1.784425973892212]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 2.0, 6.0, 5.0, 8.0, 12.0, 13.0, 14.0, 27.0, 33.0, 35.0, 26.0, 45.0, 35.0, 42.0, 52.0, 60.0, 70.0, 68.0, 57.0, 56.0, 54.0, 50.0, 45.0, 34.0, 33.0, 16.0, 21.0, 13.0, 14.0, 9.0, 9.0, 9.0, 6.0, 10.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.04296875, -3.928314208984375, -3.81365966796875, -3.699005126953125, -3.5843505859375, -3.469696044921875, -3.35504150390625, -3.240386962890625, -3.125732421875, -3.011077880859375, -2.89642333984375, -2.781768798828125, -2.6671142578125, -2.552459716796875, -2.43780517578125, -2.323150634765625, -2.20849609375, -2.093841552734375, -1.97918701171875, -1.864532470703125, -1.7498779296875, -1.635223388671875, -1.52056884765625, -1.405914306640625, -1.291259765625, -1.176605224609375, -1.06195068359375, -0.947296142578125, -0.8326416015625, -0.717987060546875, -0.60333251953125, -0.488677978515625, -0.3740234375, -0.259368896484375, -0.14471435546875, -0.030059814453125, 0.0845947265625, 0.199249267578125, 0.31390380859375, 0.428558349609375, 0.543212890625, 0.657867431640625, 0.77252197265625, 0.887176513671875, 1.0018310546875, 1.116485595703125, 1.23114013671875, 1.345794677734375, 1.46044921875, 1.575103759765625, 1.68975830078125, 1.804412841796875, 1.9190673828125, 2.033721923828125, 2.14837646484375, 2.263031005859375, 2.377685546875, 2.492340087890625, 2.60699462890625, 2.721649169921875, 2.8363037109375, 2.950958251953125, 3.06561279296875, 3.180267333984375, 3.294921875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 5.0, 5.0, 12.0, 21.0, 28.0, 59.0, 83.0, 107.0, 197.0, 303.0, 456.0, 855.0, 1447.0, 2656.0, 5005.0, 10472.0, 24490.0, 70895.0, 308092.0, 459744.0, 104409.0, 32387.0, 13369.0, 6201.0, 3145.0, 1691.0, 974.0, 585.0, 296.0, 186.0, 122.0, 91.0, 56.0, 25.0, 34.0, 13.0, 13.0, 6.0, 9.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.7890625, -13.38525390625, -12.9814453125, -12.57763671875, -12.173828125, -11.77001953125, -11.3662109375, -10.96240234375, -10.55859375, -10.15478515625, -9.7509765625, -9.34716796875, -8.943359375, -8.53955078125, -8.1357421875, -7.73193359375, -7.328125, -6.92431640625, -6.5205078125, -6.11669921875, -5.712890625, -5.30908203125, -4.9052734375, -4.50146484375, -4.09765625, -3.69384765625, -3.2900390625, -2.88623046875, -2.482421875, -2.07861328125, -1.6748046875, -1.27099609375, -0.8671875, -0.46337890625, -0.0595703125, 0.34423828125, 0.748046875, 1.15185546875, 1.5556640625, 1.95947265625, 2.36328125, 2.76708984375, 3.1708984375, 3.57470703125, 3.978515625, 4.38232421875, 4.7861328125, 5.18994140625, 5.59375, 5.99755859375, 6.4013671875, 6.80517578125, 7.208984375, 7.61279296875, 8.0166015625, 8.42041015625, 8.82421875, 9.22802734375, 9.6318359375, 10.03564453125, 10.439453125, 10.84326171875, 11.2470703125, 11.65087890625, 12.0546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 10.0, 10.0, 15.0, 12.0, 15.0, 17.0, 16.0, 24.0, 23.0, 26.0, 58.0, 44.0, 55.0, 70.0, 111.0, 142.0, 240.0, 1320.0, 201.0, 135.0, 79.0, 81.0, 63.0, 40.0, 46.0, 38.0, 35.0, 23.0, 26.0, 17.0, 13.0, 13.0, 10.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0, -11.640380859375, -11.28076171875, -10.921142578125, -10.5615234375, -10.201904296875, -9.84228515625, -9.482666015625, -9.123046875, -8.763427734375, -8.40380859375, -8.044189453125, -7.6845703125, -7.324951171875, -6.96533203125, -6.605712890625, -6.24609375, -5.886474609375, -5.52685546875, -5.167236328125, -4.8076171875, -4.447998046875, -4.08837890625, -3.728759765625, -3.369140625, -3.009521484375, -2.64990234375, -2.290283203125, -1.9306640625, -1.571044921875, -1.21142578125, -0.851806640625, -0.4921875, -0.132568359375, 0.22705078125, 0.586669921875, 0.9462890625, 1.305908203125, 1.66552734375, 2.025146484375, 2.384765625, 2.744384765625, 3.10400390625, 3.463623046875, 3.8232421875, 4.182861328125, 4.54248046875, 4.902099609375, 5.26171875, 5.621337890625, 5.98095703125, 6.340576171875, 6.7001953125, 7.059814453125, 7.41943359375, 7.779052734375, 8.138671875, 8.498291015625, 8.85791015625, 9.217529296875, 9.5771484375, 9.936767578125, 10.29638671875, 10.656005859375, 11.015625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 9.0, 11.0, 6.0, 23.0, 23.0, 26.0, 46.0, 66.0, 98.0, 277.0, 1201.0, 13948.0, 1166593.0, 1943431.0, 17890.0, 1432.0, 307.0, 118.0, 44.0, 37.0, 24.0, 19.0, 14.0, 16.0, 10.0, 11.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.8125, -50.1953125, -48.578125, -46.9609375, -45.34375, -43.7265625, -42.109375, -40.4921875, -38.875, -37.2578125, -35.640625, -34.0234375, -32.40625, -30.7890625, -29.171875, -27.5546875, -25.9375, -24.3203125, -22.703125, -21.0859375, -19.46875, -17.8515625, -16.234375, -14.6171875, -13.0, -11.3828125, -9.765625, -8.1484375, -6.53125, -4.9140625, -3.296875, -1.6796875, -0.0625, 1.5546875, 3.171875, 4.7890625, 6.40625, 8.0234375, 9.640625, 11.2578125, 12.875, 14.4921875, 16.109375, 17.7265625, 19.34375, 20.9609375, 22.578125, 24.1953125, 25.8125, 27.4296875, 29.046875, 30.6640625, 32.28125, 33.8984375, 35.515625, 37.1328125, 38.75, 40.3671875, 41.984375, 43.6015625, 45.21875, 46.8359375, 48.453125, 50.0703125, 51.6875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [3.0, 11.0, 47.0, 234.0, 419.0, 234.0, 50.0, 17.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.466659545898438, -12.729753494262695, -8.992847442626953, -5.2559404373168945, -1.5190343856811523, 2.2178726196289062, 5.954778671264648, 9.69168472290039, 13.428590774536133, 17.165496826171875, 20.902402877807617, 24.63930892944336, 28.376216888427734, 32.113121032714844, 35.85002899169922, 39.586936950683594, 43.3238410949707, 47.06074905395508, 50.79765319824219, 54.53456115722656, 58.27146530151367, 62.00837326049805, 65.74527740478516, 69.48218536376953, 73.2190933227539, 76.95600128173828, 80.69290924072266, 84.4298095703125, 88.16671752929688, 91.90362548828125, 95.64053344726562, 99.37744140625, 103.11434173583984, 106.85124969482422, 110.5881576538086, 114.32505798339844, 118.06196594238281, 121.79887390136719, 125.53578186035156, 129.27268981933594, 133.0095977783203, 136.7465057373047, 140.48341369628906, 144.22032165527344, 147.9572296142578, 151.69412231445312, 155.4310302734375, 159.16793823242188, 162.90484619140625, 166.64175415039062, 170.378662109375, 174.11557006835938, 177.85247802734375, 181.58938598632812, 185.32627868652344, 189.0631866455078, 192.8000946044922, 196.53700256347656, 200.27391052246094, 204.0108184814453, 207.7477264404297, 211.484619140625, 215.22152709960938, 218.95843505859375, 222.69534301757812]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 4.0, 6.0, 7.0, 6.0, 6.0, 9.0, 18.0, 13.0, 16.0, 23.0, 21.0, 16.0, 19.0, 27.0, 26.0, 31.0, 35.0, 44.0, 38.0, 35.0, 42.0, 56.0, 41.0, 40.0, 41.0, 39.0, 38.0, 29.0, 29.0, 38.0, 28.0, 31.0, 15.0, 25.0, 19.0, 13.0, 13.0, 13.0, 14.0, 7.0, 7.0, 4.0, 3.0, 6.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.441776275634766, -30.3626708984375, -29.283565521240234, -28.20446014404297, -27.125354766845703, -26.046249389648438, -24.96714210510254, -23.888036727905273, -22.808931350708008, -21.729825973510742, -20.650720596313477, -19.57161521911621, -18.492507934570312, -17.413402557373047, -16.33429718017578, -15.255191802978516, -14.17608642578125, -13.096981048583984, -12.017875671386719, -10.938769340515137, -9.859663963317871, -8.780558586120605, -7.701452732086182, -6.622346878051758, -5.543241500854492, -4.464136123657227, -3.3850302696228027, -2.305924654006958, -1.2268190383911133, -0.14771366119384766, 0.9313921928405762, 2.010498046875, 3.0896034240722656, 4.168708801269531, 5.247814655303955, 6.326920509338379, 7.4060258865356445, 8.48513126373291, 9.564237594604492, 10.643342971801758, 11.722448348999023, 12.801553726196289, 13.880659103393555, 14.959765434265137, 16.03887176513672, 17.117977142333984, 18.19708251953125, 19.276187896728516, 20.35529327392578, 21.434398651123047, 22.513504028320312, 23.592609405517578, 24.671714782714844, 25.75082015991211, 26.829927444458008, 27.909032821655273, 28.98813819885254, 30.067243576049805, 31.14634895324707, 32.22545623779297, 33.304561614990234, 34.3836669921875, 35.462772369384766, 36.54187774658203, 37.6209831237793]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 9.0, 9.0, 15.0, 19.0, 18.0, 24.0, 27.0, 27.0, 41.0, 41.0, 40.0, 54.0, 46.0, 52.0, 49.0, 63.0, 72.0, 51.0, 47.0, 41.0, 41.0, 30.0, 31.0, 21.0, 30.0, 9.0, 18.0, 13.0, 12.0, 6.0, 8.0, 6.0, 6.0, 3.0, 7.0, 3.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.98828125, -3.87481689453125, -3.7613525390625, -3.64788818359375, -3.534423828125, -3.42095947265625, -3.3074951171875, -3.19403076171875, -3.08056640625, -2.96710205078125, -2.8536376953125, -2.74017333984375, -2.626708984375, -2.51324462890625, -2.3997802734375, -2.28631591796875, -2.1728515625, -2.05938720703125, -1.9459228515625, -1.83245849609375, -1.718994140625, -1.60552978515625, -1.4920654296875, -1.37860107421875, -1.26513671875, -1.15167236328125, -1.0382080078125, -0.92474365234375, -0.811279296875, -0.69781494140625, -0.5843505859375, -0.47088623046875, -0.357421875, -0.24395751953125, -0.1304931640625, -0.01702880859375, 0.096435546875, 0.20989990234375, 0.3233642578125, 0.43682861328125, 0.55029296875, 0.66375732421875, 0.7772216796875, 0.89068603515625, 1.004150390625, 1.11761474609375, 1.2310791015625, 1.34454345703125, 1.4580078125, 1.57147216796875, 1.6849365234375, 1.79840087890625, 1.911865234375, 2.02532958984375, 2.1387939453125, 2.25225830078125, 2.36572265625, 2.47918701171875, 2.5926513671875, 2.70611572265625, 2.819580078125, 2.93304443359375, 3.0465087890625, 3.15997314453125, 3.2734375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 14.0, 11.0, 23.0, 29.0, 39.0, 39.0, 50.0, 71.0, 142.0, 204.0, 366.0, 698.0, 1675.0, 3989.0, 11958.0, 46327.0, 2741077.0, 1330302.0, 38408.0, 10987.0, 4145.0, 1767.0, 847.0, 432.0, 213.0, 146.0, 90.0, 67.0, 40.0, 25.0, 16.0, 20.0, 11.0, 16.0, 9.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 5.0], "bins": [-30.71875, -29.88720703125, -29.0556640625, -28.22412109375, -27.392578125, -26.56103515625, -25.7294921875, -24.89794921875, -24.06640625, -23.23486328125, -22.4033203125, -21.57177734375, -20.740234375, -19.90869140625, -19.0771484375, -18.24560546875, -17.4140625, -16.58251953125, -15.7509765625, -14.91943359375, -14.087890625, -13.25634765625, -12.4248046875, -11.59326171875, -10.76171875, -9.93017578125, -9.0986328125, -8.26708984375, -7.435546875, -6.60400390625, -5.7724609375, -4.94091796875, -4.109375, -3.27783203125, -2.4462890625, -1.61474609375, -0.783203125, 0.04833984375, 0.8798828125, 1.71142578125, 2.54296875, 3.37451171875, 4.2060546875, 5.03759765625, 5.869140625, 6.70068359375, 7.5322265625, 8.36376953125, 9.1953125, 10.02685546875, 10.8583984375, 11.68994140625, 12.521484375, 13.35302734375, 14.1845703125, 15.01611328125, 15.84765625, 16.67919921875, 17.5107421875, 18.34228515625, 19.173828125, 20.00537109375, 20.8369140625, 21.66845703125, 22.5]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 14.0, 9.0, 7.0, 15.0, 28.0, 44.0, 56.0, 99.0, 201.0, 420.0, 926.0, 1161.0, 538.0, 223.0, 109.0, 66.0, 45.0, 32.0, 22.0, 17.0, 15.0, 8.0, 6.0, 7.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9140625, -10.3443603515625, -9.774658203125, -9.2049560546875, -8.63525390625, -8.0655517578125, -7.495849609375, -6.9261474609375, -6.3564453125, -5.7867431640625, -5.217041015625, -4.6473388671875, -4.07763671875, -3.5079345703125, -2.938232421875, -2.3685302734375, -1.798828125, -1.2291259765625, -0.659423828125, -0.0897216796875, 0.47998046875, 1.0496826171875, 1.619384765625, 2.1890869140625, 2.7587890625, 3.3284912109375, 3.898193359375, 4.4678955078125, 5.03759765625, 5.6072998046875, 6.177001953125, 6.7467041015625, 7.31640625, 7.8861083984375, 8.455810546875, 9.0255126953125, 9.59521484375, 10.1649169921875, 10.734619140625, 11.3043212890625, 11.8740234375, 12.4437255859375, 13.013427734375, 13.5831298828125, 14.15283203125, 14.7225341796875, 15.292236328125, 15.8619384765625, 16.431640625, 17.0013427734375, 17.571044921875, 18.1407470703125, 18.71044921875, 19.2801513671875, 19.849853515625, 20.4195556640625, 20.9892578125, 21.5589599609375, 22.128662109375, 22.6983642578125, 23.26806640625, 23.8377685546875, 24.407470703125, 24.9771728515625, 25.546875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 5.0, 6.0, 6.0, 5.0, 15.0, 24.0, 27.0, 26.0, 46.0, 66.0, 112.0, 261.0, 664.0, 1763.0, 5334.0, 21139.0, 162026.0, 3789135.0, 182749.0, 22175.0, 5604.0, 1788.0, 671.0, 284.0, 140.0, 74.0, 39.0, 31.0, 19.0, 13.0, 15.0, 15.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.109375, -25.720458984375, -24.33154296875, -22.942626953125, -21.5537109375, -20.164794921875, -18.77587890625, -17.386962890625, -15.998046875, -14.609130859375, -13.22021484375, -11.831298828125, -10.4423828125, -9.053466796875, -7.66455078125, -6.275634765625, -4.88671875, -3.497802734375, -2.10888671875, -0.719970703125, 0.6689453125, 2.057861328125, 3.44677734375, 4.835693359375, 6.224609375, 7.613525390625, 9.00244140625, 10.391357421875, 11.7802734375, 13.169189453125, 14.55810546875, 15.947021484375, 17.3359375, 18.724853515625, 20.11376953125, 21.502685546875, 22.8916015625, 24.280517578125, 25.66943359375, 27.058349609375, 28.447265625, 29.836181640625, 31.22509765625, 32.614013671875, 34.0029296875, 35.391845703125, 36.78076171875, 38.169677734375, 39.55859375, 40.947509765625, 42.33642578125, 43.725341796875, 45.1142578125, 46.503173828125, 47.89208984375, 49.281005859375, 50.669921875, 52.058837890625, 53.44775390625, 54.836669921875, 56.2255859375, 57.614501953125, 59.00341796875, 60.392333984375, 61.78125]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [4.0, 2.0, 5.0, 7.0, 4.0, 15.0, 18.0, 28.0, 44.0, 56.0, 82.0, 111.0, 142.0, 145.0, 116.0, 77.0, 39.0, 37.0, 33.0, 12.0, 9.0, 8.0, 13.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.72919273376465, -21.91128921508789, -20.0933837890625, -18.275480270385742, -16.457576751708984, -14.639671325683594, -12.821767807006836, -11.003863334655762, -9.185958862304688, -7.368054389953613, -5.550150394439697, -3.7322463989257812, -1.914341926574707, -0.09643745422363281, 1.721466064453125, 3.539370536804199, 5.357275009155273, 7.175179481506348, 8.993083953857422, 10.81098747253418, 12.628891944885254, 14.446796417236328, 16.264699935913086, 18.082603454589844, 19.900508880615234, 21.718412399291992, 23.536317825317383, 25.35422134399414, 27.17212677001953, 28.99003028869629, 30.807933807373047, 32.62583923339844, 34.44374084472656, 36.26164627075195, 38.07954788208008, 39.89745330810547, 41.71535873413086, 43.53326416015625, 45.351165771484375, 47.169071197509766, 48.986976623535156, 50.80488204956055, 52.62278366088867, 54.44068908691406, 56.25859451293945, 58.076499938964844, 59.89440155029297, 61.71230697631836, 63.530208587646484, 65.34811401367188, 67.166015625, 68.98391723632812, 70.80182647705078, 72.6197280883789, 74.43763732910156, 76.25553894042969, 78.07344055175781, 79.89134216308594, 81.7092514038086, 83.52715301513672, 85.34505462646484, 87.1629638671875, 88.98086547851562, 90.79876708984375, 92.6166763305664]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 5.0, 12.0, 17.0, 16.0, 26.0, 17.0, 16.0, 27.0, 27.0, 33.0, 24.0, 35.0, 28.0, 39.0, 27.0, 38.0, 37.0, 48.0, 41.0, 33.0, 40.0, 34.0, 33.0, 39.0, 30.0, 33.0, 27.0, 30.0, 24.0, 25.0, 20.0, 18.0, 17.0, 13.0, 10.0, 13.0, 9.0, 4.0, 10.0, 6.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.889301300048828, -30.84830093383789, -29.807300567626953, -28.766300201416016, -27.725299835205078, -26.68429946899414, -25.643299102783203, -24.602298736572266, -23.561298370361328, -22.52029800415039, -21.479297637939453, -20.438297271728516, -19.397296905517578, -18.35629653930664, -17.315296173095703, -16.274295806884766, -15.233297348022461, -14.192296981811523, -13.151296615600586, -12.110296249389648, -11.069295883178711, -10.028295516967773, -8.987296104431152, -7.946295738220215, -6.905295372009277, -5.86429500579834, -4.823294639587402, -3.782294750213623, -2.7412943840026855, -1.700294017791748, -0.6592941284179688, 0.38170623779296875, 1.4227066040039062, 2.4637069702148438, 3.504707098007202, 4.5457072257995605, 5.586707592010498, 6.6277079582214355, 7.668707847595215, 8.709708213806152, 9.75070858001709, 10.791708946228027, 11.832709312438965, 12.873708724975586, 13.914709091186523, 14.955709457397461, 15.996709823608398, 17.037710189819336, 18.078710556030273, 19.11971092224121, 20.16071128845215, 21.201711654663086, 22.242712020874023, 23.28371238708496, 24.324710845947266, 25.365711212158203, 26.40671157836914, 27.447711944580078, 28.488712310791016, 29.529712677001953, 30.57071304321289, 31.611713409423828, 32.652713775634766, 33.6937141418457, 34.73471450805664]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 3.0, 8.0, 6.0, 14.0, 15.0, 6.0, 23.0, 17.0, 25.0, 31.0, 42.0, 43.0, 64.0, 53.0, 39.0, 52.0, 52.0, 58.0, 63.0, 45.0, 49.0, 49.0, 43.0, 33.0, 29.0, 28.0, 18.0, 14.0, 20.0, 13.0, 10.0, 7.0, 11.0, 7.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.91796875, -3.795318603515625, -3.67266845703125, -3.550018310546875, -3.4273681640625, -3.304718017578125, -3.18206787109375, -3.059417724609375, -2.936767578125, -2.814117431640625, -2.69146728515625, -2.568817138671875, -2.4461669921875, -2.323516845703125, -2.20086669921875, -2.078216552734375, -1.95556640625, -1.832916259765625, -1.71026611328125, -1.587615966796875, -1.4649658203125, -1.342315673828125, -1.21966552734375, -1.097015380859375, -0.974365234375, -0.851715087890625, -0.72906494140625, -0.606414794921875, -0.4837646484375, -0.361114501953125, -0.23846435546875, -0.115814208984375, 0.0068359375, 0.129486083984375, 0.25213623046875, 0.374786376953125, 0.4974365234375, 0.620086669921875, 0.74273681640625, 0.865386962890625, 0.988037109375, 1.110687255859375, 1.23333740234375, 1.355987548828125, 1.4786376953125, 1.601287841796875, 1.72393798828125, 1.846588134765625, 1.96923828125, 2.091888427734375, 2.21453857421875, 2.337188720703125, 2.4598388671875, 2.582489013671875, 2.70513916015625, 2.827789306640625, 2.950439453125, 3.073089599609375, 3.19573974609375, 3.318389892578125, 3.4410400390625, 3.563690185546875, 3.68634033203125, 3.808990478515625, 3.931640625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 5.0, 5.0, 7.0, 4.0, 12.0, 20.0, 34.0, 34.0, 47.0, 83.0, 113.0, 201.0, 340.0, 561.0, 1081.0, 1869.0, 3181.0, 5770.0, 10664.0, 21957.0, 67579.0, 336934.0, 450111.0, 93811.0, 26708.0, 12154.0, 6609.0, 3652.0, 2006.0, 1242.0, 725.0, 381.0, 227.0, 144.0, 94.0, 55.0, 40.0, 31.0, 14.0, 15.0, 13.0, 6.0, 4.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.5078125, -5.318603515625, -5.12939453125, -4.940185546875, -4.7509765625, -4.561767578125, -4.37255859375, -4.183349609375, -3.994140625, -3.804931640625, -3.61572265625, -3.426513671875, -3.2373046875, -3.048095703125, -2.85888671875, -2.669677734375, -2.48046875, -2.291259765625, -2.10205078125, -1.912841796875, -1.7236328125, -1.534423828125, -1.34521484375, -1.156005859375, -0.966796875, -0.777587890625, -0.58837890625, -0.399169921875, -0.2099609375, -0.020751953125, 0.16845703125, 0.357666015625, 0.546875, 0.736083984375, 0.92529296875, 1.114501953125, 1.3037109375, 1.492919921875, 1.68212890625, 1.871337890625, 2.060546875, 2.249755859375, 2.43896484375, 2.628173828125, 2.8173828125, 3.006591796875, 3.19580078125, 3.385009765625, 3.57421875, 3.763427734375, 3.95263671875, 4.141845703125, 4.3310546875, 4.520263671875, 4.70947265625, 4.898681640625, 5.087890625, 5.277099609375, 5.46630859375, 5.655517578125, 5.8447265625, 6.033935546875, 6.22314453125, 6.412353515625, 6.6015625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 0.0, 5.0, 4.0, 15.0, 6.0, 8.0, 13.0, 19.0, 22.0, 22.0, 26.0, 27.0, 36.0, 33.0, 36.0, 35.0, 46.0, 41.0, 46.0, 38.0, 1072.0, 49.0, 35.0, 40.0, 30.0, 31.0, 34.0, 41.0, 29.0, 24.0, 23.0, 27.0, 26.0, 10.0, 11.0, 11.0, 10.0, 6.0, 10.0, 6.0, 5.0, 5.0, 4.0, 1.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-3.115234375, -3.017333984375, -2.91943359375, -2.821533203125, -2.7236328125, -2.625732421875, -2.52783203125, -2.429931640625, -2.33203125, -2.234130859375, -2.13623046875, -2.038330078125, -1.9404296875, -1.842529296875, -1.74462890625, -1.646728515625, -1.548828125, -1.450927734375, -1.35302734375, -1.255126953125, -1.1572265625, -1.059326171875, -0.96142578125, -0.863525390625, -0.765625, -0.667724609375, -0.56982421875, -0.471923828125, -0.3740234375, -0.276123046875, -0.17822265625, -0.080322265625, 0.017578125, 0.115478515625, 0.21337890625, 0.311279296875, 0.4091796875, 0.507080078125, 0.60498046875, 0.702880859375, 0.80078125, 0.898681640625, 0.99658203125, 1.094482421875, 1.1923828125, 1.290283203125, 1.38818359375, 1.486083984375, 1.583984375, 1.681884765625, 1.77978515625, 1.877685546875, 1.9755859375, 2.073486328125, 2.17138671875, 2.269287109375, 2.3671875, 2.465087890625, 2.56298828125, 2.660888671875, 2.7587890625, 2.856689453125, 2.95458984375, 3.052490234375, 3.150390625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 0.0, 6.0, 3.0, 2.0, 4.0, 8.0, 13.0, 21.0, 31.0, 35.0, 63.0, 78.0, 127.0, 134.0, 238.0, 347.0, 586.0, 882.0, 1660.0, 3143.0, 6798.0, 16062.0, 49902.0, 271076.0, 1519405.0, 164792.0, 36889.0, 12763.0, 5633.0, 2607.0, 1507.0, 807.0, 499.0, 305.0, 226.0, 140.0, 88.0, 74.0, 43.0, 34.0, 29.0, 19.0, 22.0, 10.0, 5.0, 8.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.734375, -3.602783203125, -3.47119140625, -3.339599609375, -3.2080078125, -3.076416015625, -2.94482421875, -2.813232421875, -2.681640625, -2.550048828125, -2.41845703125, -2.286865234375, -2.1552734375, -2.023681640625, -1.89208984375, -1.760498046875, -1.62890625, -1.497314453125, -1.36572265625, -1.234130859375, -1.1025390625, -0.970947265625, -0.83935546875, -0.707763671875, -0.576171875, -0.444580078125, -0.31298828125, -0.181396484375, -0.0498046875, 0.081787109375, 0.21337890625, 0.344970703125, 0.4765625, 0.608154296875, 0.73974609375, 0.871337890625, 1.0029296875, 1.134521484375, 1.26611328125, 1.397705078125, 1.529296875, 1.660888671875, 1.79248046875, 1.924072265625, 2.0556640625, 2.187255859375, 2.31884765625, 2.450439453125, 2.58203125, 2.713623046875, 2.84521484375, 2.976806640625, 3.1083984375, 3.239990234375, 3.37158203125, 3.503173828125, 3.634765625, 3.766357421875, 3.89794921875, 4.029541015625, 4.1611328125, 4.292724609375, 4.42431640625, 4.555908203125, 4.6875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 7.0, 6.0, 7.0, 6.0, 8.0, 27.0, 50.0, 74.0, 313.0, 247.0, 84.0, 51.0, 16.0, 12.0, 10.0, 11.0, 2.0, 9.0, 4.0, 4.0, 6.0, 4.0, 1.0, 3.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.255859375, -1.203399658203125, -1.15093994140625, -1.098480224609375, -1.0460205078125, -0.993560791015625, -0.94110107421875, -0.888641357421875, -0.836181640625, -0.783721923828125, -0.73126220703125, -0.678802490234375, -0.6263427734375, -0.573883056640625, -0.52142333984375, -0.468963623046875, -0.41650390625, -0.364044189453125, -0.31158447265625, -0.259124755859375, -0.2066650390625, -0.154205322265625, -0.10174560546875, -0.049285888671875, 0.003173828125, 0.055633544921875, 0.10809326171875, 0.160552978515625, 0.2130126953125, 0.265472412109375, 0.31793212890625, 0.370391845703125, 0.4228515625, 0.475311279296875, 0.52777099609375, 0.580230712890625, 0.6326904296875, 0.685150146484375, 0.73760986328125, 0.790069580078125, 0.842529296875, 0.894989013671875, 0.94744873046875, 0.999908447265625, 1.0523681640625, 1.104827880859375, 1.15728759765625, 1.209747314453125, 1.26220703125, 1.314666748046875, 1.36712646484375, 1.419586181640625, 1.4720458984375, 1.524505615234375, 1.57696533203125, 1.629425048828125, 1.681884765625, 1.734344482421875, 1.78680419921875, 1.839263916015625, 1.8917236328125, 1.944183349609375, 1.99664306640625, 2.049102783203125, 2.1015625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 9.0, 8.0, 14.0, 22.0, 20.0, 29.0, 28.0, 49.0, 61.0, 140.0, 878.0, 7412.0, 904813.0, 129106.0, 4956.0, 572.0, 118.0, 66.0, 44.0, 27.0, 37.0, 19.0, 18.0, 17.0, 8.0, 19.0, 6.0, 6.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.671875, -23.81884765625, -22.9658203125, -22.11279296875, -21.259765625, -20.40673828125, -19.5537109375, -18.70068359375, -17.84765625, -16.99462890625, -16.1416015625, -15.28857421875, -14.435546875, -13.58251953125, -12.7294921875, -11.87646484375, -11.0234375, -10.17041015625, -9.3173828125, -8.46435546875, -7.611328125, -6.75830078125, -5.9052734375, -5.05224609375, -4.19921875, -3.34619140625, -2.4931640625, -1.64013671875, -0.787109375, 0.06591796875, 0.9189453125, 1.77197265625, 2.625, 3.47802734375, 4.3310546875, 5.18408203125, 6.037109375, 6.89013671875, 7.7431640625, 8.59619140625, 9.44921875, 10.30224609375, 11.1552734375, 12.00830078125, 12.861328125, 13.71435546875, 14.5673828125, 15.42041015625, 16.2734375, 17.12646484375, 17.9794921875, 18.83251953125, 19.685546875, 20.53857421875, 21.3916015625, 22.24462890625, 23.09765625, 23.95068359375, 24.8037109375, 25.65673828125, 26.509765625, 27.36279296875, 28.2158203125, 29.06884765625, 29.921875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 7.0, 23.0, 32.0, 58.0, 118.0, 203.0, 270.0, 164.0, 51.0, 39.0, 15.0, 5.0, 9.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.910794973373413, -3.7719953060150146, -3.6331958770751953, -3.494396209716797, -3.3555965423583984, -3.216796875, -3.0779972076416016, -2.9391977787017822, -2.800398111343384, -2.6615984439849854, -2.522799015045166, -2.3839993476867676, -2.245199680328369, -2.1064000129699707, -1.9676004648208618, -1.828800916671753, -1.6900012493133545, -1.551201581954956, -1.4124020338058472, -1.2736024856567383, -1.1348028182983398, -0.9960032105445862, -0.8572036027908325, -0.7184039950370789, -0.5796043872833252, -0.44080477952957153, -0.30200517177581787, -0.1632055640220642, -0.024405956268310547, 0.11439365148544312, 0.2531932592391968, 0.39199286699295044, 0.530792236328125, 0.6695918440818787, 0.8083914518356323, 0.947191059589386, 1.0859906673431396, 1.224790334701538, 1.363589882850647, 1.5023894309997559, 1.6411890983581543, 1.7799887657165527, 1.9187883138656616, 2.0575878620147705, 2.196387529373169, 2.3351871967315674, 2.4739866256713867, 2.612786293029785, 2.7515859603881836, 2.890385627746582, 3.0291852951049805, 3.1679847240448, 3.3067843914031982, 3.4455840587615967, 3.584383487701416, 3.7231831550598145, 3.861982822418213, 4.000782489776611, 4.13958215713501, 4.278381824493408, 4.417181015014648, 4.555980682373047, 4.694780349731445, 4.833580017089844, 4.972379684448242]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 3.0, 11.0, 11.0, 8.0, 11.0, 15.0, 21.0, 16.0, 22.0, 30.0, 21.0, 27.0, 34.0, 49.0, 30.0, 44.0, 34.0, 37.0, 60.0, 38.0, 48.0, 43.0, 38.0, 45.0, 36.0, 29.0, 31.0, 32.0, 28.0, 18.0, 21.0, 16.0, 17.0, 16.0, 11.0, 7.0, 10.0, 9.0, 7.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9071562886238098, -0.876125156879425, -0.8450940251350403, -0.8140628337860107, -0.783031702041626, -0.7520005702972412, -0.7209694385528564, -0.6899383068084717, -0.6589071750640869, -0.6278760433197021, -0.5968449115753174, -0.5658137798309326, -0.5347825884819031, -0.5037514567375183, -0.47272032499313354, -0.4416891932487488, -0.41065800189971924, -0.3796268701553345, -0.3485957086086273, -0.31756457686424255, -0.2865334153175354, -0.25550228357315063, -0.22447115182876587, -0.1934400051832199, -0.16240885853767395, -0.131377711892128, -0.10034657269716263, -0.06931543350219727, -0.038284286856651306, -0.007253140211105347, 0.02377799153327942, 0.05480913817882538, 0.08584022521972656, 0.11687137186527252, 0.14790251851081848, 0.17893365025520325, 0.2099647969007492, 0.24099594354629517, 0.27202707529067993, 0.3030582070350647, 0.33408936858177185, 0.3651205003261566, 0.39615166187286377, 0.42718279361724854, 0.4582139253616333, 0.48924508690834045, 0.5202761888504028, 0.5513073801994324, 0.5823385119438171, 0.6133696436882019, 0.6444007754325867, 0.6754319667816162, 0.706463098526001, 0.7374942302703857, 0.7685253620147705, 0.7995564937591553, 0.83058762550354, 0.8616187572479248, 0.8926498889923096, 0.9236810207366943, 0.9547122120857239, 0.9857433438301086, 1.0167744159698486, 1.047805666923523, 1.0788367986679077]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 6.0, 13.0, 13.0, 19.0, 14.0, 15.0, 19.0, 21.0, 26.0, 41.0, 45.0, 48.0, 51.0, 50.0, 48.0, 58.0, 74.0, 49.0, 62.0, 54.0, 35.0, 42.0, 29.0, 32.0, 20.0, 23.0, 14.0, 20.0, 16.0, 9.0, 7.0, 8.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.84765625, -3.7235107421875, -3.599365234375, -3.4752197265625, -3.35107421875, -3.2269287109375, -3.102783203125, -2.9786376953125, -2.8544921875, -2.7303466796875, -2.606201171875, -2.4820556640625, -2.35791015625, -2.2337646484375, -2.109619140625, -1.9854736328125, -1.861328125, -1.7371826171875, -1.613037109375, -1.4888916015625, -1.36474609375, -1.2406005859375, -1.116455078125, -0.9923095703125, -0.8681640625, -0.7440185546875, -0.619873046875, -0.4957275390625, -0.37158203125, -0.2474365234375, -0.123291015625, 0.0008544921875, 0.125, 0.2491455078125, 0.373291015625, 0.4974365234375, 0.62158203125, 0.7457275390625, 0.869873046875, 0.9940185546875, 1.1181640625, 1.2423095703125, 1.366455078125, 1.4906005859375, 1.61474609375, 1.7388916015625, 1.863037109375, 1.9871826171875, 2.111328125, 2.2354736328125, 2.359619140625, 2.4837646484375, 2.60791015625, 2.7320556640625, 2.856201171875, 2.9803466796875, 3.1044921875, 3.2286376953125, 3.352783203125, 3.4769287109375, 3.60107421875, 3.7252197265625, 3.849365234375, 3.9735107421875, 4.09765625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 7.0, 10.0, 11.0, 26.0, 22.0, 38.0, 65.0, 67.0, 131.0, 162.0, 272.0, 413.0, 655.0, 1099.0, 1991.0, 3572.0, 7302.0, 15765.0, 40561.0, 125012.0, 405368.0, 303152.0, 87319.0, 30073.0, 12469.0, 5782.0, 2972.0, 1608.0, 1004.0, 541.0, 371.0, 247.0, 135.0, 105.0, 69.0, 53.0, 25.0, 24.0, 23.0, 11.0, 8.0, 2.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.25390625, -5.1031494140625, -4.952392578125, -4.8016357421875, -4.65087890625, -4.5001220703125, -4.349365234375, -4.1986083984375, -4.0478515625, -3.8970947265625, -3.746337890625, -3.5955810546875, -3.44482421875, -3.2940673828125, -3.143310546875, -2.9925537109375, -2.841796875, -2.6910400390625, -2.540283203125, -2.3895263671875, -2.23876953125, -2.0880126953125, -1.937255859375, -1.7864990234375, -1.6357421875, -1.4849853515625, -1.334228515625, -1.1834716796875, -1.03271484375, -0.8819580078125, -0.731201171875, -0.5804443359375, -0.4296875, -0.2789306640625, -0.128173828125, 0.0225830078125, 0.17333984375, 0.3240966796875, 0.474853515625, 0.6256103515625, 0.7763671875, 0.9271240234375, 1.077880859375, 1.2286376953125, 1.37939453125, 1.5301513671875, 1.680908203125, 1.8316650390625, 1.982421875, 2.1331787109375, 2.283935546875, 2.4346923828125, 2.58544921875, 2.7362060546875, 2.886962890625, 3.0377197265625, 3.1884765625, 3.3392333984375, 3.489990234375, 3.6407470703125, 3.79150390625, 3.9422607421875, 4.093017578125, 4.2437744140625, 4.39453125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 4.0, 9.0, 9.0, 10.0, 8.0, 11.0, 14.0, 17.0, 19.0, 23.0, 21.0, 34.0, 26.0, 28.0, 55.0, 51.0, 57.0, 61.0, 54.0, 113.0, 288.0, 1438.0, 158.0, 78.0, 52.0, 72.0, 54.0, 36.0, 41.0, 36.0, 21.0, 28.0, 16.0, 15.0, 20.0, 10.0, 11.0, 15.0, 6.0, 10.0, 3.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-12.1171875, -11.715087890625, -11.31298828125, -10.910888671875, -10.5087890625, -10.106689453125, -9.70458984375, -9.302490234375, -8.900390625, -8.498291015625, -8.09619140625, -7.694091796875, -7.2919921875, -6.889892578125, -6.48779296875, -6.085693359375, -5.68359375, -5.281494140625, -4.87939453125, -4.477294921875, -4.0751953125, -3.673095703125, -3.27099609375, -2.868896484375, -2.466796875, -2.064697265625, -1.66259765625, -1.260498046875, -0.8583984375, -0.456298828125, -0.05419921875, 0.347900390625, 0.75, 1.152099609375, 1.55419921875, 1.956298828125, 2.3583984375, 2.760498046875, 3.16259765625, 3.564697265625, 3.966796875, 4.368896484375, 4.77099609375, 5.173095703125, 5.5751953125, 5.977294921875, 6.37939453125, 6.781494140625, 7.18359375, 7.585693359375, 7.98779296875, 8.389892578125, 8.7919921875, 9.194091796875, 9.59619140625, 9.998291015625, 10.400390625, 10.802490234375, 11.20458984375, 11.606689453125, 12.0087890625, 12.410888671875, 12.81298828125, 13.215087890625, 13.6171875]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 3.0, 1.0, 4.0, 6.0, 2.0, 14.0, 12.0, 14.0, 21.0, 32.0, 33.0, 46.0, 79.0, 118.0, 186.0, 276.0, 470.0, 876.0, 2060.0, 5296.0, 17477.0, 106688.0, 2728712.0, 244618.0, 26280.0, 7111.0, 2563.0, 1157.0, 604.0, 310.0, 200.0, 113.0, 83.0, 67.0, 34.0, 39.0, 31.0, 15.0, 8.0, 9.0, 10.0, 9.0, 12.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.203125, -24.453857421875, -23.70458984375, -22.955322265625, -22.2060546875, -21.456787109375, -20.70751953125, -19.958251953125, -19.208984375, -18.459716796875, -17.71044921875, -16.961181640625, -16.2119140625, -15.462646484375, -14.71337890625, -13.964111328125, -13.21484375, -12.465576171875, -11.71630859375, -10.967041015625, -10.2177734375, -9.468505859375, -8.71923828125, -7.969970703125, -7.220703125, -6.471435546875, -5.72216796875, -4.972900390625, -4.2236328125, -3.474365234375, -2.72509765625, -1.975830078125, -1.2265625, -0.477294921875, 0.27197265625, 1.021240234375, 1.7705078125, 2.519775390625, 3.26904296875, 4.018310546875, 4.767578125, 5.516845703125, 6.26611328125, 7.015380859375, 7.7646484375, 8.513916015625, 9.26318359375, 10.012451171875, 10.76171875, 11.510986328125, 12.26025390625, 13.009521484375, 13.7587890625, 14.508056640625, 15.25732421875, 16.006591796875, 16.755859375, 17.505126953125, 18.25439453125, 19.003662109375, 19.7529296875, 20.502197265625, 21.25146484375, 22.000732421875, 22.75]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 22.0, 181.0, 554.0, 214.0, 34.0, 5.0], "bins": [-302.636474609375, -297.6337890625, -292.6310729980469, -287.6283874511719, -282.6257019042969, -277.6230163574219, -272.62030029296875, -267.61761474609375, -262.61492919921875, -257.61224365234375, -252.6095428466797, -247.60684204101562, -242.60415649414062, -237.60145568847656, -232.59877014160156, -227.5960693359375, -222.59336853027344, -217.59066772460938, -212.58798217773438, -207.5852813720703, -202.5825958251953, -197.57989501953125, -192.57720947265625, -187.5745086669922, -182.57180786132812, -177.56910705566406, -172.56642150878906, -167.563720703125, -162.56103515625, -157.55833435058594, -152.55564880371094, -147.55294799804688, -142.5502471923828, -137.54754638671875, -132.54486083984375, -127.54216766357422, -122.53947448730469, -117.53677368164062, -112.5340805053711, -107.53138732910156, -102.52870178222656, -97.52600860595703, -92.5233154296875, -87.52062225341797, -82.51792907714844, -77.51522827148438, -72.51253509521484, -67.50984191894531, -62.507144927978516, -57.504451751708984, -52.50175476074219, -47.499061584472656, -42.496368408203125, -37.493675231933594, -32.49098205566406, -27.488285064697266, -22.485591888427734, -17.482898712158203, -12.480203628540039, -7.477509498596191, -2.4748153686523438, 2.5278778076171875, 7.530572891235352, 12.533267974853516, 17.535961151123047]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 1.0, 2.0, 8.0, 8.0, 11.0, 15.0, 14.0, 12.0, 16.0, 18.0, 20.0, 18.0, 17.0, 28.0, 30.0, 41.0, 37.0, 46.0, 39.0, 45.0, 35.0, 34.0, 48.0, 46.0, 39.0, 43.0, 39.0, 33.0, 43.0, 27.0, 29.0, 21.0, 22.0, 20.0, 16.0, 13.0, 9.0, 6.0, 9.0, 9.0, 10.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-45.60725021362305, -44.210269927978516, -42.813289642333984, -41.41630935668945, -40.01932907104492, -38.62234878540039, -37.22536849975586, -35.82838821411133, -34.4314079284668, -33.034427642822266, -31.637447357177734, -30.240467071533203, -28.843486785888672, -27.44650650024414, -26.04952621459961, -24.652545928955078, -23.255565643310547, -21.858585357666016, -20.461605072021484, -19.064624786376953, -17.667644500732422, -16.27066421508789, -14.87368392944336, -13.476703643798828, -12.079723358154297, -10.682743072509766, -9.285762786865234, -7.888782501220703, -6.491802215576172, -5.094821929931641, -3.6978416442871094, -2.300861358642578, -0.9038772583007812, 0.49310302734375, 1.8900833129882812, 3.2870635986328125, 4.684043884277344, 6.081024169921875, 7.478004455566406, 8.874984741210938, 10.271965026855469, 11.6689453125, 13.065925598144531, 14.462905883789062, 15.859886169433594, 17.256866455078125, 18.653846740722656, 20.050827026367188, 21.44780731201172, 22.84478759765625, 24.24176788330078, 25.638748168945312, 27.035728454589844, 28.432708740234375, 29.829689025878906, 31.226669311523438, 32.62364959716797, 34.0206298828125, 35.41761016845703, 36.81459045410156, 38.211570739746094, 39.608551025390625, 41.005531311035156, 42.40251159667969, 43.79949188232422]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 8.0, 4.0, 4.0, 6.0, 9.0, 13.0, 11.0, 17.0, 9.0, 28.0, 29.0, 29.0, 37.0, 51.0, 44.0, 57.0, 41.0, 61.0, 45.0, 58.0, 51.0, 51.0, 55.0, 36.0, 41.0, 27.0, 38.0, 25.0, 19.0, 20.0, 12.0, 16.0, 14.0, 6.0, 9.0, 6.0, 3.0, 9.0, 2.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.015625, -3.894317626953125, -3.77301025390625, -3.651702880859375, -3.5303955078125, -3.409088134765625, -3.28778076171875, -3.166473388671875, -3.045166015625, -2.923858642578125, -2.80255126953125, -2.681243896484375, -2.5599365234375, -2.438629150390625, -2.31732177734375, -2.196014404296875, -2.07470703125, -1.953399658203125, -1.83209228515625, -1.710784912109375, -1.5894775390625, -1.468170166015625, -1.34686279296875, -1.225555419921875, -1.104248046875, -0.982940673828125, -0.86163330078125, -0.740325927734375, -0.6190185546875, -0.497711181640625, -0.37640380859375, -0.255096435546875, -0.1337890625, -0.012481689453125, 0.10882568359375, 0.230133056640625, 0.3514404296875, 0.472747802734375, 0.59405517578125, 0.715362548828125, 0.836669921875, 0.957977294921875, 1.07928466796875, 1.200592041015625, 1.3218994140625, 1.443206787109375, 1.56451416015625, 1.685821533203125, 1.80712890625, 1.928436279296875, 2.04974365234375, 2.171051025390625, 2.2923583984375, 2.413665771484375, 2.53497314453125, 2.656280517578125, 2.777587890625, 2.898895263671875, 3.02020263671875, 3.141510009765625, 3.2628173828125, 3.384124755859375, 3.50543212890625, 3.626739501953125, 3.748046875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 8.0, 11.0, 10.0, 24.0, 29.0, 32.0, 75.0, 96.0, 124.0, 196.0, 287.0, 429.0, 606.0, 869.0, 1360.0, 2145.0, 3649.0, 6060.0, 10913.0, 21117.0, 51826.0, 393173.0, 3309380.0, 298958.0, 46440.0, 19530.0, 10389.0, 6065.0, 3657.0, 2237.0, 1460.0, 999.0, 641.0, 430.0, 314.0, 227.0, 154.0, 109.0, 72.0, 56.0, 28.0, 32.0, 20.0, 15.0, 12.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-14.8828125, -14.450927734375, -14.01904296875, -13.587158203125, -13.1552734375, -12.723388671875, -12.29150390625, -11.859619140625, -11.427734375, -10.995849609375, -10.56396484375, -10.132080078125, -9.7001953125, -9.268310546875, -8.83642578125, -8.404541015625, -7.97265625, -7.540771484375, -7.10888671875, -6.677001953125, -6.2451171875, -5.813232421875, -5.38134765625, -4.949462890625, -4.517578125, -4.085693359375, -3.65380859375, -3.221923828125, -2.7900390625, -2.358154296875, -1.92626953125, -1.494384765625, -1.0625, -0.630615234375, -0.19873046875, 0.233154296875, 0.6650390625, 1.096923828125, 1.52880859375, 1.960693359375, 2.392578125, 2.824462890625, 3.25634765625, 3.688232421875, 4.1201171875, 4.552001953125, 4.98388671875, 5.415771484375, 5.84765625, 6.279541015625, 6.71142578125, 7.143310546875, 7.5751953125, 8.007080078125, 8.43896484375, 8.870849609375, 9.302734375, 9.734619140625, 10.16650390625, 10.598388671875, 11.0302734375, 11.462158203125, 11.89404296875, 12.325927734375, 12.7578125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 3.0, 4.0, 3.0, 3.0, 7.0, 12.0, 13.0, 15.0, 14.0, 19.0, 34.0, 39.0, 45.0, 75.0, 139.0, 241.0, 511.0, 951.0, 850.0, 454.0, 246.0, 123.0, 65.0, 49.0, 42.0, 31.0, 17.0, 15.0, 14.0, 11.0, 8.0, 6.0, 8.0, 2.0, 7.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.46875, -14.984130859375, -14.49951171875, -14.014892578125, -13.5302734375, -13.045654296875, -12.56103515625, -12.076416015625, -11.591796875, -11.107177734375, -10.62255859375, -10.137939453125, -9.6533203125, -9.168701171875, -8.68408203125, -8.199462890625, -7.71484375, -7.230224609375, -6.74560546875, -6.260986328125, -5.7763671875, -5.291748046875, -4.80712890625, -4.322509765625, -3.837890625, -3.353271484375, -2.86865234375, -2.384033203125, -1.8994140625, -1.414794921875, -0.93017578125, -0.445556640625, 0.0390625, 0.523681640625, 1.00830078125, 1.492919921875, 1.9775390625, 2.462158203125, 2.94677734375, 3.431396484375, 3.916015625, 4.400634765625, 4.88525390625, 5.369873046875, 5.8544921875, 6.339111328125, 6.82373046875, 7.308349609375, 7.79296875, 8.277587890625, 8.76220703125, 9.246826171875, 9.7314453125, 10.216064453125, 10.70068359375, 11.185302734375, 11.669921875, 12.154541015625, 12.63916015625, 13.123779296875, 13.6083984375, 14.093017578125, 14.57763671875, 15.062255859375, 15.546875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 9.0, 6.0, 15.0, 18.0, 23.0, 37.0, 46.0, 96.0, 190.0, 341.0, 665.0, 1384.0, 2914.0, 6367.0, 15699.0, 47008.0, 285682.0, 3455714.0, 301860.0, 47859.0, 15994.0, 6545.0, 2943.0, 1413.0, 653.0, 354.0, 190.0, 79.0, 70.0, 44.0, 16.0, 17.0, 11.0, 8.0, 7.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.875, -27.896484375, -26.91796875, -25.939453125, -24.9609375, -23.982421875, -23.00390625, -22.025390625, -21.046875, -20.068359375, -19.08984375, -18.111328125, -17.1328125, -16.154296875, -15.17578125, -14.197265625, -13.21875, -12.240234375, -11.26171875, -10.283203125, -9.3046875, -8.326171875, -7.34765625, -6.369140625, -5.390625, -4.412109375, -3.43359375, -2.455078125, -1.4765625, -0.498046875, 0.48046875, 1.458984375, 2.4375, 3.416015625, 4.39453125, 5.373046875, 6.3515625, 7.330078125, 8.30859375, 9.287109375, 10.265625, 11.244140625, 12.22265625, 13.201171875, 14.1796875, 15.158203125, 16.13671875, 17.115234375, 18.09375, 19.072265625, 20.05078125, 21.029296875, 22.0078125, 22.986328125, 23.96484375, 24.943359375, 25.921875, 26.900390625, 27.87890625, 28.857421875, 29.8359375, 30.814453125, 31.79296875, 32.771484375, 33.75]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 9.0, 8.0, 6.0, 21.0, 22.0, 28.0, 40.0, 66.0, 72.0, 100.0, 150.0, 109.0, 99.0, 76.0, 46.0, 44.0, 15.0, 28.0, 12.0, 9.0, 10.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.2528190612793, -55.40382766723633, -53.55483627319336, -51.70584487915039, -49.85685348510742, -48.00786209106445, -46.158870697021484, -44.309879302978516, -42.46088790893555, -40.61189651489258, -38.76290512084961, -36.91391372680664, -35.06492233276367, -33.2159309387207, -31.366939544677734, -29.517948150634766, -27.668956756591797, -25.819965362548828, -23.97097396850586, -22.12198257446289, -20.272991180419922, -18.423999786376953, -16.575008392333984, -14.726016998291016, -12.877025604248047, -11.028034210205078, -9.17904281616211, -7.330051422119141, -5.481060028076172, -3.632068634033203, -1.7830772399902344, 0.06591415405273438, 1.9149093627929688, 3.7639007568359375, 5.612892150878906, 7.461883544921875, 9.310874938964844, 11.159866333007812, 13.008857727050781, 14.85784912109375, 16.70684051513672, 18.555831909179688, 20.404823303222656, 22.253814697265625, 24.102806091308594, 25.951797485351562, 27.80078887939453, 29.6497802734375, 31.49877166748047, 33.34776306152344, 35.196754455566406, 37.045745849609375, 38.894737243652344, 40.74372863769531, 42.59272003173828, 44.44171142578125, 46.29070281982422, 48.13969421386719, 49.988685607910156, 51.837677001953125, 53.686668395996094, 55.53565979003906, 57.38465118408203, 59.233642578125, 61.08263397216797]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 9.0, 3.0, 7.0, 3.0, 5.0, 6.0, 5.0, 7.0, 11.0, 17.0, 16.0, 12.0, 20.0, 33.0, 21.0, 26.0, 28.0, 38.0, 33.0, 31.0, 38.0, 33.0, 53.0, 35.0, 44.0, 28.0, 33.0, 22.0, 39.0, 41.0, 36.0, 29.0, 24.0, 22.0, 35.0, 26.0, 14.0, 17.0, 21.0, 10.0, 11.0, 11.0, 12.0, 8.0, 11.0, 6.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0], "bins": [-36.570594787597656, -35.454071044921875, -34.337547302246094, -33.22102737426758, -32.1045036315918, -30.987979888916016, -29.871456146240234, -28.754932403564453, -27.638410568237305, -26.521886825561523, -25.405364990234375, -24.288841247558594, -23.172317504882812, -22.055795669555664, -20.939271926879883, -19.822750091552734, -18.706226348876953, -17.589702606201172, -16.473180770874023, -15.356657028198242, -14.240134239196777, -13.123611450195312, -12.007087707519531, -10.890564918518066, -9.774042129516602, -8.657519340515137, -7.540996074676514, -6.424472808837891, -5.307950019836426, -4.191427230834961, -3.074903964996338, -1.9583806991577148, -0.8418540954589844, 0.27466893196105957, 1.3911919593811035, 2.5077149868011475, 3.6242380142211914, 4.740760803222656, 5.857284069061279, 6.973807334899902, 8.090330123901367, 9.206852912902832, 10.323375701904297, 11.439899444580078, 12.556422233581543, 13.672945022583008, 14.789468765258789, 15.905991554260254, 17.02251434326172, 18.1390380859375, 19.25555992126465, 20.37208366394043, 21.488605499267578, 22.60512924194336, 23.72165298461914, 24.838176727294922, 25.95469856262207, 27.07122230529785, 28.187744140625, 29.30426788330078, 30.420791625976562, 31.53731346130371, 32.65383529663086, 33.77035903930664, 34.88688278198242]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 5.0, 13.0, 7.0, 8.0, 14.0, 18.0, 13.0, 22.0, 23.0, 23.0, 36.0, 38.0, 53.0, 39.0, 44.0, 52.0, 57.0, 56.0, 63.0, 60.0, 40.0, 43.0, 36.0, 32.0, 39.0, 29.0, 25.0, 21.0, 15.0, 16.0, 6.0, 14.0, 7.0, 9.0, 6.0, 3.0, 2.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.16796875, -4.044158935546875, -3.92034912109375, -3.796539306640625, -3.6727294921875, -3.548919677734375, -3.42510986328125, -3.301300048828125, -3.177490234375, -3.053680419921875, -2.92987060546875, -2.806060791015625, -2.6822509765625, -2.558441162109375, -2.43463134765625, -2.310821533203125, -2.18701171875, -2.063201904296875, -1.93939208984375, -1.815582275390625, -1.6917724609375, -1.567962646484375, -1.44415283203125, -1.320343017578125, -1.196533203125, -1.072723388671875, -0.94891357421875, -0.825103759765625, -0.7012939453125, -0.577484130859375, -0.45367431640625, -0.329864501953125, -0.2060546875, -0.082244873046875, 0.04156494140625, 0.165374755859375, 0.2891845703125, 0.412994384765625, 0.53680419921875, 0.660614013671875, 0.784423828125, 0.908233642578125, 1.03204345703125, 1.155853271484375, 1.2796630859375, 1.403472900390625, 1.52728271484375, 1.651092529296875, 1.77490234375, 1.898712158203125, 2.02252197265625, 2.146331787109375, 2.2701416015625, 2.393951416015625, 2.51776123046875, 2.641571044921875, 2.765380859375, 2.889190673828125, 3.01300048828125, 3.136810302734375, 3.2606201171875, 3.384429931640625, 3.50823974609375, 3.632049560546875, 3.755859375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 7.0, 11.0, 14.0, 38.0, 38.0, 65.0, 93.0, 142.0, 260.0, 384.0, 553.0, 859.0, 1299.0, 2060.0, 3277.0, 5236.0, 8837.0, 15386.0, 28333.0, 57788.0, 138166.0, 355433.0, 243688.0, 92745.0, 41878.0, 21450.0, 12002.0, 6928.0, 4166.0, 2633.0, 1661.0, 1073.0, 726.0, 446.0, 299.0, 193.0, 113.0, 88.0, 58.0, 38.0, 24.0, 24.0, 7.0, 9.0, 8.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6015625, -12.1636962890625, -11.725830078125, -11.2879638671875, -10.85009765625, -10.4122314453125, -9.974365234375, -9.5364990234375, -9.0986328125, -8.6607666015625, -8.222900390625, -7.7850341796875, -7.34716796875, -6.9093017578125, -6.471435546875, -6.0335693359375, -5.595703125, -5.1578369140625, -4.719970703125, -4.2821044921875, -3.84423828125, -3.4063720703125, -2.968505859375, -2.5306396484375, -2.0927734375, -1.6549072265625, -1.217041015625, -0.7791748046875, -0.34130859375, 0.0965576171875, 0.534423828125, 0.9722900390625, 1.41015625, 1.8480224609375, 2.285888671875, 2.7237548828125, 3.16162109375, 3.5994873046875, 4.037353515625, 4.4752197265625, 4.9130859375, 5.3509521484375, 5.788818359375, 6.2266845703125, 6.66455078125, 7.1024169921875, 7.540283203125, 7.9781494140625, 8.416015625, 8.8538818359375, 9.291748046875, 9.7296142578125, 10.16748046875, 10.6053466796875, 11.043212890625, 11.4810791015625, 11.9189453125, 12.3568115234375, 12.794677734375, 13.2325439453125, 13.67041015625, 14.1082763671875, 14.546142578125, 14.9840087890625, 15.421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 6.0, 2.0, 5.0, 2.0, 6.0, 10.0, 9.0, 12.0, 14.0, 13.0, 10.0, 16.0, 18.0, 28.0, 20.0, 23.0, 28.0, 30.0, 31.0, 29.0, 34.0, 37.0, 33.0, 23.0, 35.0, 37.0, 1054.0, 33.0, 28.0, 40.0, 33.0, 30.0, 33.0, 12.0, 39.0, 32.0, 30.0, 16.0, 19.0, 20.0, 13.0, 13.0, 17.0, 10.0, 15.0, 5.0, 11.0, 3.0, 7.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-3.072265625, -2.981964111328125, -2.89166259765625, -2.801361083984375, -2.7110595703125, -2.620758056640625, -2.53045654296875, -2.440155029296875, -2.349853515625, -2.259552001953125, -2.16925048828125, -2.078948974609375, -1.9886474609375, -1.898345947265625, -1.80804443359375, -1.717742919921875, -1.62744140625, -1.537139892578125, -1.44683837890625, -1.356536865234375, -1.2662353515625, -1.175933837890625, -1.08563232421875, -0.995330810546875, -0.905029296875, -0.814727783203125, -0.72442626953125, -0.634124755859375, -0.5438232421875, -0.453521728515625, -0.36322021484375, -0.272918701171875, -0.1826171875, -0.092315673828125, -0.00201416015625, 0.088287353515625, 0.1785888671875, 0.268890380859375, 0.35919189453125, 0.449493408203125, 0.539794921875, 0.630096435546875, 0.72039794921875, 0.810699462890625, 0.9010009765625, 0.991302490234375, 1.08160400390625, 1.171905517578125, 1.26220703125, 1.352508544921875, 1.44281005859375, 1.533111572265625, 1.6234130859375, 1.713714599609375, 1.80401611328125, 1.894317626953125, 1.984619140625, 2.074920654296875, 2.16522216796875, 2.255523681640625, 2.3458251953125, 2.436126708984375, 2.52642822265625, 2.616729736328125, 2.70703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 10.0, 11.0, 21.0, 14.0, 23.0, 22.0, 42.0, 58.0, 79.0, 134.0, 176.0, 266.0, 405.0, 558.0, 868.0, 1407.0, 2270.0, 4019.0, 6997.0, 13990.0, 32049.0, 104993.0, 844906.0, 910462.0, 108842.0, 32706.0, 13998.0, 7210.0, 4129.0, 2390.0, 1386.0, 857.0, 575.0, 392.0, 240.0, 177.0, 142.0, 87.0, 85.0, 42.0, 32.0, 16.0, 14.0, 12.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-12.7421875, -12.356201171875, -11.97021484375, -11.584228515625, -11.1982421875, -10.812255859375, -10.42626953125, -10.040283203125, -9.654296875, -9.268310546875, -8.88232421875, -8.496337890625, -8.1103515625, -7.724365234375, -7.33837890625, -6.952392578125, -6.56640625, -6.180419921875, -5.79443359375, -5.408447265625, -5.0224609375, -4.636474609375, -4.25048828125, -3.864501953125, -3.478515625, -3.092529296875, -2.70654296875, -2.320556640625, -1.9345703125, -1.548583984375, -1.16259765625, -0.776611328125, -0.390625, -0.004638671875, 0.38134765625, 0.767333984375, 1.1533203125, 1.539306640625, 1.92529296875, 2.311279296875, 2.697265625, 3.083251953125, 3.46923828125, 3.855224609375, 4.2412109375, 4.627197265625, 5.01318359375, 5.399169921875, 5.78515625, 6.171142578125, 6.55712890625, 6.943115234375, 7.3291015625, 7.715087890625, 8.10107421875, 8.487060546875, 8.873046875, 9.259033203125, 9.64501953125, 10.031005859375, 10.4169921875, 10.802978515625, 11.18896484375, 11.574951171875, 11.9609375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 3.0, 8.0, 6.0, 6.0, 6.0, 8.0, 10.0, 20.0, 14.0, 10.0, 19.0, 17.0, 21.0, 31.0, 37.0, 47.0, 47.0, 70.0, 141.0, 111.0, 69.0, 49.0, 30.0, 38.0, 28.0, 29.0, 18.0, 17.0, 18.0, 11.0, 11.0, 8.0, 4.0, 6.0, 7.0, 4.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.564453125, -2.490875244140625, -2.41729736328125, -2.343719482421875, -2.2701416015625, -2.196563720703125, -2.12298583984375, -2.049407958984375, -1.975830078125, -1.902252197265625, -1.82867431640625, -1.755096435546875, -1.6815185546875, -1.607940673828125, -1.53436279296875, -1.460784912109375, -1.38720703125, -1.313629150390625, -1.24005126953125, -1.166473388671875, -1.0928955078125, -1.019317626953125, -0.94573974609375, -0.872161865234375, -0.798583984375, -0.725006103515625, -0.65142822265625, -0.577850341796875, -0.5042724609375, -0.430694580078125, -0.35711669921875, -0.283538818359375, -0.2099609375, -0.136383056640625, -0.06280517578125, 0.010772705078125, 0.0843505859375, 0.157928466796875, 0.23150634765625, 0.305084228515625, 0.378662109375, 0.452239990234375, 0.52581787109375, 0.599395751953125, 0.6729736328125, 0.746551513671875, 0.82012939453125, 0.893707275390625, 0.96728515625, 1.040863037109375, 1.11444091796875, 1.188018798828125, 1.2615966796875, 1.335174560546875, 1.40875244140625, 1.482330322265625, 1.555908203125, 1.629486083984375, 1.70306396484375, 1.776641845703125, 1.8502197265625, 1.923797607421875, 1.99737548828125, 2.070953369140625, 2.14453125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 4.0, 3.0, 11.0, 13.0, 11.0, 16.0, 14.0, 24.0, 24.0, 30.0, 31.0, 45.0, 53.0, 78.0, 75.0, 86.0, 110.0, 185.0, 363.0, 940.0, 4026.0, 31182.0, 739858.0, 252058.0, 15186.0, 2455.0, 651.0, 292.0, 171.0, 101.0, 92.0, 69.0, 56.0, 50.0, 41.0, 26.0, 22.0, 17.0, 15.0, 18.0, 11.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.078125, -27.167724609375, -26.25732421875, -25.346923828125, -24.4365234375, -23.526123046875, -22.61572265625, -21.705322265625, -20.794921875, -19.884521484375, -18.97412109375, -18.063720703125, -17.1533203125, -16.242919921875, -15.33251953125, -14.422119140625, -13.51171875, -12.601318359375, -11.69091796875, -10.780517578125, -9.8701171875, -8.959716796875, -8.04931640625, -7.138916015625, -6.228515625, -5.318115234375, -4.40771484375, -3.497314453125, -2.5869140625, -1.676513671875, -0.76611328125, 0.144287109375, 1.0546875, 1.965087890625, 2.87548828125, 3.785888671875, 4.6962890625, 5.606689453125, 6.51708984375, 7.427490234375, 8.337890625, 9.248291015625, 10.15869140625, 11.069091796875, 11.9794921875, 12.889892578125, 13.80029296875, 14.710693359375, 15.62109375, 16.531494140625, 17.44189453125, 18.352294921875, 19.2626953125, 20.173095703125, 21.08349609375, 21.993896484375, 22.904296875, 23.814697265625, 24.72509765625, 25.635498046875, 26.5458984375, 27.456298828125, 28.36669921875, 29.277099609375, 30.1875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 22.0, 64.0, 218.0, 361.0, 217.0, 92.0, 24.0, 4.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.78233528137207, -17.28201675415039, -16.78169822692871, -16.281381607055664, -15.781063079833984, -15.280744552612305, -14.780426025390625, -14.280108451843262, -13.779790878295898, -13.279472351074219, -12.779154777526855, -12.278836250305176, -11.778518676757812, -11.278200149536133, -10.777881622314453, -10.27756404876709, -9.77724552154541, -9.27692699432373, -8.776609420776367, -8.276290893554688, -7.775973320007324, -7.2756547927856445, -6.775336742401123, -6.275018692016602, -5.77470064163208, -5.274382591247559, -4.774064540863037, -4.273746490478516, -3.773428201675415, -3.2731101512908936, -2.772791862487793, -2.2724738121032715, -1.77215576171875, -1.2718377113342285, -0.7715195417404175, -0.27120137214660645, 0.22911667823791504, 0.7294347286224365, 1.229753017425537, 1.7300710678100586, 2.23038911819458, 2.7307071685791016, 3.231025218963623, 3.7313435077667236, 4.231661796569824, 4.7319793701171875, 5.232297897338867, 5.732615947723389, 6.23293399810791, 6.733252048492432, 7.233570098876953, 7.733888626098633, 8.234206199645996, 8.734524726867676, 9.234842300415039, 9.735160827636719, 10.235479354858398, 10.735797882080078, 11.236115455627441, 11.736433982849121, 12.236751556396484, 12.737070083618164, 13.237388610839844, 13.737706184387207, 14.23802375793457]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 6.0, 6.0, 6.0, 6.0, 6.0, 5.0, 13.0, 13.0, 15.0, 15.0, 17.0, 18.0, 27.0, 27.0, 26.0, 28.0, 37.0, 36.0, 29.0, 36.0, 41.0, 37.0, 48.0, 34.0, 39.0, 39.0, 34.0, 31.0, 33.0, 32.0, 31.0, 34.0, 29.0, 20.0, 15.0, 17.0, 14.0, 15.0, 16.0, 15.0, 16.0, 7.0, 8.0, 7.0, 3.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.8897461891174316, -2.7988765239715576, -2.7080070972442627, -2.6171374320983887, -2.5262680053710938, -2.4353983402252197, -2.3445286750793457, -2.253659248352051, -2.162789821624756, -2.071920156478882, -1.981050729751587, -1.890181064605713, -1.799311637878418, -1.708441972732544, -1.6175724267959595, -1.526702880859375, -1.435833215713501, -1.3449636697769165, -1.254094123840332, -1.163224458694458, -1.072355031967163, -0.9814854264259338, -0.8906158208847046, -0.7997462749481201, -0.7088767290115356, -0.6180071830749512, -0.5271376371383667, -0.43626803159713745, -0.345398485660553, -0.2545289397239685, -0.16365933418273926, -0.07278978824615479, 0.018079757690429688, 0.10894931852817535, 0.19981887936592102, 0.2906884551048279, 0.38155800104141235, 0.4724275469779968, 0.5632971525192261, 0.6541666984558105, 0.745036244392395, 0.8359057903289795, 0.926775336265564, 1.0176448822021484, 1.1085145473480225, 1.1993839740753174, 1.2902536392211914, 1.3811231851577759, 1.4719927310943604, 1.5628622770309448, 1.6537318229675293, 1.7446014881134033, 1.8354709148406982, 1.9263405799865723, 2.017210006713867, 2.108079671859741, 2.1989493370056152, 2.2898190021514893, 2.380688428878784, 2.471558094024658, 2.562427520751953, 2.653297185897827, 2.744166851043701, 2.835036277770996, 2.925905704498291]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 6.0, 9.0, 14.0, 9.0, 11.0, 15.0, 18.0, 21.0, 25.0, 34.0, 38.0, 36.0, 39.0, 48.0, 56.0, 53.0, 62.0, 64.0, 55.0, 55.0, 46.0, 33.0, 35.0, 38.0, 35.0, 30.0, 21.0, 15.0, 8.0, 9.0, 16.0, 10.0, 10.0, 9.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.318511962890625, -4.18780517578125, -4.057098388671875, -3.9263916015625, -3.795684814453125, -3.66497802734375, -3.534271240234375, -3.403564453125, -3.272857666015625, -3.14215087890625, -3.011444091796875, -2.8807373046875, -2.750030517578125, -2.61932373046875, -2.488616943359375, -2.35791015625, -2.227203369140625, -2.09649658203125, -1.965789794921875, -1.8350830078125, -1.704376220703125, -1.57366943359375, -1.442962646484375, -1.312255859375, -1.181549072265625, -1.05084228515625, -0.920135498046875, -0.7894287109375, -0.658721923828125, -0.52801513671875, -0.397308349609375, -0.2666015625, -0.135894775390625, -0.00518798828125, 0.125518798828125, 0.2562255859375, 0.386932373046875, 0.51763916015625, 0.648345947265625, 0.779052734375, 0.909759521484375, 1.04046630859375, 1.171173095703125, 1.3018798828125, 1.432586669921875, 1.56329345703125, 1.694000244140625, 1.82470703125, 1.955413818359375, 2.08612060546875, 2.216827392578125, 2.3475341796875, 2.478240966796875, 2.60894775390625, 2.739654541015625, 2.870361328125, 3.001068115234375, 3.13177490234375, 3.262481689453125, 3.3931884765625, 3.523895263671875, 3.65460205078125, 3.785308837890625, 3.916015625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 5.0, 6.0, 6.0, 19.0, 27.0, 27.0, 47.0, 63.0, 113.0, 141.0, 225.0, 335.0, 497.0, 839.0, 1290.0, 2118.0, 3741.0, 6894.0, 15830.0, 73771.0, 752218.0, 149904.0, 21187.0, 8345.0, 4310.0, 2432.0, 1473.0, 915.0, 564.0, 381.0, 288.0, 180.0, 101.0, 77.0, 60.0, 39.0, 31.0, 15.0, 16.0, 8.0, 8.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3203125, -9.9720458984375, -9.623779296875, -9.2755126953125, -8.92724609375, -8.5789794921875, -8.230712890625, -7.8824462890625, -7.5341796875, -7.1859130859375, -6.837646484375, -6.4893798828125, -6.14111328125, -5.7928466796875, -5.444580078125, -5.0963134765625, -4.748046875, -4.3997802734375, -4.051513671875, -3.7032470703125, -3.35498046875, -3.0067138671875, -2.658447265625, -2.3101806640625, -1.9619140625, -1.6136474609375, -1.265380859375, -0.9171142578125, -0.56884765625, -0.2205810546875, 0.127685546875, 0.4759521484375, 0.82421875, 1.1724853515625, 1.520751953125, 1.8690185546875, 2.21728515625, 2.5655517578125, 2.913818359375, 3.2620849609375, 3.6103515625, 3.9586181640625, 4.306884765625, 4.6551513671875, 5.00341796875, 5.3516845703125, 5.699951171875, 6.0482177734375, 6.396484375, 6.7447509765625, 7.093017578125, 7.4412841796875, 7.78955078125, 8.1378173828125, 8.486083984375, 8.8343505859375, 9.1826171875, 9.5308837890625, 9.879150390625, 10.2274169921875, 10.57568359375, 10.9239501953125, 11.272216796875, 11.6204833984375, 11.96875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 8.0, 15.0, 16.0, 13.0, 21.0, 37.0, 35.0, 34.0, 44.0, 43.0, 63.0, 68.0, 90.0, 133.0, 1605.0, 265.0, 118.0, 70.0, 54.0, 48.0, 41.0, 38.0, 32.0, 30.0, 30.0, 30.0, 11.0, 13.0, 10.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.703125, -16.142578125, -15.58203125, -15.021484375, -14.4609375, -13.900390625, -13.33984375, -12.779296875, -12.21875, -11.658203125, -11.09765625, -10.537109375, -9.9765625, -9.416015625, -8.85546875, -8.294921875, -7.734375, -7.173828125, -6.61328125, -6.052734375, -5.4921875, -4.931640625, -4.37109375, -3.810546875, -3.25, -2.689453125, -2.12890625, -1.568359375, -1.0078125, -0.447265625, 0.11328125, 0.673828125, 1.234375, 1.794921875, 2.35546875, 2.916015625, 3.4765625, 4.037109375, 4.59765625, 5.158203125, 5.71875, 6.279296875, 6.83984375, 7.400390625, 7.9609375, 8.521484375, 9.08203125, 9.642578125, 10.203125, 10.763671875, 11.32421875, 11.884765625, 12.4453125, 13.005859375, 13.56640625, 14.126953125, 14.6875, 15.248046875, 15.80859375, 16.369140625, 16.9296875, 17.490234375, 18.05078125, 18.611328125, 19.171875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 11.0, 12.0, 31.0, 41.0, 55.0, 90.0, 139.0, 222.0, 381.0, 611.0, 1257.0, 2916.0, 9205.0, 73875.0, 2996055.0, 47936.0, 7654.0, 2595.0, 1150.0, 579.0, 315.0, 226.0, 136.0, 76.0, 52.0, 33.0, 21.0, 14.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.625, -48.0458984375, -46.466796875, -44.8876953125, -43.30859375, -41.7294921875, -40.150390625, -38.5712890625, -36.9921875, -35.4130859375, -33.833984375, -32.2548828125, -30.67578125, -29.0966796875, -27.517578125, -25.9384765625, -24.359375, -22.7802734375, -21.201171875, -19.6220703125, -18.04296875, -16.4638671875, -14.884765625, -13.3056640625, -11.7265625, -10.1474609375, -8.568359375, -6.9892578125, -5.41015625, -3.8310546875, -2.251953125, -0.6728515625, 0.90625, 2.4853515625, 4.064453125, 5.6435546875, 7.22265625, 8.8017578125, 10.380859375, 11.9599609375, 13.5390625, 15.1181640625, 16.697265625, 18.2763671875, 19.85546875, 21.4345703125, 23.013671875, 24.5927734375, 26.171875, 27.7509765625, 29.330078125, 30.9091796875, 32.48828125, 34.0673828125, 35.646484375, 37.2255859375, 38.8046875, 40.3837890625, 41.962890625, 43.5419921875, 45.12109375, 46.7001953125, 48.279296875, 49.8583984375, 51.4375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 11.0, 786.0, 217.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1423.282958984375, -1399.080810546875, -1374.8787841796875, -1350.6766357421875, -1326.4744873046875, -1302.2723388671875, -1278.0703125, -1253.8681640625, -1229.666015625, -1205.4638671875, -1181.2618408203125, -1157.0596923828125, -1132.8575439453125, -1108.6553955078125, -1084.453369140625, -1060.251220703125, -1036.049072265625, -1011.8469848632812, -987.6448364257812, -963.4427490234375, -939.2406005859375, -915.0385131835938, -890.8363647460938, -866.63427734375, -842.4321899414062, -818.2301025390625, -794.0279541015625, -769.8258666992188, -745.6237182617188, -721.421630859375, -697.219482421875, -673.0173950195312, -648.815185546875, -624.6130981445312, -600.4109497070312, -576.2088623046875, -552.0067138671875, -527.8046264648438, -503.60247802734375, -479.400390625, -455.1982727050781, -430.99615478515625, -406.7940368652344, -382.5919189453125, -358.3898010253906, -334.18768310546875, -309.985595703125, -285.783447265625, -261.58135986328125, -237.37924194335938, -213.1771240234375, -188.97500610351562, -164.77288818359375, -140.57077026367188, -116.36866760253906, -92.16654968261719, -67.96442413330078, -43.762306213378906, -19.560192108154297, 4.6419219970703125, 28.844039916992188, 53.04615783691406, 77.2482681274414, 101.45038604736328, 125.65250396728516]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 8.0, 7.0, 6.0, 9.0, 13.0, 21.0, 23.0, 14.0, 25.0, 22.0, 21.0, 30.0, 26.0, 30.0, 26.0, 48.0, 47.0, 27.0, 45.0, 40.0, 38.0, 44.0, 50.0, 47.0, 36.0, 37.0, 31.0, 23.0, 30.0, 17.0, 20.0, 27.0, 16.0, 9.0, 22.0, 11.0, 11.0, 11.0, 10.0, 3.0, 5.0, 4.0, 1.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-49.65642166137695, -48.06755447387695, -46.47868347167969, -44.88981628417969, -43.30094909667969, -41.71207809448242, -40.12321090698242, -38.534339904785156, -36.945472717285156, -35.356605529785156, -33.76773452758789, -32.17886734008789, -30.589998245239258, -29.001129150390625, -27.412261962890625, -25.823392868041992, -24.23452377319336, -22.645654678344727, -21.056785583496094, -19.467918395996094, -17.87904930114746, -16.290180206298828, -14.701312065124512, -13.112443923950195, -11.523574829101562, -9.93470573425293, -8.345837593078613, -6.756968975067139, -5.168100357055664, -3.5792317390441895, -1.9903631210327148, -0.40149497985839844, 1.1873779296875, 2.7762465476989746, 4.365115165710449, 5.953983783721924, 7.542852401733398, 9.131721496582031, 10.720589637756348, 12.309457778930664, 13.898326873779297, 15.48719596862793, 17.076065063476562, 18.664932250976562, 20.253801345825195, 21.842670440673828, 23.431537628173828, 25.02040672302246, 26.609275817871094, 28.198144912719727, 29.78701400756836, 31.37588119506836, 32.964752197265625, 34.553619384765625, 36.142486572265625, 37.731353759765625, 39.32022476196289, 40.90909194946289, 42.497962951660156, 44.086830139160156, 45.675697326660156, 47.26456832885742, 48.85343551635742, 50.44230651855469, 52.03117370605469]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 6.0, 8.0, 4.0, 9.0, 13.0, 19.0, 15.0, 27.0, 18.0, 20.0, 33.0, 33.0, 37.0, 40.0, 45.0, 48.0, 46.0, 49.0, 70.0, 48.0, 53.0, 42.0, 40.0, 43.0, 31.0, 29.0, 20.0, 29.0, 20.0, 17.0, 17.0, 13.0, 9.0, 9.0, 8.0, 5.0, 9.0, 1.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.19140625, -4.0614013671875, -3.931396484375, -3.8013916015625, -3.67138671875, -3.5413818359375, -3.411376953125, -3.2813720703125, -3.1513671875, -3.0213623046875, -2.891357421875, -2.7613525390625, -2.63134765625, -2.5013427734375, -2.371337890625, -2.2413330078125, -2.111328125, -1.9813232421875, -1.851318359375, -1.7213134765625, -1.59130859375, -1.4613037109375, -1.331298828125, -1.2012939453125, -1.0712890625, -0.9412841796875, -0.811279296875, -0.6812744140625, -0.55126953125, -0.4212646484375, -0.291259765625, -0.1612548828125, -0.03125, 0.0987548828125, 0.228759765625, 0.3587646484375, 0.48876953125, 0.6187744140625, 0.748779296875, 0.8787841796875, 1.0087890625, 1.1387939453125, 1.268798828125, 1.3988037109375, 1.52880859375, 1.6588134765625, 1.788818359375, 1.9188232421875, 2.048828125, 2.1788330078125, 2.308837890625, 2.4388427734375, 2.56884765625, 2.6988525390625, 2.828857421875, 2.9588623046875, 3.0888671875, 3.2188720703125, 3.348876953125, 3.4788818359375, 3.60888671875, 3.7388916015625, 3.868896484375, 3.9989013671875, 4.12890625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 9.0, 6.0, 16.0, 14.0, 15.0, 32.0, 46.0, 68.0, 95.0, 146.0, 223.0, 284.0, 466.0, 649.0, 907.0, 1309.0, 2137.0, 2922.0, 4858.0, 8137.0, 14812.0, 31503.0, 123312.0, 2522962.0, 1336536.0, 81986.0, 26569.0, 13157.0, 7592.0, 4594.0, 2884.0, 1876.0, 1223.0, 904.0, 566.0, 441.0, 318.0, 215.0, 159.0, 103.0, 75.0, 45.0, 37.0, 22.0, 28.0, 8.0, 5.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-14.65625, -14.223876953125, -13.79150390625, -13.359130859375, -12.9267578125, -12.494384765625, -12.06201171875, -11.629638671875, -11.197265625, -10.764892578125, -10.33251953125, -9.900146484375, -9.4677734375, -9.035400390625, -8.60302734375, -8.170654296875, -7.73828125, -7.305908203125, -6.87353515625, -6.441162109375, -6.0087890625, -5.576416015625, -5.14404296875, -4.711669921875, -4.279296875, -3.846923828125, -3.41455078125, -2.982177734375, -2.5498046875, -2.117431640625, -1.68505859375, -1.252685546875, -0.8203125, -0.387939453125, 0.04443359375, 0.476806640625, 0.9091796875, 1.341552734375, 1.77392578125, 2.206298828125, 2.638671875, 3.071044921875, 3.50341796875, 3.935791015625, 4.3681640625, 4.800537109375, 5.23291015625, 5.665283203125, 6.09765625, 6.530029296875, 6.96240234375, 7.394775390625, 7.8271484375, 8.259521484375, 8.69189453125, 9.124267578125, 9.556640625, 9.989013671875, 10.42138671875, 10.853759765625, 11.2861328125, 11.718505859375, 12.15087890625, 12.583251953125, 13.015625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 4.0, 10.0, 4.0, 13.0, 14.0, 17.0, 29.0, 28.0, 43.0, 52.0, 69.0, 132.0, 201.0, 407.0, 634.0, 887.0, 637.0, 353.0, 162.0, 92.0, 61.0, 44.0, 38.0, 33.0, 22.0, 17.0, 10.0, 5.0, 9.0, 7.0, 8.0, 6.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.9453125, -15.5194091796875, -15.093505859375, -14.6676025390625, -14.24169921875, -13.8157958984375, -13.389892578125, -12.9639892578125, -12.5380859375, -12.1121826171875, -11.686279296875, -11.2603759765625, -10.83447265625, -10.4085693359375, -9.982666015625, -9.5567626953125, -9.130859375, -8.7049560546875, -8.279052734375, -7.8531494140625, -7.42724609375, -7.0013427734375, -6.575439453125, -6.1495361328125, -5.7236328125, -5.2977294921875, -4.871826171875, -4.4459228515625, -4.02001953125, -3.5941162109375, -3.168212890625, -2.7423095703125, -2.31640625, -1.8905029296875, -1.464599609375, -1.0386962890625, -0.61279296875, -0.1868896484375, 0.239013671875, 0.6649169921875, 1.0908203125, 1.5167236328125, 1.942626953125, 2.3685302734375, 2.79443359375, 3.2203369140625, 3.646240234375, 4.0721435546875, 4.498046875, 4.9239501953125, 5.349853515625, 5.7757568359375, 6.20166015625, 6.6275634765625, 7.053466796875, 7.4793701171875, 7.9052734375, 8.3311767578125, 8.757080078125, 9.1829833984375, 9.60888671875, 10.0347900390625, 10.460693359375, 10.8865966796875, 11.3125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 9.0, 12.0, 6.0, 13.0, 17.0, 30.0, 39.0, 75.0, 110.0, 156.0, 300.0, 557.0, 981.0, 1757.0, 3420.0, 7092.0, 16184.0, 43541.0, 184805.0, 3035665.0, 771189.0, 81430.0, 26007.0, 10509.0, 4898.0, 2483.0, 1228.0, 716.0, 402.0, 239.0, 146.0, 81.0, 51.0, 47.0, 27.0, 24.0, 12.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-28.9375, -28.150146484375, -27.36279296875, -26.575439453125, -25.7880859375, -25.000732421875, -24.21337890625, -23.426025390625, -22.638671875, -21.851318359375, -21.06396484375, -20.276611328125, -19.4892578125, -18.701904296875, -17.91455078125, -17.127197265625, -16.33984375, -15.552490234375, -14.76513671875, -13.977783203125, -13.1904296875, -12.403076171875, -11.61572265625, -10.828369140625, -10.041015625, -9.253662109375, -8.46630859375, -7.678955078125, -6.8916015625, -6.104248046875, -5.31689453125, -4.529541015625, -3.7421875, -2.954833984375, -2.16748046875, -1.380126953125, -0.5927734375, 0.194580078125, 0.98193359375, 1.769287109375, 2.556640625, 3.343994140625, 4.13134765625, 4.918701171875, 5.7060546875, 6.493408203125, 7.28076171875, 8.068115234375, 8.85546875, 9.642822265625, 10.43017578125, 11.217529296875, 12.0048828125, 12.792236328125, 13.57958984375, 14.366943359375, 15.154296875, 15.941650390625, 16.72900390625, 17.516357421875, 18.3037109375, 19.091064453125, 19.87841796875, 20.665771484375, 21.453125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 11.0, 22.0, 83.0, 288.0, 431.0, 123.0, 34.0, 16.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-243.83172607421875, -236.282958984375, -228.7342071533203, -221.18544006347656, -213.63668823242188, -206.08792114257812, -198.53915405273438, -190.9904022216797, -183.44163513183594, -175.8928680419922, -168.3441162109375, -160.79534912109375, -153.24659729003906, -145.6978302001953, -138.14907836914062, -130.60031127929688, -123.05155181884766, -115.50279235839844, -107.95403289794922, -100.4052734375, -92.85650634765625, -85.30774688720703, -77.75898742675781, -70.21022033691406, -62.66146469116211, -55.11270523071289, -47.563941955566406, -40.01518249511719, -32.46642303466797, -24.917659759521484, -17.368900299072266, -9.820137023925781, -2.2713775634765625, 5.277383327484131, 12.826144218444824, 20.37490463256836, 27.92366600036621, 35.47242736816406, 43.02118682861328, 50.569950103759766, 58.118709564208984, 65.66747283935547, 73.21623229980469, 80.7649917602539, 88.31375122070312, 95.86251831054688, 103.41127014160156, 110.96003723144531, 118.50879669189453, 126.05755615234375, 133.6063232421875, 141.1550750732422, 148.70384216308594, 156.25259399414062, 163.80136108398438, 171.35012817382812, 178.8988800048828, 186.44764709472656, 193.99639892578125, 201.545166015625, 209.0939178466797, 216.64268493652344, 224.19143676757812, 231.74020385742188, 239.28897094726562]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 7.0, 1.0, 10.0, 12.0, 8.0, 10.0, 13.0, 13.0, 20.0, 20.0, 19.0, 23.0, 29.0, 24.0, 37.0, 32.0, 42.0, 39.0, 37.0, 42.0, 47.0, 47.0, 45.0, 39.0, 48.0, 29.0, 46.0, 27.0, 31.0, 29.0, 25.0, 24.0, 28.0, 16.0, 14.0, 14.0, 12.0, 10.0, 10.0, 3.0, 5.0, 7.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.5467529296875, -34.332035064697266, -33.117313385009766, -31.90259552001953, -30.687875747680664, -29.473155975341797, -28.25843620300293, -27.043716430664062, -25.828998565673828, -24.61427879333496, -23.399559020996094, -22.18484115600586, -20.970121383666992, -19.755401611328125, -18.540681838989258, -17.32596206665039, -16.111242294311523, -14.896522521972656, -13.681803703308105, -12.467083930969238, -11.252365112304688, -10.03764533996582, -8.822925567626953, -7.608206748962402, -6.393486976623535, -5.178767681121826, -3.964048147201538, -2.74932861328125, -1.534609317779541, -0.31989002227783203, 0.8948297500610352, 2.109548568725586, 3.324268341064453, 4.538987636566162, 5.753706932067871, 6.968426704406738, 8.183145523071289, 9.397865295410156, 10.612585067749023, 11.827303886413574, 13.042023658752441, 14.256743431091309, 15.47146224975586, 16.686182022094727, 17.900901794433594, 19.115619659423828, 20.330341339111328, 21.545059204101562, 22.75977897644043, 23.974498748779297, 25.189218521118164, 26.40393829345703, 27.618656158447266, 28.833375930786133, 30.048095703125, 31.262813568115234, 32.477535247802734, 33.69225311279297, 34.90697479248047, 36.1216926574707, 37.3364143371582, 38.55113220214844, 39.76585388183594, 40.98057174682617, 42.195289611816406]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 11.0, 10.0, 8.0, 8.0, 12.0, 6.0, 10.0, 11.0, 25.0, 23.0, 23.0, 32.0, 31.0, 30.0, 39.0, 39.0, 40.0, 38.0, 46.0, 42.0, 45.0, 36.0, 49.0, 32.0, 37.0, 42.0, 34.0, 36.0, 32.0, 21.0, 19.0, 18.0, 19.0, 10.0, 16.0, 13.0, 7.0, 7.0, 5.0, 8.0, 6.0, 8.0, 7.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0], "bins": [-4.1015625, -3.9818115234375, -3.862060546875, -3.7423095703125, -3.62255859375, -3.5028076171875, -3.383056640625, -3.2633056640625, -3.1435546875, -3.0238037109375, -2.904052734375, -2.7843017578125, -2.66455078125, -2.5447998046875, -2.425048828125, -2.3052978515625, -2.185546875, -2.0657958984375, -1.946044921875, -1.8262939453125, -1.70654296875, -1.5867919921875, -1.467041015625, -1.3472900390625, -1.2275390625, -1.1077880859375, -0.988037109375, -0.8682861328125, -0.74853515625, -0.6287841796875, -0.509033203125, -0.3892822265625, -0.26953125, -0.1497802734375, -0.030029296875, 0.0897216796875, 0.20947265625, 0.3292236328125, 0.448974609375, 0.5687255859375, 0.6884765625, 0.8082275390625, 0.927978515625, 1.0477294921875, 1.16748046875, 1.2872314453125, 1.406982421875, 1.5267333984375, 1.646484375, 1.7662353515625, 1.885986328125, 2.0057373046875, 2.12548828125, 2.2452392578125, 2.364990234375, 2.4847412109375, 2.6044921875, 2.7242431640625, 2.843994140625, 2.9637451171875, 3.08349609375, 3.2032470703125, 3.322998046875, 3.4427490234375, 3.5625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 1.0, 8.0, 14.0, 12.0, 15.0, 38.0, 54.0, 69.0, 110.0, 156.0, 237.0, 333.0, 425.0, 689.0, 924.0, 1350.0, 1884.0, 2697.0, 3850.0, 5708.0, 8723.0, 13782.0, 22409.0, 38755.0, 70427.0, 142159.0, 333676.0, 192785.0, 86617.0, 46898.0, 26747.0, 16115.0, 10083.0, 6438.0, 4291.0, 3019.0, 2114.0, 1462.0, 987.0, 759.0, 482.0, 381.0, 300.0, 175.0, 130.0, 84.0, 54.0, 42.0, 31.0, 22.0, 11.0, 12.0, 5.0, 4.0, 2.0, 4.0, 3.0], "bins": [-13.765625, -13.356689453125, -12.94775390625, -12.538818359375, -12.1298828125, -11.720947265625, -11.31201171875, -10.903076171875, -10.494140625, -10.085205078125, -9.67626953125, -9.267333984375, -8.8583984375, -8.449462890625, -8.04052734375, -7.631591796875, -7.22265625, -6.813720703125, -6.40478515625, -5.995849609375, -5.5869140625, -5.177978515625, -4.76904296875, -4.360107421875, -3.951171875, -3.542236328125, -3.13330078125, -2.724365234375, -2.3154296875, -1.906494140625, -1.49755859375, -1.088623046875, -0.6796875, -0.270751953125, 0.13818359375, 0.547119140625, 0.9560546875, 1.364990234375, 1.77392578125, 2.182861328125, 2.591796875, 3.000732421875, 3.40966796875, 3.818603515625, 4.2275390625, 4.636474609375, 5.04541015625, 5.454345703125, 5.86328125, 6.272216796875, 6.68115234375, 7.090087890625, 7.4990234375, 7.907958984375, 8.31689453125, 8.725830078125, 9.134765625, 9.543701171875, 9.95263671875, 10.361572265625, 10.7705078125, 11.179443359375, 11.58837890625, 11.997314453125, 12.40625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 14.0, 14.0, 11.0, 14.0, 21.0, 20.0, 19.0, 26.0, 20.0, 26.0, 27.0, 28.0, 39.0, 18.0, 37.0, 36.0, 43.0, 30.0, 28.0, 1058.0, 29.0, 31.0, 28.0, 48.0, 34.0, 32.0, 29.0, 28.0, 20.0, 25.0, 29.0, 10.0, 14.0, 29.0, 10.0, 17.0, 13.0, 16.0, 11.0, 9.0, 3.0, 6.0, 8.0, 4.0, 0.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0], "bins": [-3.57421875, -3.46246337890625, -3.3507080078125, -3.23895263671875, -3.127197265625, -3.01544189453125, -2.9036865234375, -2.79193115234375, -2.68017578125, -2.56842041015625, -2.4566650390625, -2.34490966796875, -2.233154296875, -2.12139892578125, -2.0096435546875, -1.89788818359375, -1.7861328125, -1.67437744140625, -1.5626220703125, -1.45086669921875, -1.339111328125, -1.22735595703125, -1.1156005859375, -1.00384521484375, -0.89208984375, -0.78033447265625, -0.6685791015625, -0.55682373046875, -0.445068359375, -0.33331298828125, -0.2215576171875, -0.10980224609375, 0.001953125, 0.11370849609375, 0.2254638671875, 0.33721923828125, 0.448974609375, 0.56072998046875, 0.6724853515625, 0.78424072265625, 0.89599609375, 1.00775146484375, 1.1195068359375, 1.23126220703125, 1.343017578125, 1.45477294921875, 1.5665283203125, 1.67828369140625, 1.7900390625, 1.90179443359375, 2.0135498046875, 2.12530517578125, 2.237060546875, 2.34881591796875, 2.4605712890625, 2.57232666015625, 2.68408203125, 2.79583740234375, 2.9075927734375, 3.01934814453125, 3.131103515625, 3.24285888671875, 3.3546142578125, 3.46636962890625, 3.578125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 5.0, 3.0, 3.0, 6.0, 9.0, 6.0, 11.0, 13.0, 24.0, 26.0, 51.0, 54.0, 81.0, 106.0, 154.0, 219.0, 273.0, 435.0, 561.0, 864.0, 1379.0, 2119.0, 3468.0, 5721.0, 10205.0, 20316.0, 47352.0, 169155.0, 1348353.0, 356214.0, 70817.0, 27314.0, 13216.0, 7121.0, 4081.0, 2513.0, 1547.0, 1005.0, 704.0, 451.0, 310.0, 238.0, 167.0, 121.0, 78.0, 83.0, 48.0, 39.0, 29.0, 15.0, 16.0, 16.0, 11.0, 7.0, 5.0, 1.0, 1.0, 2.0, 5.0, 1.0], "bins": [-17.796875, -17.25244140625, -16.7080078125, -16.16357421875, -15.619140625, -15.07470703125, -14.5302734375, -13.98583984375, -13.44140625, -12.89697265625, -12.3525390625, -11.80810546875, -11.263671875, -10.71923828125, -10.1748046875, -9.63037109375, -9.0859375, -8.54150390625, -7.9970703125, -7.45263671875, -6.908203125, -6.36376953125, -5.8193359375, -5.27490234375, -4.73046875, -4.18603515625, -3.6416015625, -3.09716796875, -2.552734375, -2.00830078125, -1.4638671875, -0.91943359375, -0.375, 0.16943359375, 0.7138671875, 1.25830078125, 1.802734375, 2.34716796875, 2.8916015625, 3.43603515625, 3.98046875, 4.52490234375, 5.0693359375, 5.61376953125, 6.158203125, 6.70263671875, 7.2470703125, 7.79150390625, 8.3359375, 8.88037109375, 9.4248046875, 9.96923828125, 10.513671875, 11.05810546875, 11.6025390625, 12.14697265625, 12.69140625, 13.23583984375, 13.7802734375, 14.32470703125, 14.869140625, 15.41357421875, 15.9580078125, 16.50244140625, 17.046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 5.0, 14.0, 8.0, 15.0, 23.0, 35.0, 37.0, 59.0, 86.0, 187.0, 180.0, 80.0, 54.0, 51.0, 36.0, 23.0, 16.0, 18.0, 7.0, 8.0, 9.0, 7.0, 4.0, 1.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.16796875, -6.95721435546875, -6.7464599609375, -6.53570556640625, -6.324951171875, -6.11419677734375, -5.9034423828125, -5.69268798828125, -5.48193359375, -5.27117919921875, -5.0604248046875, -4.84967041015625, -4.638916015625, -4.42816162109375, -4.2174072265625, -4.00665283203125, -3.7958984375, -3.58514404296875, -3.3743896484375, -3.16363525390625, -2.952880859375, -2.74212646484375, -2.5313720703125, -2.32061767578125, -2.10986328125, -1.89910888671875, -1.6883544921875, -1.47760009765625, -1.266845703125, -1.05609130859375, -0.8453369140625, -0.63458251953125, -0.423828125, -0.21307373046875, -0.0023193359375, 0.20843505859375, 0.419189453125, 0.62994384765625, 0.8406982421875, 1.05145263671875, 1.26220703125, 1.47296142578125, 1.6837158203125, 1.89447021484375, 2.105224609375, 2.31597900390625, 2.5267333984375, 2.73748779296875, 2.9482421875, 3.15899658203125, 3.3697509765625, 3.58050537109375, 3.791259765625, 4.00201416015625, 4.2127685546875, 4.42352294921875, 4.63427734375, 4.84503173828125, 5.0557861328125, 5.26654052734375, 5.477294921875, 5.68804931640625, 5.8988037109375, 6.10955810546875, 6.3203125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 4.0, 3.0, 4.0, 8.0, 3.0, 7.0, 3.0, 10.0, 12.0, 13.0, 23.0, 11.0, 25.0, 31.0, 57.0, 89.0, 122.0, 275.0, 638.0, 1743.0, 5806.0, 34230.0, 935610.0, 58650.0, 7508.0, 2108.0, 704.0, 330.0, 176.0, 101.0, 62.0, 32.0, 38.0, 29.0, 14.0, 12.0, 14.0, 9.0, 12.0, 7.0, 4.0, 8.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-77.875, -75.556640625, -73.23828125, -70.919921875, -68.6015625, -66.283203125, -63.96484375, -61.646484375, -59.328125, -57.009765625, -54.69140625, -52.373046875, -50.0546875, -47.736328125, -45.41796875, -43.099609375, -40.78125, -38.462890625, -36.14453125, -33.826171875, -31.5078125, -29.189453125, -26.87109375, -24.552734375, -22.234375, -19.916015625, -17.59765625, -15.279296875, -12.9609375, -10.642578125, -8.32421875, -6.005859375, -3.6875, -1.369140625, 0.94921875, 3.267578125, 5.5859375, 7.904296875, 10.22265625, 12.541015625, 14.859375, 17.177734375, 19.49609375, 21.814453125, 24.1328125, 26.451171875, 28.76953125, 31.087890625, 33.40625, 35.724609375, 38.04296875, 40.361328125, 42.6796875, 44.998046875, 47.31640625, 49.634765625, 51.953125, 54.271484375, 56.58984375, 58.908203125, 61.2265625, 63.544921875, 65.86328125, 68.181640625, 70.5]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 7.0, 18.0, 38.0, 83.0, 172.0, 296.0, 219.0, 76.0, 44.0, 26.0, 8.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.6009407043457, -37.73585891723633, -36.87077331542969, -36.00569152832031, -35.14060974121094, -34.2755241394043, -33.41044235229492, -32.54536056518555, -31.680274963378906, -30.8151912689209, -29.950109481811523, -29.085025787353516, -28.219942092895508, -27.3548583984375, -26.489776611328125, -25.624692916870117, -24.759611129760742, -23.894527435302734, -23.02944564819336, -22.16436195373535, -21.299278259277344, -20.43419647216797, -19.56911277770996, -18.704029083251953, -17.838947296142578, -16.97386360168457, -16.108781814575195, -15.243698120117188, -14.37861442565918, -13.513531684875488, -12.648448944091797, -11.783365249633789, -10.918281555175781, -10.05319881439209, -9.188115119934082, -8.32303237915039, -7.457949161529541, -6.592865943908691, -5.727783203125, -4.86269998550415, -3.997616767883301, -3.132533550262451, -2.2674505710601807, -1.4023675918579102, -0.5372843742370605, 0.32779884338378906, 1.1928815841674805, 2.05796480178833, 2.9230480194091797, 3.7881312370300293, 4.653214454650879, 5.51829719543457, 6.38338041305542, 7.2484636306762695, 8.113546371459961, 8.978630065917969, 9.84371280670166, 10.708795547485352, 11.57387924194336, 12.43896198272705, 13.304044723510742, 14.16912841796875, 15.034211158752441, 15.899293899536133, 16.76437759399414]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 5.0, 8.0, 9.0, 9.0, 15.0, 13.0, 20.0, 21.0, 29.0, 30.0, 45.0, 33.0, 43.0, 48.0, 41.0, 50.0, 50.0, 35.0, 49.0, 50.0, 60.0, 42.0, 28.0, 30.0, 38.0, 34.0, 21.0, 28.0, 20.0, 18.0, 16.0, 13.0, 8.0, 2.0, 4.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.751711845397949, -7.495659351348877, -7.239606857299805, -6.983554840087891, -6.727502346038818, -6.471449851989746, -6.215397834777832, -5.95934534072876, -5.7032928466796875, -5.447240352630615, -5.191187858581543, -4.935135841369629, -4.679083347320557, -4.423030853271484, -4.16697883605957, -3.910926342010498, -3.654873847961426, -3.3988213539123535, -3.1427690982818604, -2.886716842651367, -2.630664348602295, -2.3746118545532227, -2.1185595989227295, -1.8625072240829468, -1.606454849243164, -1.3504024744033813, -1.0943500995635986, -0.8382977247238159, -0.5822453498840332, -0.3261929750442505, -0.07014060020446777, 0.18591177463531494, 0.44196510314941406, 0.6980174779891968, 0.9540698528289795, 1.2101222276687622, 1.466174602508545, 1.7222269773483276, 1.9782793521881104, 2.2343316078186035, 2.490384101867676, 2.746436595916748, 3.002488851547241, 3.2585411071777344, 3.5145936012268066, 3.770646095275879, 4.026698112487793, 4.282750606536865, 4.5388031005859375, 4.79485559463501, 5.050908088684082, 5.306960105895996, 5.563012599945068, 5.819065093994141, 6.075117111206055, 6.331169605255127, 6.587222099304199, 6.8432745933532715, 7.099327087402344, 7.355379104614258, 7.61143159866333, 7.867484092712402, 8.123536109924316, 8.379589080810547, 8.635641098022461]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 5.0, 9.0, 5.0, 7.0, 14.0, 10.0, 21.0, 18.0, 16.0, 15.0, 32.0, 32.0, 39.0, 29.0, 27.0, 32.0, 47.0, 41.0, 41.0, 48.0, 44.0, 51.0, 38.0, 48.0, 44.0, 31.0, 38.0, 42.0, 14.0, 24.0, 22.0, 13.0, 21.0, 14.0, 11.0, 9.0, 8.0, 6.0, 5.0, 7.0, 6.0, 4.0, 5.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-4.171875, -4.048828125, -3.92578125, -3.802734375, -3.6796875, -3.556640625, -3.43359375, -3.310546875, -3.1875, -3.064453125, -2.94140625, -2.818359375, -2.6953125, -2.572265625, -2.44921875, -2.326171875, -2.203125, -2.080078125, -1.95703125, -1.833984375, -1.7109375, -1.587890625, -1.46484375, -1.341796875, -1.21875, -1.095703125, -0.97265625, -0.849609375, -0.7265625, -0.603515625, -0.48046875, -0.357421875, -0.234375, -0.111328125, 0.01171875, 0.134765625, 0.2578125, 0.380859375, 0.50390625, 0.626953125, 0.75, 0.873046875, 0.99609375, 1.119140625, 1.2421875, 1.365234375, 1.48828125, 1.611328125, 1.734375, 1.857421875, 1.98046875, 2.103515625, 2.2265625, 2.349609375, 2.47265625, 2.595703125, 2.71875, 2.841796875, 2.96484375, 3.087890625, 3.2109375, 3.333984375, 3.45703125, 3.580078125, 3.703125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 1.0, 3.0, 9.0, 8.0, 6.0, 22.0, 27.0, 45.0, 45.0, 59.0, 81.0, 127.0, 195.0, 267.0, 343.0, 572.0, 833.0, 1319.0, 2013.0, 3428.0, 6325.0, 13207.0, 34600.0, 153613.0, 609483.0, 157813.0, 34988.0, 13398.0, 6244.0, 3373.0, 2132.0, 1302.0, 867.0, 548.0, 362.0, 267.0, 185.0, 140.0, 81.0, 63.0, 50.0, 39.0, 28.0, 16.0, 8.0, 8.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-9.9296875, -9.6500244140625, -9.370361328125, -9.0906982421875, -8.81103515625, -8.5313720703125, -8.251708984375, -7.9720458984375, -7.6923828125, -7.4127197265625, -7.133056640625, -6.8533935546875, -6.57373046875, -6.2940673828125, -6.014404296875, -5.7347412109375, -5.455078125, -5.1754150390625, -4.895751953125, -4.6160888671875, -4.33642578125, -4.0567626953125, -3.777099609375, -3.4974365234375, -3.2177734375, -2.9381103515625, -2.658447265625, -2.3787841796875, -2.09912109375, -1.8194580078125, -1.539794921875, -1.2601318359375, -0.98046875, -0.7008056640625, -0.421142578125, -0.1414794921875, 0.13818359375, 0.4178466796875, 0.697509765625, 0.9771728515625, 1.2568359375, 1.5364990234375, 1.816162109375, 2.0958251953125, 2.37548828125, 2.6551513671875, 2.934814453125, 3.2144775390625, 3.494140625, 3.7738037109375, 4.053466796875, 4.3331298828125, 4.61279296875, 4.8924560546875, 5.172119140625, 5.4517822265625, 5.7314453125, 6.0111083984375, 6.290771484375, 6.5704345703125, 6.85009765625, 7.1297607421875, 7.409423828125, 7.6890869140625, 7.96875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 8.0, 4.0, 9.0, 6.0, 5.0, 13.0, 8.0, 10.0, 15.0, 16.0, 30.0, 29.0, 27.0, 26.0, 38.0, 48.0, 40.0, 43.0, 69.0, 98.0, 176.0, 1443.0, 269.0, 118.0, 73.0, 65.0, 54.0, 38.0, 42.0, 34.0, 38.0, 26.0, 23.0, 16.0, 19.0, 24.0, 13.0, 14.0, 4.0, 8.0, 5.0, 2.0, 2.0, 2.0, 6.0, 1.0, 0.0, 1.0], "bins": [-19.390625, -18.8768310546875, -18.363037109375, -17.8492431640625, -17.33544921875, -16.8216552734375, -16.307861328125, -15.7940673828125, -15.2802734375, -14.7664794921875, -14.252685546875, -13.7388916015625, -13.22509765625, -12.7113037109375, -12.197509765625, -11.6837158203125, -11.169921875, -10.6561279296875, -10.142333984375, -9.6285400390625, -9.11474609375, -8.6009521484375, -8.087158203125, -7.5733642578125, -7.0595703125, -6.5457763671875, -6.031982421875, -5.5181884765625, -5.00439453125, -4.4906005859375, -3.976806640625, -3.4630126953125, -2.94921875, -2.4354248046875, -1.921630859375, -1.4078369140625, -0.89404296875, -0.3802490234375, 0.133544921875, 0.6473388671875, 1.1611328125, 1.6749267578125, 2.188720703125, 2.7025146484375, 3.21630859375, 3.7301025390625, 4.243896484375, 4.7576904296875, 5.271484375, 5.7852783203125, 6.299072265625, 6.8128662109375, 7.32666015625, 7.8404541015625, 8.354248046875, 8.8680419921875, 9.3818359375, 9.8956298828125, 10.409423828125, 10.9232177734375, 11.43701171875, 11.9508056640625, 12.464599609375, 12.9783935546875, 13.4921875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 8.0, 8.0, 16.0, 11.0, 16.0, 21.0, 45.0, 54.0, 90.0, 126.0, 211.0, 367.0, 661.0, 1255.0, 2470.0, 5339.0, 14505.0, 52043.0, 902408.0, 2064358.0, 71713.0, 17680.0, 6488.0, 2727.0, 1305.0, 697.0, 398.0, 234.0, 129.0, 115.0, 54.0, 44.0, 25.0, 17.0, 12.0, 18.0, 8.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-23.84375, -23.076904296875, -22.31005859375, -21.543212890625, -20.7763671875, -20.009521484375, -19.24267578125, -18.475830078125, -17.708984375, -16.942138671875, -16.17529296875, -15.408447265625, -14.6416015625, -13.874755859375, -13.10791015625, -12.341064453125, -11.57421875, -10.807373046875, -10.04052734375, -9.273681640625, -8.5068359375, -7.739990234375, -6.97314453125, -6.206298828125, -5.439453125, -4.672607421875, -3.90576171875, -3.138916015625, -2.3720703125, -1.605224609375, -0.83837890625, -0.071533203125, 0.6953125, 1.462158203125, 2.22900390625, 2.995849609375, 3.7626953125, 4.529541015625, 5.29638671875, 6.063232421875, 6.830078125, 7.596923828125, 8.36376953125, 9.130615234375, 9.8974609375, 10.664306640625, 11.43115234375, 12.197998046875, 12.96484375, 13.731689453125, 14.49853515625, 15.265380859375, 16.0322265625, 16.799072265625, 17.56591796875, 18.332763671875, 19.099609375, 19.866455078125, 20.63330078125, 21.400146484375, 22.1669921875, 22.933837890625, 23.70068359375, 24.467529296875, 25.234375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 42.0, 330.0, 539.0, 93.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.393192291259766, -40.60619354248047, -32.819190979003906, -25.03219223022461, -17.245193481445312, -9.458194732666016, -1.6711921691894531, 6.115806579589844, 13.90280532836914, 21.689804077148438, 29.476804733276367, 37.2638053894043, 45.050804138183594, 52.83780288696289, 60.62480545043945, 68.41180419921875, 76.19880676269531, 83.98580932617188, 91.7728042602539, 99.55980682373047, 107.3468017578125, 115.13380432128906, 122.92080688476562, 130.7078094482422, 138.4947967529297, 146.28179931640625, 154.0688018798828, 161.85580444335938, 169.64279174804688, 177.42979431152344, 185.216796875, 193.00379943847656, 200.79080200195312, 208.5778045654297, 216.36480712890625, 224.15179443359375, 231.9387969970703, 239.72579956054688, 247.51280212402344, 255.2998046875, 263.0867919921875, 270.873779296875, 278.6607971191406, 286.4477844238281, 294.23480224609375, 302.02178955078125, 309.80877685546875, 317.5957946777344, 325.3828125, 333.1697998046875, 340.9568176269531, 348.7438049316406, 356.53082275390625, 364.31781005859375, 372.10479736328125, 379.8918151855469, 387.6788024902344, 395.4657897949219, 403.2528076171875, 411.039794921875, 418.8268127441406, 426.6138000488281, 434.40081787109375, 442.18780517578125, 449.97479248046875]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 7.0, 2.0, 1.0, 3.0, 8.0, 7.0, 2.0, 11.0, 17.0, 21.0, 14.0, 25.0, 20.0, 23.0, 30.0, 30.0, 32.0, 23.0, 30.0, 39.0, 41.0, 49.0, 28.0, 39.0, 53.0, 44.0, 40.0, 33.0, 37.0, 41.0, 27.0, 27.0, 32.0, 24.0, 21.0, 22.0, 19.0, 12.0, 12.0, 15.0, 9.0, 6.0, 6.0, 7.0, 2.0, 6.0, 3.0, 5.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.28388214111328, -47.65742492675781, -46.030967712402344, -44.40451431274414, -42.77805709838867, -41.1515998840332, -39.525146484375, -37.89868927001953, -36.27223205566406, -34.645774841308594, -33.019317626953125, -31.392864227294922, -29.766407012939453, -28.139949798583984, -26.51349449157715, -24.887039184570312, -23.260581970214844, -21.634124755859375, -20.00766944885254, -18.381214141845703, -16.754756927490234, -15.128300666809082, -13.50184440612793, -11.875388145446777, -10.248931884765625, -8.622475624084473, -6.99601936340332, -5.369563102722168, -3.7431068420410156, -2.1166505813598633, -0.49019432067871094, 1.1362619400024414, 2.7627220153808594, 4.389178276062012, 6.015634536743164, 7.642090797424316, 9.268547058105469, 10.895003318786621, 12.521459579467773, 14.147915840148926, 15.774372100830078, 17.400829315185547, 19.027284622192383, 20.65373992919922, 22.280197143554688, 23.906654357910156, 25.533109664916992, 27.159564971923828, 28.786022186279297, 30.412479400634766, 32.03893280029297, 33.66539001464844, 35.291847229003906, 36.918304443359375, 38.544761657714844, 40.17121505737305, 41.797672271728516, 43.424129486083984, 45.05058288574219, 46.677040100097656, 48.303497314453125, 49.929954528808594, 51.55641174316406, 53.182865142822266, 54.809322357177734]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 3.0, 14.0, 13.0, 10.0, 11.0, 15.0, 20.0, 13.0, 26.0, 17.0, 28.0, 36.0, 36.0, 38.0, 42.0, 44.0, 45.0, 49.0, 41.0, 38.0, 59.0, 38.0, 39.0, 35.0, 43.0, 31.0, 35.0, 25.0, 20.0, 21.0, 12.0, 10.0, 7.0, 12.0, 9.0, 7.0, 6.0, 7.0, 6.0, 6.0, 7.0, 1.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.8125, -3.68707275390625, -3.5616455078125, -3.43621826171875, -3.310791015625, -3.18536376953125, -3.0599365234375, -2.93450927734375, -2.80908203125, -2.68365478515625, -2.5582275390625, -2.43280029296875, -2.307373046875, -2.18194580078125, -2.0565185546875, -1.93109130859375, -1.8056640625, -1.68023681640625, -1.5548095703125, -1.42938232421875, -1.303955078125, -1.17852783203125, -1.0531005859375, -0.92767333984375, -0.80224609375, -0.67681884765625, -0.5513916015625, -0.42596435546875, -0.300537109375, -0.17510986328125, -0.0496826171875, 0.07574462890625, 0.201171875, 0.32659912109375, 0.4520263671875, 0.57745361328125, 0.702880859375, 0.82830810546875, 0.9537353515625, 1.07916259765625, 1.20458984375, 1.33001708984375, 1.4554443359375, 1.58087158203125, 1.706298828125, 1.83172607421875, 1.9571533203125, 2.08258056640625, 2.2080078125, 2.33343505859375, 2.4588623046875, 2.58428955078125, 2.709716796875, 2.83514404296875, 2.9605712890625, 3.08599853515625, 3.21142578125, 3.33685302734375, 3.4622802734375, 3.58770751953125, 3.713134765625, 3.83856201171875, 3.9639892578125, 4.08941650390625, 4.21484375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 4.0, 5.0, 7.0, 14.0, 13.0, 21.0, 30.0, 46.0, 62.0, 88.0, 129.0, 193.0, 293.0, 424.0, 660.0, 976.0, 1544.0, 2432.0, 4020.0, 6705.0, 11683.0, 23771.0, 72037.0, 1004143.0, 2831041.0, 160432.0, 34693.0, 15809.0, 8631.0, 5233.0, 3209.0, 1997.0, 1335.0, 842.0, 555.0, 380.0, 244.0, 177.0, 128.0, 82.0, 58.0, 44.0, 33.0, 10.0, 11.0, 14.0, 11.0, 6.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-13.609375, -13.173095703125, -12.73681640625, -12.300537109375, -11.8642578125, -11.427978515625, -10.99169921875, -10.555419921875, -10.119140625, -9.682861328125, -9.24658203125, -8.810302734375, -8.3740234375, -7.937744140625, -7.50146484375, -7.065185546875, -6.62890625, -6.192626953125, -5.75634765625, -5.320068359375, -4.8837890625, -4.447509765625, -4.01123046875, -3.574951171875, -3.138671875, -2.702392578125, -2.26611328125, -1.829833984375, -1.3935546875, -0.957275390625, -0.52099609375, -0.084716796875, 0.3515625, 0.787841796875, 1.22412109375, 1.660400390625, 2.0966796875, 2.532958984375, 2.96923828125, 3.405517578125, 3.841796875, 4.278076171875, 4.71435546875, 5.150634765625, 5.5869140625, 6.023193359375, 6.45947265625, 6.895751953125, 7.33203125, 7.768310546875, 8.20458984375, 8.640869140625, 9.0771484375, 9.513427734375, 9.94970703125, 10.385986328125, 10.822265625, 11.258544921875, 11.69482421875, 12.131103515625, 12.5673828125, 13.003662109375, 13.43994140625, 13.876220703125, 14.3125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 4.0, 8.0, 4.0, 14.0, 15.0, 19.0, 18.0, 24.0, 41.0, 51.0, 63.0, 130.0, 260.0, 517.0, 1011.0, 866.0, 449.0, 218.0, 122.0, 62.0, 42.0, 38.0, 26.0, 16.0, 8.0, 8.0, 5.0, 5.0, 7.0, 5.0, 8.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.96875, -19.4268798828125, -18.885009765625, -18.3431396484375, -17.80126953125, -17.2593994140625, -16.717529296875, -16.1756591796875, -15.6337890625, -15.0919189453125, -14.550048828125, -14.0081787109375, -13.46630859375, -12.9244384765625, -12.382568359375, -11.8406982421875, -11.298828125, -10.7569580078125, -10.215087890625, -9.6732177734375, -9.13134765625, -8.5894775390625, -8.047607421875, -7.5057373046875, -6.9638671875, -6.4219970703125, -5.880126953125, -5.3382568359375, -4.79638671875, -4.2545166015625, -3.712646484375, -3.1707763671875, -2.62890625, -2.0870361328125, -1.545166015625, -1.0032958984375, -0.46142578125, 0.0804443359375, 0.622314453125, 1.1641845703125, 1.7060546875, 2.2479248046875, 2.789794921875, 3.3316650390625, 3.87353515625, 4.4154052734375, 4.957275390625, 5.4991455078125, 6.041015625, 6.5828857421875, 7.124755859375, 7.6666259765625, 8.20849609375, 8.7503662109375, 9.292236328125, 9.8341064453125, 10.3759765625, 10.9178466796875, 11.459716796875, 12.0015869140625, 12.54345703125, 13.0853271484375, 13.627197265625, 14.1690673828125, 14.7109375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 7.0, 11.0, 13.0, 25.0, 30.0, 45.0, 61.0, 81.0, 144.0, 218.0, 382.0, 618.0, 1049.0, 1930.0, 3648.0, 7233.0, 16275.0, 44435.0, 210769.0, 3221001.0, 574513.0, 69341.0, 22516.0, 9696.0, 4539.0, 2468.0, 1341.0, 690.0, 435.0, 261.0, 166.0, 119.0, 73.0, 46.0, 22.0, 18.0, 20.0, 12.0, 9.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.359375, -25.552734375, -24.74609375, -23.939453125, -23.1328125, -22.326171875, -21.51953125, -20.712890625, -19.90625, -19.099609375, -18.29296875, -17.486328125, -16.6796875, -15.873046875, -15.06640625, -14.259765625, -13.453125, -12.646484375, -11.83984375, -11.033203125, -10.2265625, -9.419921875, -8.61328125, -7.806640625, -7.0, -6.193359375, -5.38671875, -4.580078125, -3.7734375, -2.966796875, -2.16015625, -1.353515625, -0.546875, 0.259765625, 1.06640625, 1.873046875, 2.6796875, 3.486328125, 4.29296875, 5.099609375, 5.90625, 6.712890625, 7.51953125, 8.326171875, 9.1328125, 9.939453125, 10.74609375, 11.552734375, 12.359375, 13.166015625, 13.97265625, 14.779296875, 15.5859375, 16.392578125, 17.19921875, 18.005859375, 18.8125, 19.619140625, 20.42578125, 21.232421875, 22.0390625, 22.845703125, 23.65234375, 24.458984375, 25.265625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 4.0, 9.0, 5.0, 4.0, 17.0, 17.0, 23.0, 45.0, 40.0, 87.0, 94.0, 118.0, 124.0, 133.0, 81.0, 52.0, 40.0, 30.0, 16.0, 11.0, 24.0, 10.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-71.00122833251953, -68.87163543701172, -66.74203491210938, -64.61244201660156, -62.48284912109375, -60.35325622558594, -58.22365951538086, -56.09406280517578, -53.96446990966797, -51.834877014160156, -49.70528030395508, -47.57568359375, -45.44609069824219, -43.316497802734375, -41.1869010925293, -39.05730438232422, -36.927711486816406, -34.798118591308594, -32.668521881103516, -30.53892707824707, -28.409332275390625, -26.27973747253418, -24.150142669677734, -22.02054786682129, -19.890953063964844, -17.7613582611084, -15.631763458251953, -13.502168655395508, -11.372573852539062, -9.242979049682617, -7.113384246826172, -4.983789443969727, -2.8541946411132812, -0.7245998382568359, 1.4049949645996094, 3.5345897674560547, 5.6641845703125, 7.793779373168945, 9.92337417602539, 12.052968978881836, 14.182563781738281, 16.312158584594727, 18.441753387451172, 20.571348190307617, 22.700942993164062, 24.830537796020508, 26.960132598876953, 29.0897274017334, 31.219322204589844, 33.348915100097656, 35.478511810302734, 37.60810852050781, 39.737701416015625, 41.86729431152344, 43.996891021728516, 46.126487731933594, 48.256080627441406, 50.38567352294922, 52.5152702331543, 54.644866943359375, 56.77445983886719, 58.904052734375, 61.03364944458008, 63.163246154785156, 65.29283905029297]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 6.0, 2.0, 5.0, 2.0, 4.0, 5.0, 9.0, 6.0, 7.0, 12.0, 18.0, 13.0, 14.0, 21.0, 18.0, 25.0, 23.0, 26.0, 27.0, 27.0, 38.0, 36.0, 34.0, 43.0, 37.0, 34.0, 45.0, 35.0, 33.0, 40.0, 18.0, 34.0, 38.0, 28.0, 33.0, 33.0, 13.0, 19.0, 24.0, 15.0, 18.0, 22.0, 6.0, 13.0, 9.0, 6.0, 9.0, 6.0, 8.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.73562240600586, -32.56083679199219, -31.38604736328125, -30.211259841918945, -29.03647232055664, -27.86168670654297, -26.686899185180664, -25.51211166381836, -24.337324142456055, -23.16253662109375, -21.987749099731445, -20.81296157836914, -19.63817596435547, -18.46338653564453, -17.28860092163086, -16.113813400268555, -14.93902587890625, -13.764238357543945, -12.58945083618164, -11.414664268493652, -10.239876747131348, -9.065089225769043, -7.8903021812438965, -6.71551513671875, -5.540727615356445, -4.365940093994141, -3.191153049468994, -2.0163657665252686, -0.841578483581543, 0.3332090377807617, 1.5079960823059082, 2.6827831268310547, 3.8575668334960938, 5.032354354858398, 6.207141399383545, 7.381928443908691, 8.556715965270996, 9.7315034866333, 10.906290054321289, 12.081077575683594, 13.255865097045898, 14.430652618408203, 15.605440139770508, 16.780227661132812, 17.955013275146484, 19.129802703857422, 20.304588317871094, 21.4793758392334, 22.654163360595703, 23.828950881958008, 25.003738403320312, 26.178525924682617, 27.353313446044922, 28.528099060058594, 29.7028865814209, 30.877674102783203, 32.052459716796875, 33.22724533081055, 34.402034759521484, 35.576820373535156, 36.751609802246094, 37.926395416259766, 39.1011848449707, 40.275970458984375, 41.45075988769531]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 4.0, 4.0, 5.0, 8.0, 9.0, 11.0, 16.0, 10.0, 17.0, 20.0, 17.0, 25.0, 28.0, 23.0, 28.0, 43.0, 37.0, 45.0, 46.0, 39.0, 44.0, 42.0, 59.0, 39.0, 28.0, 40.0, 39.0, 43.0, 37.0, 22.0, 26.0, 18.0, 13.0, 27.0, 9.0, 13.0, 10.0, 8.0, 12.0, 5.0, 11.0, 4.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.92578125, -3.79296875, -3.66015625, -3.52734375, -3.39453125, -3.26171875, -3.12890625, -2.99609375, -2.86328125, -2.73046875, -2.59765625, -2.46484375, -2.33203125, -2.19921875, -2.06640625, -1.93359375, -1.80078125, -1.66796875, -1.53515625, -1.40234375, -1.26953125, -1.13671875, -1.00390625, -0.87109375, -0.73828125, -0.60546875, -0.47265625, -0.33984375, -0.20703125, -0.07421875, 0.05859375, 0.19140625, 0.32421875, 0.45703125, 0.58984375, 0.72265625, 0.85546875, 0.98828125, 1.12109375, 1.25390625, 1.38671875, 1.51953125, 1.65234375, 1.78515625, 1.91796875, 2.05078125, 2.18359375, 2.31640625, 2.44921875, 2.58203125, 2.71484375, 2.84765625, 2.98046875, 3.11328125, 3.24609375, 3.37890625, 3.51171875, 3.64453125, 3.77734375, 3.91015625, 4.04296875, 4.17578125, 4.30859375, 4.44140625, 4.57421875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 12.0, 20.0, 15.0, 23.0, 32.0, 41.0, 80.0, 92.0, 130.0, 196.0, 231.0, 344.0, 479.0, 649.0, 954.0, 1277.0, 1958.0, 2704.0, 3821.0, 5651.0, 8651.0, 14154.0, 25638.0, 53767.0, 130186.0, 291747.0, 274042.0, 118223.0, 50105.0, 24097.0, 13176.0, 8244.0, 5386.0, 3588.0, 2651.0, 1809.0, 1256.0, 861.0, 638.0, 455.0, 321.0, 237.0, 177.0, 120.0, 75.0, 63.0, 45.0, 30.0, 34.0, 18.0, 12.0, 12.0, 9.0, 6.0, 8.0, 3.0, 0.0, 3.0], "bins": [-14.359375, -13.909912109375, -13.46044921875, -13.010986328125, -12.5615234375, -12.112060546875, -11.66259765625, -11.213134765625, -10.763671875, -10.314208984375, -9.86474609375, -9.415283203125, -8.9658203125, -8.516357421875, -8.06689453125, -7.617431640625, -7.16796875, -6.718505859375, -6.26904296875, -5.819580078125, -5.3701171875, -4.920654296875, -4.47119140625, -4.021728515625, -3.572265625, -3.122802734375, -2.67333984375, -2.223876953125, -1.7744140625, -1.324951171875, -0.87548828125, -0.426025390625, 0.0234375, 0.472900390625, 0.92236328125, 1.371826171875, 1.8212890625, 2.270751953125, 2.72021484375, 3.169677734375, 3.619140625, 4.068603515625, 4.51806640625, 4.967529296875, 5.4169921875, 5.866455078125, 6.31591796875, 6.765380859375, 7.21484375, 7.664306640625, 8.11376953125, 8.563232421875, 9.0126953125, 9.462158203125, 9.91162109375, 10.361083984375, 10.810546875, 11.260009765625, 11.70947265625, 12.158935546875, 12.6083984375, 13.057861328125, 13.50732421875, 13.956787109375, 14.40625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 3.0, 6.0, 6.0, 15.0, 11.0, 13.0, 22.0, 16.0, 22.0, 28.0, 42.0, 29.0, 26.0, 30.0, 50.0, 38.0, 44.0, 43.0, 1059.0, 39.0, 39.0, 39.0, 47.0, 41.0, 39.0, 37.0, 56.0, 32.0, 22.0, 22.0, 14.0, 16.0, 8.0, 8.0, 14.0, 8.0, 7.0, 4.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.51416015625, -4.3759765625, -4.23779296875, -4.099609375, -3.96142578125, -3.8232421875, -3.68505859375, -3.546875, -3.40869140625, -3.2705078125, -3.13232421875, -2.994140625, -2.85595703125, -2.7177734375, -2.57958984375, -2.44140625, -2.30322265625, -2.1650390625, -2.02685546875, -1.888671875, -1.75048828125, -1.6123046875, -1.47412109375, -1.3359375, -1.19775390625, -1.0595703125, -0.92138671875, -0.783203125, -0.64501953125, -0.5068359375, -0.36865234375, -0.23046875, -0.09228515625, 0.0458984375, 0.18408203125, 0.322265625, 0.46044921875, 0.5986328125, 0.73681640625, 0.875, 1.01318359375, 1.1513671875, 1.28955078125, 1.427734375, 1.56591796875, 1.7041015625, 1.84228515625, 1.98046875, 2.11865234375, 2.2568359375, 2.39501953125, 2.533203125, 2.67138671875, 2.8095703125, 2.94775390625, 3.0859375, 3.22412109375, 3.3623046875, 3.50048828125, 3.638671875, 3.77685546875, 3.9150390625, 4.05322265625, 4.19140625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 6.0, 9.0, 17.0, 15.0, 29.0, 48.0, 61.0, 81.0, 102.0, 141.0, 258.0, 334.0, 474.0, 797.0, 1211.0, 2063.0, 3541.0, 6633.0, 14566.0, 42368.0, 307385.0, 1532911.0, 131985.0, 28143.0, 10864.0, 5349.0, 2936.0, 1660.0, 1063.0, 657.0, 435.0, 296.0, 206.0, 150.0, 98.0, 65.0, 43.0, 42.0, 19.0, 19.0, 12.0, 15.0, 5.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.46875, -17.839111328125, -17.20947265625, -16.579833984375, -15.9501953125, -15.320556640625, -14.69091796875, -14.061279296875, -13.431640625, -12.802001953125, -12.17236328125, -11.542724609375, -10.9130859375, -10.283447265625, -9.65380859375, -9.024169921875, -8.39453125, -7.764892578125, -7.13525390625, -6.505615234375, -5.8759765625, -5.246337890625, -4.61669921875, -3.987060546875, -3.357421875, -2.727783203125, -2.09814453125, -1.468505859375, -0.8388671875, -0.209228515625, 0.42041015625, 1.050048828125, 1.6796875, 2.309326171875, 2.93896484375, 3.568603515625, 4.1982421875, 4.827880859375, 5.45751953125, 6.087158203125, 6.716796875, 7.346435546875, 7.97607421875, 8.605712890625, 9.2353515625, 9.864990234375, 10.49462890625, 11.124267578125, 11.75390625, 12.383544921875, 13.01318359375, 13.642822265625, 14.2724609375, 14.902099609375, 15.53173828125, 16.161376953125, 16.791015625, 17.420654296875, 18.05029296875, 18.679931640625, 19.3095703125, 19.939208984375, 20.56884765625, 21.198486328125, 21.828125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 3.0, 6.0, 10.0, 7.0, 20.0, 15.0, 29.0, 43.0, 67.0, 100.0, 111.0, 147.0, 113.0, 93.0, 68.0, 46.0, 32.0, 15.0, 16.0, 10.0, 9.0, 13.0, 4.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.22265625, -4.08099365234375, -3.9393310546875, -3.79766845703125, -3.656005859375, -3.51434326171875, -3.3726806640625, -3.23101806640625, -3.08935546875, -2.94769287109375, -2.8060302734375, -2.66436767578125, -2.522705078125, -2.38104248046875, -2.2393798828125, -2.09771728515625, -1.9560546875, -1.81439208984375, -1.6727294921875, -1.53106689453125, -1.389404296875, -1.24774169921875, -1.1060791015625, -0.96441650390625, -0.82275390625, -0.68109130859375, -0.5394287109375, -0.39776611328125, -0.256103515625, -0.11444091796875, 0.0272216796875, 0.16888427734375, 0.310546875, 0.45220947265625, 0.5938720703125, 0.73553466796875, 0.877197265625, 1.01885986328125, 1.1605224609375, 1.30218505859375, 1.44384765625, 1.58551025390625, 1.7271728515625, 1.86883544921875, 2.010498046875, 2.15216064453125, 2.2938232421875, 2.43548583984375, 2.5771484375, 2.71881103515625, 2.8604736328125, 3.00213623046875, 3.143798828125, 3.28546142578125, 3.4271240234375, 3.56878662109375, 3.71044921875, 3.85211181640625, 3.9937744140625, 4.13543701171875, 4.277099609375, 4.41876220703125, 4.5604248046875, 4.70208740234375, 4.84375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 10.0, 10.0, 15.0, 29.0, 31.0, 33.0, 59.0, 102.0, 160.0, 323.0, 888.0, 2667.0, 19076.0, 929210.0, 88399.0, 5185.0, 1271.0, 466.0, 207.0, 117.0, 81.0, 53.0, 41.0, 28.0, 21.0, 16.0, 12.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.53125, -47.91845703125, -46.3056640625, -44.69287109375, -43.080078125, -41.46728515625, -39.8544921875, -38.24169921875, -36.62890625, -35.01611328125, -33.4033203125, -31.79052734375, -30.177734375, -28.56494140625, -26.9521484375, -25.33935546875, -23.7265625, -22.11376953125, -20.5009765625, -18.88818359375, -17.275390625, -15.66259765625, -14.0498046875, -12.43701171875, -10.82421875, -9.21142578125, -7.5986328125, -5.98583984375, -4.373046875, -2.76025390625, -1.1474609375, 0.46533203125, 2.078125, 3.69091796875, 5.3037109375, 6.91650390625, 8.529296875, 10.14208984375, 11.7548828125, 13.36767578125, 14.98046875, 16.59326171875, 18.2060546875, 19.81884765625, 21.431640625, 23.04443359375, 24.6572265625, 26.27001953125, 27.8828125, 29.49560546875, 31.1083984375, 32.72119140625, 34.333984375, 35.94677734375, 37.5595703125, 39.17236328125, 40.78515625, 42.39794921875, 44.0107421875, 45.62353515625, 47.236328125, 48.84912109375, 50.4619140625, 52.07470703125, 53.6875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 19.0, 37.0, 99.0, 242.0, 331.0, 184.0, 51.0, 17.0, 12.0, 7.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.259296417236328, -16.783069610595703, -16.306842803955078, -15.830615997314453, -15.354388236999512, -14.878161430358887, -14.401934623718262, -13.925707817077637, -13.449480056762695, -12.97325325012207, -12.497026443481445, -12.02079963684082, -11.544571876525879, -11.068345069885254, -10.592118263244629, -10.115891456604004, -9.639664649963379, -9.163437843322754, -8.687211036682129, -8.210983276367188, -7.7347564697265625, -7.2585296630859375, -6.7823028564453125, -6.3060760498046875, -5.829848766326904, -5.353621959686279, -4.877394676208496, -4.401167869567871, -3.924940824508667, -3.448713779449463, -2.972486972808838, -2.496259927749634, -2.0200319290161133, -1.5438048839569092, -1.0675779581069946, -0.5913510322570801, -0.11512398719787598, 0.3611030578613281, 0.8373298645019531, 1.3135569095611572, 1.7897839546203613, 2.2660109996795654, 2.7422380447387695, 3.2184648513793945, 3.6946918964385986, 4.170918941497803, 4.647145748138428, 5.123373031616211, 5.599599838256836, 6.075826644897461, 6.552053928375244, 7.028280735015869, 7.504508018493652, 7.980734825134277, 8.456961631774902, 8.933188438415527, 9.409416198730469, 9.885643005371094, 10.361869812011719, 10.838096618652344, 11.314324378967285, 11.79055118560791, 12.266777992248535, 12.74300479888916, 13.219231605529785]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 7.0, 4.0, 4.0, 3.0, 8.0, 10.0, 18.0, 16.0, 15.0, 16.0, 28.0, 34.0, 33.0, 30.0, 34.0, 37.0, 40.0, 51.0, 48.0, 43.0, 34.0, 50.0, 43.0, 43.0, 40.0, 37.0, 45.0, 36.0, 39.0, 22.0, 21.0, 20.0, 12.0, 15.0, 13.0, 15.0, 11.0, 13.0, 8.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.073789119720459, -2.9723269939422607, -2.8708651065826416, -2.7694029808044434, -2.667940855026245, -2.566478729248047, -2.4650168418884277, -2.3635547161102295, -2.2620925903320312, -2.160630464553833, -2.059168577194214, -1.9577064514160156, -1.8562443256378174, -1.7547823190689087, -1.6533203125, -1.5518581867218018, -1.4503962993621826, -1.348934292793274, -1.2474721670150757, -1.146010160446167, -1.0445480346679688, -0.9430860280990601, -0.8416240215301514, -0.7401619553565979, -0.6386998891830444, -0.537237823009491, -0.4357757866382599, -0.3343137502670288, -0.23285168409347534, -0.13138961791992188, -0.029927611351013184, 0.07153445482254028, 0.17299628257751465, 0.2744583487510681, 0.3759203851222992, 0.4773824214935303, 0.5788444876670837, 0.6803065538406372, 0.7817685604095459, 0.8832306265830994, 0.9846926927566528, 1.0861546993255615, 1.1876168251037598, 1.2890788316726685, 1.3905408382415771, 1.4920029640197754, 1.593464970588684, 1.6949269771575928, 1.796389102935791, 1.8978511095046997, 1.999313235282898, 2.1007752418518066, 2.202237367630005, 2.303699493408203, 2.4051613807678223, 2.5066235065460205, 2.6080856323242188, 2.709547758102417, 2.811009645462036, 2.9124717712402344, 3.0139338970184326, 3.115396022796631, 3.21685791015625, 3.3183200359344482, 3.4197819232940674]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 3.0, 6.0, 9.0, 10.0, 13.0, 12.0, 19.0, 11.0, 29.0, 12.0, 24.0, 28.0, 22.0, 33.0, 31.0, 25.0, 34.0, 47.0, 42.0, 35.0, 51.0, 35.0, 36.0, 39.0, 45.0, 35.0, 31.0, 46.0, 32.0, 23.0, 12.0, 23.0, 16.0, 22.0, 20.0, 13.0, 9.0, 16.0, 3.0, 8.0, 13.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.669921875, -3.543609619140625, -3.41729736328125, -3.290985107421875, -3.1646728515625, -3.038360595703125, -2.91204833984375, -2.785736083984375, -2.659423828125, -2.533111572265625, -2.40679931640625, -2.280487060546875, -2.1541748046875, -2.027862548828125, -1.90155029296875, -1.775238037109375, -1.64892578125, -1.522613525390625, -1.39630126953125, -1.269989013671875, -1.1436767578125, -1.017364501953125, -0.89105224609375, -0.764739990234375, -0.638427734375, -0.512115478515625, -0.38580322265625, -0.259490966796875, -0.1331787109375, -0.006866455078125, 0.11944580078125, 0.245758056640625, 0.3720703125, 0.498382568359375, 0.62469482421875, 0.751007080078125, 0.8773193359375, 1.003631591796875, 1.12994384765625, 1.256256103515625, 1.382568359375, 1.508880615234375, 1.63519287109375, 1.761505126953125, 1.8878173828125, 2.014129638671875, 2.14044189453125, 2.266754150390625, 2.39306640625, 2.519378662109375, 2.64569091796875, 2.772003173828125, 2.8983154296875, 3.024627685546875, 3.15093994140625, 3.277252197265625, 3.403564453125, 3.529876708984375, 3.65618896484375, 3.782501220703125, 3.9088134765625, 4.035125732421875, 4.16143798828125, 4.287750244140625, 4.4140625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 5.0, 3.0, 4.0, 5.0, 13.0, 12.0, 21.0, 27.0, 38.0, 46.0, 55.0, 84.0, 83.0, 133.0, 191.0, 264.0, 362.0, 442.0, 639.0, 869.0, 1331.0, 1816.0, 2757.0, 4349.0, 7969.0, 19427.0, 98191.0, 648804.0, 204308.0, 30577.0, 10150.0, 5202.0, 3188.0, 2089.0, 1421.0, 1020.0, 696.0, 502.0, 362.0, 288.0, 221.0, 159.0, 116.0, 93.0, 62.0, 26.0, 36.0, 38.0, 20.0, 16.0, 15.0, 4.0, 9.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.34234619140625, -7.0948486328125, -6.84735107421875, -6.599853515625, -6.35235595703125, -6.1048583984375, -5.85736083984375, -5.60986328125, -5.36236572265625, -5.1148681640625, -4.86737060546875, -4.619873046875, -4.37237548828125, -4.1248779296875, -3.87738037109375, -3.6298828125, -3.38238525390625, -3.1348876953125, -2.88739013671875, -2.639892578125, -2.39239501953125, -2.1448974609375, -1.89739990234375, -1.64990234375, -1.40240478515625, -1.1549072265625, -0.90740966796875, -0.659912109375, -0.41241455078125, -0.1649169921875, 0.08258056640625, 0.330078125, 0.57757568359375, 0.8250732421875, 1.07257080078125, 1.320068359375, 1.56756591796875, 1.8150634765625, 2.06256103515625, 2.31005859375, 2.55755615234375, 2.8050537109375, 3.05255126953125, 3.300048828125, 3.54754638671875, 3.7950439453125, 4.04254150390625, 4.2900390625, 4.53753662109375, 4.7850341796875, 5.03253173828125, 5.280029296875, 5.52752685546875, 5.7750244140625, 6.02252197265625, 6.27001953125, 6.51751708984375, 6.7650146484375, 7.01251220703125, 7.260009765625, 7.50750732421875, 7.7550048828125, 8.00250244140625, 8.25]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 3.0, 2.0, 6.0, 5.0, 19.0, 17.0, 18.0, 14.0, 22.0, 32.0, 31.0, 30.0, 39.0, 40.0, 63.0, 72.0, 70.0, 154.0, 1610.0, 298.0, 91.0, 82.0, 63.0, 41.0, 36.0, 33.0, 26.0, 24.0, 11.0, 16.0, 16.0, 13.0, 17.0, 7.0, 6.0, 11.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.84375, -16.18896484375, -15.5341796875, -14.87939453125, -14.224609375, -13.56982421875, -12.9150390625, -12.26025390625, -11.60546875, -10.95068359375, -10.2958984375, -9.64111328125, -8.986328125, -8.33154296875, -7.6767578125, -7.02197265625, -6.3671875, -5.71240234375, -5.0576171875, -4.40283203125, -3.748046875, -3.09326171875, -2.4384765625, -1.78369140625, -1.12890625, -0.47412109375, 0.1806640625, 0.83544921875, 1.490234375, 2.14501953125, 2.7998046875, 3.45458984375, 4.109375, 4.76416015625, 5.4189453125, 6.07373046875, 6.728515625, 7.38330078125, 8.0380859375, 8.69287109375, 9.34765625, 10.00244140625, 10.6572265625, 11.31201171875, 11.966796875, 12.62158203125, 13.2763671875, 13.93115234375, 14.5859375, 15.24072265625, 15.8955078125, 16.55029296875, 17.205078125, 17.85986328125, 18.5146484375, 19.16943359375, 19.82421875, 20.47900390625, 21.1337890625, 21.78857421875, 22.443359375, 23.09814453125, 23.7529296875, 24.40771484375, 25.0625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 8.0, 12.0, 10.0, 14.0, 19.0, 25.0, 30.0, 34.0, 35.0, 76.0, 119.0, 255.0, 520.0, 1093.0, 2457.0, 6863.0, 25826.0, 333715.0, 2697464.0, 58419.0, 11747.0, 3821.0, 1543.0, 707.0, 343.0, 176.0, 108.0, 76.0, 42.0, 33.0, 29.0, 22.0, 14.0, 9.0, 7.0, 3.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.875, -28.005859375, -27.13671875, -26.267578125, -25.3984375, -24.529296875, -23.66015625, -22.791015625, -21.921875, -21.052734375, -20.18359375, -19.314453125, -18.4453125, -17.576171875, -16.70703125, -15.837890625, -14.96875, -14.099609375, -13.23046875, -12.361328125, -11.4921875, -10.623046875, -9.75390625, -8.884765625, -8.015625, -7.146484375, -6.27734375, -5.408203125, -4.5390625, -3.669921875, -2.80078125, -1.931640625, -1.0625, -0.193359375, 0.67578125, 1.544921875, 2.4140625, 3.283203125, 4.15234375, 5.021484375, 5.890625, 6.759765625, 7.62890625, 8.498046875, 9.3671875, 10.236328125, 11.10546875, 11.974609375, 12.84375, 13.712890625, 14.58203125, 15.451171875, 16.3203125, 17.189453125, 18.05859375, 18.927734375, 19.796875, 20.666015625, 21.53515625, 22.404296875, 23.2734375, 24.142578125, 25.01171875, 25.880859375, 26.75]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 26.0, 209.0, 537.0, 204.0, 27.0, 6.0], "bins": [-347.0757141113281, -341.3372497558594, -335.5987548828125, -329.86029052734375, -324.121826171875, -318.38336181640625, -312.6448669433594, -306.9064025878906, -301.1679382324219, -295.4294738769531, -289.69097900390625, -283.9525146484375, -278.21405029296875, -272.4755859375, -266.7370910644531, -260.9986267089844, -255.26016235351562, -249.5216827392578, -243.78321838378906, -238.04473876953125, -232.3062744140625, -226.5677947998047, -220.82933044433594, -215.09085083007812, -209.3523712158203, -203.6138916015625, -197.87542724609375, -192.13694763183594, -186.3984832763672, -180.66000366210938, -174.92153930664062, -169.1830596923828, -163.44459533691406, -157.70611572265625, -151.9676513671875, -146.2291717529297, -140.49070739746094, -134.75222778320312, -129.01376342773438, -123.27528381347656, -117.53681945800781, -111.79834747314453, -106.05987548828125, -100.32140350341797, -94.58293151855469, -88.8444595336914, -83.10598754882812, -77.36750793457031, -71.62904357910156, -65.89057159423828, -60.152099609375, -54.41362762451172, -48.67515563964844, -42.936683654785156, -37.19820785522461, -31.459735870361328, -25.72126007080078, -19.9827880859375, -14.244315147399902, -8.505842208862305, -2.7673702239990234, 2.971101760864258, 8.709575653076172, 14.448047637939453, 20.186519622802734]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 1.0, 9.0, 8.0, 5.0, 10.0, 8.0, 9.0, 17.0, 22.0, 29.0, 23.0, 24.0, 30.0, 24.0, 32.0, 37.0, 43.0, 38.0, 52.0, 34.0, 41.0, 36.0, 28.0, 34.0, 36.0, 39.0, 34.0, 42.0, 32.0, 24.0, 31.0, 27.0, 15.0, 27.0, 17.0, 16.0, 13.0, 10.0, 10.0, 8.0, 7.0, 4.0, 2.0, 4.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.22519302368164, -56.46272659301758, -54.70025634765625, -52.93778991699219, -51.175323486328125, -49.41285705566406, -47.650390625, -45.88792037963867, -44.12545394897461, -42.36298751831055, -40.60051727294922, -38.838050842285156, -37.075584411621094, -35.31311798095703, -33.55065155029297, -31.78818130493164, -30.025714874267578, -28.263248443603516, -26.50078010559082, -24.738311767578125, -22.975845336914062, -21.21337890625, -19.450910568237305, -17.68844223022461, -15.925975799560547, -14.163508415222168, -12.401041030883789, -10.63857364654541, -8.876106262207031, -7.113638877868652, -5.351171493530273, -3.5887041091918945, -1.8262367248535156, -0.06376934051513672, 1.6986980438232422, 3.461165428161621, 5.2236328125, 6.986100196838379, 8.748567581176758, 10.511034965515137, 12.273502349853516, 14.035969734191895, 15.798437118530273, 17.56090545654297, 19.32337188720703, 21.085838317871094, 22.84830665588379, 24.610774993896484, 26.373241424560547, 28.13570785522461, 29.898176193237305, 31.66064453125, 33.42311096191406, 35.185577392578125, 36.94804382324219, 38.710514068603516, 40.47298049926758, 42.23544692993164, 43.99791717529297, 45.76038360595703, 47.522850036621094, 49.285316467285156, 51.04778289794922, 52.81025314331055, 54.57271957397461]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 10.0, 10.0, 10.0, 13.0, 21.0, 8.0, 26.0, 28.0, 29.0, 23.0, 26.0, 29.0, 20.0, 46.0, 30.0, 42.0, 36.0, 35.0, 44.0, 51.0, 39.0, 39.0, 41.0, 38.0, 33.0, 29.0, 30.0, 28.0, 19.0, 21.0, 20.0, 16.0, 15.0, 13.0, 10.0, 6.0, 8.0, 7.0, 10.0, 6.0, 4.0, 2.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.08203125, -3.94866943359375, -3.8153076171875, -3.68194580078125, -3.548583984375, -3.41522216796875, -3.2818603515625, -3.14849853515625, -3.01513671875, -2.88177490234375, -2.7484130859375, -2.61505126953125, -2.481689453125, -2.34832763671875, -2.2149658203125, -2.08160400390625, -1.9482421875, -1.81488037109375, -1.6815185546875, -1.54815673828125, -1.414794921875, -1.28143310546875, -1.1480712890625, -1.01470947265625, -0.88134765625, -0.74798583984375, -0.6146240234375, -0.48126220703125, -0.347900390625, -0.21453857421875, -0.0811767578125, 0.05218505859375, 0.185546875, 0.31890869140625, 0.4522705078125, 0.58563232421875, 0.718994140625, 0.85235595703125, 0.9857177734375, 1.11907958984375, 1.25244140625, 1.38580322265625, 1.5191650390625, 1.65252685546875, 1.785888671875, 1.91925048828125, 2.0526123046875, 2.18597412109375, 2.3193359375, 2.45269775390625, 2.5860595703125, 2.71942138671875, 2.852783203125, 2.98614501953125, 3.1195068359375, 3.25286865234375, 3.38623046875, 3.51959228515625, 3.6529541015625, 3.78631591796875, 3.919677734375, 4.05303955078125, 4.1864013671875, 4.31976318359375, 4.453125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 6.0, 2.0, 6.0, 8.0, 16.0, 14.0, 16.0, 35.0, 49.0, 68.0, 90.0, 117.0, 155.0, 262.0, 294.0, 451.0, 639.0, 847.0, 1075.0, 1581.0, 2099.0, 2981.0, 4278.0, 6241.0, 9674.0, 15547.0, 28343.0, 74312.0, 460999.0, 2657066.0, 743620.0, 100308.0, 32624.0, 17114.0, 10293.0, 6749.0, 4546.0, 3191.0, 2225.0, 1704.0, 1213.0, 904.0, 664.0, 490.0, 370.0, 272.0, 205.0, 153.0, 97.0, 81.0, 62.0, 50.0, 30.0, 21.0, 15.0, 10.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0], "bins": [-9.6015625, -9.287841796875, -8.97412109375, -8.660400390625, -8.3466796875, -8.032958984375, -7.71923828125, -7.405517578125, -7.091796875, -6.778076171875, -6.46435546875, -6.150634765625, -5.8369140625, -5.523193359375, -5.20947265625, -4.895751953125, -4.58203125, -4.268310546875, -3.95458984375, -3.640869140625, -3.3271484375, -3.013427734375, -2.69970703125, -2.385986328125, -2.072265625, -1.758544921875, -1.44482421875, -1.131103515625, -0.8173828125, -0.503662109375, -0.18994140625, 0.123779296875, 0.4375, 0.751220703125, 1.06494140625, 1.378662109375, 1.6923828125, 2.006103515625, 2.31982421875, 2.633544921875, 2.947265625, 3.260986328125, 3.57470703125, 3.888427734375, 4.2021484375, 4.515869140625, 4.82958984375, 5.143310546875, 5.45703125, 5.770751953125, 6.08447265625, 6.398193359375, 6.7119140625, 7.025634765625, 7.33935546875, 7.653076171875, 7.966796875, 8.280517578125, 8.59423828125, 8.907958984375, 9.2216796875, 9.535400390625, 9.84912109375, 10.162841796875, 10.4765625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 10.0, 8.0, 5.0, 19.0, 14.0, 23.0, 39.0, 56.0, 74.0, 134.0, 237.0, 556.0, 968.0, 897.0, 448.0, 222.0, 100.0, 76.0, 41.0, 25.0, 17.0, 16.0, 12.0, 14.0, 10.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.8472900390625, -13.311767578125, -12.7762451171875, -12.24072265625, -11.7052001953125, -11.169677734375, -10.6341552734375, -10.0986328125, -9.5631103515625, -9.027587890625, -8.4920654296875, -7.95654296875, -7.4210205078125, -6.885498046875, -6.3499755859375, -5.814453125, -5.2789306640625, -4.743408203125, -4.2078857421875, -3.67236328125, -3.1368408203125, -2.601318359375, -2.0657958984375, -1.5302734375, -0.9947509765625, -0.459228515625, 0.0762939453125, 0.61181640625, 1.1473388671875, 1.682861328125, 2.2183837890625, 2.75390625, 3.2894287109375, 3.824951171875, 4.3604736328125, 4.89599609375, 5.4315185546875, 5.967041015625, 6.5025634765625, 7.0380859375, 7.5736083984375, 8.109130859375, 8.6446533203125, 9.18017578125, 9.7156982421875, 10.251220703125, 10.7867431640625, 11.322265625, 11.8577880859375, 12.393310546875, 12.9288330078125, 13.46435546875, 13.9998779296875, 14.535400390625, 15.0709228515625, 15.6064453125, 16.1419677734375, 16.677490234375, 17.2130126953125, 17.74853515625, 18.2840576171875, 18.819580078125, 19.3551025390625, 19.890625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 8.0, 2.0, 11.0, 7.0, 13.0, 14.0, 27.0, 44.0, 62.0, 72.0, 137.0, 261.0, 361.0, 639.0, 1008.0, 1765.0, 3114.0, 5718.0, 11974.0, 28444.0, 99341.0, 1362363.0, 2475696.0, 139465.0, 34995.0, 13664.0, 6683.0, 3536.0, 1953.0, 1160.0, 661.0, 387.0, 262.0, 154.0, 105.0, 72.0, 37.0, 29.0, 19.0, 7.0, 11.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.171875, -18.437255859375, -17.70263671875, -16.968017578125, -16.2333984375, -15.498779296875, -14.76416015625, -14.029541015625, -13.294921875, -12.560302734375, -11.82568359375, -11.091064453125, -10.3564453125, -9.621826171875, -8.88720703125, -8.152587890625, -7.41796875, -6.683349609375, -5.94873046875, -5.214111328125, -4.4794921875, -3.744873046875, -3.01025390625, -2.275634765625, -1.541015625, -0.806396484375, -0.07177734375, 0.662841796875, 1.3974609375, 2.132080078125, 2.86669921875, 3.601318359375, 4.3359375, 5.070556640625, 5.80517578125, 6.539794921875, 7.2744140625, 8.009033203125, 8.74365234375, 9.478271484375, 10.212890625, 10.947509765625, 11.68212890625, 12.416748046875, 13.1513671875, 13.885986328125, 14.62060546875, 15.355224609375, 16.08984375, 16.824462890625, 17.55908203125, 18.293701171875, 19.0283203125, 19.762939453125, 20.49755859375, 21.232177734375, 21.966796875, 22.701416015625, 23.43603515625, 24.170654296875, 24.9052734375, 25.639892578125, 26.37451171875, 27.109130859375, 27.84375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 12.0, 14.0, 17.0, 27.0, 33.0, 60.0, 125.0, 159.0, 161.0, 121.0, 107.0, 55.0, 46.0, 24.0, 15.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.55537414550781, -113.7451400756836, -110.9349136352539, -108.12467956542969, -105.31444549560547, -102.50421142578125, -99.69398498535156, -96.88375091552734, -94.07351684570312, -91.2632827758789, -88.45305633544922, -85.642822265625, -82.83258819580078, -80.02235412597656, -77.21212768554688, -74.40189361572266, -71.59166717529297, -68.78143310546875, -65.97120666503906, -63.160972595214844, -60.350738525390625, -57.54050827026367, -54.73027801513672, -51.9200439453125, -49.10981369018555, -46.299583435058594, -43.489349365234375, -40.67911911010742, -37.86888885498047, -35.05865478515625, -32.2484245300293, -29.43819236755371, -26.62795639038086, -23.817724227905273, -21.007492065429688, -18.197261810302734, -15.387029647827148, -12.576797485351562, -9.76656723022461, -6.956335067749023, -4.1461029052734375, -1.3358712196350098, 1.474360466003418, 4.2845916748046875, 7.094823837280273, 9.90505599975586, 12.715286254882812, 15.525518417358398, 18.335750579833984, 21.14598274230957, 23.956214904785156, 26.76644515991211, 29.576677322387695, 32.38690948486328, 35.197139739990234, 38.00736999511719, 40.817604064941406, 43.62783432006836, 46.43806838989258, 49.24829864501953, 52.05853271484375, 54.8687629699707, 57.678993225097656, 60.489227294921875, 63.29945755004883]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 11.0, 6.0, 12.0, 19.0, 15.0, 21.0, 22.0, 30.0, 32.0, 23.0, 31.0, 35.0, 36.0, 39.0, 26.0, 43.0, 41.0, 45.0, 43.0, 44.0, 46.0, 39.0, 46.0, 28.0, 30.0, 36.0, 25.0, 27.0, 17.0, 11.0, 19.0, 19.0, 7.0, 9.0, 12.0, 10.0, 2.0, 3.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.914405822753906, -40.61658477783203, -39.31876754760742, -38.02094650268555, -36.72312927246094, -35.42530822753906, -34.12748718261719, -32.82966613769531, -31.531848907470703, -30.23402976989746, -28.93621063232422, -27.638389587402344, -26.3405704498291, -25.04275131225586, -23.744930267333984, -22.447111129760742, -21.1492919921875, -19.851472854614258, -18.553653717041016, -17.25583267211914, -15.958013534545898, -14.660194396972656, -13.362374305725098, -12.064554214477539, -10.766735076904297, -9.468915939331055, -8.171095848083496, -6.873276233673096, -5.575456619262695, -4.277637004852295, -2.9798173904418945, -1.681997299194336, -0.38417816162109375, 0.9136414527893066, 2.211461067199707, 3.5092806816101074, 4.807100296020508, 6.104919910430908, 7.402739524841309, 8.700559616088867, 9.99837875366211, 11.296197891235352, 12.59401798248291, 13.891838073730469, 15.189657211303711, 16.487476348876953, 17.785297393798828, 19.08311653137207, 20.380935668945312, 21.678754806518555, 22.976573944091797, 24.274394989013672, 25.572214126586914, 26.870033264160156, 28.16785430908203, 29.465673446655273, 30.763492584228516, 32.06131362915039, 33.359130859375, 34.656951904296875, 35.95477294921875, 37.25259017944336, 38.550411224365234, 39.848228454589844, 41.14604949951172]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 0.0, 4.0, 7.0, 5.0, 9.0, 13.0, 14.0, 17.0, 19.0, 17.0, 24.0, 40.0, 23.0, 30.0, 32.0, 30.0, 36.0, 41.0, 40.0, 36.0, 46.0, 37.0, 47.0, 46.0, 39.0, 50.0, 42.0, 32.0, 28.0, 27.0, 23.0, 27.0, 14.0, 17.0, 9.0, 11.0, 12.0, 4.0, 15.0, 2.0, 8.0, 10.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.7265625, -4.58050537109375, -4.4344482421875, -4.28839111328125, -4.142333984375, -3.99627685546875, -3.8502197265625, -3.70416259765625, -3.55810546875, -3.41204833984375, -3.2659912109375, -3.11993408203125, -2.973876953125, -2.82781982421875, -2.6817626953125, -2.53570556640625, -2.3896484375, -2.24359130859375, -2.0975341796875, -1.95147705078125, -1.805419921875, -1.65936279296875, -1.5133056640625, -1.36724853515625, -1.22119140625, -1.07513427734375, -0.9290771484375, -0.78302001953125, -0.636962890625, -0.49090576171875, -0.3448486328125, -0.19879150390625, -0.052734375, 0.09332275390625, 0.2393798828125, 0.38543701171875, 0.531494140625, 0.67755126953125, 0.8236083984375, 0.96966552734375, 1.11572265625, 1.26177978515625, 1.4078369140625, 1.55389404296875, 1.699951171875, 1.84600830078125, 1.9920654296875, 2.13812255859375, 2.2841796875, 2.43023681640625, 2.5762939453125, 2.72235107421875, 2.868408203125, 3.01446533203125, 3.1605224609375, 3.30657958984375, 3.45263671875, 3.59869384765625, 3.7447509765625, 3.89080810546875, 4.036865234375, 4.18292236328125, 4.3289794921875, 4.47503662109375, 4.62109375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 10.0, 17.0, 27.0, 29.0, 58.0, 61.0, 114.0, 171.0, 205.0, 317.0, 416.0, 583.0, 895.0, 1338.0, 2103.0, 3336.0, 5653.0, 9637.0, 17588.0, 34077.0, 74546.0, 210079.0, 425354.0, 142520.0, 57078.0, 26979.0, 14216.0, 8095.0, 4715.0, 2792.0, 1803.0, 1124.0, 786.0, 571.0, 371.0, 277.0, 184.0, 145.0, 84.0, 68.0, 46.0, 27.0, 21.0, 13.0, 6.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.640625, -19.98193359375, -19.3232421875, -18.66455078125, -18.005859375, -17.34716796875, -16.6884765625, -16.02978515625, -15.37109375, -14.71240234375, -14.0537109375, -13.39501953125, -12.736328125, -12.07763671875, -11.4189453125, -10.76025390625, -10.1015625, -9.44287109375, -8.7841796875, -8.12548828125, -7.466796875, -6.80810546875, -6.1494140625, -5.49072265625, -4.83203125, -4.17333984375, -3.5146484375, -2.85595703125, -2.197265625, -1.53857421875, -0.8798828125, -0.22119140625, 0.4375, 1.09619140625, 1.7548828125, 2.41357421875, 3.072265625, 3.73095703125, 4.3896484375, 5.04833984375, 5.70703125, 6.36572265625, 7.0244140625, 7.68310546875, 8.341796875, 9.00048828125, 9.6591796875, 10.31787109375, 10.9765625, 11.63525390625, 12.2939453125, 12.95263671875, 13.611328125, 14.27001953125, 14.9287109375, 15.58740234375, 16.24609375, 16.90478515625, 17.5634765625, 18.22216796875, 18.880859375, 19.53955078125, 20.1982421875, 20.85693359375, 21.515625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 11.0, 14.0, 12.0, 10.0, 10.0, 12.0, 23.0, 20.0, 26.0, 28.0, 30.0, 43.0, 40.0, 49.0, 42.0, 43.0, 39.0, 50.0, 1068.0, 43.0, 37.0, 40.0, 39.0, 38.0, 35.0, 38.0, 15.0, 19.0, 23.0, 19.0, 18.0, 17.0, 14.0, 15.0, 6.0, 11.0, 3.0, 3.0, 4.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.71875, -4.58050537109375, -4.4422607421875, -4.30401611328125, -4.165771484375, -4.02752685546875, -3.8892822265625, -3.75103759765625, -3.61279296875, -3.47454833984375, -3.3363037109375, -3.19805908203125, -3.059814453125, -2.92156982421875, -2.7833251953125, -2.64508056640625, -2.5068359375, -2.36859130859375, -2.2303466796875, -2.09210205078125, -1.953857421875, -1.81561279296875, -1.6773681640625, -1.53912353515625, -1.40087890625, -1.26263427734375, -1.1243896484375, -0.98614501953125, -0.847900390625, -0.70965576171875, -0.5714111328125, -0.43316650390625, -0.294921875, -0.15667724609375, -0.0184326171875, 0.11981201171875, 0.258056640625, 0.39630126953125, 0.5345458984375, 0.67279052734375, 0.81103515625, 0.94927978515625, 1.0875244140625, 1.22576904296875, 1.364013671875, 1.50225830078125, 1.6405029296875, 1.77874755859375, 1.9169921875, 2.05523681640625, 2.1934814453125, 2.33172607421875, 2.469970703125, 2.60821533203125, 2.7464599609375, 2.88470458984375, 3.02294921875, 3.16119384765625, 3.2994384765625, 3.43768310546875, 3.575927734375, 3.71417236328125, 3.8524169921875, 3.99066162109375, 4.12890625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 4.0, 10.0, 14.0, 15.0, 32.0, 34.0, 55.0, 76.0, 135.0, 158.0, 255.0, 391.0, 589.0, 857.0, 1493.0, 2369.0, 4536.0, 8284.0, 17497.0, 44073.0, 181516.0, 1406804.0, 321766.0, 61369.0, 21870.0, 10113.0, 5166.0, 2924.0, 1677.0, 1024.0, 692.0, 393.0, 305.0, 192.0, 153.0, 81.0, 58.0, 51.0, 31.0, 16.0, 17.0, 11.0, 9.0, 7.0, 5.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.796875, -15.263916015625, -14.73095703125, -14.197998046875, -13.6650390625, -13.132080078125, -12.59912109375, -12.066162109375, -11.533203125, -11.000244140625, -10.46728515625, -9.934326171875, -9.4013671875, -8.868408203125, -8.33544921875, -7.802490234375, -7.26953125, -6.736572265625, -6.20361328125, -5.670654296875, -5.1376953125, -4.604736328125, -4.07177734375, -3.538818359375, -3.005859375, -2.472900390625, -1.93994140625, -1.406982421875, -0.8740234375, -0.341064453125, 0.19189453125, 0.724853515625, 1.2578125, 1.790771484375, 2.32373046875, 2.856689453125, 3.3896484375, 3.922607421875, 4.45556640625, 4.988525390625, 5.521484375, 6.054443359375, 6.58740234375, 7.120361328125, 7.6533203125, 8.186279296875, 8.71923828125, 9.252197265625, 9.78515625, 10.318115234375, 10.85107421875, 11.384033203125, 11.9169921875, 12.449951171875, 12.98291015625, 13.515869140625, 14.048828125, 14.581787109375, 15.11474609375, 15.647705078125, 16.1806640625, 16.713623046875, 17.24658203125, 17.779541015625, 18.3125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 4.0, 1.0, 6.0, 9.0, 8.0, 21.0, 15.0, 10.0, 13.0, 21.0, 21.0, 38.0, 39.0, 42.0, 60.0, 81.0, 107.0, 111.0, 87.0, 54.0, 37.0, 42.0, 23.0, 31.0, 24.0, 13.0, 13.0, 11.0, 12.0, 7.0, 8.0, 5.0, 5.0, 4.0, 6.0, 3.0, 3.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.376953125, -2.288330078125, -2.19970703125, -2.111083984375, -2.0224609375, -1.933837890625, -1.84521484375, -1.756591796875, -1.66796875, -1.579345703125, -1.49072265625, -1.402099609375, -1.3134765625, -1.224853515625, -1.13623046875, -1.047607421875, -0.958984375, -0.870361328125, -0.78173828125, -0.693115234375, -0.6044921875, -0.515869140625, -0.42724609375, -0.338623046875, -0.25, -0.161376953125, -0.07275390625, 0.015869140625, 0.1044921875, 0.193115234375, 0.28173828125, 0.370361328125, 0.458984375, 0.547607421875, 0.63623046875, 0.724853515625, 0.8134765625, 0.902099609375, 0.99072265625, 1.079345703125, 1.16796875, 1.256591796875, 1.34521484375, 1.433837890625, 1.5224609375, 1.611083984375, 1.69970703125, 1.788330078125, 1.876953125, 1.965576171875, 2.05419921875, 2.142822265625, 2.2314453125, 2.320068359375, 2.40869140625, 2.497314453125, 2.5859375, 2.674560546875, 2.76318359375, 2.851806640625, 2.9404296875, 3.029052734375, 3.11767578125, 3.206298828125, 3.294921875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 8.0, 11.0, 14.0, 11.0, 17.0, 22.0, 32.0, 39.0, 42.0, 68.0, 90.0, 123.0, 173.0, 293.0, 635.0, 1894.0, 9636.0, 131758.0, 854315.0, 42151.0, 4787.0, 1156.0, 448.0, 211.0, 163.0, 99.0, 68.0, 77.0, 46.0, 34.0, 34.0, 23.0, 14.0, 10.0, 13.0, 10.0, 5.0, 1.0, 4.0, 1.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.96875, -33.85205078125, -32.7353515625, -31.61865234375, -30.501953125, -29.38525390625, -28.2685546875, -27.15185546875, -26.03515625, -24.91845703125, -23.8017578125, -22.68505859375, -21.568359375, -20.45166015625, -19.3349609375, -18.21826171875, -17.1015625, -15.98486328125, -14.8681640625, -13.75146484375, -12.634765625, -11.51806640625, -10.4013671875, -9.28466796875, -8.16796875, -7.05126953125, -5.9345703125, -4.81787109375, -3.701171875, -2.58447265625, -1.4677734375, -0.35107421875, 0.765625, 1.88232421875, 2.9990234375, 4.11572265625, 5.232421875, 6.34912109375, 7.4658203125, 8.58251953125, 9.69921875, 10.81591796875, 11.9326171875, 13.04931640625, 14.166015625, 15.28271484375, 16.3994140625, 17.51611328125, 18.6328125, 19.74951171875, 20.8662109375, 21.98291015625, 23.099609375, 24.21630859375, 25.3330078125, 26.44970703125, 27.56640625, 28.68310546875, 29.7998046875, 30.91650390625, 32.033203125, 33.14990234375, 34.2666015625, 35.38330078125, 36.5]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 10.0, 8.0, 8.0, 14.0, 15.0, 26.0, 52.0, 85.0, 144.0, 152.0, 161.0, 129.0, 78.0, 58.0, 27.0, 18.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.857371807098389, -7.584421634674072, -7.311471462249756, -7.0385212898254395, -6.765571117401123, -6.492620944976807, -6.219671249389648, -5.946721076965332, -5.673770904541016, -5.400820732116699, -5.127870559692383, -4.854920387268066, -4.58197021484375, -4.309020042419434, -4.036069869995117, -3.76311993598938, -3.4901695251464844, -3.217219352722168, -2.9442691802978516, -2.671319007873535, -2.3983688354492188, -2.1254186630249023, -1.852468729019165, -1.5795185565948486, -1.3065683841705322, -1.0336182117462158, -0.7606680989265442, -0.48771798610687256, -0.21476781368255615, 0.058182358741760254, 0.3311324119567871, 0.6040825843811035, 0.8770332336425781, 1.1499834060668945, 1.422933578491211, 1.6958836317062378, 1.9688338041305542, 2.24178409576416, 2.5147340297698975, 2.787684202194214, 3.0606343746185303, 3.3335845470428467, 3.606534719467163, 3.8794846534729004, 4.152434825897217, 4.425384998321533, 4.69833517074585, 4.971285343170166, 5.244235515594482, 5.517185688018799, 5.790135860443115, 6.063086032867432, 6.336036205291748, 6.6089863777160645, 6.881936073303223, 7.154886245727539, 7.4278364181518555, 7.700786590576172, 7.973736763000488, 8.246686935424805, 8.519637107849121, 8.792587280273438, 9.065537452697754, 9.33848762512207, 9.611437797546387]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 2.0, 10.0, 14.0, 8.0, 13.0, 15.0, 20.0, 32.0, 37.0, 30.0, 38.0, 40.0, 34.0, 43.0, 45.0, 51.0, 46.0, 44.0, 43.0, 56.0, 38.0, 46.0, 34.0, 28.0, 34.0, 21.0, 38.0, 32.0, 22.0, 25.0, 10.0, 16.0, 8.0, 9.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.479132652282715, -4.336423397064209, -4.193713665008545, -4.051004409790039, -3.908295154571533, -3.7655856609344482, -3.6228761672973633, -3.4801669120788574, -3.3374576568603516, -3.1947481632232666, -3.0520389080047607, -2.909329414367676, -2.76662015914917, -2.623910665512085, -2.481201171875, -2.338491916656494, -2.195782423019409, -2.053072929382324, -1.9103636741638184, -1.7676541805267334, -1.6249449253082275, -1.4822354316711426, -1.3395260572433472, -1.1968166828155518, -1.0541073083877563, -0.9113979339599609, -0.7686885595321655, -0.6259791254997253, -0.48326975107192993, -0.3405603766441345, -0.19785094261169434, -0.055141568183898926, 0.08756780624389648, 0.2302771955728531, 0.3729865849018097, 0.5156959891319275, 0.6584053635597229, 0.8011147379875183, 0.9438241720199585, 1.086533546447754, 1.2292429208755493, 1.3719522953033447, 1.5146616697311401, 1.6573710441589355, 1.8000805377960205, 1.9427897930145264, 2.0854992866516113, 2.228208541870117, 2.370918035507202, 2.513627529144287, 2.656336784362793, 2.799046277999878, 2.941755533218384, 3.0844650268554688, 3.2271742820739746, 3.3698837757110596, 3.5125932693481445, 3.6553027629852295, 3.7980120182037354, 3.9407215118408203, 4.083430767059326, 4.226140022277832, 4.368849754333496, 4.511559009552002, 4.654268264770508]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 7.0, 11.0, 13.0, 13.0, 15.0, 16.0, 25.0, 21.0, 25.0, 25.0, 37.0, 32.0, 36.0, 35.0, 35.0, 44.0, 33.0, 44.0, 55.0, 65.0, 41.0, 42.0, 51.0, 32.0, 28.0, 33.0, 18.0, 21.0, 28.0, 9.0, 10.0, 12.0, 12.0, 15.0, 11.0, 9.0, 6.0, 8.0, 5.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.46484375, -4.31591796875, -4.1669921875, -4.01806640625, -3.869140625, -3.72021484375, -3.5712890625, -3.42236328125, -3.2734375, -3.12451171875, -2.9755859375, -2.82666015625, -2.677734375, -2.52880859375, -2.3798828125, -2.23095703125, -2.08203125, -1.93310546875, -1.7841796875, -1.63525390625, -1.486328125, -1.33740234375, -1.1884765625, -1.03955078125, -0.890625, -0.74169921875, -0.5927734375, -0.44384765625, -0.294921875, -0.14599609375, 0.0029296875, 0.15185546875, 0.30078125, 0.44970703125, 0.5986328125, 0.74755859375, 0.896484375, 1.04541015625, 1.1943359375, 1.34326171875, 1.4921875, 1.64111328125, 1.7900390625, 1.93896484375, 2.087890625, 2.23681640625, 2.3857421875, 2.53466796875, 2.68359375, 2.83251953125, 2.9814453125, 3.13037109375, 3.279296875, 3.42822265625, 3.5771484375, 3.72607421875, 3.875, 4.02392578125, 4.1728515625, 4.32177734375, 4.470703125, 4.61962890625, 4.7685546875, 4.91748046875, 5.06640625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 4.0, 4.0, 8.0, 12.0, 28.0, 29.0, 44.0, 56.0, 103.0, 130.0, 196.0, 293.0, 448.0, 676.0, 1002.0, 1503.0, 2531.0, 4315.0, 7446.0, 14027.0, 31977.0, 109561.0, 580627.0, 203146.0, 48929.0, 18667.0, 9142.0, 5150.0, 3135.0, 1871.0, 1198.0, 756.0, 529.0, 324.0, 209.0, 138.0, 111.0, 75.0, 54.0, 30.0, 23.0, 17.0, 12.0, 3.0, 7.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.0, -12.625244140625, -12.25048828125, -11.875732421875, -11.5009765625, -11.126220703125, -10.75146484375, -10.376708984375, -10.001953125, -9.627197265625, -9.25244140625, -8.877685546875, -8.5029296875, -8.128173828125, -7.75341796875, -7.378662109375, -7.00390625, -6.629150390625, -6.25439453125, -5.879638671875, -5.5048828125, -5.130126953125, -4.75537109375, -4.380615234375, -4.005859375, -3.631103515625, -3.25634765625, -2.881591796875, -2.5068359375, -2.132080078125, -1.75732421875, -1.382568359375, -1.0078125, -0.633056640625, -0.25830078125, 0.116455078125, 0.4912109375, 0.865966796875, 1.24072265625, 1.615478515625, 1.990234375, 2.364990234375, 2.73974609375, 3.114501953125, 3.4892578125, 3.864013671875, 4.23876953125, 4.613525390625, 4.98828125, 5.363037109375, 5.73779296875, 6.112548828125, 6.4873046875, 6.862060546875, 7.23681640625, 7.611572265625, 7.986328125, 8.361083984375, 8.73583984375, 9.110595703125, 9.4853515625, 9.860107421875, 10.23486328125, 10.609619140625, 10.984375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 9.0, 12.0, 9.0, 16.0, 13.0, 19.0, 29.0, 17.0, 31.0, 22.0, 25.0, 30.0, 44.0, 39.0, 50.0, 63.0, 101.0, 128.0, 235.0, 1355.0, 149.0, 108.0, 82.0, 64.0, 51.0, 43.0, 31.0, 40.0, 23.0, 36.0, 22.0, 27.0, 15.0, 15.0, 15.0, 12.0, 16.0, 8.0, 6.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0], "bins": [-15.96875, -15.4891357421875, -15.009521484375, -14.5299072265625, -14.05029296875, -13.5706787109375, -13.091064453125, -12.6114501953125, -12.1318359375, -11.6522216796875, -11.172607421875, -10.6929931640625, -10.21337890625, -9.7337646484375, -9.254150390625, -8.7745361328125, -8.294921875, -7.8153076171875, -7.335693359375, -6.8560791015625, -6.37646484375, -5.8968505859375, -5.417236328125, -4.9376220703125, -4.4580078125, -3.9783935546875, -3.498779296875, -3.0191650390625, -2.53955078125, -2.0599365234375, -1.580322265625, -1.1007080078125, -0.62109375, -0.1414794921875, 0.338134765625, 0.8177490234375, 1.29736328125, 1.7769775390625, 2.256591796875, 2.7362060546875, 3.2158203125, 3.6954345703125, 4.175048828125, 4.6546630859375, 5.13427734375, 5.6138916015625, 6.093505859375, 6.5731201171875, 7.052734375, 7.5323486328125, 8.011962890625, 8.4915771484375, 8.97119140625, 9.4508056640625, 9.930419921875, 10.4100341796875, 10.8896484375, 11.3692626953125, 11.848876953125, 12.3284912109375, 12.80810546875, 13.2877197265625, 13.767333984375, 14.2469482421875, 14.7265625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 11.0, 7.0, 15.0, 21.0, 32.0, 36.0, 64.0, 132.0, 230.0, 475.0, 1375.0, 5778.0, 47222.0, 2824890.0, 246964.0, 14330.0, 2565.0, 813.0, 327.0, 146.0, 91.0, 54.0, 40.0, 21.0, 19.0, 10.0, 14.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-54.65625, -52.81884765625, -50.9814453125, -49.14404296875, -47.306640625, -45.46923828125, -43.6318359375, -41.79443359375, -39.95703125, -38.11962890625, -36.2822265625, -34.44482421875, -32.607421875, -30.77001953125, -28.9326171875, -27.09521484375, -25.2578125, -23.42041015625, -21.5830078125, -19.74560546875, -17.908203125, -16.07080078125, -14.2333984375, -12.39599609375, -10.55859375, -8.72119140625, -6.8837890625, -5.04638671875, -3.208984375, -1.37158203125, 0.4658203125, 2.30322265625, 4.140625, 5.97802734375, 7.8154296875, 9.65283203125, 11.490234375, 13.32763671875, 15.1650390625, 17.00244140625, 18.83984375, 20.67724609375, 22.5146484375, 24.35205078125, 26.189453125, 28.02685546875, 29.8642578125, 31.70166015625, 33.5390625, 35.37646484375, 37.2138671875, 39.05126953125, 40.888671875, 42.72607421875, 44.5634765625, 46.40087890625, 48.23828125, 50.07568359375, 51.9130859375, 53.75048828125, 55.587890625, 57.42529296875, 59.2626953125, 61.10009765625, 62.9375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 372.0, 626.0, 16.0], "bins": [-1310.8900146484375, -1289.771728515625, -1268.6534423828125, -1247.53515625, -1226.4168701171875, -1205.298583984375, -1184.1802978515625, -1163.06201171875, -1141.943603515625, -1120.8253173828125, -1099.70703125, -1078.5887451171875, -1057.470458984375, -1036.3521728515625, -1015.2338256835938, -994.1155395507812, -972.997314453125, -951.8790283203125, -930.7607421875, -909.6424560546875, -888.524169921875, -867.4058227539062, -846.2875366210938, -825.1692504882812, -804.0509643554688, -782.9326782226562, -761.8143920898438, -740.6961059570312, -719.5777587890625, -698.45947265625, -677.3411865234375, -656.222900390625, -635.1046752929688, -613.9863891601562, -592.8681030273438, -571.7498168945312, -550.6314697265625, -529.51318359375, -508.3948974609375, -487.276611328125, -466.1583251953125, -445.0400390625, -423.9217529296875, -402.8034362792969, -381.6851501464844, -360.5668640136719, -339.44854736328125, -318.33026123046875, -297.21197509765625, -276.09368896484375, -254.9753875732422, -233.85708618164062, -212.73880004882812, -191.62051391601562, -170.50221252441406, -149.3839111328125, -128.265625, -107.14733123779297, -86.02903747558594, -64.9107437133789, -43.792449951171875, -22.674156188964844, -1.5558624267578125, 19.56243896484375, 40.680728912353516]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 7.0, 11.0, 12.0, 19.0, 9.0, 12.0, 16.0, 24.0, 24.0, 21.0, 36.0, 21.0, 35.0, 39.0, 35.0, 42.0, 41.0, 33.0, 53.0, 48.0, 32.0, 41.0, 25.0, 30.0, 46.0, 21.0, 40.0, 24.0, 28.0, 20.0, 17.0, 22.0, 15.0, 12.0, 13.0, 12.0, 11.0, 16.0, 8.0, 8.0, 4.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.19475173950195, -47.45106506347656, -45.707374572753906, -43.963687896728516, -42.21999740600586, -40.47631072998047, -38.73262023925781, -36.98893356323242, -35.245243072509766, -33.501556396484375, -31.75786590576172, -30.014177322387695, -28.270488739013672, -26.52680206298828, -24.783111572265625, -23.039424896240234, -21.29573631286621, -19.552047729492188, -17.808359146118164, -16.06467056274414, -14.320981979370117, -12.57729434967041, -10.833605766296387, -9.089917182922363, -7.34622859954834, -5.602540016174316, -3.858851671218872, -2.1151633262634277, -0.3714747428894043, 1.372213363647461, 3.1159019470214844, 4.859590530395508, 6.603279113769531, 8.346967697143555, 10.090656280517578, 11.834344863891602, 13.578033447265625, 15.321721076965332, 17.065410614013672, 18.809097290039062, 20.55278778076172, 22.296476364135742, 24.040164947509766, 25.78385353088379, 27.527542114257812, 29.271228790283203, 31.01491928100586, 32.75860595703125, 34.502296447753906, 36.2459831237793, 37.98967361450195, 39.733360290527344, 41.47705078125, 43.22073745727539, 44.96442794799805, 46.70811462402344, 48.45180130004883, 50.19548797607422, 51.939178466796875, 53.682865142822266, 55.42655563354492, 57.17024230957031, 58.91393280029297, 60.65761947631836, 62.401309967041016]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 6.0, 9.0, 9.0, 5.0, 13.0, 12.0, 18.0, 17.0, 10.0, 18.0, 21.0, 18.0, 34.0, 36.0, 27.0, 29.0, 36.0, 34.0, 42.0, 42.0, 34.0, 42.0, 41.0, 34.0, 41.0, 42.0, 43.0, 26.0, 31.0, 28.0, 26.0, 27.0, 18.0, 12.0, 19.0, 14.0, 16.0, 10.0, 11.0, 4.0, 12.0, 7.0, 3.0, 4.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.16015625, -4.01263427734375, -3.8651123046875, -3.71759033203125, -3.570068359375, -3.42254638671875, -3.2750244140625, -3.12750244140625, -2.97998046875, -2.83245849609375, -2.6849365234375, -2.53741455078125, -2.389892578125, -2.24237060546875, -2.0948486328125, -1.94732666015625, -1.7998046875, -1.65228271484375, -1.5047607421875, -1.35723876953125, -1.209716796875, -1.06219482421875, -0.9146728515625, -0.76715087890625, -0.61962890625, -0.47210693359375, -0.3245849609375, -0.17706298828125, -0.029541015625, 0.11798095703125, 0.2655029296875, 0.41302490234375, 0.560546875, 0.70806884765625, 0.8555908203125, 1.00311279296875, 1.150634765625, 1.29815673828125, 1.4456787109375, 1.59320068359375, 1.74072265625, 1.88824462890625, 2.0357666015625, 2.18328857421875, 2.330810546875, 2.47833251953125, 2.6258544921875, 2.77337646484375, 2.9208984375, 3.06842041015625, 3.2159423828125, 3.36346435546875, 3.510986328125, 3.65850830078125, 3.8060302734375, 3.95355224609375, 4.10107421875, 4.24859619140625, 4.3961181640625, 4.54364013671875, 4.691162109375, 4.83868408203125, 4.9862060546875, 5.13372802734375, 5.28125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 11.0, 9.0, 12.0, 11.0, 18.0, 24.0, 48.0, 44.0, 66.0, 114.0, 171.0, 264.0, 495.0, 824.0, 1450.0, 2493.0, 4451.0, 9120.0, 20397.0, 66838.0, 1318048.0, 2609618.0, 109113.0, 26746.0, 11333.0, 5518.0, 2804.0, 1702.0, 985.0, 601.0, 356.0, 211.0, 122.0, 77.0, 55.0, 30.0, 27.0, 19.0, 11.0, 13.0, 11.0, 10.0, 4.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.46142578125, -15.8759765625, -15.29052734375, -14.705078125, -14.11962890625, -13.5341796875, -12.94873046875, -12.36328125, -11.77783203125, -11.1923828125, -10.60693359375, -10.021484375, -9.43603515625, -8.8505859375, -8.26513671875, -7.6796875, -7.09423828125, -6.5087890625, -5.92333984375, -5.337890625, -4.75244140625, -4.1669921875, -3.58154296875, -2.99609375, -2.41064453125, -1.8251953125, -1.23974609375, -0.654296875, -0.06884765625, 0.5166015625, 1.10205078125, 1.6875, 2.27294921875, 2.8583984375, 3.44384765625, 4.029296875, 4.61474609375, 5.2001953125, 5.78564453125, 6.37109375, 6.95654296875, 7.5419921875, 8.12744140625, 8.712890625, 9.29833984375, 9.8837890625, 10.46923828125, 11.0546875, 11.64013671875, 12.2255859375, 12.81103515625, 13.396484375, 13.98193359375, 14.5673828125, 15.15283203125, 15.73828125, 16.32373046875, 16.9091796875, 17.49462890625, 18.080078125, 18.66552734375, 19.2509765625, 19.83642578125, 20.421875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 8.0, 0.0, 8.0, 7.0, 13.0, 10.0, 8.0, 22.0, 32.0, 27.0, 28.0, 58.0, 79.0, 127.0, 261.0, 512.0, 817.0, 791.0, 517.0, 266.0, 154.0, 76.0, 55.0, 38.0, 36.0, 27.0, 17.0, 15.0, 9.0, 10.0, 11.0, 6.0, 5.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.421875, -14.924560546875, -14.42724609375, -13.929931640625, -13.4326171875, -12.935302734375, -12.43798828125, -11.940673828125, -11.443359375, -10.946044921875, -10.44873046875, -9.951416015625, -9.4541015625, -8.956787109375, -8.45947265625, -7.962158203125, -7.46484375, -6.967529296875, -6.47021484375, -5.972900390625, -5.4755859375, -4.978271484375, -4.48095703125, -3.983642578125, -3.486328125, -2.989013671875, -2.49169921875, -1.994384765625, -1.4970703125, -0.999755859375, -0.50244140625, -0.005126953125, 0.4921875, 0.989501953125, 1.48681640625, 1.984130859375, 2.4814453125, 2.978759765625, 3.47607421875, 3.973388671875, 4.470703125, 4.968017578125, 5.46533203125, 5.962646484375, 6.4599609375, 6.957275390625, 7.45458984375, 7.951904296875, 8.44921875, 8.946533203125, 9.44384765625, 9.941162109375, 10.4384765625, 10.935791015625, 11.43310546875, 11.930419921875, 12.427734375, 12.925048828125, 13.42236328125, 13.919677734375, 14.4169921875, 14.914306640625, 15.41162109375, 15.908935546875, 16.40625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 7.0, 13.0, 19.0, 25.0, 26.0, 45.0, 60.0, 98.0, 117.0, 183.0, 245.0, 375.0, 621.0, 867.0, 1395.0, 2160.0, 3609.0, 5991.0, 10823.0, 21791.0, 53634.0, 212044.0, 2145841.0, 1486137.0, 159495.0, 45096.0, 19195.0, 9818.0, 5359.0, 3263.0, 2135.0, 1232.0, 787.0, 576.0, 367.0, 277.0, 165.0, 120.0, 85.0, 66.0, 37.0, 19.0, 26.0, 18.0, 5.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-18.703125, -18.16748046875, -17.6318359375, -17.09619140625, -16.560546875, -16.02490234375, -15.4892578125, -14.95361328125, -14.41796875, -13.88232421875, -13.3466796875, -12.81103515625, -12.275390625, -11.73974609375, -11.2041015625, -10.66845703125, -10.1328125, -9.59716796875, -9.0615234375, -8.52587890625, -7.990234375, -7.45458984375, -6.9189453125, -6.38330078125, -5.84765625, -5.31201171875, -4.7763671875, -4.24072265625, -3.705078125, -3.16943359375, -2.6337890625, -2.09814453125, -1.5625, -1.02685546875, -0.4912109375, 0.04443359375, 0.580078125, 1.11572265625, 1.6513671875, 2.18701171875, 2.72265625, 3.25830078125, 3.7939453125, 4.32958984375, 4.865234375, 5.40087890625, 5.9365234375, 6.47216796875, 7.0078125, 7.54345703125, 8.0791015625, 8.61474609375, 9.150390625, 9.68603515625, 10.2216796875, 10.75732421875, 11.29296875, 11.82861328125, 12.3642578125, 12.89990234375, 13.435546875, 13.97119140625, 14.5068359375, 15.04248046875, 15.578125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 42.0, 120.0, 282.0, 318.0, 158.0, 52.0, 13.0, 8.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-311.03076171875, -304.70758056640625, -298.3843688964844, -292.0611877441406, -285.73797607421875, -279.414794921875, -273.0915832519531, -266.7684020996094, -260.4451904296875, -254.1219940185547, -247.79879760742188, -241.47560119628906, -235.15240478515625, -228.82920837402344, -222.50601196289062, -216.1828155517578, -209.859619140625, -203.5364227294922, -197.21322631835938, -190.89002990722656, -184.56683349609375, -178.24363708496094, -171.92044067382812, -165.5972442626953, -159.27406311035156, -152.95086669921875, -146.62767028808594, -140.30447387695312, -133.9812774658203, -127.6580810546875, -121.33488464355469, -115.01168823242188, -108.68849182128906, -102.36529541015625, -96.04209899902344, -89.71890258789062, -83.39570617675781, -77.072509765625, -70.74931335449219, -64.42611694335938, -58.10292434692383, -51.779727935791016, -45.4565315246582, -39.133338928222656, -32.810142517089844, -26.4869441986084, -20.16374969482422, -13.840553283691406, -7.517356872558594, -1.1941609382629395, 5.129034996032715, 11.452230453491211, 17.775426864624023, 24.098623275756836, 30.421817779541016, 36.74501419067383, 43.06821060180664, 49.39140701293945, 55.714603424072266, 62.03779602050781, 68.36099243164062, 74.68418884277344, 81.00738525390625, 87.33058166503906, 93.65377807617188]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 9.0, 5.0, 3.0, 4.0, 9.0, 11.0, 8.0, 12.0, 8.0, 16.0, 26.0, 24.0, 24.0, 22.0, 26.0, 28.0, 37.0, 35.0, 40.0, 48.0, 38.0, 47.0, 49.0, 40.0, 33.0, 40.0, 30.0, 38.0, 40.0, 35.0, 32.0, 31.0, 26.0, 28.0, 25.0, 15.0, 14.0, 12.0, 10.0, 10.0, 6.0, 2.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-47.6296272277832, -46.21665573120117, -44.803680419921875, -43.390708923339844, -41.97773742675781, -40.564762115478516, -39.151790618896484, -37.73881530761719, -36.325843811035156, -34.912872314453125, -33.49989700317383, -32.0869255065918, -30.673952102661133, -29.26097869873047, -27.848007202148438, -26.435033798217773, -25.022062301635742, -23.609088897705078, -22.196117401123047, -20.783143997192383, -19.37017059326172, -17.957199096679688, -16.544225692749023, -15.13125228881836, -13.718279838562012, -12.305307388305664, -10.892333984375, -9.479361534118652, -8.066389083862305, -6.653415679931641, -5.240443229675293, -3.827469825744629, -2.4144973754882812, -1.001524567604065, 0.41144824028015137, 1.8244209289550781, 3.237393856048584, 4.65036678314209, 6.0633392333984375, 7.476312637329102, 8.88928508758545, 10.302257537841797, 11.715230941772461, 13.128203392028809, 14.541175842285156, 15.95414924621582, 17.367122650146484, 18.780094146728516, 20.19306755065918, 21.606040954589844, 23.019012451171875, 24.43198585510254, 25.844959259033203, 27.257930755615234, 28.6709041595459, 30.083877563476562, 31.496849060058594, 32.909820556640625, 34.32279586791992, 35.73576736450195, 37.148738861083984, 38.56171417236328, 39.97468566894531, 41.387657165527344, 42.80063247680664]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 10.0, 11.0, 10.0, 13.0, 8.0, 19.0, 16.0, 14.0, 20.0, 15.0, 29.0, 22.0, 20.0, 29.0, 36.0, 36.0, 39.0, 51.0, 37.0, 34.0, 51.0, 33.0, 32.0, 40.0, 52.0, 34.0, 35.0, 29.0, 30.0, 25.0, 21.0, 23.0, 21.0, 14.0, 17.0, 14.0, 15.0, 6.0, 6.0, 3.0, 3.0, 7.0, 6.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.56640625, -4.416748046875, -4.26708984375, -4.117431640625, -3.9677734375, -3.818115234375, -3.66845703125, -3.518798828125, -3.369140625, -3.219482421875, -3.06982421875, -2.920166015625, -2.7705078125, -2.620849609375, -2.47119140625, -2.321533203125, -2.171875, -2.022216796875, -1.87255859375, -1.722900390625, -1.5732421875, -1.423583984375, -1.27392578125, -1.124267578125, -0.974609375, -0.824951171875, -0.67529296875, -0.525634765625, -0.3759765625, -0.226318359375, -0.07666015625, 0.072998046875, 0.22265625, 0.372314453125, 0.52197265625, 0.671630859375, 0.8212890625, 0.970947265625, 1.12060546875, 1.270263671875, 1.419921875, 1.569580078125, 1.71923828125, 1.868896484375, 2.0185546875, 2.168212890625, 2.31787109375, 2.467529296875, 2.6171875, 2.766845703125, 2.91650390625, 3.066162109375, 3.2158203125, 3.365478515625, 3.51513671875, 3.664794921875, 3.814453125, 3.964111328125, 4.11376953125, 4.263427734375, 4.4130859375, 4.562744140625, 4.71240234375, 4.862060546875, 5.01171875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 13.0, 16.0, 14.0, 30.0, 35.0, 52.0, 62.0, 82.0, 130.0, 175.0, 279.0, 340.0, 521.0, 714.0, 1053.0, 1600.0, 2622.0, 4285.0, 7936.0, 16150.0, 41155.0, 172410.0, 634156.0, 104066.0, 30465.0, 12980.0, 6571.0, 3727.0, 2216.0, 1436.0, 1006.0, 650.0, 434.0, 344.0, 242.0, 154.0, 111.0, 102.0, 61.0, 35.0, 39.0, 26.0, 12.0, 10.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0], "bins": [-25.421875, -24.63623046875, -23.8505859375, -23.06494140625, -22.279296875, -21.49365234375, -20.7080078125, -19.92236328125, -19.13671875, -18.35107421875, -17.5654296875, -16.77978515625, -15.994140625, -15.20849609375, -14.4228515625, -13.63720703125, -12.8515625, -12.06591796875, -11.2802734375, -10.49462890625, -9.708984375, -8.92333984375, -8.1376953125, -7.35205078125, -6.56640625, -5.78076171875, -4.9951171875, -4.20947265625, -3.423828125, -2.63818359375, -1.8525390625, -1.06689453125, -0.28125, 0.50439453125, 1.2900390625, 2.07568359375, 2.861328125, 3.64697265625, 4.4326171875, 5.21826171875, 6.00390625, 6.78955078125, 7.5751953125, 8.36083984375, 9.146484375, 9.93212890625, 10.7177734375, 11.50341796875, 12.2890625, 13.07470703125, 13.8603515625, 14.64599609375, 15.431640625, 16.21728515625, 17.0029296875, 17.78857421875, 18.57421875, 19.35986328125, 20.1455078125, 20.93115234375, 21.716796875, 22.50244140625, 23.2880859375, 24.07373046875, 24.859375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 7.0, 9.0, 9.0, 11.0, 12.0, 12.0, 21.0, 20.0, 24.0, 27.0, 24.0, 28.0, 17.0, 33.0, 27.0, 31.0, 32.0, 38.0, 40.0, 34.0, 1063.0, 42.0, 45.0, 44.0, 46.0, 34.0, 34.0, 35.0, 32.0, 18.0, 22.0, 23.0, 19.0, 23.0, 14.0, 12.0, 14.0, 12.0, 9.0, 6.0, 4.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62109375, -4.47705078125, -4.3330078125, -4.18896484375, -4.044921875, -3.90087890625, -3.7568359375, -3.61279296875, -3.46875, -3.32470703125, -3.1806640625, -3.03662109375, -2.892578125, -2.74853515625, -2.6044921875, -2.46044921875, -2.31640625, -2.17236328125, -2.0283203125, -1.88427734375, -1.740234375, -1.59619140625, -1.4521484375, -1.30810546875, -1.1640625, -1.02001953125, -0.8759765625, -0.73193359375, -0.587890625, -0.44384765625, -0.2998046875, -0.15576171875, -0.01171875, 0.13232421875, 0.2763671875, 0.42041015625, 0.564453125, 0.70849609375, 0.8525390625, 0.99658203125, 1.140625, 1.28466796875, 1.4287109375, 1.57275390625, 1.716796875, 1.86083984375, 2.0048828125, 2.14892578125, 2.29296875, 2.43701171875, 2.5810546875, 2.72509765625, 2.869140625, 3.01318359375, 3.1572265625, 3.30126953125, 3.4453125, 3.58935546875, 3.7333984375, 3.87744140625, 4.021484375, 4.16552734375, 4.3095703125, 4.45361328125, 4.59765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 14.0, 16.0, 30.0, 39.0, 41.0, 89.0, 103.0, 173.0, 270.0, 365.0, 562.0, 882.0, 1339.0, 2363.0, 4003.0, 7381.0, 15467.0, 39038.0, 210448.0, 1658620.0, 101336.0, 27875.0, 11918.0, 6026.0, 3334.0, 1965.0, 1241.0, 736.0, 462.0, 355.0, 216.0, 130.0, 83.0, 71.0, 48.0, 26.0, 23.0, 7.0, 15.0, 3.0, 5.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.796875, -25.045654296875, -24.29443359375, -23.543212890625, -22.7919921875, -22.040771484375, -21.28955078125, -20.538330078125, -19.787109375, -19.035888671875, -18.28466796875, -17.533447265625, -16.7822265625, -16.031005859375, -15.27978515625, -14.528564453125, -13.77734375, -13.026123046875, -12.27490234375, -11.523681640625, -10.7724609375, -10.021240234375, -9.27001953125, -8.518798828125, -7.767578125, -7.016357421875, -6.26513671875, -5.513916015625, -4.7626953125, -4.011474609375, -3.26025390625, -2.509033203125, -1.7578125, -1.006591796875, -0.25537109375, 0.495849609375, 1.2470703125, 1.998291015625, 2.74951171875, 3.500732421875, 4.251953125, 5.003173828125, 5.75439453125, 6.505615234375, 7.2568359375, 8.008056640625, 8.75927734375, 9.510498046875, 10.26171875, 11.012939453125, 11.76416015625, 12.515380859375, 13.2666015625, 14.017822265625, 14.76904296875, 15.520263671875, 16.271484375, 17.022705078125, 17.77392578125, 18.525146484375, 19.2763671875, 20.027587890625, 20.77880859375, 21.530029296875, 22.28125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 1.0, 6.0, 9.0, 13.0, 23.0, 26.0, 36.0, 90.0, 382.0, 212.0, 60.0, 43.0, 15.0, 18.0, 12.0, 6.0, 8.0, 9.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.0318603515625, -7.719970703125, -7.4080810546875, -7.09619140625, -6.7843017578125, -6.472412109375, -6.1605224609375, -5.8486328125, -5.5367431640625, -5.224853515625, -4.9129638671875, -4.60107421875, -4.2891845703125, -3.977294921875, -3.6654052734375, -3.353515625, -3.0416259765625, -2.729736328125, -2.4178466796875, -2.10595703125, -1.7940673828125, -1.482177734375, -1.1702880859375, -0.8583984375, -0.5465087890625, -0.234619140625, 0.0772705078125, 0.38916015625, 0.7010498046875, 1.012939453125, 1.3248291015625, 1.63671875, 1.9486083984375, 2.260498046875, 2.5723876953125, 2.88427734375, 3.1961669921875, 3.508056640625, 3.8199462890625, 4.1318359375, 4.4437255859375, 4.755615234375, 5.0675048828125, 5.37939453125, 5.6912841796875, 6.003173828125, 6.3150634765625, 6.626953125, 6.9388427734375, 7.250732421875, 7.5626220703125, 7.87451171875, 8.1864013671875, 8.498291015625, 8.8101806640625, 9.1220703125, 9.4339599609375, 9.745849609375, 10.0577392578125, 10.36962890625, 10.6815185546875, 10.993408203125, 11.3052978515625, 11.6171875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 5.0, 7.0, 12.0, 13.0, 11.0, 15.0, 19.0, 15.0, 50.0, 84.0, 137.0, 447.0, 1712.0, 12632.0, 1009161.0, 21154.0, 2093.0, 509.0, 176.0, 101.0, 59.0, 32.0, 21.0, 14.0, 15.0, 17.0, 10.0, 3.0, 8.0, 4.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-141.375, -137.2861328125, -133.197265625, -129.1083984375, -125.01953125, -120.9306640625, -116.841796875, -112.7529296875, -108.6640625, -104.5751953125, -100.486328125, -96.3974609375, -92.30859375, -88.2197265625, -84.130859375, -80.0419921875, -75.953125, -71.8642578125, -67.775390625, -63.6865234375, -59.59765625, -55.5087890625, -51.419921875, -47.3310546875, -43.2421875, -39.1533203125, -35.064453125, -30.9755859375, -26.88671875, -22.7978515625, -18.708984375, -14.6201171875, -10.53125, -6.4423828125, -2.353515625, 1.7353515625, 5.82421875, 9.9130859375, 14.001953125, 18.0908203125, 22.1796875, 26.2685546875, 30.357421875, 34.4462890625, 38.53515625, 42.6240234375, 46.712890625, 50.8017578125, 54.890625, 58.9794921875, 63.068359375, 67.1572265625, 71.24609375, 75.3349609375, 79.423828125, 83.5126953125, 87.6015625, 91.6904296875, 95.779296875, 99.8681640625, 103.95703125, 108.0458984375, 112.134765625, 116.2236328125, 120.3125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 7.0, 7.0, 16.0, 18.0, 37.0, 73.0, 111.0, 245.0, 215.0, 111.0, 64.0, 32.0, 29.0, 13.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.527434349060059, -13.045394897460938, -12.563356399536133, -12.081316947937012, -11.599278450012207, -11.117238998413086, -10.635200500488281, -10.15316104888916, -9.671121597290039, -9.189082145690918, -8.707043647766113, -8.225004196166992, -7.7429656982421875, -7.260926246643066, -6.7788872718811035, -6.296848297119141, -5.814809799194336, -5.332770824432373, -4.85073184967041, -4.368692398071289, -3.8866536617279053, -3.4046146869659424, -2.9225754737854004, -2.4405364990234375, -1.9584975242614746, -1.4764585494995117, -0.9944194555282593, -0.5123803615570068, -0.030341386795043945, 0.45169758796691895, 0.9337368011474609, 1.4157757759094238, 1.8978157043457031, 2.379854679107666, 2.861893653869629, 3.343932867050171, 3.825971841812134, 4.308011054992676, 4.790050029754639, 5.272089004516602, 5.7541279792785645, 6.236166954040527, 6.71820592880249, 7.200244903564453, 7.682284355163574, 8.164322853088379, 8.6463623046875, 9.128400802612305, 9.610440254211426, 10.092479705810547, 10.574518203735352, 11.056557655334473, 11.538596153259277, 12.020635604858398, 12.502674102783203, 12.984713554382324, 13.466753005981445, 13.948792457580566, 14.430830955505371, 14.912870407104492, 15.394908905029297, 15.876948356628418, 16.35898780822754, 16.841026306152344, 17.32306480407715]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 6.0, 8.0, 8.0, 8.0, 13.0, 16.0, 24.0, 14.0, 19.0, 24.0, 28.0, 29.0, 29.0, 37.0, 42.0, 43.0, 39.0, 42.0, 44.0, 32.0, 44.0, 49.0, 45.0, 61.0, 35.0, 42.0, 28.0, 28.0, 23.0, 20.0, 13.0, 14.0, 19.0, 12.0, 9.0, 10.0, 8.0, 7.0, 5.0, 6.0, 4.0, 7.0, 4.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-7.91430139541626, -7.684327602386475, -7.4543538093566895, -7.224379539489746, -6.994405746459961, -6.764431953430176, -6.534458160400391, -6.3044843673706055, -6.07451057434082, -5.844536781311035, -5.61456298828125, -5.384589195251465, -5.1546149253845215, -4.924641132354736, -4.694667339324951, -4.464693546295166, -4.234719276428223, -4.0047454833984375, -3.7747714519500732, -3.544797658920288, -3.314823865890503, -3.0848498344421387, -2.8548760414123535, -2.6249022483825684, -2.394928455352783, -2.164954662322998, -1.9349807500839233, -1.7050068378448486, -1.4750330448150635, -1.2450591325759888, -1.015085220336914, -0.7851114273071289, -0.5551376342773438, -0.3251637816429138, -0.0951898992061615, 0.13478398323059082, 0.36475783586502075, 0.5947316884994507, 0.8247056007385254, 1.0546793937683105, 1.2846533060073853, 1.51462721824646, 1.7446010112762451, 1.9745749235153198, 2.2045488357543945, 2.4345226287841797, 2.664496421813965, 2.89447021484375, 3.1244442462921143, 3.3544180393218994, 3.5843920707702637, 3.814365863800049, 4.044339656829834, 4.274313449859619, 4.5042877197265625, 4.734261512756348, 4.964235305786133, 5.194209098815918, 5.424182891845703, 5.654156684875488, 5.884130954742432, 6.114104747772217, 6.344078540802002, 6.574052333831787, 6.804026126861572]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 12.0, 11.0, 10.0, 8.0, 11.0, 16.0, 17.0, 18.0, 20.0, 23.0, 19.0, 26.0, 32.0, 33.0, 40.0, 34.0, 47.0, 42.0, 41.0, 38.0, 46.0, 35.0, 37.0, 34.0, 40.0, 29.0, 30.0, 32.0, 24.0, 31.0, 26.0, 24.0, 24.0, 7.0, 13.0, 14.0, 10.0, 12.0, 3.0, 4.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.82421875, -4.66864013671875, -4.5130615234375, -4.35748291015625, -4.201904296875, -4.04632568359375, -3.8907470703125, -3.73516845703125, -3.57958984375, -3.42401123046875, -3.2684326171875, -3.11285400390625, -2.957275390625, -2.80169677734375, -2.6461181640625, -2.49053955078125, -2.3349609375, -2.17938232421875, -2.0238037109375, -1.86822509765625, -1.712646484375, -1.55706787109375, -1.4014892578125, -1.24591064453125, -1.09033203125, -0.93475341796875, -0.7791748046875, -0.62359619140625, -0.468017578125, -0.31243896484375, -0.1568603515625, -0.00128173828125, 0.154296875, 0.30987548828125, 0.4654541015625, 0.62103271484375, 0.776611328125, 0.93218994140625, 1.0877685546875, 1.24334716796875, 1.39892578125, 1.55450439453125, 1.7100830078125, 1.86566162109375, 2.021240234375, 2.17681884765625, 2.3323974609375, 2.48797607421875, 2.6435546875, 2.79913330078125, 2.9547119140625, 3.11029052734375, 3.265869140625, 3.42144775390625, 3.5770263671875, 3.73260498046875, 3.88818359375, 4.04376220703125, 4.1993408203125, 4.35491943359375, 4.510498046875, 4.66607666015625, 4.8216552734375, 4.97723388671875, 5.1328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 2.0, 8.0, 9.0, 12.0, 20.0, 33.0, 40.0, 57.0, 73.0, 97.0, 131.0, 181.0, 264.0, 324.0, 515.0, 697.0, 1019.0, 1520.0, 2266.0, 3592.0, 5797.0, 10543.0, 19890.0, 50151.0, 264947.0, 546203.0, 80121.0, 27019.0, 13097.0, 7180.0, 4302.0, 2811.0, 1614.0, 1209.0, 792.0, 596.0, 381.0, 287.0, 179.0, 170.0, 103.0, 81.0, 66.0, 44.0, 37.0, 21.0, 16.0, 12.0, 6.0, 10.0, 5.0, 0.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-12.359375, -11.975341796875, -11.59130859375, -11.207275390625, -10.8232421875, -10.439208984375, -10.05517578125, -9.671142578125, -9.287109375, -8.903076171875, -8.51904296875, -8.135009765625, -7.7509765625, -7.366943359375, -6.98291015625, -6.598876953125, -6.21484375, -5.830810546875, -5.44677734375, -5.062744140625, -4.6787109375, -4.294677734375, -3.91064453125, -3.526611328125, -3.142578125, -2.758544921875, -2.37451171875, -1.990478515625, -1.6064453125, -1.222412109375, -0.83837890625, -0.454345703125, -0.0703125, 0.313720703125, 0.69775390625, 1.081787109375, 1.4658203125, 1.849853515625, 2.23388671875, 2.617919921875, 3.001953125, 3.385986328125, 3.77001953125, 4.154052734375, 4.5380859375, 4.922119140625, 5.30615234375, 5.690185546875, 6.07421875, 6.458251953125, 6.84228515625, 7.226318359375, 7.6103515625, 7.994384765625, 8.37841796875, 8.762451171875, 9.146484375, 9.530517578125, 9.91455078125, 10.298583984375, 10.6826171875, 11.066650390625, 11.45068359375, 11.834716796875, 12.21875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 0.0, 7.0, 10.0, 7.0, 9.0, 12.0, 10.0, 11.0, 17.0, 23.0, 30.0, 22.0, 38.0, 31.0, 44.0, 59.0, 71.0, 106.0, 135.0, 263.0, 1381.0, 206.0, 105.0, 84.0, 55.0, 53.0, 44.0, 34.0, 35.0, 26.0, 20.0, 12.0, 17.0, 12.0, 9.0, 11.0, 4.0, 11.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.28125, -19.6103515625, -18.939453125, -18.2685546875, -17.59765625, -16.9267578125, -16.255859375, -15.5849609375, -14.9140625, -14.2431640625, -13.572265625, -12.9013671875, -12.23046875, -11.5595703125, -10.888671875, -10.2177734375, -9.546875, -8.8759765625, -8.205078125, -7.5341796875, -6.86328125, -6.1923828125, -5.521484375, -4.8505859375, -4.1796875, -3.5087890625, -2.837890625, -2.1669921875, -1.49609375, -0.8251953125, -0.154296875, 0.5166015625, 1.1875, 1.8583984375, 2.529296875, 3.2001953125, 3.87109375, 4.5419921875, 5.212890625, 5.8837890625, 6.5546875, 7.2255859375, 7.896484375, 8.5673828125, 9.23828125, 9.9091796875, 10.580078125, 11.2509765625, 11.921875, 12.5927734375, 13.263671875, 13.9345703125, 14.60546875, 15.2763671875, 15.947265625, 16.6181640625, 17.2890625, 17.9599609375, 18.630859375, 19.3017578125, 19.97265625, 20.6435546875, 21.314453125, 21.9853515625, 22.65625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 7.0, 2.0, 2.0, 5.0, 10.0, 11.0, 19.0, 25.0, 31.0, 35.0, 58.0, 77.0, 104.0, 210.0, 419.0, 929.0, 3537.0, 28912.0, 2674659.0, 418830.0, 14112.0, 2176.0, 707.0, 321.0, 155.0, 91.0, 67.0, 54.0, 38.0, 34.0, 23.0, 11.0, 18.0, 6.0, 9.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-51.59375, -49.67236328125, -47.7509765625, -45.82958984375, -43.908203125, -41.98681640625, -40.0654296875, -38.14404296875, -36.22265625, -34.30126953125, -32.3798828125, -30.45849609375, -28.537109375, -26.61572265625, -24.6943359375, -22.77294921875, -20.8515625, -18.93017578125, -17.0087890625, -15.08740234375, -13.166015625, -11.24462890625, -9.3232421875, -7.40185546875, -5.48046875, -3.55908203125, -1.6376953125, 0.28369140625, 2.205078125, 4.12646484375, 6.0478515625, 7.96923828125, 9.890625, 11.81201171875, 13.7333984375, 15.65478515625, 17.576171875, 19.49755859375, 21.4189453125, 23.34033203125, 25.26171875, 27.18310546875, 29.1044921875, 31.02587890625, 32.947265625, 34.86865234375, 36.7900390625, 38.71142578125, 40.6328125, 42.55419921875, 44.4755859375, 46.39697265625, 48.318359375, 50.23974609375, 52.1611328125, 54.08251953125, 56.00390625, 57.92529296875, 59.8466796875, 61.76806640625, 63.689453125, 65.61083984375, 67.5322265625, 69.45361328125, 71.375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 80.0, 345.0, 435.0, 113.0, 27.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-258.848388671875, -251.2611083984375, -243.673828125, -236.0865478515625, -228.499267578125, -220.9119873046875, -213.32470703125, -205.7374267578125, -198.150146484375, -190.5628662109375, -182.9755859375, -175.3883056640625, -167.801025390625, -160.2137451171875, -152.62646484375, -145.0391845703125, -137.451904296875, -129.8646240234375, -122.27734375, -114.6900634765625, -107.102783203125, -99.5155029296875, -91.92822265625, -84.3409423828125, -76.753662109375, -69.1663818359375, -61.5791015625, -53.9918212890625, -46.404541015625, -38.8172607421875, -31.22998046875, -23.6427001953125, -16.055404663085938, -8.468124389648438, -0.8808441162109375, 6.7064361572265625, 14.293716430664062, 21.880996704101562, 29.468276977539062, 37.05555725097656, 44.64283752441406, 52.23011779785156, 59.81739807128906, 67.40467834472656, 74.99195861816406, 82.57923889160156, 90.16651916503906, 97.75379943847656, 105.34107971191406, 112.92835998535156, 120.51564025878906, 128.10292053222656, 135.69020080566406, 143.27748107910156, 150.86476135253906, 158.45204162597656, 166.03932189941406, 173.62660217285156, 181.21388244628906, 188.80116271972656, 196.38844299316406, 203.97572326660156, 211.56300354003906, 219.15028381347656, 226.73756408691406]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 12.0, 9.0, 7.0, 12.0, 11.0, 19.0, 24.0, 21.0, 32.0, 29.0, 25.0, 25.0, 33.0, 31.0, 40.0, 33.0, 35.0, 37.0, 51.0, 35.0, 40.0, 37.0, 42.0, 26.0, 41.0, 28.0, 31.0, 24.0, 29.0, 19.0, 29.0, 21.0, 16.0, 8.0, 21.0, 11.0, 8.0, 6.0, 7.0, 7.0, 3.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-56.27058410644531, -54.56818771362305, -52.86579132080078, -51.16339111328125, -49.460994720458984, -47.75859832763672, -46.05620193481445, -44.35380554199219, -42.65140914916992, -40.949012756347656, -39.24661636352539, -37.544219970703125, -35.841819763183594, -34.13942337036133, -32.43702697753906, -30.734630584716797, -29.0322322845459, -27.329835891723633, -25.627437591552734, -23.92504119873047, -22.222644805908203, -20.520248413085938, -18.81785011291504, -17.115453720092773, -15.413056373596191, -13.71065902709961, -12.008262634277344, -10.305865287780762, -8.60346794128418, -6.901071548461914, -5.198674201965332, -3.4962778091430664, -1.7938804626464844, -0.091483473777771, 1.6109135150909424, 3.3133106231689453, 5.015707492828369, 6.718104362487793, 8.420501708984375, 10.12289810180664, 11.825295448303223, 13.527692794799805, 15.23008918762207, 16.93248748779297, 18.634883880615234, 20.3372802734375, 22.039676666259766, 23.74207305908203, 25.44447135925293, 27.146867752075195, 28.849266052246094, 30.55166244506836, 32.254058837890625, 33.95645523071289, 35.658851623535156, 37.36125183105469, 39.06364822387695, 40.76604461669922, 42.468441009521484, 44.17083740234375, 45.87323760986328, 47.57563400268555, 49.27803039550781, 50.98042678833008, 52.682823181152344]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 8.0, 3.0, 9.0, 8.0, 13.0, 17.0, 14.0, 15.0, 20.0, 18.0, 15.0, 22.0, 26.0, 32.0, 35.0, 31.0, 38.0, 40.0, 43.0, 42.0, 40.0, 57.0, 46.0, 35.0, 36.0, 34.0, 35.0, 22.0, 27.0, 34.0, 19.0, 30.0, 11.0, 18.0, 27.0, 16.0, 8.0, 12.0, 10.0, 8.0, 5.0, 4.0, 9.0, 6.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.890625, -4.7235107421875, -4.556396484375, -4.3892822265625, -4.22216796875, -4.0550537109375, -3.887939453125, -3.7208251953125, -3.5537109375, -3.3865966796875, -3.219482421875, -3.0523681640625, -2.88525390625, -2.7181396484375, -2.551025390625, -2.3839111328125, -2.216796875, -2.0496826171875, -1.882568359375, -1.7154541015625, -1.54833984375, -1.3812255859375, -1.214111328125, -1.0469970703125, -0.8798828125, -0.7127685546875, -0.545654296875, -0.3785400390625, -0.21142578125, -0.0443115234375, 0.122802734375, 0.2899169921875, 0.45703125, 0.6241455078125, 0.791259765625, 0.9583740234375, 1.12548828125, 1.2926025390625, 1.459716796875, 1.6268310546875, 1.7939453125, 1.9610595703125, 2.128173828125, 2.2952880859375, 2.46240234375, 2.6295166015625, 2.796630859375, 2.9637451171875, 3.130859375, 3.2979736328125, 3.465087890625, 3.6322021484375, 3.79931640625, 3.9664306640625, 4.133544921875, 4.3006591796875, 4.4677734375, 4.6348876953125, 4.802001953125, 4.9691162109375, 5.13623046875, 5.3033447265625, 5.470458984375, 5.6375732421875, 5.8046875]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 7.0, 11.0, 7.0, 20.0, 23.0, 30.0, 43.0, 70.0, 85.0, 160.0, 241.0, 345.0, 617.0, 1025.0, 1758.0, 3231.0, 6336.0, 13990.0, 39965.0, 430359.0, 3292319.0, 337706.0, 38046.0, 13928.0, 6261.0, 3342.0, 1728.0, 1019.0, 609.0, 332.0, 237.0, 153.0, 85.0, 63.0, 44.0, 29.0, 13.0, 18.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-19.984375, -19.4208984375, -18.857421875, -18.2939453125, -17.73046875, -17.1669921875, -16.603515625, -16.0400390625, -15.4765625, -14.9130859375, -14.349609375, -13.7861328125, -13.22265625, -12.6591796875, -12.095703125, -11.5322265625, -10.96875, -10.4052734375, -9.841796875, -9.2783203125, -8.71484375, -8.1513671875, -7.587890625, -7.0244140625, -6.4609375, -5.8974609375, -5.333984375, -4.7705078125, -4.20703125, -3.6435546875, -3.080078125, -2.5166015625, -1.953125, -1.3896484375, -0.826171875, -0.2626953125, 0.30078125, 0.8642578125, 1.427734375, 1.9912109375, 2.5546875, 3.1181640625, 3.681640625, 4.2451171875, 4.80859375, 5.3720703125, 5.935546875, 6.4990234375, 7.0625, 7.6259765625, 8.189453125, 8.7529296875, 9.31640625, 9.8798828125, 10.443359375, 11.0068359375, 11.5703125, 12.1337890625, 12.697265625, 13.2607421875, 13.82421875, 14.3876953125, 14.951171875, 15.5146484375, 16.078125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 2.0, 3.0, 12.0, 9.0, 11.0, 14.0, 13.0, 21.0, 38.0, 63.0, 97.0, 170.0, 366.0, 795.0, 1054.0, 679.0, 295.0, 153.0, 94.0, 48.0, 29.0, 29.0, 20.0, 10.0, 10.0, 9.0, 8.0, 9.0, 3.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.71875, -21.08642578125, -20.4541015625, -19.82177734375, -19.189453125, -18.55712890625, -17.9248046875, -17.29248046875, -16.66015625, -16.02783203125, -15.3955078125, -14.76318359375, -14.130859375, -13.49853515625, -12.8662109375, -12.23388671875, -11.6015625, -10.96923828125, -10.3369140625, -9.70458984375, -9.072265625, -8.43994140625, -7.8076171875, -7.17529296875, -6.54296875, -5.91064453125, -5.2783203125, -4.64599609375, -4.013671875, -3.38134765625, -2.7490234375, -2.11669921875, -1.484375, -0.85205078125, -0.2197265625, 0.41259765625, 1.044921875, 1.67724609375, 2.3095703125, 2.94189453125, 3.57421875, 4.20654296875, 4.8388671875, 5.47119140625, 6.103515625, 6.73583984375, 7.3681640625, 8.00048828125, 8.6328125, 9.26513671875, 9.8974609375, 10.52978515625, 11.162109375, 11.79443359375, 12.4267578125, 13.05908203125, 13.69140625, 14.32373046875, 14.9560546875, 15.58837890625, 16.220703125, 16.85302734375, 17.4853515625, 18.11767578125, 18.75]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 9.0, 13.0, 23.0, 27.0, 68.0, 131.0, 272.0, 659.0, 1693.0, 4891.0, 18342.0, 126145.0, 3683125.0, 319751.0, 28330.0, 6977.0, 2276.0, 846.0, 365.0, 148.0, 82.0, 39.0, 21.0, 11.0, 9.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.08740234375, -33.8623046875, -32.63720703125, -31.412109375, -30.18701171875, -28.9619140625, -27.73681640625, -26.51171875, -25.28662109375, -24.0615234375, -22.83642578125, -21.611328125, -20.38623046875, -19.1611328125, -17.93603515625, -16.7109375, -15.48583984375, -14.2607421875, -13.03564453125, -11.810546875, -10.58544921875, -9.3603515625, -8.13525390625, -6.91015625, -5.68505859375, -4.4599609375, -3.23486328125, -2.009765625, -0.78466796875, 0.4404296875, 1.66552734375, 2.890625, 4.11572265625, 5.3408203125, 6.56591796875, 7.791015625, 9.01611328125, 10.2412109375, 11.46630859375, 12.69140625, 13.91650390625, 15.1416015625, 16.36669921875, 17.591796875, 18.81689453125, 20.0419921875, 21.26708984375, 22.4921875, 23.71728515625, 24.9423828125, 26.16748046875, 27.392578125, 28.61767578125, 29.8427734375, 31.06787109375, 32.29296875, 33.51806640625, 34.7431640625, 35.96826171875, 37.193359375, 38.41845703125, 39.6435546875, 40.86865234375, 42.09375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 8.0, 27.0, 111.0, 336.0, 324.0, 133.0, 51.0, 13.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-245.24896240234375, -238.44882202148438, -231.648681640625, -224.84854125976562, -218.04840087890625, -211.24826049804688, -204.4481201171875, -197.6479949951172, -190.8478546142578, -184.04771423339844, -177.24757385253906, -170.4474334716797, -163.6472930908203, -156.84716796875, -150.04702758789062, -143.24688720703125, -136.44674682617188, -129.6466064453125, -122.84646606445312, -116.04632568359375, -109.2461929321289, -102.44605255126953, -95.64591217041016, -88.84577941894531, -82.04562377929688, -75.2454833984375, -68.44534301757812, -61.645206451416016, -54.845069885253906, -48.04492950439453, -41.244789123535156, -34.44465255737305, -27.644515991210938, -20.844377517700195, -14.044238090515137, -7.244098663330078, -0.44396018981933594, 6.356178283691406, 13.156318664550781, 19.95645523071289, 26.756595611572266, 33.55673599243164, 40.35687255859375, 47.157012939453125, 53.9571533203125, 60.75728988647461, 67.55743408203125, 74.3575668334961, 81.15770721435547, 87.95784759521484, 94.75798797607422, 101.55812072753906, 108.35826110839844, 115.15840148925781, 121.95854187011719, 128.75868225097656, 135.55882263183594, 142.3589630126953, 149.1591033935547, 155.95924377441406, 162.75938415527344, 169.55950927734375, 176.35964965820312, 183.1597900390625, 189.95993041992188]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 9.0, 12.0, 6.0, 18.0, 5.0, 12.0, 18.0, 15.0, 27.0, 27.0, 28.0, 29.0, 32.0, 41.0, 48.0, 38.0, 42.0, 39.0, 47.0, 29.0, 50.0, 39.0, 37.0, 34.0, 36.0, 37.0, 32.0, 35.0, 20.0, 31.0, 23.0, 19.0, 18.0, 16.0, 9.0, 6.0, 3.0, 6.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.95659637451172, -40.59119415283203, -39.22578811645508, -37.86038589477539, -36.4949836730957, -35.129581451416016, -33.76417541503906, -32.398773193359375, -31.033370971679688, -29.667966842651367, -28.30256462097168, -26.93716049194336, -25.571758270263672, -24.20635414123535, -22.84095001220703, -21.475547790527344, -20.110143661499023, -18.744739532470703, -17.379337310791016, -16.013933181762695, -14.648530960083008, -13.283126831054688, -11.917723655700684, -10.55232048034668, -9.186917304992676, -7.821514129638672, -6.456110954284668, -5.090707302093506, -3.725304126739502, -2.359900951385498, -0.9944972991943359, 0.37090587615966797, 1.7363090515136719, 3.101712226867676, 4.46711540222168, 5.832519054412842, 7.197922229766846, 8.563325881958008, 9.928729057312012, 11.294132232666016, 12.65953540802002, 14.024938583374023, 15.390341758728027, 16.75574493408203, 18.12114906311035, 19.48655128479004, 20.85195541381836, 22.217357635498047, 23.582761764526367, 24.948165893554688, 26.313568115234375, 27.678972244262695, 29.044374465942383, 30.409778594970703, 31.77518081665039, 33.140586853027344, 34.50598907470703, 35.87139129638672, 37.23679733276367, 38.60219955444336, 39.96760177612305, 41.333003997802734, 42.69841003417969, 44.063812255859375, 45.42921447753906]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 7.0, 8.0, 4.0, 7.0, 8.0, 7.0, 17.0, 15.0, 19.0, 17.0, 14.0, 23.0, 22.0, 25.0, 26.0, 36.0, 34.0, 44.0, 45.0, 40.0, 50.0, 50.0, 45.0, 51.0, 39.0, 36.0, 34.0, 22.0, 31.0, 39.0, 22.0, 32.0, 23.0, 10.0, 17.0, 17.0, 16.0, 15.0, 9.0, 7.0, 9.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59765625, -4.42657470703125, -4.2554931640625, -4.08441162109375, -3.913330078125, -3.74224853515625, -3.5711669921875, -3.40008544921875, -3.22900390625, -3.05792236328125, -2.8868408203125, -2.71575927734375, -2.544677734375, -2.37359619140625, -2.2025146484375, -2.03143310546875, -1.8603515625, -1.68927001953125, -1.5181884765625, -1.34710693359375, -1.176025390625, -1.00494384765625, -0.8338623046875, -0.66278076171875, -0.49169921875, -0.32061767578125, -0.1495361328125, 0.02154541015625, 0.192626953125, 0.36370849609375, 0.5347900390625, 0.70587158203125, 0.876953125, 1.04803466796875, 1.2191162109375, 1.39019775390625, 1.561279296875, 1.73236083984375, 1.9034423828125, 2.07452392578125, 2.24560546875, 2.41668701171875, 2.5877685546875, 2.75885009765625, 2.929931640625, 3.10101318359375, 3.2720947265625, 3.44317626953125, 3.6142578125, 3.78533935546875, 3.9564208984375, 4.12750244140625, 4.298583984375, 4.46966552734375, 4.6407470703125, 4.81182861328125, 4.98291015625, 5.15399169921875, 5.3250732421875, 5.49615478515625, 5.667236328125, 5.83831787109375, 6.0093994140625, 6.18048095703125, 6.3515625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 10.0, 14.0, 20.0, 24.0, 46.0, 58.0, 78.0, 112.0, 138.0, 218.0, 312.0, 493.0, 775.0, 1101.0, 1780.0, 2781.0, 4496.0, 7457.0, 12494.0, 22096.0, 42138.0, 96348.0, 544265.0, 180636.0, 60112.0, 29609.0, 16093.0, 9358.0, 5577.0, 3544.0, 2182.0, 1319.0, 927.0, 630.0, 365.0, 275.0, 198.0, 140.0, 102.0, 78.0, 42.0, 25.0, 27.0, 22.0, 14.0, 6.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-20.171875, -19.5556640625, -18.939453125, -18.3232421875, -17.70703125, -17.0908203125, -16.474609375, -15.8583984375, -15.2421875, -14.6259765625, -14.009765625, -13.3935546875, -12.77734375, -12.1611328125, -11.544921875, -10.9287109375, -10.3125, -9.6962890625, -9.080078125, -8.4638671875, -7.84765625, -7.2314453125, -6.615234375, -5.9990234375, -5.3828125, -4.7666015625, -4.150390625, -3.5341796875, -2.91796875, -2.3017578125, -1.685546875, -1.0693359375, -0.453125, 0.1630859375, 0.779296875, 1.3955078125, 2.01171875, 2.6279296875, 3.244140625, 3.8603515625, 4.4765625, 5.0927734375, 5.708984375, 6.3251953125, 6.94140625, 7.5576171875, 8.173828125, 8.7900390625, 9.40625, 10.0224609375, 10.638671875, 11.2548828125, 11.87109375, 12.4873046875, 13.103515625, 13.7197265625, 14.3359375, 14.9521484375, 15.568359375, 16.1845703125, 16.80078125, 17.4169921875, 18.033203125, 18.6494140625, 19.265625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 3.0, 1.0, 3.0, 8.0, 6.0, 9.0, 10.0, 10.0, 5.0, 17.0, 12.0, 16.0, 19.0, 19.0, 31.0, 39.0, 25.0, 27.0, 51.0, 43.0, 39.0, 47.0, 31.0, 1056.0, 40.0, 34.0, 32.0, 32.0, 38.0, 25.0, 41.0, 23.0, 33.0, 29.0, 20.0, 24.0, 21.0, 17.0, 16.0, 11.0, 13.0, 15.0, 7.0, 7.0, 4.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 4.0], "bins": [-4.80078125, -4.667205810546875, -4.53363037109375, -4.400054931640625, -4.2664794921875, -4.132904052734375, -3.99932861328125, -3.865753173828125, -3.732177734375, -3.598602294921875, -3.46502685546875, -3.331451416015625, -3.1978759765625, -3.064300537109375, -2.93072509765625, -2.797149658203125, -2.66357421875, -2.529998779296875, -2.39642333984375, -2.262847900390625, -2.1292724609375, -1.995697021484375, -1.86212158203125, -1.728546142578125, -1.594970703125, -1.461395263671875, -1.32781982421875, -1.194244384765625, -1.0606689453125, -0.927093505859375, -0.79351806640625, -0.659942626953125, -0.5263671875, -0.392791748046875, -0.25921630859375, -0.125640869140625, 0.0079345703125, 0.141510009765625, 0.27508544921875, 0.408660888671875, 0.542236328125, 0.675811767578125, 0.80938720703125, 0.942962646484375, 1.0765380859375, 1.210113525390625, 1.34368896484375, 1.477264404296875, 1.61083984375, 1.744415283203125, 1.87799072265625, 2.011566162109375, 2.1451416015625, 2.278717041015625, 2.41229248046875, 2.545867919921875, 2.679443359375, 2.813018798828125, 2.94659423828125, 3.080169677734375, 3.2137451171875, 3.347320556640625, 3.48089599609375, 3.614471435546875, 3.748046875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 9.0, 11.0, 16.0, 18.0, 25.0, 34.0, 55.0, 62.0, 94.0, 140.0, 190.0, 281.0, 383.0, 568.0, 812.0, 1226.0, 1925.0, 3104.0, 5228.0, 9775.0, 20130.0, 61022.0, 1431395.0, 474495.0, 47339.0, 17377.0, 8451.0, 4684.0, 2890.0, 1744.0, 1089.0, 776.0, 556.0, 377.0, 238.0, 173.0, 118.0, 97.0, 51.0, 49.0, 39.0, 21.0, 17.0, 13.0, 11.0, 6.0, 4.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 3.0], "bins": [-25.515625, -24.740234375, -23.96484375, -23.189453125, -22.4140625, -21.638671875, -20.86328125, -20.087890625, -19.3125, -18.537109375, -17.76171875, -16.986328125, -16.2109375, -15.435546875, -14.66015625, -13.884765625, -13.109375, -12.333984375, -11.55859375, -10.783203125, -10.0078125, -9.232421875, -8.45703125, -7.681640625, -6.90625, -6.130859375, -5.35546875, -4.580078125, -3.8046875, -3.029296875, -2.25390625, -1.478515625, -0.703125, 0.072265625, 0.84765625, 1.623046875, 2.3984375, 3.173828125, 3.94921875, 4.724609375, 5.5, 6.275390625, 7.05078125, 7.826171875, 8.6015625, 9.376953125, 10.15234375, 10.927734375, 11.703125, 12.478515625, 13.25390625, 14.029296875, 14.8046875, 15.580078125, 16.35546875, 17.130859375, 17.90625, 18.681640625, 19.45703125, 20.232421875, 21.0078125, 21.783203125, 22.55859375, 23.333984375, 24.109375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 2.0, 2.0, 5.0, 2.0, 11.0, 16.0, 52.0, 133.0, 521.0, 130.0, 64.0, 23.0, 6.0, 4.0, 10.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6796875, -11.3406982421875, -11.001708984375, -10.6627197265625, -10.32373046875, -9.9847412109375, -9.645751953125, -9.3067626953125, -8.9677734375, -8.6287841796875, -8.289794921875, -7.9508056640625, -7.61181640625, -7.2728271484375, -6.933837890625, -6.5948486328125, -6.255859375, -5.9168701171875, -5.577880859375, -5.2388916015625, -4.89990234375, -4.5609130859375, -4.221923828125, -3.8829345703125, -3.5439453125, -3.2049560546875, -2.865966796875, -2.5269775390625, -2.18798828125, -1.8489990234375, -1.510009765625, -1.1710205078125, -0.83203125, -0.4930419921875, -0.154052734375, 0.1849365234375, 0.52392578125, 0.8629150390625, 1.201904296875, 1.5408935546875, 1.8798828125, 2.2188720703125, 2.557861328125, 2.8968505859375, 3.23583984375, 3.5748291015625, 3.913818359375, 4.2528076171875, 4.591796875, 4.9307861328125, 5.269775390625, 5.6087646484375, 5.94775390625, 6.2867431640625, 6.625732421875, 6.9647216796875, 7.3037109375, 7.6427001953125, 7.981689453125, 8.3206787109375, 8.65966796875, 8.9986572265625, 9.337646484375, 9.6766357421875, 10.015625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 9.0, 7.0, 5.0, 9.0, 15.0, 17.0, 29.0, 31.0, 63.0, 135.0, 400.0, 1564.0, 11770.0, 1020983.0, 11206.0, 1603.0, 391.0, 116.0, 60.0, 35.0, 16.0, 13.0, 13.0, 12.0, 6.0, 11.0, 6.0, 7.0, 2.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-125.3125, -121.0634765625, -116.814453125, -112.5654296875, -108.31640625, -104.0673828125, -99.818359375, -95.5693359375, -91.3203125, -87.0712890625, -82.822265625, -78.5732421875, -74.32421875, -70.0751953125, -65.826171875, -61.5771484375, -57.328125, -53.0791015625, -48.830078125, -44.5810546875, -40.33203125, -36.0830078125, -31.833984375, -27.5849609375, -23.3359375, -19.0869140625, -14.837890625, -10.5888671875, -6.33984375, -2.0908203125, 2.158203125, 6.4072265625, 10.65625, 14.9052734375, 19.154296875, 23.4033203125, 27.65234375, 31.9013671875, 36.150390625, 40.3994140625, 44.6484375, 48.8974609375, 53.146484375, 57.3955078125, 61.64453125, 65.8935546875, 70.142578125, 74.3916015625, 78.640625, 82.8896484375, 87.138671875, 91.3876953125, 95.63671875, 99.8857421875, 104.134765625, 108.3837890625, 112.6328125, 116.8818359375, 121.130859375, 125.3798828125, 129.62890625, 133.8779296875, 138.126953125, 142.3759765625, 146.625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 9.0, 25.0, 70.0, 324.0, 455.0, 93.0, 25.0, 5.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.83820343017578, -39.603981018066406, -38.3697624206543, -37.13554000854492, -35.90131759643555, -34.66709518432617, -33.43287658691406, -32.19865417480469, -30.964431762695312, -29.73021125793457, -28.495988845825195, -27.261768341064453, -26.027545928955078, -24.793325424194336, -23.559104919433594, -22.32488250732422, -21.090662002563477, -19.856441497802734, -18.62221908569336, -17.387998580932617, -16.153776168823242, -14.9195556640625, -13.685334205627441, -12.451112747192383, -11.216891288757324, -9.982669830322266, -8.748448371887207, -7.514227390289307, -6.280005931854248, -5.0457844734191895, -3.811563491821289, -2.5773420333862305, -1.3431205749511719, -0.10889923572540283, 1.1253221035003662, 2.3595433235168457, 3.5937647819519043, 4.827986240386963, 6.062207221984863, 7.296428680419922, 8.53065013885498, 9.764871597290039, 10.999093055725098, 12.233314514160156, 13.467535018920898, 14.701757431030273, 15.935977935791016, 17.17020034790039, 18.404420852661133, 19.638641357421875, 20.87286376953125, 22.107084274291992, 23.341306686401367, 24.57552719116211, 25.809749603271484, 27.043970108032227, 28.27819061279297, 29.51241111755371, 30.746633529663086, 31.980854034423828, 33.2150764465332, 34.44929885864258, 35.68351745605469, 36.91773986816406, 38.15196228027344]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 4.0, 6.0, 6.0, 14.0, 13.0, 6.0, 21.0, 24.0, 18.0, 21.0, 29.0, 28.0, 30.0, 19.0, 29.0, 42.0, 35.0, 45.0, 36.0, 37.0, 41.0, 39.0, 33.0, 45.0, 40.0, 27.0, 33.0, 45.0, 39.0, 24.0, 12.0, 22.0, 23.0, 21.0, 10.0, 11.0, 14.0, 7.0, 9.0, 11.0, 5.0, 3.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-6.155326843261719, -5.963757038116455, -5.77218770980835, -5.580617904663086, -5.3890485763549805, -5.197478771209717, -5.005909442901611, -4.814339637756348, -4.622770309448242, -4.4312005043029785, -4.239631175994873, -4.048061370849609, -3.856492042541504, -3.6649224758148193, -3.4733529090881348, -3.281783103942871, -3.0902135372161865, -2.898643970489502, -2.7070744037628174, -2.515504837036133, -2.3239352703094482, -2.1323657035827637, -1.9407960176467896, -1.749226450920105, -1.5576568841934204, -1.3660873174667358, -1.1745177507400513, -0.9829481244087219, -0.7913785576820374, -0.5998089909553528, -0.40823936462402344, -0.21666979789733887, -0.025100231170654297, 0.16646935045719147, 0.35803893208503723, 0.5496085286140442, 0.7411780953407288, 0.9327476620674133, 1.1243172883987427, 1.3158868551254272, 1.5074564218521118, 1.6990259885787964, 1.890595555305481, 2.082165241241455, 2.2737348079681396, 2.465304374694824, 2.656873941421509, 2.8484435081481934, 3.040013074874878, 3.2315826416015625, 3.423152208328247, 3.6147217750549316, 3.806291341781616, 3.997860908508301, 4.1894307136535645, 4.38100004196167, 4.572569847106934, 4.764139652252197, 4.955708980560303, 5.147278785705566, 5.338848114013672, 5.5304179191589355, 5.721987247467041, 5.913557052612305, 6.10512638092041]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 6.0, 2.0, 7.0, 10.0, 10.0, 12.0, 19.0, 10.0, 19.0, 26.0, 14.0, 17.0, 18.0, 26.0, 31.0, 30.0, 35.0, 35.0, 49.0, 57.0, 42.0, 54.0, 41.0, 46.0, 37.0, 32.0, 36.0, 34.0, 34.0, 20.0, 26.0, 25.0, 14.0, 22.0, 19.0, 18.0, 12.0, 7.0, 15.0, 11.0, 8.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.70703125, -4.536865234375, -4.36669921875, -4.196533203125, -4.0263671875, -3.856201171875, -3.68603515625, -3.515869140625, -3.345703125, -3.175537109375, -3.00537109375, -2.835205078125, -2.6650390625, -2.494873046875, -2.32470703125, -2.154541015625, -1.984375, -1.814208984375, -1.64404296875, -1.473876953125, -1.3037109375, -1.133544921875, -0.96337890625, -0.793212890625, -0.623046875, -0.452880859375, -0.28271484375, -0.112548828125, 0.0576171875, 0.227783203125, 0.39794921875, 0.568115234375, 0.73828125, 0.908447265625, 1.07861328125, 1.248779296875, 1.4189453125, 1.589111328125, 1.75927734375, 1.929443359375, 2.099609375, 2.269775390625, 2.43994140625, 2.610107421875, 2.7802734375, 2.950439453125, 3.12060546875, 3.290771484375, 3.4609375, 3.631103515625, 3.80126953125, 3.971435546875, 4.1416015625, 4.311767578125, 4.48193359375, 4.652099609375, 4.822265625, 4.992431640625, 5.16259765625, 5.332763671875, 5.5029296875, 5.673095703125, 5.84326171875, 6.013427734375, 6.18359375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 19.0, 23.0, 29.0, 42.0, 50.0, 66.0, 97.0, 129.0, 189.0, 243.0, 374.0, 550.0, 760.0, 1186.0, 1831.0, 3056.0, 5048.0, 9091.0, 16814.0, 34421.0, 81751.0, 258111.0, 403688.0, 130604.0, 48781.0, 22580.0, 11689.0, 6638.0, 3738.0, 2399.0, 1483.0, 945.0, 617.0, 422.0, 322.0, 200.0, 138.0, 107.0, 97.0, 55.0, 39.0, 29.0, 28.0, 19.0, 14.0, 9.0, 7.0, 7.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.19921875, -6.96099853515625, -6.7227783203125, -6.48455810546875, -6.246337890625, -6.00811767578125, -5.7698974609375, -5.53167724609375, -5.29345703125, -5.05523681640625, -4.8170166015625, -4.57879638671875, -4.340576171875, -4.10235595703125, -3.8641357421875, -3.62591552734375, -3.3876953125, -3.14947509765625, -2.9112548828125, -2.67303466796875, -2.434814453125, -2.19659423828125, -1.9583740234375, -1.72015380859375, -1.48193359375, -1.24371337890625, -1.0054931640625, -0.76727294921875, -0.529052734375, -0.29083251953125, -0.0526123046875, 0.18560791015625, 0.423828125, 0.66204833984375, 0.9002685546875, 1.13848876953125, 1.376708984375, 1.61492919921875, 1.8531494140625, 2.09136962890625, 2.32958984375, 2.56781005859375, 2.8060302734375, 3.04425048828125, 3.282470703125, 3.52069091796875, 3.7589111328125, 3.99713134765625, 4.2353515625, 4.47357177734375, 4.7117919921875, 4.95001220703125, 5.188232421875, 5.42645263671875, 5.6646728515625, 5.90289306640625, 6.14111328125, 6.37933349609375, 6.6175537109375, 6.85577392578125, 7.093994140625, 7.33221435546875, 7.5704345703125, 7.80865478515625, 8.046875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 7.0, 4.0, 5.0, 11.0, 7.0, 7.0, 10.0, 30.0, 21.0, 25.0, 32.0, 34.0, 36.0, 56.0, 59.0, 69.0, 97.0, 128.0, 317.0, 1418.0, 171.0, 90.0, 64.0, 57.0, 44.0, 44.0, 47.0, 25.0, 23.0, 25.0, 16.0, 10.0, 9.0, 11.0, 13.0, 4.0, 2.0, 4.0, 9.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-23.1875, -22.46630859375, -21.7451171875, -21.02392578125, -20.302734375, -19.58154296875, -18.8603515625, -18.13916015625, -17.41796875, -16.69677734375, -15.9755859375, -15.25439453125, -14.533203125, -13.81201171875, -13.0908203125, -12.36962890625, -11.6484375, -10.92724609375, -10.2060546875, -9.48486328125, -8.763671875, -8.04248046875, -7.3212890625, -6.60009765625, -5.87890625, -5.15771484375, -4.4365234375, -3.71533203125, -2.994140625, -2.27294921875, -1.5517578125, -0.83056640625, -0.109375, 0.61181640625, 1.3330078125, 2.05419921875, 2.775390625, 3.49658203125, 4.2177734375, 4.93896484375, 5.66015625, 6.38134765625, 7.1025390625, 7.82373046875, 8.544921875, 9.26611328125, 9.9873046875, 10.70849609375, 11.4296875, 12.15087890625, 12.8720703125, 13.59326171875, 14.314453125, 15.03564453125, 15.7568359375, 16.47802734375, 17.19921875, 17.92041015625, 18.6416015625, 19.36279296875, 20.083984375, 20.80517578125, 21.5263671875, 22.24755859375, 22.96875]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 8.0, 13.0, 21.0, 31.0, 69.0, 180.0, 528.0, 2099.0, 92095.0, 3045063.0, 4299.0, 843.0, 250.0, 87.0, 45.0, 27.0, 18.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-177.75, -172.96875, -168.1875, -163.40625, -158.625, -153.84375, -149.0625, -144.28125, -139.5, -134.71875, -129.9375, -125.15625, -120.375, -115.59375, -110.8125, -106.03125, -101.25, -96.46875, -91.6875, -86.90625, -82.125, -77.34375, -72.5625, -67.78125, -63.0, -58.21875, -53.4375, -48.65625, -43.875, -39.09375, -34.3125, -29.53125, -24.75, -19.96875, -15.1875, -10.40625, -5.625, -0.84375, 3.9375, 8.71875, 13.5, 18.28125, 23.0625, 27.84375, 32.625, 37.40625, 42.1875, 46.96875, 51.75, 56.53125, 61.3125, 66.09375, 70.875, 75.65625, 80.4375, 85.21875, 90.0, 94.78125, 99.5625, 104.34375, 109.125, 113.90625, 118.6875, 123.46875, 128.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 29.0, 86.0, 221.0, 341.0, 200.0, 87.0, 28.0, 6.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.52264404296875, -137.16053771972656, -132.79843139648438, -128.4363250732422, -124.07421875, -119.71211242675781, -115.35001373291016, -110.98790740966797, -106.62580108642578, -102.2636947631836, -97.9015884399414, -93.53948211669922, -89.17738342285156, -84.81527709960938, -80.45317077636719, -76.091064453125, -71.72895812988281, -67.36685180664062, -63.00474548339844, -58.642642974853516, -54.28053665161133, -49.91843032836914, -45.55632781982422, -41.19422149658203, -36.832115173339844, -32.470008850097656, -28.1079044342041, -23.745800018310547, -19.38369369506836, -15.021587371826172, -10.659482955932617, -6.2973785400390625, -1.9352569580078125, 2.4268484115600586, 6.78895378112793, 11.1510591506958, 15.513164520263672, 19.87527084350586, 24.237375259399414, 28.59947967529297, 32.961585998535156, 37.323692321777344, 41.68579864501953, 46.04790115356445, 50.41000747680664, 54.77211380004883, 59.13421630859375, 63.49632263183594, 67.85842895507812, 72.22053527832031, 76.5826416015625, 80.94474792480469, 85.30685424804688, 89.66896057128906, 94.03105926513672, 98.3931655883789, 102.7552719116211, 107.11737823486328, 111.47948455810547, 115.84159088134766, 120.20368957519531, 124.5657958984375, 128.9279022216797, 133.29000854492188, 137.65211486816406]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 6.0, 15.0, 14.0, 7.0, 10.0, 21.0, 17.0, 15.0, 19.0, 34.0, 33.0, 33.0, 37.0, 29.0, 33.0, 29.0, 40.0, 30.0, 46.0, 32.0, 37.0, 36.0, 32.0, 37.0, 36.0, 36.0, 21.0, 34.0, 25.0, 31.0, 27.0, 15.0, 14.0, 20.0, 13.0, 12.0, 16.0, 13.0, 6.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.63307189941406, -60.77549362182617, -58.917911529541016, -57.060333251953125, -55.20275115966797, -53.34517288208008, -51.48759460449219, -49.63001251220703, -47.77243423461914, -45.91485595703125, -44.057273864746094, -42.1996955871582, -40.34211730957031, -38.484535217285156, -36.626956939697266, -34.769378662109375, -32.91179656982422, -31.054216384887695, -29.196636199951172, -27.33905792236328, -25.481477737426758, -23.623897552490234, -21.766319274902344, -19.90873908996582, -18.051158905029297, -16.193578720092773, -14.335999488830566, -12.47842025756836, -10.620840072631836, -8.763259887695312, -6.9056806564331055, -5.048101425170898, -3.190521240234375, -1.3329415321350098, 0.5246381759643555, 2.3822178840637207, 4.239797592163086, 6.097377777099609, 7.954957008361816, 9.812536239624023, 11.670116424560547, 13.52769660949707, 15.385275840759277, 17.242855072021484, 19.100435256958008, 20.95801544189453, 22.815593719482422, 24.673173904418945, 26.53075408935547, 28.388334274291992, 30.245914459228516, 32.103492736816406, 33.96107482910156, 35.81865310668945, 37.676231384277344, 39.5338134765625, 41.39139175415039, 43.24897003173828, 45.10655212402344, 46.96413040161133, 48.82170867919922, 50.679290771484375, 52.536869049072266, 54.394447326660156, 56.25202941894531]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 7.0, 5.0, 9.0, 11.0, 8.0, 19.0, 12.0, 22.0, 14.0, 23.0, 18.0, 22.0, 26.0, 28.0, 37.0, 29.0, 32.0, 43.0, 49.0, 45.0, 34.0, 53.0, 31.0, 42.0, 37.0, 34.0, 36.0, 30.0, 27.0, 22.0, 33.0, 22.0, 14.0, 18.0, 16.0, 23.0, 18.0, 7.0, 8.0, 11.0, 3.0, 8.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1171875, -4.93438720703125, -4.7515869140625, -4.56878662109375, -4.385986328125, -4.20318603515625, -4.0203857421875, -3.83758544921875, -3.65478515625, -3.47198486328125, -3.2891845703125, -3.10638427734375, -2.923583984375, -2.74078369140625, -2.5579833984375, -2.37518310546875, -2.1923828125, -2.00958251953125, -1.8267822265625, -1.64398193359375, -1.461181640625, -1.27838134765625, -1.0955810546875, -0.91278076171875, -0.72998046875, -0.54718017578125, -0.3643798828125, -0.18157958984375, 0.001220703125, 0.18402099609375, 0.3668212890625, 0.54962158203125, 0.732421875, 0.91522216796875, 1.0980224609375, 1.28082275390625, 1.463623046875, 1.64642333984375, 1.8292236328125, 2.01202392578125, 2.19482421875, 2.37762451171875, 2.5604248046875, 2.74322509765625, 2.926025390625, 3.10882568359375, 3.2916259765625, 3.47442626953125, 3.6572265625, 3.84002685546875, 4.0228271484375, 4.20562744140625, 4.388427734375, 4.57122802734375, 4.7540283203125, 4.93682861328125, 5.11962890625, 5.30242919921875, 5.4852294921875, 5.66802978515625, 5.850830078125, 6.03363037109375, 6.2164306640625, 6.39923095703125, 6.58203125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 11.0, 8.0, 11.0, 23.0, 21.0, 27.0, 50.0, 65.0, 84.0, 108.0, 166.0, 234.0, 319.0, 455.0, 681.0, 879.0, 1246.0, 1866.0, 2630.0, 4078.0, 6267.0, 10443.0, 19722.0, 50974.0, 241680.0, 1360900.0, 1960167.0, 394713.0, 76868.0, 25447.0, 12698.0, 7402.0, 4667.0, 2975.0, 2028.0, 1332.0, 888.0, 639.0, 450.0, 296.0, 230.0, 162.0, 107.0, 62.0, 67.0, 46.0, 32.0, 20.0, 9.0, 17.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-9.8046875, -9.4996337890625, -9.194580078125, -8.8895263671875, -8.58447265625, -8.2794189453125, -7.974365234375, -7.6693115234375, -7.3642578125, -7.0592041015625, -6.754150390625, -6.4490966796875, -6.14404296875, -5.8389892578125, -5.533935546875, -5.2288818359375, -4.923828125, -4.6187744140625, -4.313720703125, -4.0086669921875, -3.70361328125, -3.3985595703125, -3.093505859375, -2.7884521484375, -2.4833984375, -2.1783447265625, -1.873291015625, -1.5682373046875, -1.26318359375, -0.9581298828125, -0.653076171875, -0.3480224609375, -0.04296875, 0.2620849609375, 0.567138671875, 0.8721923828125, 1.17724609375, 1.4822998046875, 1.787353515625, 2.0924072265625, 2.3974609375, 2.7025146484375, 3.007568359375, 3.3126220703125, 3.61767578125, 3.9227294921875, 4.227783203125, 4.5328369140625, 4.837890625, 5.1429443359375, 5.447998046875, 5.7530517578125, 6.05810546875, 6.3631591796875, 6.668212890625, 6.9732666015625, 7.2783203125, 7.5833740234375, 7.888427734375, 8.1934814453125, 8.49853515625, 8.8035888671875, 9.108642578125, 9.4136962890625, 9.71875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 4.0, 2.0, 11.0, 5.0, 8.0, 11.0, 13.0, 14.0, 20.0, 28.0, 32.0, 61.0, 116.0, 169.0, 282.0, 496.0, 687.0, 712.0, 492.0, 321.0, 175.0, 105.0, 84.0, 58.0, 43.0, 25.0, 22.0, 11.0, 12.0, 8.0, 11.0, 4.0, 5.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.140625, -14.696533203125, -14.25244140625, -13.808349609375, -13.3642578125, -12.920166015625, -12.47607421875, -12.031982421875, -11.587890625, -11.143798828125, -10.69970703125, -10.255615234375, -9.8115234375, -9.367431640625, -8.92333984375, -8.479248046875, -8.03515625, -7.591064453125, -7.14697265625, -6.702880859375, -6.2587890625, -5.814697265625, -5.37060546875, -4.926513671875, -4.482421875, -4.038330078125, -3.59423828125, -3.150146484375, -2.7060546875, -2.261962890625, -1.81787109375, -1.373779296875, -0.9296875, -0.485595703125, -0.04150390625, 0.402587890625, 0.8466796875, 1.290771484375, 1.73486328125, 2.178955078125, 2.623046875, 3.067138671875, 3.51123046875, 3.955322265625, 4.3994140625, 4.843505859375, 5.28759765625, 5.731689453125, 6.17578125, 6.619873046875, 7.06396484375, 7.508056640625, 7.9521484375, 8.396240234375, 8.84033203125, 9.284423828125, 9.728515625, 10.172607421875, 10.61669921875, 11.060791015625, 11.5048828125, 11.948974609375, 12.39306640625, 12.837158203125, 13.28125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 6.0, 5.0, 10.0, 15.0, 29.0, 45.0, 50.0, 105.0, 137.0, 189.0, 314.0, 480.0, 738.0, 1232.0, 2215.0, 4150.0, 8818.0, 21260.0, 72136.0, 511546.0, 3043300.0, 425206.0, 64704.0, 20002.0, 8253.0, 3982.0, 2191.0, 1172.0, 690.0, 459.0, 278.0, 184.0, 122.0, 86.0, 57.0, 41.0, 29.0, 18.0, 10.0, 8.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-19.140625, -18.551025390625, -17.96142578125, -17.371826171875, -16.7822265625, -16.192626953125, -15.60302734375, -15.013427734375, -14.423828125, -13.834228515625, -13.24462890625, -12.655029296875, -12.0654296875, -11.475830078125, -10.88623046875, -10.296630859375, -9.70703125, -9.117431640625, -8.52783203125, -7.938232421875, -7.3486328125, -6.759033203125, -6.16943359375, -5.579833984375, -4.990234375, -4.400634765625, -3.81103515625, -3.221435546875, -2.6318359375, -2.042236328125, -1.45263671875, -0.863037109375, -0.2734375, 0.316162109375, 0.90576171875, 1.495361328125, 2.0849609375, 2.674560546875, 3.26416015625, 3.853759765625, 4.443359375, 5.032958984375, 5.62255859375, 6.212158203125, 6.8017578125, 7.391357421875, 7.98095703125, 8.570556640625, 9.16015625, 9.749755859375, 10.33935546875, 10.928955078125, 11.5185546875, 12.108154296875, 12.69775390625, 13.287353515625, 13.876953125, 14.466552734375, 15.05615234375, 15.645751953125, 16.2353515625, 16.824951171875, 17.41455078125, 18.004150390625, 18.59375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 35.0, 135.0, 423.0, 298.0, 85.0, 22.0, 9.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-335.96075439453125, -327.9210510253906, -319.88134765625, -311.8416748046875, -303.8019714355469, -295.76226806640625, -287.72259521484375, -279.6828918457031, -271.6431884765625, -263.6034851074219, -255.5637969970703, -247.52410888671875, -239.48440551757812, -231.4447021484375, -223.40501403808594, -215.36532592773438, -207.32562255859375, -199.28591918945312, -191.24623107910156, -183.20654296875, -175.16683959960938, -167.12713623046875, -159.0874481201172, -151.04776000976562, -143.008056640625, -134.96835327148438, -126.92866516113281, -118.88896942138672, -110.84927368164062, -102.80957794189453, -94.76988220214844, -86.73018646240234, -78.69050598144531, -70.65081024169922, -62.611114501953125, -54.57141876220703, -46.53172302246094, -38.492027282714844, -30.45233154296875, -22.412635803222656, -14.372940063476562, -6.333244323730469, 1.706451416015625, 9.746147155761719, 17.785842895507812, 25.825538635253906, 33.865234375, 41.904930114746094, 49.94462585449219, 57.98432159423828, 66.02401733398438, 74.06371307373047, 82.10340881347656, 90.14310455322266, 98.18280029296875, 106.22249603271484, 114.26219177246094, 122.30188751220703, 130.34158325195312, 138.38128662109375, 146.4209747314453, 154.46066284179688, 162.5003662109375, 170.54006958007812, 178.5797576904297]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 6.0, 4.0, 8.0, 9.0, 15.0, 20.0, 12.0, 22.0, 16.0, 22.0, 34.0, 31.0, 31.0, 34.0, 36.0, 33.0, 42.0, 43.0, 43.0, 34.0, 46.0, 40.0, 41.0, 42.0, 43.0, 41.0, 38.0, 27.0, 24.0, 27.0, 17.0, 17.0, 16.0, 19.0, 14.0, 6.0, 11.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.966026306152344, -38.600746154785156, -37.235469818115234, -35.87018966674805, -34.504913330078125, -33.13963317871094, -31.774354934692383, -30.409076690673828, -29.043798446655273, -27.67852020263672, -26.313241958618164, -24.94796371459961, -23.582683563232422, -22.2174072265625, -20.852127075195312, -19.486848831176758, -18.121570587158203, -16.75629234313965, -15.391014099121094, -14.025734901428223, -12.660456657409668, -11.295178413391113, -9.929899215698242, -8.564620971679688, -7.199342727661133, -5.834064483642578, -4.468785762786865, -3.1035070419311523, -1.7382287979125977, -0.37295055389404297, 0.9923286437988281, 2.357606887817383, 3.722881317138672, 5.088159561157227, 6.4534382820129395, 7.818717002868652, 9.183995246887207, 10.549273490905762, 11.914552688598633, 13.279830932617188, 14.645109176635742, 16.010387420654297, 17.37566566467285, 18.740943908691406, 20.106224060058594, 21.471500396728516, 22.836780548095703, 24.202058792114258, 25.567337036132812, 26.932615280151367, 28.297893524169922, 29.66317367553711, 31.02845001220703, 32.39373016357422, 33.759010314941406, 35.12428665161133, 36.48956298828125, 37.85484313964844, 39.22011947631836, 40.58539962768555, 41.95067596435547, 43.315956115722656, 44.681236267089844, 46.046512603759766, 47.41179275512695]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 5.0, 8.0, 10.0, 14.0, 10.0, 12.0, 15.0, 28.0, 24.0, 24.0, 23.0, 22.0, 35.0, 37.0, 34.0, 41.0, 44.0, 56.0, 51.0, 50.0, 45.0, 38.0, 39.0, 31.0, 49.0, 27.0, 25.0, 34.0, 29.0, 20.0, 15.0, 12.0, 20.0, 15.0, 18.0, 13.0, 6.0, 7.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.76953125, -5.5731201171875, -5.376708984375, -5.1802978515625, -4.98388671875, -4.7874755859375, -4.591064453125, -4.3946533203125, -4.1982421875, -4.0018310546875, -3.805419921875, -3.6090087890625, -3.41259765625, -3.2161865234375, -3.019775390625, -2.8233642578125, -2.626953125, -2.4305419921875, -2.234130859375, -2.0377197265625, -1.84130859375, -1.6448974609375, -1.448486328125, -1.2520751953125, -1.0556640625, -0.8592529296875, -0.662841796875, -0.4664306640625, -0.27001953125, -0.0736083984375, 0.122802734375, 0.3192138671875, 0.515625, 0.7120361328125, 0.908447265625, 1.1048583984375, 1.30126953125, 1.4976806640625, 1.694091796875, 1.8905029296875, 2.0869140625, 2.2833251953125, 2.479736328125, 2.6761474609375, 2.87255859375, 3.0689697265625, 3.265380859375, 3.4617919921875, 3.658203125, 3.8546142578125, 4.051025390625, 4.2474365234375, 4.44384765625, 4.6402587890625, 4.836669921875, 5.0330810546875, 5.2294921875, 5.4259033203125, 5.622314453125, 5.8187255859375, 6.01513671875, 6.2115478515625, 6.407958984375, 6.6043701171875, 6.80078125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 7.0, 10.0, 16.0, 19.0, 35.0, 51.0, 72.0, 79.0, 152.0, 229.0, 308.0, 423.0, 701.0, 941.0, 1624.0, 2652.0, 5013.0, 11095.0, 28341.0, 79143.0, 242806.0, 416950.0, 164109.0, 54927.0, 20218.0, 8309.0, 4023.0, 2177.0, 1355.0, 898.0, 623.0, 406.0, 255.0, 182.0, 113.0, 99.0, 60.0, 40.0, 36.0, 23.0, 8.0, 7.0, 7.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.263671875, -3.1627197265625, -3.061767578125, -2.9608154296875, -2.85986328125, -2.7589111328125, -2.657958984375, -2.5570068359375, -2.4560546875, -2.3551025390625, -2.254150390625, -2.1531982421875, -2.05224609375, -1.9512939453125, -1.850341796875, -1.7493896484375, -1.6484375, -1.5474853515625, -1.446533203125, -1.3455810546875, -1.24462890625, -1.1436767578125, -1.042724609375, -0.9417724609375, -0.8408203125, -0.7398681640625, -0.638916015625, -0.5379638671875, -0.43701171875, -0.3360595703125, -0.235107421875, -0.1341552734375, -0.033203125, 0.0677490234375, 0.168701171875, 0.2696533203125, 0.37060546875, 0.4715576171875, 0.572509765625, 0.6734619140625, 0.7744140625, 0.8753662109375, 0.976318359375, 1.0772705078125, 1.17822265625, 1.2791748046875, 1.380126953125, 1.4810791015625, 1.58203125, 1.6829833984375, 1.783935546875, 1.8848876953125, 1.98583984375, 2.0867919921875, 2.187744140625, 2.2886962890625, 2.3896484375, 2.4906005859375, 2.591552734375, 2.6925048828125, 2.79345703125, 2.8944091796875, 2.995361328125, 3.0963134765625, 3.197265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 7.0, 4.0, 14.0, 9.0, 13.0, 10.0, 18.0, 17.0, 9.0, 27.0, 25.0, 40.0, 31.0, 38.0, 43.0, 29.0, 46.0, 43.0, 36.0, 1071.0, 47.0, 43.0, 42.0, 37.0, 40.0, 45.0, 32.0, 28.0, 31.0, 30.0, 20.0, 16.0, 22.0, 13.0, 17.0, 13.0, 8.0, 2.0, 6.0, 6.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.22265625, -5.075927734375, -4.92919921875, -4.782470703125, -4.6357421875, -4.489013671875, -4.34228515625, -4.195556640625, -4.048828125, -3.902099609375, -3.75537109375, -3.608642578125, -3.4619140625, -3.315185546875, -3.16845703125, -3.021728515625, -2.875, -2.728271484375, -2.58154296875, -2.434814453125, -2.2880859375, -2.141357421875, -1.99462890625, -1.847900390625, -1.701171875, -1.554443359375, -1.40771484375, -1.260986328125, -1.1142578125, -0.967529296875, -0.82080078125, -0.674072265625, -0.52734375, -0.380615234375, -0.23388671875, -0.087158203125, 0.0595703125, 0.206298828125, 0.35302734375, 0.499755859375, 0.646484375, 0.793212890625, 0.93994140625, 1.086669921875, 1.2333984375, 1.380126953125, 1.52685546875, 1.673583984375, 1.8203125, 1.967041015625, 2.11376953125, 2.260498046875, 2.4072265625, 2.553955078125, 2.70068359375, 2.847412109375, 2.994140625, 3.140869140625, 3.28759765625, 3.434326171875, 3.5810546875, 3.727783203125, 3.87451171875, 4.021240234375, 4.16796875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 3.0, 5.0, 5.0, 12.0, 16.0, 21.0, 22.0, 43.0, 65.0, 85.0, 136.0, 213.0, 356.0, 560.0, 1076.0, 2247.0, 5562.0, 18863.0, 96657.0, 1252175.0, 628116.0, 67900.0, 14266.0, 4467.0, 1959.0, 902.0, 533.0, 300.0, 190.0, 115.0, 77.0, 57.0, 38.0, 23.0, 14.0, 12.0, 16.0, 7.0, 6.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.97265625, -2.87646484375, -2.7802734375, -2.68408203125, -2.587890625, -2.49169921875, -2.3955078125, -2.29931640625, -2.203125, -2.10693359375, -2.0107421875, -1.91455078125, -1.818359375, -1.72216796875, -1.6259765625, -1.52978515625, -1.43359375, -1.33740234375, -1.2412109375, -1.14501953125, -1.048828125, -0.95263671875, -0.8564453125, -0.76025390625, -0.6640625, -0.56787109375, -0.4716796875, -0.37548828125, -0.279296875, -0.18310546875, -0.0869140625, 0.00927734375, 0.10546875, 0.20166015625, 0.2978515625, 0.39404296875, 0.490234375, 0.58642578125, 0.6826171875, 0.77880859375, 0.875, 0.97119140625, 1.0673828125, 1.16357421875, 1.259765625, 1.35595703125, 1.4521484375, 1.54833984375, 1.64453125, 1.74072265625, 1.8369140625, 1.93310546875, 2.029296875, 2.12548828125, 2.2216796875, 2.31787109375, 2.4140625, 2.51025390625, 2.6064453125, 2.70263671875, 2.798828125, 2.89501953125, 2.9912109375, 3.08740234375, 3.18359375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 9.0, 7.0, 15.0, 12.0, 10.0, 15.0, 19.0, 25.0, 32.0, 47.0, 61.0, 100.0, 213.0, 137.0, 65.0, 49.0, 34.0, 39.0, 23.0, 13.0, 9.0, 13.0, 10.0, 5.0, 6.0, 7.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.48681640625, -0.4719505310058594, -0.45708465576171875, -0.4422187805175781, -0.4273529052734375, -0.4124870300292969, -0.39762115478515625, -0.3827552795410156, -0.367889404296875, -0.3530235290527344, -0.33815765380859375, -0.3232917785644531, -0.3084259033203125, -0.2935600280761719, -0.27869415283203125, -0.2638282775878906, -0.24896240234375, -0.23409652709960938, -0.21923065185546875, -0.20436477661132812, -0.1894989013671875, -0.17463302612304688, -0.15976715087890625, -0.14490127563476562, -0.130035400390625, -0.11516952514648438, -0.10030364990234375, -0.08543777465820312, -0.0705718994140625, -0.055706024169921875, -0.04084014892578125, -0.025974273681640625, -0.0111083984375, 0.003757476806640625, 0.01862335205078125, 0.033489227294921875, 0.0483551025390625, 0.06322097778320312, 0.07808685302734375, 0.09295272827148438, 0.107818603515625, 0.12268447875976562, 0.13755035400390625, 0.15241622924804688, 0.1672821044921875, 0.18214797973632812, 0.19701385498046875, 0.21187973022460938, 0.22674560546875, 0.24161148071289062, 0.25647735595703125, 0.2713432312011719, 0.2862091064453125, 0.3010749816894531, 0.31594085693359375, 0.3308067321777344, 0.345672607421875, 0.3605384826660156, 0.37540435791015625, 0.3902702331542969, 0.4051361083984375, 0.4200019836425781, 0.43486785888671875, 0.4497337341308594, 0.464599609375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 6.0, 6.0, 12.0, 9.0, 13.0, 24.0, 21.0, 40.0, 60.0, 107.0, 184.0, 492.0, 6451.0, 967647.0, 71477.0, 1293.0, 306.0, 151.0, 70.0, 42.0, 29.0, 16.0, 18.0, 19.0, 9.0, 10.0, 6.0, 6.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.2398681640625, -7.971923828125, -7.7039794921875, -7.43603515625, -7.1680908203125, -6.900146484375, -6.6322021484375, -6.3642578125, -6.0963134765625, -5.828369140625, -5.5604248046875, -5.29248046875, -5.0245361328125, -4.756591796875, -4.4886474609375, -4.220703125, -3.9527587890625, -3.684814453125, -3.4168701171875, -3.14892578125, -2.8809814453125, -2.613037109375, -2.3450927734375, -2.0771484375, -1.8092041015625, -1.541259765625, -1.2733154296875, -1.00537109375, -0.7374267578125, -0.469482421875, -0.2015380859375, 0.06640625, 0.3343505859375, 0.602294921875, 0.8702392578125, 1.13818359375, 1.4061279296875, 1.674072265625, 1.9420166015625, 2.2099609375, 2.4779052734375, 2.745849609375, 3.0137939453125, 3.28173828125, 3.5496826171875, 3.817626953125, 4.0855712890625, 4.353515625, 4.6214599609375, 4.889404296875, 5.1573486328125, 5.42529296875, 5.6932373046875, 5.961181640625, 6.2291259765625, 6.4970703125, 6.7650146484375, 7.032958984375, 7.3009033203125, 7.56884765625, 7.8367919921875, 8.104736328125, 8.3726806640625, 8.640625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 13.0, 40.0, 79.0, 195.0, 263.0, 222.0, 113.0, 55.0, 22.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0071334838867188, -0.9535536170005798, -0.8999736905097961, -0.8463938236236572, -0.7928138971328735, -0.7392340302467346, -0.6856541633605957, -0.632074236869812, -0.5784943103790283, -0.5249144434928894, -0.4713345170021057, -0.4177546501159668, -0.3641747236251831, -0.3105948567390442, -0.2570149600505829, -0.20343506336212158, -0.14985519647598267, -0.09627529978752136, -0.042695410549640656, 0.010884478688240051, 0.06446437537670135, 0.11804425716400146, 0.17162415385246277, 0.22520405054092407, 0.2787839472293854, 0.3323638439178467, 0.385943740606308, 0.4395236372947693, 0.4931035041809082, 0.5466834306716919, 0.6002632975578308, 0.6538431644439697, 0.7074230909347534, 0.7610029578208923, 0.814582884311676, 0.8681627511978149, 0.9217426776885986, 0.9753225445747375, 1.0289024114608765, 1.0824823379516602, 1.1360622644424438, 1.1896421909332275, 1.2432219982147217, 1.2968019247055054, 1.350381851196289, 1.4039616584777832, 1.457541584968567, 1.5111215114593506, 1.5647013187408447, 1.6182812452316284, 1.6718610525131226, 1.7254409790039062, 1.77902090549469, 1.8326008319854736, 1.8861806392669678, 1.9397605657577515, 1.9933404922485352, 2.0469202995300293, 2.1005003452301025, 2.1540801525115967, 2.207659959793091, 2.261240005493164, 2.314819812774658, 2.3683996200561523, 2.4219796657562256]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 7.0, 2.0, 6.0, 7.0, 5.0, 5.0, 9.0, 9.0, 13.0, 17.0, 22.0, 25.0, 29.0, 32.0, 28.0, 32.0, 31.0, 38.0, 39.0, 38.0, 43.0, 40.0, 43.0, 57.0, 38.0, 40.0, 43.0, 49.0, 33.0, 40.0, 26.0, 22.0, 20.0, 17.0, 20.0, 20.0, 16.0, 8.0, 9.0, 3.0, 6.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.3933756351470947, -0.38143232464790344, -0.36948901414871216, -0.35754573345184326, -0.345602422952652, -0.3336591124534607, -0.3217158317565918, -0.3097725212574005, -0.29782921075820923, -0.28588590025901794, -0.27394258975982666, -0.26199930906295776, -0.2500559985637665, -0.2381126880645752, -0.2261693924665451, -0.21422609686851501, -0.20228278636932373, -0.19033947587013245, -0.17839618027210236, -0.16645288467407227, -0.15450957417488098, -0.1425662636756897, -0.1306229680776596, -0.11867966502904892, -0.10673636198043823, -0.09479305893182755, -0.08284975588321686, -0.07090645283460617, -0.05896314978599548, -0.047019846737384796, -0.03507654368877411, -0.02313324064016342, -0.011189937591552734, 0.0007533654570579529, 0.01269666850566864, 0.024639971554279327, 0.036583274602890015, 0.0485265776515007, 0.06046988070011139, 0.07241318374872208, 0.08435648679733276, 0.09629978984594345, 0.10824309289455414, 0.12018639594316483, 0.1321296989917755, 0.1440730094909668, 0.1560163050889969, 0.16795960068702698, 0.17990291118621826, 0.19184622168540955, 0.20378951728343964, 0.21573281288146973, 0.227676123380661, 0.2396194338798523, 0.2515627145767212, 0.2635060250759125, 0.27544933557510376, 0.28739264607429504, 0.29933595657348633, 0.3112792372703552, 0.3232225477695465, 0.3351658582687378, 0.3471091389656067, 0.359052449464798, 0.37099575996398926]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 8.0, 8.0, 4.0, 13.0, 12.0, 16.0, 23.0, 29.0, 20.0, 26.0, 33.0, 29.0, 42.0, 26.0, 47.0, 49.0, 43.0, 37.0, 52.0, 54.0, 29.0, 43.0, 35.0, 27.0, 39.0, 24.0, 31.0, 27.0, 16.0, 32.0, 15.0, 15.0, 16.0, 20.0, 16.0, 14.0, 5.0, 2.0, 5.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.31964111328125, -5.1275634765625, -4.93548583984375, -4.743408203125, -4.55133056640625, -4.3592529296875, -4.16717529296875, -3.97509765625, -3.78302001953125, -3.5909423828125, -3.39886474609375, -3.206787109375, -3.01470947265625, -2.8226318359375, -2.63055419921875, -2.4384765625, -2.24639892578125, -2.0543212890625, -1.86224365234375, -1.670166015625, -1.47808837890625, -1.2860107421875, -1.09393310546875, -0.90185546875, -0.70977783203125, -0.5177001953125, -0.32562255859375, -0.133544921875, 0.05853271484375, 0.2506103515625, 0.44268798828125, 0.634765625, 0.82684326171875, 1.0189208984375, 1.21099853515625, 1.403076171875, 1.59515380859375, 1.7872314453125, 1.97930908203125, 2.17138671875, 2.36346435546875, 2.5555419921875, 2.74761962890625, 2.939697265625, 3.13177490234375, 3.3238525390625, 3.51593017578125, 3.7080078125, 3.90008544921875, 4.0921630859375, 4.28424072265625, 4.476318359375, 4.66839599609375, 4.8604736328125, 5.05255126953125, 5.24462890625, 5.43670654296875, 5.6287841796875, 5.82086181640625, 6.012939453125, 6.20501708984375, 6.3970947265625, 6.58917236328125, 6.78125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 8.0, 8.0, 6.0, 12.0, 12.0, 27.0, 23.0, 53.0, 63.0, 73.0, 114.0, 157.0, 234.0, 393.0, 562.0, 899.0, 1374.0, 2242.0, 3727.0, 6216.0, 11309.0, 21033.0, 45567.0, 119477.0, 362080.0, 296458.0, 95287.0, 38057.0, 18496.0, 9989.0, 5557.0, 3302.0, 2037.0, 1260.0, 797.0, 527.0, 328.0, 237.0, 180.0, 118.0, 62.0, 44.0, 44.0, 41.0, 31.0, 14.0, 14.0, 9.0, 0.0, 4.0, 1.0], "bins": [-12.78125, -12.4439697265625, -12.106689453125, -11.7694091796875, -11.43212890625, -11.0948486328125, -10.757568359375, -10.4202880859375, -10.0830078125, -9.7457275390625, -9.408447265625, -9.0711669921875, -8.73388671875, -8.3966064453125, -8.059326171875, -7.7220458984375, -7.384765625, -7.0474853515625, -6.710205078125, -6.3729248046875, -6.03564453125, -5.6983642578125, -5.361083984375, -5.0238037109375, -4.6865234375, -4.3492431640625, -4.011962890625, -3.6746826171875, -3.33740234375, -3.0001220703125, -2.662841796875, -2.3255615234375, -1.98828125, -1.6510009765625, -1.313720703125, -0.9764404296875, -0.63916015625, -0.3018798828125, 0.035400390625, 0.3726806640625, 0.7099609375, 1.0472412109375, 1.384521484375, 1.7218017578125, 2.05908203125, 2.3963623046875, 2.733642578125, 3.0709228515625, 3.408203125, 3.7454833984375, 4.082763671875, 4.4200439453125, 4.75732421875, 5.0946044921875, 5.431884765625, 5.7691650390625, 6.1064453125, 6.4437255859375, 6.781005859375, 7.1182861328125, 7.45556640625, 7.7928466796875, 8.130126953125, 8.4674072265625, 8.8046875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 4.0, 6.0, 6.0, 5.0, 9.0, 8.0, 7.0, 19.0, 21.0, 21.0, 24.0, 27.0, 43.0, 43.0, 59.0, 68.0, 90.0, 112.0, 227.0, 1414.0, 260.0, 145.0, 83.0, 62.0, 45.0, 45.0, 28.0, 33.0, 37.0, 22.0, 21.0, 13.0, 14.0, 6.0, 8.0, 3.0, 5.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.625, -23.662109375, -22.69921875, -21.736328125, -20.7734375, -19.810546875, -18.84765625, -17.884765625, -16.921875, -15.958984375, -14.99609375, -14.033203125, -13.0703125, -12.107421875, -11.14453125, -10.181640625, -9.21875, -8.255859375, -7.29296875, -6.330078125, -5.3671875, -4.404296875, -3.44140625, -2.478515625, -1.515625, -0.552734375, 0.41015625, 1.373046875, 2.3359375, 3.298828125, 4.26171875, 5.224609375, 6.1875, 7.150390625, 8.11328125, 9.076171875, 10.0390625, 11.001953125, 11.96484375, 12.927734375, 13.890625, 14.853515625, 15.81640625, 16.779296875, 17.7421875, 18.705078125, 19.66796875, 20.630859375, 21.59375, 22.556640625, 23.51953125, 24.482421875, 25.4453125, 26.408203125, 27.37109375, 28.333984375, 29.296875, 30.259765625, 31.22265625, 32.185546875, 33.1484375, 34.111328125, 35.07421875, 36.037109375, 37.0]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 8.0, 12.0, 17.0, 28.0, 23.0, 78.0, 119.0, 237.0, 571.0, 1720.0, 9503.0, 2033407.0, 1088789.0, 8372.0, 1695.0, 569.0, 208.0, 128.0, 56.0, 24.0, 26.0, 20.0, 25.0, 7.0, 8.0, 6.0, 2.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-110.0625, -106.6201171875, -103.177734375, -99.7353515625, -96.29296875, -92.8505859375, -89.408203125, -85.9658203125, -82.5234375, -79.0810546875, -75.638671875, -72.1962890625, -68.75390625, -65.3115234375, -61.869140625, -58.4267578125, -54.984375, -51.5419921875, -48.099609375, -44.6572265625, -41.21484375, -37.7724609375, -34.330078125, -30.8876953125, -27.4453125, -24.0029296875, -20.560546875, -17.1181640625, -13.67578125, -10.2333984375, -6.791015625, -3.3486328125, 0.09375, 3.5361328125, 6.978515625, 10.4208984375, 13.86328125, 17.3056640625, 20.748046875, 24.1904296875, 27.6328125, 31.0751953125, 34.517578125, 37.9599609375, 41.40234375, 44.8447265625, 48.287109375, 51.7294921875, 55.171875, 58.6142578125, 62.056640625, 65.4990234375, 68.94140625, 72.3837890625, 75.826171875, 79.2685546875, 82.7109375, 86.1533203125, 89.595703125, 93.0380859375, 96.48046875, 99.9228515625, 103.365234375, 106.8076171875, 110.25]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 190.0, 804.0, 21.0, 1.0, 1.0, 3.0], "bins": [-1539.7672119140625, -1513.7623291015625, -1487.7574462890625, -1461.7525634765625, -1435.74755859375, -1409.74267578125, -1383.73779296875, -1357.73291015625, -1331.72802734375, -1305.72314453125, -1279.71826171875, -1253.71337890625, -1227.7083740234375, -1201.7034912109375, -1175.6986083984375, -1149.6937255859375, -1123.6888427734375, -1097.6839599609375, -1071.6790771484375, -1045.6741943359375, -1019.6692504882812, -993.664306640625, -967.659423828125, -941.654541015625, -915.6495971679688, -889.6447143554688, -863.6397705078125, -837.6348876953125, -811.6300048828125, -785.6251220703125, -759.6201782226562, -733.6152954101562, -707.6104125976562, -681.6055297851562, -655.6005859375, -629.595703125, -603.5908203125, -577.5859375, -551.5809936523438, -525.5761108398438, -499.57122802734375, -473.5663146972656, -447.5614318847656, -421.5565185546875, -395.5516357421875, -369.5467224121094, -343.54180908203125, -317.53692626953125, -291.53204345703125, -265.5271301269531, -239.52224731445312, -213.517333984375, -187.512451171875, -161.50753784179688, -135.5026397705078, -109.49774169921875, -83.49282836914062, -57.48793029785156, -31.483028411865234, -5.478126525878906, 20.526771545410156, 46.53167724609375, 72.53657531738281, 98.54147338867188, 124.54637145996094]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 6.0, 2.0, 3.0, 10.0, 16.0, 12.0, 16.0, 12.0, 15.0, 18.0, 24.0, 31.0, 23.0, 38.0, 33.0, 32.0, 40.0, 35.0, 49.0, 60.0, 39.0, 26.0, 55.0, 43.0, 50.0, 41.0, 33.0, 37.0, 41.0, 26.0, 21.0, 18.0, 25.0, 20.0, 12.0, 10.0, 5.0, 8.0, 11.0, 5.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-82.3473129272461, -80.09688568115234, -77.8464584350586, -75.59603118896484, -73.3456039428711, -71.09517669677734, -68.8447494506836, -66.59432220458984, -64.3438949584961, -62.093467712402344, -59.843040466308594, -57.592613220214844, -55.342185974121094, -53.091758728027344, -50.841331481933594, -48.590904235839844, -46.340476989746094, -44.090049743652344, -41.839622497558594, -39.589195251464844, -37.338768005371094, -35.088340759277344, -32.837913513183594, -30.587486267089844, -28.337059020996094, -26.086631774902344, -23.836204528808594, -21.585777282714844, -19.335350036621094, -17.084922790527344, -14.834495544433594, -12.584068298339844, -10.333633422851562, -8.083206176757812, -5.8327789306640625, -3.5823516845703125, -1.3319244384765625, 0.9185028076171875, 3.1689300537109375, 5.4193572998046875, 7.6697845458984375, 9.920211791992188, 12.170639038085938, 14.421066284179688, 16.671493530273438, 18.921920776367188, 21.172348022460938, 23.422775268554688, 25.673202514648438, 27.923629760742188, 30.174057006835938, 32.42448425292969, 34.67491149902344, 36.92533874511719, 39.17576599121094, 41.42619323730469, 43.67662048339844, 45.92704772949219, 48.17747497558594, 50.42790222167969, 52.67832946777344, 54.92875671386719, 57.17918395996094, 59.42961120605469, 61.68003845214844]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 3.0, 4.0, 10.0, 10.0, 17.0, 17.0, 18.0, 20.0, 24.0, 25.0, 28.0, 28.0, 38.0, 35.0, 42.0, 40.0, 48.0, 44.0, 44.0, 32.0, 46.0, 29.0, 56.0, 50.0, 36.0, 34.0, 20.0, 31.0, 23.0, 30.0, 21.0, 23.0, 18.0, 13.0, 5.0, 5.0, 8.0, 8.0, 5.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.5596923828125, -5.338134765625, -5.1165771484375, -4.89501953125, -4.6734619140625, -4.451904296875, -4.2303466796875, -4.0087890625, -3.7872314453125, -3.565673828125, -3.3441162109375, -3.12255859375, -2.9010009765625, -2.679443359375, -2.4578857421875, -2.236328125, -2.0147705078125, -1.793212890625, -1.5716552734375, -1.35009765625, -1.1285400390625, -0.906982421875, -0.6854248046875, -0.4638671875, -0.2423095703125, -0.020751953125, 0.2008056640625, 0.42236328125, 0.6439208984375, 0.865478515625, 1.0870361328125, 1.30859375, 1.5301513671875, 1.751708984375, 1.9732666015625, 2.19482421875, 2.4163818359375, 2.637939453125, 2.8594970703125, 3.0810546875, 3.3026123046875, 3.524169921875, 3.7457275390625, 3.96728515625, 4.1888427734375, 4.410400390625, 4.6319580078125, 4.853515625, 5.0750732421875, 5.296630859375, 5.5181884765625, 5.73974609375, 5.9613037109375, 6.182861328125, 6.4044189453125, 6.6259765625, 6.8475341796875, 7.069091796875, 7.2906494140625, 7.51220703125, 7.7337646484375, 7.955322265625, 8.1768798828125, 8.3984375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 8.0, 9.0, 20.0, 22.0, 31.0, 47.0, 78.0, 130.0, 225.0, 356.0, 589.0, 880.0, 1503.0, 2779.0, 5263.0, 10536.0, 24812.0, 99702.0, 1420023.0, 2400444.0, 168360.0, 31679.0, 12818.0, 5996.0, 3262.0, 1812.0, 1045.0, 649.0, 428.0, 277.0, 154.0, 128.0, 68.0, 39.0, 37.0, 25.0, 17.0, 13.0, 12.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.53125, -16.94921875, -16.3671875, -15.78515625, -15.203125, -14.62109375, -14.0390625, -13.45703125, -12.875, -12.29296875, -11.7109375, -11.12890625, -10.546875, -9.96484375, -9.3828125, -8.80078125, -8.21875, -7.63671875, -7.0546875, -6.47265625, -5.890625, -5.30859375, -4.7265625, -4.14453125, -3.5625, -2.98046875, -2.3984375, -1.81640625, -1.234375, -0.65234375, -0.0703125, 0.51171875, 1.09375, 1.67578125, 2.2578125, 2.83984375, 3.421875, 4.00390625, 4.5859375, 5.16796875, 5.75, 6.33203125, 6.9140625, 7.49609375, 8.078125, 8.66015625, 9.2421875, 9.82421875, 10.40625, 10.98828125, 11.5703125, 12.15234375, 12.734375, 13.31640625, 13.8984375, 14.48046875, 15.0625, 15.64453125, 16.2265625, 16.80859375, 17.390625, 17.97265625, 18.5546875, 19.13671875, 19.71875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 10.0, 7.0, 14.0, 17.0, 23.0, 29.0, 46.0, 51.0, 79.0, 117.0, 199.0, 400.0, 758.0, 955.0, 607.0, 321.0, 160.0, 76.0, 58.0, 39.0, 26.0, 22.0, 14.0, 8.0, 6.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.4375, -24.77294921875, -24.1083984375, -23.44384765625, -22.779296875, -22.11474609375, -21.4501953125, -20.78564453125, -20.12109375, -19.45654296875, -18.7919921875, -18.12744140625, -17.462890625, -16.79833984375, -16.1337890625, -15.46923828125, -14.8046875, -14.14013671875, -13.4755859375, -12.81103515625, -12.146484375, -11.48193359375, -10.8173828125, -10.15283203125, -9.48828125, -8.82373046875, -8.1591796875, -7.49462890625, -6.830078125, -6.16552734375, -5.5009765625, -4.83642578125, -4.171875, -3.50732421875, -2.8427734375, -2.17822265625, -1.513671875, -0.84912109375, -0.1845703125, 0.47998046875, 1.14453125, 1.80908203125, 2.4736328125, 3.13818359375, 3.802734375, 4.46728515625, 5.1318359375, 5.79638671875, 6.4609375, 7.12548828125, 7.7900390625, 8.45458984375, 9.119140625, 9.78369140625, 10.4482421875, 11.11279296875, 11.77734375, 12.44189453125, 13.1064453125, 13.77099609375, 14.435546875, 15.10009765625, 15.7646484375, 16.42919921875, 17.09375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 7.0, 8.0, 13.0, 24.0, 51.0, 63.0, 102.0, 207.0, 410.0, 799.0, 1648.0, 4178.0, 11848.0, 43938.0, 390650.0, 3479054.0, 213698.0, 31976.0, 9238.0, 3351.0, 1480.0, 717.0, 358.0, 197.0, 97.0, 68.0, 34.0, 22.0, 13.0, 10.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.0, -26.97802734375, -25.9560546875, -24.93408203125, -23.912109375, -22.89013671875, -21.8681640625, -20.84619140625, -19.82421875, -18.80224609375, -17.7802734375, -16.75830078125, -15.736328125, -14.71435546875, -13.6923828125, -12.67041015625, -11.6484375, -10.62646484375, -9.6044921875, -8.58251953125, -7.560546875, -6.53857421875, -5.5166015625, -4.49462890625, -3.47265625, -2.45068359375, -1.4287109375, -0.40673828125, 0.615234375, 1.63720703125, 2.6591796875, 3.68115234375, 4.703125, 5.72509765625, 6.7470703125, 7.76904296875, 8.791015625, 9.81298828125, 10.8349609375, 11.85693359375, 12.87890625, 13.90087890625, 14.9228515625, 15.94482421875, 16.966796875, 17.98876953125, 19.0107421875, 20.03271484375, 21.0546875, 22.07666015625, 23.0986328125, 24.12060546875, 25.142578125, 26.16455078125, 27.1865234375, 28.20849609375, 29.23046875, 30.25244140625, 31.2744140625, 32.29638671875, 33.318359375, 34.34033203125, 35.3623046875, 36.38427734375, 37.40625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 13.0, 15.0, 41.0, 42.0, 93.0, 173.0, 218.0, 183.0, 100.0, 61.0, 32.0, 18.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.308170318603516, -54.06150436401367, -49.814842224121094, -45.56817626953125, -41.321510314941406, -37.07484817504883, -32.828182220458984, -28.581518173217773, -24.334854125976562, -20.08819007873535, -15.841525077819824, -11.594860076904297, -7.348196029663086, -3.101531982421875, 1.1451339721679688, 5.39179801940918, 9.63846206665039, 13.885126113891602, 18.131790161132812, 22.378456115722656, 26.625120162963867, 30.871784210205078, 35.11845016479492, 39.3651123046875, 43.611778259277344, 47.85844421386719, 52.105106353759766, 56.35177230834961, 60.59843444824219, 64.84510040283203, 69.09176635742188, 73.33843231201172, 77.5850830078125, 81.83174896240234, 86.07841491699219, 90.3250732421875, 94.57173919677734, 98.81840515136719, 103.06507110595703, 107.31173706054688, 111.55839538574219, 115.80506134033203, 120.05172729492188, 124.29838562011719, 128.54505920410156, 132.79171752929688, 137.03839111328125, 141.28504943847656, 145.53170776367188, 149.7783660888672, 154.02503967285156, 158.27169799804688, 162.51837158203125, 166.76502990722656, 171.01168823242188, 175.25836181640625, 179.50503540039062, 183.75169372558594, 187.9983673095703, 192.24502563476562, 196.49169921875, 200.7383575439453, 204.98501586914062, 209.231689453125, 213.4783477783203]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 3.0, 6.0, 6.0, 15.0, 8.0, 18.0, 17.0, 12.0, 16.0, 24.0, 22.0, 23.0, 39.0, 44.0, 38.0, 34.0, 29.0, 35.0, 48.0, 40.0, 51.0, 38.0, 36.0, 39.0, 34.0, 35.0, 34.0, 35.0, 26.0, 23.0, 17.0, 20.0, 22.0, 30.0, 11.0, 15.0, 10.0, 10.0, 12.0, 4.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.37556076049805, -50.801177978515625, -49.2267951965332, -47.65241241455078, -46.078033447265625, -44.5036506652832, -42.92926788330078, -41.35488510131836, -39.78050231933594, -38.206119537353516, -36.631736755371094, -35.05735397338867, -33.48297119140625, -31.90859031677246, -30.334209442138672, -28.75982666015625, -27.185443878173828, -25.611061096191406, -24.036678314208984, -22.462297439575195, -20.887914657592773, -19.31353187561035, -17.739151000976562, -16.16476821899414, -14.590385437011719, -13.016002655029297, -11.441620826721191, -9.867238998413086, -8.292856216430664, -6.7184739112854, -5.144091606140137, -3.5697097778320312, -1.9953269958496094, -0.4209446907043457, 1.153437614440918, 2.7278199195861816, 4.302202224731445, 5.876584529876709, 7.450966835021973, 9.025348663330078, 10.5997314453125, 12.174114227294922, 13.748496055603027, 15.322877883911133, 16.897260665893555, 18.471643447875977, 20.046024322509766, 21.620407104492188, 23.19478988647461, 24.76917266845703, 26.343555450439453, 27.917936325073242, 29.492319107055664, 31.066701889038086, 32.641082763671875, 34.2154655456543, 35.78984832763672, 37.36423110961914, 38.93861389160156, 40.512996673583984, 42.087379455566406, 43.66175842285156, 45.236141204833984, 46.810523986816406, 48.38490676879883]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 3.0, 7.0, 10.0, 8.0, 11.0, 9.0, 17.0, 21.0, 23.0, 31.0, 29.0, 35.0, 30.0, 39.0, 35.0, 28.0, 34.0, 48.0, 57.0, 37.0, 32.0, 34.0, 42.0, 38.0, 40.0, 41.0, 26.0, 31.0, 28.0, 26.0, 21.0, 18.0, 22.0, 15.0, 14.0, 11.0, 10.0, 8.0, 4.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.53125, -5.333251953125, -5.13525390625, -4.937255859375, -4.7392578125, -4.541259765625, -4.34326171875, -4.145263671875, -3.947265625, -3.749267578125, -3.55126953125, -3.353271484375, -3.1552734375, -2.957275390625, -2.75927734375, -2.561279296875, -2.36328125, -2.165283203125, -1.96728515625, -1.769287109375, -1.5712890625, -1.373291015625, -1.17529296875, -0.977294921875, -0.779296875, -0.581298828125, -0.38330078125, -0.185302734375, 0.0126953125, 0.210693359375, 0.40869140625, 0.606689453125, 0.8046875, 1.002685546875, 1.20068359375, 1.398681640625, 1.5966796875, 1.794677734375, 1.99267578125, 2.190673828125, 2.388671875, 2.586669921875, 2.78466796875, 2.982666015625, 3.1806640625, 3.378662109375, 3.57666015625, 3.774658203125, 3.97265625, 4.170654296875, 4.36865234375, 4.566650390625, 4.7646484375, 4.962646484375, 5.16064453125, 5.358642578125, 5.556640625, 5.754638671875, 5.95263671875, 6.150634765625, 6.3486328125, 6.546630859375, 6.74462890625, 6.942626953125, 7.140625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 10.0, 17.0, 17.0, 22.0, 33.0, 42.0, 67.0, 86.0, 126.0, 174.0, 274.0, 464.0, 716.0, 1157.0, 1973.0, 3882.0, 7820.0, 16549.0, 36443.0, 86278.0, 220071.0, 377060.0, 170295.0, 67986.0, 29413.0, 13250.0, 6460.0, 3313.0, 1750.0, 992.0, 621.0, 375.0, 248.0, 166.0, 108.0, 87.0, 59.0, 55.0, 24.0, 14.0, 9.0, 11.0, 5.0, 10.0, 5.0, 4.0, 3.0, 0.0, 3.0, 4.0, 3.0], "bins": [-3.232421875, -3.13836669921875, -3.0443115234375, -2.95025634765625, -2.856201171875, -2.76214599609375, -2.6680908203125, -2.57403564453125, -2.47998046875, -2.38592529296875, -2.2918701171875, -2.19781494140625, -2.103759765625, -2.00970458984375, -1.9156494140625, -1.82159423828125, -1.7275390625, -1.63348388671875, -1.5394287109375, -1.44537353515625, -1.351318359375, -1.25726318359375, -1.1632080078125, -1.06915283203125, -0.97509765625, -0.88104248046875, -0.7869873046875, -0.69293212890625, -0.598876953125, -0.50482177734375, -0.4107666015625, -0.31671142578125, -0.22265625, -0.12860107421875, -0.0345458984375, 0.05950927734375, 0.153564453125, 0.24761962890625, 0.3416748046875, 0.43572998046875, 0.52978515625, 0.62384033203125, 0.7178955078125, 0.81195068359375, 0.906005859375, 1.00006103515625, 1.0941162109375, 1.18817138671875, 1.2822265625, 1.37628173828125, 1.4703369140625, 1.56439208984375, 1.658447265625, 1.75250244140625, 1.8465576171875, 1.94061279296875, 2.03466796875, 2.12872314453125, 2.2227783203125, 2.31683349609375, 2.410888671875, 2.50494384765625, 2.5989990234375, 2.69305419921875, 2.787109375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 14.0, 5.0, 11.0, 10.0, 11.0, 12.0, 21.0, 18.0, 21.0, 26.0, 23.0, 23.0, 29.0, 31.0, 39.0, 30.0, 37.0, 38.0, 41.0, 1077.0, 51.0, 42.0, 41.0, 33.0, 44.0, 43.0, 31.0, 27.0, 26.0, 31.0, 25.0, 23.0, 13.0, 12.0, 15.0, 10.0, 11.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55078125, -4.4029541015625, -4.255126953125, -4.1072998046875, -3.95947265625, -3.8116455078125, -3.663818359375, -3.5159912109375, -3.3681640625, -3.2203369140625, -3.072509765625, -2.9246826171875, -2.77685546875, -2.6290283203125, -2.481201171875, -2.3333740234375, -2.185546875, -2.0377197265625, -1.889892578125, -1.7420654296875, -1.59423828125, -1.4464111328125, -1.298583984375, -1.1507568359375, -1.0029296875, -0.8551025390625, -0.707275390625, -0.5594482421875, -0.41162109375, -0.2637939453125, -0.115966796875, 0.0318603515625, 0.1796875, 0.3275146484375, 0.475341796875, 0.6231689453125, 0.77099609375, 0.9188232421875, 1.066650390625, 1.2144775390625, 1.3623046875, 1.5101318359375, 1.657958984375, 1.8057861328125, 1.95361328125, 2.1014404296875, 2.249267578125, 2.3970947265625, 2.544921875, 2.6927490234375, 2.840576171875, 2.9884033203125, 3.13623046875, 3.2840576171875, 3.431884765625, 3.5797119140625, 3.7275390625, 3.8753662109375, 4.023193359375, 4.1710205078125, 4.31884765625, 4.4666748046875, 4.614501953125, 4.7623291015625, 4.91015625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 6.0, 4.0, 5.0, 11.0, 13.0, 16.0, 24.0, 34.0, 50.0, 78.0, 144.0, 230.0, 335.0, 566.0, 956.0, 1815.0, 3430.0, 6937.0, 15399.0, 37702.0, 107564.0, 466267.0, 1155059.0, 197542.0, 59808.0, 22999.0, 9763.0, 4736.0, 2410.0, 1321.0, 721.0, 425.0, 284.0, 160.0, 137.0, 48.0, 45.0, 31.0, 13.0, 19.0, 8.0, 6.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9990234375, -1.938873291015625, -1.87872314453125, -1.818572998046875, -1.7584228515625, -1.698272705078125, -1.63812255859375, -1.577972412109375, -1.517822265625, -1.457672119140625, -1.39752197265625, -1.337371826171875, -1.2772216796875, -1.217071533203125, -1.15692138671875, -1.096771240234375, -1.03662109375, -0.976470947265625, -0.91632080078125, -0.856170654296875, -0.7960205078125, -0.735870361328125, -0.67572021484375, -0.615570068359375, -0.555419921875, -0.495269775390625, -0.43511962890625, -0.374969482421875, -0.3148193359375, -0.254669189453125, -0.19451904296875, -0.134368896484375, -0.07421875, -0.014068603515625, 0.04608154296875, 0.106231689453125, 0.1663818359375, 0.226531982421875, 0.28668212890625, 0.346832275390625, 0.406982421875, 0.467132568359375, 0.52728271484375, 0.587432861328125, 0.6475830078125, 0.707733154296875, 0.76788330078125, 0.828033447265625, 0.88818359375, 0.948333740234375, 1.00848388671875, 1.068634033203125, 1.1287841796875, 1.188934326171875, 1.24908447265625, 1.309234619140625, 1.369384765625, 1.429534912109375, 1.48968505859375, 1.549835205078125, 1.6099853515625, 1.670135498046875, 1.73028564453125, 1.790435791015625, 1.8505859375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 5.0, 3.0, 2.0, 8.0, 5.0, 10.0, 15.0, 12.0, 14.0, 15.0, 23.0, 31.0, 39.0, 45.0, 76.0, 106.0, 116.0, 109.0, 80.0, 49.0, 44.0, 29.0, 22.0, 29.0, 28.0, 16.0, 11.0, 16.0, 11.0, 10.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363525390625, -0.3499259948730469, -0.33632659912109375, -0.3227272033691406, -0.3091278076171875, -0.2955284118652344, -0.28192901611328125, -0.2683296203613281, -0.254730224609375, -0.24113082885742188, -0.22753143310546875, -0.21393203735351562, -0.2003326416015625, -0.18673324584960938, -0.17313385009765625, -0.15953445434570312, -0.14593505859375, -0.13233566284179688, -0.11873626708984375, -0.10513687133789062, -0.0915374755859375, -0.07793807983398438, -0.06433868408203125, -0.050739288330078125, -0.037139892578125, -0.023540496826171875, -0.00994110107421875, 0.003658294677734375, 0.0172576904296875, 0.030857086181640625, 0.04445648193359375, 0.058055877685546875, 0.0716552734375, 0.08525466918945312, 0.09885406494140625, 0.11245346069335938, 0.1260528564453125, 0.13965225219726562, 0.15325164794921875, 0.16685104370117188, 0.180450439453125, 0.19404983520507812, 0.20764923095703125, 0.22124862670898438, 0.2348480224609375, 0.24844741821289062, 0.26204681396484375, 0.2756462097167969, 0.28924560546875, 0.3028450012207031, 0.31644439697265625, 0.3300437927246094, 0.3436431884765625, 0.3572425842285156, 0.37084197998046875, 0.3844413757324219, 0.398040771484375, 0.4116401672363281, 0.42523956298828125, 0.4388389587402344, 0.4524383544921875, 0.4660377502441406, 0.47963714599609375, 0.4932365417480469, 0.5068359375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 3.0, 5.0, 12.0, 9.0, 10.0, 19.0, 24.0, 32.0, 25.0, 42.0, 81.0, 93.0, 147.0, 384.0, 2346.0, 54540.0, 963466.0, 25013.0, 1549.0, 302.0, 135.0, 79.0, 62.0, 42.0, 30.0, 21.0, 24.0, 14.0, 12.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.984375, -8.744140625, -8.50390625, -8.263671875, -8.0234375, -7.783203125, -7.54296875, -7.302734375, -7.0625, -6.822265625, -6.58203125, -6.341796875, -6.1015625, -5.861328125, -5.62109375, -5.380859375, -5.140625, -4.900390625, -4.66015625, -4.419921875, -4.1796875, -3.939453125, -3.69921875, -3.458984375, -3.21875, -2.978515625, -2.73828125, -2.498046875, -2.2578125, -2.017578125, -1.77734375, -1.537109375, -1.296875, -1.056640625, -0.81640625, -0.576171875, -0.3359375, -0.095703125, 0.14453125, 0.384765625, 0.625, 0.865234375, 1.10546875, 1.345703125, 1.5859375, 1.826171875, 2.06640625, 2.306640625, 2.546875, 2.787109375, 3.02734375, 3.267578125, 3.5078125, 3.748046875, 3.98828125, 4.228515625, 4.46875, 4.708984375, 4.94921875, 5.189453125, 5.4296875, 5.669921875, 5.91015625, 6.150390625, 6.390625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 23.0, 31.0, 46.0, 93.0, 106.0, 142.0, 142.0, 136.0, 122.0, 67.0, 44.0, 24.0, 7.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5879830121994019, -1.5536115169525146, -1.519239902496338, -1.4848684072494507, -1.4504969120025635, -1.4161254167556763, -1.3817538022994995, -1.3473823070526123, -1.313010811805725, -1.278639316558838, -1.2442677021026611, -1.209896206855774, -1.1755247116088867, -1.1411532163619995, -1.1067816019058228, -1.0724101066589355, -1.0380384922027588, -1.0036669969558716, -0.9692954421043396, -0.9349238872528076, -0.9005523920059204, -0.8661808371543884, -0.8318092823028564, -0.7974377870559692, -0.763066291809082, -0.72869473695755, -0.6943232417106628, -0.6599516868591309, -0.6255801916122437, -0.5912086367607117, -0.5568370819091797, -0.5224655866622925, -0.4880940318107605, -0.4537225067615509, -0.4193509817123413, -0.3849794268608093, -0.3506079316139221, -0.31623637676239014, -0.28186485171318054, -0.24749332666397095, -0.21312180161476135, -0.17875027656555176, -0.14437875151634216, -0.11000721156597137, -0.07563568651676178, -0.041264161467552185, -0.0068926215171813965, 0.027478903532028198, 0.06185042858123779, 0.09622195363044739, 0.13059347867965698, 0.16496501863002777, 0.19933654367923737, 0.23370806872844696, 0.26807960867881775, 0.30245113372802734, 0.33682265877723694, 0.37119418382644653, 0.40556570887565613, 0.4399372339248657, 0.4743087887763977, 0.5086802840232849, 0.5430518388748169, 0.5774233341217041, 0.6117948889732361]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 2.0, 8.0, 3.0, 10.0, 8.0, 8.0, 16.0, 16.0, 15.0, 20.0, 32.0, 42.0, 35.0, 39.0, 30.0, 38.0, 40.0, 42.0, 48.0, 44.0, 43.0, 38.0, 42.0, 49.0, 33.0, 38.0, 29.0, 25.0, 36.0, 26.0, 20.0, 21.0, 18.0, 21.0, 16.0, 9.0, 7.0, 5.0, 9.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.4755464196205139, -0.4611012041568756, -0.4466559588909149, -0.4322107434272766, -0.4177654981613159, -0.4033202826976776, -0.3888750374317169, -0.3744298219680786, -0.3599845767021179, -0.3455393612384796, -0.3310941159725189, -0.3166489005088806, -0.3022036552429199, -0.2877584397792816, -0.2733131945133209, -0.2588679790496826, -0.24442274868488312, -0.22997751832008362, -0.21553228795528412, -0.20108705759048462, -0.18664182722568512, -0.17219659686088562, -0.15775138139724731, -0.14330613613128662, -0.12886092066764832, -0.11441569030284882, -0.09997045993804932, -0.08552522957324982, -0.07107999920845032, -0.056634776294231415, -0.042189545929431915, -0.027744315564632416, -0.01329907774925232, 0.0011461516842246056, 0.01559138111770153, 0.03003660961985588, 0.04448183998465538, 0.05892706662416458, 0.07337229698896408, 0.08781752735376358, 0.10226275771856308, 0.11670798808336258, 0.13115321099758148, 0.14559844136238098, 0.16004367172718048, 0.17448890209197998, 0.18893413245677948, 0.20337936282157898, 0.21782459318637848, 0.23226982355117798, 0.24671505391597748, 0.261160284280777, 0.2756054997444153, 0.290050745010376, 0.3044959604740143, 0.318941205739975, 0.3333864212036133, 0.3478316366672516, 0.3622768819332123, 0.3767220973968506, 0.3911673426628113, 0.4056125581264496, 0.4200578033924103, 0.4345030188560486, 0.4489482641220093]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 4.0, 10.0, 9.0, 13.0, 17.0, 18.0, 23.0, 23.0, 22.0, 28.0, 22.0, 36.0, 30.0, 36.0, 43.0, 39.0, 54.0, 32.0, 33.0, 43.0, 37.0, 32.0, 28.0, 44.0, 33.0, 39.0, 20.0, 24.0, 22.0, 24.0, 17.0, 22.0, 28.0, 12.0, 10.0, 12.0, 9.0, 4.0, 9.0, 4.0, 2.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.796875, -5.61517333984375, -5.4334716796875, -5.25177001953125, -5.070068359375, -4.88836669921875, -4.7066650390625, -4.52496337890625, -4.34326171875, -4.16156005859375, -3.9798583984375, -3.79815673828125, -3.616455078125, -3.43475341796875, -3.2530517578125, -3.07135009765625, -2.8896484375, -2.70794677734375, -2.5262451171875, -2.34454345703125, -2.162841796875, -1.98114013671875, -1.7994384765625, -1.61773681640625, -1.43603515625, -1.25433349609375, -1.0726318359375, -0.89093017578125, -0.709228515625, -0.52752685546875, -0.3458251953125, -0.16412353515625, 0.017578125, 0.19927978515625, 0.3809814453125, 0.56268310546875, 0.744384765625, 0.92608642578125, 1.1077880859375, 1.28948974609375, 1.47119140625, 1.65289306640625, 1.8345947265625, 2.01629638671875, 2.197998046875, 2.37969970703125, 2.5614013671875, 2.74310302734375, 2.9248046875, 3.10650634765625, 3.2882080078125, 3.46990966796875, 3.651611328125, 3.83331298828125, 4.0150146484375, 4.19671630859375, 4.37841796875, 4.56011962890625, 4.7418212890625, 4.92352294921875, 5.105224609375, 5.28692626953125, 5.4686279296875, 5.65032958984375, 5.83203125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 10.0, 19.0, 22.0, 22.0, 31.0, 56.0, 78.0, 93.0, 142.0, 203.0, 269.0, 439.0, 567.0, 867.0, 1256.0, 1872.0, 3107.0, 5146.0, 9110.0, 17620.0, 38216.0, 101701.0, 389909.0, 318155.0, 88448.0, 33627.0, 15836.0, 8300.0, 4855.0, 2853.0, 1866.0, 1203.0, 813.0, 524.0, 384.0, 270.0, 190.0, 143.0, 93.0, 71.0, 43.0, 37.0, 26.0, 22.0, 10.0, 10.0, 2.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0], "bins": [-12.9140625, -12.5096435546875, -12.105224609375, -11.7008056640625, -11.29638671875, -10.8919677734375, -10.487548828125, -10.0831298828125, -9.6787109375, -9.2742919921875, -8.869873046875, -8.4654541015625, -8.06103515625, -7.6566162109375, -7.252197265625, -6.8477783203125, -6.443359375, -6.0389404296875, -5.634521484375, -5.2301025390625, -4.82568359375, -4.4212646484375, -4.016845703125, -3.6124267578125, -3.2080078125, -2.8035888671875, -2.399169921875, -1.9947509765625, -1.59033203125, -1.1859130859375, -0.781494140625, -0.3770751953125, 0.02734375, 0.4317626953125, 0.836181640625, 1.2406005859375, 1.64501953125, 2.0494384765625, 2.453857421875, 2.8582763671875, 3.2626953125, 3.6671142578125, 4.071533203125, 4.4759521484375, 4.88037109375, 5.2847900390625, 5.689208984375, 6.0936279296875, 6.498046875, 6.9024658203125, 7.306884765625, 7.7113037109375, 8.11572265625, 8.5201416015625, 8.924560546875, 9.3289794921875, 9.7333984375, 10.1378173828125, 10.542236328125, 10.9466552734375, 11.35107421875, 11.7554931640625, 12.159912109375, 12.5643310546875, 12.96875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 6.0, 6.0, 8.0, 10.0, 7.0, 12.0, 10.0, 26.0, 14.0, 19.0, 29.0, 24.0, 45.0, 42.0, 56.0, 74.0, 87.0, 143.0, 267.0, 1393.0, 182.0, 105.0, 87.0, 73.0, 55.0, 45.0, 22.0, 28.0, 30.0, 23.0, 21.0, 17.0, 17.0, 9.0, 16.0, 7.0, 11.0, 3.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.953125, -20.282958984375, -19.61279296875, -18.942626953125, -18.2724609375, -17.602294921875, -16.93212890625, -16.261962890625, -15.591796875, -14.921630859375, -14.25146484375, -13.581298828125, -12.9111328125, -12.240966796875, -11.57080078125, -10.900634765625, -10.23046875, -9.560302734375, -8.89013671875, -8.219970703125, -7.5498046875, -6.879638671875, -6.20947265625, -5.539306640625, -4.869140625, -4.198974609375, -3.52880859375, -2.858642578125, -2.1884765625, -1.518310546875, -0.84814453125, -0.177978515625, 0.4921875, 1.162353515625, 1.83251953125, 2.502685546875, 3.1728515625, 3.843017578125, 4.51318359375, 5.183349609375, 5.853515625, 6.523681640625, 7.19384765625, 7.864013671875, 8.5341796875, 9.204345703125, 9.87451171875, 10.544677734375, 11.21484375, 11.885009765625, 12.55517578125, 13.225341796875, 13.8955078125, 14.565673828125, 15.23583984375, 15.906005859375, 16.576171875, 17.246337890625, 17.91650390625, 18.586669921875, 19.2568359375, 19.927001953125, 20.59716796875, 21.267333984375, 21.9375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 0.0, 6.0, 4.0, 5.0, 6.0, 9.0, 15.0, 16.0, 12.0, 22.0, 27.0, 34.0, 59.0, 70.0, 81.0, 136.0, 149.0, 276.0, 661.0, 2150.0, 12782.0, 446796.0, 2647053.0, 29774.0, 3549.0, 945.0, 376.0, 195.0, 119.0, 91.0, 64.0, 58.0, 32.0, 29.0, 25.0, 19.0, 18.0, 10.0, 5.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.75, -56.0087890625, -54.267578125, -52.5263671875, -50.78515625, -49.0439453125, -47.302734375, -45.5615234375, -43.8203125, -42.0791015625, -40.337890625, -38.5966796875, -36.85546875, -35.1142578125, -33.373046875, -31.6318359375, -29.890625, -28.1494140625, -26.408203125, -24.6669921875, -22.92578125, -21.1845703125, -19.443359375, -17.7021484375, -15.9609375, -14.2197265625, -12.478515625, -10.7373046875, -8.99609375, -7.2548828125, -5.513671875, -3.7724609375, -2.03125, -0.2900390625, 1.451171875, 3.1923828125, 4.93359375, 6.6748046875, 8.416015625, 10.1572265625, 11.8984375, 13.6396484375, 15.380859375, 17.1220703125, 18.86328125, 20.6044921875, 22.345703125, 24.0869140625, 25.828125, 27.5693359375, 29.310546875, 31.0517578125, 32.79296875, 34.5341796875, 36.275390625, 38.0166015625, 39.7578125, 41.4990234375, 43.240234375, 44.9814453125, 46.72265625, 48.4638671875, 50.205078125, 51.9462890625, 53.6875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 45.0, 839.0, 132.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.889549255371094, -43.596412658691406, -27.303272247314453, -11.0101318359375, 5.2830047607421875, 21.576141357421875, 37.869285583496094, 54.16242218017578, 70.45555877685547, 86.74869537353516, 103.04183959960938, 119.33497619628906, 135.62811279296875, 151.92124938964844, 168.21438598632812, 184.50753784179688, 200.8006591796875, 217.0937957763672, 233.38693237304688, 249.68008422851562, 265.97320556640625, 282.266357421875, 298.55950927734375, 314.8526306152344, 331.1457824707031, 347.4389343261719, 363.7320556640625, 380.02520751953125, 396.3183288574219, 412.6114807128906, 428.90460205078125, 445.19775390625, 461.49090576171875, 477.7840576171875, 494.0771789550781, 510.3703308105469, 526.6634521484375, 542.9566040039062, 559.249755859375, 575.5428466796875, 591.8359985351562, 608.129150390625, 624.4223022460938, 640.7153930664062, 657.008544921875, 673.3016967773438, 689.5948486328125, 705.887939453125, 722.18115234375, 738.4743041992188, 754.7674560546875, 771.060546875, 787.3536987304688, 803.6468505859375, 819.9400024414062, 836.233154296875, 852.5262451171875, 868.8193969726562, 885.112548828125, 901.4056396484375, 917.6987915039062, 933.991943359375, 950.2850952148438, 966.5782470703125, 982.871337890625]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 9.0, 11.0, 18.0, 18.0, 25.0, 19.0, 27.0, 31.0, 35.0, 43.0, 42.0, 55.0, 53.0, 64.0, 54.0, 47.0, 38.0, 46.0, 47.0, 52.0, 34.0, 37.0, 35.0, 22.0, 30.0, 22.0, 17.0, 12.0, 15.0, 19.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.81705474853516, -89.38529205322266, -86.95352935791016, -84.52176666259766, -82.09000396728516, -79.65824127197266, -77.22647857666016, -74.79470825195312, -72.36294555664062, -69.93118286132812, -67.49942016601562, -65.06765747070312, -62.635894775390625, -60.204132080078125, -57.77236557006836, -55.34060287475586, -52.908843994140625, -50.477081298828125, -48.045318603515625, -45.613555908203125, -43.181793212890625, -40.750030517578125, -38.31826400756836, -35.88650131225586, -33.45473861694336, -31.02297592163086, -28.59121322631836, -26.159448623657227, -23.727685928344727, -21.295923233032227, -18.864158630371094, -16.432395935058594, -14.000640869140625, -11.568878173828125, -9.137114524841309, -6.70535135269165, -4.273588180541992, -1.8418254852294922, 0.5899381637573242, 3.0217018127441406, 5.453464508056641, 7.885227680206299, 10.316990852355957, 12.748754501342773, 15.180517196655273, 17.612279891967773, 20.044044494628906, 22.475807189941406, 24.907569885253906, 27.339332580566406, 29.771095275878906, 32.202857971191406, 34.634620666503906, 37.066383361816406, 39.49814987182617, 41.92991256713867, 44.36167526245117, 46.79343795776367, 49.22520065307617, 51.65696334838867, 54.08872985839844, 56.52049255371094, 58.95225524902344, 61.38401794433594, 63.81578063964844]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 7.0, 12.0, 18.0, 12.0, 22.0, 22.0, 23.0, 20.0, 32.0, 18.0, 25.0, 30.0, 41.0, 38.0, 42.0, 37.0, 36.0, 56.0, 45.0, 33.0, 35.0, 30.0, 38.0, 27.0, 40.0, 33.0, 37.0, 20.0, 20.0, 17.0, 14.0, 19.0, 19.0, 14.0, 11.0, 11.0, 10.0, 4.0, 7.0, 0.0, 2.0, 2.0, 1.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-6.9140625, -6.70556640625, -6.4970703125, -6.28857421875, -6.080078125, -5.87158203125, -5.6630859375, -5.45458984375, -5.24609375, -5.03759765625, -4.8291015625, -4.62060546875, -4.412109375, -4.20361328125, -3.9951171875, -3.78662109375, -3.578125, -3.36962890625, -3.1611328125, -2.95263671875, -2.744140625, -2.53564453125, -2.3271484375, -2.11865234375, -1.91015625, -1.70166015625, -1.4931640625, -1.28466796875, -1.076171875, -0.86767578125, -0.6591796875, -0.45068359375, -0.2421875, -0.03369140625, 0.1748046875, 0.38330078125, 0.591796875, 0.80029296875, 1.0087890625, 1.21728515625, 1.42578125, 1.63427734375, 1.8427734375, 2.05126953125, 2.259765625, 2.46826171875, 2.6767578125, 2.88525390625, 3.09375, 3.30224609375, 3.5107421875, 3.71923828125, 3.927734375, 4.13623046875, 4.3447265625, 4.55322265625, 4.76171875, 4.97021484375, 5.1787109375, 5.38720703125, 5.595703125, 5.80419921875, 6.0126953125, 6.22119140625, 6.4296875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 7.0, 5.0, 7.0, 1.0, 5.0, 10.0, 7.0, 15.0, 16.0, 16.0, 29.0, 40.0, 50.0, 89.0, 135.0, 276.0, 464.0, 948.0, 1913.0, 4384.0, 10871.0, 35451.0, 275703.0, 2865015.0, 899636.0, 69266.0, 17705.0, 6523.0, 2764.0, 1316.0, 731.0, 321.0, 187.0, 128.0, 58.0, 56.0, 40.0, 24.0, 17.0, 10.0, 5.0, 9.0, 12.0, 4.0, 2.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-19.890625, -19.300537109375, -18.71044921875, -18.120361328125, -17.5302734375, -16.940185546875, -16.35009765625, -15.760009765625, -15.169921875, -14.579833984375, -13.98974609375, -13.399658203125, -12.8095703125, -12.219482421875, -11.62939453125, -11.039306640625, -10.44921875, -9.859130859375, -9.26904296875, -8.678955078125, -8.0888671875, -7.498779296875, -6.90869140625, -6.318603515625, -5.728515625, -5.138427734375, -4.54833984375, -3.958251953125, -3.3681640625, -2.778076171875, -2.18798828125, -1.597900390625, -1.0078125, -0.417724609375, 0.17236328125, 0.762451171875, 1.3525390625, 1.942626953125, 2.53271484375, 3.122802734375, 3.712890625, 4.302978515625, 4.89306640625, 5.483154296875, 6.0732421875, 6.663330078125, 7.25341796875, 7.843505859375, 8.43359375, 9.023681640625, 9.61376953125, 10.203857421875, 10.7939453125, 11.384033203125, 11.97412109375, 12.564208984375, 13.154296875, 13.744384765625, 14.33447265625, 14.924560546875, 15.5146484375, 16.104736328125, 16.69482421875, 17.284912109375, 17.875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 7.0, 7.0, 8.0, 13.0, 10.0, 12.0, 15.0, 17.0, 30.0, 32.0, 55.0, 53.0, 75.0, 118.0, 218.0, 339.0, 460.0, 615.0, 579.0, 434.0, 283.0, 185.0, 120.0, 94.0, 69.0, 48.0, 37.0, 23.0, 19.0, 15.0, 16.0, 6.0, 9.0, 9.0, 11.0, 12.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.828125, -12.397705078125, -11.96728515625, -11.536865234375, -11.1064453125, -10.676025390625, -10.24560546875, -9.815185546875, -9.384765625, -8.954345703125, -8.52392578125, -8.093505859375, -7.6630859375, -7.232666015625, -6.80224609375, -6.371826171875, -5.94140625, -5.510986328125, -5.08056640625, -4.650146484375, -4.2197265625, -3.789306640625, -3.35888671875, -2.928466796875, -2.498046875, -2.067626953125, -1.63720703125, -1.206787109375, -0.7763671875, -0.345947265625, 0.08447265625, 0.514892578125, 0.9453125, 1.375732421875, 1.80615234375, 2.236572265625, 2.6669921875, 3.097412109375, 3.52783203125, 3.958251953125, 4.388671875, 4.819091796875, 5.24951171875, 5.679931640625, 6.1103515625, 6.540771484375, 6.97119140625, 7.401611328125, 7.83203125, 8.262451171875, 8.69287109375, 9.123291015625, 9.5537109375, 9.984130859375, 10.41455078125, 10.844970703125, 11.275390625, 11.705810546875, 12.13623046875, 12.566650390625, 12.9970703125, 13.427490234375, 13.85791015625, 14.288330078125, 14.71875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 11.0, 9.0, 12.0, 17.0, 10.0, 18.0, 30.0, 41.0, 42.0, 102.0, 174.0, 431.0, 1079.0, 4076.0, 19297.0, 188276.0, 3689107.0, 261755.0, 23021.0, 4652.0, 1275.0, 403.0, 162.0, 101.0, 48.0, 35.0, 26.0, 12.0, 14.0, 10.0, 11.0, 8.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-45.46875, -44.2578125, -43.046875, -41.8359375, -40.625, -39.4140625, -38.203125, -36.9921875, -35.78125, -34.5703125, -33.359375, -32.1484375, -30.9375, -29.7265625, -28.515625, -27.3046875, -26.09375, -24.8828125, -23.671875, -22.4609375, -21.25, -20.0390625, -18.828125, -17.6171875, -16.40625, -15.1953125, -13.984375, -12.7734375, -11.5625, -10.3515625, -9.140625, -7.9296875, -6.71875, -5.5078125, -4.296875, -3.0859375, -1.875, -0.6640625, 0.546875, 1.7578125, 2.96875, 4.1796875, 5.390625, 6.6015625, 7.8125, 9.0234375, 10.234375, 11.4453125, 12.65625, 13.8671875, 15.078125, 16.2890625, 17.5, 18.7109375, 19.921875, 21.1328125, 22.34375, 23.5546875, 24.765625, 25.9765625, 27.1875, 28.3984375, 29.609375, 30.8203125, 32.03125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 7.0, 6.0, 12.0, 21.0, 31.0, 49.0, 53.0, 84.0, 119.0, 139.0, 135.0, 128.0, 77.0, 53.0, 30.0, 22.0, 9.0, 12.0, 5.0, 8.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-77.667724609375, -75.27259826660156, -72.87747192382812, -70.48235321044922, -68.08722686767578, -65.69210052490234, -63.296974182128906, -60.90184783935547, -58.5067253112793, -56.11159896850586, -53.71647644042969, -51.32135009765625, -48.92622375488281, -46.53110122680664, -44.1359748840332, -41.74085235595703, -39.345726013183594, -36.950599670410156, -34.555477142333984, -32.16035079956055, -29.765226364135742, -27.370101928710938, -24.9749755859375, -22.579851150512695, -20.18472671508789, -17.789602279663086, -15.394476890563965, -12.999351501464844, -10.604227066040039, -8.209102630615234, -5.813977241516113, -3.418851852416992, -1.0237197875976562, 1.3714051246643066, 3.7665300369262695, 6.161654949188232, 8.556779861450195, 10.951904296875, 13.347029685974121, 15.742155075073242, 18.137279510498047, 20.53240394592285, 22.927528381347656, 25.322654724121094, 27.7177791595459, 30.112903594970703, 32.50802993774414, 34.90315246582031, 37.29827880859375, 39.69340515136719, 42.08852767944336, 44.4836540222168, 46.87877655029297, 49.273902893066406, 51.669029235839844, 54.06415557861328, 56.45927810668945, 58.85440444946289, 61.24952697753906, 63.6446533203125, 66.03977966308594, 68.43490600585938, 70.83002471923828, 73.22515106201172, 75.62027740478516]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 2.0, 8.0, 8.0, 10.0, 8.0, 14.0, 21.0, 18.0, 16.0, 18.0, 21.0, 26.0, 40.0, 22.0, 32.0, 34.0, 41.0, 38.0, 45.0, 29.0, 37.0, 34.0, 45.0, 33.0, 50.0, 53.0, 37.0, 41.0, 32.0, 33.0, 21.0, 22.0, 20.0, 15.0, 16.0, 14.0, 9.0, 10.0, 7.0, 3.0, 4.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-48.651527404785156, -47.16160202026367, -45.67168045043945, -44.18175506591797, -42.69183349609375, -41.201908111572266, -39.71198654174805, -38.22206115722656, -36.732139587402344, -35.24221420288086, -33.75229263305664, -32.262367248535156, -30.772445678710938, -29.282522201538086, -27.792598724365234, -26.30267333984375, -24.8127498626709, -23.322826385498047, -21.832902908325195, -20.342979431152344, -18.853055953979492, -17.36313247680664, -15.873208045959473, -14.383284568786621, -12.89336109161377, -11.403437614440918, -9.913514137268066, -8.423589706420898, -6.933666706085205, -5.4437432289123535, -3.9538192749023438, -2.463895797729492, -0.9739723205566406, 0.5159512758255005, 2.0058748722076416, 3.4957985877990723, 4.985722064971924, 6.475645542144775, 7.965569496154785, 9.455492973327637, 10.945416450500488, 12.43533992767334, 13.925263404846191, 15.41518783569336, 16.90511131286621, 18.395034790039062, 19.884958267211914, 21.374881744384766, 22.864805221557617, 24.35472869873047, 25.84465217590332, 27.334575653076172, 28.824499130249023, 30.314422607421875, 31.80434799194336, 33.29426956176758, 34.78419494628906, 36.27412033081055, 37.764041900634766, 39.25396728515625, 40.74388885498047, 42.23381423950195, 43.72373580932617, 45.213661193847656, 46.703582763671875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 7.0, 8.0, 8.0, 11.0, 18.0, 4.0, 15.0, 11.0, 16.0, 26.0, 29.0, 19.0, 29.0, 39.0, 27.0, 30.0, 35.0, 42.0, 38.0, 32.0, 35.0, 46.0, 37.0, 43.0, 39.0, 29.0, 24.0, 39.0, 26.0, 24.0, 27.0, 19.0, 24.0, 22.0, 18.0, 12.0, 13.0, 9.0, 11.0, 13.0, 6.0, 4.0, 8.0, 6.0, 5.0, 5.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.49609375, -5.3145751953125, -5.133056640625, -4.9515380859375, -4.77001953125, -4.5885009765625, -4.406982421875, -4.2254638671875, -4.0439453125, -3.8624267578125, -3.680908203125, -3.4993896484375, -3.31787109375, -3.1363525390625, -2.954833984375, -2.7733154296875, -2.591796875, -2.4102783203125, -2.228759765625, -2.0472412109375, -1.86572265625, -1.6842041015625, -1.502685546875, -1.3211669921875, -1.1396484375, -0.9581298828125, -0.776611328125, -0.5950927734375, -0.41357421875, -0.2320556640625, -0.050537109375, 0.1309814453125, 0.3125, 0.4940185546875, 0.675537109375, 0.8570556640625, 1.03857421875, 1.2200927734375, 1.401611328125, 1.5831298828125, 1.7646484375, 1.9461669921875, 2.127685546875, 2.3092041015625, 2.49072265625, 2.6722412109375, 2.853759765625, 3.0352783203125, 3.216796875, 3.3983154296875, 3.579833984375, 3.7613525390625, 3.94287109375, 4.1243896484375, 4.305908203125, 4.4874267578125, 4.6689453125, 4.8504638671875, 5.031982421875, 5.2135009765625, 5.39501953125, 5.5765380859375, 5.758056640625, 5.9395751953125, 6.12109375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 11.0, 7.0, 16.0, 10.0, 32.0, 26.0, 44.0, 62.0, 72.0, 126.0, 176.0, 225.0, 318.0, 444.0, 607.0, 880.0, 1225.0, 1835.0, 2850.0, 4612.0, 8142.0, 15195.0, 30945.0, 67939.0, 159938.0, 321866.0, 236967.0, 100762.0, 44620.0, 20954.0, 10815.0, 5890.0, 3458.0, 2293.0, 1555.0, 1026.0, 743.0, 552.0, 361.0, 290.0, 174.0, 129.0, 98.0, 83.0, 49.0, 41.0, 23.0, 21.0, 14.0, 10.0, 11.0, 8.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.833984375, -1.772308349609375, -1.71063232421875, -1.648956298828125, -1.5872802734375, -1.525604248046875, -1.46392822265625, -1.402252197265625, -1.340576171875, -1.278900146484375, -1.21722412109375, -1.155548095703125, -1.0938720703125, -1.032196044921875, -0.97052001953125, -0.908843994140625, -0.84716796875, -0.785491943359375, -0.72381591796875, -0.662139892578125, -0.6004638671875, -0.538787841796875, -0.47711181640625, -0.415435791015625, -0.353759765625, -0.292083740234375, -0.23040771484375, -0.168731689453125, -0.1070556640625, -0.045379638671875, 0.01629638671875, 0.077972412109375, 0.1396484375, 0.201324462890625, 0.26300048828125, 0.324676513671875, 0.3863525390625, 0.448028564453125, 0.50970458984375, 0.571380615234375, 0.633056640625, 0.694732666015625, 0.75640869140625, 0.818084716796875, 0.8797607421875, 0.941436767578125, 1.00311279296875, 1.064788818359375, 1.12646484375, 1.188140869140625, 1.24981689453125, 1.311492919921875, 1.3731689453125, 1.434844970703125, 1.49652099609375, 1.558197021484375, 1.619873046875, 1.681549072265625, 1.74322509765625, 1.804901123046875, 1.8665771484375, 1.928253173828125, 1.98992919921875, 2.051605224609375, 2.11328125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 5.0, 5.0, 8.0, 7.0, 9.0, 16.0, 12.0, 10.0, 19.0, 16.0, 23.0, 22.0, 21.0, 30.0, 34.0, 40.0, 46.0, 41.0, 43.0, 37.0, 28.0, 41.0, 1059.0, 35.0, 39.0, 44.0, 34.0, 34.0, 27.0, 40.0, 42.0, 19.0, 22.0, 21.0, 19.0, 15.0, 11.0, 12.0, 6.0, 10.0, 8.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26953125, -4.1273193359375, -3.985107421875, -3.8428955078125, -3.70068359375, -3.5584716796875, -3.416259765625, -3.2740478515625, -3.1318359375, -2.9896240234375, -2.847412109375, -2.7052001953125, -2.56298828125, -2.4207763671875, -2.278564453125, -2.1363525390625, -1.994140625, -1.8519287109375, -1.709716796875, -1.5675048828125, -1.42529296875, -1.2830810546875, -1.140869140625, -0.9986572265625, -0.8564453125, -0.7142333984375, -0.572021484375, -0.4298095703125, -0.28759765625, -0.1453857421875, -0.003173828125, 0.1390380859375, 0.28125, 0.4234619140625, 0.565673828125, 0.7078857421875, 0.85009765625, 0.9923095703125, 1.134521484375, 1.2767333984375, 1.4189453125, 1.5611572265625, 1.703369140625, 1.8455810546875, 1.98779296875, 2.1300048828125, 2.272216796875, 2.4144287109375, 2.556640625, 2.6988525390625, 2.841064453125, 2.9832763671875, 3.12548828125, 3.2677001953125, 3.409912109375, 3.5521240234375, 3.6943359375, 3.8365478515625, 3.978759765625, 4.1209716796875, 4.26318359375, 4.4053955078125, 4.547607421875, 4.6898193359375, 4.83203125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 8.0, 5.0, 12.0, 19.0, 37.0, 49.0, 86.0, 125.0, 193.0, 349.0, 615.0, 1201.0, 2642.0, 7182.0, 24811.0, 133630.0, 1518188.0, 341263.0, 47660.0, 11465.0, 3945.0, 1668.0, 797.0, 481.0, 273.0, 150.0, 87.0, 70.0, 44.0, 24.0, 18.0, 7.0, 5.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.400390625, -2.32470703125, -2.2490234375, -2.17333984375, -2.09765625, -2.02197265625, -1.9462890625, -1.87060546875, -1.794921875, -1.71923828125, -1.6435546875, -1.56787109375, -1.4921875, -1.41650390625, -1.3408203125, -1.26513671875, -1.189453125, -1.11376953125, -1.0380859375, -0.96240234375, -0.88671875, -0.81103515625, -0.7353515625, -0.65966796875, -0.583984375, -0.50830078125, -0.4326171875, -0.35693359375, -0.28125, -0.20556640625, -0.1298828125, -0.05419921875, 0.021484375, 0.09716796875, 0.1728515625, 0.24853515625, 0.32421875, 0.39990234375, 0.4755859375, 0.55126953125, 0.626953125, 0.70263671875, 0.7783203125, 0.85400390625, 0.9296875, 1.00537109375, 1.0810546875, 1.15673828125, 1.232421875, 1.30810546875, 1.3837890625, 1.45947265625, 1.53515625, 1.61083984375, 1.6865234375, 1.76220703125, 1.837890625, 1.91357421875, 1.9892578125, 2.06494140625, 2.140625, 2.21630859375, 2.2919921875, 2.36767578125, 2.443359375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 7.0, 12.0, 11.0, 15.0, 17.0, 13.0, 17.0, 30.0, 24.0, 47.0, 45.0, 69.0, 89.0, 158.0, 91.0, 69.0, 39.0, 45.0, 37.0, 17.0, 24.0, 16.0, 16.0, 16.0, 16.0, 11.0, 6.0, 8.0, 2.0, 4.0, 4.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.207275390625, -0.20026397705078125, -0.1932525634765625, -0.18624114990234375, -0.179229736328125, -0.17221832275390625, -0.1652069091796875, -0.15819549560546875, -0.15118408203125, -0.14417266845703125, -0.1371612548828125, -0.13014984130859375, -0.123138427734375, -0.11612701416015625, -0.1091156005859375, -0.10210418701171875, -0.0950927734375, -0.08808135986328125, -0.0810699462890625, -0.07405853271484375, -0.067047119140625, -0.06003570556640625, -0.0530242919921875, -0.04601287841796875, -0.03900146484375, -0.03199005126953125, -0.0249786376953125, -0.01796722412109375, -0.010955810546875, -0.00394439697265625, 0.0030670166015625, 0.01007843017578125, 0.01708984375, 0.02410125732421875, 0.0311126708984375, 0.03812408447265625, 0.045135498046875, 0.05214691162109375, 0.0591583251953125, 0.06616973876953125, 0.07318115234375, 0.08019256591796875, 0.0872039794921875, 0.09421539306640625, 0.101226806640625, 0.10823822021484375, 0.1152496337890625, 0.12226104736328125, 0.1292724609375, 0.13628387451171875, 0.1432952880859375, 0.15030670166015625, 0.157318115234375, 0.16432952880859375, 0.1713409423828125, 0.17835235595703125, 0.18536376953125, 0.19237518310546875, 0.1993865966796875, 0.20639801025390625, 0.213409423828125, 0.22042083740234375, 0.2274322509765625, 0.23444366455078125, 0.241455078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 8.0, 10.0, 14.0, 18.0, 21.0, 17.0, 33.0, 47.0, 62.0, 106.0, 217.0, 651.0, 3635.0, 72422.0, 955746.0, 13419.0, 1319.0, 340.0, 152.0, 90.0, 46.0, 28.0, 35.0, 16.0, 21.0, 15.0, 13.0, 8.0, 5.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.6875, -4.5506591796875, -4.413818359375, -4.2769775390625, -4.14013671875, -4.0032958984375, -3.866455078125, -3.7296142578125, -3.5927734375, -3.4559326171875, -3.319091796875, -3.1822509765625, -3.04541015625, -2.9085693359375, -2.771728515625, -2.6348876953125, -2.498046875, -2.3612060546875, -2.224365234375, -2.0875244140625, -1.95068359375, -1.8138427734375, -1.677001953125, -1.5401611328125, -1.4033203125, -1.2664794921875, -1.129638671875, -0.9927978515625, -0.85595703125, -0.7191162109375, -0.582275390625, -0.4454345703125, -0.30859375, -0.1717529296875, -0.034912109375, 0.1019287109375, 0.23876953125, 0.3756103515625, 0.512451171875, 0.6492919921875, 0.7861328125, 0.9229736328125, 1.059814453125, 1.1966552734375, 1.33349609375, 1.4703369140625, 1.607177734375, 1.7440185546875, 1.880859375, 2.0177001953125, 2.154541015625, 2.2913818359375, 2.42822265625, 2.5650634765625, 2.701904296875, 2.8387451171875, 2.9755859375, 3.1124267578125, 3.249267578125, 3.3861083984375, 3.52294921875, 3.6597900390625, 3.796630859375, 3.9334716796875, 4.0703125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 13.0, 18.0, 35.0, 83.0, 125.0, 196.0, 216.0, 154.0, 85.0, 42.0, 16.0, 17.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5326188206672668, -0.5113019943237305, -0.4899851977825165, -0.4686684012413025, -0.4473515748977661, -0.42603474855422974, -0.40471795201301575, -0.38340115547180176, -0.3620843291282654, -0.340767502784729, -0.319450706243515, -0.298133909702301, -0.27681708335876465, -0.25550025701522827, -0.23418346047401428, -0.2128666490316391, -0.19154983758926392, -0.17023302614688873, -0.14891621470451355, -0.12759940326213837, -0.10628259181976318, -0.084965780377388, -0.06364896893501282, -0.042332157492637634, -0.02101534605026245, 0.00030146539211273193, 0.021618276834487915, 0.0429350882768631, 0.06425189971923828, 0.08556871116161346, 0.10688552260398865, 0.12820233404636383, 0.14951908588409424, 0.17083589732646942, 0.1921527087688446, 0.2134695202112198, 0.23478633165359497, 0.25610315799713135, 0.27741995453834534, 0.2987367510795593, 0.3200535774230957, 0.3413704037666321, 0.36268720030784607, 0.38400399684906006, 0.40532082319259644, 0.4266376495361328, 0.4479544460773468, 0.4692712426185608, 0.49058806896209717, 0.5119048953056335, 0.5332217216491699, 0.5545384883880615, 0.5758553147315979, 0.5971721410751343, 0.6184889078140259, 0.6398057341575623, 0.6611225605010986, 0.682439386844635, 0.7037562131881714, 0.725072979927063, 0.7463898062705994, 0.7677066326141357, 0.7890233993530273, 0.8103402256965637, 0.8316570520401001]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 6.0, 4.0, 3.0, 0.0, 7.0, 10.0, 6.0, 13.0, 11.0, 19.0, 22.0, 17.0, 26.0, 18.0, 14.0, 31.0, 36.0, 29.0, 29.0, 29.0, 40.0, 50.0, 46.0, 38.0, 45.0, 38.0, 38.0, 38.0, 27.0, 29.0, 35.0, 31.0, 29.0, 34.0, 29.0, 20.0, 18.0, 15.0, 11.0, 9.0, 7.0, 11.0, 9.0, 7.0, 4.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.17120659351348877, -0.16573093831539154, -0.1602552831172943, -0.15477962791919708, -0.14930397272109985, -0.14382831752300262, -0.1383526623249054, -0.13287700712680817, -0.12740135192871094, -0.12192569673061371, -0.11645004153251648, -0.11097438633441925, -0.10549873113632202, -0.10002307593822479, -0.09454742074012756, -0.08907176554203033, -0.0835961103439331, -0.07812045514583588, -0.07264479994773865, -0.06716914474964142, -0.06169348955154419, -0.05621783435344696, -0.05074217915534973, -0.0452665239572525, -0.03979086875915527, -0.034315213561058044, -0.028839558362960815, -0.023363903164863586, -0.017888247966766357, -0.012412592768669128, -0.006936937570571899, -0.0014612823724746704, 0.004014372825622559, 0.009490028023719788, 0.014965683221817017, 0.020441338419914246, 0.025916993618011475, 0.031392648816108704, 0.03686830401420593, 0.04234395921230316, 0.04781961441040039, 0.05329526960849762, 0.05877092480659485, 0.06424658000469208, 0.0697222352027893, 0.07519789040088654, 0.08067354559898376, 0.086149200797081, 0.09162485599517822, 0.09710051119327545, 0.10257616639137268, 0.10805182158946991, 0.11352747678756714, 0.11900313198566437, 0.1244787871837616, 0.12995444238185883, 0.13543009757995605, 0.14090575277805328, 0.1463814079761505, 0.15185706317424774, 0.15733271837234497, 0.1628083735704422, 0.16828402876853943, 0.17375968396663666, 0.1792353391647339]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 5.0, 9.0, 5.0, 12.0, 10.0, 10.0, 14.0, 17.0, 30.0, 18.0, 23.0, 34.0, 22.0, 28.0, 28.0, 34.0, 35.0, 44.0, 40.0, 37.0, 53.0, 40.0, 34.0, 33.0, 55.0, 37.0, 23.0, 27.0, 38.0, 23.0, 14.0, 21.0, 20.0, 23.0, 12.0, 14.0, 16.0, 11.0, 7.0, 8.0, 7.0, 3.0, 8.0, 5.0, 9.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.51171875, -5.321533203125, -5.13134765625, -4.941162109375, -4.7509765625, -4.560791015625, -4.37060546875, -4.180419921875, -3.990234375, -3.800048828125, -3.60986328125, -3.419677734375, -3.2294921875, -3.039306640625, -2.84912109375, -2.658935546875, -2.46875, -2.278564453125, -2.08837890625, -1.898193359375, -1.7080078125, -1.517822265625, -1.32763671875, -1.137451171875, -0.947265625, -0.757080078125, -0.56689453125, -0.376708984375, -0.1865234375, 0.003662109375, 0.19384765625, 0.384033203125, 0.57421875, 0.764404296875, 0.95458984375, 1.144775390625, 1.3349609375, 1.525146484375, 1.71533203125, 1.905517578125, 2.095703125, 2.285888671875, 2.47607421875, 2.666259765625, 2.8564453125, 3.046630859375, 3.23681640625, 3.427001953125, 3.6171875, 3.807373046875, 3.99755859375, 4.187744140625, 4.3779296875, 4.568115234375, 4.75830078125, 4.948486328125, 5.138671875, 5.328857421875, 5.51904296875, 5.709228515625, 5.8994140625, 6.089599609375, 6.27978515625, 6.469970703125, 6.66015625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 11.0, 10.0, 14.0, 29.0, 31.0, 51.0, 56.0, 83.0, 100.0, 166.0, 220.0, 309.0, 427.0, 659.0, 1016.0, 1504.0, 2607.0, 4419.0, 8618.0, 17800.0, 43814.0, 152642.0, 537420.0, 185058.0, 49800.0, 19739.0, 9342.0, 4749.0, 2750.0, 1698.0, 1011.0, 706.0, 482.0, 318.0, 246.0, 162.0, 131.0, 89.0, 64.0, 57.0, 33.0, 29.0, 25.0, 18.0, 11.0, 10.0, 2.0, 4.0, 5.0, 3.0, 1.0, 3.0], "bins": [-12.75, -12.381103515625, -12.01220703125, -11.643310546875, -11.2744140625, -10.905517578125, -10.53662109375, -10.167724609375, -9.798828125, -9.429931640625, -9.06103515625, -8.692138671875, -8.3232421875, -7.954345703125, -7.58544921875, -7.216552734375, -6.84765625, -6.478759765625, -6.10986328125, -5.740966796875, -5.3720703125, -5.003173828125, -4.63427734375, -4.265380859375, -3.896484375, -3.527587890625, -3.15869140625, -2.789794921875, -2.4208984375, -2.052001953125, -1.68310546875, -1.314208984375, -0.9453125, -0.576416015625, -0.20751953125, 0.161376953125, 0.5302734375, 0.899169921875, 1.26806640625, 1.636962890625, 2.005859375, 2.374755859375, 2.74365234375, 3.112548828125, 3.4814453125, 3.850341796875, 4.21923828125, 4.588134765625, 4.95703125, 5.325927734375, 5.69482421875, 6.063720703125, 6.4326171875, 6.801513671875, 7.17041015625, 7.539306640625, 7.908203125, 8.277099609375, 8.64599609375, 9.014892578125, 9.3837890625, 9.752685546875, 10.12158203125, 10.490478515625, 10.859375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 5.0, 2.0, 4.0, 2.0, 8.0, 3.0, 8.0, 11.0, 15.0, 16.0, 15.0, 16.0, 22.0, 22.0, 23.0, 27.0, 34.0, 34.0, 49.0, 75.0, 92.0, 147.0, 343.0, 1397.0, 150.0, 68.0, 64.0, 67.0, 50.0, 38.0, 34.0, 28.0, 33.0, 21.0, 17.0, 14.0, 13.0, 19.0, 16.0, 7.0, 6.0, 6.0, 1.0, 7.0, 2.0, 4.0, 4.0, 3.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-19.84375, -19.18310546875, -18.5224609375, -17.86181640625, -17.201171875, -16.54052734375, -15.8798828125, -15.21923828125, -14.55859375, -13.89794921875, -13.2373046875, -12.57666015625, -11.916015625, -11.25537109375, -10.5947265625, -9.93408203125, -9.2734375, -8.61279296875, -7.9521484375, -7.29150390625, -6.630859375, -5.97021484375, -5.3095703125, -4.64892578125, -3.98828125, -3.32763671875, -2.6669921875, -2.00634765625, -1.345703125, -0.68505859375, -0.0244140625, 0.63623046875, 1.296875, 1.95751953125, 2.6181640625, 3.27880859375, 3.939453125, 4.60009765625, 5.2607421875, 5.92138671875, 6.58203125, 7.24267578125, 7.9033203125, 8.56396484375, 9.224609375, 9.88525390625, 10.5458984375, 11.20654296875, 11.8671875, 12.52783203125, 13.1884765625, 13.84912109375, 14.509765625, 15.17041015625, 15.8310546875, 16.49169921875, 17.15234375, 17.81298828125, 18.4736328125, 19.13427734375, 19.794921875, 20.45556640625, 21.1162109375, 21.77685546875, 22.4375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 5.0, 4.0, 10.0, 5.0, 7.0, 5.0, 11.0, 12.0, 20.0, 24.0, 46.0, 46.0, 70.0, 124.0, 154.0, 356.0, 1071.0, 9077.0, 2892130.0, 236953.0, 4115.0, 718.0, 268.0, 152.0, 89.0, 57.0, 41.0, 31.0, 21.0, 14.0, 8.0, 9.0, 8.0, 8.0, 4.0, 5.0, 4.0, 5.0, 6.0, 3.0, 0.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-79.1875, -76.3447265625, -73.501953125, -70.6591796875, -67.81640625, -64.9736328125, -62.130859375, -59.2880859375, -56.4453125, -53.6025390625, -50.759765625, -47.9169921875, -45.07421875, -42.2314453125, -39.388671875, -36.5458984375, -33.703125, -30.8603515625, -28.017578125, -25.1748046875, -22.33203125, -19.4892578125, -16.646484375, -13.8037109375, -10.9609375, -8.1181640625, -5.275390625, -2.4326171875, 0.41015625, 3.2529296875, 6.095703125, 8.9384765625, 11.78125, 14.6240234375, 17.466796875, 20.3095703125, 23.15234375, 25.9951171875, 28.837890625, 31.6806640625, 34.5234375, 37.3662109375, 40.208984375, 43.0517578125, 45.89453125, 48.7373046875, 51.580078125, 54.4228515625, 57.265625, 60.1083984375, 62.951171875, 65.7939453125, 68.63671875, 71.4794921875, 74.322265625, 77.1650390625, 80.0078125, 82.8505859375, 85.693359375, 88.5361328125, 91.37890625, 94.2216796875, 97.064453125, 99.9072265625, 102.75]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 30.0, 683.0, 296.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.8226432800293, -48.93228530883789, -36.04193115234375, -23.151573181152344, -10.261215209960938, 2.629138946533203, 15.51949691772461, 28.409854888916016, 41.30021286010742, 54.19057083129883, 67.08092498779297, 79.97128295898438, 92.86164093017578, 105.75199890136719, 118.64234924316406, 131.53271484375, 144.42306518554688, 157.31341552734375, 170.2037811279297, 183.09413146972656, 195.9844970703125, 208.87484741210938, 221.76519775390625, 234.6555633544922, 247.54592895507812, 260.436279296875, 273.3266296386719, 286.2170104980469, 299.10736083984375, 311.9977111816406, 324.8880615234375, 337.7784423828125, 350.6687927246094, 363.55914306640625, 376.4494934082031, 389.3398742675781, 402.230224609375, 415.1205749511719, 428.01092529296875, 440.90130615234375, 453.7916564941406, 466.6820068359375, 479.5723571777344, 492.4627380371094, 505.35308837890625, 518.243408203125, 531.1337890625, 544.024169921875, 556.9144897460938, 569.8048706054688, 582.6951904296875, 595.5855712890625, 608.4758911132812, 621.3662719726562, 634.2566528320312, 647.14697265625, 660.037353515625, 672.927734375, 685.8180541992188, 698.7084350585938, 711.5987548828125, 724.4891357421875, 737.3795166015625, 750.2698364257812, 763.1602172851562]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 4.0, 6.0, 8.0, 4.0, 12.0, 10.0, 10.0, 16.0, 23.0, 21.0, 28.0, 31.0, 31.0, 26.0, 30.0, 32.0, 37.0, 36.0, 30.0, 37.0, 28.0, 36.0, 45.0, 38.0, 44.0, 41.0, 41.0, 42.0, 22.0, 33.0, 34.0, 29.0, 24.0, 25.0, 18.0, 9.0, 14.0, 12.0, 10.0, 4.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0], "bins": [-58.8868293762207, -57.15303421020508, -55.41923522949219, -53.68544006347656, -51.95164489746094, -50.21784591674805, -48.48405075073242, -46.75025177001953, -45.016456604003906, -43.28266143798828, -41.54886245727539, -39.815067291259766, -38.081268310546875, -36.34747314453125, -34.613677978515625, -32.8798828125, -31.14608383178711, -29.41228675842285, -27.678489685058594, -25.94469451904297, -24.21089744567871, -22.477100372314453, -20.743305206298828, -19.00950813293457, -17.275711059570312, -15.541913986206055, -13.808117866516113, -12.074321746826172, -10.340524673461914, -8.606727600097656, -6.872931480407715, -5.139135360717773, -3.4053421020507812, -1.6715455055236816, 0.06225109100341797, 1.7960476875305176, 3.529844284057617, 5.263641357421875, 6.997437477111816, 8.731233596801758, 10.465030670166016, 12.198827743530273, 13.932623863220215, 15.666419982910156, 17.400217056274414, 19.134014129638672, 20.867809295654297, 22.601606369018555, 24.335403442382812, 26.06920051574707, 27.802997589111328, 29.536792755126953, 31.27058982849121, 33.00438690185547, 34.738182067871094, 36.47197723388672, 38.20577621459961, 39.939571380615234, 41.673370361328125, 43.40716552734375, 45.140960693359375, 46.874759674072266, 48.60855484008789, 50.34235382080078, 52.076148986816406]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 5.0, 6.0, 4.0, 6.0, 6.0, 11.0, 9.0, 10.0, 23.0, 22.0, 24.0, 21.0, 29.0, 20.0, 39.0, 27.0, 28.0, 38.0, 36.0, 45.0, 41.0, 41.0, 46.0, 36.0, 43.0, 37.0, 38.0, 28.0, 32.0, 27.0, 25.0, 26.0, 20.0, 17.0, 23.0, 20.0, 13.0, 12.0, 13.0, 7.0, 9.0, 6.0, 8.0, 4.0, 7.0, 2.0, 2.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-6.68359375, -6.4713134765625, -6.259033203125, -6.0467529296875, -5.83447265625, -5.6221923828125, -5.409912109375, -5.1976318359375, -4.9853515625, -4.7730712890625, -4.560791015625, -4.3485107421875, -4.13623046875, -3.9239501953125, -3.711669921875, -3.4993896484375, -3.287109375, -3.0748291015625, -2.862548828125, -2.6502685546875, -2.43798828125, -2.2257080078125, -2.013427734375, -1.8011474609375, -1.5888671875, -1.3765869140625, -1.164306640625, -0.9520263671875, -0.73974609375, -0.5274658203125, -0.315185546875, -0.1029052734375, 0.109375, 0.3216552734375, 0.533935546875, 0.7462158203125, 0.95849609375, 1.1707763671875, 1.383056640625, 1.5953369140625, 1.8076171875, 2.0198974609375, 2.232177734375, 2.4444580078125, 2.65673828125, 2.8690185546875, 3.081298828125, 3.2935791015625, 3.505859375, 3.7181396484375, 3.930419921875, 4.1427001953125, 4.35498046875, 4.5672607421875, 4.779541015625, 4.9918212890625, 5.2041015625, 5.4163818359375, 5.628662109375, 5.8409423828125, 6.05322265625, 6.2655029296875, 6.477783203125, 6.6900634765625, 6.90234375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 6.0, 3.0, 7.0, 16.0, 10.0, 26.0, 22.0, 24.0, 51.0, 72.0, 114.0, 158.0, 189.0, 347.0, 528.0, 804.0, 1533.0, 2891.0, 5617.0, 12681.0, 33905.0, 153323.0, 1199662.0, 2321215.0, 365407.0, 59087.0, 19364.0, 8119.0, 3957.0, 2087.0, 1097.0, 633.0, 434.0, 305.0, 176.0, 118.0, 87.0, 52.0, 39.0, 25.0, 19.0, 17.0, 11.0, 9.0, 11.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 3.0], "bins": [-15.296875, -14.862548828125, -14.42822265625, -13.993896484375, -13.5595703125, -13.125244140625, -12.69091796875, -12.256591796875, -11.822265625, -11.387939453125, -10.95361328125, -10.519287109375, -10.0849609375, -9.650634765625, -9.21630859375, -8.781982421875, -8.34765625, -7.913330078125, -7.47900390625, -7.044677734375, -6.6103515625, -6.176025390625, -5.74169921875, -5.307373046875, -4.873046875, -4.438720703125, -4.00439453125, -3.570068359375, -3.1357421875, -2.701416015625, -2.26708984375, -1.832763671875, -1.3984375, -0.964111328125, -0.52978515625, -0.095458984375, 0.3388671875, 0.773193359375, 1.20751953125, 1.641845703125, 2.076171875, 2.510498046875, 2.94482421875, 3.379150390625, 3.8134765625, 4.247802734375, 4.68212890625, 5.116455078125, 5.55078125, 5.985107421875, 6.41943359375, 6.853759765625, 7.2880859375, 7.722412109375, 8.15673828125, 8.591064453125, 9.025390625, 9.459716796875, 9.89404296875, 10.328369140625, 10.7626953125, 11.197021484375, 11.63134765625, 12.065673828125, 12.5]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 0.0, 4.0, 4.0, 8.0, 3.0, 9.0, 11.0, 18.0, 21.0, 21.0, 24.0, 45.0, 53.0, 71.0, 110.0, 191.0, 300.0, 518.0, 698.0, 679.0, 456.0, 285.0, 164.0, 111.0, 64.0, 46.0, 34.0, 25.0, 19.0, 20.0, 18.0, 7.0, 5.0, 11.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.78125, -15.285888671875, -14.79052734375, -14.295166015625, -13.7998046875, -13.304443359375, -12.80908203125, -12.313720703125, -11.818359375, -11.322998046875, -10.82763671875, -10.332275390625, -9.8369140625, -9.341552734375, -8.84619140625, -8.350830078125, -7.85546875, -7.360107421875, -6.86474609375, -6.369384765625, -5.8740234375, -5.378662109375, -4.88330078125, -4.387939453125, -3.892578125, -3.397216796875, -2.90185546875, -2.406494140625, -1.9111328125, -1.415771484375, -0.92041015625, -0.425048828125, 0.0703125, 0.565673828125, 1.06103515625, 1.556396484375, 2.0517578125, 2.547119140625, 3.04248046875, 3.537841796875, 4.033203125, 4.528564453125, 5.02392578125, 5.519287109375, 6.0146484375, 6.510009765625, 7.00537109375, 7.500732421875, 7.99609375, 8.491455078125, 8.98681640625, 9.482177734375, 9.9775390625, 10.472900390625, 10.96826171875, 11.463623046875, 11.958984375, 12.454345703125, 12.94970703125, 13.445068359375, 13.9404296875, 14.435791015625, 14.93115234375, 15.426513671875, 15.921875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 6.0, 9.0, 7.0, 6.0, 10.0, 18.0, 21.0, 22.0, 42.0, 67.0, 122.0, 235.0, 586.0, 1776.0, 7050.0, 42522.0, 1320546.0, 2745444.0, 63223.0, 9019.0, 2209.0, 729.0, 273.0, 111.0, 73.0, 42.0, 29.0, 17.0, 17.0, 11.0, 13.0, 6.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.3125, -35.06396484375, -33.8154296875, -32.56689453125, -31.318359375, -30.06982421875, -28.8212890625, -27.57275390625, -26.32421875, -25.07568359375, -23.8271484375, -22.57861328125, -21.330078125, -20.08154296875, -18.8330078125, -17.58447265625, -16.3359375, -15.08740234375, -13.8388671875, -12.59033203125, -11.341796875, -10.09326171875, -8.8447265625, -7.59619140625, -6.34765625, -5.09912109375, -3.8505859375, -2.60205078125, -1.353515625, -0.10498046875, 1.1435546875, 2.39208984375, 3.640625, 4.88916015625, 6.1376953125, 7.38623046875, 8.634765625, 9.88330078125, 11.1318359375, 12.38037109375, 13.62890625, 14.87744140625, 16.1259765625, 17.37451171875, 18.623046875, 19.87158203125, 21.1201171875, 22.36865234375, 23.6171875, 24.86572265625, 26.1142578125, 27.36279296875, 28.611328125, 29.85986328125, 31.1083984375, 32.35693359375, 33.60546875, 34.85400390625, 36.1025390625, 37.35107421875, 38.599609375, 39.84814453125, 41.0966796875, 42.34521484375, 43.59375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 13.0, 54.0, 67.0, 189.0, 238.0, 228.0, 123.0, 59.0, 26.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-204.87384033203125, -200.57501220703125, -196.2761688232422, -191.97732543945312, -187.67849731445312, -183.37966918945312, -179.08082580566406, -174.781982421875, -170.483154296875, -166.184326171875, -161.88548278808594, -157.58663940429688, -153.28781127929688, -148.98898315429688, -144.6901397705078, -140.39129638671875, -136.09246826171875, -131.79364013671875, -127.49479675292969, -123.19596099853516, -118.89712524414062, -114.5982894897461, -110.29945373535156, -106.00061798095703, -101.7017822265625, -97.40294647216797, -93.10411071777344, -88.8052749633789, -84.50643920898438, -80.20760345458984, -75.90876770019531, -71.60993194580078, -67.31109619140625, -63.01226043701172, -58.71342468261719, -54.414588928222656, -50.115753173828125, -45.816917419433594, -41.51808166503906, -37.21924591064453, -32.92041015625, -28.62157440185547, -24.322738647460938, -20.023902893066406, -15.725067138671875, -11.426231384277344, -7.1273956298828125, -2.8285598754882812, 1.47027587890625, 5.769111633300781, 10.067947387695312, 14.366783142089844, 18.665618896484375, 22.964454650878906, 27.263290405273438, 31.56212615966797, 35.8609619140625, 40.15979766845703, 44.45863342285156, 48.757469177246094, 53.056304931640625, 57.355140686035156, 61.65397644042969, 65.95281219482422, 70.25164794921875]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 7.0, 7.0, 17.0, 22.0, 20.0, 20.0, 24.0, 28.0, 26.0, 28.0, 37.0, 26.0, 34.0, 42.0, 38.0, 47.0, 44.0, 50.0, 34.0, 44.0, 39.0, 30.0, 32.0, 38.0, 35.0, 31.0, 32.0, 29.0, 21.0, 20.0, 16.0, 16.0, 14.0, 8.0, 7.0, 7.0, 5.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-47.331844329833984, -45.90064239501953, -44.469444274902344, -43.03824234008789, -41.60704040527344, -40.17584228515625, -38.7446403503418, -37.313438415527344, -35.882240295410156, -34.4510383605957, -33.019840240478516, -31.588638305664062, -30.15743637084961, -28.72623634338379, -27.29503631591797, -25.863834381103516, -24.432632446289062, -23.001432418823242, -21.57023048400879, -20.13903045654297, -18.707828521728516, -17.276628494262695, -15.845428466796875, -14.414227485656738, -12.983026504516602, -11.551825523376465, -10.120624542236328, -8.689424514770508, -7.258223533630371, -5.827022552490234, -4.395822525024414, -2.9646215438842773, -1.5334205627441406, -0.10221982002258301, 1.3289809226989746, 2.760181427001953, 4.19138240814209, 5.622583389282227, 7.053783416748047, 8.484984397888184, 9.91618537902832, 11.347386360168457, 12.778587341308594, 14.209787368774414, 15.64098834991455, 17.072189331054688, 18.503389358520508, 19.934589385986328, 21.36579132080078, 22.7969913482666, 24.228193283081055, 25.659393310546875, 27.090595245361328, 28.52179527282715, 29.95299530029297, 31.384197235107422, 32.815399169921875, 34.24660110473633, 35.677799224853516, 37.10900115966797, 38.54020309448242, 39.971405029296875, 41.40260314941406, 42.833805084228516, 44.2650032043457]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 11.0, 10.0, 11.0, 15.0, 19.0, 12.0, 25.0, 29.0, 23.0, 29.0, 30.0, 44.0, 34.0, 44.0, 29.0, 51.0, 38.0, 37.0, 53.0, 44.0, 43.0, 46.0, 47.0, 33.0, 33.0, 20.0, 24.0, 16.0, 24.0, 24.0, 12.0, 8.0, 17.0, 11.0, 9.0, 3.0, 9.0, 8.0, 7.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16015625, -5.94586181640625, -5.7315673828125, -5.51727294921875, -5.302978515625, -5.08868408203125, -4.8743896484375, -4.66009521484375, -4.44580078125, -4.23150634765625, -4.0172119140625, -3.80291748046875, -3.588623046875, -3.37432861328125, -3.1600341796875, -2.94573974609375, -2.7314453125, -2.51715087890625, -2.3028564453125, -2.08856201171875, -1.874267578125, -1.65997314453125, -1.4456787109375, -1.23138427734375, -1.01708984375, -0.80279541015625, -0.5885009765625, -0.37420654296875, -0.159912109375, 0.05438232421875, 0.2686767578125, 0.48297119140625, 0.697265625, 0.91156005859375, 1.1258544921875, 1.34014892578125, 1.554443359375, 1.76873779296875, 1.9830322265625, 2.19732666015625, 2.41162109375, 2.62591552734375, 2.8402099609375, 3.05450439453125, 3.268798828125, 3.48309326171875, 3.6973876953125, 3.91168212890625, 4.1259765625, 4.34027099609375, 4.5545654296875, 4.76885986328125, 4.983154296875, 5.19744873046875, 5.4117431640625, 5.62603759765625, 5.84033203125, 6.05462646484375, 6.2689208984375, 6.48321533203125, 6.697509765625, 6.91180419921875, 7.1260986328125, 7.34039306640625, 7.5546875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 5.0, 6.0, 8.0, 7.0, 16.0, 10.0, 17.0, 24.0, 33.0, 56.0, 77.0, 134.0, 173.0, 287.0, 412.0, 597.0, 1046.0, 1639.0, 2806.0, 5106.0, 9686.0, 20031.0, 49262.0, 143822.0, 412992.0, 259237.0, 80918.0, 30315.0, 13569.0, 6745.0, 3802.0, 2101.0, 1295.0, 745.0, 517.0, 344.0, 211.0, 164.0, 99.0, 67.0, 42.0, 34.0, 20.0, 21.0, 20.0, 6.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.384765625, -3.27813720703125, -3.1715087890625, -3.06488037109375, -2.958251953125, -2.85162353515625, -2.7449951171875, -2.63836669921875, -2.53173828125, -2.42510986328125, -2.3184814453125, -2.21185302734375, -2.105224609375, -1.99859619140625, -1.8919677734375, -1.78533935546875, -1.6787109375, -1.57208251953125, -1.4654541015625, -1.35882568359375, -1.252197265625, -1.14556884765625, -1.0389404296875, -0.93231201171875, -0.82568359375, -0.71905517578125, -0.6124267578125, -0.50579833984375, -0.399169921875, -0.29254150390625, -0.1859130859375, -0.07928466796875, 0.02734375, 0.13397216796875, 0.2406005859375, 0.34722900390625, 0.453857421875, 0.56048583984375, 0.6671142578125, 0.77374267578125, 0.88037109375, 0.98699951171875, 1.0936279296875, 1.20025634765625, 1.306884765625, 1.41351318359375, 1.5201416015625, 1.62677001953125, 1.7333984375, 1.84002685546875, 1.9466552734375, 2.05328369140625, 2.159912109375, 2.26654052734375, 2.3731689453125, 2.47979736328125, 2.58642578125, 2.69305419921875, 2.7996826171875, 2.90631103515625, 3.012939453125, 3.11956787109375, 3.2261962890625, 3.33282470703125, 3.439453125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 3.0, 9.0, 13.0, 15.0, 20.0, 13.0, 22.0, 21.0, 28.0, 21.0, 29.0, 25.0, 39.0, 45.0, 33.0, 50.0, 49.0, 1077.0, 48.0, 49.0, 63.0, 43.0, 36.0, 37.0, 29.0, 35.0, 25.0, 25.0, 19.0, 25.0, 16.0, 13.0, 13.0, 9.0, 12.0, 4.0, 5.0, 2.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.55078125, -5.3868408203125, -5.222900390625, -5.0589599609375, -4.89501953125, -4.7310791015625, -4.567138671875, -4.4031982421875, -4.2392578125, -4.0753173828125, -3.911376953125, -3.7474365234375, -3.58349609375, -3.4195556640625, -3.255615234375, -3.0916748046875, -2.927734375, -2.7637939453125, -2.599853515625, -2.4359130859375, -2.27197265625, -2.1080322265625, -1.944091796875, -1.7801513671875, -1.6162109375, -1.4522705078125, -1.288330078125, -1.1243896484375, -0.96044921875, -0.7965087890625, -0.632568359375, -0.4686279296875, -0.3046875, -0.1407470703125, 0.023193359375, 0.1871337890625, 0.35107421875, 0.5150146484375, 0.678955078125, 0.8428955078125, 1.0068359375, 1.1707763671875, 1.334716796875, 1.4986572265625, 1.66259765625, 1.8265380859375, 1.990478515625, 2.1544189453125, 2.318359375, 2.4822998046875, 2.646240234375, 2.8101806640625, 2.97412109375, 3.1380615234375, 3.302001953125, 3.4659423828125, 3.6298828125, 3.7938232421875, 3.957763671875, 4.1217041015625, 4.28564453125, 4.4495849609375, 4.613525390625, 4.7774658203125, 4.94140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 8.0, 3.0, 8.0, 27.0, 23.0, 26.0, 52.0, 66.0, 87.0, 133.0, 258.0, 327.0, 598.0, 994.0, 1868.0, 3787.0, 9042.0, 30211.0, 189440.0, 1622658.0, 189820.0, 30631.0, 9000.0, 3709.0, 1802.0, 983.0, 604.0, 335.0, 203.0, 145.0, 93.0, 66.0, 37.0, 29.0, 17.0, 22.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.671875, -3.55889892578125, -3.4459228515625, -3.33294677734375, -3.219970703125, -3.10699462890625, -2.9940185546875, -2.88104248046875, -2.76806640625, -2.65509033203125, -2.5421142578125, -2.42913818359375, -2.316162109375, -2.20318603515625, -2.0902099609375, -1.97723388671875, -1.8642578125, -1.75128173828125, -1.6383056640625, -1.52532958984375, -1.412353515625, -1.29937744140625, -1.1864013671875, -1.07342529296875, -0.96044921875, -0.84747314453125, -0.7344970703125, -0.62152099609375, -0.508544921875, -0.39556884765625, -0.2825927734375, -0.16961669921875, -0.056640625, 0.05633544921875, 0.1693115234375, 0.28228759765625, 0.395263671875, 0.50823974609375, 0.6212158203125, 0.73419189453125, 0.84716796875, 0.96014404296875, 1.0731201171875, 1.18609619140625, 1.299072265625, 1.41204833984375, 1.5250244140625, 1.63800048828125, 1.7509765625, 1.86395263671875, 1.9769287109375, 2.08990478515625, 2.202880859375, 2.31585693359375, 2.4288330078125, 2.54180908203125, 2.65478515625, 2.76776123046875, 2.8807373046875, 2.99371337890625, 3.106689453125, 3.21966552734375, 3.3326416015625, 3.44561767578125, 3.55859375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 6.0, 14.0, 18.0, 48.0, 65.0, 101.0, 184.0, 205.0, 125.0, 78.0, 50.0, 29.0, 21.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9931640625, -0.9663848876953125, -0.939605712890625, -0.9128265380859375, -0.88604736328125, -0.8592681884765625, -0.832489013671875, -0.8057098388671875, -0.7789306640625, -0.7521514892578125, -0.725372314453125, -0.6985931396484375, -0.67181396484375, -0.6450347900390625, -0.618255615234375, -0.5914764404296875, -0.564697265625, -0.5379180908203125, -0.511138916015625, -0.4843597412109375, -0.45758056640625, -0.4308013916015625, -0.404022216796875, -0.3772430419921875, -0.3504638671875, -0.3236846923828125, -0.296905517578125, -0.2701263427734375, -0.24334716796875, -0.2165679931640625, -0.189788818359375, -0.1630096435546875, -0.13623046875, -0.1094512939453125, -0.082672119140625, -0.0558929443359375, -0.02911376953125, -0.0023345947265625, 0.024444580078125, 0.0512237548828125, 0.0780029296875, 0.1047821044921875, 0.131561279296875, 0.1583404541015625, 0.18511962890625, 0.2118988037109375, 0.238677978515625, 0.2654571533203125, 0.292236328125, 0.3190155029296875, 0.345794677734375, 0.3725738525390625, 0.39935302734375, 0.4261322021484375, 0.452911376953125, 0.4796905517578125, 0.5064697265625, 0.5332489013671875, 0.560028076171875, 0.5868072509765625, 0.61358642578125, 0.6403656005859375, 0.667144775390625, 0.6939239501953125, 0.720703125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 13.0, 14.0, 17.0, 15.0, 36.0, 60.0, 91.0, 199.0, 841.0, 8261.0, 1001189.0, 35374.0, 1729.0, 319.0, 133.0, 74.0, 28.0, 29.0, 16.0, 16.0, 10.0, 7.0, 7.0, 7.0, 6.0, 5.0, 4.0, 2.0, 9.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2109375, -11.7996826171875, -11.388427734375, -10.9771728515625, -10.56591796875, -10.1546630859375, -9.743408203125, -9.3321533203125, -8.9208984375, -8.5096435546875, -8.098388671875, -7.6871337890625, -7.27587890625, -6.8646240234375, -6.453369140625, -6.0421142578125, -5.630859375, -5.2196044921875, -4.808349609375, -4.3970947265625, -3.98583984375, -3.5745849609375, -3.163330078125, -2.7520751953125, -2.3408203125, -1.9295654296875, -1.518310546875, -1.1070556640625, -0.69580078125, -0.2845458984375, 0.126708984375, 0.5379638671875, 0.94921875, 1.3604736328125, 1.771728515625, 2.1829833984375, 2.59423828125, 3.0054931640625, 3.416748046875, 3.8280029296875, 4.2392578125, 4.6505126953125, 5.061767578125, 5.4730224609375, 5.88427734375, 6.2955322265625, 6.706787109375, 7.1180419921875, 7.529296875, 7.9405517578125, 8.351806640625, 8.7630615234375, 9.17431640625, 9.5855712890625, 9.996826171875, 10.4080810546875, 10.8193359375, 11.2305908203125, 11.641845703125, 12.0531005859375, 12.46435546875, 12.8756103515625, 13.286865234375, 13.6981201171875, 14.109375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 18.0, 121.0, 453.0, 335.0, 72.0, 10.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4320948123931885, -3.308811902999878, -3.1855287551879883, -3.0622458457946777, -2.938962697982788, -2.8156797885894775, -2.692396640777588, -2.5691137313842773, -2.445830821990967, -2.3225479125976562, -2.1992647647857666, -2.075981855392456, -1.9526987075805664, -1.8294157981872559, -1.7061327695846558, -1.5828497409820557, -1.459566593170166, -1.336283564567566, -1.2130005359649658, -1.0897176265716553, -0.9664345383644104, -0.8431515097618103, -0.719868540763855, -0.5965855121612549, -0.4733024835586548, -0.3500194549560547, -0.22673645615577698, -0.10345345735549927, 0.01982957124710083, 0.14311259984970093, 0.26639556884765625, 0.38967859745025635, 0.5129618644714355, 0.6362448930740356, 0.7595279216766357, 0.8828108906745911, 1.006093978881836, 1.1293768882751465, 1.2526599168777466, 1.3759429454803467, 1.4992259740829468, 1.6225090026855469, 1.745792031288147, 1.869075059890747, 1.9923579692840576, 2.1156411170959473, 2.238924026489258, 2.3622069358825684, 2.485490083694458, 2.6087729930877686, 2.732056140899658, 2.8553390502929688, 2.9786221981048584, 3.101905107498169, 3.2251882553100586, 3.348471164703369, 3.4717540740966797, 3.5950369834899902, 3.71832013130188, 3.8416030406951904, 3.96488618850708, 4.088169097900391, 4.211452007293701, 4.334734916687012, 4.4580183029174805]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 6.0, 6.0, 11.0, 17.0, 13.0, 11.0, 15.0, 18.0, 15.0, 19.0, 30.0, 35.0, 33.0, 39.0, 29.0, 53.0, 37.0, 42.0, 34.0, 39.0, 38.0, 38.0, 45.0, 32.0, 38.0, 41.0, 29.0, 31.0, 40.0, 35.0, 14.0, 18.0, 14.0, 12.0, 10.0, 12.0, 9.0, 7.0, 6.0, 4.0, 2.0, 6.0, 3.0, 0.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5835478901863098, -0.5644182562828064, -0.5452886819839478, -0.5261590480804443, -0.5070294737815857, -0.48789986968040466, -0.46877026557922363, -0.4496406316757202, -0.4305110573768616, -0.41138145327568054, -0.3922518491744995, -0.3731222450733185, -0.35399264097213745, -0.3348630368709564, -0.3157334327697754, -0.296603798866272, -0.27747419476509094, -0.2583445906639099, -0.23921498656272888, -0.22008538246154785, -0.20095577836036682, -0.1818261742591858, -0.16269655525684357, -0.14356695115566254, -0.1244373470544815, -0.10530774295330048, -0.08617813885211945, -0.06704852730035782, -0.04791892319917679, -0.028789319097995758, -0.00965970754623413, 0.0094698965549469, 0.02859950065612793, 0.04772910475730896, 0.06685870885848999, 0.08598832041025162, 0.10511792451143265, 0.12424752861261368, 0.1433771401643753, 0.16250674426555634, 0.18163634836673737, 0.2007659524679184, 0.21989555656909943, 0.23902517557144165, 0.2581547796726227, 0.2772843837738037, 0.29641398787498474, 0.31554359197616577, 0.3346731960773468, 0.35380280017852783, 0.37293240427970886, 0.3920620083808899, 0.4111916124820709, 0.43032121658325195, 0.44945085048675537, 0.468580424785614, 0.48771005868911743, 0.5068396925926208, 0.5259692668914795, 0.5450989007949829, 0.5642284750938416, 0.583358108997345, 0.6024876832962036, 0.621617317199707, 0.6407468914985657]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 12.0, 18.0, 12.0, 17.0, 11.0, 17.0, 20.0, 31.0, 26.0, 24.0, 24.0, 34.0, 49.0, 43.0, 35.0, 42.0, 44.0, 47.0, 37.0, 39.0, 38.0, 51.0, 40.0, 37.0, 21.0, 16.0, 30.0, 24.0, 20.0, 18.0, 14.0, 17.0, 18.0, 13.0, 10.0, 12.0, 10.0, 2.0, 7.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.13671875, -5.92462158203125, -5.7125244140625, -5.50042724609375, -5.288330078125, -5.07623291015625, -4.8641357421875, -4.65203857421875, -4.43994140625, -4.22784423828125, -4.0157470703125, -3.80364990234375, -3.591552734375, -3.37945556640625, -3.1673583984375, -2.95526123046875, -2.7431640625, -2.53106689453125, -2.3189697265625, -2.10687255859375, -1.894775390625, -1.68267822265625, -1.4705810546875, -1.25848388671875, -1.04638671875, -0.83428955078125, -0.6221923828125, -0.41009521484375, -0.197998046875, 0.01409912109375, 0.2261962890625, 0.43829345703125, 0.650390625, 0.86248779296875, 1.0745849609375, 1.28668212890625, 1.498779296875, 1.71087646484375, 1.9229736328125, 2.13507080078125, 2.34716796875, 2.55926513671875, 2.7713623046875, 2.98345947265625, 3.195556640625, 3.40765380859375, 3.6197509765625, 3.83184814453125, 4.0439453125, 4.25604248046875, 4.4681396484375, 4.68023681640625, 4.892333984375, 5.10443115234375, 5.3165283203125, 5.52862548828125, 5.74072265625, 5.95281982421875, 6.1649169921875, 6.37701416015625, 6.589111328125, 6.80120849609375, 7.0133056640625, 7.22540283203125, 7.4375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 9.0, 5.0, 8.0, 17.0, 37.0, 30.0, 57.0, 83.0, 95.0, 165.0, 203.0, 307.0, 465.0, 718.0, 1036.0, 1624.0, 2693.0, 4331.0, 7510.0, 13491.0, 26725.0, 59337.0, 155511.0, 454401.0, 185552.0, 68358.0, 30032.0, 14859.0, 8234.0, 4739.0, 2777.0, 1625.0, 1127.0, 747.0, 487.0, 315.0, 261.0, 161.0, 111.0, 90.0, 60.0, 43.0, 28.0, 27.0, 17.0, 12.0, 11.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0078125, -7.737060546875, -7.46630859375, -7.195556640625, -6.9248046875, -6.654052734375, -6.38330078125, -6.112548828125, -5.841796875, -5.571044921875, -5.30029296875, -5.029541015625, -4.7587890625, -4.488037109375, -4.21728515625, -3.946533203125, -3.67578125, -3.405029296875, -3.13427734375, -2.863525390625, -2.5927734375, -2.322021484375, -2.05126953125, -1.780517578125, -1.509765625, -1.239013671875, -0.96826171875, -0.697509765625, -0.4267578125, -0.156005859375, 0.11474609375, 0.385498046875, 0.65625, 0.927001953125, 1.19775390625, 1.468505859375, 1.7392578125, 2.010009765625, 2.28076171875, 2.551513671875, 2.822265625, 3.093017578125, 3.36376953125, 3.634521484375, 3.9052734375, 4.176025390625, 4.44677734375, 4.717529296875, 4.98828125, 5.259033203125, 5.52978515625, 5.800537109375, 6.0712890625, 6.342041015625, 6.61279296875, 6.883544921875, 7.154296875, 7.425048828125, 7.69580078125, 7.966552734375, 8.2373046875, 8.508056640625, 8.77880859375, 9.049560546875, 9.3203125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 3.0, 11.0, 11.0, 8.0, 15.0, 19.0, 22.0, 35.0, 31.0, 37.0, 49.0, 52.0, 53.0, 79.0, 135.0, 242.0, 1477.0, 249.0, 103.0, 64.0, 48.0, 41.0, 49.0, 33.0, 31.0, 19.0, 22.0, 18.0, 19.0, 11.0, 14.0, 13.0, 7.0, 6.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.171875, -22.324951171875, -21.47802734375, -20.631103515625, -19.7841796875, -18.937255859375, -18.09033203125, -17.243408203125, -16.396484375, -15.549560546875, -14.70263671875, -13.855712890625, -13.0087890625, -12.161865234375, -11.31494140625, -10.468017578125, -9.62109375, -8.774169921875, -7.92724609375, -7.080322265625, -6.2333984375, -5.386474609375, -4.53955078125, -3.692626953125, -2.845703125, -1.998779296875, -1.15185546875, -0.304931640625, 0.5419921875, 1.388916015625, 2.23583984375, 3.082763671875, 3.9296875, 4.776611328125, 5.62353515625, 6.470458984375, 7.3173828125, 8.164306640625, 9.01123046875, 9.858154296875, 10.705078125, 11.552001953125, 12.39892578125, 13.245849609375, 14.0927734375, 14.939697265625, 15.78662109375, 16.633544921875, 17.48046875, 18.327392578125, 19.17431640625, 20.021240234375, 20.8681640625, 21.715087890625, 22.56201171875, 23.408935546875, 24.255859375, 25.102783203125, 25.94970703125, 26.796630859375, 27.6435546875, 28.490478515625, 29.33740234375, 30.184326171875, 31.03125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 3.0, 4.0, 13.0, 12.0, 18.0, 30.0, 37.0, 81.0, 129.0, 236.0, 532.0, 1525.0, 18593.0, 3107898.0, 14141.0, 1391.0, 503.0, 234.0, 122.0, 78.0, 36.0, 23.0, 21.0, 18.0, 5.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-116.8125, -113.21484375, -109.6171875, -106.01953125, -102.421875, -98.82421875, -95.2265625, -91.62890625, -88.03125, -84.43359375, -80.8359375, -77.23828125, -73.640625, -70.04296875, -66.4453125, -62.84765625, -59.25, -55.65234375, -52.0546875, -48.45703125, -44.859375, -41.26171875, -37.6640625, -34.06640625, -30.46875, -26.87109375, -23.2734375, -19.67578125, -16.078125, -12.48046875, -8.8828125, -5.28515625, -1.6875, 1.91015625, 5.5078125, 9.10546875, 12.703125, 16.30078125, 19.8984375, 23.49609375, 27.09375, 30.69140625, 34.2890625, 37.88671875, 41.484375, 45.08203125, 48.6796875, 52.27734375, 55.875, 59.47265625, 63.0703125, 66.66796875, 70.265625, 73.86328125, 77.4609375, 81.05859375, 84.65625, 88.25390625, 91.8515625, 95.44921875, 99.046875, 102.64453125, 106.2421875, 109.83984375, 113.4375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 5.0, 267.0, 688.0, 55.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.845659255981445, -22.082050323486328, -12.318439483642578, -2.554830551147461, 7.208780288696289, 16.97239112854004, 26.735998153686523, 36.499610900878906, 46.263221740722656, 56.026832580566406, 65.79044342041016, 75.55404663085938, 85.31765747070312, 95.08126831054688, 104.84487915039062, 114.60848999023438, 124.37210083007812, 134.13571166992188, 143.89932250976562, 153.66293334960938, 163.42654418945312, 173.19015502929688, 182.95376586914062, 192.71737670898438, 202.48097229003906, 212.2445831298828, 222.00819396972656, 231.7718048095703, 241.53541564941406, 251.2990264892578, 261.0626220703125, 270.82623291015625, 280.5898742675781, 290.3534851074219, 300.1170959472656, 309.8807067871094, 319.6443176269531, 329.4079284667969, 339.1715393066406, 348.9351501464844, 358.6987609863281, 368.4623718261719, 378.2259826660156, 387.9895935058594, 397.7532043457031, 407.5168151855469, 417.2804260253906, 427.0440368652344, 436.8076171875, 446.57122802734375, 456.3348388671875, 466.09844970703125, 475.862060546875, 485.62567138671875, 495.3892822265625, 505.15289306640625, 514.91650390625, 524.6801147460938, 534.4437255859375, 544.2073364257812, 553.970947265625, 563.7345581054688, 573.4981689453125, 583.2617797851562, 593.025390625]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 13.0, 10.0, 13.0, 12.0, 13.0, 15.0, 20.0, 14.0, 18.0, 19.0, 20.0, 15.0, 27.0, 21.0, 38.0, 33.0, 38.0, 41.0, 35.0, 39.0, 38.0, 50.0, 30.0, 42.0, 41.0, 39.0, 27.0, 27.0, 19.0, 24.0, 20.0, 27.0, 17.0, 19.0, 15.0, 16.0, 18.0, 10.0, 11.0, 15.0, 12.0, 3.0, 6.0, 6.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-52.3376579284668, -50.684295654296875, -49.03093719482422, -47.3775749206543, -45.72421646118164, -44.07085418701172, -42.41749572753906, -40.76413345336914, -39.11077117919922, -37.4574089050293, -35.80405044555664, -34.15068817138672, -32.49732971191406, -30.84396743774414, -29.19060707092285, -27.537246704101562, -25.883886337280273, -24.230525970458984, -22.577165603637695, -20.923805236816406, -19.270442962646484, -17.617082595825195, -15.963722229003906, -14.3103609085083, -12.657000541687012, -11.003640174865723, -9.350278854370117, -7.696918487548828, -6.043557643890381, -4.390196800231934, -2.7368364334106445, -1.083475112915039, 0.56988525390625, 2.2232460975646973, 3.8766067028045654, 5.529967308044434, 7.183328151702881, 8.836688995361328, 10.490049362182617, 12.143410682678223, 13.796771049499512, 15.4501314163208, 17.103492736816406, 18.756853103637695, 20.410213470458984, 22.063575744628906, 23.716934204101562, 25.370296478271484, 27.023656845092773, 28.677017211914062, 30.33037757873535, 31.98373794555664, 33.63710021972656, 35.29045867919922, 36.94382095336914, 38.59718322753906, 40.25054168701172, 41.90390396118164, 43.5572624206543, 45.21062469482422, 46.863983154296875, 48.5173454284668, 50.17070770263672, 51.824066162109375, 53.4774284362793]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 7.0, 7.0, 11.0, 10.0, 14.0, 15.0, 17.0, 17.0, 21.0, 21.0, 18.0, 30.0, 30.0, 31.0, 34.0, 37.0, 37.0, 36.0, 33.0, 45.0, 41.0, 41.0, 35.0, 35.0, 42.0, 36.0, 30.0, 27.0, 26.0, 31.0, 20.0, 19.0, 29.0, 13.0, 17.0, 11.0, 13.0, 13.0, 5.0, 14.0, 5.0, 3.0, 4.0, 7.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.58203125, -6.3740234375, -6.166015625, -5.9580078125, -5.75, -5.5419921875, -5.333984375, -5.1259765625, -4.91796875, -4.7099609375, -4.501953125, -4.2939453125, -4.0859375, -3.8779296875, -3.669921875, -3.4619140625, -3.25390625, -3.0458984375, -2.837890625, -2.6298828125, -2.421875, -2.2138671875, -2.005859375, -1.7978515625, -1.58984375, -1.3818359375, -1.173828125, -0.9658203125, -0.7578125, -0.5498046875, -0.341796875, -0.1337890625, 0.07421875, 0.2822265625, 0.490234375, 0.6982421875, 0.90625, 1.1142578125, 1.322265625, 1.5302734375, 1.73828125, 1.9462890625, 2.154296875, 2.3623046875, 2.5703125, 2.7783203125, 2.986328125, 3.1943359375, 3.40234375, 3.6103515625, 3.818359375, 4.0263671875, 4.234375, 4.4423828125, 4.650390625, 4.8583984375, 5.06640625, 5.2744140625, 5.482421875, 5.6904296875, 5.8984375, 6.1064453125, 6.314453125, 6.5224609375, 6.73046875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 6.0, 10.0, 11.0, 12.0, 23.0, 40.0, 39.0, 63.0, 83.0, 138.0, 194.0, 309.0, 455.0, 684.0, 1179.0, 1804.0, 3045.0, 5493.0, 10450.0, 23529.0, 71818.0, 387312.0, 1901670.0, 1445027.0, 248396.0, 52538.0, 19220.0, 8860.0, 4821.0, 2708.0, 1565.0, 1021.0, 619.0, 402.0, 236.0, 145.0, 105.0, 81.0, 52.0, 38.0, 28.0, 12.0, 12.0, 8.0, 5.0, 4.0, 4.0, 0.0, 5.0, 5.0, 1.0, 1.0, 3.0], "bins": [-12.3046875, -11.9415283203125, -11.578369140625, -11.2152099609375, -10.85205078125, -10.4888916015625, -10.125732421875, -9.7625732421875, -9.3994140625, -9.0362548828125, -8.673095703125, -8.3099365234375, -7.94677734375, -7.5836181640625, -7.220458984375, -6.8572998046875, -6.494140625, -6.1309814453125, -5.767822265625, -5.4046630859375, -5.04150390625, -4.6783447265625, -4.315185546875, -3.9520263671875, -3.5888671875, -3.2257080078125, -2.862548828125, -2.4993896484375, -2.13623046875, -1.7730712890625, -1.409912109375, -1.0467529296875, -0.68359375, -0.3204345703125, 0.042724609375, 0.4058837890625, 0.76904296875, 1.1322021484375, 1.495361328125, 1.8585205078125, 2.2216796875, 2.5848388671875, 2.947998046875, 3.3111572265625, 3.67431640625, 4.0374755859375, 4.400634765625, 4.7637939453125, 5.126953125, 5.4901123046875, 5.853271484375, 6.2164306640625, 6.57958984375, 6.9427490234375, 7.305908203125, 7.6690673828125, 8.0322265625, 8.3953857421875, 8.758544921875, 9.1217041015625, 9.48486328125, 9.8480224609375, 10.211181640625, 10.5743408203125, 10.9375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 5.0, 2.0, 9.0, 14.0, 17.0, 10.0, 13.0, 27.0, 28.0, 50.0, 57.0, 69.0, 84.0, 142.0, 211.0, 293.0, 487.0, 549.0, 565.0, 431.0, 302.0, 187.0, 125.0, 93.0, 91.0, 47.0, 31.0, 27.0, 15.0, 15.0, 12.0, 7.0, 10.0, 8.0, 9.0, 7.0, 7.0, 4.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.1171875, -12.7183837890625, -12.319580078125, -11.9207763671875, -11.52197265625, -11.1231689453125, -10.724365234375, -10.3255615234375, -9.9267578125, -9.5279541015625, -9.129150390625, -8.7303466796875, -8.33154296875, -7.9327392578125, -7.533935546875, -7.1351318359375, -6.736328125, -6.3375244140625, -5.938720703125, -5.5399169921875, -5.14111328125, -4.7423095703125, -4.343505859375, -3.9447021484375, -3.5458984375, -3.1470947265625, -2.748291015625, -2.3494873046875, -1.95068359375, -1.5518798828125, -1.153076171875, -0.7542724609375, -0.35546875, 0.0433349609375, 0.442138671875, 0.8409423828125, 1.23974609375, 1.6385498046875, 2.037353515625, 2.4361572265625, 2.8349609375, 3.2337646484375, 3.632568359375, 4.0313720703125, 4.43017578125, 4.8289794921875, 5.227783203125, 5.6265869140625, 6.025390625, 6.4241943359375, 6.822998046875, 7.2218017578125, 7.62060546875, 8.0194091796875, 8.418212890625, 8.8170166015625, 9.2158203125, 9.6146240234375, 10.013427734375, 10.4122314453125, 10.81103515625, 11.2098388671875, 11.608642578125, 12.0074462890625, 12.40625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 4.0, 2.0, 3.0, 3.0, 7.0, 12.0, 11.0, 14.0, 16.0, 13.0, 24.0, 35.0, 39.0, 77.0, 94.0, 157.0, 295.0, 889.0, 3739.0, 26556.0, 804861.0, 3283328.0, 65086.0, 6659.0, 1352.0, 428.0, 180.0, 101.0, 58.0, 54.0, 46.0, 32.0, 24.0, 10.0, 13.0, 14.0, 13.0, 9.0, 5.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-41.03125, -39.71484375, -38.3984375, -37.08203125, -35.765625, -34.44921875, -33.1328125, -31.81640625, -30.5, -29.18359375, -27.8671875, -26.55078125, -25.234375, -23.91796875, -22.6015625, -21.28515625, -19.96875, -18.65234375, -17.3359375, -16.01953125, -14.703125, -13.38671875, -12.0703125, -10.75390625, -9.4375, -8.12109375, -6.8046875, -5.48828125, -4.171875, -2.85546875, -1.5390625, -0.22265625, 1.09375, 2.41015625, 3.7265625, 5.04296875, 6.359375, 7.67578125, 8.9921875, 10.30859375, 11.625, 12.94140625, 14.2578125, 15.57421875, 16.890625, 18.20703125, 19.5234375, 20.83984375, 22.15625, 23.47265625, 24.7890625, 26.10546875, 27.421875, 28.73828125, 30.0546875, 31.37109375, 32.6875, 34.00390625, 35.3203125, 36.63671875, 37.953125, 39.26953125, 40.5859375, 41.90234375, 43.21875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 15.0, 49.0, 70.0, 153.0, 230.0, 188.0, 150.0, 70.0, 41.0, 22.0, 10.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-186.3714599609375, -182.85475158691406, -179.33802795410156, -175.82131958007812, -172.30459594726562, -168.7878875732422, -165.27117919921875, -161.75445556640625, -158.2377471923828, -154.72103881835938, -151.20431518554688, -147.68760681152344, -144.17088317871094, -140.6541748046875, -137.137451171875, -133.62074279785156, -130.10403442382812, -126.58731842041016, -123.07060241699219, -119.55389404296875, -116.03717803955078, -112.52046203613281, -109.00374603271484, -105.48703002929688, -101.97030639648438, -98.4535903930664, -94.93687438964844, -91.420166015625, -87.90345001220703, -84.38673400878906, -80.8700180053711, -77.35330200195312, -73.83660125732422, -70.31988525390625, -66.80316925048828, -63.28645706176758, -59.769744873046875, -56.253028869628906, -52.73631286621094, -49.21959686279297, -45.702884674072266, -42.1861686706543, -38.669456481933594, -35.152740478515625, -31.63602638244629, -28.119312286376953, -24.602596282958984, -21.08588218688965, -17.569168090820312, -14.052453994750977, -10.535738945007324, -7.019023895263672, -3.502309799194336, 0.014404296875, 3.5311203002929688, 7.047834396362305, 10.56454849243164, 14.081262588500977, 17.597976684570312, 21.11469268798828, 24.631406784057617, 28.148120880126953, 31.664836883544922, 35.181549072265625, 38.698265075683594]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 10.0, 7.0, 6.0, 11.0, 8.0, 16.0, 20.0, 27.0, 21.0, 14.0, 22.0, 29.0, 26.0, 37.0, 33.0, 42.0, 43.0, 40.0, 49.0, 28.0, 42.0, 39.0, 28.0, 39.0, 29.0, 37.0, 25.0, 33.0, 27.0, 31.0, 28.0, 30.0, 24.0, 21.0, 21.0, 16.0, 6.0, 4.0, 6.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-43.047080993652344, -41.76441955566406, -40.481754302978516, -39.199092864990234, -37.91642761230469, -36.633766174316406, -35.35110092163086, -34.06843948364258, -32.78577423095703, -31.503110885620117, -30.220447540283203, -28.93778419494629, -27.655120849609375, -26.372459411621094, -25.08979606628418, -23.807132720947266, -22.524471282958984, -21.24180793762207, -19.959144592285156, -18.676481246948242, -17.393817901611328, -16.111156463623047, -14.828493118286133, -13.545829772949219, -12.263166427612305, -10.98050308227539, -9.697839736938477, -8.415177345275879, -7.132513999938965, -5.849850654602051, -4.567187786102295, -3.284524917602539, -2.0018653869628906, -0.7192022800445557, 0.5634608268737793, 1.8461239337921143, 3.128787040710449, 4.411450386047363, 5.694113254547119, 6.976776123046875, 8.259439468383789, 9.542102813720703, 10.824766159057617, 12.107428550720215, 13.390091896057129, 14.672755241394043, 15.95541763305664, 17.238080978393555, 18.52074432373047, 19.803407669067383, 21.086071014404297, 22.36873435974121, 23.651397705078125, 24.934059143066406, 26.21672248840332, 27.499385833740234, 28.78204917907715, 30.064712524414062, 31.347375869750977, 32.63003921508789, 33.91270065307617, 35.19536590576172, 36.47802734375, 37.76068878173828, 39.04335403442383]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 3.0, 3.0, 4.0, 5.0, 12.0, 11.0, 13.0, 20.0, 20.0, 16.0, 18.0, 26.0, 30.0, 39.0, 40.0, 35.0, 44.0, 42.0, 44.0, 36.0, 58.0, 37.0, 42.0, 45.0, 42.0, 33.0, 29.0, 31.0, 23.0, 32.0, 22.0, 10.0, 21.0, 20.0, 18.0, 16.0, 11.0, 13.0, 9.0, 8.0, 2.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 2.0], "bins": [-7.27734375, -7.06268310546875, -6.8480224609375, -6.63336181640625, -6.418701171875, -6.20404052734375, -5.9893798828125, -5.77471923828125, -5.56005859375, -5.34539794921875, -5.1307373046875, -4.91607666015625, -4.701416015625, -4.48675537109375, -4.2720947265625, -4.05743408203125, -3.8427734375, -3.62811279296875, -3.4134521484375, -3.19879150390625, -2.984130859375, -2.76947021484375, -2.5548095703125, -2.34014892578125, -2.12548828125, -1.91082763671875, -1.6961669921875, -1.48150634765625, -1.266845703125, -1.05218505859375, -0.8375244140625, -0.62286376953125, -0.408203125, -0.19354248046875, 0.0211181640625, 0.23577880859375, 0.450439453125, 0.66510009765625, 0.8797607421875, 1.09442138671875, 1.30908203125, 1.52374267578125, 1.7384033203125, 1.95306396484375, 2.167724609375, 2.38238525390625, 2.5970458984375, 2.81170654296875, 3.0263671875, 3.24102783203125, 3.4556884765625, 3.67034912109375, 3.885009765625, 4.09967041015625, 4.3143310546875, 4.52899169921875, 4.74365234375, 4.95831298828125, 5.1729736328125, 5.38763427734375, 5.602294921875, 5.81695556640625, 6.0316162109375, 6.24627685546875, 6.4609375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 9.0, 12.0, 14.0, 12.0, 22.0, 15.0, 42.0, 55.0, 65.0, 88.0, 129.0, 184.0, 241.0, 395.0, 545.0, 797.0, 1168.0, 1886.0, 3054.0, 5290.0, 10251.0, 22556.0, 57961.0, 179578.0, 418661.0, 221286.0, 70482.0, 26373.0, 11801.0, 5933.0, 3386.0, 2046.0, 1358.0, 850.0, 580.0, 400.0, 253.0, 210.0, 153.0, 110.0, 79.0, 60.0, 40.0, 35.0, 26.0, 18.0, 14.0, 12.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 4.0], "bins": [-3.091796875, -2.999755859375, -2.90771484375, -2.815673828125, -2.7236328125, -2.631591796875, -2.53955078125, -2.447509765625, -2.35546875, -2.263427734375, -2.17138671875, -2.079345703125, -1.9873046875, -1.895263671875, -1.80322265625, -1.711181640625, -1.619140625, -1.527099609375, -1.43505859375, -1.343017578125, -1.2509765625, -1.158935546875, -1.06689453125, -0.974853515625, -0.8828125, -0.790771484375, -0.69873046875, -0.606689453125, -0.5146484375, -0.422607421875, -0.33056640625, -0.238525390625, -0.146484375, -0.054443359375, 0.03759765625, 0.129638671875, 0.2216796875, 0.313720703125, 0.40576171875, 0.497802734375, 0.58984375, 0.681884765625, 0.77392578125, 0.865966796875, 0.9580078125, 1.050048828125, 1.14208984375, 1.234130859375, 1.326171875, 1.418212890625, 1.51025390625, 1.602294921875, 1.6943359375, 1.786376953125, 1.87841796875, 1.970458984375, 2.0625, 2.154541015625, 2.24658203125, 2.338623046875, 2.4306640625, 2.522705078125, 2.61474609375, 2.706787109375, 2.798828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 0.0, 6.0, 8.0, 7.0, 14.0, 20.0, 10.0, 11.0, 15.0, 19.0, 21.0, 20.0, 21.0, 28.0, 29.0, 23.0, 38.0, 42.0, 38.0, 38.0, 39.0, 37.0, 1058.0, 48.0, 46.0, 35.0, 29.0, 40.0, 34.0, 31.0, 24.0, 27.0, 25.0, 27.0, 19.0, 19.0, 18.0, 11.0, 10.0, 9.0, 7.0, 5.0, 5.0, 6.0, 2.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 4.0], "bins": [-5.09765625, -4.94952392578125, -4.8013916015625, -4.65325927734375, -4.505126953125, -4.35699462890625, -4.2088623046875, -4.06072998046875, -3.91259765625, -3.76446533203125, -3.6163330078125, -3.46820068359375, -3.320068359375, -3.17193603515625, -3.0238037109375, -2.87567138671875, -2.7275390625, -2.57940673828125, -2.4312744140625, -2.28314208984375, -2.135009765625, -1.98687744140625, -1.8387451171875, -1.69061279296875, -1.54248046875, -1.39434814453125, -1.2462158203125, -1.09808349609375, -0.949951171875, -0.80181884765625, -0.6536865234375, -0.50555419921875, -0.357421875, -0.20928955078125, -0.0611572265625, 0.08697509765625, 0.235107421875, 0.38323974609375, 0.5313720703125, 0.67950439453125, 0.82763671875, 0.97576904296875, 1.1239013671875, 1.27203369140625, 1.420166015625, 1.56829833984375, 1.7164306640625, 1.86456298828125, 2.0126953125, 2.16082763671875, 2.3089599609375, 2.45709228515625, 2.605224609375, 2.75335693359375, 2.9014892578125, 3.04962158203125, 3.19775390625, 3.34588623046875, 3.4940185546875, 3.64215087890625, 3.790283203125, 3.93841552734375, 4.0865478515625, 4.23468017578125, 4.3828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 7.0, 2.0, 9.0, 14.0, 19.0, 26.0, 40.0, 54.0, 81.0, 105.0, 146.0, 229.0, 371.0, 634.0, 1041.0, 1901.0, 3298.0, 6499.0, 14090.0, 39289.0, 172693.0, 1419835.0, 336915.0, 62006.0, 19574.0, 8470.0, 4152.0, 2274.0, 1251.0, 759.0, 443.0, 280.0, 197.0, 113.0, 88.0, 55.0, 50.0, 29.0, 20.0, 17.0, 13.0, 10.0, 17.0, 6.0, 3.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.841796875, -2.75482177734375, -2.6678466796875, -2.58087158203125, -2.493896484375, -2.40692138671875, -2.3199462890625, -2.23297119140625, -2.14599609375, -2.05902099609375, -1.9720458984375, -1.88507080078125, -1.798095703125, -1.71112060546875, -1.6241455078125, -1.53717041015625, -1.4501953125, -1.36322021484375, -1.2762451171875, -1.18927001953125, -1.102294921875, -1.01531982421875, -0.9283447265625, -0.84136962890625, -0.75439453125, -0.66741943359375, -0.5804443359375, -0.49346923828125, -0.406494140625, -0.31951904296875, -0.2325439453125, -0.14556884765625, -0.05859375, 0.02838134765625, 0.1153564453125, 0.20233154296875, 0.289306640625, 0.37628173828125, 0.4632568359375, 0.55023193359375, 0.63720703125, 0.72418212890625, 0.8111572265625, 0.89813232421875, 0.985107421875, 1.07208251953125, 1.1590576171875, 1.24603271484375, 1.3330078125, 1.41998291015625, 1.5069580078125, 1.59393310546875, 1.680908203125, 1.76788330078125, 1.8548583984375, 1.94183349609375, 2.02880859375, 2.11578369140625, 2.2027587890625, 2.28973388671875, 2.376708984375, 2.46368408203125, 2.5506591796875, 2.63763427734375, 2.724609375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 2.0, 1.0, 9.0, 6.0, 9.0, 6.0, 10.0, 18.0, 23.0, 66.0, 74.0, 144.0, 252.0, 129.0, 74.0, 54.0, 27.0, 22.0, 9.0, 7.0, 9.0, 6.0, 9.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.927734375, -0.897125244140625, -0.86651611328125, -0.835906982421875, -0.8052978515625, -0.774688720703125, -0.74407958984375, -0.713470458984375, -0.682861328125, -0.652252197265625, -0.62164306640625, -0.591033935546875, -0.5604248046875, -0.529815673828125, -0.49920654296875, -0.468597412109375, -0.43798828125, -0.407379150390625, -0.37677001953125, -0.346160888671875, -0.3155517578125, -0.284942626953125, -0.25433349609375, -0.223724365234375, -0.193115234375, -0.162506103515625, -0.13189697265625, -0.101287841796875, -0.0706787109375, -0.040069580078125, -0.00946044921875, 0.021148681640625, 0.0517578125, 0.082366943359375, 0.11297607421875, 0.143585205078125, 0.1741943359375, 0.204803466796875, 0.23541259765625, 0.266021728515625, 0.296630859375, 0.327239990234375, 0.35784912109375, 0.388458251953125, 0.4190673828125, 0.449676513671875, 0.48028564453125, 0.510894775390625, 0.54150390625, 0.572113037109375, 0.60272216796875, 0.633331298828125, 0.6639404296875, 0.694549560546875, 0.72515869140625, 0.755767822265625, 0.786376953125, 0.816986083984375, 0.84759521484375, 0.878204345703125, 0.9088134765625, 0.939422607421875, 0.97003173828125, 1.000640869140625, 1.03125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 10.0, 4.0, 13.0, 10.0, 21.0, 20.0, 24.0, 37.0, 40.0, 74.0, 89.0, 148.0, 372.0, 2973.0, 65509.0, 968625.0, 9176.0, 773.0, 196.0, 130.0, 43.0, 53.0, 40.0, 27.0, 25.0, 15.0, 15.0, 12.0, 12.0, 11.0, 5.0, 3.0, 5.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-14.8828125, -14.44775390625, -14.0126953125, -13.57763671875, -13.142578125, -12.70751953125, -12.2724609375, -11.83740234375, -11.40234375, -10.96728515625, -10.5322265625, -10.09716796875, -9.662109375, -9.22705078125, -8.7919921875, -8.35693359375, -7.921875, -7.48681640625, -7.0517578125, -6.61669921875, -6.181640625, -5.74658203125, -5.3115234375, -4.87646484375, -4.44140625, -4.00634765625, -3.5712890625, -3.13623046875, -2.701171875, -2.26611328125, -1.8310546875, -1.39599609375, -0.9609375, -0.52587890625, -0.0908203125, 0.34423828125, 0.779296875, 1.21435546875, 1.6494140625, 2.08447265625, 2.51953125, 2.95458984375, 3.3896484375, 3.82470703125, 4.259765625, 4.69482421875, 5.1298828125, 5.56494140625, 6.0, 6.43505859375, 6.8701171875, 7.30517578125, 7.740234375, 8.17529296875, 8.6103515625, 9.04541015625, 9.48046875, 9.91552734375, 10.3505859375, 10.78564453125, 11.220703125, 11.65576171875, 12.0908203125, 12.52587890625, 12.9609375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 18.0, 97.0, 467.0, 362.0, 58.0, 11.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.233728408813477, -4.069983005523682, -3.9062376022338867, -3.742492198944092, -3.578746795654297, -3.415001392364502, -3.251255989074707, -3.087510585784912, -2.923765182495117, -2.7600197792053223, -2.5962743759155273, -2.4325289726257324, -2.2687835693359375, -2.1050381660461426, -1.941292643547058, -1.7775472402572632, -1.6138017177581787, -1.4500563144683838, -1.2863109111785889, -1.122565507888794, -0.9588200449943542, -0.7950746417045593, -0.6313291788101196, -0.4675837755203247, -0.3038383722305298, -0.14009295403957367, 0.023652464151382446, 0.18739789724349976, 0.3511433005332947, 0.5148887038230896, 0.6786341667175293, 0.8423795700073242, 1.0061249732971191, 1.169870376586914, 1.333615779876709, 1.497361183166504, 1.6611065864562988, 1.8248519897460938, 1.9885975122451782, 2.1523427963256836, 2.3160881996154785, 2.4798336029052734, 2.6435790061950684, 2.8073244094848633, 2.971069812774658, 3.134815216064453, 3.298560619354248, 3.462306022644043, 3.626051664352417, 3.789797067642212, 3.953542470932007, 4.117288112640381, 4.281033515930176, 4.444778919219971, 4.608524322509766, 4.7722697257995605, 4.9360151290893555, 5.09976053237915, 5.263505935668945, 5.42725133895874, 5.590996742248535, 5.75474214553833, 5.918487548828125, 6.08223295211792, 6.245978355407715]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 6.0, 9.0, 16.0, 13.0, 17.0, 18.0, 20.0, 31.0, 22.0, 29.0, 23.0, 34.0, 29.0, 30.0, 46.0, 39.0, 41.0, 50.0, 44.0, 49.0, 37.0, 45.0, 36.0, 34.0, 43.0, 40.0, 38.0, 34.0, 22.0, 25.0, 21.0, 11.0, 6.0, 6.0, 6.0, 4.0, 2.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0], "bins": [-0.9355704188346863, -0.9113280177116394, -0.8870856165885925, -0.8628432154655457, -0.8386008143424988, -0.8143584132194519, -0.7901160717010498, -0.7658736705780029, -0.741631269454956, -0.7173888683319092, -0.6931464672088623, -0.6689040660858154, -0.6446616649627686, -0.6204192638397217, -0.5961768627166748, -0.5719344615936279, -0.547692060470581, -0.5234496593475342, -0.4992072582244873, -0.47496485710144043, -0.45072245597839355, -0.4264800548553467, -0.4022376835346222, -0.3779952824115753, -0.35375288128852844, -0.32951048016548157, -0.3052680790424347, -0.2810257077217102, -0.25678330659866333, -0.23254089057445526, -0.20829850435256958, -0.1840561032295227, -0.15981364250183105, -0.13557124137878418, -0.1113288477063179, -0.08708645403385162, -0.06284405291080475, -0.038601651787757874, -0.014359265565872192, 0.009883135557174683, 0.03412553668022156, 0.058367934077978134, 0.08261033147573471, 0.10685272514820099, 0.13109512627124786, 0.15533752739429474, 0.17957991361618042, 0.2038223147392273, 0.22806471586227417, 0.25230711698532104, 0.2765495181083679, 0.3007919192314148, 0.32503432035446167, 0.34927672147750854, 0.37351909279823303, 0.3977614939212799, 0.4220038950443268, 0.44624629616737366, 0.47048869729042053, 0.494731068611145, 0.5189734697341919, 0.5432158708572388, 0.5674582719802856, 0.5917006731033325, 0.6159430742263794]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 14.0, 6.0, 15.0, 15.0, 21.0, 13.0, 23.0, 21.0, 30.0, 24.0, 35.0, 42.0, 31.0, 43.0, 45.0, 39.0, 41.0, 41.0, 45.0, 37.0, 36.0, 41.0, 34.0, 36.0, 29.0, 26.0, 19.0, 19.0, 18.0, 24.0, 16.0, 12.0, 24.0, 19.0, 17.0, 8.0, 3.0, 8.0, 2.0, 8.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-6.89453125, -6.6868896484375, -6.479248046875, -6.2716064453125, -6.06396484375, -5.8563232421875, -5.648681640625, -5.4410400390625, -5.2333984375, -5.0257568359375, -4.818115234375, -4.6104736328125, -4.40283203125, -4.1951904296875, -3.987548828125, -3.7799072265625, -3.572265625, -3.3646240234375, -3.156982421875, -2.9493408203125, -2.74169921875, -2.5340576171875, -2.326416015625, -2.1187744140625, -1.9111328125, -1.7034912109375, -1.495849609375, -1.2882080078125, -1.08056640625, -0.8729248046875, -0.665283203125, -0.4576416015625, -0.25, -0.0423583984375, 0.165283203125, 0.3729248046875, 0.58056640625, 0.7882080078125, 0.995849609375, 1.2034912109375, 1.4111328125, 1.6187744140625, 1.826416015625, 2.0340576171875, 2.24169921875, 2.4493408203125, 2.656982421875, 2.8646240234375, 3.072265625, 3.2799072265625, 3.487548828125, 3.6951904296875, 3.90283203125, 4.1104736328125, 4.318115234375, 4.5257568359375, 4.7333984375, 4.9410400390625, 5.148681640625, 5.3563232421875, 5.56396484375, 5.7716064453125, 5.979248046875, 6.1868896484375, 6.39453125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 8.0, 8.0, 14.0, 21.0, 32.0, 38.0, 45.0, 65.0, 93.0, 135.0, 198.0, 230.0, 335.0, 450.0, 657.0, 1002.0, 1506.0, 2346.0, 3994.0, 7110.0, 13138.0, 26401.0, 59939.0, 184718.0, 480147.0, 158206.0, 54143.0, 24192.0, 12171.0, 6532.0, 3788.0, 2331.0, 1431.0, 878.0, 642.0, 436.0, 330.0, 215.0, 153.0, 122.0, 100.0, 60.0, 64.0, 37.0, 30.0, 13.0, 18.0, 16.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-10.9609375, -10.6331787109375, -10.305419921875, -9.9776611328125, -9.64990234375, -9.3221435546875, -8.994384765625, -8.6666259765625, -8.3388671875, -8.0111083984375, -7.683349609375, -7.3555908203125, -7.02783203125, -6.7000732421875, -6.372314453125, -6.0445556640625, -5.716796875, -5.3890380859375, -5.061279296875, -4.7335205078125, -4.40576171875, -4.0780029296875, -3.750244140625, -3.4224853515625, -3.0947265625, -2.7669677734375, -2.439208984375, -2.1114501953125, -1.78369140625, -1.4559326171875, -1.128173828125, -0.8004150390625, -0.47265625, -0.1448974609375, 0.182861328125, 0.5106201171875, 0.83837890625, 1.1661376953125, 1.493896484375, 1.8216552734375, 2.1494140625, 2.4771728515625, 2.804931640625, 3.1326904296875, 3.46044921875, 3.7882080078125, 4.115966796875, 4.4437255859375, 4.771484375, 5.0992431640625, 5.427001953125, 5.7547607421875, 6.08251953125, 6.4102783203125, 6.738037109375, 7.0657958984375, 7.3935546875, 7.7213134765625, 8.049072265625, 8.3768310546875, 8.70458984375, 9.0323486328125, 9.360107421875, 9.6878662109375, 10.015625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 1.0, 2.0, 6.0, 7.0, 10.0, 3.0, 8.0, 12.0, 16.0, 17.0, 18.0, 29.0, 27.0, 20.0, 44.0, 36.0, 47.0, 43.0, 51.0, 55.0, 86.0, 164.0, 336.0, 1370.0, 171.0, 82.0, 51.0, 35.0, 39.0, 37.0, 33.0, 34.0, 27.0, 21.0, 18.0, 14.0, 15.0, 14.0, 7.0, 8.0, 19.0, 6.0, 2.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.96875, -22.273193359375, -21.57763671875, -20.882080078125, -20.1865234375, -19.490966796875, -18.79541015625, -18.099853515625, -17.404296875, -16.708740234375, -16.01318359375, -15.317626953125, -14.6220703125, -13.926513671875, -13.23095703125, -12.535400390625, -11.83984375, -11.144287109375, -10.44873046875, -9.753173828125, -9.0576171875, -8.362060546875, -7.66650390625, -6.970947265625, -6.275390625, -5.579833984375, -4.88427734375, -4.188720703125, -3.4931640625, -2.797607421875, -2.10205078125, -1.406494140625, -0.7109375, -0.015380859375, 0.68017578125, 1.375732421875, 2.0712890625, 2.766845703125, 3.46240234375, 4.157958984375, 4.853515625, 5.549072265625, 6.24462890625, 6.940185546875, 7.6357421875, 8.331298828125, 9.02685546875, 9.722412109375, 10.41796875, 11.113525390625, 11.80908203125, 12.504638671875, 13.2001953125, 13.895751953125, 14.59130859375, 15.286865234375, 15.982421875, 16.677978515625, 17.37353515625, 18.069091796875, 18.7646484375, 19.460205078125, 20.15576171875, 20.851318359375, 21.546875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 9.0, 6.0, 13.0, 6.0, 14.0, 16.0, 20.0, 25.0, 23.0, 30.0, 45.0, 40.0, 66.0, 89.0, 113.0, 149.0, 234.0, 499.0, 1711.0, 10670.0, 239140.0, 2844217.0, 41985.0, 4476.0, 915.0, 342.0, 202.0, 154.0, 108.0, 75.0, 64.0, 33.0, 42.0, 41.0, 30.0, 18.0, 19.0, 11.0, 10.0, 11.0, 7.0, 2.0, 5.0, 6.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0], "bins": [-52.65625, -51.07373046875, -49.4912109375, -47.90869140625, -46.326171875, -44.74365234375, -43.1611328125, -41.57861328125, -39.99609375, -38.41357421875, -36.8310546875, -35.24853515625, -33.666015625, -32.08349609375, -30.5009765625, -28.91845703125, -27.3359375, -25.75341796875, -24.1708984375, -22.58837890625, -21.005859375, -19.42333984375, -17.8408203125, -16.25830078125, -14.67578125, -13.09326171875, -11.5107421875, -9.92822265625, -8.345703125, -6.76318359375, -5.1806640625, -3.59814453125, -2.015625, -0.43310546875, 1.1494140625, 2.73193359375, 4.314453125, 5.89697265625, 7.4794921875, 9.06201171875, 10.64453125, 12.22705078125, 13.8095703125, 15.39208984375, 16.974609375, 18.55712890625, 20.1396484375, 21.72216796875, 23.3046875, 24.88720703125, 26.4697265625, 28.05224609375, 29.634765625, 31.21728515625, 32.7998046875, 34.38232421875, 35.96484375, 37.54736328125, 39.1298828125, 40.71240234375, 42.294921875, 43.87744140625, 45.4599609375, 47.04248046875, 48.625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 6.0, 60.0, 277.0, 474.0, 164.0, 30.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.5859432220459, -25.71642303466797, -20.846904754638672, -15.977384567260742, -11.107864379882812, -6.238344192504883, -1.368825912475586, 3.5006961822509766, 8.370214462280273, 13.239734649658203, 18.1092529296875, 22.97877311706543, 27.84829330444336, 32.717811584472656, 37.58733367919922, 42.45685577392578, 47.32637023925781, 52.19588851928711, 57.06541061401367, 61.93492889404297, 66.80445098876953, 71.67396545410156, 76.54348754882812, 81.41300964355469, 86.28253173828125, 91.15205383300781, 96.02156829833984, 100.8910903930664, 105.76061248779297, 110.630126953125, 115.49964904785156, 120.36917114257812, 125.23869323730469, 130.10821533203125, 134.9777374267578, 139.84725952148438, 144.71676635742188, 149.58628845214844, 154.455810546875, 159.32533264160156, 164.19485473632812, 169.0643768310547, 173.93389892578125, 178.80340576171875, 183.6729278564453, 188.54244995117188, 193.41197204589844, 198.281494140625, 203.1510009765625, 208.02052307128906, 212.89004516601562, 217.75955200195312, 222.6290740966797, 227.49859619140625, 232.3681182861328, 237.23764038085938, 242.10716247558594, 246.9766845703125, 251.84620666503906, 256.7157287597656, 261.5852355957031, 266.45477294921875, 271.32427978515625, 276.19378662109375, 281.0633239746094]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 9.0, 18.0, 11.0, 12.0, 18.0, 17.0, 22.0, 24.0, 26.0, 27.0, 20.0, 30.0, 35.0, 36.0, 36.0, 39.0, 47.0, 48.0, 43.0, 46.0, 33.0, 55.0, 28.0, 31.0, 29.0, 26.0, 24.0, 32.0, 22.0, 19.0, 18.0, 18.0, 17.0, 11.0, 6.0, 12.0, 13.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-55.228755950927734, -53.60174560546875, -51.974735260009766, -50.34772491455078, -48.72071838378906, -47.09370422363281, -45.466697692871094, -43.83968734741211, -42.212677001953125, -40.58566665649414, -38.958656311035156, -37.33164596557617, -35.70463562011719, -34.07762908935547, -32.450618743896484, -30.8236083984375, -29.196598052978516, -27.56958770751953, -25.942577362060547, -24.315568923950195, -22.68855857849121, -21.061548233032227, -19.434539794921875, -17.80752944946289, -16.180519104003906, -14.553508758544922, -12.926499366760254, -11.299489974975586, -9.672479629516602, -8.045469284057617, -6.418459892272949, -4.791450500488281, -3.164440155029297, -1.5374302864074707, 0.08957958221435547, 1.7165894508361816, 3.343599319458008, 4.970609664916992, 6.59761905670166, 8.224628448486328, 9.851638793945312, 11.478649139404297, 13.105658531188965, 14.732667922973633, 16.359678268432617, 17.9866886138916, 19.613697052001953, 21.240707397460938, 22.867717742919922, 24.494728088378906, 26.12173843383789, 27.748746871948242, 29.375757217407227, 31.00276756286621, 32.62977600097656, 34.25678634643555, 35.88379669189453, 37.510807037353516, 39.1378173828125, 40.764827728271484, 42.39183807373047, 44.01884460449219, 45.64585494995117, 47.272865295410156, 48.89987564086914]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 5.0, 7.0, 10.0, 11.0, 16.0, 19.0, 16.0, 21.0, 16.0, 19.0, 28.0, 29.0, 36.0, 40.0, 37.0, 34.0, 28.0, 39.0, 45.0, 45.0, 34.0, 43.0, 25.0, 38.0, 46.0, 19.0, 26.0, 17.0, 32.0, 27.0, 27.0, 24.0, 15.0, 12.0, 18.0, 12.0, 13.0, 10.0, 9.0, 7.0, 7.0, 8.0, 4.0, 5.0, 3.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.51953125, -6.31005859375, -6.1005859375, -5.89111328125, -5.681640625, -5.47216796875, -5.2626953125, -5.05322265625, -4.84375, -4.63427734375, -4.4248046875, -4.21533203125, -4.005859375, -3.79638671875, -3.5869140625, -3.37744140625, -3.16796875, -2.95849609375, -2.7490234375, -2.53955078125, -2.330078125, -2.12060546875, -1.9111328125, -1.70166015625, -1.4921875, -1.28271484375, -1.0732421875, -0.86376953125, -0.654296875, -0.44482421875, -0.2353515625, -0.02587890625, 0.18359375, 0.39306640625, 0.6025390625, 0.81201171875, 1.021484375, 1.23095703125, 1.4404296875, 1.64990234375, 1.859375, 2.06884765625, 2.2783203125, 2.48779296875, 2.697265625, 2.90673828125, 3.1162109375, 3.32568359375, 3.53515625, 3.74462890625, 3.9541015625, 4.16357421875, 4.373046875, 4.58251953125, 4.7919921875, 5.00146484375, 5.2109375, 5.42041015625, 5.6298828125, 5.83935546875, 6.048828125, 6.25830078125, 6.4677734375, 6.67724609375, 6.88671875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 7.0, 14.0, 11.0, 17.0, 24.0, 36.0, 43.0, 85.0, 92.0, 142.0, 219.0, 308.0, 517.0, 845.0, 1417.0, 2508.0, 4948.0, 11349.0, 35090.0, 229704.0, 2059667.0, 1638267.0, 157631.0, 29423.0, 10803.0, 4804.0, 2500.0, 1404.0, 821.0, 502.0, 349.0, 226.0, 145.0, 90.0, 75.0, 60.0, 42.0, 22.0, 27.0, 14.0, 11.0, 7.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0], "bins": [-17.828125, -17.3319091796875, -16.835693359375, -16.3394775390625, -15.84326171875, -15.3470458984375, -14.850830078125, -14.3546142578125, -13.8583984375, -13.3621826171875, -12.865966796875, -12.3697509765625, -11.87353515625, -11.3773193359375, -10.881103515625, -10.3848876953125, -9.888671875, -9.3924560546875, -8.896240234375, -8.4000244140625, -7.90380859375, -7.4075927734375, -6.911376953125, -6.4151611328125, -5.9189453125, -5.4227294921875, -4.926513671875, -4.4302978515625, -3.93408203125, -3.4378662109375, -2.941650390625, -2.4454345703125, -1.94921875, -1.4530029296875, -0.956787109375, -0.4605712890625, 0.03564453125, 0.5318603515625, 1.028076171875, 1.5242919921875, 2.0205078125, 2.5167236328125, 3.012939453125, 3.5091552734375, 4.00537109375, 4.5015869140625, 4.997802734375, 5.4940185546875, 5.990234375, 6.4864501953125, 6.982666015625, 7.4788818359375, 7.97509765625, 8.4713134765625, 8.967529296875, 9.4637451171875, 9.9599609375, 10.4561767578125, 10.952392578125, 11.4486083984375, 11.94482421875, 12.4410400390625, 12.937255859375, 13.4334716796875, 13.9296875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 4.0, 7.0, 7.0, 15.0, 19.0, 15.0, 30.0, 30.0, 46.0, 53.0, 68.0, 96.0, 120.0, 176.0, 279.0, 381.0, 585.0, 607.0, 480.0, 303.0, 217.0, 138.0, 93.0, 59.0, 60.0, 34.0, 29.0, 23.0, 18.0, 7.0, 9.0, 16.0, 8.0, 3.0, 8.0, 2.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-14.0546875, -13.654052734375, -13.25341796875, -12.852783203125, -12.4521484375, -12.051513671875, -11.65087890625, -11.250244140625, -10.849609375, -10.448974609375, -10.04833984375, -9.647705078125, -9.2470703125, -8.846435546875, -8.44580078125, -8.045166015625, -7.64453125, -7.243896484375, -6.84326171875, -6.442626953125, -6.0419921875, -5.641357421875, -5.24072265625, -4.840087890625, -4.439453125, -4.038818359375, -3.63818359375, -3.237548828125, -2.8369140625, -2.436279296875, -2.03564453125, -1.635009765625, -1.234375, -0.833740234375, -0.43310546875, -0.032470703125, 0.3681640625, 0.768798828125, 1.16943359375, 1.570068359375, 1.970703125, 2.371337890625, 2.77197265625, 3.172607421875, 3.5732421875, 3.973876953125, 4.37451171875, 4.775146484375, 5.17578125, 5.576416015625, 5.97705078125, 6.377685546875, 6.7783203125, 7.178955078125, 7.57958984375, 7.980224609375, 8.380859375, 8.781494140625, 9.18212890625, 9.582763671875, 9.9833984375, 10.384033203125, 10.78466796875, 11.185302734375, 11.5859375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 3.0, 6.0, 3.0, 1.0, 2.0, 4.0, 3.0, 9.0, 9.0, 8.0, 13.0, 18.0, 20.0, 29.0, 39.0, 66.0, 70.0, 124.0, 216.0, 494.0, 2219.0, 22078.0, 1008329.0, 3113031.0, 42587.0, 3484.0, 660.0, 266.0, 133.0, 92.0, 60.0, 60.0, 36.0, 31.0, 28.0, 12.0, 10.0, 10.0, 5.0, 9.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.625, -37.14599609375, -35.6669921875, -34.18798828125, -32.708984375, -31.22998046875, -29.7509765625, -28.27197265625, -26.79296875, -25.31396484375, -23.8349609375, -22.35595703125, -20.876953125, -19.39794921875, -17.9189453125, -16.43994140625, -14.9609375, -13.48193359375, -12.0029296875, -10.52392578125, -9.044921875, -7.56591796875, -6.0869140625, -4.60791015625, -3.12890625, -1.64990234375, -0.1708984375, 1.30810546875, 2.787109375, 4.26611328125, 5.7451171875, 7.22412109375, 8.703125, 10.18212890625, 11.6611328125, 13.14013671875, 14.619140625, 16.09814453125, 17.5771484375, 19.05615234375, 20.53515625, 22.01416015625, 23.4931640625, 24.97216796875, 26.451171875, 27.93017578125, 29.4091796875, 30.88818359375, 32.3671875, 33.84619140625, 35.3251953125, 36.80419921875, 38.283203125, 39.76220703125, 41.2412109375, 42.72021484375, 44.19921875, 45.67822265625, 47.1572265625, 48.63623046875, 50.115234375, 51.59423828125, 53.0732421875, 54.55224609375, 56.03125]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 15.0, 51.0, 196.0, 364.0, 255.0, 97.0, 23.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-267.5663146972656, -262.0649108886719, -256.56353759765625, -251.0621337890625, -245.56072998046875, -240.05934143066406, -234.55795288085938, -229.05654907226562, -223.55516052246094, -218.05377197265625, -212.5523681640625, -207.0509796142578, -201.54957580566406, -196.04818725585938, -190.54678344726562, -185.04539489746094, -179.54400634765625, -174.04261779785156, -168.5412139892578, -163.03982543945312, -157.53842163085938, -152.0370330810547, -146.53564453125, -141.03424072265625, -135.5328369140625, -130.0314483642578, -124.53004455566406, -119.02865600585938, -113.52725982666016, -108.02586364746094, -102.52446746826172, -97.0230712890625, -91.52169036865234, -86.02029418945312, -80.5188980102539, -75.01750183105469, -69.51611328125, -64.01471710205078, -58.51332092285156, -53.01192855834961, -47.51053237915039, -42.00913619995117, -36.50774383544922, -31.00634765625, -25.504953384399414, -20.003559112548828, -14.50216293334961, -9.000770568847656, -3.4993743896484375, 2.0020203590393066, 7.503415107727051, 13.004810333251953, 18.50620460510254, 24.007598876953125, 29.508995056152344, 35.0103874206543, 40.511783599853516, 46.013179779052734, 51.51457214355469, 57.015968322753906, 62.517364501953125, 68.01875305175781, 73.52015686035156, 79.02154541015625, 84.52294158935547]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 14.0, 10.0, 30.0, 27.0, 25.0, 25.0, 28.0, 22.0, 25.0, 48.0, 46.0, 43.0, 44.0, 46.0, 55.0, 55.0, 48.0, 42.0, 38.0, 38.0, 32.0, 37.0, 35.0, 24.0, 29.0, 25.0, 13.0, 12.0, 15.0, 9.0, 7.0, 6.0, 6.0, 7.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.775054931640625, -46.30236053466797, -44.82966613769531, -43.356971740722656, -41.88427734375, -40.411582946777344, -38.93888854980469, -37.46619415283203, -35.993499755859375, -34.52080535888672, -33.04811096191406, -31.575416564941406, -30.10272216796875, -28.630027770996094, -27.157331466674805, -25.68463706970215, -24.21194076538086, -22.739246368408203, -21.266551971435547, -19.79385757446289, -18.321163177490234, -16.848468780517578, -15.375772476196289, -13.903078079223633, -12.430383682250977, -10.95768928527832, -9.484994888305664, -8.012299537658691, -6.539605140686035, -5.066910743713379, -3.5942153930664062, -2.12152099609375, -0.6488304138183594, 0.823864221572876, 2.2965588569641113, 3.769253730773926, 5.241948127746582, 6.714642524719238, 8.187337875366211, 9.660032272338867, 11.132726669311523, 12.60542106628418, 14.078115463256836, 15.550810813903809, 17.02350616455078, 18.496200561523438, 19.968894958496094, 21.44158935546875, 22.914283752441406, 24.386978149414062, 25.85967254638672, 27.332366943359375, 28.80506134033203, 30.277755737304688, 31.750452041625977, 33.22314453125, 34.695838928222656, 36.16853332519531, 37.64122772216797, 39.113922119140625, 40.58661651611328, 42.05931091308594, 43.532005310058594, 45.00469970703125, 46.47739791870117]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 6.0, 5.0, 7.0, 8.0, 2.0, 13.0, 7.0, 15.0, 24.0, 13.0, 15.0, 21.0, 28.0, 25.0, 33.0, 36.0, 47.0, 33.0, 37.0, 29.0, 35.0, 41.0, 47.0, 40.0, 39.0, 43.0, 39.0, 30.0, 29.0, 23.0, 26.0, 31.0, 16.0, 26.0, 29.0, 17.0, 12.0, 17.0, 15.0, 5.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-6.4140625, -6.21038818359375, -6.0067138671875, -5.80303955078125, -5.599365234375, -5.39569091796875, -5.1920166015625, -4.98834228515625, -4.78466796875, -4.58099365234375, -4.3773193359375, -4.17364501953125, -3.969970703125, -3.76629638671875, -3.5626220703125, -3.35894775390625, -3.1552734375, -2.95159912109375, -2.7479248046875, -2.54425048828125, -2.340576171875, -2.13690185546875, -1.9332275390625, -1.72955322265625, -1.52587890625, -1.32220458984375, -1.1185302734375, -0.91485595703125, -0.711181640625, -0.50750732421875, -0.3038330078125, -0.10015869140625, 0.103515625, 0.30718994140625, 0.5108642578125, 0.71453857421875, 0.918212890625, 1.12188720703125, 1.3255615234375, 1.52923583984375, 1.73291015625, 1.93658447265625, 2.1402587890625, 2.34393310546875, 2.547607421875, 2.75128173828125, 2.9549560546875, 3.15863037109375, 3.3623046875, 3.56597900390625, 3.7696533203125, 3.97332763671875, 4.177001953125, 4.38067626953125, 4.5843505859375, 4.78802490234375, 4.99169921875, 5.19537353515625, 5.3990478515625, 5.60272216796875, 5.806396484375, 6.01007080078125, 6.2137451171875, 6.41741943359375, 6.62109375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 10.0, 6.0, 16.0, 32.0, 32.0, 43.0, 102.0, 142.0, 208.0, 317.0, 470.0, 696.0, 1137.0, 1678.0, 2644.0, 4201.0, 6693.0, 10897.0, 17992.0, 30775.0, 53420.0, 97926.0, 179495.0, 248217.0, 171706.0, 93223.0, 51447.0, 29146.0, 17448.0, 10643.0, 6458.0, 4060.0, 2537.0, 1609.0, 1084.0, 717.0, 448.0, 316.0, 200.0, 130.0, 81.0, 53.0, 30.0, 31.0, 16.0, 9.0, 10.0, 9.0, 0.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0830078125, -1.047454833984375, -1.01190185546875, -0.976348876953125, -0.9407958984375, -0.905242919921875, -0.86968994140625, -0.834136962890625, -0.798583984375, -0.763031005859375, -0.72747802734375, -0.691925048828125, -0.6563720703125, -0.620819091796875, -0.58526611328125, -0.549713134765625, -0.51416015625, -0.478607177734375, -0.44305419921875, -0.407501220703125, -0.3719482421875, -0.336395263671875, -0.30084228515625, -0.265289306640625, -0.229736328125, -0.194183349609375, -0.15863037109375, -0.123077392578125, -0.0875244140625, -0.051971435546875, -0.01641845703125, 0.019134521484375, 0.0546875, 0.090240478515625, 0.12579345703125, 0.161346435546875, 0.1968994140625, 0.232452392578125, 0.26800537109375, 0.303558349609375, 0.339111328125, 0.374664306640625, 0.41021728515625, 0.445770263671875, 0.4813232421875, 0.516876220703125, 0.55242919921875, 0.587982177734375, 0.62353515625, 0.659088134765625, 0.69464111328125, 0.730194091796875, 0.7657470703125, 0.801300048828125, 0.83685302734375, 0.872406005859375, 0.907958984375, 0.943511962890625, 0.97906494140625, 1.014617919921875, 1.0501708984375, 1.085723876953125, 1.12127685546875, 1.156829833984375, 1.1923828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 4.0, 3.0, 8.0, 7.0, 7.0, 14.0, 13.0, 13.0, 16.0, 12.0, 24.0, 19.0, 19.0, 18.0, 39.0, 34.0, 36.0, 40.0, 51.0, 40.0, 37.0, 1070.0, 42.0, 42.0, 39.0, 31.0, 37.0, 32.0, 33.0, 43.0, 23.0, 22.0, 28.0, 19.0, 17.0, 15.0, 12.0, 12.0, 15.0, 10.0, 7.0, 5.0, 6.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.07867431640625, -3.9307861328125, -3.78289794921875, -3.635009765625, -3.48712158203125, -3.3392333984375, -3.19134521484375, -3.04345703125, -2.89556884765625, -2.7476806640625, -2.59979248046875, -2.451904296875, -2.30401611328125, -2.1561279296875, -2.00823974609375, -1.8603515625, -1.71246337890625, -1.5645751953125, -1.41668701171875, -1.268798828125, -1.12091064453125, -0.9730224609375, -0.82513427734375, -0.67724609375, -0.52935791015625, -0.3814697265625, -0.23358154296875, -0.085693359375, 0.06219482421875, 0.2100830078125, 0.35797119140625, 0.505859375, 0.65374755859375, 0.8016357421875, 0.94952392578125, 1.097412109375, 1.24530029296875, 1.3931884765625, 1.54107666015625, 1.68896484375, 1.83685302734375, 1.9847412109375, 2.13262939453125, 2.280517578125, 2.42840576171875, 2.5762939453125, 2.72418212890625, 2.8720703125, 3.01995849609375, 3.1678466796875, 3.31573486328125, 3.463623046875, 3.61151123046875, 3.7593994140625, 3.90728759765625, 4.05517578125, 4.20306396484375, 4.3509521484375, 4.49884033203125, 4.646728515625, 4.79461669921875, 4.9425048828125, 5.09039306640625, 5.23828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 7.0, 3.0, 2.0, 14.0, 10.0, 27.0, 20.0, 37.0, 59.0, 103.0, 142.0, 243.0, 435.0, 750.0, 1384.0, 2513.0, 5232.0, 11046.0, 25182.0, 60419.0, 165341.0, 1118515.0, 501342.0, 120652.0, 46224.0, 19638.0, 8737.0, 4261.0, 2134.0, 1110.0, 651.0, 337.0, 222.0, 110.0, 75.0, 58.0, 39.0, 29.0, 10.0, 8.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.3505859375, -1.314910888671875, -1.27923583984375, -1.243560791015625, -1.2078857421875, -1.172210693359375, -1.13653564453125, -1.100860595703125, -1.065185546875, -1.029510498046875, -0.99383544921875, -0.958160400390625, -0.9224853515625, -0.886810302734375, -0.85113525390625, -0.815460205078125, -0.77978515625, -0.744110107421875, -0.70843505859375, -0.672760009765625, -0.6370849609375, -0.601409912109375, -0.56573486328125, -0.530059814453125, -0.494384765625, -0.458709716796875, -0.42303466796875, -0.387359619140625, -0.3516845703125, -0.316009521484375, -0.28033447265625, -0.244659423828125, -0.208984375, -0.173309326171875, -0.13763427734375, -0.101959228515625, -0.0662841796875, -0.030609130859375, 0.00506591796875, 0.040740966796875, 0.076416015625, 0.112091064453125, 0.14776611328125, 0.183441162109375, 0.2191162109375, 0.254791259765625, 0.29046630859375, 0.326141357421875, 0.36181640625, 0.397491455078125, 0.43316650390625, 0.468841552734375, 0.5045166015625, 0.540191650390625, 0.57586669921875, 0.611541748046875, 0.647216796875, 0.682891845703125, 0.71856689453125, 0.754241943359375, 0.7899169921875, 0.825592041015625, 0.86126708984375, 0.896942138671875, 0.9326171875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 3.0, 12.0, 4.0, 7.0, 11.0, 10.0, 10.0, 15.0, 15.0, 18.0, 25.0, 23.0, 40.0, 42.0, 52.0, 83.0, 109.0, 97.0, 84.0, 59.0, 39.0, 38.0, 26.0, 26.0, 21.0, 17.0, 22.0, 9.0, 12.0, 9.0, 8.0, 11.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.11834716796875, -0.11428356170654297, -0.11021995544433594, -0.1061563491821289, -0.10209274291992188, -0.09802913665771484, -0.09396553039550781, -0.08990192413330078, -0.08583831787109375, -0.08177471160888672, -0.07771110534667969, -0.07364749908447266, -0.06958389282226562, -0.0655202865600586, -0.06145668029785156, -0.05739307403564453, -0.0533294677734375, -0.04926586151123047, -0.04520225524902344, -0.041138648986816406, -0.037075042724609375, -0.033011436462402344, -0.028947830200195312, -0.02488422393798828, -0.02082061767578125, -0.01675701141357422, -0.012693405151367188, -0.008629798889160156, -0.004566192626953125, -0.0005025863647460938, 0.0035610198974609375, 0.007624626159667969, 0.011688232421875, 0.01575183868408203, 0.019815444946289062, 0.023879051208496094, 0.027942657470703125, 0.032006263732910156, 0.03606986999511719, 0.04013347625732422, 0.04419708251953125, 0.04826068878173828, 0.05232429504394531, 0.056387901306152344, 0.060451507568359375, 0.0645151138305664, 0.06857872009277344, 0.07264232635498047, 0.0767059326171875, 0.08076953887939453, 0.08483314514160156, 0.0888967514038086, 0.09296035766601562, 0.09702396392822266, 0.10108757019042969, 0.10515117645263672, 0.10921478271484375, 0.11327838897705078, 0.11734199523925781, 0.12140560150146484, 0.12546920776367188, 0.1295328140258789, 0.13359642028808594, 0.13766002655029297, 0.1417236328125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 5.0, 6.0, 5.0, 8.0, 9.0, 10.0, 10.0, 9.0, 23.0, 29.0, 24.0, 33.0, 38.0, 53.0, 71.0, 87.0, 117.0, 302.0, 1031.0, 10777.0, 760002.0, 266981.0, 7237.0, 876.0, 261.0, 128.0, 88.0, 74.0, 50.0, 41.0, 29.0, 20.0, 25.0, 11.0, 11.0, 10.0, 6.0, 12.0, 5.0, 9.0, 4.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-2.509765625, -2.437896728515625, -2.36602783203125, -2.294158935546875, -2.2222900390625, -2.150421142578125, -2.07855224609375, -2.006683349609375, -1.934814453125, -1.862945556640625, -1.79107666015625, -1.719207763671875, -1.6473388671875, -1.575469970703125, -1.50360107421875, -1.431732177734375, -1.35986328125, -1.287994384765625, -1.21612548828125, -1.144256591796875, -1.0723876953125, -1.000518798828125, -0.92864990234375, -0.856781005859375, -0.784912109375, -0.713043212890625, -0.64117431640625, -0.569305419921875, -0.4974365234375, -0.425567626953125, -0.35369873046875, -0.281829833984375, -0.2099609375, -0.138092041015625, -0.06622314453125, 0.005645751953125, 0.0775146484375, 0.149383544921875, 0.22125244140625, 0.293121337890625, 0.364990234375, 0.436859130859375, 0.50872802734375, 0.580596923828125, 0.6524658203125, 0.724334716796875, 0.79620361328125, 0.868072509765625, 0.93994140625, 1.011810302734375, 1.08367919921875, 1.155548095703125, 1.2274169921875, 1.299285888671875, 1.37115478515625, 1.443023681640625, 1.514892578125, 1.586761474609375, 1.65863037109375, 1.730499267578125, 1.8023681640625, 1.874237060546875, 1.94610595703125, 2.017974853515625, 2.08984375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 18.0, 68.0, 190.0, 395.0, 238.0, 76.0, 17.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3928728103637695, -1.3641382455825806, -1.3354036808013916, -1.306668996810913, -1.2779344320297241, -1.2491998672485352, -1.2204653024673462, -1.1917306184768677, -1.1629960536956787, -1.1342614889144897, -1.1055269241333008, -1.0767922401428223, -1.0480576753616333, -1.0193231105804443, -0.9905884861946106, -0.9618539214134216, -0.9331192970275879, -0.9043847322463989, -0.8756501078605652, -0.8469155430793762, -0.8181809186935425, -0.7894463539123535, -0.7607117295265198, -0.7319771647453308, -0.7032425999641418, -0.6745080351829529, -0.6457734107971191, -0.6170388460159302, -0.5883042216300964, -0.5595696568489075, -0.5308350324630737, -0.5021004676818848, -0.473365843296051, -0.4446312487125397, -0.4158966541290283, -0.38716205954551697, -0.3584274649620056, -0.32969290018081665, -0.3009582757949829, -0.27222371101379395, -0.2434891015291214, -0.21475450694561005, -0.1860199123620987, -0.15728533267974854, -0.12855073809623718, -0.09981614351272583, -0.07108154892921448, -0.042346954345703125, -0.013612359762191772, 0.01512223295867443, 0.043856825679540634, 0.07259141653776169, 0.10132601112127304, 0.1300605982542038, 0.15879519283771515, 0.1875297874212265, 0.21626438200473785, 0.2449989765882492, 0.27373355627059937, 0.3024681508541107, 0.33120274543762207, 0.3599373400211334, 0.3886719346046448, 0.41740652918815613, 0.4461411237716675]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 12.0, 8.0, 15.0, 8.0, 12.0, 19.0, 20.0, 27.0, 31.0, 35.0, 21.0, 25.0, 18.0, 44.0, 39.0, 41.0, 40.0, 37.0, 42.0, 25.0, 48.0, 41.0, 31.0, 38.0, 29.0, 33.0, 33.0, 26.0, 20.0, 23.0, 27.0, 14.0, 25.0, 14.0, 11.0, 9.0, 6.0, 6.0, 9.0, 8.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.17373013496398926, -0.16876357793807983, -0.16379700601100922, -0.1588304489850998, -0.15386389195919037, -0.14889732003211975, -0.14393076300621033, -0.1389642059803009, -0.13399764895439148, -0.12903109192848206, -0.12406452745199203, -0.11909796297550201, -0.11413140594959259, -0.10916484147310257, -0.10419827699661255, -0.09923171997070312, -0.09426514804363251, -0.08929858356714249, -0.08433202654123306, -0.07936546206474304, -0.07439890503883362, -0.0694323405623436, -0.06446577608585358, -0.059499215334653854, -0.05453265458345413, -0.04956609383225441, -0.04459953308105469, -0.03963296860456467, -0.034666407853364944, -0.029699847102165222, -0.02473328448832035, -0.01976672187447548, -0.014800161123275757, -0.00983359944075346, -0.004867037758231163, 9.952392429113388e-05, 0.005066085606813431, 0.010032646358013153, 0.014999208971858025, 0.019965771585702896, 0.02493233233690262, 0.02989889308810234, 0.03486545383930206, 0.039832018315792084, 0.044798579066991806, 0.04976513981819153, 0.05473170429468155, 0.05969826504588127, 0.064664825797081, 0.06963139027357101, 0.07459794729948044, 0.07956451177597046, 0.08453106880187988, 0.0894976332783699, 0.09446419775485992, 0.09943075478076935, 0.10439731925725937, 0.10936388373374939, 0.11433044075965881, 0.11929700523614883, 0.12426356971263885, 0.12923012673854828, 0.1341966837644577, 0.13916325569152832, 0.14412981271743774]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 5.0, 8.0, 11.0, 9.0, 9.0, 8.0, 13.0, 15.0, 22.0, 24.0, 21.0, 18.0, 23.0, 31.0, 38.0, 31.0, 42.0, 37.0, 41.0, 39.0, 44.0, 41.0, 26.0, 39.0, 39.0, 36.0, 35.0, 33.0, 20.0, 24.0, 30.0, 25.0, 22.0, 19.0, 20.0, 14.0, 17.0, 10.0, 11.0, 7.0, 4.0, 7.0, 6.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0], "bins": [-6.3515625, -6.1546630859375, -5.957763671875, -5.7608642578125, -5.56396484375, -5.3670654296875, -5.170166015625, -4.9732666015625, -4.7763671875, -4.5794677734375, -4.382568359375, -4.1856689453125, -3.98876953125, -3.7918701171875, -3.594970703125, -3.3980712890625, -3.201171875, -3.0042724609375, -2.807373046875, -2.6104736328125, -2.41357421875, -2.2166748046875, -2.019775390625, -1.8228759765625, -1.6259765625, -1.4290771484375, -1.232177734375, -1.0352783203125, -0.83837890625, -0.6414794921875, -0.444580078125, -0.2476806640625, -0.05078125, 0.1461181640625, 0.343017578125, 0.5399169921875, 0.73681640625, 0.9337158203125, 1.130615234375, 1.3275146484375, 1.5244140625, 1.7213134765625, 1.918212890625, 2.1151123046875, 2.31201171875, 2.5089111328125, 2.705810546875, 2.9027099609375, 3.099609375, 3.2965087890625, 3.493408203125, 3.6903076171875, 3.88720703125, 4.0841064453125, 4.281005859375, 4.4779052734375, 4.6748046875, 4.8717041015625, 5.068603515625, 5.2655029296875, 5.46240234375, 5.6593017578125, 5.856201171875, 6.0531005859375, 6.25]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 5.0, 7.0, 5.0, 12.0, 21.0, 22.0, 25.0, 35.0, 50.0, 69.0, 118.0, 168.0, 249.0, 356.0, 480.0, 711.0, 1127.0, 1721.0, 2807.0, 4602.0, 7906.0, 14189.0, 27260.0, 55221.0, 120055.0, 319446.0, 275359.0, 108112.0, 50789.0, 25301.0, 13048.0, 7390.0, 4267.0, 2657.0, 1704.0, 1001.0, 702.0, 477.0, 314.0, 219.0, 163.0, 109.0, 86.0, 58.0, 38.0, 26.0, 22.0, 13.0, 8.0, 9.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.34375, -8.0650634765625, -7.786376953125, -7.5076904296875, -7.22900390625, -6.9503173828125, -6.671630859375, -6.3929443359375, -6.1142578125, -5.8355712890625, -5.556884765625, -5.2781982421875, -4.99951171875, -4.7208251953125, -4.442138671875, -4.1634521484375, -3.884765625, -3.6060791015625, -3.327392578125, -3.0487060546875, -2.77001953125, -2.4913330078125, -2.212646484375, -1.9339599609375, -1.6552734375, -1.3765869140625, -1.097900390625, -0.8192138671875, -0.54052734375, -0.2618408203125, 0.016845703125, 0.2955322265625, 0.57421875, 0.8529052734375, 1.131591796875, 1.4102783203125, 1.68896484375, 1.9676513671875, 2.246337890625, 2.5250244140625, 2.8037109375, 3.0823974609375, 3.361083984375, 3.6397705078125, 3.91845703125, 4.1971435546875, 4.475830078125, 4.7545166015625, 5.033203125, 5.3118896484375, 5.590576171875, 5.8692626953125, 6.14794921875, 6.4266357421875, 6.705322265625, 6.9840087890625, 7.2626953125, 7.5413818359375, 7.820068359375, 8.0987548828125, 8.37744140625, 8.6561279296875, 8.934814453125, 9.2135009765625, 9.4921875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 4.0, 6.0, 7.0, 10.0, 8.0, 10.0, 7.0, 18.0, 12.0, 11.0, 24.0, 15.0, 33.0, 31.0, 36.0, 31.0, 38.0, 43.0, 68.0, 82.0, 174.0, 1359.0, 370.0, 153.0, 99.0, 50.0, 46.0, 31.0, 33.0, 40.0, 27.0, 26.0, 22.0, 14.0, 17.0, 15.0, 13.0, 16.0, 11.0, 7.0, 5.0, 7.0, 10.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.8125, -17.19775390625, -16.5830078125, -15.96826171875, -15.353515625, -14.73876953125, -14.1240234375, -13.50927734375, -12.89453125, -12.27978515625, -11.6650390625, -11.05029296875, -10.435546875, -9.82080078125, -9.2060546875, -8.59130859375, -7.9765625, -7.36181640625, -6.7470703125, -6.13232421875, -5.517578125, -4.90283203125, -4.2880859375, -3.67333984375, -3.05859375, -2.44384765625, -1.8291015625, -1.21435546875, -0.599609375, 0.01513671875, 0.6298828125, 1.24462890625, 1.859375, 2.47412109375, 3.0888671875, 3.70361328125, 4.318359375, 4.93310546875, 5.5478515625, 6.16259765625, 6.77734375, 7.39208984375, 8.0068359375, 8.62158203125, 9.236328125, 9.85107421875, 10.4658203125, 11.08056640625, 11.6953125, 12.31005859375, 12.9248046875, 13.53955078125, 14.154296875, 14.76904296875, 15.3837890625, 15.99853515625, 16.61328125, 17.22802734375, 17.8427734375, 18.45751953125, 19.072265625, 19.68701171875, 20.3017578125, 20.91650390625, 21.53125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 5.0, 6.0, 6.0, 4.0, 8.0, 6.0, 12.0, 18.0, 23.0, 24.0, 27.0, 28.0, 49.0, 55.0, 79.0, 82.0, 126.0, 179.0, 255.0, 459.0, 1804.0, 28150.0, 3016125.0, 93433.0, 3077.0, 587.0, 282.0, 174.0, 136.0, 100.0, 80.0, 69.0, 42.0, 47.0, 26.0, 29.0, 20.0, 20.0, 7.0, 11.0, 7.0, 6.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-62.875, -60.822265625, -58.76953125, -56.716796875, -54.6640625, -52.611328125, -50.55859375, -48.505859375, -46.453125, -44.400390625, -42.34765625, -40.294921875, -38.2421875, -36.189453125, -34.13671875, -32.083984375, -30.03125, -27.978515625, -25.92578125, -23.873046875, -21.8203125, -19.767578125, -17.71484375, -15.662109375, -13.609375, -11.556640625, -9.50390625, -7.451171875, -5.3984375, -3.345703125, -1.29296875, 0.759765625, 2.8125, 4.865234375, 6.91796875, 8.970703125, 11.0234375, 13.076171875, 15.12890625, 17.181640625, 19.234375, 21.287109375, 23.33984375, 25.392578125, 27.4453125, 29.498046875, 31.55078125, 33.603515625, 35.65625, 37.708984375, 39.76171875, 41.814453125, 43.8671875, 45.919921875, 47.97265625, 50.025390625, 52.078125, 54.130859375, 56.18359375, 58.236328125, 60.2890625, 62.341796875, 64.39453125, 66.447265625, 68.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 22.0, 65.0, 157.0, 243.0, 250.0, 168.0, 70.0, 23.0, 10.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.608661651611328, -17.197418212890625, -14.786172866821289, -12.37492847442627, -9.96368408203125, -7.5524396896362305, -5.141195297241211, -2.729949951171875, -0.3187065124511719, 2.0925378799438477, 4.503782272338867, 6.915026664733887, 9.326271057128906, 11.737515449523926, 14.148759841918945, 16.56000518798828, 18.971248626708984, 21.382492065429688, 23.793737411499023, 26.20498275756836, 28.616226196289062, 31.027469635009766, 33.43871307373047, 35.84996032714844, 38.26120376586914, 40.672447204589844, 43.08369445800781, 45.494937896728516, 47.90618133544922, 50.31742477416992, 52.728668212890625, 55.139915466308594, 57.55116271972656, 59.962406158447266, 62.37364959716797, 64.78489685058594, 67.19613647460938, 69.60738372802734, 72.01863098144531, 74.42987060546875, 76.84111785888672, 79.25236511230469, 81.66360473632812, 84.0748519897461, 86.48609924316406, 88.8973388671875, 91.30858612060547, 93.71983337402344, 96.13107299804688, 98.54232025146484, 100.95355987548828, 103.36480712890625, 105.77604675292969, 108.18729400634766, 110.59854125976562, 113.00978088378906, 115.42102813720703, 117.832275390625, 120.24351501464844, 122.6547622680664, 125.06600952148438, 127.47724914550781, 129.88848876953125, 132.29974365234375, 134.7109832763672]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 7.0, 10.0, 9.0, 12.0, 16.0, 9.0, 22.0, 14.0, 23.0, 27.0, 19.0, 35.0, 33.0, 37.0, 35.0, 40.0, 35.0, 53.0, 32.0, 41.0, 36.0, 30.0, 51.0, 44.0, 43.0, 43.0, 33.0, 34.0, 19.0, 29.0, 24.0, 27.0, 15.0, 11.0, 9.0, 8.0, 5.0, 8.0, 6.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.92280960083008, -43.230770111083984, -41.538726806640625, -39.84668731689453, -38.15464401245117, -36.46260452270508, -34.77056121826172, -33.078521728515625, -31.3864803314209, -29.694438934326172, -28.002397537231445, -26.31035614013672, -24.618316650390625, -22.926273345947266, -21.234233856201172, -19.542192459106445, -17.85015106201172, -16.158109664916992, -14.466068267822266, -12.774027824401855, -11.081986427307129, -9.389945030212402, -7.697904586791992, -6.005863189697266, -4.313821792602539, -2.6217806339263916, -0.9297394752502441, 0.7623014450073242, 2.454342842102051, 4.146384239196777, 5.8384246826171875, 7.530466079711914, 9.222511291503906, 10.914552688598633, 12.60659408569336, 14.29863452911377, 15.990675926208496, 17.682716369628906, 19.374757766723633, 21.06679916381836, 22.758840560913086, 24.450881958007812, 26.14292335510254, 27.834964752197266, 29.52700424194336, 31.21904754638672, 32.91108703613281, 34.603126525878906, 36.295169830322266, 37.98720932006836, 39.67925262451172, 41.37129211425781, 43.06333541870117, 44.755374908447266, 46.447418212890625, 48.13945770263672, 49.83149719238281, 51.523536682128906, 53.215579986572266, 54.90761947631836, 56.59966278076172, 58.29170227050781, 59.983741760253906, 61.675785064697266, 63.367828369140625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 12.0, 10.0, 11.0, 6.0, 14.0, 8.0, 17.0, 20.0, 13.0, 18.0, 34.0, 25.0, 29.0, 31.0, 36.0, 40.0, 53.0, 35.0, 46.0, 42.0, 44.0, 44.0, 31.0, 32.0, 35.0, 33.0, 32.0, 38.0, 29.0, 20.0, 22.0, 17.0, 28.0, 16.0, 14.0, 19.0, 4.0, 7.0, 4.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.31640625, -6.09478759765625, -5.8731689453125, -5.65155029296875, -5.429931640625, -5.20831298828125, -4.9866943359375, -4.76507568359375, -4.54345703125, -4.32183837890625, -4.1002197265625, -3.87860107421875, -3.656982421875, -3.43536376953125, -3.2137451171875, -2.99212646484375, -2.7705078125, -2.54888916015625, -2.3272705078125, -2.10565185546875, -1.884033203125, -1.66241455078125, -1.4407958984375, -1.21917724609375, -0.99755859375, -0.77593994140625, -0.5543212890625, -0.33270263671875, -0.111083984375, 0.11053466796875, 0.3321533203125, 0.55377197265625, 0.775390625, 0.99700927734375, 1.2186279296875, 1.44024658203125, 1.661865234375, 1.88348388671875, 2.1051025390625, 2.32672119140625, 2.54833984375, 2.76995849609375, 2.9915771484375, 3.21319580078125, 3.434814453125, 3.65643310546875, 3.8780517578125, 4.09967041015625, 4.3212890625, 4.54290771484375, 4.7645263671875, 4.98614501953125, 5.207763671875, 5.42938232421875, 5.6510009765625, 5.87261962890625, 6.09423828125, 6.31585693359375, 6.5374755859375, 6.75909423828125, 6.980712890625, 7.20233154296875, 7.4239501953125, 7.64556884765625, 7.8671875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 10.0, 10.0, 13.0, 19.0, 23.0, 34.0, 49.0, 50.0, 76.0, 120.0, 159.0, 299.0, 443.0, 784.0, 1385.0, 2858.0, 6332.0, 18046.0, 75055.0, 554764.0, 2545647.0, 845471.0, 103810.0, 23456.0, 7880.0, 3477.0, 1574.0, 877.0, 536.0, 329.0, 219.0, 132.0, 114.0, 53.0, 35.0, 49.0, 19.0, 13.0, 18.0, 9.0, 3.0, 5.0, 3.0, 7.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 3.0], "bins": [-14.359375, -13.9320068359375, -13.504638671875, -13.0772705078125, -12.64990234375, -12.2225341796875, -11.795166015625, -11.3677978515625, -10.9404296875, -10.5130615234375, -10.085693359375, -9.6583251953125, -9.23095703125, -8.8035888671875, -8.376220703125, -7.9488525390625, -7.521484375, -7.0941162109375, -6.666748046875, -6.2393798828125, -5.81201171875, -5.3846435546875, -4.957275390625, -4.5299072265625, -4.1025390625, -3.6751708984375, -3.247802734375, -2.8204345703125, -2.39306640625, -1.9656982421875, -1.538330078125, -1.1109619140625, -0.68359375, -0.2562255859375, 0.171142578125, 0.5985107421875, 1.02587890625, 1.4532470703125, 1.880615234375, 2.3079833984375, 2.7353515625, 3.1627197265625, 3.590087890625, 4.0174560546875, 4.44482421875, 4.8721923828125, 5.299560546875, 5.7269287109375, 6.154296875, 6.5816650390625, 7.009033203125, 7.4364013671875, 7.86376953125, 8.2911376953125, 8.718505859375, 9.1458740234375, 9.5732421875, 10.0006103515625, 10.427978515625, 10.8553466796875, 11.28271484375, 11.7100830078125, 12.137451171875, 12.5648193359375, 12.9921875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 2.0, 5.0, 4.0, 8.0, 7.0, 17.0, 22.0, 18.0, 26.0, 42.0, 46.0, 54.0, 75.0, 104.0, 156.0, 237.0, 389.0, 592.0, 646.0, 555.0, 347.0, 224.0, 142.0, 93.0, 56.0, 44.0, 34.0, 17.0, 19.0, 23.0, 13.0, 11.0, 12.0, 5.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.140625, -11.740478515625, -11.34033203125, -10.940185546875, -10.5400390625, -10.139892578125, -9.73974609375, -9.339599609375, -8.939453125, -8.539306640625, -8.13916015625, -7.739013671875, -7.3388671875, -6.938720703125, -6.53857421875, -6.138427734375, -5.73828125, -5.338134765625, -4.93798828125, -4.537841796875, -4.1376953125, -3.737548828125, -3.33740234375, -2.937255859375, -2.537109375, -2.136962890625, -1.73681640625, -1.336669921875, -0.9365234375, -0.536376953125, -0.13623046875, 0.263916015625, 0.6640625, 1.064208984375, 1.46435546875, 1.864501953125, 2.2646484375, 2.664794921875, 3.06494140625, 3.465087890625, 3.865234375, 4.265380859375, 4.66552734375, 5.065673828125, 5.4658203125, 5.865966796875, 6.26611328125, 6.666259765625, 7.06640625, 7.466552734375, 7.86669921875, 8.266845703125, 8.6669921875, 9.067138671875, 9.46728515625, 9.867431640625, 10.267578125, 10.667724609375, 11.06787109375, 11.468017578125, 11.8681640625, 12.268310546875, 12.66845703125, 13.068603515625, 13.46875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 5.0, 15.0, 12.0, 16.0, 21.0, 17.0, 33.0, 31.0, 71.0, 99.0, 142.0, 332.0, 1119.0, 12389.0, 2200428.0, 1965949.0, 11631.0, 1108.0, 304.0, 157.0, 105.0, 72.0, 60.0, 29.0, 29.0, 20.0, 21.0, 11.0, 11.0, 7.0, 9.0, 3.0, 7.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.375, -61.4541015625, -59.533203125, -57.6123046875, -55.69140625, -53.7705078125, -51.849609375, -49.9287109375, -48.0078125, -46.0869140625, -44.166015625, -42.2451171875, -40.32421875, -38.4033203125, -36.482421875, -34.5615234375, -32.640625, -30.7197265625, -28.798828125, -26.8779296875, -24.95703125, -23.0361328125, -21.115234375, -19.1943359375, -17.2734375, -15.3525390625, -13.431640625, -11.5107421875, -9.58984375, -7.6689453125, -5.748046875, -3.8271484375, -1.90625, 0.0146484375, 1.935546875, 3.8564453125, 5.77734375, 7.6982421875, 9.619140625, 11.5400390625, 13.4609375, 15.3818359375, 17.302734375, 19.2236328125, 21.14453125, 23.0654296875, 24.986328125, 26.9072265625, 28.828125, 30.7490234375, 32.669921875, 34.5908203125, 36.51171875, 38.4326171875, 40.353515625, 42.2744140625, 44.1953125, 46.1162109375, 48.037109375, 49.9580078125, 51.87890625, 53.7998046875, 55.720703125, 57.6416015625, 59.5625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 12.0, 17.0, 47.0, 71.0, 90.0, 132.0, 146.0, 157.0, 140.0, 91.0, 46.0, 20.0, 16.0, 5.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.80999755859375, -102.61931610107422, -100.42863464355469, -98.23796081542969, -96.04727935791016, -93.85659790039062, -91.6659164428711, -89.47523498535156, -87.28456115722656, -85.09387969970703, -82.9031982421875, -80.7125244140625, -78.52184295654297, -76.33116149902344, -74.1404800415039, -71.94979858398438, -69.75911712646484, -67.56843566894531, -65.37775421142578, -63.187076568603516, -60.99639892578125, -58.80571746826172, -56.61503601074219, -54.424354553222656, -52.23367691040039, -50.04299545288086, -47.852317810058594, -45.66163635253906, -43.47095489501953, -41.280277252197266, -39.089595794677734, -36.89891815185547, -34.708229064941406, -32.517547607421875, -30.32686996459961, -28.136188507080078, -25.94550895690918, -23.75482940673828, -21.56414794921875, -19.37346839904785, -17.182788848876953, -14.992109298706055, -12.80142879486084, -10.610748291015625, -8.420068740844727, -6.229389190673828, -4.038708686828613, -1.8480281829833984, 0.3426513671875, 2.5333313941955566, 4.724011421203613, 6.91469144821167, 9.105371475219727, 11.296051025390625, 13.48673152923584, 15.677412033081055, 17.868091583251953, 20.05877113342285, 22.24945068359375, 24.44013214111328, 26.63081169128418, 28.821491241455078, 31.01217269897461, 33.202850341796875, 35.393531799316406]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 2.0, 9.0, 7.0, 7.0, 8.0, 5.0, 13.0, 10.0, 20.0, 26.0, 19.0, 25.0, 25.0, 24.0, 27.0, 27.0, 30.0, 29.0, 33.0, 33.0, 34.0, 45.0, 45.0, 40.0, 42.0, 46.0, 28.0, 29.0, 24.0, 43.0, 24.0, 28.0, 27.0, 23.0, 17.0, 19.0, 20.0, 19.0, 17.0, 11.0, 6.0, 7.0, 8.0, 4.0, 4.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-35.264747619628906, -34.132568359375, -33.00038528442383, -31.86820411682129, -30.73602294921875, -29.60384178161621, -28.471660614013672, -27.339479446411133, -26.207298278808594, -25.075117111206055, -23.942935943603516, -22.810754776000977, -21.678573608398438, -20.5463924407959, -19.41421127319336, -18.28203010559082, -17.14984893798828, -16.017667770385742, -14.885486602783203, -13.753305435180664, -12.621124267578125, -11.488943099975586, -10.356761932373047, -9.224580764770508, -8.092399597167969, -6.96021842956543, -5.828037261962891, -4.695856094360352, -3.5636749267578125, -2.4314937591552734, -1.2993125915527344, -0.1671314239501953, 0.9650535583496094, 2.0972347259521484, 3.2294158935546875, 4.361597061157227, 5.493778228759766, 6.625959396362305, 7.758140563964844, 8.890321731567383, 10.022502899169922, 11.154684066772461, 12.286865234375, 13.419046401977539, 14.551227569580078, 15.683408737182617, 16.815589904785156, 17.947771072387695, 19.079952239990234, 20.212133407592773, 21.344314575195312, 22.47649574279785, 23.60867691040039, 24.74085807800293, 25.87303924560547, 27.005220413208008, 28.137401580810547, 29.269582748413086, 30.401763916015625, 31.533945083618164, 32.6661262512207, 33.798309326171875, 34.93048858642578, 36.06266784667969, 37.19485092163086]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 5.0, 7.0, 13.0, 5.0, 11.0, 13.0, 18.0, 18.0, 21.0, 30.0, 30.0, 32.0, 32.0, 29.0, 38.0, 68.0, 34.0, 47.0, 49.0, 44.0, 54.0, 35.0, 24.0, 30.0, 37.0, 17.0, 27.0, 35.0, 22.0, 24.0, 21.0, 17.0, 18.0, 21.0, 11.0, 11.0, 10.0, 8.0, 8.0, 4.0, 10.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.7734375, -6.5587158203125, -6.343994140625, -6.1292724609375, -5.91455078125, -5.6998291015625, -5.485107421875, -5.2703857421875, -5.0556640625, -4.8409423828125, -4.626220703125, -4.4114990234375, -4.19677734375, -3.9820556640625, -3.767333984375, -3.5526123046875, -3.337890625, -3.1231689453125, -2.908447265625, -2.6937255859375, -2.47900390625, -2.2642822265625, -2.049560546875, -1.8348388671875, -1.6201171875, -1.4053955078125, -1.190673828125, -0.9759521484375, -0.76123046875, -0.5465087890625, -0.331787109375, -0.1170654296875, 0.09765625, 0.3123779296875, 0.527099609375, 0.7418212890625, 0.95654296875, 1.1712646484375, 1.385986328125, 1.6007080078125, 1.8154296875, 2.0301513671875, 2.244873046875, 2.4595947265625, 2.67431640625, 2.8890380859375, 3.103759765625, 3.3184814453125, 3.533203125, 3.7479248046875, 3.962646484375, 4.1773681640625, 4.39208984375, 4.6068115234375, 4.821533203125, 5.0362548828125, 5.2509765625, 5.4656982421875, 5.680419921875, 5.8951416015625, 6.10986328125, 6.3245849609375, 6.539306640625, 6.7540283203125, 6.96875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 8.0, 2.0, 10.0, 16.0, 22.0, 33.0, 43.0, 69.0, 129.0, 185.0, 332.0, 466.0, 750.0, 1303.0, 1991.0, 3126.0, 5143.0, 8570.0, 13885.0, 23595.0, 40429.0, 71441.0, 126487.0, 212521.0, 221769.0, 134398.0, 75844.0, 42891.0, 24774.0, 14689.0, 8854.0, 5519.0, 3479.0, 2154.0, 1349.0, 834.0, 583.0, 319.0, 208.0, 115.0, 92.0, 48.0, 36.0, 18.0, 17.0, 8.0, 7.0, 5.0, 2.0, 3.0], "bins": [-1.375, -1.3388671875, -1.302734375, -1.2666015625, -1.23046875, -1.1943359375, -1.158203125, -1.1220703125, -1.0859375, -1.0498046875, -1.013671875, -0.9775390625, -0.94140625, -0.9052734375, -0.869140625, -0.8330078125, -0.796875, -0.7607421875, -0.724609375, -0.6884765625, -0.65234375, -0.6162109375, -0.580078125, -0.5439453125, -0.5078125, -0.4716796875, -0.435546875, -0.3994140625, -0.36328125, -0.3271484375, -0.291015625, -0.2548828125, -0.21875, -0.1826171875, -0.146484375, -0.1103515625, -0.07421875, -0.0380859375, -0.001953125, 0.0341796875, 0.0703125, 0.1064453125, 0.142578125, 0.1787109375, 0.21484375, 0.2509765625, 0.287109375, 0.3232421875, 0.359375, 0.3955078125, 0.431640625, 0.4677734375, 0.50390625, 0.5400390625, 0.576171875, 0.6123046875, 0.6484375, 0.6845703125, 0.720703125, 0.7568359375, 0.79296875, 0.8291015625, 0.865234375, 0.9013671875, 0.9375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 6.0, 13.0, 2.0, 5.0, 3.0, 12.0, 9.0, 12.0, 14.0, 22.0, 16.0, 22.0, 30.0, 29.0, 27.0, 34.0, 29.0, 32.0, 34.0, 36.0, 37.0, 31.0, 1057.0, 43.0, 42.0, 39.0, 39.0, 38.0, 29.0, 35.0, 27.0, 28.0, 21.0, 31.0, 17.0, 25.0, 16.0, 21.0, 11.0, 11.0, 8.0, 7.0, 6.0, 7.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-4.90625, -4.76055908203125, -4.6148681640625, -4.46917724609375, -4.323486328125, -4.17779541015625, -4.0321044921875, -3.88641357421875, -3.74072265625, -3.59503173828125, -3.4493408203125, -3.30364990234375, -3.157958984375, -3.01226806640625, -2.8665771484375, -2.72088623046875, -2.5751953125, -2.42950439453125, -2.2838134765625, -2.13812255859375, -1.992431640625, -1.84674072265625, -1.7010498046875, -1.55535888671875, -1.40966796875, -1.26397705078125, -1.1182861328125, -0.97259521484375, -0.826904296875, -0.68121337890625, -0.5355224609375, -0.38983154296875, -0.244140625, -0.09844970703125, 0.0472412109375, 0.19293212890625, 0.338623046875, 0.48431396484375, 0.6300048828125, 0.77569580078125, 0.92138671875, 1.06707763671875, 1.2127685546875, 1.35845947265625, 1.504150390625, 1.64984130859375, 1.7955322265625, 1.94122314453125, 2.0869140625, 2.23260498046875, 2.3782958984375, 2.52398681640625, 2.669677734375, 2.81536865234375, 2.9610595703125, 3.10675048828125, 3.25244140625, 3.39813232421875, 3.5438232421875, 3.68951416015625, 3.835205078125, 3.98089599609375, 4.1265869140625, 4.27227783203125, 4.41796875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 8.0, 10.0, 17.0, 23.0, 27.0, 54.0, 110.0, 124.0, 229.0, 381.0, 601.0, 1074.0, 1968.0, 3380.0, 6718.0, 13093.0, 27732.0, 60361.0, 147133.0, 659656.0, 889223.0, 161252.0, 65028.0, 29345.0, 14157.0, 7131.0, 3610.0, 1987.0, 1100.0, 627.0, 393.0, 218.0, 135.0, 95.0, 40.0, 28.0, 17.0, 9.0, 9.0, 7.0, 7.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0224609375, -0.988433837890625, -0.95440673828125, -0.920379638671875, -0.8863525390625, -0.852325439453125, -0.81829833984375, -0.784271240234375, -0.750244140625, -0.716217041015625, -0.68218994140625, -0.648162841796875, -0.6141357421875, -0.580108642578125, -0.54608154296875, -0.512054443359375, -0.47802734375, -0.444000244140625, -0.40997314453125, -0.375946044921875, -0.3419189453125, -0.307891845703125, -0.27386474609375, -0.239837646484375, -0.205810546875, -0.171783447265625, -0.13775634765625, -0.103729248046875, -0.0697021484375, -0.035675048828125, -0.00164794921875, 0.032379150390625, 0.06640625, 0.100433349609375, 0.13446044921875, 0.168487548828125, 0.2025146484375, 0.236541748046875, 0.27056884765625, 0.304595947265625, 0.338623046875, 0.372650146484375, 0.40667724609375, 0.440704345703125, 0.4747314453125, 0.508758544921875, 0.54278564453125, 0.576812744140625, 0.61083984375, 0.644866943359375, 0.67889404296875, 0.712921142578125, 0.7469482421875, 0.780975341796875, 0.81500244140625, 0.849029541015625, 0.883056640625, 0.917083740234375, 0.95111083984375, 0.985137939453125, 1.0191650390625, 1.053192138671875, 1.08721923828125, 1.121246337890625, 1.1552734375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 5.0, 4.0, 12.0, 9.0, 21.0, 24.0, 32.0, 50.0, 59.0, 84.0, 155.0, 170.0, 117.0, 68.0, 62.0, 38.0, 24.0, 19.0, 13.0, 15.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.400634765625, -0.39155006408691406, -0.3824653625488281, -0.3733806610107422, -0.36429595947265625, -0.3552112579345703, -0.3461265563964844, -0.33704185485839844, -0.3279571533203125, -0.31887245178222656, -0.3097877502441406, -0.3007030487060547, -0.29161834716796875, -0.2825336456298828, -0.2734489440917969, -0.26436424255371094, -0.255279541015625, -0.24619483947753906, -0.23711013793945312, -0.2280254364013672, -0.21894073486328125, -0.2098560333251953, -0.20077133178710938, -0.19168663024902344, -0.1826019287109375, -0.17351722717285156, -0.16443252563476562, -0.1553478240966797, -0.14626312255859375, -0.1371784210205078, -0.12809371948242188, -0.11900901794433594, -0.10992431640625, -0.10083961486816406, -0.09175491333007812, -0.08267021179199219, -0.07358551025390625, -0.06450080871582031, -0.055416107177734375, -0.04633140563964844, -0.0372467041015625, -0.028162002563476562, -0.019077301025390625, -0.009992599487304688, -0.00090789794921875, 0.008176803588867188, 0.017261505126953125, 0.026346206665039062, 0.035430908203125, 0.04451560974121094, 0.053600311279296875, 0.06268501281738281, 0.07176971435546875, 0.08085441589355469, 0.08993911743164062, 0.09902381896972656, 0.1081085205078125, 0.11719322204589844, 0.12627792358398438, 0.1353626251220703, 0.14444732666015625, 0.1535320281982422, 0.16261672973632812, 0.17170143127441406, 0.1807861328125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 6.0, 16.0, 19.0, 32.0, 32.0, 69.0, 143.0, 423.0, 51783.0, 994863.0, 744.0, 179.0, 96.0, 41.0, 33.0, 22.0, 15.0, 10.0, 8.0, 5.0, 1.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.39892578125, -4.1806640625, -3.96240234375, -3.744140625, -3.52587890625, -3.3076171875, -3.08935546875, -2.87109375, -2.65283203125, -2.4345703125, -2.21630859375, -1.998046875, -1.77978515625, -1.5615234375, -1.34326171875, -1.125, -0.90673828125, -0.6884765625, -0.47021484375, -0.251953125, -0.03369140625, 0.1845703125, 0.40283203125, 0.62109375, 0.83935546875, 1.0576171875, 1.27587890625, 1.494140625, 1.71240234375, 1.9306640625, 2.14892578125, 2.3671875, 2.58544921875, 2.8037109375, 3.02197265625, 3.240234375, 3.45849609375, 3.6767578125, 3.89501953125, 4.11328125, 4.33154296875, 4.5498046875, 4.76806640625, 4.986328125, 5.20458984375, 5.4228515625, 5.64111328125, 5.859375, 6.07763671875, 6.2958984375, 6.51416015625, 6.732421875, 6.95068359375, 7.1689453125, 7.38720703125, 7.60546875, 7.82373046875, 8.0419921875, 8.26025390625, 8.478515625, 8.69677734375, 8.9150390625, 9.13330078125, 9.3515625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 6.0, 45.0, 161.0, 339.0, 283.0, 122.0, 39.0, 8.0, 5.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14567077159881592, -0.12084317207336426, -0.0960155725479126, -0.07118797302246094, -0.04636037349700928, -0.021532773971557617, 0.003294825553894043, 0.028122425079345703, 0.05295002460479736, 0.07777762413024902, 0.10260522365570068, 0.12743282318115234, 0.152260422706604, 0.17708802223205566, 0.20191562175750732, 0.22674322128295898, 0.25157082080841064, 0.2763984203338623, 0.30122601985931396, 0.3260536193847656, 0.3508812189102173, 0.37570881843566895, 0.4005364179611206, 0.42536401748657227, 0.4501916170120239, 0.4750192165374756, 0.49984681606292725, 0.5246744155883789, 0.5495020151138306, 0.5743296146392822, 0.5991572141647339, 0.6239848136901855, 0.6488124132156372, 0.6736400127410889, 0.6984676122665405, 0.7232952117919922, 0.7481228113174438, 0.7729504108428955, 0.7977780103683472, 0.8226056098937988, 0.8474332094192505, 0.8722608089447021, 0.8970884084701538, 0.9219160079956055, 0.9467436075210571, 0.9715712070465088, 0.9963988065719604, 1.021226406097412, 1.0460540056228638, 1.0708816051483154, 1.095709204673767, 1.1205368041992188, 1.1453644037246704, 1.170192003250122, 1.1950196027755737, 1.2198472023010254, 1.244674801826477, 1.2695024013519287, 1.2943300008773804, 1.319157600402832, 1.3439851999282837, 1.3688127994537354, 1.393640398979187, 1.4184679985046387, 1.4432955980300903]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 5.0, 9.0, 11.0, 14.0, 12.0, 17.0, 14.0, 20.0, 24.0, 17.0, 22.0, 35.0, 39.0, 36.0, 30.0, 42.0, 39.0, 40.0, 32.0, 40.0, 40.0, 27.0, 38.0, 38.0, 34.0, 37.0, 38.0, 29.0, 26.0, 19.0, 20.0, 19.0, 19.0, 17.0, 19.0, 9.0, 11.0, 8.0, 6.0, 5.0, 4.0, 4.0, 3.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0], "bins": [-0.16896575689315796, -0.16402976214885712, -0.15909375250339508, -0.15415775775909424, -0.1492217630147934, -0.14428576827049255, -0.13934975862503052, -0.13441376388072968, -0.12947776913642883, -0.1245417669415474, -0.11960577219724655, -0.11466977000236511, -0.10973377525806427, -0.10479777306318283, -0.09986177086830139, -0.09492577612400055, -0.08998976647853851, -0.08505376428365707, -0.08011776953935623, -0.07518176734447479, -0.07024577260017395, -0.06530977040529251, -0.06037376821041107, -0.05543776974081993, -0.05050177127122879, -0.04556577280163765, -0.04062977433204651, -0.03569377213716507, -0.03075777366757393, -0.025821775197982788, -0.020885774865746498, -0.015949774533510208, -0.011013776063919067, -0.006077776663005352, -0.0011417772620916367, 0.0037942221388220787, 0.008730221539735794, 0.013666220009326935, 0.018602220341563225, 0.023538220673799515, 0.028474219143390656, 0.033410217612981796, 0.03834621608257294, 0.043282218277454376, 0.04821821674704552, 0.05315421521663666, 0.0580902174115181, 0.06302621960639954, 0.06796221435070038, 0.07289821654558182, 0.07783421128988266, 0.0827702134847641, 0.08770620822906494, 0.09264221042394638, 0.09757821261882782, 0.10251420736312866, 0.1074502095580101, 0.11238621175289154, 0.11732220649719238, 0.12225820869207382, 0.12719421088695526, 0.1321302056312561, 0.13706620037555695, 0.14200221002101898, 0.14693820476531982]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 3.0, 8.0, 5.0, 12.0, 9.0, 13.0, 10.0, 25.0, 28.0, 21.0, 21.0, 36.0, 32.0, 33.0, 36.0, 46.0, 38.0, 42.0, 45.0, 48.0, 40.0, 40.0, 43.0, 31.0, 39.0, 35.0, 24.0, 22.0, 22.0, 20.0, 25.0, 23.0, 16.0, 22.0, 9.0, 15.0, 17.0, 7.0, 10.0, 5.0, 13.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6015625, -6.3909912109375, -6.180419921875, -5.9698486328125, -5.75927734375, -5.5487060546875, -5.338134765625, -5.1275634765625, -4.9169921875, -4.7064208984375, -4.495849609375, -4.2852783203125, -4.07470703125, -3.8641357421875, -3.653564453125, -3.4429931640625, -3.232421875, -3.0218505859375, -2.811279296875, -2.6007080078125, -2.39013671875, -2.1795654296875, -1.968994140625, -1.7584228515625, -1.5478515625, -1.3372802734375, -1.126708984375, -0.9161376953125, -0.70556640625, -0.4949951171875, -0.284423828125, -0.0738525390625, 0.13671875, 0.3472900390625, 0.557861328125, 0.7684326171875, 0.97900390625, 1.1895751953125, 1.400146484375, 1.6107177734375, 1.8212890625, 2.0318603515625, 2.242431640625, 2.4530029296875, 2.66357421875, 2.8741455078125, 3.084716796875, 3.2952880859375, 3.505859375, 3.7164306640625, 3.927001953125, 4.1375732421875, 4.34814453125, 4.5587158203125, 4.769287109375, 4.9798583984375, 5.1904296875, 5.4010009765625, 5.611572265625, 5.8221435546875, 6.03271484375, 6.2432861328125, 6.453857421875, 6.6644287109375, 6.875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 4.0, 10.0, 8.0, 20.0, 27.0, 34.0, 33.0, 69.0, 103.0, 168.0, 221.0, 338.0, 521.0, 780.0, 1159.0, 1799.0, 2979.0, 4530.0, 7985.0, 13938.0, 26211.0, 53360.0, 127995.0, 405659.0, 235267.0, 81468.0, 37599.0, 19291.0, 10542.0, 6042.0, 3662.0, 2287.0, 1453.0, 1038.0, 647.0, 423.0, 283.0, 178.0, 119.0, 81.0, 79.0, 46.0, 27.0, 30.0, 18.0, 14.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.98828125, -7.73675537109375, -7.4852294921875, -7.23370361328125, -6.982177734375, -6.73065185546875, -6.4791259765625, -6.22760009765625, -5.97607421875, -5.72454833984375, -5.4730224609375, -5.22149658203125, -4.969970703125, -4.71844482421875, -4.4669189453125, -4.21539306640625, -3.9638671875, -3.71234130859375, -3.4608154296875, -3.20928955078125, -2.957763671875, -2.70623779296875, -2.4547119140625, -2.20318603515625, -1.95166015625, -1.70013427734375, -1.4486083984375, -1.19708251953125, -0.945556640625, -0.69403076171875, -0.4425048828125, -0.19097900390625, 0.060546875, 0.31207275390625, 0.5635986328125, 0.81512451171875, 1.066650390625, 1.31817626953125, 1.5697021484375, 1.82122802734375, 2.07275390625, 2.32427978515625, 2.5758056640625, 2.82733154296875, 3.078857421875, 3.33038330078125, 3.5819091796875, 3.83343505859375, 4.0849609375, 4.33648681640625, 4.5880126953125, 4.83953857421875, 5.091064453125, 5.34259033203125, 5.5941162109375, 5.84564208984375, 6.09716796875, 6.34869384765625, 6.6002197265625, 6.85174560546875, 7.103271484375, 7.35479736328125, 7.6063232421875, 7.85784912109375, 8.109375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 6.0, 4.0, 2.0, 6.0, 14.0, 13.0, 8.0, 19.0, 10.0, 20.0, 32.0, 22.0, 30.0, 27.0, 42.0, 33.0, 48.0, 57.0, 106.0, 168.0, 1466.0, 357.0, 133.0, 79.0, 52.0, 38.0, 31.0, 27.0, 29.0, 33.0, 21.0, 23.0, 16.0, 16.0, 11.0, 13.0, 9.0, 9.0, 9.0, 6.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-21.78125, -21.09619140625, -20.4111328125, -19.72607421875, -19.041015625, -18.35595703125, -17.6708984375, -16.98583984375, -16.30078125, -15.61572265625, -14.9306640625, -14.24560546875, -13.560546875, -12.87548828125, -12.1904296875, -11.50537109375, -10.8203125, -10.13525390625, -9.4501953125, -8.76513671875, -8.080078125, -7.39501953125, -6.7099609375, -6.02490234375, -5.33984375, -4.65478515625, -3.9697265625, -3.28466796875, -2.599609375, -1.91455078125, -1.2294921875, -0.54443359375, 0.140625, 0.82568359375, 1.5107421875, 2.19580078125, 2.880859375, 3.56591796875, 4.2509765625, 4.93603515625, 5.62109375, 6.30615234375, 6.9912109375, 7.67626953125, 8.361328125, 9.04638671875, 9.7314453125, 10.41650390625, 11.1015625, 11.78662109375, 12.4716796875, 13.15673828125, 13.841796875, 14.52685546875, 15.2119140625, 15.89697265625, 16.58203125, 17.26708984375, 17.9521484375, 18.63720703125, 19.322265625, 20.00732421875, 20.6923828125, 21.37744140625, 22.0625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 9.0, 5.0, 7.0, 15.0, 14.0, 27.0, 23.0, 25.0, 33.0, 38.0, 36.0, 65.0, 84.0, 96.0, 143.0, 217.0, 378.0, 862.0, 4949.0, 145166.0, 2942986.0, 45871.0, 2875.0, 692.0, 326.0, 184.0, 129.0, 82.0, 82.0, 54.0, 45.0, 38.0, 28.0, 40.0, 17.0, 16.0, 17.0, 9.0, 4.0, 6.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.875, -42.43017578125, -40.9853515625, -39.54052734375, -38.095703125, -36.65087890625, -35.2060546875, -33.76123046875, -32.31640625, -30.87158203125, -29.4267578125, -27.98193359375, -26.537109375, -25.09228515625, -23.6474609375, -22.20263671875, -20.7578125, -19.31298828125, -17.8681640625, -16.42333984375, -14.978515625, -13.53369140625, -12.0888671875, -10.64404296875, -9.19921875, -7.75439453125, -6.3095703125, -4.86474609375, -3.419921875, -1.97509765625, -0.5302734375, 0.91455078125, 2.359375, 3.80419921875, 5.2490234375, 6.69384765625, 8.138671875, 9.58349609375, 11.0283203125, 12.47314453125, 13.91796875, 15.36279296875, 16.8076171875, 18.25244140625, 19.697265625, 21.14208984375, 22.5869140625, 24.03173828125, 25.4765625, 26.92138671875, 28.3662109375, 29.81103515625, 31.255859375, 32.70068359375, 34.1455078125, 35.59033203125, 37.03515625, 38.47998046875, 39.9248046875, 41.36962890625, 42.814453125, 44.25927734375, 45.7041015625, 47.14892578125, 48.59375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [306.0, 705.0, 7.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9082670211792, -1.7639751434326172, 9.380316734313965, 20.524608612060547, 31.668899536132812, 42.81319046020508, 53.95748519897461, 65.10177612304688, 76.2460708618164, 87.39036560058594, 98.53465270996094, 109.67894744873047, 120.8232421875, 131.967529296875, 143.11181640625, 154.256103515625, 165.40040588378906, 176.54469299316406, 187.68899536132812, 198.83328247070312, 209.97756958007812, 221.12185668945312, 232.2661590576172, 243.4104461669922, 254.5547332763672, 265.69903564453125, 276.84332275390625, 287.98760986328125, 299.13189697265625, 310.27618408203125, 321.42047119140625, 332.56475830078125, 343.7090759277344, 354.8533630371094, 365.9976501464844, 377.1419677734375, 388.2862548828125, 399.4305419921875, 410.5748291015625, 421.7191162109375, 432.8634033203125, 444.0076904296875, 455.1519775390625, 466.2962646484375, 477.4405822753906, 488.5848693847656, 499.7291564941406, 510.8734436035156, 522.0177612304688, 533.1620483398438, 544.3063354492188, 555.4506225585938, 566.5949096679688, 577.7391967773438, 588.883544921875, 600.02783203125, 611.1720581054688, 622.3163452148438, 633.4606323242188, 644.6049194335938, 655.7492065429688, 666.8934936523438, 678.037841796875, 689.18212890625, 700.326416015625]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 5.0, 2.0, 13.0, 11.0, 10.0, 9.0, 12.0, 18.0, 15.0, 22.0, 18.0, 26.0, 19.0, 23.0, 29.0, 27.0, 32.0, 46.0, 34.0, 38.0, 34.0, 35.0, 39.0, 41.0, 39.0, 38.0, 36.0, 27.0, 31.0, 35.0, 30.0, 28.0, 20.0, 20.0, 17.0, 18.0, 17.0, 18.0, 10.0, 8.0, 12.0, 8.0, 8.0, 6.0, 4.0, 4.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0], "bins": [-52.930999755859375, -51.380340576171875, -49.82968521118164, -48.27902603149414, -46.72836685180664, -45.177711486816406, -43.627052307128906, -42.076393127441406, -40.52573776245117, -38.97507858276367, -37.42442321777344, -35.87376403808594, -34.32310485839844, -32.7724494934082, -31.221790313720703, -29.671133041381836, -28.120473861694336, -26.56981658935547, -25.01915740966797, -23.4685001373291, -21.917842864990234, -20.367183685302734, -18.816526412963867, -17.265869140625, -15.715210914611816, -14.164552688598633, -12.613895416259766, -11.063237190246582, -9.512578964233398, -7.961921691894531, -6.411263465881348, -4.8606061935424805, -3.309947967529297, -1.759290099143982, -0.208632230758667, 1.3420257568359375, 2.892683506011963, 4.443341255187988, 5.993999481201172, 7.544656753540039, 9.095314979553223, 10.645973205566406, 12.196630477905273, 13.747288703918457, 15.29794692993164, 16.848604202270508, 18.399261474609375, 19.949920654296875, 21.500577926635742, 23.05123519897461, 24.60189437866211, 26.152551651000977, 27.703208923339844, 29.253868103027344, 30.80452537536621, 32.35518264770508, 33.90584182739258, 35.45650100708008, 37.00715637207031, 38.55781555175781, 40.10847473144531, 41.65913009643555, 43.20978927612305, 44.76044464111328, 46.31110382080078]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 6.0, 5.0, 10.0, 15.0, 12.0, 21.0, 19.0, 30.0, 27.0, 27.0, 23.0, 40.0, 34.0, 38.0, 34.0, 39.0, 47.0, 31.0, 56.0, 38.0, 32.0, 44.0, 35.0, 30.0, 36.0, 27.0, 19.0, 20.0, 15.0, 26.0, 22.0, 19.0, 16.0, 13.0, 16.0, 14.0, 12.0, 12.0, 5.0, 7.0, 1.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.7421875, -6.52301025390625, -6.3038330078125, -6.08465576171875, -5.865478515625, -5.64630126953125, -5.4271240234375, -5.20794677734375, -4.98876953125, -4.76959228515625, -4.5504150390625, -4.33123779296875, -4.112060546875, -3.89288330078125, -3.6737060546875, -3.45452880859375, -3.2353515625, -3.01617431640625, -2.7969970703125, -2.57781982421875, -2.358642578125, -2.13946533203125, -1.9202880859375, -1.70111083984375, -1.48193359375, -1.26275634765625, -1.0435791015625, -0.82440185546875, -0.605224609375, -0.38604736328125, -0.1668701171875, 0.05230712890625, 0.271484375, 0.49066162109375, 0.7098388671875, 0.92901611328125, 1.148193359375, 1.36737060546875, 1.5865478515625, 1.80572509765625, 2.02490234375, 2.24407958984375, 2.4632568359375, 2.68243408203125, 2.901611328125, 3.12078857421875, 3.3399658203125, 3.55914306640625, 3.7783203125, 3.99749755859375, 4.2166748046875, 4.43585205078125, 4.655029296875, 4.87420654296875, 5.0933837890625, 5.31256103515625, 5.53173828125, 5.75091552734375, 5.9700927734375, 6.18927001953125, 6.408447265625, 6.62762451171875, 6.8468017578125, 7.06597900390625, 7.28515625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 14.0, 12.0, 14.0, 26.0, 39.0, 49.0, 74.0, 100.0, 185.0, 324.0, 527.0, 929.0, 1743.0, 3404.0, 7214.0, 18244.0, 59608.0, 297585.0, 1389025.0, 1833406.0, 452578.0, 86221.0, 24285.0, 9547.0, 4228.0, 2120.0, 1155.0, 607.0, 377.0, 216.0, 147.0, 90.0, 59.0, 40.0, 33.0, 20.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.5078125, -11.149658203125, -10.79150390625, -10.433349609375, -10.0751953125, -9.717041015625, -9.35888671875, -9.000732421875, -8.642578125, -8.284423828125, -7.92626953125, -7.568115234375, -7.2099609375, -6.851806640625, -6.49365234375, -6.135498046875, -5.77734375, -5.419189453125, -5.06103515625, -4.702880859375, -4.3447265625, -3.986572265625, -3.62841796875, -3.270263671875, -2.912109375, -2.553955078125, -2.19580078125, -1.837646484375, -1.4794921875, -1.121337890625, -0.76318359375, -0.405029296875, -0.046875, 0.311279296875, 0.66943359375, 1.027587890625, 1.3857421875, 1.743896484375, 2.10205078125, 2.460205078125, 2.818359375, 3.176513671875, 3.53466796875, 3.892822265625, 4.2509765625, 4.609130859375, 4.96728515625, 5.325439453125, 5.68359375, 6.041748046875, 6.39990234375, 6.758056640625, 7.1162109375, 7.474365234375, 7.83251953125, 8.190673828125, 8.548828125, 8.906982421875, 9.26513671875, 9.623291015625, 9.9814453125, 10.339599609375, 10.69775390625, 11.055908203125, 11.4140625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 9.0, 8.0, 7.0, 14.0, 15.0, 16.0, 24.0, 23.0, 49.0, 48.0, 70.0, 73.0, 116.0, 177.0, 259.0, 386.0, 539.0, 578.0, 517.0, 317.0, 206.0, 170.0, 97.0, 71.0, 64.0, 48.0, 37.0, 33.0, 25.0, 21.0, 13.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.8046875, -11.40234375, -11.0, -10.59765625, -10.1953125, -9.79296875, -9.390625, -8.98828125, -8.5859375, -8.18359375, -7.78125, -7.37890625, -6.9765625, -6.57421875, -6.171875, -5.76953125, -5.3671875, -4.96484375, -4.5625, -4.16015625, -3.7578125, -3.35546875, -2.953125, -2.55078125, -2.1484375, -1.74609375, -1.34375, -0.94140625, -0.5390625, -0.13671875, 0.265625, 0.66796875, 1.0703125, 1.47265625, 1.875, 2.27734375, 2.6796875, 3.08203125, 3.484375, 3.88671875, 4.2890625, 4.69140625, 5.09375, 5.49609375, 5.8984375, 6.30078125, 6.703125, 7.10546875, 7.5078125, 7.91015625, 8.3125, 8.71484375, 9.1171875, 9.51953125, 9.921875, 10.32421875, 10.7265625, 11.12890625, 11.53125, 11.93359375, 12.3359375, 12.73828125, 13.140625, 13.54296875, 13.9453125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 8.0, 6.0, 8.0, 11.0, 22.0, 19.0, 29.0, 47.0, 59.0, 77.0, 117.0, 141.0, 144.0, 268.0, 469.0, 1134.0, 5622.0, 125586.0, 3874023.0, 177015.0, 6818.0, 1189.0, 492.0, 266.0, 174.0, 133.0, 99.0, 86.0, 60.0, 47.0, 24.0, 26.0, 23.0, 17.0, 3.0, 5.0, 10.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.0, -46.56884765625, -45.1376953125, -43.70654296875, -42.275390625, -40.84423828125, -39.4130859375, -37.98193359375, -36.55078125, -35.11962890625, -33.6884765625, -32.25732421875, -30.826171875, -29.39501953125, -27.9638671875, -26.53271484375, -25.1015625, -23.67041015625, -22.2392578125, -20.80810546875, -19.376953125, -17.94580078125, -16.5146484375, -15.08349609375, -13.65234375, -12.22119140625, -10.7900390625, -9.35888671875, -7.927734375, -6.49658203125, -5.0654296875, -3.63427734375, -2.203125, -0.77197265625, 0.6591796875, 2.09033203125, 3.521484375, 4.95263671875, 6.3837890625, 7.81494140625, 9.24609375, 10.67724609375, 12.1083984375, 13.53955078125, 14.970703125, 16.40185546875, 17.8330078125, 19.26416015625, 20.6953125, 22.12646484375, 23.5576171875, 24.98876953125, 26.419921875, 27.85107421875, 29.2822265625, 30.71337890625, 32.14453125, 33.57568359375, 35.0068359375, 36.43798828125, 37.869140625, 39.30029296875, 40.7314453125, 42.16259765625, 43.59375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 23.0, 69.0, 247.0, 411.0, 198.0, 56.0, 12.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.3002700805664, -82.17893981933594, -76.0576171875, -69.93628692626953, -63.814964294433594, -57.693634033203125, -51.57230758666992, -45.45098114013672, -39.329654693603516, -33.20832824707031, -27.08700180053711, -20.965673446655273, -14.84434700012207, -8.723020553588867, -2.6016921997070312, 3.519634246826172, 9.640960693359375, 15.762287139892578, 21.88361358642578, 28.004941940307617, 34.12626647949219, 40.247596740722656, 46.36892318725586, 52.49024963378906, 58.611576080322266, 64.73290252685547, 70.85423278808594, 76.97555541992188, 83.09688568115234, 89.21820831298828, 95.33953857421875, 101.46086120605469, 107.58219909667969, 113.70352935791016, 119.8248519897461, 125.94618225097656, 132.0675048828125, 138.18882751464844, 144.31016540527344, 150.43148803710938, 156.5528106689453, 162.67413330078125, 168.79547119140625, 174.9167938232422, 181.03811645507812, 187.15943908691406, 193.28077697753906, 199.402099609375, 205.5234375, 211.64476013183594, 217.76609802246094, 223.88742065429688, 230.0087432861328, 236.13006591796875, 242.25140380859375, 248.3727264404297, 254.49404907226562, 260.6153869628906, 266.7366943359375, 272.8580322265625, 278.9793701171875, 285.1006774902344, 291.2220153808594, 297.34332275390625, 303.46466064453125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 5.0, 3.0, 15.0, 6.0, 10.0, 16.0, 14.0, 16.0, 17.0, 26.0, 27.0, 36.0, 36.0, 48.0, 41.0, 39.0, 41.0, 29.0, 41.0, 38.0, 44.0, 38.0, 37.0, 46.0, 38.0, 31.0, 30.0, 29.0, 28.0, 38.0, 18.0, 11.0, 17.0, 9.0, 9.0, 13.0, 15.0, 9.0, 5.0, 10.0, 2.0, 6.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-44.059242248535156, -42.73255920410156, -41.405879974365234, -40.07919692993164, -38.75251770019531, -37.42583465576172, -36.099151611328125, -34.7724723815918, -33.4457893371582, -32.11910629272461, -30.79242706298828, -29.465744018554688, -28.139062881469727, -26.812381744384766, -25.485700607299805, -24.159019470214844, -22.832338333129883, -21.505657196044922, -20.17897605895996, -18.852294921875, -17.525611877441406, -16.198930740356445, -14.872249603271484, -13.545567512512207, -12.218886375427246, -10.892205238342285, -9.565523147583008, -8.238842010498047, -6.912160396575928, -5.585478782653809, -4.258797645568848, -2.9321155548095703, -1.6054344177246094, -0.2787529230117798, 1.0479285717010498, 2.37460994720459, 3.701291561126709, 5.027973175048828, 6.354654312133789, 7.681336402893066, 9.008017539978027, 10.334698677062988, 11.661380767822266, 12.988061904907227, 14.314743041992188, 15.641425132751465, 16.96810531616211, 18.294788360595703, 19.621469497680664, 20.948150634765625, 22.274831771850586, 23.601512908935547, 24.92819595336914, 26.2548770904541, 27.581558227539062, 28.908241271972656, 30.234920501708984, 31.561601638793945, 32.888282775878906, 34.2149658203125, 35.54164505004883, 36.86832809448242, 38.19500732421875, 39.521690368652344, 40.84837341308594]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 5.0, 6.0, 9.0, 11.0, 11.0, 22.0, 19.0, 18.0, 27.0, 36.0, 35.0, 32.0, 35.0, 33.0, 42.0, 36.0, 48.0, 42.0, 37.0, 37.0, 33.0, 40.0, 39.0, 32.0, 33.0, 29.0, 22.0, 33.0, 22.0, 17.0, 23.0, 18.0, 19.0, 12.0, 14.0, 9.0, 12.0, 10.0, 7.0, 6.0, 3.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-6.5078125, -6.29742431640625, -6.0870361328125, -5.87664794921875, -5.666259765625, -5.45587158203125, -5.2454833984375, -5.03509521484375, -4.82470703125, -4.61431884765625, -4.4039306640625, -4.19354248046875, -3.983154296875, -3.77276611328125, -3.5623779296875, -3.35198974609375, -3.1416015625, -2.93121337890625, -2.7208251953125, -2.51043701171875, -2.300048828125, -2.08966064453125, -1.8792724609375, -1.66888427734375, -1.45849609375, -1.24810791015625, -1.0377197265625, -0.82733154296875, -0.616943359375, -0.40655517578125, -0.1961669921875, 0.01422119140625, 0.224609375, 0.43499755859375, 0.6453857421875, 0.85577392578125, 1.066162109375, 1.27655029296875, 1.4869384765625, 1.69732666015625, 1.90771484375, 2.11810302734375, 2.3284912109375, 2.53887939453125, 2.749267578125, 2.95965576171875, 3.1700439453125, 3.38043212890625, 3.5908203125, 3.80120849609375, 4.0115966796875, 4.22198486328125, 4.432373046875, 4.64276123046875, 4.8531494140625, 5.06353759765625, 5.27392578125, 5.48431396484375, 5.6947021484375, 5.90509033203125, 6.115478515625, 6.32586669921875, 6.5362548828125, 6.74664306640625, 6.95703125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 8.0, 5.0, 13.0, 18.0, 27.0, 58.0, 69.0, 88.0, 156.0, 233.0, 340.0, 487.0, 730.0, 1097.0, 1526.0, 2354.0, 3606.0, 5491.0, 8422.0, 13109.0, 20611.0, 33216.0, 55214.0, 91386.0, 150280.0, 208197.0, 172202.0, 107746.0, 64645.0, 39177.0, 24607.0, 15191.0, 9642.0, 6308.0, 4171.0, 2645.0, 1827.0, 1237.0, 806.0, 515.0, 311.0, 261.0, 158.0, 120.0, 86.0, 51.0, 37.0, 30.0, 16.0, 14.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.005859375, -0.974090576171875, -0.94232177734375, -0.910552978515625, -0.8787841796875, -0.847015380859375, -0.81524658203125, -0.783477783203125, -0.751708984375, -0.719940185546875, -0.68817138671875, -0.656402587890625, -0.6246337890625, -0.592864990234375, -0.56109619140625, -0.529327392578125, -0.49755859375, -0.465789794921875, -0.43402099609375, -0.402252197265625, -0.3704833984375, -0.338714599609375, -0.30694580078125, -0.275177001953125, -0.243408203125, -0.211639404296875, -0.17987060546875, -0.148101806640625, -0.1163330078125, -0.084564208984375, -0.05279541015625, -0.021026611328125, 0.0107421875, 0.042510986328125, 0.07427978515625, 0.106048583984375, 0.1378173828125, 0.169586181640625, 0.20135498046875, 0.233123779296875, 0.264892578125, 0.296661376953125, 0.32843017578125, 0.360198974609375, 0.3919677734375, 0.423736572265625, 0.45550537109375, 0.487274169921875, 0.51904296875, 0.550811767578125, 0.58258056640625, 0.614349365234375, 0.6461181640625, 0.677886962890625, 0.70965576171875, 0.741424560546875, 0.773193359375, 0.804962158203125, 0.83673095703125, 0.868499755859375, 0.9002685546875, 0.932037353515625, 0.96380615234375, 0.995574951171875, 1.02734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 4.0, 7.0, 6.0, 13.0, 9.0, 14.0, 16.0, 26.0, 29.0, 32.0, 23.0, 37.0, 41.0, 33.0, 41.0, 49.0, 44.0, 45.0, 1073.0, 41.0, 56.0, 50.0, 44.0, 45.0, 40.0, 39.0, 30.0, 23.0, 16.0, 20.0, 14.0, 19.0, 15.0, 5.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.0625, -5.8880615234375, -5.713623046875, -5.5391845703125, -5.36474609375, -5.1903076171875, -5.015869140625, -4.8414306640625, -4.6669921875, -4.4925537109375, -4.318115234375, -4.1436767578125, -3.96923828125, -3.7947998046875, -3.620361328125, -3.4459228515625, -3.271484375, -3.0970458984375, -2.922607421875, -2.7481689453125, -2.57373046875, -2.3992919921875, -2.224853515625, -2.0504150390625, -1.8759765625, -1.7015380859375, -1.527099609375, -1.3526611328125, -1.17822265625, -1.0037841796875, -0.829345703125, -0.6549072265625, -0.48046875, -0.3060302734375, -0.131591796875, 0.0428466796875, 0.21728515625, 0.3917236328125, 0.566162109375, 0.7406005859375, 0.9150390625, 1.0894775390625, 1.263916015625, 1.4383544921875, 1.61279296875, 1.7872314453125, 1.961669921875, 2.1361083984375, 2.310546875, 2.4849853515625, 2.659423828125, 2.8338623046875, 3.00830078125, 3.1827392578125, 3.357177734375, 3.5316162109375, 3.7060546875, 3.8804931640625, 4.054931640625, 4.2293701171875, 4.40380859375, 4.5782470703125, 4.752685546875, 4.9271240234375, 5.1015625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 8.0, 7.0, 15.0, 19.0, 24.0, 26.0, 46.0, 78.0, 118.0, 165.0, 270.0, 487.0, 757.0, 1376.0, 2445.0, 5056.0, 11381.0, 28337.0, 79838.0, 271877.0, 1314106.0, 254980.0, 76391.0, 27396.0, 11201.0, 4937.0, 2444.0, 1341.0, 750.0, 461.0, 260.0, 169.0, 121.0, 59.0, 53.0, 40.0, 31.0, 13.0, 13.0, 10.0, 8.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.458984375, -1.4140625, -1.369140625, -1.32421875, -1.279296875, -1.234375, -1.189453125, -1.14453125, -1.099609375, -1.0546875, -1.009765625, -0.96484375, -0.919921875, -0.875, -0.830078125, -0.78515625, -0.740234375, -0.6953125, -0.650390625, -0.60546875, -0.560546875, -0.515625, -0.470703125, -0.42578125, -0.380859375, -0.3359375, -0.291015625, -0.24609375, -0.201171875, -0.15625, -0.111328125, -0.06640625, -0.021484375, 0.0234375, 0.068359375, 0.11328125, 0.158203125, 0.203125, 0.248046875, 0.29296875, 0.337890625, 0.3828125, 0.427734375, 0.47265625, 0.517578125, 0.5625, 0.607421875, 0.65234375, 0.697265625, 0.7421875, 0.787109375, 0.83203125, 0.876953125, 0.921875, 0.966796875, 1.01171875, 1.056640625, 1.1015625, 1.146484375, 1.19140625, 1.236328125, 1.28125, 1.326171875, 1.37109375, 1.416015625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 3.0, 3.0, 5.0, 7.0, 8.0, 12.0, 8.0, 13.0, 19.0, 10.0, 25.0, 23.0, 24.0, 38.0, 44.0, 40.0, 113.0, 177.0, 146.0, 50.0, 35.0, 32.0, 27.0, 23.0, 26.0, 15.0, 14.0, 7.0, 4.0, 7.0, 4.0, 11.0, 3.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.264404296875, -0.25605010986328125, -0.2476959228515625, -0.23934173583984375, -0.230987548828125, -0.22263336181640625, -0.2142791748046875, -0.20592498779296875, -0.19757080078125, -0.18921661376953125, -0.1808624267578125, -0.17250823974609375, -0.164154052734375, -0.15579986572265625, -0.1474456787109375, -0.13909149169921875, -0.1307373046875, -0.12238311767578125, -0.1140289306640625, -0.10567474365234375, -0.097320556640625, -0.08896636962890625, -0.0806121826171875, -0.07225799560546875, -0.06390380859375, -0.05554962158203125, -0.0471954345703125, -0.03884124755859375, -0.030487060546875, -0.02213287353515625, -0.0137786865234375, -0.00542449951171875, 0.0029296875, 0.01128387451171875, 0.0196380615234375, 0.02799224853515625, 0.036346435546875, 0.04470062255859375, 0.0530548095703125, 0.06140899658203125, 0.06976318359375, 0.07811737060546875, 0.0864715576171875, 0.09482574462890625, 0.103179931640625, 0.11153411865234375, 0.1198883056640625, 0.12824249267578125, 0.1365966796875, 0.14495086669921875, 0.1533050537109375, 0.16165924072265625, 0.170013427734375, 0.17836761474609375, 0.1867218017578125, 0.19507598876953125, 0.20343017578125, 0.21178436279296875, 0.2201385498046875, 0.22849273681640625, 0.236846923828125, 0.24520111083984375, 0.2535552978515625, 0.26190948486328125, 0.270263671875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 5.0, 9.0, 5.0, 7.0, 13.0, 17.0, 21.0, 35.0, 47.0, 39.0, 76.0, 108.0, 184.0, 467.0, 6911.0, 1005521.0, 33441.0, 852.0, 240.0, 151.0, 84.0, 70.0, 54.0, 32.0, 31.0, 18.0, 19.0, 12.0, 8.0, 11.0, 9.0, 5.0, 6.0, 3.0, 6.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.21875, -5.05902099609375, -4.8992919921875, -4.73956298828125, -4.579833984375, -4.42010498046875, -4.2603759765625, -4.10064697265625, -3.94091796875, -3.78118896484375, -3.6214599609375, -3.46173095703125, -3.302001953125, -3.14227294921875, -2.9825439453125, -2.82281494140625, -2.6630859375, -2.50335693359375, -2.3436279296875, -2.18389892578125, -2.024169921875, -1.86444091796875, -1.7047119140625, -1.54498291015625, -1.38525390625, -1.22552490234375, -1.0657958984375, -0.90606689453125, -0.746337890625, -0.58660888671875, -0.4268798828125, -0.26715087890625, -0.107421875, 0.05230712890625, 0.2120361328125, 0.37176513671875, 0.531494140625, 0.69122314453125, 0.8509521484375, 1.01068115234375, 1.17041015625, 1.33013916015625, 1.4898681640625, 1.64959716796875, 1.809326171875, 1.96905517578125, 2.1287841796875, 2.28851318359375, 2.4482421875, 2.60797119140625, 2.7677001953125, 2.92742919921875, 3.087158203125, 3.24688720703125, 3.4066162109375, 3.56634521484375, 3.72607421875, 3.88580322265625, 4.0455322265625, 4.20526123046875, 4.364990234375, 4.52471923828125, 4.6844482421875, 4.84417724609375, 5.00390625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 6.0, 13.0, 21.0, 35.0, 59.0, 103.0, 159.0, 188.0, 152.0, 115.0, 65.0, 33.0, 20.0, 18.0, 8.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2705734074115753, -0.25496622920036316, -0.2393590658903122, -0.22375190258026123, -0.20814472436904907, -0.1925375610589981, -0.17693039774894714, -0.16132321953773499, -0.14571605622768402, -0.13010889291763306, -0.1145017147064209, -0.09889455139636993, -0.08328738063573837, -0.06768020987510681, -0.05207304656505585, -0.036465875804424286, -0.020858705043792725, -0.0052515361458063126, 0.0103556327521801, 0.025962799787521362, 0.041569970548152924, 0.057177141308784485, 0.07278430461883545, 0.08839147537946701, 0.10399864614009857, 0.11960581690073013, 0.1352129876613617, 0.15082015097141266, 0.16642731428146362, 0.18203449249267578, 0.19764165580272675, 0.2132488191127777, 0.22885602712631226, 0.24446319043636322, 0.2600703537464142, 0.27567753195762634, 0.2912847101688385, 0.30689185857772827, 0.32249903678894043, 0.3381062150001526, 0.35371339321136475, 0.3693205714225769, 0.3849277198314667, 0.40053489804267883, 0.416142076253891, 0.43174922466278076, 0.4473564028739929, 0.4629635810852051, 0.47857072949409485, 0.494177907705307, 0.5097850561141968, 0.5253922343254089, 0.5409994125366211, 0.5566065907478333, 0.5722137689590454, 0.5878208875656128, 0.603428065776825, 0.6190352439880371, 0.6346424221992493, 0.6502496004104614, 0.6658567190170288, 0.681463897228241, 0.6970710754394531, 0.7126782536506653, 0.7282854318618774]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 8.0, 6.0, 8.0, 7.0, 6.0, 16.0, 11.0, 10.0, 16.0, 17.0, 17.0, 20.0, 31.0, 25.0, 31.0, 45.0, 38.0, 35.0, 37.0, 43.0, 28.0, 28.0, 31.0, 29.0, 33.0, 37.0, 35.0, 45.0, 28.0, 24.0, 23.0, 30.0, 30.0, 26.0, 19.0, 21.0, 14.0, 13.0, 7.0, 12.0, 7.0, 12.0, 8.0, 10.0, 5.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.20523911714553833, -0.1985865980386734, -0.19193407893180847, -0.18528154492378235, -0.17862902581691742, -0.1719765067100525, -0.16532397270202637, -0.15867145359516144, -0.1520189344882965, -0.14536641538143158, -0.13871389627456665, -0.13206136226654053, -0.1254088431596756, -0.11875632405281067, -0.11210379749536514, -0.10545127093791962, -0.09879875183105469, -0.09214623272418976, -0.08549370616674423, -0.0788411796092987, -0.07218866050243378, -0.06553614139556885, -0.05888361483812332, -0.052231092005968094, -0.045578569173812866, -0.03892604634165764, -0.03227352350950241, -0.025621000677347183, -0.018968477845191956, -0.012315955013036728, -0.0056634321808815, 0.0009890906512737274, 0.007641613483428955, 0.014294136315584183, 0.02094665914773941, 0.027599181979894638, 0.034251704812049866, 0.04090422764420509, 0.04755675047636032, 0.05420927330851555, 0.060861796140670776, 0.0675143152475357, 0.07416684180498123, 0.08081936836242676, 0.08747188746929169, 0.09412440657615662, 0.10077693313360214, 0.10742945969104767, 0.1140819787979126, 0.12073449790477753, 0.12738701701164246, 0.13403955101966858, 0.1406920701265335, 0.14734458923339844, 0.15399712324142456, 0.1606496423482895, 0.16730216145515442, 0.17395468056201935, 0.18060719966888428, 0.1872597336769104, 0.19391225278377533, 0.20056477189064026, 0.20721730589866638, 0.2138698250055313, 0.22052234411239624]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 9.0, 11.0, 6.0, 13.0, 16.0, 27.0, 22.0, 29.0, 30.0, 31.0, 29.0, 41.0, 40.0, 38.0, 40.0, 41.0, 48.0, 40.0, 39.0, 42.0, 43.0, 32.0, 30.0, 28.0, 29.0, 33.0, 15.0, 27.0, 26.0, 16.0, 19.0, 15.0, 19.0, 10.0, 9.0, 12.0, 7.0, 3.0, 4.0, 6.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.26171875, -7.045654296875, -6.82958984375, -6.613525390625, -6.3974609375, -6.181396484375, -5.96533203125, -5.749267578125, -5.533203125, -5.317138671875, -5.10107421875, -4.885009765625, -4.6689453125, -4.452880859375, -4.23681640625, -4.020751953125, -3.8046875, -3.588623046875, -3.37255859375, -3.156494140625, -2.9404296875, -2.724365234375, -2.50830078125, -2.292236328125, -2.076171875, -1.860107421875, -1.64404296875, -1.427978515625, -1.2119140625, -0.995849609375, -0.77978515625, -0.563720703125, -0.34765625, -0.131591796875, 0.08447265625, 0.300537109375, 0.5166015625, 0.732666015625, 0.94873046875, 1.164794921875, 1.380859375, 1.596923828125, 1.81298828125, 2.029052734375, 2.2451171875, 2.461181640625, 2.67724609375, 2.893310546875, 3.109375, 3.325439453125, 3.54150390625, 3.757568359375, 3.9736328125, 4.189697265625, 4.40576171875, 4.621826171875, 4.837890625, 5.053955078125, 5.27001953125, 5.486083984375, 5.7021484375, 5.918212890625, 6.13427734375, 6.350341796875, 6.56640625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 7.0, 6.0, 13.0, 24.0, 26.0, 35.0, 47.0, 81.0, 110.0, 154.0, 212.0, 288.0, 479.0, 672.0, 946.0, 1579.0, 2361.0, 3732.0, 5980.0, 9997.0, 17606.0, 31768.0, 63285.0, 136423.0, 276410.0, 253057.0, 118041.0, 56122.0, 28801.0, 15728.0, 9173.0, 5499.0, 3414.0, 2204.0, 1375.0, 917.0, 597.0, 391.0, 312.0, 222.0, 122.0, 85.0, 62.0, 73.0, 29.0, 26.0, 18.0, 16.0, 9.0, 9.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-7.89453125, -7.6546630859375, -7.414794921875, -7.1749267578125, -6.93505859375, -6.6951904296875, -6.455322265625, -6.2154541015625, -5.9755859375, -5.7357177734375, -5.495849609375, -5.2559814453125, -5.01611328125, -4.7762451171875, -4.536376953125, -4.2965087890625, -4.056640625, -3.8167724609375, -3.576904296875, -3.3370361328125, -3.09716796875, -2.8572998046875, -2.617431640625, -2.3775634765625, -2.1376953125, -1.8978271484375, -1.657958984375, -1.4180908203125, -1.17822265625, -0.9383544921875, -0.698486328125, -0.4586181640625, -0.21875, 0.0211181640625, 0.260986328125, 0.5008544921875, 0.74072265625, 0.9805908203125, 1.220458984375, 1.4603271484375, 1.7001953125, 1.9400634765625, 2.179931640625, 2.4197998046875, 2.65966796875, 2.8995361328125, 3.139404296875, 3.3792724609375, 3.619140625, 3.8590087890625, 4.098876953125, 4.3387451171875, 4.57861328125, 4.8184814453125, 5.058349609375, 5.2982177734375, 5.5380859375, 5.7779541015625, 6.017822265625, 6.2576904296875, 6.49755859375, 6.7374267578125, 6.977294921875, 7.2171630859375, 7.45703125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 6.0, 3.0, 7.0, 9.0, 12.0, 14.0, 19.0, 13.0, 15.0, 24.0, 24.0, 26.0, 28.0, 30.0, 41.0, 52.0, 65.0, 72.0, 135.0, 287.0, 1341.0, 223.0, 123.0, 84.0, 50.0, 40.0, 44.0, 41.0, 23.0, 31.0, 19.0, 19.0, 25.0, 16.0, 15.0, 11.0, 15.0, 6.0, 5.0, 6.0, 7.0, 4.0, 4.0, 7.0, 1.0, 1.0, 2.0, 3.0], "bins": [-23.359375, -22.718505859375, -22.07763671875, -21.436767578125, -20.7958984375, -20.155029296875, -19.51416015625, -18.873291015625, -18.232421875, -17.591552734375, -16.95068359375, -16.309814453125, -15.6689453125, -15.028076171875, -14.38720703125, -13.746337890625, -13.10546875, -12.464599609375, -11.82373046875, -11.182861328125, -10.5419921875, -9.901123046875, -9.26025390625, -8.619384765625, -7.978515625, -7.337646484375, -6.69677734375, -6.055908203125, -5.4150390625, -4.774169921875, -4.13330078125, -3.492431640625, -2.8515625, -2.210693359375, -1.56982421875, -0.928955078125, -0.2880859375, 0.352783203125, 0.99365234375, 1.634521484375, 2.275390625, 2.916259765625, 3.55712890625, 4.197998046875, 4.8388671875, 5.479736328125, 6.12060546875, 6.761474609375, 7.40234375, 8.043212890625, 8.68408203125, 9.324951171875, 9.9658203125, 10.606689453125, 11.24755859375, 11.888427734375, 12.529296875, 13.170166015625, 13.81103515625, 14.451904296875, 15.0927734375, 15.733642578125, 16.37451171875, 17.015380859375, 17.65625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 4.0, 9.0, 18.0, 14.0, 13.0, 16.0, 33.0, 32.0, 33.0, 52.0, 90.0, 108.0, 141.0, 213.0, 316.0, 551.0, 1442.0, 8278.0, 105742.0, 2792083.0, 220279.0, 12425.0, 1987.0, 643.0, 281.0, 239.0, 159.0, 109.0, 92.0, 49.0, 50.0, 45.0, 29.0, 21.0, 18.0, 20.0, 13.0, 10.0, 14.0, 7.0, 2.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0], "bins": [-37.0625, -35.95947265625, -34.8564453125, -33.75341796875, -32.650390625, -31.54736328125, -30.4443359375, -29.34130859375, -28.23828125, -27.13525390625, -26.0322265625, -24.92919921875, -23.826171875, -22.72314453125, -21.6201171875, -20.51708984375, -19.4140625, -18.31103515625, -17.2080078125, -16.10498046875, -15.001953125, -13.89892578125, -12.7958984375, -11.69287109375, -10.58984375, -9.48681640625, -8.3837890625, -7.28076171875, -6.177734375, -5.07470703125, -3.9716796875, -2.86865234375, -1.765625, -0.66259765625, 0.4404296875, 1.54345703125, 2.646484375, 3.74951171875, 4.8525390625, 5.95556640625, 7.05859375, 8.16162109375, 9.2646484375, 10.36767578125, 11.470703125, 12.57373046875, 13.6767578125, 14.77978515625, 15.8828125, 16.98583984375, 18.0888671875, 19.19189453125, 20.294921875, 21.39794921875, 22.5009765625, 23.60400390625, 24.70703125, 25.81005859375, 26.9130859375, 28.01611328125, 29.119140625, 30.22216796875, 31.3251953125, 32.42822265625, 33.53125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [3.0, 3.0, 287.0, 684.0, 36.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.933895111083984, -21.49590301513672, -12.057910919189453, -2.6199188232421875, 6.818073272705078, 16.256065368652344, 25.69405746459961, 35.13205337524414, 44.57004165649414, 54.008033752441406, 63.44602584838867, 72.88401794433594, 82.32200622558594, 91.76000213623047, 101.197998046875, 110.635986328125, 120.073974609375, 129.511962890625, 138.949951171875, 148.38795471191406, 157.82594299316406, 167.26393127441406, 176.70193481445312, 186.13992309570312, 195.57791137695312, 205.01589965820312, 214.45388793945312, 223.8918914794922, 233.3298797607422, 242.7678680419922, 252.20587158203125, 261.64385986328125, 271.08184814453125, 280.51983642578125, 289.95782470703125, 299.39581298828125, 308.83380126953125, 318.2718200683594, 327.7098083496094, 337.1477966308594, 346.5857849121094, 356.0237731933594, 365.4617614746094, 374.8997497558594, 384.3377685546875, 393.7757568359375, 403.2137451171875, 412.6517333984375, 422.0897216796875, 431.5277099609375, 440.9656982421875, 450.4036865234375, 459.8416748046875, 469.2796936035156, 478.7176818847656, 488.1556701660156, 497.5936584472656, 507.0316467285156, 516.4696655273438, 525.9076538085938, 535.3456420898438, 544.7836303710938, 554.2216186523438, 563.6596069335938, 573.0975952148438]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 10.0, 7.0, 14.0, 8.0, 7.0, 12.0, 17.0, 17.0, 22.0, 20.0, 25.0, 24.0, 40.0, 30.0, 35.0, 37.0, 34.0, 34.0, 46.0, 34.0, 44.0, 42.0, 34.0, 40.0, 39.0, 32.0, 32.0, 27.0, 32.0, 30.0, 20.0, 22.0, 27.0, 23.0, 23.0, 10.0, 7.0, 7.0, 14.0, 1.0, 1.0, 0.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.67521667480469, -48.023345947265625, -46.37147903442383, -44.719608306884766, -43.06774139404297, -41.415870666503906, -39.763999938964844, -38.11213302612305, -36.460262298583984, -34.80839157104492, -33.156524658203125, -31.504653930664062, -29.852785110473633, -28.200916290283203, -26.549047470092773, -24.897178649902344, -23.245309829711914, -21.593441009521484, -19.941572189331055, -18.289703369140625, -16.637832641601562, -14.985963821411133, -13.334095001220703, -11.682225227355957, -10.030356407165527, -8.378487586975098, -6.726617813110352, -5.074748992919922, -3.422879695892334, -1.771010398864746, -0.1191415786743164, 1.5327281951904297, 3.1845970153808594, 4.836466312408447, 6.488335609436035, 8.140204429626465, 9.792074203491211, 11.44394302368164, 13.09581184387207, 14.747681617736816, 16.399551391601562, 18.051420211791992, 19.703289031982422, 21.355159759521484, 23.007028579711914, 24.658897399902344, 26.310766220092773, 27.962635040283203, 29.614503860473633, 31.266372680664062, 32.918243408203125, 34.57011032104492, 36.221981048583984, 37.87384796142578, 39.525718688964844, 41.177589416503906, 42.8294563293457, 44.481327056884766, 46.13319396972656, 47.785064697265625, 49.43693161010742, 51.088802337646484, 52.74066925048828, 54.392539978027344, 56.044410705566406]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 6.0, 2.0, 3.0, 6.0, 13.0, 18.0, 10.0, 19.0, 17.0, 34.0, 24.0, 42.0, 33.0, 43.0, 37.0, 34.0, 52.0, 40.0, 48.0, 40.0, 37.0, 43.0, 36.0, 32.0, 44.0, 35.0, 32.0, 26.0, 24.0, 26.0, 19.0, 27.0, 15.0, 16.0, 20.0, 9.0, 8.0, 13.0, 3.0, 9.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.83984375, -7.6077880859375, -7.375732421875, -7.1436767578125, -6.91162109375, -6.6795654296875, -6.447509765625, -6.2154541015625, -5.9833984375, -5.7513427734375, -5.519287109375, -5.2872314453125, -5.05517578125, -4.8231201171875, -4.591064453125, -4.3590087890625, -4.126953125, -3.8948974609375, -3.662841796875, -3.4307861328125, -3.19873046875, -2.9666748046875, -2.734619140625, -2.5025634765625, -2.2705078125, -2.0384521484375, -1.806396484375, -1.5743408203125, -1.34228515625, -1.1102294921875, -0.878173828125, -0.6461181640625, -0.4140625, -0.1820068359375, 0.050048828125, 0.2821044921875, 0.51416015625, 0.7462158203125, 0.978271484375, 1.2103271484375, 1.4423828125, 1.6744384765625, 1.906494140625, 2.1385498046875, 2.37060546875, 2.6026611328125, 2.834716796875, 3.0667724609375, 3.298828125, 3.5308837890625, 3.762939453125, 3.9949951171875, 4.22705078125, 4.4591064453125, 4.691162109375, 4.9232177734375, 5.1552734375, 5.3873291015625, 5.619384765625, 5.8514404296875, 6.08349609375, 6.3155517578125, 6.547607421875, 6.7796630859375, 7.01171875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 7.0, 8.0, 14.0, 17.0, 20.0, 20.0, 37.0, 77.0, 74.0, 118.0, 204.0, 309.0, 541.0, 1033.0, 2059.0, 4286.0, 10478.0, 29729.0, 120237.0, 697800.0, 2323636.0, 811034.0, 137418.0, 33496.0, 11538.0, 5007.0, 2314.0, 1125.0, 640.0, 355.0, 198.0, 139.0, 88.0, 64.0, 49.0, 38.0, 18.0, 15.0, 10.0, 13.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0], "bins": [-12.875, -12.522705078125, -12.17041015625, -11.818115234375, -11.4658203125, -11.113525390625, -10.76123046875, -10.408935546875, -10.056640625, -9.704345703125, -9.35205078125, -8.999755859375, -8.6474609375, -8.295166015625, -7.94287109375, -7.590576171875, -7.23828125, -6.885986328125, -6.53369140625, -6.181396484375, -5.8291015625, -5.476806640625, -5.12451171875, -4.772216796875, -4.419921875, -4.067626953125, -3.71533203125, -3.363037109375, -3.0107421875, -2.658447265625, -2.30615234375, -1.953857421875, -1.6015625, -1.249267578125, -0.89697265625, -0.544677734375, -0.1923828125, 0.159912109375, 0.51220703125, 0.864501953125, 1.216796875, 1.569091796875, 1.92138671875, 2.273681640625, 2.6259765625, 2.978271484375, 3.33056640625, 3.682861328125, 4.03515625, 4.387451171875, 4.73974609375, 5.092041015625, 5.4443359375, 5.796630859375, 6.14892578125, 6.501220703125, 6.853515625, 7.205810546875, 7.55810546875, 7.910400390625, 8.2626953125, 8.614990234375, 8.96728515625, 9.319580078125, 9.671875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 7.0, 10.0, 11.0, 15.0, 19.0, 23.0, 28.0, 28.0, 51.0, 84.0, 113.0, 168.0, 284.0, 378.0, 581.0, 600.0, 481.0, 365.0, 242.0, 146.0, 108.0, 82.0, 63.0, 50.0, 27.0, 30.0, 13.0, 12.0, 13.0, 11.0, 11.0, 2.0, 2.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.6451416015625, -8.274658203125, -7.9041748046875, -7.53369140625, -7.1632080078125, -6.792724609375, -6.4222412109375, -6.0517578125, -5.6812744140625, -5.310791015625, -4.9403076171875, -4.56982421875, -4.1993408203125, -3.828857421875, -3.4583740234375, -3.087890625, -2.7174072265625, -2.346923828125, -1.9764404296875, -1.60595703125, -1.2354736328125, -0.864990234375, -0.4945068359375, -0.1240234375, 0.2464599609375, 0.616943359375, 0.9874267578125, 1.35791015625, 1.7283935546875, 2.098876953125, 2.4693603515625, 2.83984375, 3.2103271484375, 3.580810546875, 3.9512939453125, 4.32177734375, 4.6922607421875, 5.062744140625, 5.4332275390625, 5.8037109375, 6.1741943359375, 6.544677734375, 6.9151611328125, 7.28564453125, 7.6561279296875, 8.026611328125, 8.3970947265625, 8.767578125, 9.1380615234375, 9.508544921875, 9.8790283203125, 10.24951171875, 10.6199951171875, 10.990478515625, 11.3609619140625, 11.7314453125, 12.1019287109375, 12.472412109375, 12.8428955078125, 13.21337890625, 13.5838623046875, 13.954345703125, 14.3248291015625, 14.6953125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 15.0, 12.0, 11.0, 14.0, 24.0, 36.0, 43.0, 59.0, 110.0, 148.0, 197.0, 423.0, 1097.0, 6228.0, 90057.0, 3523261.0, 548953.0, 19883.0, 2290.0, 607.0, 294.0, 167.0, 92.0, 72.0, 37.0, 34.0, 29.0, 19.0, 14.0, 14.0, 12.0, 6.0, 4.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0], "bins": [-47.53125, -46.335205078125, -45.13916015625, -43.943115234375, -42.7470703125, -41.551025390625, -40.35498046875, -39.158935546875, -37.962890625, -36.766845703125, -35.57080078125, -34.374755859375, -33.1787109375, -31.982666015625, -30.78662109375, -29.590576171875, -28.39453125, -27.198486328125, -26.00244140625, -24.806396484375, -23.6103515625, -22.414306640625, -21.21826171875, -20.022216796875, -18.826171875, -17.630126953125, -16.43408203125, -15.238037109375, -14.0419921875, -12.845947265625, -11.64990234375, -10.453857421875, -9.2578125, -8.061767578125, -6.86572265625, -5.669677734375, -4.4736328125, -3.277587890625, -2.08154296875, -0.885498046875, 0.310546875, 1.506591796875, 2.70263671875, 3.898681640625, 5.0947265625, 6.290771484375, 7.48681640625, 8.682861328125, 9.87890625, 11.074951171875, 12.27099609375, 13.467041015625, 14.6630859375, 15.859130859375, 17.05517578125, 18.251220703125, 19.447265625, 20.643310546875, 21.83935546875, 23.035400390625, 24.2314453125, 25.427490234375, 26.62353515625, 27.819580078125, 29.015625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 14.0, 108.0, 382.0, 388.0, 104.0, 13.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.61289978027344, -146.72996520996094, -140.84703063964844, -134.964111328125, -129.0811767578125, -123.1982421875, -117.3153076171875, -111.432373046875, -105.54944610595703, -99.66651153564453, -93.78358459472656, -87.90065002441406, -82.01771545410156, -76.1347885131836, -70.2518539428711, -64.36892700195312, -58.485992431640625, -52.60306167602539, -46.720130920410156, -40.837196350097656, -34.95426559448242, -29.071334838867188, -23.188400268554688, -17.305469512939453, -11.422538757324219, -5.539607048034668, 0.3433246612548828, 6.22625732421875, 12.109188079833984, 17.99211883544922, 23.87505340576172, 29.757984161376953, 35.64093017578125, 41.523860931396484, 47.40679168701172, 53.28972625732422, 59.17265701293945, 65.05558776855469, 70.93852233886719, 76.82145690917969, 82.70438385009766, 88.58731842041016, 94.47024536132812, 100.35317993164062, 106.23611450195312, 112.1190414428711, 118.0019760131836, 123.88490295410156, 129.76783752441406, 135.65077209472656, 141.53370666503906, 147.4166259765625, 153.299560546875, 159.1824951171875, 165.0654296875, 170.9483642578125, 176.831298828125, 182.7142333984375, 188.59716796875, 194.4801025390625, 200.36302185058594, 206.24595642089844, 212.12889099121094, 218.01182556152344, 223.89474487304688]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 6.0, 4.0, 13.0, 12.0, 15.0, 13.0, 12.0, 19.0, 24.0, 26.0, 30.0, 22.0, 31.0, 38.0, 30.0, 39.0, 40.0, 37.0, 33.0, 35.0, 37.0, 46.0, 36.0, 43.0, 42.0, 24.0, 30.0, 37.0, 41.0, 28.0, 21.0, 23.0, 14.0, 12.0, 16.0, 18.0, 6.0, 9.0, 6.0, 10.0, 3.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.40915298461914, -31.302013397216797, -30.194873809814453, -29.08773422241211, -27.980594635009766, -26.873455047607422, -25.766313552856445, -24.6591739654541, -23.552034378051758, -22.444894790649414, -21.33775520324707, -20.230615615844727, -19.12347412109375, -18.016334533691406, -16.909194946289062, -15.802055358886719, -14.694915771484375, -13.587776184082031, -12.480636596679688, -11.373496055603027, -10.266356468200684, -9.15921688079834, -8.05207633972168, -6.944936752319336, -5.837797164916992, -4.730657577514648, -3.6235175132751465, -2.5163776874542236, -1.4092378616333008, -0.30209827423095703, 0.8050417900085449, 1.9121818542480469, 3.019317626953125, 4.126457214355469, 5.233597278594971, 6.340737342834473, 7.447876930236816, 8.55501651763916, 9.66215705871582, 10.769296646118164, 11.876436233520508, 12.983575820922852, 14.090715408325195, 15.197855949401855, 16.304996490478516, 17.41213607788086, 18.519275665283203, 19.626415252685547, 20.73355484008789, 21.840694427490234, 22.947834014892578, 24.054973602294922, 25.162113189697266, 26.26925277709961, 27.376394271850586, 28.48353385925293, 29.590673446655273, 30.697813034057617, 31.80495262145996, 32.91209411621094, 34.01923370361328, 35.126373291015625, 36.23351287841797, 37.34065246582031, 38.447792053222656]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 6.0, 8.0, 3.0, 14.0, 21.0, 28.0, 23.0, 27.0, 29.0, 33.0, 40.0, 38.0, 35.0, 37.0, 39.0, 40.0, 45.0, 48.0, 47.0, 52.0, 33.0, 47.0, 43.0, 32.0, 33.0, 25.0, 19.0, 21.0, 26.0, 18.0, 13.0, 10.0, 12.0, 11.0, 11.0, 6.0, 10.0, 1.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.1640625, -6.9366455078125, -6.709228515625, -6.4818115234375, -6.25439453125, -6.0269775390625, -5.799560546875, -5.5721435546875, -5.3447265625, -5.1173095703125, -4.889892578125, -4.6624755859375, -4.43505859375, -4.2076416015625, -3.980224609375, -3.7528076171875, -3.525390625, -3.2979736328125, -3.070556640625, -2.8431396484375, -2.61572265625, -2.3883056640625, -2.160888671875, -1.9334716796875, -1.7060546875, -1.4786376953125, -1.251220703125, -1.0238037109375, -0.79638671875, -0.5689697265625, -0.341552734375, -0.1141357421875, 0.11328125, 0.3406982421875, 0.568115234375, 0.7955322265625, 1.02294921875, 1.2503662109375, 1.477783203125, 1.7052001953125, 1.9326171875, 2.1600341796875, 2.387451171875, 2.6148681640625, 2.84228515625, 3.0697021484375, 3.297119140625, 3.5245361328125, 3.751953125, 3.9793701171875, 4.206787109375, 4.4342041015625, 4.66162109375, 4.8890380859375, 5.116455078125, 5.3438720703125, 5.5712890625, 5.7987060546875, 6.026123046875, 6.2535400390625, 6.48095703125, 6.7083740234375, 6.935791015625, 7.1632080078125, 7.390625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 9.0, 14.0, 12.0, 18.0, 39.0, 46.0, 53.0, 81.0, 139.0, 158.0, 225.0, 319.0, 422.0, 615.0, 892.0, 1350.0, 1908.0, 2906.0, 4277.0, 6289.0, 9727.0, 14817.0, 23010.0, 36879.0, 58996.0, 98129.0, 158618.0, 203381.0, 160788.0, 99406.0, 59676.0, 37215.0, 22986.0, 14944.0, 9785.0, 6569.0, 4286.0, 2885.0, 2034.0, 1408.0, 1004.0, 661.0, 450.0, 333.0, 242.0, 165.0, 111.0, 76.0, 64.0, 41.0, 33.0, 27.0, 16.0, 9.0, 8.0, 3.0, 5.0, 2.0, 5.0], "bins": [-0.81689453125, -0.7917709350585938, -0.7666473388671875, -0.7415237426757812, -0.716400146484375, -0.6912765502929688, -0.6661529541015625, -0.6410293579101562, -0.61590576171875, -0.5907821655273438, -0.5656585693359375, -0.5405349731445312, -0.515411376953125, -0.49028778076171875, -0.4651641845703125, -0.44004058837890625, -0.4149169921875, -0.38979339599609375, -0.3646697998046875, -0.33954620361328125, -0.314422607421875, -0.28929901123046875, -0.2641754150390625, -0.23905181884765625, -0.21392822265625, -0.18880462646484375, -0.1636810302734375, -0.13855743408203125, -0.113433837890625, -0.08831024169921875, -0.0631866455078125, -0.03806304931640625, -0.012939453125, 0.01218414306640625, 0.0373077392578125, 0.06243133544921875, 0.087554931640625, 0.11267852783203125, 0.1378021240234375, 0.16292572021484375, 0.18804931640625, 0.21317291259765625, 0.2382965087890625, 0.26342010498046875, 0.288543701171875, 0.31366729736328125, 0.3387908935546875, 0.36391448974609375, 0.3890380859375, 0.41416168212890625, 0.4392852783203125, 0.46440887451171875, 0.489532470703125, 0.5146560668945312, 0.5397796630859375, 0.5649032592773438, 0.59002685546875, 0.6151504516601562, 0.6402740478515625, 0.6653976440429688, 0.690521240234375, 0.7156448364257812, 0.7407684326171875, 0.7658920288085938, 0.791015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 9.0, 7.0, 8.0, 5.0, 11.0, 19.0, 19.0, 20.0, 14.0, 25.0, 30.0, 30.0, 27.0, 37.0, 27.0, 35.0, 41.0, 53.0, 50.0, 1076.0, 44.0, 37.0, 41.0, 43.0, 60.0, 30.0, 29.0, 36.0, 27.0, 21.0, 24.0, 19.0, 13.0, 9.0, 10.0, 10.0, 7.0, 7.0, 9.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.16796875, -5.00726318359375, -4.8465576171875, -4.68585205078125, -4.525146484375, -4.36444091796875, -4.2037353515625, -4.04302978515625, -3.88232421875, -3.72161865234375, -3.5609130859375, -3.40020751953125, -3.239501953125, -3.07879638671875, -2.9180908203125, -2.75738525390625, -2.5966796875, -2.43597412109375, -2.2752685546875, -2.11456298828125, -1.953857421875, -1.79315185546875, -1.6324462890625, -1.47174072265625, -1.31103515625, -1.15032958984375, -0.9896240234375, -0.82891845703125, -0.668212890625, -0.50750732421875, -0.3468017578125, -0.18609619140625, -0.025390625, 0.13531494140625, 0.2960205078125, 0.45672607421875, 0.617431640625, 0.77813720703125, 0.9388427734375, 1.09954833984375, 1.26025390625, 1.42095947265625, 1.5816650390625, 1.74237060546875, 1.903076171875, 2.06378173828125, 2.2244873046875, 2.38519287109375, 2.5458984375, 2.70660400390625, 2.8673095703125, 3.02801513671875, 3.188720703125, 3.34942626953125, 3.5101318359375, 3.67083740234375, 3.83154296875, 3.99224853515625, 4.1529541015625, 4.31365966796875, 4.474365234375, 4.63507080078125, 4.7957763671875, 4.95648193359375, 5.1171875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 13.0, 20.0, 28.0, 32.0, 57.0, 104.0, 174.0, 303.0, 577.0, 1109.0, 2138.0, 4745.0, 10561.0, 24522.0, 60870.0, 167327.0, 1196999.0, 434337.0, 116362.0, 43645.0, 18120.0, 7875.0, 3581.0, 1738.0, 851.0, 443.0, 228.0, 145.0, 84.0, 53.0, 20.0, 26.0, 10.0, 9.0, 11.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88330078125, -0.8490982055664062, -0.8148956298828125, -0.7806930541992188, -0.746490478515625, -0.7122879028320312, -0.6780853271484375, -0.6438827514648438, -0.60968017578125, -0.5754776000976562, -0.5412750244140625, -0.5070724487304688, -0.472869873046875, -0.43866729736328125, -0.4044647216796875, -0.37026214599609375, -0.3360595703125, -0.30185699462890625, -0.2676544189453125, -0.23345184326171875, -0.199249267578125, -0.16504669189453125, -0.1308441162109375, -0.09664154052734375, -0.06243896484375, -0.02823638916015625, 0.0059661865234375, 0.04016876220703125, 0.074371337890625, 0.10857391357421875, 0.1427764892578125, 0.17697906494140625, 0.211181640625, 0.24538421630859375, 0.2795867919921875, 0.31378936767578125, 0.347991943359375, 0.38219451904296875, 0.4163970947265625, 0.45059967041015625, 0.48480224609375, 0.5190048217773438, 0.5532073974609375, 0.5874099731445312, 0.621612548828125, 0.6558151245117188, 0.6900177001953125, 0.7242202758789062, 0.7584228515625, 0.7926254272460938, 0.8268280029296875, 0.8610305786132812, 0.895233154296875, 0.9294357299804688, 0.9636383056640625, 0.9978408813476562, 1.03204345703125, 1.0662460327148438, 1.1004486083984375, 1.1346511840820312, 1.168853759765625, 1.2030563354492188, 1.2372589111328125, 1.2714614868164062, 1.3056640625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 9.0, 14.0, 24.0, 15.0, 48.0, 58.0, 81.0, 122.0, 119.0, 138.0, 102.0, 74.0, 46.0, 30.0, 31.0, 21.0, 13.0, 15.0, 5.0, 5.0, 5.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.143798828125, -0.13861846923828125, -0.1334381103515625, -0.12825775146484375, -0.123077392578125, -0.11789703369140625, -0.1127166748046875, -0.10753631591796875, -0.10235595703125, -0.09717559814453125, -0.0919952392578125, -0.08681488037109375, -0.081634521484375, -0.07645416259765625, -0.0712738037109375, -0.06609344482421875, -0.0609130859375, -0.05573272705078125, -0.0505523681640625, -0.04537200927734375, -0.040191650390625, -0.03501129150390625, -0.0298309326171875, -0.02465057373046875, -0.01947021484375, -0.01428985595703125, -0.0091094970703125, -0.00392913818359375, 0.001251220703125, 0.00643157958984375, 0.0116119384765625, 0.01679229736328125, 0.02197265625, 0.02715301513671875, 0.0323333740234375, 0.03751373291015625, 0.042694091796875, 0.04787445068359375, 0.0530548095703125, 0.05823516845703125, 0.06341552734375, 0.06859588623046875, 0.0737762451171875, 0.07895660400390625, 0.084136962890625, 0.08931732177734375, 0.0944976806640625, 0.09967803955078125, 0.1048583984375, 0.11003875732421875, 0.1152191162109375, 0.12039947509765625, 0.125579833984375, 0.13076019287109375, 0.1359405517578125, 0.14112091064453125, 0.14630126953125, 0.15148162841796875, 0.1566619873046875, 0.16184234619140625, 0.167022705078125, 0.17220306396484375, 0.1773834228515625, 0.18256378173828125, 0.187744140625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 4.0, 12.0, 13.0, 12.0, 11.0, 20.0, 29.0, 61.0, 84.0, 178.0, 494.0, 348892.0, 697810.0, 503.0, 189.0, 100.0, 47.0, 27.0, 13.0, 19.0, 15.0, 2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.47265625, -4.348480224609375, -4.22430419921875, -4.100128173828125, -3.9759521484375, -3.851776123046875, -3.72760009765625, -3.603424072265625, -3.479248046875, -3.355072021484375, -3.23089599609375, -3.106719970703125, -2.9825439453125, -2.858367919921875, -2.73419189453125, -2.610015869140625, -2.48583984375, -2.361663818359375, -2.23748779296875, -2.113311767578125, -1.9891357421875, -1.864959716796875, -1.74078369140625, -1.616607666015625, -1.492431640625, -1.368255615234375, -1.24407958984375, -1.119903564453125, -0.9957275390625, -0.871551513671875, -0.74737548828125, -0.623199462890625, -0.4990234375, -0.374847412109375, -0.25067138671875, -0.126495361328125, -0.0023193359375, 0.121856689453125, 0.24603271484375, 0.370208740234375, 0.494384765625, 0.618560791015625, 0.74273681640625, 0.866912841796875, 0.9910888671875, 1.115264892578125, 1.23944091796875, 1.363616943359375, 1.48779296875, 1.611968994140625, 1.73614501953125, 1.860321044921875, 1.9844970703125, 2.108673095703125, 2.23284912109375, 2.357025146484375, 2.481201171875, 2.605377197265625, 2.72955322265625, 2.853729248046875, 2.9779052734375, 3.102081298828125, 3.22625732421875, 3.350433349609375, 3.474609375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [6.0, 119.0, 643.0, 232.0, 19.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06312727183103561, -0.03839648887515068, -0.013665705919265747, 0.011065073311328888, 0.03579585999250412, 0.06052664667367935, 0.08525741845369339, 0.10998820513486862, 0.13471898436546326, 0.1594497710466385, 0.18418055772781372, 0.20891132950782776, 0.233642116189003, 0.2583729028701782, 0.28310367465019226, 0.3078344464302063, 0.3325652480125427, 0.35729601979255676, 0.3820268213748932, 0.4067575931549072, 0.43148839473724365, 0.4562191665172577, 0.48094993829727173, 0.5056807398796082, 0.5304115414619446, 0.555142343044281, 0.5798730850219727, 0.6046038866043091, 0.6293346881866455, 0.6540654897689819, 0.6787962317466736, 0.70352703332901, 0.7282577753067017, 0.7529885768890381, 0.7777193188667297, 0.8024501204490662, 0.8271809220314026, 0.8519116640090942, 0.8766424655914307, 0.9013732671737671, 0.9261040687561035, 0.9508348703384399, 0.9755656123161316, 1.0002963542938232, 1.0250271558761597, 1.049757957458496, 1.0744887590408325, 1.099219560623169, 1.1239502429962158, 1.1486810445785522, 1.1734118461608887, 1.1981425285339355, 1.222873330116272, 1.2476041316986084, 1.2723349332809448, 1.2970657348632812, 1.3217965364456177, 1.346527338027954, 1.3712581396102905, 1.395988941192627, 1.4207196235656738, 1.4454504251480103, 1.4701812267303467, 1.494912028312683, 1.5196428298950195]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 6.0, 8.0, 18.0, 12.0, 17.0, 21.0, 27.0, 28.0, 22.0, 37.0, 39.0, 34.0, 35.0, 47.0, 26.0, 34.0, 31.0, 43.0, 39.0, 37.0, 36.0, 36.0, 38.0, 32.0, 23.0, 43.0, 30.0, 28.0, 20.0, 26.0, 20.0, 20.0, 17.0, 10.0, 15.0, 7.0, 10.0, 5.0, 2.0, 1.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.11109155416488647, -0.10736467689275742, -0.10363780707120895, -0.0999109297990799, -0.09618405997753143, -0.09245718270540237, -0.08873030543327332, -0.08500343561172485, -0.0812765583395958, -0.07754968106746674, -0.07382281124591827, -0.07009593397378922, -0.06636905670166016, -0.0626421868801117, -0.058915309607982635, -0.055188436061143875, -0.051461562514305115, -0.047734688967466354, -0.044007815420627594, -0.040280938148498535, -0.036554064601659775, -0.032827191054821014, -0.029100315645337105, -0.025373440235853195, -0.021646566689014435, -0.017919693142175674, -0.014192817732691765, -0.01046594325453043, -0.006739068776369095, -0.0030121952295303345, 0.0007146801799535751, 0.004441555589437485, 0.008168429136276245, 0.01189530361443758, 0.015622178092598915, 0.019349053502082825, 0.023075927048921585, 0.026802800595760345, 0.030529676005244255, 0.034256551414728165, 0.037983424961566925, 0.041710298508405685, 0.045437172055244446, 0.049164049327373505, 0.052890922874212265, 0.056617796421051025, 0.060344673693180084, 0.06407155096530914, 0.0677984207868576, 0.07152529805898666, 0.07525216788053513, 0.07897904515266418, 0.08270591497421265, 0.0864327922463417, 0.09015966951847076, 0.09388653934001923, 0.09761341661214828, 0.10134029388427734, 0.1050671637058258, 0.10879404097795486, 0.11252091825008392, 0.11624778807163239, 0.11997466534376144, 0.1237015426158905, 0.12742841243743896]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 7.0, 10.0, 7.0, 22.0, 24.0, 36.0, 27.0, 45.0, 36.0, 32.0, 53.0, 31.0, 47.0, 52.0, 42.0, 51.0, 60.0, 32.0, 33.0, 41.0, 48.0, 30.0, 42.0, 28.0, 30.0, 15.0, 20.0, 25.0, 9.0, 7.0, 15.0, 9.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.6171875, -7.37451171875, -7.1318359375, -6.88916015625, -6.646484375, -6.40380859375, -6.1611328125, -5.91845703125, -5.67578125, -5.43310546875, -5.1904296875, -4.94775390625, -4.705078125, -4.46240234375, -4.2197265625, -3.97705078125, -3.734375, -3.49169921875, -3.2490234375, -3.00634765625, -2.763671875, -2.52099609375, -2.2783203125, -2.03564453125, -1.79296875, -1.55029296875, -1.3076171875, -1.06494140625, -0.822265625, -0.57958984375, -0.3369140625, -0.09423828125, 0.1484375, 0.39111328125, 0.6337890625, 0.87646484375, 1.119140625, 1.36181640625, 1.6044921875, 1.84716796875, 2.08984375, 2.33251953125, 2.5751953125, 2.81787109375, 3.060546875, 3.30322265625, 3.5458984375, 3.78857421875, 4.03125, 4.27392578125, 4.5166015625, 4.75927734375, 5.001953125, 5.24462890625, 5.4873046875, 5.72998046875, 5.97265625, 6.21533203125, 6.4580078125, 6.70068359375, 6.943359375, 7.18603515625, 7.4287109375, 7.67138671875, 7.9140625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 5.0, 5.0, 3.0, 5.0, 13.0, 10.0, 13.0, 28.0, 23.0, 23.0, 51.0, 77.0, 145.0, 240.0, 482.0, 848.0, 1856.0, 3996.0, 9628.0, 25801.0, 88221.0, 452672.0, 355952.0, 70929.0, 22159.0, 8465.0, 3536.0, 1558.0, 800.0, 391.0, 201.0, 133.0, 88.0, 55.0, 29.0, 33.0, 23.0, 14.0, 12.0, 8.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6015625, -12.180419921875, -11.75927734375, -11.338134765625, -10.9169921875, -10.495849609375, -10.07470703125, -9.653564453125, -9.232421875, -8.811279296875, -8.39013671875, -7.968994140625, -7.5478515625, -7.126708984375, -6.70556640625, -6.284423828125, -5.86328125, -5.442138671875, -5.02099609375, -4.599853515625, -4.1787109375, -3.757568359375, -3.33642578125, -2.915283203125, -2.494140625, -2.072998046875, -1.65185546875, -1.230712890625, -0.8095703125, -0.388427734375, 0.03271484375, 0.453857421875, 0.875, 1.296142578125, 1.71728515625, 2.138427734375, 2.5595703125, 2.980712890625, 3.40185546875, 3.822998046875, 4.244140625, 4.665283203125, 5.08642578125, 5.507568359375, 5.9287109375, 6.349853515625, 6.77099609375, 7.192138671875, 7.61328125, 8.034423828125, 8.45556640625, 8.876708984375, 9.2978515625, 9.718994140625, 10.14013671875, 10.561279296875, 10.982421875, 11.403564453125, 11.82470703125, 12.245849609375, 12.6669921875, 13.088134765625, 13.50927734375, 13.930419921875, 14.3515625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 4.0, 7.0, 6.0, 5.0, 6.0, 12.0, 12.0, 15.0, 24.0, 19.0, 21.0, 10.0, 24.0, 25.0, 36.0, 40.0, 43.0, 38.0, 68.0, 114.0, 163.0, 1394.0, 305.0, 131.0, 92.0, 72.0, 42.0, 43.0, 40.0, 30.0, 28.0, 24.0, 23.0, 25.0, 16.0, 15.0, 21.0, 15.0, 10.0, 7.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.734375, -16.15380859375, -15.5732421875, -14.99267578125, -14.412109375, -13.83154296875, -13.2509765625, -12.67041015625, -12.08984375, -11.50927734375, -10.9287109375, -10.34814453125, -9.767578125, -9.18701171875, -8.6064453125, -8.02587890625, -7.4453125, -6.86474609375, -6.2841796875, -5.70361328125, -5.123046875, -4.54248046875, -3.9619140625, -3.38134765625, -2.80078125, -2.22021484375, -1.6396484375, -1.05908203125, -0.478515625, 0.10205078125, 0.6826171875, 1.26318359375, 1.84375, 2.42431640625, 3.0048828125, 3.58544921875, 4.166015625, 4.74658203125, 5.3271484375, 5.90771484375, 6.48828125, 7.06884765625, 7.6494140625, 8.22998046875, 8.810546875, 9.39111328125, 9.9716796875, 10.55224609375, 11.1328125, 11.71337890625, 12.2939453125, 12.87451171875, 13.455078125, 14.03564453125, 14.6162109375, 15.19677734375, 15.77734375, 16.35791015625, 16.9384765625, 17.51904296875, 18.099609375, 18.68017578125, 19.2607421875, 19.84130859375, 20.421875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 7.0, 9.0, 9.0, 9.0, 17.0, 22.0, 23.0, 33.0, 44.0, 56.0, 65.0, 71.0, 95.0, 106.0, 194.0, 289.0, 526.0, 1305.0, 3984.0, 19167.0, 318015.0, 2712328.0, 75462.0, 9286.0, 2436.0, 854.0, 417.0, 203.0, 143.0, 100.0, 87.0, 61.0, 51.0, 48.0, 35.0, 33.0, 17.0, 16.0, 17.0, 14.0, 13.0, 5.0, 5.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-34.21875, -33.19091796875, -32.1630859375, -31.13525390625, -30.107421875, -29.07958984375, -28.0517578125, -27.02392578125, -25.99609375, -24.96826171875, -23.9404296875, -22.91259765625, -21.884765625, -20.85693359375, -19.8291015625, -18.80126953125, -17.7734375, -16.74560546875, -15.7177734375, -14.68994140625, -13.662109375, -12.63427734375, -11.6064453125, -10.57861328125, -9.55078125, -8.52294921875, -7.4951171875, -6.46728515625, -5.439453125, -4.41162109375, -3.3837890625, -2.35595703125, -1.328125, -0.30029296875, 0.7275390625, 1.75537109375, 2.783203125, 3.81103515625, 4.8388671875, 5.86669921875, 6.89453125, 7.92236328125, 8.9501953125, 9.97802734375, 11.005859375, 12.03369140625, 13.0615234375, 14.08935546875, 15.1171875, 16.14501953125, 17.1728515625, 18.20068359375, 19.228515625, 20.25634765625, 21.2841796875, 22.31201171875, 23.33984375, 24.36767578125, 25.3955078125, 26.42333984375, 27.451171875, 28.47900390625, 29.5068359375, 30.53466796875, 31.5625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [74.0, 907.0, 36.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.8857479095459, -7.051213264465332, 7.783321380615234, 22.617856979370117, 37.452392578125, 52.28692626953125, 67.1214599609375, 81.95599365234375, 96.79052734375, 111.62506103515625, 126.4595947265625, 141.29412841796875, 156.128662109375, 170.96319580078125, 185.7977294921875, 200.63226318359375, 215.46681213378906, 230.3013458251953, 245.13587951660156, 259.9704284667969, 274.8049621582031, 289.6394958496094, 304.4740295410156, 319.3085632324219, 334.1430969238281, 348.9776306152344, 363.8121643066406, 378.6466979980469, 393.4812316894531, 408.3157653808594, 423.1502990722656, 437.9848327636719, 452.8193664550781, 467.6539001464844, 482.4884338378906, 497.3229675292969, 512.1575317382812, 526.9920654296875, 541.8265991210938, 556.6611328125, 571.4956665039062, 586.3302001953125, 601.1647338867188, 615.999267578125, 630.8338012695312, 645.6683349609375, 660.5028686523438, 675.33740234375, 690.1719360351562, 705.0064697265625, 719.8410034179688, 734.675537109375, 749.5100708007812, 764.3446044921875, 779.1791381835938, 794.013671875, 808.8482055664062, 823.6827392578125, 838.5172729492188, 853.351806640625, 868.1863403320312, 883.0208740234375, 897.8554077148438, 912.68994140625, 927.5244750976562]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 11.0, 9.0, 16.0, 11.0, 15.0, 15.0, 21.0, 29.0, 19.0, 28.0, 36.0, 26.0, 41.0, 52.0, 35.0, 29.0, 48.0, 31.0, 47.0, 37.0, 46.0, 30.0, 33.0, 27.0, 33.0, 24.0, 27.0, 28.0, 28.0, 22.0, 28.0, 14.0, 15.0, 8.0, 16.0, 7.0, 14.0, 5.0, 3.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 2.0], "bins": [-58.382991790771484, -56.82843780517578, -55.27388381958008, -53.719329833984375, -52.16477584838867, -50.61022186279297, -49.0556640625, -47.50111389160156, -45.946556091308594, -44.39200210571289, -42.83744812011719, -41.282894134521484, -39.72834014892578, -38.17378616333008, -36.619232177734375, -35.064674377441406, -33.51012420654297, -31.955570220947266, -30.401016235351562, -28.84646224975586, -27.291908264160156, -25.737354278564453, -24.182798385620117, -22.628244400024414, -21.07369041442871, -19.519136428833008, -17.964582443237305, -16.41002655029297, -14.855473518371582, -13.300919532775879, -11.74636459350586, -10.191810607910156, -8.637260437011719, -7.082706451416016, -5.528151988983154, -3.973597526550293, -2.41904354095459, -0.8644895553588867, 0.6900653839111328, 2.244619369506836, 3.799173355102539, 5.353727340698242, 6.9082818031311035, 8.462836265563965, 10.017390251159668, 11.571944236755371, 13.12649917602539, 14.681053161621094, 16.235607147216797, 17.7901611328125, 19.344715118408203, 20.899269104003906, 22.45382308959961, 24.008377075195312, 25.56293296813965, 27.11748695373535, 28.672040939331055, 30.226594924926758, 31.78114891052246, 33.3357048034668, 34.8902587890625, 36.4448127746582, 37.999366760253906, 39.55392074584961, 41.10847473144531]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 9.0, 7.0, 11.0, 7.0, 12.0, 18.0, 31.0, 22.0, 32.0, 35.0, 36.0, 39.0, 43.0, 53.0, 46.0, 55.0, 47.0, 49.0, 63.0, 43.0, 31.0, 32.0, 29.0, 26.0, 36.0, 28.0, 22.0, 23.0, 17.0, 14.0, 13.0, 17.0, 12.0, 5.0, 7.0, 5.0, 7.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.8560791015625, -7.602783203125, -7.3494873046875, -7.09619140625, -6.8428955078125, -6.589599609375, -6.3363037109375, -6.0830078125, -5.8297119140625, -5.576416015625, -5.3231201171875, -5.06982421875, -4.8165283203125, -4.563232421875, -4.3099365234375, -4.056640625, -3.8033447265625, -3.550048828125, -3.2967529296875, -3.04345703125, -2.7901611328125, -2.536865234375, -2.2835693359375, -2.0302734375, -1.7769775390625, -1.523681640625, -1.2703857421875, -1.01708984375, -0.7637939453125, -0.510498046875, -0.2572021484375, -0.00390625, 0.2493896484375, 0.502685546875, 0.7559814453125, 1.00927734375, 1.2625732421875, 1.515869140625, 1.7691650390625, 2.0224609375, 2.2757568359375, 2.529052734375, 2.7823486328125, 3.03564453125, 3.2889404296875, 3.542236328125, 3.7955322265625, 4.048828125, 4.3021240234375, 4.555419921875, 4.8087158203125, 5.06201171875, 5.3153076171875, 5.568603515625, 5.8218994140625, 6.0751953125, 6.3284912109375, 6.581787109375, 6.8350830078125, 7.08837890625, 7.3416748046875, 7.594970703125, 7.8482666015625, 8.1015625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 10.0, 17.0, 21.0, 38.0, 56.0, 74.0, 123.0, 180.0, 251.0, 568.0, 1009.0, 2038.0, 4599.0, 11153.0, 32858.0, 135852.0, 768481.0, 2271454.0, 776271.0, 136846.0, 32820.0, 10750.0, 4425.0, 2074.0, 1003.0, 511.0, 313.0, 150.0, 98.0, 65.0, 45.0, 35.0, 14.0, 25.0, 10.0, 7.0, 4.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.984375, -9.634033203125, -9.28369140625, -8.933349609375, -8.5830078125, -8.232666015625, -7.88232421875, -7.531982421875, -7.181640625, -6.831298828125, -6.48095703125, -6.130615234375, -5.7802734375, -5.429931640625, -5.07958984375, -4.729248046875, -4.37890625, -4.028564453125, -3.67822265625, -3.327880859375, -2.9775390625, -2.627197265625, -2.27685546875, -1.926513671875, -1.576171875, -1.225830078125, -0.87548828125, -0.525146484375, -0.1748046875, 0.175537109375, 0.52587890625, 0.876220703125, 1.2265625, 1.576904296875, 1.92724609375, 2.277587890625, 2.6279296875, 2.978271484375, 3.32861328125, 3.678955078125, 4.029296875, 4.379638671875, 4.72998046875, 5.080322265625, 5.4306640625, 5.781005859375, 6.13134765625, 6.481689453125, 6.83203125, 7.182373046875, 7.53271484375, 7.883056640625, 8.2333984375, 8.583740234375, 8.93408203125, 9.284423828125, 9.634765625, 9.985107421875, 10.33544921875, 10.685791015625, 11.0361328125, 11.386474609375, 11.73681640625, 12.087158203125, 12.4375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 2.0, 3.0, 5.0, 5.0, 11.0, 10.0, 19.0, 25.0, 39.0, 56.0, 69.0, 119.0, 190.0, 246.0, 436.0, 598.0, 665.0, 500.0, 342.0, 215.0, 126.0, 102.0, 66.0, 48.0, 44.0, 35.0, 18.0, 14.0, 10.0, 14.0, 11.0, 12.0, 7.0, 5.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3671875, -10.9783935546875, -10.589599609375, -10.2008056640625, -9.81201171875, -9.4232177734375, -9.034423828125, -8.6456298828125, -8.2568359375, -7.8680419921875, -7.479248046875, -7.0904541015625, -6.70166015625, -6.3128662109375, -5.924072265625, -5.5352783203125, -5.146484375, -4.7576904296875, -4.368896484375, -3.9801025390625, -3.59130859375, -3.2025146484375, -2.813720703125, -2.4249267578125, -2.0361328125, -1.6473388671875, -1.258544921875, -0.8697509765625, -0.48095703125, -0.0921630859375, 0.296630859375, 0.6854248046875, 1.07421875, 1.4630126953125, 1.851806640625, 2.2406005859375, 2.62939453125, 3.0181884765625, 3.406982421875, 3.7957763671875, 4.1845703125, 4.5733642578125, 4.962158203125, 5.3509521484375, 5.73974609375, 6.1285400390625, 6.517333984375, 6.9061279296875, 7.294921875, 7.6837158203125, 8.072509765625, 8.4613037109375, 8.85009765625, 9.2388916015625, 9.627685546875, 10.0164794921875, 10.4052734375, 10.7940673828125, 11.182861328125, 11.5716552734375, 11.96044921875, 12.3492431640625, 12.738037109375, 13.1268310546875, 13.515625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 10.0, 2.0, 5.0, 6.0, 13.0, 12.0, 21.0, 21.0, 27.0, 52.0, 52.0, 96.0, 138.0, 217.0, 414.0, 1109.0, 4489.0, 35004.0, 777087.0, 3255101.0, 107310.0, 9902.0, 1826.0, 596.0, 280.0, 174.0, 97.0, 60.0, 41.0, 29.0, 22.0, 19.0, 13.0, 10.0, 11.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.90625, -30.915771484375, -29.92529296875, -28.934814453125, -27.9443359375, -26.953857421875, -25.96337890625, -24.972900390625, -23.982421875, -22.991943359375, -22.00146484375, -21.010986328125, -20.0205078125, -19.030029296875, -18.03955078125, -17.049072265625, -16.05859375, -15.068115234375, -14.07763671875, -13.087158203125, -12.0966796875, -11.106201171875, -10.11572265625, -9.125244140625, -8.134765625, -7.144287109375, -6.15380859375, -5.163330078125, -4.1728515625, -3.182373046875, -2.19189453125, -1.201416015625, -0.2109375, 0.779541015625, 1.77001953125, 2.760498046875, 3.7509765625, 4.741455078125, 5.73193359375, 6.722412109375, 7.712890625, 8.703369140625, 9.69384765625, 10.684326171875, 11.6748046875, 12.665283203125, 13.65576171875, 14.646240234375, 15.63671875, 16.627197265625, 17.61767578125, 18.608154296875, 19.5986328125, 20.589111328125, 21.57958984375, 22.570068359375, 23.560546875, 24.551025390625, 25.54150390625, 26.531982421875, 27.5224609375, 28.512939453125, 29.50341796875, 30.493896484375, 31.484375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 3.0, 6.0, 17.0, 93.0, 296.0, 340.0, 206.0, 41.0, 10.0, 3.0, 2.0, 0.0, 1.0], "bins": [-263.8110046386719, -259.10791015625, -254.40481567382812, -249.70172119140625, -244.99862670898438, -240.2955322265625, -235.59243774414062, -230.8893585205078, -226.18626403808594, -221.48316955566406, -216.7800750732422, -212.0769805908203, -207.37388610839844, -202.67080688476562, -197.96771240234375, -193.26461791992188, -188.5615234375, -183.85842895507812, -179.15533447265625, -174.45223999023438, -169.7491455078125, -165.04605102539062, -160.34295654296875, -155.63987731933594, -150.936767578125, -146.23367309570312, -141.53057861328125, -136.82748413085938, -132.1243896484375, -127.42130279541016, -122.71820831298828, -118.01512145996094, -113.31201934814453, -108.60892486572266, -103.90583038330078, -99.20274353027344, -94.49964904785156, -89.79655456542969, -85.09346008300781, -80.39036560058594, -75.68727111816406, -70.98417663574219, -66.28108215332031, -61.5779914855957, -56.874900817871094, -52.17180633544922, -47.468711853027344, -42.765621185302734, -38.062530517578125, -33.35943603515625, -28.65634536743164, -23.953250885009766, -19.250158309936523, -14.547065734863281, -9.843971252441406, -5.140880584716797, -0.4377861022949219, 4.2653069496154785, 8.968400001525879, 13.671493530273438, 18.37458610534668, 23.077678680419922, 27.780773162841797, 32.483863830566406, 37.18695831298828]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 0.0, 8.0, 10.0, 4.0, 7.0, 16.0, 13.0, 14.0, 22.0, 19.0, 24.0, 22.0, 27.0, 50.0, 35.0, 54.0, 32.0, 45.0, 39.0, 39.0, 44.0, 45.0, 42.0, 44.0, 41.0, 32.0, 43.0, 24.0, 26.0, 48.0, 20.0, 11.0, 19.0, 15.0, 8.0, 12.0, 11.0, 10.0, 5.0, 3.0, 5.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-38.63576889038086, -37.37422180175781, -36.1126708984375, -34.85112380981445, -33.58957290649414, -32.328025817871094, -31.066476821899414, -29.804927825927734, -28.543378829956055, -27.281829833984375, -26.020280838012695, -24.758731842041016, -23.49718475341797, -22.235633850097656, -20.97408676147461, -19.71253776550293, -18.45098876953125, -17.18943977355957, -15.92789077758789, -14.666342735290527, -13.404793739318848, -12.143244743347168, -10.881696701049805, -9.620147705078125, -8.358598709106445, -7.097049713134766, -5.835501194000244, -4.573952674865723, -3.312403678894043, -2.0508546829223633, -0.7893061637878418, 0.4722423553466797, 1.733795166015625, 2.9953439235687256, 4.256892681121826, 5.518441200256348, 6.779990196228027, 8.041539192199707, 9.30308723449707, 10.56463623046875, 11.82618522644043, 13.08773422241211, 14.349283218383789, 15.610831260681152, 16.872379302978516, 18.133930206298828, 19.395477294921875, 20.657026290893555, 21.918575286865234, 23.180124282836914, 24.441673278808594, 25.703222274780273, 26.964771270751953, 28.226318359375, 29.48786735534668, 30.74941635131836, 32.010963439941406, 33.27251052856445, 34.534061431884766, 35.79560852050781, 37.057159423828125, 38.31870651245117, 39.580257415771484, 40.84180450439453, 42.103355407714844]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 8.0, 7.0, 7.0, 13.0, 16.0, 36.0, 19.0, 31.0, 32.0, 30.0, 38.0, 38.0, 43.0, 41.0, 59.0, 40.0, 54.0, 51.0, 47.0, 38.0, 45.0, 39.0, 23.0, 32.0, 36.0, 23.0, 21.0, 24.0, 16.0, 10.0, 23.0, 10.0, 6.0, 11.0, 8.0, 7.0, 8.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.3515625, -7.11932373046875, -6.8870849609375, -6.65484619140625, -6.422607421875, -6.19036865234375, -5.9581298828125, -5.72589111328125, -5.49365234375, -5.26141357421875, -5.0291748046875, -4.79693603515625, -4.564697265625, -4.33245849609375, -4.1002197265625, -3.86798095703125, -3.6357421875, -3.40350341796875, -3.1712646484375, -2.93902587890625, -2.706787109375, -2.47454833984375, -2.2423095703125, -2.01007080078125, -1.77783203125, -1.54559326171875, -1.3133544921875, -1.08111572265625, -0.848876953125, -0.61663818359375, -0.3843994140625, -0.15216064453125, 0.080078125, 0.31231689453125, 0.5445556640625, 0.77679443359375, 1.009033203125, 1.24127197265625, 1.4735107421875, 1.70574951171875, 1.93798828125, 2.17022705078125, 2.4024658203125, 2.63470458984375, 2.866943359375, 3.09918212890625, 3.3314208984375, 3.56365966796875, 3.7958984375, 4.02813720703125, 4.2603759765625, 4.49261474609375, 4.724853515625, 4.95709228515625, 5.1893310546875, 5.42156982421875, 5.65380859375, 5.88604736328125, 6.1182861328125, 6.35052490234375, 6.582763671875, 6.81500244140625, 7.0472412109375, 7.27947998046875, 7.51171875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 6.0, 4.0, 4.0, 18.0, 13.0, 22.0, 25.0, 42.0, 57.0, 76.0, 116.0, 159.0, 249.0, 364.0, 518.0, 829.0, 1247.0, 1915.0, 3117.0, 5001.0, 8380.0, 14643.0, 25976.0, 46594.0, 88028.0, 166750.0, 247800.0, 197498.0, 108161.0, 56694.0, 30936.0, 17233.0, 9994.0, 6043.0, 3642.0, 2290.0, 1372.0, 886.0, 544.0, 402.0, 291.0, 174.0, 136.0, 88.0, 63.0, 47.0, 34.0, 25.0, 14.0, 7.0, 16.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.8759765625, -0.8483047485351562, -0.8206329345703125, -0.7929611206054688, -0.765289306640625, -0.7376174926757812, -0.7099456787109375, -0.6822738647460938, -0.65460205078125, -0.6269302368164062, -0.5992584228515625, -0.5715866088867188, -0.543914794921875, -0.5162429809570312, -0.4885711669921875, -0.46089935302734375, -0.4332275390625, -0.40555572509765625, -0.3778839111328125, -0.35021209716796875, -0.322540283203125, -0.29486846923828125, -0.2671966552734375, -0.23952484130859375, -0.21185302734375, -0.18418121337890625, -0.1565093994140625, -0.12883758544921875, -0.101165771484375, -0.07349395751953125, -0.0458221435546875, -0.01815032958984375, 0.009521484375, 0.03719329833984375, 0.0648651123046875, 0.09253692626953125, 0.120208740234375, 0.14788055419921875, 0.1755523681640625, 0.20322418212890625, 0.23089599609375, 0.25856781005859375, 0.2862396240234375, 0.31391143798828125, 0.341583251953125, 0.36925506591796875, 0.3969268798828125, 0.42459869384765625, 0.4522705078125, 0.47994232177734375, 0.5076141357421875, 0.5352859497070312, 0.562957763671875, 0.5906295776367188, 0.6183013916015625, 0.6459732055664062, 0.67364501953125, 0.7013168334960938, 0.7289886474609375, 0.7566604614257812, 0.784332275390625, 0.8120040893554688, 0.8396759033203125, 0.8673477172851562, 0.89501953125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 8.0, 5.0, 9.0, 10.0, 10.0, 15.0, 16.0, 15.0, 19.0, 21.0, 28.0, 19.0, 31.0, 33.0, 31.0, 33.0, 27.0, 36.0, 27.0, 34.0, 29.0, 1052.0, 32.0, 29.0, 33.0, 33.0, 40.0, 41.0, 36.0, 27.0, 30.0, 29.0, 21.0, 15.0, 21.0, 23.0, 12.0, 16.0, 11.0, 10.0, 11.0, 11.0, 5.0, 7.0, 4.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-3.90625, -3.77978515625, -3.6533203125, -3.52685546875, -3.400390625, -3.27392578125, -3.1474609375, -3.02099609375, -2.89453125, -2.76806640625, -2.6416015625, -2.51513671875, -2.388671875, -2.26220703125, -2.1357421875, -2.00927734375, -1.8828125, -1.75634765625, -1.6298828125, -1.50341796875, -1.376953125, -1.25048828125, -1.1240234375, -0.99755859375, -0.87109375, -0.74462890625, -0.6181640625, -0.49169921875, -0.365234375, -0.23876953125, -0.1123046875, 0.01416015625, 0.140625, 0.26708984375, 0.3935546875, 0.52001953125, 0.646484375, 0.77294921875, 0.8994140625, 1.02587890625, 1.15234375, 1.27880859375, 1.4052734375, 1.53173828125, 1.658203125, 1.78466796875, 1.9111328125, 2.03759765625, 2.1640625, 2.29052734375, 2.4169921875, 2.54345703125, 2.669921875, 2.79638671875, 2.9228515625, 3.04931640625, 3.17578125, 3.30224609375, 3.4287109375, 3.55517578125, 3.681640625, 3.80810546875, 3.9345703125, 4.06103515625, 4.1875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 5.0, 6.0, 17.0, 13.0, 25.0, 42.0, 34.0, 68.0, 96.0, 152.0, 225.0, 422.0, 636.0, 1170.0, 2021.0, 3815.0, 7306.0, 14319.0, 29417.0, 63342.0, 146600.0, 812361.0, 751136.0, 142652.0, 62331.0, 28909.0, 14201.0, 7159.0, 3741.0, 2067.0, 1099.0, 669.0, 368.0, 248.0, 148.0, 104.0, 59.0, 30.0, 36.0, 25.0, 14.0, 7.0, 9.0, 6.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.80517578125, -0.7783279418945312, -0.7514801025390625, -0.7246322631835938, -0.697784423828125, -0.6709365844726562, -0.6440887451171875, -0.6172409057617188, -0.59039306640625, -0.5635452270507812, -0.5366973876953125, -0.5098495483398438, -0.483001708984375, -0.45615386962890625, -0.4293060302734375, -0.40245819091796875, -0.3756103515625, -0.34876251220703125, -0.3219146728515625, -0.29506683349609375, -0.268218994140625, -0.24137115478515625, -0.2145233154296875, -0.18767547607421875, -0.16082763671875, -0.13397979736328125, -0.1071319580078125, -0.08028411865234375, -0.053436279296875, -0.02658843994140625, 0.0002593994140625, 0.02710723876953125, 0.053955078125, 0.08080291748046875, 0.1076507568359375, 0.13449859619140625, 0.161346435546875, 0.18819427490234375, 0.2150421142578125, 0.24188995361328125, 0.26873779296875, 0.29558563232421875, 0.3224334716796875, 0.34928131103515625, 0.376129150390625, 0.40297698974609375, 0.4298248291015625, 0.45667266845703125, 0.4835205078125, 0.5103683471679688, 0.5372161865234375, 0.5640640258789062, 0.590911865234375, 0.6177597045898438, 0.6446075439453125, 0.6714553833007812, 0.69830322265625, 0.7251510620117188, 0.7519989013671875, 0.7788467407226562, 0.805694580078125, 0.8325424194335938, 0.8593902587890625, 0.8862380981445312, 0.9130859375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 9.0, 11.0, 16.0, 22.0, 33.0, 52.0, 71.0, 86.0, 113.0, 111.0, 107.0, 102.0, 86.0, 58.0, 32.0, 22.0, 17.0, 15.0, 5.0, 6.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09271240234375, -0.08898067474365234, -0.08524894714355469, -0.08151721954345703, -0.07778549194335938, -0.07405376434326172, -0.07032203674316406, -0.0665903091430664, -0.06285858154296875, -0.059126853942871094, -0.05539512634277344, -0.05166339874267578, -0.047931671142578125, -0.04419994354248047, -0.04046821594238281, -0.036736488342285156, -0.0330047607421875, -0.029273033142089844, -0.025541305541992188, -0.02180957794189453, -0.018077850341796875, -0.014346122741699219, -0.010614395141601562, -0.006882667541503906, -0.00315093994140625, 0.0005807876586914062, 0.0043125152587890625, 0.008044242858886719, 0.011775970458984375, 0.015507698059082031, 0.019239425659179688, 0.022971153259277344, 0.026702880859375, 0.030434608459472656, 0.03416633605957031, 0.03789806365966797, 0.041629791259765625, 0.04536151885986328, 0.04909324645996094, 0.052824974060058594, 0.05655670166015625, 0.060288429260253906, 0.06402015686035156, 0.06775188446044922, 0.07148361206054688, 0.07521533966064453, 0.07894706726074219, 0.08267879486083984, 0.0864105224609375, 0.09014225006103516, 0.09387397766113281, 0.09760570526123047, 0.10133743286132812, 0.10506916046142578, 0.10880088806152344, 0.1125326156616211, 0.11626434326171875, 0.1199960708618164, 0.12372779846191406, 0.12745952606201172, 0.13119125366210938, 0.13492298126220703, 0.1386547088623047, 0.14238643646240234, 0.1461181640625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 11.0, 21.0, 17.0, 35.0, 59.0, 112.0, 213.0, 567.0, 27262.0, 1018423.0, 1150.0, 301.0, 139.0, 73.0, 43.0, 39.0, 24.0, 11.0, 11.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.361328125, -3.275543212890625, -3.18975830078125, -3.103973388671875, -3.0181884765625, -2.932403564453125, -2.84661865234375, -2.760833740234375, -2.675048828125, -2.589263916015625, -2.50347900390625, -2.417694091796875, -2.3319091796875, -2.246124267578125, -2.16033935546875, -2.074554443359375, -1.98876953125, -1.902984619140625, -1.81719970703125, -1.731414794921875, -1.6456298828125, -1.559844970703125, -1.47406005859375, -1.388275146484375, -1.302490234375, -1.216705322265625, -1.13092041015625, -1.045135498046875, -0.9593505859375, -0.873565673828125, -0.78778076171875, -0.701995849609375, -0.6162109375, -0.530426025390625, -0.44464111328125, -0.358856201171875, -0.2730712890625, -0.187286376953125, -0.10150146484375, -0.015716552734375, 0.070068359375, 0.155853271484375, 0.24163818359375, 0.327423095703125, 0.4132080078125, 0.498992919921875, 0.58477783203125, 0.670562744140625, 0.75634765625, 0.842132568359375, 0.92791748046875, 1.013702392578125, 1.0994873046875, 1.185272216796875, 1.27105712890625, 1.356842041015625, 1.442626953125, 1.528411865234375, 1.61419677734375, 1.699981689453125, 1.7857666015625, 1.871551513671875, 1.95733642578125, 2.043121337890625, 2.12890625]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 356.0, 650.0, 9.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33576706051826477, -0.30245694518089294, -0.2691468298435211, -0.2358366996049881, -0.20252658426761627, -0.16921646893024445, -0.13590633869171143, -0.1025962233543396, -0.06928610801696777, -0.03597598895430565, -0.002665869891643524, 0.0306442528963089, 0.06395436823368073, 0.09726448357105255, 0.13057461380958557, 0.1638847291469574, 0.19719484448432922, 0.23050495982170105, 0.2638150751590729, 0.2971252202987671, 0.3304353356361389, 0.36374545097351074, 0.39705556631088257, 0.4303656816482544, 0.4636757969856262, 0.49698591232299805, 0.5302960276603699, 0.5636061429977417, 0.5969162583351135, 0.6302263736724854, 0.663536548614502, 0.696846604347229, 0.730156660079956, 0.7634667754173279, 0.7967768907546997, 0.8300870060920715, 0.8633971214294434, 0.8967072367668152, 0.930017352104187, 0.9633275270462036, 0.9966375827789307, 1.0299477577209473, 1.0632578134536743, 1.096567988395691, 1.129878044128418, 1.1631882190704346, 1.1964982748031616, 1.2298084497451782, 1.2631185054779053, 1.2964286804199219, 1.329738736152649, 1.3630489110946655, 1.3963589668273926, 1.4296691417694092, 1.4629791975021362, 1.4962893724441528, 1.5295995473861694, 1.562909722328186, 1.596219778060913, 1.6295299530029297, 1.6628400087356567, 1.6961501836776733, 1.7294602394104004, 1.762770414352417, 1.796080470085144]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 4.0, 5.0, 5.0, 10.0, 10.0, 9.0, 11.0, 12.0, 7.0, 18.0, 12.0, 23.0, 22.0, 30.0, 24.0, 33.0, 26.0, 29.0, 44.0, 45.0, 47.0, 40.0, 31.0, 47.0, 37.0, 36.0, 35.0, 33.0, 38.0, 27.0, 30.0, 33.0, 34.0, 16.0, 14.0, 14.0, 19.0, 18.0, 14.0, 9.0, 9.0, 8.0, 3.0, 4.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.1301332712173462, -0.1260582059621811, -0.12198314070701599, -0.11790807545185089, -0.11383301019668579, -0.10975794494152069, -0.105682872235775, -0.1016078069806099, -0.0975327417254448, -0.0934576764702797, -0.0893826112151146, -0.0853075459599495, -0.0812324732542038, -0.0771574079990387, -0.0730823427438736, -0.0690072774887085, -0.0649322122335434, -0.060857146978378296, -0.056782081723213196, -0.0527070127427578, -0.0486319474875927, -0.0445568822324276, -0.0404818132519722, -0.0364067479968071, -0.032331682741642, -0.028256617486476898, -0.02418155036866665, -0.0201064832508564, -0.0160314179956913, -0.0119563527405262, -0.00788128562271595, -0.0038062185049057007, 0.0002688467502593994, 0.004343912936747074, 0.008418979123234749, 0.012494045309722424, 0.0165691114962101, 0.0206441767513752, 0.024719243869185448, 0.028794310986995697, 0.0328693762421608, 0.0369444414973259, 0.041019506752491, 0.045094575732946396, 0.049169640988111496, 0.053244706243276596, 0.057319775223731995, 0.061394840478897095, 0.0654699057340622, 0.0695449709892273, 0.0736200362443924, 0.0776951014995575, 0.0817701667547226, 0.0858452320098877, 0.08992030471563339, 0.09399536997079849, 0.09807043522596359, 0.10214550048112869, 0.10622056573629379, 0.11029563099145889, 0.11437070369720459, 0.11844576895236969, 0.12252083420753479, 0.1265958994626999, 0.130670964717865]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 7.0, 2.0, 8.0, 14.0, 11.0, 18.0, 18.0, 24.0, 28.0, 18.0, 39.0, 32.0, 31.0, 35.0, 47.0, 34.0, 47.0, 49.0, 48.0, 52.0, 50.0, 41.0, 39.0, 39.0, 31.0, 27.0, 28.0, 30.0, 22.0, 21.0, 19.0, 23.0, 15.0, 13.0, 8.0, 7.0, 8.0, 10.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.59375, -7.36346435546875, -7.1331787109375, -6.90289306640625, -6.672607421875, -6.44232177734375, -6.2120361328125, -5.98175048828125, -5.75146484375, -5.52117919921875, -5.2908935546875, -5.06060791015625, -4.830322265625, -4.60003662109375, -4.3697509765625, -4.13946533203125, -3.9091796875, -3.67889404296875, -3.4486083984375, -3.21832275390625, -2.988037109375, -2.75775146484375, -2.5274658203125, -2.29718017578125, -2.06689453125, -1.83660888671875, -1.6063232421875, -1.37603759765625, -1.145751953125, -0.91546630859375, -0.6851806640625, -0.45489501953125, -0.224609375, 0.00567626953125, 0.2359619140625, 0.46624755859375, 0.696533203125, 0.92681884765625, 1.1571044921875, 1.38739013671875, 1.61767578125, 1.84796142578125, 2.0782470703125, 2.30853271484375, 2.538818359375, 2.76910400390625, 2.9993896484375, 3.22967529296875, 3.4599609375, 3.69024658203125, 3.9205322265625, 4.15081787109375, 4.381103515625, 4.61138916015625, 4.8416748046875, 5.07196044921875, 5.30224609375, 5.53253173828125, 5.7628173828125, 5.99310302734375, 6.223388671875, 6.45367431640625, 6.6839599609375, 6.91424560546875, 7.14453125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 11.0, 20.0, 17.0, 21.0, 28.0, 24.0, 45.0, 59.0, 81.0, 144.0, 224.0, 417.0, 1076.0, 2563.0, 7050.0, 21908.0, 91044.0, 599106.0, 259048.0, 45224.0, 12830.0, 4434.0, 1649.0, 676.0, 288.0, 182.0, 97.0, 78.0, 40.0, 45.0, 28.0, 25.0, 14.0, 12.0, 13.0, 12.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.9375, -17.39013671875, -16.8427734375, -16.29541015625, -15.748046875, -15.20068359375, -14.6533203125, -14.10595703125, -13.55859375, -13.01123046875, -12.4638671875, -11.91650390625, -11.369140625, -10.82177734375, -10.2744140625, -9.72705078125, -9.1796875, -8.63232421875, -8.0849609375, -7.53759765625, -6.990234375, -6.44287109375, -5.8955078125, -5.34814453125, -4.80078125, -4.25341796875, -3.7060546875, -3.15869140625, -2.611328125, -2.06396484375, -1.5166015625, -0.96923828125, -0.421875, 0.12548828125, 0.6728515625, 1.22021484375, 1.767578125, 2.31494140625, 2.8623046875, 3.40966796875, 3.95703125, 4.50439453125, 5.0517578125, 5.59912109375, 6.146484375, 6.69384765625, 7.2412109375, 7.78857421875, 8.3359375, 8.88330078125, 9.4306640625, 9.97802734375, 10.525390625, 11.07275390625, 11.6201171875, 12.16748046875, 12.71484375, 13.26220703125, 13.8095703125, 14.35693359375, 14.904296875, 15.45166015625, 15.9990234375, 16.54638671875, 17.09375]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 4.0, 1.0, 6.0, 14.0, 9.0, 7.0, 15.0, 17.0, 19.0, 21.0, 22.0, 29.0, 35.0, 46.0, 47.0, 67.0, 74.0, 161.0, 375.0, 1397.0, 176.0, 90.0, 65.0, 51.0, 48.0, 35.0, 40.0, 35.0, 26.0, 15.0, 17.0, 13.0, 12.0, 18.0, 7.0, 9.0, 3.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.625, -16.99658203125, -16.3681640625, -15.73974609375, -15.111328125, -14.48291015625, -13.8544921875, -13.22607421875, -12.59765625, -11.96923828125, -11.3408203125, -10.71240234375, -10.083984375, -9.45556640625, -8.8271484375, -8.19873046875, -7.5703125, -6.94189453125, -6.3134765625, -5.68505859375, -5.056640625, -4.42822265625, -3.7998046875, -3.17138671875, -2.54296875, -1.91455078125, -1.2861328125, -0.65771484375, -0.029296875, 0.59912109375, 1.2275390625, 1.85595703125, 2.484375, 3.11279296875, 3.7412109375, 4.36962890625, 4.998046875, 5.62646484375, 6.2548828125, 6.88330078125, 7.51171875, 8.14013671875, 8.7685546875, 9.39697265625, 10.025390625, 10.65380859375, 11.2822265625, 11.91064453125, 12.5390625, 13.16748046875, 13.7958984375, 14.42431640625, 15.052734375, 15.68115234375, 16.3095703125, 16.93798828125, 17.56640625, 18.19482421875, 18.8232421875, 19.45166015625, 20.080078125, 20.70849609375, 21.3369140625, 21.96533203125, 22.59375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 9.0, 8.0, 21.0, 18.0, 19.0, 39.0, 44.0, 61.0, 93.0, 143.0, 187.0, 333.0, 696.0, 2631.0, 21324.0, 1657371.0, 1438494.0, 19989.0, 2555.0, 689.0, 308.0, 212.0, 128.0, 70.0, 65.0, 44.0, 36.0, 33.0, 18.0, 20.0, 10.0, 8.0, 3.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-42.8125, -41.5888671875, -40.365234375, -39.1416015625, -37.91796875, -36.6943359375, -35.470703125, -34.2470703125, -33.0234375, -31.7998046875, -30.576171875, -29.3525390625, -28.12890625, -26.9052734375, -25.681640625, -24.4580078125, -23.234375, -22.0107421875, -20.787109375, -19.5634765625, -18.33984375, -17.1162109375, -15.892578125, -14.6689453125, -13.4453125, -12.2216796875, -10.998046875, -9.7744140625, -8.55078125, -7.3271484375, -6.103515625, -4.8798828125, -3.65625, -2.4326171875, -1.208984375, 0.0146484375, 1.23828125, 2.4619140625, 3.685546875, 4.9091796875, 6.1328125, 7.3564453125, 8.580078125, 9.8037109375, 11.02734375, 12.2509765625, 13.474609375, 14.6982421875, 15.921875, 17.1455078125, 18.369140625, 19.5927734375, 20.81640625, 22.0400390625, 23.263671875, 24.4873046875, 25.7109375, 26.9345703125, 28.158203125, 29.3818359375, 30.60546875, 31.8291015625, 33.052734375, 34.2763671875, 35.5]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 23.0, 83.0, 197.0, 293.0, 253.0, 117.0, 28.0, 10.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.49787139892578, -62.845359802246094, -60.192848205566406, -57.54033660888672, -54.88782501220703, -52.235313415527344, -49.58280563354492, -46.930294036865234, -44.27778244018555, -41.62527084350586, -38.97275924682617, -36.320247650146484, -33.66773986816406, -31.015226364135742, -28.362716674804688, -25.710205078125, -23.057693481445312, -20.405181884765625, -17.752670288085938, -15.100160598754883, -12.447649002075195, -9.795137405395508, -7.142626762390137, -4.490116119384766, -1.8376045227050781, 0.8149065971374512, 3.4674177169799805, 6.11992883682251, 8.772439956665039, 11.424951553344727, 14.077462196350098, 16.72997283935547, 19.382476806640625, 22.034988403320312, 24.6875, 27.340009689331055, 29.992521286010742, 32.64503479003906, 35.297542572021484, 37.95005416870117, 40.60256576538086, 43.25507736206055, 45.907588958740234, 48.56010055541992, 51.212608337402344, 53.86511993408203, 56.51763153076172, 59.170143127441406, 61.822654724121094, 64.47516632080078, 67.12767791748047, 69.78018951416016, 72.43270111083984, 75.08521270751953, 77.73772430419922, 80.39022827148438, 83.04273986816406, 85.69525146484375, 88.34776306152344, 91.00027465820312, 93.65278625488281, 96.3052978515625, 98.95780944824219, 101.61032104492188, 104.26283264160156]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 7.0, 13.0, 17.0, 5.0, 16.0, 24.0, 15.0, 18.0, 23.0, 16.0, 33.0, 29.0, 32.0, 37.0, 34.0, 38.0, 32.0, 42.0, 50.0, 37.0, 33.0, 33.0, 34.0, 41.0, 35.0, 37.0, 35.0, 31.0, 27.0, 23.0, 17.0, 12.0, 23.0, 19.0, 15.0, 13.0, 8.0, 5.0, 7.0, 5.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-48.97601318359375, -47.54582977294922, -46.11564254760742, -44.685455322265625, -43.255271911621094, -41.82508850097656, -40.394901275634766, -38.96471405029297, -37.53453063964844, -36.104347229003906, -34.67416000366211, -33.24397277832031, -31.81378936767578, -30.383604049682617, -28.953418731689453, -27.52323341369629, -26.093048095703125, -24.66286277770996, -23.232677459716797, -21.802492141723633, -20.37230682373047, -18.942121505737305, -17.51193618774414, -16.081750869750977, -14.651565551757812, -13.221380233764648, -11.791194915771484, -10.36100959777832, -8.930824279785156, -7.500638961791992, -6.070453643798828, -4.640268325805664, -3.2100868225097656, -1.7799015045166016, -0.3497161865234375, 1.0804691314697266, 2.5106544494628906, 3.9408397674560547, 5.371025085449219, 6.801210403442383, 8.231395721435547, 9.661581039428711, 11.091766357421875, 12.521951675415039, 13.952136993408203, 15.382322311401367, 16.81250762939453, 18.242692947387695, 19.67287826538086, 21.103063583374023, 22.533248901367188, 23.96343421936035, 25.393619537353516, 26.82380485534668, 28.253990173339844, 29.684175491333008, 31.114360809326172, 32.54454803466797, 33.9747314453125, 35.40491485595703, 36.83510208129883, 38.265289306640625, 39.695472717285156, 41.12565612792969, 42.555843353271484]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 6.0, 5.0, 5.0, 10.0, 3.0, 12.0, 22.0, 20.0, 21.0, 18.0, 27.0, 46.0, 40.0, 33.0, 42.0, 44.0, 45.0, 48.0, 53.0, 63.0, 48.0, 41.0, 40.0, 31.0, 40.0, 23.0, 32.0, 19.0, 18.0, 24.0, 20.0, 24.0, 21.0, 10.0, 14.0, 9.0, 9.0, 6.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.99609375, -7.757568359375, -7.51904296875, -7.280517578125, -7.0419921875, -6.803466796875, -6.56494140625, -6.326416015625, -6.087890625, -5.849365234375, -5.61083984375, -5.372314453125, -5.1337890625, -4.895263671875, -4.65673828125, -4.418212890625, -4.1796875, -3.941162109375, -3.70263671875, -3.464111328125, -3.2255859375, -2.987060546875, -2.74853515625, -2.510009765625, -2.271484375, -2.032958984375, -1.79443359375, -1.555908203125, -1.3173828125, -1.078857421875, -0.84033203125, -0.601806640625, -0.36328125, -0.124755859375, 0.11376953125, 0.352294921875, 0.5908203125, 0.829345703125, 1.06787109375, 1.306396484375, 1.544921875, 1.783447265625, 2.02197265625, 2.260498046875, 2.4990234375, 2.737548828125, 2.97607421875, 3.214599609375, 3.453125, 3.691650390625, 3.93017578125, 4.168701171875, 4.4072265625, 4.645751953125, 4.88427734375, 5.122802734375, 5.361328125, 5.599853515625, 5.83837890625, 6.076904296875, 6.3154296875, 6.553955078125, 6.79248046875, 7.031005859375, 7.26953125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 4.0, 7.0, 6.0, 15.0, 11.0, 12.0, 24.0, 35.0, 37.0, 74.0, 98.0, 121.0, 168.0, 256.0, 336.0, 479.0, 646.0, 1098.0, 1810.0, 2930.0, 5379.0, 10305.0, 21151.0, 49381.0, 140924.0, 478548.0, 1436646.0, 1391509.0, 436403.0, 127613.0, 45735.0, 19726.0, 9571.0, 5089.0, 2980.0, 1677.0, 1091.0, 729.0, 462.0, 313.0, 261.0, 172.0, 129.0, 82.0, 74.0, 42.0, 41.0, 30.0, 18.0, 16.0, 10.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.44921875, -7.20062255859375, -6.9520263671875, -6.70343017578125, -6.454833984375, -6.20623779296875, -5.9576416015625, -5.70904541015625, -5.46044921875, -5.21185302734375, -4.9632568359375, -4.71466064453125, -4.466064453125, -4.21746826171875, -3.9688720703125, -3.72027587890625, -3.4716796875, -3.22308349609375, -2.9744873046875, -2.72589111328125, -2.477294921875, -2.22869873046875, -1.9801025390625, -1.73150634765625, -1.48291015625, -1.23431396484375, -0.9857177734375, -0.73712158203125, -0.488525390625, -0.23992919921875, 0.0086669921875, 0.25726318359375, 0.505859375, 0.75445556640625, 1.0030517578125, 1.25164794921875, 1.500244140625, 1.74884033203125, 1.9974365234375, 2.24603271484375, 2.49462890625, 2.74322509765625, 2.9918212890625, 3.24041748046875, 3.489013671875, 3.73760986328125, 3.9862060546875, 4.23480224609375, 4.4833984375, 4.73199462890625, 4.9805908203125, 5.22918701171875, 5.477783203125, 5.72637939453125, 5.9749755859375, 6.22357177734375, 6.47216796875, 6.72076416015625, 6.9693603515625, 7.21795654296875, 7.466552734375, 7.71514892578125, 7.9637451171875, 8.21234130859375, 8.4609375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 4.0, 7.0, 12.0, 25.0, 36.0, 51.0, 68.0, 104.0, 153.0, 215.0, 403.0, 620.0, 759.0, 575.0, 370.0, 254.0, 108.0, 83.0, 53.0, 50.0, 38.0, 22.0, 18.0, 9.0, 8.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.359375, -11.9251708984375, -11.490966796875, -11.0567626953125, -10.62255859375, -10.1883544921875, -9.754150390625, -9.3199462890625, -8.8857421875, -8.4515380859375, -8.017333984375, -7.5831298828125, -7.14892578125, -6.7147216796875, -6.280517578125, -5.8463134765625, -5.412109375, -4.9779052734375, -4.543701171875, -4.1094970703125, -3.67529296875, -3.2410888671875, -2.806884765625, -2.3726806640625, -1.9384765625, -1.5042724609375, -1.070068359375, -0.6358642578125, -0.20166015625, 0.2325439453125, 0.666748046875, 1.1009521484375, 1.53515625, 1.9693603515625, 2.403564453125, 2.8377685546875, 3.27197265625, 3.7061767578125, 4.140380859375, 4.5745849609375, 5.0087890625, 5.4429931640625, 5.877197265625, 6.3114013671875, 6.74560546875, 7.1798095703125, 7.614013671875, 8.0482177734375, 8.482421875, 8.9166259765625, 9.350830078125, 9.7850341796875, 10.21923828125, 10.6534423828125, 11.087646484375, 11.5218505859375, 11.9560546875, 12.3902587890625, 12.824462890625, 13.2586669921875, 13.69287109375, 14.1270751953125, 14.561279296875, 14.9954833984375, 15.4296875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 6.0, 7.0, 9.0, 13.0, 22.0, 39.0, 44.0, 78.0, 123.0, 198.0, 327.0, 958.0, 5144.0, 86209.0, 3633018.0, 450272.0, 14832.0, 1754.0, 545.0, 253.0, 151.0, 89.0, 66.0, 42.0, 19.0, 16.0, 16.0, 12.0, 5.0, 9.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.875, -39.66259765625, -38.4501953125, -37.23779296875, -36.025390625, -34.81298828125, -33.6005859375, -32.38818359375, -31.17578125, -29.96337890625, -28.7509765625, -27.53857421875, -26.326171875, -25.11376953125, -23.9013671875, -22.68896484375, -21.4765625, -20.26416015625, -19.0517578125, -17.83935546875, -16.626953125, -15.41455078125, -14.2021484375, -12.98974609375, -11.77734375, -10.56494140625, -9.3525390625, -8.14013671875, -6.927734375, -5.71533203125, -4.5029296875, -3.29052734375, -2.078125, -0.86572265625, 0.3466796875, 1.55908203125, 2.771484375, 3.98388671875, 5.1962890625, 6.40869140625, 7.62109375, 8.83349609375, 10.0458984375, 11.25830078125, 12.470703125, 13.68310546875, 14.8955078125, 16.10791015625, 17.3203125, 18.53271484375, 19.7451171875, 20.95751953125, 22.169921875, 23.38232421875, 24.5947265625, 25.80712890625, 27.01953125, 28.23193359375, 29.4443359375, 30.65673828125, 31.869140625, 33.08154296875, 34.2939453125, 35.50634765625, 36.71875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 315.0, 658.0, 35.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.85899353027344, -182.59104919433594, -171.3231201171875, -160.05517578125, -148.7872314453125, -137.519287109375, -126.25135040283203, -114.98341369628906, -103.71546936035156, -92.44752502441406, -81.1795883178711, -69.91165161132812, -58.643707275390625, -47.37576675415039, -36.107826232910156, -24.839889526367188, -13.571945190429688, -2.304004669189453, 8.963935852050781, 20.231876373291016, 31.49981689453125, 42.767757415771484, 54.03569793701172, 65.30363464355469, 76.57157897949219, 87.83952331542969, 99.10746002197266, 110.37539672851562, 121.64334106445312, 132.91128540039062, 144.17922973632812, 155.44715881347656, 166.715087890625, 177.9830322265625, 189.2509765625, 200.51890563964844, 211.78684997558594, 223.05479431152344, 234.32272338867188, 245.59066772460938, 256.8586120605469, 268.1265563964844, 279.3945007324219, 290.6624450683594, 301.93035888671875, 313.19830322265625, 324.46624755859375, 335.73419189453125, 347.00213623046875, 358.27008056640625, 369.53802490234375, 380.80596923828125, 392.07391357421875, 403.3418273925781, 414.6097717285156, 425.8777160644531, 437.1456604003906, 448.4136047363281, 459.6815490722656, 470.9494934082031, 482.2174072265625, 493.4853515625, 504.7532958984375, 516.021240234375, 527.2891845703125]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 8.0, 3.0, 8.0, 16.0, 7.0, 12.0, 13.0, 14.0, 17.0, 16.0, 29.0, 24.0, 25.0, 40.0, 40.0, 41.0, 42.0, 41.0, 47.0, 42.0, 42.0, 52.0, 45.0, 45.0, 36.0, 35.0, 28.0, 28.0, 27.0, 27.0, 23.0, 20.0, 20.0, 18.0, 13.0, 12.0, 8.0, 9.0, 3.0, 11.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.55177307128906, -33.365909576416016, -32.18004608154297, -30.99418067932129, -29.808317184448242, -28.622453689575195, -27.436588287353516, -26.25072479248047, -25.064861297607422, -23.878997802734375, -22.693134307861328, -21.50726890563965, -20.3214054107666, -19.135541915893555, -17.949676513671875, -16.763813018798828, -15.577949523925781, -14.392086029052734, -13.206221580505371, -12.020357131958008, -10.834493637084961, -9.648630142211914, -8.46276569366455, -7.2769012451171875, -6.091037750244141, -4.9051737785339355, -3.7193098068237305, -2.5334458351135254, -1.3475818634033203, -0.16171789169311523, 1.0241460800170898, 2.210010528564453, 3.3958702087402344, 4.5817341804504395, 5.7675981521606445, 6.95346212387085, 8.139326095581055, 9.325189590454102, 10.511054039001465, 11.696918487548828, 12.882781982421875, 14.068645477294922, 15.254509925842285, 16.44037437438965, 17.626237869262695, 18.812101364135742, 19.997966766357422, 21.18383026123047, 22.369693756103516, 23.555557250976562, 24.74142074584961, 25.92728614807129, 27.113149642944336, 28.299013137817383, 29.484878540039062, 30.67074203491211, 31.856605529785156, 33.0424690246582, 34.22833251953125, 35.4141960144043, 36.600059509277344, 37.785926818847656, 38.9717903137207, 40.15765380859375, 41.3435173034668]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 10.0, 11.0, 12.0, 10.0, 17.0, 16.0, 19.0, 19.0, 29.0, 24.0, 23.0, 34.0, 37.0, 37.0, 42.0, 35.0, 39.0, 55.0, 54.0, 38.0, 40.0, 35.0, 34.0, 31.0, 39.0, 23.0, 27.0, 12.0, 27.0, 26.0, 18.0, 14.0, 26.0, 16.0, 13.0, 7.0, 5.0, 7.0, 8.0, 7.0, 6.0, 2.0, 5.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.98046875, -5.77423095703125, -5.5679931640625, -5.36175537109375, -5.155517578125, -4.94927978515625, -4.7430419921875, -4.53680419921875, -4.33056640625, -4.12432861328125, -3.9180908203125, -3.71185302734375, -3.505615234375, -3.29937744140625, -3.0931396484375, -2.88690185546875, -2.6806640625, -2.47442626953125, -2.2681884765625, -2.06195068359375, -1.855712890625, -1.64947509765625, -1.4432373046875, -1.23699951171875, -1.03076171875, -0.82452392578125, -0.6182861328125, -0.41204833984375, -0.205810546875, 0.00042724609375, 0.2066650390625, 0.41290283203125, 0.619140625, 0.82537841796875, 1.0316162109375, 1.23785400390625, 1.444091796875, 1.65032958984375, 1.8565673828125, 2.06280517578125, 2.26904296875, 2.47528076171875, 2.6815185546875, 2.88775634765625, 3.093994140625, 3.30023193359375, 3.5064697265625, 3.71270751953125, 3.9189453125, 4.12518310546875, 4.3314208984375, 4.53765869140625, 4.743896484375, 4.95013427734375, 5.1563720703125, 5.36260986328125, 5.56884765625, 5.77508544921875, 5.9813232421875, 6.18756103515625, 6.393798828125, 6.60003662109375, 6.8062744140625, 7.01251220703125, 7.21875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 14.0, 4.0, 19.0, 28.0, 43.0, 60.0, 118.0, 172.0, 300.0, 536.0, 911.0, 1617.0, 2986.0, 5551.0, 10338.0, 20102.0, 41272.0, 87961.0, 187388.0, 295414.0, 204389.0, 96891.0, 45292.0, 22458.0, 11243.0, 6051.0, 3251.0, 1718.0, 991.0, 572.0, 336.0, 200.0, 124.0, 59.0, 49.0, 34.0, 21.0, 17.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.1209030151367188, -1.0875091552734375, -1.0541152954101562, -1.020721435546875, -0.9873275756835938, -0.9539337158203125, -0.9205398559570312, -0.88714599609375, -0.8537521362304688, -0.8203582763671875, -0.7869644165039062, -0.753570556640625, -0.7201766967773438, -0.6867828369140625, -0.6533889770507812, -0.6199951171875, -0.5866012573242188, -0.5532073974609375, -0.5198135375976562, -0.486419677734375, -0.45302581787109375, -0.4196319580078125, -0.38623809814453125, -0.35284423828125, -0.31945037841796875, -0.2860565185546875, -0.25266265869140625, -0.219268798828125, -0.18587493896484375, -0.1524810791015625, -0.11908721923828125, -0.085693359375, -0.05229949951171875, -0.0189056396484375, 0.01448822021484375, 0.047882080078125, 0.08127593994140625, 0.1146697998046875, 0.14806365966796875, 0.18145751953125, 0.21485137939453125, 0.2482452392578125, 0.28163909912109375, 0.315032958984375, 0.34842681884765625, 0.3818206787109375, 0.41521453857421875, 0.4486083984375, 0.48200225830078125, 0.5153961181640625, 0.5487899780273438, 0.582183837890625, 0.6155776977539062, 0.6489715576171875, 0.6823654174804688, 0.71575927734375, 0.7491531372070312, 0.7825469970703125, 0.8159408569335938, 0.849334716796875, 0.8827285766601562, 0.9161224365234375, 0.9495162963867188, 0.98291015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 9.0, 8.0, 9.0, 7.0, 14.0, 9.0, 14.0, 22.0, 22.0, 27.0, 22.0, 28.0, 26.0, 27.0, 40.0, 29.0, 31.0, 43.0, 44.0, 50.0, 1065.0, 41.0, 40.0, 30.0, 39.0, 40.0, 25.0, 28.0, 30.0, 21.0, 35.0, 23.0, 17.0, 21.0, 17.0, 19.0, 9.0, 9.0, 9.0, 9.0, 6.0, 4.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0], "bins": [-4.9609375, -4.823089599609375, -4.68524169921875, -4.547393798828125, -4.4095458984375, -4.271697998046875, -4.13385009765625, -3.996002197265625, -3.858154296875, -3.720306396484375, -3.58245849609375, -3.444610595703125, -3.3067626953125, -3.168914794921875, -3.03106689453125, -2.893218994140625, -2.75537109375, -2.617523193359375, -2.47967529296875, -2.341827392578125, -2.2039794921875, -2.066131591796875, -1.92828369140625, -1.790435791015625, -1.652587890625, -1.514739990234375, -1.37689208984375, -1.239044189453125, -1.1011962890625, -0.963348388671875, -0.82550048828125, -0.687652587890625, -0.5498046875, -0.411956787109375, -0.27410888671875, -0.136260986328125, 0.0015869140625, 0.139434814453125, 0.27728271484375, 0.415130615234375, 0.552978515625, 0.690826416015625, 0.82867431640625, 0.966522216796875, 1.1043701171875, 1.242218017578125, 1.38006591796875, 1.517913818359375, 1.65576171875, 1.793609619140625, 1.93145751953125, 2.069305419921875, 2.2071533203125, 2.345001220703125, 2.48284912109375, 2.620697021484375, 2.758544921875, 2.896392822265625, 3.03424072265625, 3.172088623046875, 3.3099365234375, 3.447784423828125, 3.58563232421875, 3.723480224609375, 3.861328125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 12.0, 15.0, 24.0, 32.0, 30.0, 93.0, 136.0, 218.0, 454.0, 784.0, 1573.0, 3028.0, 6554.0, 14485.0, 33061.0, 80333.0, 212915.0, 1369636.0, 226317.0, 83673.0, 34924.0, 14999.0, 7106.0, 3264.0, 1534.0, 831.0, 462.0, 238.0, 146.0, 81.0, 53.0, 32.0, 26.0, 15.0, 7.0, 6.0, 3.0, 3.0, 3.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.099609375, -1.0686569213867188, -1.0377044677734375, -1.0067520141601562, -0.975799560546875, -0.9448471069335938, -0.9138946533203125, -0.8829421997070312, -0.85198974609375, -0.8210372924804688, -0.7900848388671875, -0.7591323852539062, -0.728179931640625, -0.6972274780273438, -0.6662750244140625, -0.6353225708007812, -0.6043701171875, -0.5734176635742188, -0.5424652099609375, -0.5115127563476562, -0.480560302734375, -0.44960784912109375, -0.4186553955078125, -0.38770294189453125, -0.35675048828125, -0.32579803466796875, -0.2948455810546875, -0.26389312744140625, -0.232940673828125, -0.20198822021484375, -0.1710357666015625, -0.14008331298828125, -0.109130859375, -0.07817840576171875, -0.0472259521484375, -0.01627349853515625, 0.014678955078125, 0.04563140869140625, 0.0765838623046875, 0.10753631591796875, 0.13848876953125, 0.16944122314453125, 0.2003936767578125, 0.23134613037109375, 0.262298583984375, 0.29325103759765625, 0.3242034912109375, 0.35515594482421875, 0.3861083984375, 0.41706085205078125, 0.4480133056640625, 0.47896575927734375, 0.509918212890625, 0.5408706665039062, 0.5718231201171875, 0.6027755737304688, 0.63372802734375, 0.6646804809570312, 0.6956329345703125, 0.7265853881835938, 0.757537841796875, 0.7884902954101562, 0.8194427490234375, 0.8503952026367188, 0.88134765625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 2.0, 1.0, 1.0, 9.0, 7.0, 22.0, 12.0, 15.0, 19.0, 21.0, 33.0, 27.0, 52.0, 48.0, 48.0, 53.0, 54.0, 47.0, 44.0, 43.0, 49.0, 53.0, 47.0, 39.0, 33.0, 39.0, 33.0, 31.0, 23.0, 18.0, 16.0, 5.0, 5.0, 12.0, 6.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.043121337890625, -0.04175996780395508, -0.040398597717285156, -0.039037227630615234, -0.03767585754394531, -0.03631448745727539, -0.03495311737060547, -0.03359174728393555, -0.032230377197265625, -0.030869007110595703, -0.02950763702392578, -0.02814626693725586, -0.026784896850585938, -0.025423526763916016, -0.024062156677246094, -0.022700786590576172, -0.02133941650390625, -0.019978046417236328, -0.018616676330566406, -0.017255306243896484, -0.015893936157226562, -0.01453256607055664, -0.013171195983886719, -0.011809825897216797, -0.010448455810546875, -0.009087085723876953, -0.007725715637207031, -0.006364345550537109, -0.0050029754638671875, -0.0036416053771972656, -0.0022802352905273438, -0.0009188652038574219, 0.0004425048828125, 0.0018038749694824219, 0.0031652450561523438, 0.004526615142822266, 0.0058879852294921875, 0.007249355316162109, 0.008610725402832031, 0.009972095489501953, 0.011333465576171875, 0.012694835662841797, 0.014056205749511719, 0.01541757583618164, 0.016778945922851562, 0.018140316009521484, 0.019501686096191406, 0.020863056182861328, 0.02222442626953125, 0.023585796356201172, 0.024947166442871094, 0.026308536529541016, 0.027669906616210938, 0.02903127670288086, 0.03039264678955078, 0.0317540168762207, 0.033115386962890625, 0.03447675704956055, 0.03583812713623047, 0.03719949722290039, 0.03856086730957031, 0.039922237396240234, 0.041283607482910156, 0.04264497756958008, 0.04400634765625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 2.0, 5.0, 0.0, 5.0, 4.0, 7.0, 11.0, 13.0, 14.0, 29.0, 43.0, 56.0, 68.0, 78.0, 126.0, 254.0, 555.0, 7327.0, 1034770.0, 3984.0, 496.0, 223.0, 140.0, 94.0, 53.0, 46.0, 44.0, 28.0, 18.0, 14.0, 10.0, 5.0, 5.0, 3.0, 3.0, 5.0, 3.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.224609375, -1.1856689453125, -1.146728515625, -1.1077880859375, -1.06884765625, -1.0299072265625, -0.990966796875, -0.9520263671875, -0.9130859375, -0.8741455078125, -0.835205078125, -0.7962646484375, -0.75732421875, -0.7183837890625, -0.679443359375, -0.6405029296875, -0.6015625, -0.5626220703125, -0.523681640625, -0.4847412109375, -0.44580078125, -0.4068603515625, -0.367919921875, -0.3289794921875, -0.2900390625, -0.2510986328125, -0.212158203125, -0.1732177734375, -0.13427734375, -0.0953369140625, -0.056396484375, -0.0174560546875, 0.021484375, 0.0604248046875, 0.099365234375, 0.1383056640625, 0.17724609375, 0.2161865234375, 0.255126953125, 0.2940673828125, 0.3330078125, 0.3719482421875, 0.410888671875, 0.4498291015625, 0.48876953125, 0.5277099609375, 0.566650390625, 0.6055908203125, 0.64453125, 0.6834716796875, 0.722412109375, 0.7613525390625, 0.80029296875, 0.8392333984375, 0.878173828125, 0.9171142578125, 0.9560546875, 0.9949951171875, 1.033935546875, 1.0728759765625, 1.11181640625, 1.1507568359375, 1.189697265625, 1.2286376953125, 1.267578125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 52.0, 791.0, 164.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10948170721530914, -0.08996988087892532, -0.0704580545425415, -0.050946228206157684, -0.031434401869773865, -0.011922575533390045, 0.007589250802993774, 0.02710108458995819, 0.046612903475761414, 0.06612472981214523, 0.08563655614852905, 0.10514838248491287, 0.12466020882129669, 0.1441720426082611, 0.16368386149406433, 0.18319569528102875, 0.20270751416683197, 0.2222193479537964, 0.2417311668395996, 0.26124298572540283, 0.28075480461120605, 0.30026665329933167, 0.3197784721851349, 0.3392903208732605, 0.3588021397590637, 0.37831395864486694, 0.39782577753067017, 0.4173376262187958, 0.436849445104599, 0.4563612639904022, 0.47587311267852783, 0.49538493156433105, 0.5148967504501343, 0.5344085693359375, 0.5539203882217407, 0.573432207107544, 0.5929440259933472, 0.6124559044837952, 0.6319677233695984, 0.6514795422554016, 0.6709913611412048, 0.6905031800270081, 0.7100149989128113, 0.7295268177986145, 0.7490386962890625, 0.7685505151748657, 0.788062334060669, 0.8075741529464722, 0.8270859718322754, 0.8465977907180786, 0.8661096096038818, 0.8856214284896851, 0.9051332473754883, 0.9246451258659363, 0.9441569447517395, 0.9636687636375427, 0.983180582523346, 1.002692461013794, 1.0222042798995972, 1.0417160987854004, 1.0612279176712036, 1.0807397365570068, 1.10025155544281, 1.1197633743286133, 1.1392751932144165]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 7.0, 9.0, 10.0, 10.0, 12.0, 18.0, 17.0, 25.0, 32.0, 26.0, 31.0, 28.0, 41.0, 50.0, 46.0, 35.0, 53.0, 43.0, 44.0, 45.0, 51.0, 39.0, 38.0, 37.0, 36.0, 30.0, 30.0, 37.0, 24.0, 19.0, 13.0, 18.0, 11.0, 10.0, 11.0, 6.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07285809516906738, -0.07038619369268417, -0.06791429221630096, -0.06544238328933716, -0.06297048181295395, -0.06049858033657074, -0.05802667513489723, -0.055554769933223724, -0.053082868456840515, -0.050610966980457306, -0.0481390617787838, -0.04566715657711029, -0.04319525510072708, -0.04072335362434387, -0.038251448422670364, -0.03577954322099686, -0.03330764174461365, -0.03083573840558529, -0.02836383506655693, -0.025891931727528572, -0.023420028388500214, -0.020948125049471855, -0.018476221710443497, -0.016004318371415138, -0.01353241503238678, -0.011060511693358421, -0.008588608354330063, -0.006116705015301704, -0.003644801676273346, -0.0011728983372449875, 0.001299005001783371, 0.0037709083408117294, 0.006242811679840088, 0.008714715018868446, 0.011186618357896805, 0.013658521696925163, 0.01613042503595352, 0.01860232837498188, 0.02107423171401024, 0.023546135053038597, 0.026018038392066956, 0.028489941731095314, 0.030961845070123672, 0.03343375027179718, 0.03590565174818039, 0.0383775532245636, 0.040849458426237106, 0.043321363627910614, 0.04579326510429382, 0.04826516658067703, 0.05073707178235054, 0.05320897698402405, 0.05568087846040726, 0.058152779936790466, 0.060624685138463974, 0.06309659034013748, 0.06556849181652069, 0.0680403932929039, 0.07051229476928711, 0.07298420369625092, 0.07545610517263412, 0.07792800664901733, 0.08039991557598114, 0.08287181705236435, 0.08534371852874756]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 1.0, 9.0, 13.0, 9.0, 17.0, 20.0, 19.0, 25.0, 25.0, 29.0, 26.0, 19.0, 36.0, 22.0, 38.0, 47.0, 43.0, 45.0, 38.0, 43.0, 37.0, 42.0, 32.0, 32.0, 35.0, 27.0, 35.0, 27.0, 24.0, 25.0, 21.0, 19.0, 12.0, 16.0, 16.0, 14.0, 9.0, 11.0, 4.0, 11.0, 2.0, 3.0, 2.0, 6.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.22265625, -6.01934814453125, -5.8160400390625, -5.61273193359375, -5.409423828125, -5.20611572265625, -5.0028076171875, -4.79949951171875, -4.59619140625, -4.39288330078125, -4.1895751953125, -3.98626708984375, -3.782958984375, -3.57965087890625, -3.3763427734375, -3.17303466796875, -2.9697265625, -2.76641845703125, -2.5631103515625, -2.35980224609375, -2.156494140625, -1.95318603515625, -1.7498779296875, -1.54656982421875, -1.34326171875, -1.13995361328125, -0.9366455078125, -0.73333740234375, -0.530029296875, -0.32672119140625, -0.1234130859375, 0.07989501953125, 0.283203125, 0.48651123046875, 0.6898193359375, 0.89312744140625, 1.096435546875, 1.29974365234375, 1.5030517578125, 1.70635986328125, 1.90966796875, 2.11297607421875, 2.3162841796875, 2.51959228515625, 2.722900390625, 2.92620849609375, 3.1295166015625, 3.33282470703125, 3.5361328125, 3.73944091796875, 3.9427490234375, 4.14605712890625, 4.349365234375, 4.55267333984375, 4.7559814453125, 4.95928955078125, 5.16259765625, 5.36590576171875, 5.5692138671875, 5.77252197265625, 5.975830078125, 6.17913818359375, 6.3824462890625, 6.58575439453125, 6.7890625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 7.0, 12.0, 14.0, 18.0, 27.0, 50.0, 62.0, 103.0, 140.0, 193.0, 308.0, 499.0, 703.0, 1108.0, 1809.0, 2887.0, 4690.0, 7837.0, 13347.0, 23670.0, 42373.0, 79913.0, 151869.0, 258738.0, 210770.0, 111869.0, 58794.0, 32197.0, 18049.0, 10263.0, 6030.0, 3884.0, 2199.0, 1448.0, 901.0, 593.0, 365.0, 248.0, 183.0, 120.0, 79.0, 56.0, 38.0, 34.0, 21.0, 11.0, 8.0, 6.0, 3.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.75390625, -6.53436279296875, -6.3148193359375, -6.09527587890625, -5.875732421875, -5.65618896484375, -5.4366455078125, -5.21710205078125, -4.99755859375, -4.77801513671875, -4.5584716796875, -4.33892822265625, -4.119384765625, -3.89984130859375, -3.6802978515625, -3.46075439453125, -3.2412109375, -3.02166748046875, -2.8021240234375, -2.58258056640625, -2.363037109375, -2.14349365234375, -1.9239501953125, -1.70440673828125, -1.48486328125, -1.26531982421875, -1.0457763671875, -0.82623291015625, -0.606689453125, -0.38714599609375, -0.1676025390625, 0.05194091796875, 0.271484375, 0.49102783203125, 0.7105712890625, 0.93011474609375, 1.149658203125, 1.36920166015625, 1.5887451171875, 1.80828857421875, 2.02783203125, 2.24737548828125, 2.4669189453125, 2.68646240234375, 2.906005859375, 3.12554931640625, 3.3450927734375, 3.56463623046875, 3.7841796875, 4.00372314453125, 4.2232666015625, 4.44281005859375, 4.662353515625, 4.88189697265625, 5.1014404296875, 5.32098388671875, 5.54052734375, 5.76007080078125, 5.9796142578125, 6.19915771484375, 6.418701171875, 6.63824462890625, 6.8577880859375, 7.07733154296875, 7.296875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 5.0, 10.0, 8.0, 12.0, 21.0, 21.0, 22.0, 25.0, 34.0, 19.0, 49.0, 45.0, 55.0, 72.0, 96.0, 181.0, 1313.0, 332.0, 193.0, 109.0, 84.0, 50.0, 38.0, 44.0, 24.0, 34.0, 18.0, 23.0, 22.0, 9.0, 16.0, 10.0, 9.0, 4.0, 8.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.765625, -16.16650390625, -15.5673828125, -14.96826171875, -14.369140625, -13.77001953125, -13.1708984375, -12.57177734375, -11.97265625, -11.37353515625, -10.7744140625, -10.17529296875, -9.576171875, -8.97705078125, -8.3779296875, -7.77880859375, -7.1796875, -6.58056640625, -5.9814453125, -5.38232421875, -4.783203125, -4.18408203125, -3.5849609375, -2.98583984375, -2.38671875, -1.78759765625, -1.1884765625, -0.58935546875, 0.009765625, 0.60888671875, 1.2080078125, 1.80712890625, 2.40625, 3.00537109375, 3.6044921875, 4.20361328125, 4.802734375, 5.40185546875, 6.0009765625, 6.60009765625, 7.19921875, 7.79833984375, 8.3974609375, 8.99658203125, 9.595703125, 10.19482421875, 10.7939453125, 11.39306640625, 11.9921875, 12.59130859375, 13.1904296875, 13.78955078125, 14.388671875, 14.98779296875, 15.5869140625, 16.18603515625, 16.78515625, 17.38427734375, 17.9833984375, 18.58251953125, 19.181640625, 19.78076171875, 20.3798828125, 20.97900390625, 21.578125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 7.0, 8.0, 8.0, 10.0, 6.0, 13.0, 14.0, 18.0, 22.0, 53.0, 36.0, 72.0, 86.0, 112.0, 192.0, 245.0, 374.0, 753.0, 2210.0, 10947.0, 96159.0, 2238114.0, 745153.0, 42046.0, 5885.0, 1508.0, 563.0, 304.0, 223.0, 136.0, 115.0, 78.0, 38.0, 48.0, 35.0, 28.0, 17.0, 18.0, 11.0, 11.0, 7.0, 9.0, 8.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.65625, -25.84423828125, -25.0322265625, -24.22021484375, -23.408203125, -22.59619140625, -21.7841796875, -20.97216796875, -20.16015625, -19.34814453125, -18.5361328125, -17.72412109375, -16.912109375, -16.10009765625, -15.2880859375, -14.47607421875, -13.6640625, -12.85205078125, -12.0400390625, -11.22802734375, -10.416015625, -9.60400390625, -8.7919921875, -7.97998046875, -7.16796875, -6.35595703125, -5.5439453125, -4.73193359375, -3.919921875, -3.10791015625, -2.2958984375, -1.48388671875, -0.671875, 0.14013671875, 0.9521484375, 1.76416015625, 2.576171875, 3.38818359375, 4.2001953125, 5.01220703125, 5.82421875, 6.63623046875, 7.4482421875, 8.26025390625, 9.072265625, 9.88427734375, 10.6962890625, 11.50830078125, 12.3203125, 13.13232421875, 13.9443359375, 14.75634765625, 15.568359375, 16.38037109375, 17.1923828125, 18.00439453125, 18.81640625, 19.62841796875, 20.4404296875, 21.25244140625, 22.064453125, 22.87646484375, 23.6884765625, 24.50048828125, 25.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [5.0, 205.0, 739.0, 69.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.383800506591797, -15.29759407043457, -4.211387634277344, 6.874820709228516, 17.96102523803711, 29.047229766845703, 40.13344192504883, 51.21964645385742, 62.305850982666016, 73.39205932617188, 84.47826385498047, 95.56446838378906, 106.65068054199219, 117.73687744140625, 128.82308959960938, 139.9093017578125, 150.99549865722656, 162.0817108154297, 173.16790771484375, 184.25411987304688, 195.34033203125, 206.42652893066406, 217.5127410888672, 228.59893798828125, 239.68515014648438, 250.7713623046875, 261.8575744628906, 272.94378662109375, 284.02996826171875, 295.1161804199219, 306.202392578125, 317.2886047363281, 328.37481689453125, 339.4610290527344, 350.5472412109375, 361.6334228515625, 372.7196350097656, 383.80584716796875, 394.8920593261719, 405.978271484375, 417.064453125, 428.1506652832031, 439.23687744140625, 450.32305908203125, 461.4092712402344, 472.4954833984375, 483.5816955566406, 494.66790771484375, 505.7541198730469, 516.84033203125, 527.926513671875, 539.0127563476562, 550.0989379882812, 561.1851806640625, 572.2713623046875, 583.3575439453125, 594.4437866210938, 605.5299682617188, 616.6162109375, 627.702392578125, 638.7886352539062, 649.8748168945312, 660.9610595703125, 672.0472412109375, 683.1334228515625]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 2.0, 10.0, 9.0, 7.0, 8.0, 13.0, 16.0, 17.0, 21.0, 35.0, 17.0, 32.0, 26.0, 24.0, 39.0, 42.0, 33.0, 32.0, 43.0, 50.0, 40.0, 49.0, 44.0, 35.0, 40.0, 33.0, 36.0, 17.0, 28.0, 40.0, 18.0, 22.0, 12.0, 17.0, 20.0, 11.0, 14.0, 11.0, 8.0, 12.0, 5.0, 6.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0], "bins": [-52.304683685302734, -50.9275016784668, -49.55031967163086, -48.17313766479492, -46.79595184326172, -45.41876983642578, -44.041587829589844, -42.664405822753906, -41.28722381591797, -39.91004180908203, -38.532859802246094, -37.155677795410156, -35.77849578857422, -34.401309967041016, -33.02412796020508, -31.64694595336914, -30.269763946533203, -28.892581939697266, -27.515399932861328, -26.138216018676758, -24.76103401184082, -23.383852005004883, -22.006668090820312, -20.629486083984375, -19.252304077148438, -17.8751220703125, -16.497940063476562, -15.120756149291992, -13.743574142456055, -12.366392135620117, -10.989209175109863, -9.61202621459961, -8.234840393066406, -6.8576579093933105, -5.480475425720215, -4.103292942047119, -2.7261104583740234, -1.3489279747009277, 0.02825450897216797, 1.4054374694824219, 2.7826194763183594, 4.159801959991455, 5.536984443664551, 6.9141669273376465, 8.291349411010742, 9.66853141784668, 11.045714378356934, 12.422897338867188, 13.800079345703125, 15.177261352539062, 16.554443359375, 17.93162727355957, 19.308809280395508, 20.685991287231445, 22.063175201416016, 23.440357208251953, 24.81753921508789, 26.194721221923828, 27.571903228759766, 28.949087142944336, 30.326269149780273, 31.70345115661621, 33.08063507080078, 34.45781707763672, 35.834999084472656]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 6.0, 10.0, 13.0, 16.0, 16.0, 26.0, 20.0, 27.0, 23.0, 37.0, 43.0, 35.0, 40.0, 37.0, 39.0, 42.0, 47.0, 34.0, 51.0, 37.0, 41.0, 41.0, 30.0, 30.0, 29.0, 32.0, 30.0, 28.0, 22.0, 25.0, 15.0, 8.0, 7.0, 7.0, 8.0, 7.0, 5.0, 6.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.0546875, -6.82916259765625, -6.6036376953125, -6.37811279296875, -6.152587890625, -5.92706298828125, -5.7015380859375, -5.47601318359375, -5.25048828125, -5.02496337890625, -4.7994384765625, -4.57391357421875, -4.348388671875, -4.12286376953125, -3.8973388671875, -3.67181396484375, -3.4462890625, -3.22076416015625, -2.9952392578125, -2.76971435546875, -2.544189453125, -2.31866455078125, -2.0931396484375, -1.86761474609375, -1.64208984375, -1.41656494140625, -1.1910400390625, -0.96551513671875, -0.739990234375, -0.51446533203125, -0.2889404296875, -0.06341552734375, 0.162109375, 0.38763427734375, 0.6131591796875, 0.83868408203125, 1.064208984375, 1.28973388671875, 1.5152587890625, 1.74078369140625, 1.96630859375, 2.19183349609375, 2.4173583984375, 2.64288330078125, 2.868408203125, 3.09393310546875, 3.3194580078125, 3.54498291015625, 3.7705078125, 3.99603271484375, 4.2215576171875, 4.44708251953125, 4.672607421875, 4.89813232421875, 5.1236572265625, 5.34918212890625, 5.57470703125, 5.80023193359375, 6.0257568359375, 6.25128173828125, 6.476806640625, 6.70233154296875, 6.9278564453125, 7.15338134765625, 7.37890625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 6.0, 5.0, 9.0, 11.0, 11.0, 25.0, 27.0, 36.0, 81.0, 105.0, 144.0, 228.0, 370.0, 564.0, 904.0, 1495.0, 2607.0, 4455.0, 8754.0, 18087.0, 44253.0, 134028.0, 498792.0, 1620417.0, 1329495.0, 361846.0, 99868.0, 35282.0, 14979.0, 7388.0, 4077.0, 2333.0, 1344.0, 804.0, 487.0, 331.0, 192.0, 141.0, 99.0, 68.0, 44.0, 20.0, 29.0, 17.0, 11.0, 8.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-9.4765625, -9.21246337890625, -8.9483642578125, -8.68426513671875, -8.420166015625, -8.15606689453125, -7.8919677734375, -7.62786865234375, -7.36376953125, -7.09967041015625, -6.8355712890625, -6.57147216796875, -6.307373046875, -6.04327392578125, -5.7791748046875, -5.51507568359375, -5.2509765625, -4.98687744140625, -4.7227783203125, -4.45867919921875, -4.194580078125, -3.93048095703125, -3.6663818359375, -3.40228271484375, -3.13818359375, -2.87408447265625, -2.6099853515625, -2.34588623046875, -2.081787109375, -1.81768798828125, -1.5535888671875, -1.28948974609375, -1.025390625, -0.76129150390625, -0.4971923828125, -0.23309326171875, 0.031005859375, 0.29510498046875, 0.5592041015625, 0.82330322265625, 1.08740234375, 1.35150146484375, 1.6156005859375, 1.87969970703125, 2.143798828125, 2.40789794921875, 2.6719970703125, 2.93609619140625, 3.2001953125, 3.46429443359375, 3.7283935546875, 3.99249267578125, 4.256591796875, 4.52069091796875, 4.7847900390625, 5.04888916015625, 5.31298828125, 5.57708740234375, 5.8411865234375, 6.10528564453125, 6.369384765625, 6.63348388671875, 6.8975830078125, 7.16168212890625, 7.42578125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 9.0, 16.0, 14.0, 20.0, 17.0, 25.0, 40.0, 67.0, 91.0, 105.0, 176.0, 236.0, 375.0, 535.0, 625.0, 519.0, 348.0, 234.0, 184.0, 120.0, 79.0, 56.0, 48.0, 36.0, 23.0, 14.0, 15.0, 9.0, 11.0, 2.0, 10.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.390625, -10.060302734375, -9.72998046875, -9.399658203125, -9.0693359375, -8.739013671875, -8.40869140625, -8.078369140625, -7.748046875, -7.417724609375, -7.08740234375, -6.757080078125, -6.4267578125, -6.096435546875, -5.76611328125, -5.435791015625, -5.10546875, -4.775146484375, -4.44482421875, -4.114501953125, -3.7841796875, -3.453857421875, -3.12353515625, -2.793212890625, -2.462890625, -2.132568359375, -1.80224609375, -1.471923828125, -1.1416015625, -0.811279296875, -0.48095703125, -0.150634765625, 0.1796875, 0.510009765625, 0.84033203125, 1.170654296875, 1.5009765625, 1.831298828125, 2.16162109375, 2.491943359375, 2.822265625, 3.152587890625, 3.48291015625, 3.813232421875, 4.1435546875, 4.473876953125, 4.80419921875, 5.134521484375, 5.46484375, 5.795166015625, 6.12548828125, 6.455810546875, 6.7861328125, 7.116455078125, 7.44677734375, 7.777099609375, 8.107421875, 8.437744140625, 8.76806640625, 9.098388671875, 9.4287109375, 9.759033203125, 10.08935546875, 10.419677734375, 10.75]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 7.0, 6.0, 7.0, 20.0, 20.0, 29.0, 52.0, 70.0, 88.0, 151.0, 336.0, 867.0, 3226.0, 16218.0, 110954.0, 1823580.0, 2092757.0, 122922.0, 17632.0, 3526.0, 1006.0, 359.0, 136.0, 101.0, 67.0, 38.0, 33.0, 17.0, 15.0, 13.0, 9.0, 5.0, 5.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.65625, -22.9609375, -22.265625, -21.5703125, -20.875, -20.1796875, -19.484375, -18.7890625, -18.09375, -17.3984375, -16.703125, -16.0078125, -15.3125, -14.6171875, -13.921875, -13.2265625, -12.53125, -11.8359375, -11.140625, -10.4453125, -9.75, -9.0546875, -8.359375, -7.6640625, -6.96875, -6.2734375, -5.578125, -4.8828125, -4.1875, -3.4921875, -2.796875, -2.1015625, -1.40625, -0.7109375, -0.015625, 0.6796875, 1.375, 2.0703125, 2.765625, 3.4609375, 4.15625, 4.8515625, 5.546875, 6.2421875, 6.9375, 7.6328125, 8.328125, 9.0234375, 9.71875, 10.4140625, 11.109375, 11.8046875, 12.5, 13.1953125, 13.890625, 14.5859375, 15.28125, 15.9765625, 16.671875, 17.3671875, 18.0625, 18.7578125, 19.453125, 20.1484375, 20.84375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 16.0, 19.0, 62.0, 97.0, 168.0, 184.0, 196.0, 129.0, 72.0, 35.0, 22.0, 10.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.97679901123047, -73.7922592163086, -71.60772705078125, -69.42318725585938, -67.23865509033203, -65.05411529541016, -62.86957931518555, -60.68504333496094, -58.50050735473633, -56.31597137451172, -54.13143539428711, -51.9468994140625, -49.762359619140625, -47.57782745361328, -45.393287658691406, -43.2087516784668, -41.02421569824219, -38.83967971801758, -36.65514373779297, -34.47060775756836, -32.28607177734375, -30.101533889770508, -27.916996002197266, -25.732460021972656, -23.547924041748047, -21.363388061523438, -19.178852081298828, -16.994314193725586, -14.809778213500977, -12.625242233276367, -10.440705299377441, -8.256168365478516, -6.0716400146484375, -3.88710355758667, -1.7025671005249023, 0.48196935653686523, 2.666505813598633, 4.851041793823242, 7.035578727722168, 9.220115661621094, 11.404651641845703, 13.589187622070312, 15.773724555969238, 17.958261489868164, 20.142797470092773, 22.327333450317383, 24.511871337890625, 26.696407318115234, 28.880943298339844, 31.065479278564453, 33.25001525878906, 35.43455123901367, 37.61908721923828, 39.803627014160156, 41.988162994384766, 44.172698974609375, 46.357234954833984, 48.541770935058594, 50.7263069152832, 52.91084289550781, 55.09538269042969, 57.27991485595703, 59.464454650878906, 61.648990631103516, 63.833526611328125]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 13.0, 18.0, 10.0, 18.0, 14.0, 16.0, 18.0, 26.0, 29.0, 31.0, 32.0, 26.0, 45.0, 35.0, 35.0, 35.0, 53.0, 47.0, 47.0, 42.0, 29.0, 37.0, 38.0, 33.0, 27.0, 30.0, 27.0, 27.0, 21.0, 25.0, 19.0, 12.0, 10.0, 20.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-31.154857635498047, -30.19528579711914, -29.235713958740234, -28.276142120361328, -27.316570281982422, -26.356998443603516, -25.39742660522461, -24.437854766845703, -23.478282928466797, -22.51871109008789, -21.559139251708984, -20.599567413330078, -19.639995574951172, -18.680423736572266, -17.72085189819336, -16.761280059814453, -15.80171012878418, -14.842138290405273, -13.882566452026367, -12.922994613647461, -11.963422775268555, -11.003850936889648, -10.044280052185059, -9.084708213806152, -8.125136375427246, -7.16556453704834, -6.205992698669434, -5.2464213371276855, -4.286849498748779, -3.327277660369873, -2.367706298828125, -1.4081344604492188, -0.4485607147216797, 0.511011004447937, 1.4705827236175537, 2.430154323577881, 3.389726161956787, 4.349298000335693, 5.308869361877441, 6.268441200256348, 7.228013038635254, 8.18758487701416, 9.147156715393066, 10.106727600097656, 11.066299438476562, 12.025871276855469, 12.985443115234375, 13.945014953613281, 14.904586791992188, 15.864158630371094, 16.82373046875, 17.783302307128906, 18.742874145507812, 19.70244598388672, 20.662017822265625, 21.62158966064453, 22.581161499023438, 23.540733337402344, 24.50030517578125, 25.459877014160156, 26.419448852539062, 27.37902069091797, 28.338592529296875, 29.29816436767578, 30.257734298706055]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 3.0, 11.0, 9.0, 4.0, 8.0, 13.0, 14.0, 23.0, 20.0, 30.0, 27.0, 44.0, 27.0, 49.0, 41.0, 38.0, 36.0, 63.0, 63.0, 46.0, 47.0, 50.0, 47.0, 35.0, 36.0, 35.0, 29.0, 20.0, 22.0, 19.0, 16.0, 13.0, 7.0, 19.0, 7.0, 8.0, 6.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.48046875, -7.23590087890625, -6.9913330078125, -6.74676513671875, -6.502197265625, -6.25762939453125, -6.0130615234375, -5.76849365234375, -5.52392578125, -5.27935791015625, -5.0347900390625, -4.79022216796875, -4.545654296875, -4.30108642578125, -4.0565185546875, -3.81195068359375, -3.5673828125, -3.32281494140625, -3.0782470703125, -2.83367919921875, -2.589111328125, -2.34454345703125, -2.0999755859375, -1.85540771484375, -1.61083984375, -1.36627197265625, -1.1217041015625, -0.87713623046875, -0.632568359375, -0.38800048828125, -0.1434326171875, 0.10113525390625, 0.345703125, 0.59027099609375, 0.8348388671875, 1.07940673828125, 1.323974609375, 1.56854248046875, 1.8131103515625, 2.05767822265625, 2.30224609375, 2.54681396484375, 2.7913818359375, 3.03594970703125, 3.280517578125, 3.52508544921875, 3.7696533203125, 4.01422119140625, 4.2587890625, 4.50335693359375, 4.7479248046875, 4.99249267578125, 5.237060546875, 5.48162841796875, 5.7261962890625, 5.97076416015625, 6.21533203125, 6.45989990234375, 6.7044677734375, 6.94903564453125, 7.193603515625, 7.43817138671875, 7.6827392578125, 7.92730712890625, 8.171875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 3.0, 7.0, 19.0, 26.0, 22.0, 29.0, 53.0, 79.0, 108.0, 141.0, 224.0, 303.0, 518.0, 747.0, 1101.0, 1724.0, 2712.0, 4380.0, 6894.0, 11372.0, 19090.0, 32292.0, 55727.0, 97957.0, 162959.0, 213931.0, 175908.0, 108300.0, 62025.0, 35721.0, 20731.0, 12671.0, 7626.0, 4640.0, 2902.0, 1881.0, 1283.0, 788.0, 491.0, 387.0, 264.0, 168.0, 103.0, 72.0, 52.0, 39.0, 26.0, 19.0, 14.0, 15.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.859375, -0.8330078125, -0.806640625, -0.7802734375, -0.75390625, -0.7275390625, -0.701171875, -0.6748046875, -0.6484375, -0.6220703125, -0.595703125, -0.5693359375, -0.54296875, -0.5166015625, -0.490234375, -0.4638671875, -0.4375, -0.4111328125, -0.384765625, -0.3583984375, -0.33203125, -0.3056640625, -0.279296875, -0.2529296875, -0.2265625, -0.2001953125, -0.173828125, -0.1474609375, -0.12109375, -0.0947265625, -0.068359375, -0.0419921875, -0.015625, 0.0107421875, 0.037109375, 0.0634765625, 0.08984375, 0.1162109375, 0.142578125, 0.1689453125, 0.1953125, 0.2216796875, 0.248046875, 0.2744140625, 0.30078125, 0.3271484375, 0.353515625, 0.3798828125, 0.40625, 0.4326171875, 0.458984375, 0.4853515625, 0.51171875, 0.5380859375, 0.564453125, 0.5908203125, 0.6171875, 0.6435546875, 0.669921875, 0.6962890625, 0.72265625, 0.7490234375, 0.775390625, 0.8017578125, 0.828125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 6.0, 9.0, 5.0, 5.0, 16.0, 16.0, 26.0, 15.0, 23.0, 22.0, 26.0, 37.0, 25.0, 42.0, 41.0, 46.0, 42.0, 37.0, 1059.0, 48.0, 43.0, 39.0, 43.0, 43.0, 39.0, 28.0, 31.0, 33.0, 27.0, 27.0, 20.0, 17.0, 15.0, 18.0, 15.0, 8.0, 7.0, 4.0, 2.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84375, -4.685546875, -4.52734375, -4.369140625, -4.2109375, -4.052734375, -3.89453125, -3.736328125, -3.578125, -3.419921875, -3.26171875, -3.103515625, -2.9453125, -2.787109375, -2.62890625, -2.470703125, -2.3125, -2.154296875, -1.99609375, -1.837890625, -1.6796875, -1.521484375, -1.36328125, -1.205078125, -1.046875, -0.888671875, -0.73046875, -0.572265625, -0.4140625, -0.255859375, -0.09765625, 0.060546875, 0.21875, 0.376953125, 0.53515625, 0.693359375, 0.8515625, 1.009765625, 1.16796875, 1.326171875, 1.484375, 1.642578125, 1.80078125, 1.958984375, 2.1171875, 2.275390625, 2.43359375, 2.591796875, 2.75, 2.908203125, 3.06640625, 3.224609375, 3.3828125, 3.541015625, 3.69921875, 3.857421875, 4.015625, 4.173828125, 4.33203125, 4.490234375, 4.6484375, 4.806640625, 4.96484375, 5.123046875, 5.28125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 9.0, 6.0, 18.0, 23.0, 29.0, 50.0, 67.0, 119.0, 226.0, 386.0, 735.0, 1432.0, 2814.0, 5629.0, 12348.0, 27676.0, 66064.0, 165838.0, 1276489.0, 343576.0, 111824.0, 45209.0, 19239.0, 8743.0, 4163.0, 2034.0, 1058.0, 558.0, 317.0, 175.0, 101.0, 49.0, 35.0, 20.0, 23.0, 10.0, 12.0, 5.0, 5.0, 4.0, 2.0, 5.0, 5.0], "bins": [-1.26953125, -1.2376251220703125, -1.205718994140625, -1.1738128662109375, -1.14190673828125, -1.1100006103515625, -1.078094482421875, -1.0461883544921875, -1.0142822265625, -0.9823760986328125, -0.950469970703125, -0.9185638427734375, -0.88665771484375, -0.8547515869140625, -0.822845458984375, -0.7909393310546875, -0.759033203125, -0.7271270751953125, -0.695220947265625, -0.6633148193359375, -0.63140869140625, -0.5995025634765625, -0.567596435546875, -0.5356903076171875, -0.5037841796875, -0.4718780517578125, -0.439971923828125, -0.4080657958984375, -0.37615966796875, -0.3442535400390625, -0.312347412109375, -0.2804412841796875, -0.24853515625, -0.2166290283203125, -0.184722900390625, -0.1528167724609375, -0.12091064453125, -0.0890045166015625, -0.057098388671875, -0.0251922607421875, 0.0067138671875, 0.0386199951171875, 0.070526123046875, 0.1024322509765625, 0.13433837890625, 0.1662445068359375, 0.198150634765625, 0.2300567626953125, 0.261962890625, 0.2938690185546875, 0.325775146484375, 0.3576812744140625, 0.38958740234375, 0.4214935302734375, 0.453399658203125, 0.4853057861328125, 0.5172119140625, 0.5491180419921875, 0.581024169921875, 0.6129302978515625, 0.64483642578125, 0.6767425537109375, 0.708648681640625, 0.7405548095703125, 0.7724609375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 2.0, 6.0, 2.0, 5.0, 6.0, 8.0, 7.0, 10.0, 13.0, 9.0, 14.0, 14.0, 16.0, 24.0, 29.0, 47.0, 48.0, 49.0, 62.0, 49.0, 63.0, 72.0, 76.0, 65.0, 54.0, 37.0, 41.0, 22.0, 18.0, 23.0, 16.0, 14.0, 18.0, 11.0, 6.0, 7.0, 7.0, 5.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.058929443359375, -0.05719280242919922, -0.05545616149902344, -0.053719520568847656, -0.051982879638671875, -0.050246238708496094, -0.04850959777832031, -0.04677295684814453, -0.04503631591796875, -0.04329967498779297, -0.04156303405761719, -0.039826393127441406, -0.038089752197265625, -0.036353111267089844, -0.03461647033691406, -0.03287982940673828, -0.0311431884765625, -0.02940654754638672, -0.027669906616210938, -0.025933265686035156, -0.024196624755859375, -0.022459983825683594, -0.020723342895507812, -0.01898670196533203, -0.01725006103515625, -0.015513420104980469, -0.013776779174804688, -0.012040138244628906, -0.010303497314453125, -0.008566856384277344, -0.0068302154541015625, -0.005093574523925781, -0.00335693359375, -0.0016202926635742188, 0.0001163482666015625, 0.0018529891967773438, 0.003589630126953125, 0.005326271057128906, 0.0070629119873046875, 0.008799552917480469, 0.01053619384765625, 0.012272834777832031, 0.014009475708007812, 0.015746116638183594, 0.017482757568359375, 0.019219398498535156, 0.020956039428710938, 0.02269268035888672, 0.0244293212890625, 0.02616596221923828, 0.027902603149414062, 0.029639244079589844, 0.031375885009765625, 0.033112525939941406, 0.03484916687011719, 0.03658580780029297, 0.03832244873046875, 0.04005908966064453, 0.04179573059082031, 0.043532371520996094, 0.045269012451171875, 0.047005653381347656, 0.04874229431152344, 0.05047893524169922, 0.052215576171875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 6.0, 5.0, 11.0, 12.0, 11.0, 15.0, 12.0, 14.0, 16.0, 28.0, 19.0, 27.0, 45.0, 39.0, 87.0, 128.0, 183.0, 301.0, 763.0, 8708.0, 1020078.0, 16168.0, 847.0, 319.0, 185.0, 125.0, 98.0, 65.0, 42.0, 26.0, 22.0, 25.0, 19.0, 14.0, 17.0, 13.0, 7.0, 5.0, 7.0, 10.0, 8.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 4.0], "bins": [-1.0947265625, -1.0600433349609375, -1.025360107421875, -0.9906768798828125, -0.95599365234375, -0.9213104248046875, -0.886627197265625, -0.8519439697265625, -0.8172607421875, -0.7825775146484375, -0.747894287109375, -0.7132110595703125, -0.67852783203125, -0.6438446044921875, -0.609161376953125, -0.5744781494140625, -0.539794921875, -0.5051116943359375, -0.470428466796875, -0.4357452392578125, -0.40106201171875, -0.3663787841796875, -0.331695556640625, -0.2970123291015625, -0.2623291015625, -0.2276458740234375, -0.192962646484375, -0.1582794189453125, -0.12359619140625, -0.0889129638671875, -0.054229736328125, -0.0195465087890625, 0.01513671875, 0.0498199462890625, 0.084503173828125, 0.1191864013671875, 0.15386962890625, 0.1885528564453125, 0.223236083984375, 0.2579193115234375, 0.2926025390625, 0.3272857666015625, 0.361968994140625, 0.3966522216796875, 0.43133544921875, 0.4660186767578125, 0.500701904296875, 0.5353851318359375, 0.570068359375, 0.6047515869140625, 0.639434814453125, 0.6741180419921875, 0.70880126953125, 0.7434844970703125, 0.778167724609375, 0.8128509521484375, 0.8475341796875, 0.8822174072265625, 0.916900634765625, 0.9515838623046875, 0.98626708984375, 1.0209503173828125, 1.055633544921875, 1.0903167724609375, 1.125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 10.0, 20.0, 41.0, 89.0, 190.0, 279.0, 213.0, 99.0, 40.0, 20.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09815242141485214, -0.09309753775596619, -0.08804265409708023, -0.08298777043819427, -0.07793288677930832, -0.07287800312042236, -0.06782311201095581, -0.06276823580265045, -0.0577133484184742, -0.05265846475958824, -0.047603581100702286, -0.04254869371652603, -0.037493810057640076, -0.03243892639875412, -0.027384042739868164, -0.022329159080982208, -0.017274275422096252, -0.012219391763210297, -0.007164507173001766, -0.0021096225827932358, 0.00294526107609272, 0.008000144734978676, 0.013055030256509781, 0.018109913915395737, 0.023164797574281693, 0.02821968123316765, 0.033274564892053604, 0.03832945227622986, 0.043384335935115814, 0.04843921959400177, 0.053494103252887726, 0.05854898691177368, 0.06360387802124023, 0.06865876168012619, 0.07371364533901215, 0.0787685289978981, 0.08382341265678406, 0.08887829631567001, 0.09393317997455597, 0.09898807108402252, 0.10404294729232788, 0.10909783095121384, 0.11415271461009979, 0.11920759826898575, 0.1242624819278717, 0.12931737303733826, 0.13437224924564362, 0.13942714035511017, 0.14448201656341553, 0.14953690767288208, 0.15459178388118744, 0.159646674990654, 0.16470155119895935, 0.1697564423084259, 0.17481131851673126, 0.17986620962619781, 0.18492110073566437, 0.18997599184513092, 0.19503086805343628, 0.20008575916290283, 0.2051406353712082, 0.21019552648067474, 0.2152504026889801, 0.22030529379844666, 0.22536017000675201]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 9.0, 2.0, 8.0, 11.0, 9.0, 13.0, 19.0, 12.0, 14.0, 18.0, 18.0, 24.0, 26.0, 22.0, 28.0, 34.0, 28.0, 28.0, 27.0, 31.0, 54.0, 37.0, 39.0, 46.0, 37.0, 30.0, 41.0, 22.0, 28.0, 23.0, 24.0, 35.0, 24.0, 28.0, 18.0, 16.0, 15.0, 12.0, 10.0, 11.0, 13.0, 11.0, 5.0, 13.0, 5.0, 8.0, 3.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.05248302221298218, -0.05086439102888107, -0.04924575984477997, -0.047627128660678864, -0.04600849747657776, -0.044389866292476654, -0.04277123510837555, -0.041152603924274445, -0.03953397274017334, -0.037915341556072235, -0.03629671037197113, -0.034678079187870026, -0.03305944800376892, -0.031440816819667816, -0.02982218563556671, -0.028203554451465607, -0.026584923267364502, -0.024966292083263397, -0.023347660899162292, -0.021729029715061188, -0.020110398530960083, -0.01849176734685898, -0.016873136162757874, -0.015254504978656769, -0.013635873794555664, -0.01201724261045456, -0.010398611426353455, -0.00877998024225235, -0.007161349058151245, -0.00554271787405014, -0.003924086689949036, -0.002305455505847931, -0.0006868243217468262, 0.0009318068623542786, 0.0025504380464553833, 0.004169069230556488, 0.005787700414657593, 0.0074063315987586975, 0.009024962782859802, 0.010643593966960907, 0.012262225151062012, 0.013880856335163116, 0.015499487519264221, 0.017118118703365326, 0.01873674988746643, 0.020355381071567535, 0.02197401225566864, 0.023592643439769745, 0.02521127462387085, 0.026829905807971954, 0.02844853699207306, 0.030067168176174164, 0.03168579936027527, 0.03330443054437637, 0.03492306172847748, 0.03654169291257858, 0.03816032409667969, 0.03977895528078079, 0.0413975864648819, 0.043016217648983, 0.044634848833084106, 0.04625348001718521, 0.047872111201286316, 0.04949074238538742, 0.051109373569488525]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 13.0, 4.0, 11.0, 9.0, 16.0, 15.0, 26.0, 18.0, 24.0, 26.0, 33.0, 40.0, 34.0, 30.0, 42.0, 43.0, 53.0, 58.0, 49.0, 49.0, 42.0, 46.0, 44.0, 39.0, 28.0, 26.0, 25.0, 21.0, 19.0, 9.0, 22.0, 17.0, 8.0, 12.0, 6.0, 6.0, 6.0, 5.0, 8.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.328125, -7.0987548828125, -6.869384765625, -6.6400146484375, -6.41064453125, -6.1812744140625, -5.951904296875, -5.7225341796875, -5.4931640625, -5.2637939453125, -5.034423828125, -4.8050537109375, -4.57568359375, -4.3463134765625, -4.116943359375, -3.8875732421875, -3.658203125, -3.4288330078125, -3.199462890625, -2.9700927734375, -2.74072265625, -2.5113525390625, -2.281982421875, -2.0526123046875, -1.8232421875, -1.5938720703125, -1.364501953125, -1.1351318359375, -0.90576171875, -0.6763916015625, -0.447021484375, -0.2176513671875, 0.01171875, 0.2410888671875, 0.470458984375, 0.6998291015625, 0.92919921875, 1.1585693359375, 1.387939453125, 1.6173095703125, 1.8466796875, 2.0760498046875, 2.305419921875, 2.5347900390625, 2.76416015625, 2.9935302734375, 3.222900390625, 3.4522705078125, 3.681640625, 3.9110107421875, 4.140380859375, 4.3697509765625, 4.59912109375, 4.8284912109375, 5.057861328125, 5.2872314453125, 5.5166015625, 5.7459716796875, 5.975341796875, 6.2047119140625, 6.43408203125, 6.6634521484375, 6.892822265625, 7.1221923828125, 7.3515625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 13.0, 10.0, 22.0, 14.0, 19.0, 39.0, 41.0, 57.0, 88.0, 120.0, 202.0, 281.0, 435.0, 735.0, 1113.0, 1714.0, 2995.0, 4995.0, 8897.0, 15772.0, 28541.0, 55344.0, 119517.0, 266040.0, 281843.0, 130233.0, 59261.0, 30669.0, 16773.0, 9193.0, 5376.0, 3140.0, 1923.0, 1081.0, 691.0, 420.0, 313.0, 196.0, 125.0, 77.0, 69.0, 56.0, 30.0, 29.0, 16.0, 15.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.61328125, -7.35992431640625, -7.1065673828125, -6.85321044921875, -6.599853515625, -6.34649658203125, -6.0931396484375, -5.83978271484375, -5.58642578125, -5.33306884765625, -5.0797119140625, -4.82635498046875, -4.572998046875, -4.31964111328125, -4.0662841796875, -3.81292724609375, -3.5595703125, -3.30621337890625, -3.0528564453125, -2.79949951171875, -2.546142578125, -2.29278564453125, -2.0394287109375, -1.78607177734375, -1.53271484375, -1.27935791015625, -1.0260009765625, -0.77264404296875, -0.519287109375, -0.26593017578125, -0.0125732421875, 0.24078369140625, 0.494140625, 0.74749755859375, 1.0008544921875, 1.25421142578125, 1.507568359375, 1.76092529296875, 2.0142822265625, 2.26763916015625, 2.52099609375, 2.77435302734375, 3.0277099609375, 3.28106689453125, 3.534423828125, 3.78778076171875, 4.0411376953125, 4.29449462890625, 4.5478515625, 4.80120849609375, 5.0545654296875, 5.30792236328125, 5.561279296875, 5.81463623046875, 6.0679931640625, 6.32135009765625, 6.57470703125, 6.82806396484375, 7.0814208984375, 7.33477783203125, 7.588134765625, 7.84149169921875, 8.0948486328125, 8.34820556640625, 8.6015625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 9.0, 9.0, 8.0, 13.0, 9.0, 9.0, 19.0, 23.0, 23.0, 18.0, 23.0, 35.0, 33.0, 38.0, 48.0, 61.0, 92.0, 134.0, 219.0, 1336.0, 245.0, 146.0, 89.0, 63.0, 52.0, 30.0, 34.0, 35.0, 38.0, 30.0, 23.0, 18.0, 13.0, 23.0, 10.0, 5.0, 11.0, 4.0, 6.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.34375, -12.841796875, -12.33984375, -11.837890625, -11.3359375, -10.833984375, -10.33203125, -9.830078125, -9.328125, -8.826171875, -8.32421875, -7.822265625, -7.3203125, -6.818359375, -6.31640625, -5.814453125, -5.3125, -4.810546875, -4.30859375, -3.806640625, -3.3046875, -2.802734375, -2.30078125, -1.798828125, -1.296875, -0.794921875, -0.29296875, 0.208984375, 0.7109375, 1.212890625, 1.71484375, 2.216796875, 2.71875, 3.220703125, 3.72265625, 4.224609375, 4.7265625, 5.228515625, 5.73046875, 6.232421875, 6.734375, 7.236328125, 7.73828125, 8.240234375, 8.7421875, 9.244140625, 9.74609375, 10.248046875, 10.75, 11.251953125, 11.75390625, 12.255859375, 12.7578125, 13.259765625, 13.76171875, 14.263671875, 14.765625, 15.267578125, 15.76953125, 16.271484375, 16.7734375, 17.275390625, 17.77734375, 18.279296875, 18.78125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 6.0, 2.0, 7.0, 10.0, 14.0, 22.0, 12.0, 25.0, 42.0, 38.0, 69.0, 101.0, 132.0, 204.0, 338.0, 528.0, 1218.0, 4126.0, 23720.0, 281348.0, 2652874.0, 158990.0, 16307.0, 3082.0, 1007.0, 463.0, 312.0, 202.0, 149.0, 103.0, 56.0, 56.0, 35.0, 32.0, 14.0, 11.0, 11.0, 8.0, 7.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.34375, -23.515869140625, -22.68798828125, -21.860107421875, -21.0322265625, -20.204345703125, -19.37646484375, -18.548583984375, -17.720703125, -16.892822265625, -16.06494140625, -15.237060546875, -14.4091796875, -13.581298828125, -12.75341796875, -11.925537109375, -11.09765625, -10.269775390625, -9.44189453125, -8.614013671875, -7.7861328125, -6.958251953125, -6.13037109375, -5.302490234375, -4.474609375, -3.646728515625, -2.81884765625, -1.990966796875, -1.1630859375, -0.335205078125, 0.49267578125, 1.320556640625, 2.1484375, 2.976318359375, 3.80419921875, 4.632080078125, 5.4599609375, 6.287841796875, 7.11572265625, 7.943603515625, 8.771484375, 9.599365234375, 10.42724609375, 11.255126953125, 12.0830078125, 12.910888671875, 13.73876953125, 14.566650390625, 15.39453125, 16.222412109375, 17.05029296875, 17.878173828125, 18.7060546875, 19.533935546875, 20.36181640625, 21.189697265625, 22.017578125, 22.845458984375, 23.67333984375, 24.501220703125, 25.3291015625, 26.156982421875, 26.98486328125, 27.812744140625, 28.640625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 13.0, 61.0, 234.0, 422.0, 214.0, 46.0, 17.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.1397933959961, -83.39500427246094, -77.65020751953125, -71.9054183959961, -66.1606216430664, -60.41583251953125, -54.67103958129883, -48.926246643066406, -43.181453704833984, -37.43666076660156, -31.69186782836914, -25.94707679748535, -20.20228385925293, -14.457490921020508, -8.712699890136719, -2.967906951904297, 2.776885986328125, 8.521678924560547, 14.266470909118652, 20.011262893676758, 25.75605583190918, 31.5008487701416, 37.24563980102539, 42.99043273925781, 48.735225677490234, 54.480018615722656, 60.22481155395508, 65.9696044921875, 71.71439361572266, 77.45919036865234, 83.2039794921875, 88.94877624511719, 94.69355773925781, 100.43834686279297, 106.18314361572266, 111.92793273925781, 117.6727294921875, 123.41751861572266, 129.1623077392578, 134.9071044921875, 140.6519012451172, 146.39669799804688, 152.1414794921875, 157.8862762451172, 163.63107299804688, 169.37586975097656, 175.1206512451172, 180.86544799804688, 186.6102294921875, 192.3550262451172, 198.0998077392578, 203.8446044921875, 209.5894012451172, 215.33419799804688, 221.0789794921875, 226.8237762451172, 232.56857299804688, 238.31336975097656, 244.0581512451172, 249.80294799804688, 255.54774475097656, 261.29254150390625, 267.0373229980469, 272.7821044921875, 278.52691650390625]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 8.0, 5.0, 15.0, 11.0, 18.0, 14.0, 21.0, 19.0, 19.0, 25.0, 24.0, 28.0, 38.0, 32.0, 44.0, 45.0, 39.0, 41.0, 55.0, 45.0, 34.0, 39.0, 28.0, 43.0, 38.0, 36.0, 27.0, 27.0, 23.0, 18.0, 18.0, 24.0, 14.0, 13.0, 13.0, 17.0, 14.0, 7.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.63214111328125, -37.38907241821289, -36.14600372314453, -34.90293884277344, -33.65987014770508, -32.41680145263672, -31.17373275756836, -29.930665969848633, -28.687599182128906, -27.444530487060547, -26.20146369934082, -24.95839500427246, -23.715328216552734, -22.472259521484375, -21.229190826416016, -19.98612403869629, -18.74305534362793, -17.49998664855957, -16.256919860839844, -15.013851165771484, -13.770784378051758, -12.527715682983398, -11.284647941589355, -10.041580200195312, -8.79851245880127, -7.555444717407227, -6.312376976013184, -5.069308757781982, -3.8262410163879395, -2.5831732749938965, -1.3401050567626953, -0.09703731536865234, 1.1460304260253906, 2.3890981674194336, 3.6321661472320557, 4.875234127044678, 6.118301868438721, 7.361369609832764, 8.604437828063965, 9.847505569458008, 11.09057331085205, 12.333641052246094, 13.576708793640137, 14.81977653503418, 16.06284523010254, 17.305912017822266, 18.548980712890625, 19.792049407958984, 21.03511619567871, 22.27818489074707, 23.521251678466797, 24.764320373535156, 26.007387161254883, 27.250455856323242, 28.49352264404297, 29.736591339111328, 30.979660034179688, 32.22272872924805, 33.465797424316406, 34.7088623046875, 35.95193099975586, 37.19499969482422, 38.43806838989258, 39.68113708496094, 40.92420196533203]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 7.0, 13.0, 10.0, 15.0, 13.0, 6.0, 16.0, 20.0, 28.0, 39.0, 27.0, 29.0, 45.0, 38.0, 54.0, 42.0, 44.0, 58.0, 37.0, 42.0, 56.0, 53.0, 27.0, 39.0, 30.0, 35.0, 24.0, 20.0, 25.0, 17.0, 22.0, 10.0, 10.0, 8.0, 7.0, 8.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4140625, -7.1663818359375, -6.918701171875, -6.6710205078125, -6.42333984375, -6.1756591796875, -5.927978515625, -5.6802978515625, -5.4326171875, -5.1849365234375, -4.937255859375, -4.6895751953125, -4.44189453125, -4.1942138671875, -3.946533203125, -3.6988525390625, -3.451171875, -3.2034912109375, -2.955810546875, -2.7081298828125, -2.46044921875, -2.2127685546875, -1.965087890625, -1.7174072265625, -1.4697265625, -1.2220458984375, -0.974365234375, -0.7266845703125, -0.47900390625, -0.2313232421875, 0.016357421875, 0.2640380859375, 0.51171875, 0.7593994140625, 1.007080078125, 1.2547607421875, 1.50244140625, 1.7501220703125, 1.997802734375, 2.2454833984375, 2.4931640625, 2.7408447265625, 2.988525390625, 3.2362060546875, 3.48388671875, 3.7315673828125, 3.979248046875, 4.2269287109375, 4.474609375, 4.7222900390625, 4.969970703125, 5.2176513671875, 5.46533203125, 5.7130126953125, 5.960693359375, 6.2083740234375, 6.4560546875, 6.7037353515625, 6.951416015625, 7.1990966796875, 7.44677734375, 7.6944580078125, 7.942138671875, 8.1898193359375, 8.4375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 2.0, 5.0, 8.0, 9.0, 8.0, 13.0, 10.0, 12.0, 18.0, 15.0, 36.0, 39.0, 46.0, 36.0, 67.0, 89.0, 127.0, 167.0, 231.0, 444.0, 1025.0, 5582.0, 217258.0, 3927406.0, 37064.0, 2676.0, 731.0, 309.0, 222.0, 155.0, 90.0, 73.0, 65.0, 43.0, 35.0, 27.0, 28.0, 21.0, 18.0, 8.0, 18.0, 9.0, 10.0, 5.0, 11.0, 4.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0], "bins": [-50.96875, -49.34130859375, -47.7138671875, -46.08642578125, -44.458984375, -42.83154296875, -41.2041015625, -39.57666015625, -37.94921875, -36.32177734375, -34.6943359375, -33.06689453125, -31.439453125, -29.81201171875, -28.1845703125, -26.55712890625, -24.9296875, -23.30224609375, -21.6748046875, -20.04736328125, -18.419921875, -16.79248046875, -15.1650390625, -13.53759765625, -11.91015625, -10.28271484375, -8.6552734375, -7.02783203125, -5.400390625, -3.77294921875, -2.1455078125, -0.51806640625, 1.109375, 2.73681640625, 4.3642578125, 5.99169921875, 7.619140625, 9.24658203125, 10.8740234375, 12.50146484375, 14.12890625, 15.75634765625, 17.3837890625, 19.01123046875, 20.638671875, 22.26611328125, 23.8935546875, 25.52099609375, 27.1484375, 28.77587890625, 30.4033203125, 32.03076171875, 33.658203125, 35.28564453125, 36.9130859375, 38.54052734375, 40.16796875, 41.79541015625, 43.4228515625, 45.05029296875, 46.677734375, 48.30517578125, 49.9326171875, 51.56005859375, 53.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 9.0, 10.0, 5.0, 15.0, 23.0, 13.0, 28.0, 57.0, 64.0, 87.0, 143.0, 197.0, 333.0, 608.0, 759.0, 604.0, 394.0, 238.0, 145.0, 96.0, 60.0, 49.0, 33.0, 25.0, 21.0, 10.0, 11.0, 8.0, 6.0, 6.0, 9.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.9627685546875, -10.566162109375, -10.1695556640625, -9.77294921875, -9.3763427734375, -8.979736328125, -8.5831298828125, -8.1865234375, -7.7899169921875, -7.393310546875, -6.9967041015625, -6.60009765625, -6.2034912109375, -5.806884765625, -5.4102783203125, -5.013671875, -4.6170654296875, -4.220458984375, -3.8238525390625, -3.42724609375, -3.0306396484375, -2.634033203125, -2.2374267578125, -1.8408203125, -1.4442138671875, -1.047607421875, -0.6510009765625, -0.25439453125, 0.1422119140625, 0.538818359375, 0.9354248046875, 1.33203125, 1.7286376953125, 2.125244140625, 2.5218505859375, 2.91845703125, 3.3150634765625, 3.711669921875, 4.1082763671875, 4.5048828125, 4.9014892578125, 5.298095703125, 5.6947021484375, 6.09130859375, 6.4879150390625, 6.884521484375, 7.2811279296875, 7.677734375, 8.0743408203125, 8.470947265625, 8.8675537109375, 9.26416015625, 9.6607666015625, 10.057373046875, 10.4539794921875, 10.8505859375, 11.2471923828125, 11.643798828125, 12.0404052734375, 12.43701171875, 12.8336181640625, 13.230224609375, 13.6268310546875, 14.0234375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 3.0, 8.0, 9.0, 10.0, 9.0, 19.0, 28.0, 42.0, 64.0, 89.0, 172.0, 329.0, 616.0, 1438.0, 4085.0, 20614.0, 240609.0, 3654317.0, 244086.0, 20642.0, 4178.0, 1421.0, 633.0, 315.0, 205.0, 120.0, 59.0, 49.0, 31.0, 22.0, 19.0, 10.0, 11.0, 11.0, 9.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.328125, -25.334716796875, -24.34130859375, -23.347900390625, -22.3544921875, -21.361083984375, -20.36767578125, -19.374267578125, -18.380859375, -17.387451171875, -16.39404296875, -15.400634765625, -14.4072265625, -13.413818359375, -12.42041015625, -11.427001953125, -10.43359375, -9.440185546875, -8.44677734375, -7.453369140625, -6.4599609375, -5.466552734375, -4.47314453125, -3.479736328125, -2.486328125, -1.492919921875, -0.49951171875, 0.493896484375, 1.4873046875, 2.480712890625, 3.47412109375, 4.467529296875, 5.4609375, 6.454345703125, 7.44775390625, 8.441162109375, 9.4345703125, 10.427978515625, 11.42138671875, 12.414794921875, 13.408203125, 14.401611328125, 15.39501953125, 16.388427734375, 17.3818359375, 18.375244140625, 19.36865234375, 20.362060546875, 21.35546875, 22.348876953125, 23.34228515625, 24.335693359375, 25.3291015625, 26.322509765625, 27.31591796875, 28.309326171875, 29.302734375, 30.296142578125, 31.28955078125, 32.282958984375, 33.2763671875, 34.269775390625, 35.26318359375, 36.256591796875, 37.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 19.0, 29.0, 58.0, 111.0, 160.0, 173.0, 173.0, 140.0, 71.0, 42.0, 13.0, 13.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-127.17195892333984, -124.71599578857422, -122.2600326538086, -119.80406951904297, -117.34810638427734, -114.89214324951172, -112.4361801147461, -109.98021697998047, -107.52425384521484, -105.06829071044922, -102.6123275756836, -100.15636444091797, -97.70040130615234, -95.24443817138672, -92.7884750366211, -90.33251190185547, -87.87654113769531, -85.42057800292969, -82.96461486816406, -80.50865173339844, -78.05268859863281, -75.59672546386719, -73.14076232910156, -70.68479919433594, -68.22883605957031, -65.77287292480469, -63.31690979003906, -60.86094665527344, -58.40498352050781, -55.94902038574219, -53.49305725097656, -51.03709411621094, -48.581138610839844, -46.12517547607422, -43.669212341308594, -41.21324920654297, -38.757286071777344, -36.30132293701172, -33.845359802246094, -31.389394760131836, -28.933429718017578, -26.477466583251953, -24.021503448486328, -21.565540313720703, -19.109577178955078, -16.653614044189453, -14.197649002075195, -11.74168586730957, -9.285722732543945, -6.82975959777832, -4.373795986175537, -1.917832374572754, 0.5381307601928711, 2.994093894958496, 5.4500579833984375, 7.9060211181640625, 10.361984252929688, 12.817947387695312, 15.273910522460938, 17.729873657226562, 20.185836791992188, 22.641799926757812, 25.09776496887207, 27.553728103637695, 30.00969123840332]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 7.0, 10.0, 12.0, 9.0, 8.0, 11.0, 13.0, 18.0, 24.0, 21.0, 28.0, 22.0, 30.0, 39.0, 30.0, 37.0, 32.0, 37.0, 42.0, 35.0, 42.0, 37.0, 44.0, 48.0, 36.0, 32.0, 34.0, 27.0, 22.0, 34.0, 22.0, 23.0, 17.0, 14.0, 14.0, 12.0, 16.0, 4.0, 9.0, 8.0, 9.0, 2.0, 8.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-30.647640228271484, -29.681854248046875, -28.7160701751709, -27.75028419494629, -26.784500122070312, -25.818714141845703, -24.852928161621094, -23.887144088745117, -22.921358108520508, -21.9555721282959, -20.989788055419922, -20.024002075195312, -19.058218002319336, -18.092432022094727, -17.12664794921875, -16.16086196899414, -15.195076942443848, -14.229291915893555, -13.263506889343262, -12.297721862792969, -11.33193588256836, -10.366150856018066, -9.400365829467773, -8.434579849243164, -7.468795299530029, -6.503010272979736, -5.537224769592285, -4.571439743041992, -3.60565447807312, -2.639869213104248, -1.674084186553955, -0.7082986831665039, 0.25748634338378906, 1.2232716083526611, 2.189056873321533, 3.154841899871826, 4.120627403259277, 5.08641242980957, 6.052197456359863, 7.0179829597473145, 7.983767986297607, 8.949553489685059, 9.915338516235352, 10.881123542785645, 11.846908569335938, 12.812694549560547, 13.778478622436523, 14.744264602661133, 15.710049629211426, 16.67583465576172, 17.641620635986328, 18.607404708862305, 19.573190689086914, 20.53897476196289, 21.5047607421875, 22.47054672241211, 23.436330795288086, 24.402116775512695, 25.367900848388672, 26.33368682861328, 27.299470901489258, 28.265256881713867, 29.231040954589844, 30.196826934814453, 31.162612915039062]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 6.0, 11.0, 16.0, 18.0, 4.0, 26.0, 27.0, 26.0, 33.0, 33.0, 30.0, 38.0, 39.0, 53.0, 47.0, 67.0, 35.0, 43.0, 51.0, 57.0, 37.0, 42.0, 53.0, 38.0, 24.0, 28.0, 22.0, 10.0, 17.0, 9.0, 8.0, 16.0, 8.0, 4.0, 2.0, 3.0, 2.0, 6.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.140625, -6.8807373046875, -6.620849609375, -6.3609619140625, -6.10107421875, -5.8411865234375, -5.581298828125, -5.3214111328125, -5.0615234375, -4.8016357421875, -4.541748046875, -4.2818603515625, -4.02197265625, -3.7620849609375, -3.502197265625, -3.2423095703125, -2.982421875, -2.7225341796875, -2.462646484375, -2.2027587890625, -1.94287109375, -1.6829833984375, -1.423095703125, -1.1632080078125, -0.9033203125, -0.6434326171875, -0.383544921875, -0.1236572265625, 0.13623046875, 0.3961181640625, 0.656005859375, 0.9158935546875, 1.17578125, 1.4356689453125, 1.695556640625, 1.9554443359375, 2.21533203125, 2.4752197265625, 2.735107421875, 2.9949951171875, 3.2548828125, 3.5147705078125, 3.774658203125, 4.0345458984375, 4.29443359375, 4.5543212890625, 4.814208984375, 5.0740966796875, 5.333984375, 5.5938720703125, 5.853759765625, 6.1136474609375, 6.37353515625, 6.6334228515625, 6.893310546875, 7.1531982421875, 7.4130859375, 7.6729736328125, 7.932861328125, 8.1927490234375, 8.45263671875, 8.7125244140625, 8.972412109375, 9.2322998046875, 9.4921875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 13.0, 13.0, 23.0, 28.0, 36.0, 52.0, 57.0, 79.0, 132.0, 165.0, 285.0, 342.0, 536.0, 806.0, 1329.0, 2172.0, 3779.0, 7711.0, 16902.0, 41179.0, 111075.0, 292477.0, 337988.0, 139912.0, 50834.0, 20332.0, 9164.0, 4480.0, 2421.0, 1409.0, 901.0, 570.0, 424.0, 259.0, 182.0, 141.0, 107.0, 68.0, 55.0, 34.0, 20.0, 11.0, 14.0, 7.0, 8.0, 8.0, 1.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9326171875, -1.8704986572265625, -1.808380126953125, -1.7462615966796875, -1.68414306640625, -1.6220245361328125, -1.559906005859375, -1.4977874755859375, -1.4356689453125, -1.3735504150390625, -1.311431884765625, -1.2493133544921875, -1.18719482421875, -1.1250762939453125, -1.062957763671875, -1.0008392333984375, -0.938720703125, -0.8766021728515625, -0.814483642578125, -0.7523651123046875, -0.69024658203125, -0.6281280517578125, -0.566009521484375, -0.5038909912109375, -0.4417724609375, -0.3796539306640625, -0.317535400390625, -0.2554168701171875, -0.19329833984375, -0.1311798095703125, -0.069061279296875, -0.0069427490234375, 0.05517578125, 0.1172943115234375, 0.179412841796875, 0.2415313720703125, 0.30364990234375, 0.3657684326171875, 0.427886962890625, 0.4900054931640625, 0.5521240234375, 0.6142425537109375, 0.676361083984375, 0.7384796142578125, 0.80059814453125, 0.8627166748046875, 0.924835205078125, 0.9869537353515625, 1.049072265625, 1.1111907958984375, 1.173309326171875, 1.2354278564453125, 1.29754638671875, 1.3596649169921875, 1.421783447265625, 1.4839019775390625, 1.5460205078125, 1.6081390380859375, 1.670257568359375, 1.7323760986328125, 1.79449462890625, 1.8566131591796875, 1.918731689453125, 1.9808502197265625, 2.04296875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 8.0, 4.0, 9.0, 7.0, 5.0, 11.0, 12.0, 18.0, 19.0, 20.0, 24.0, 24.0, 24.0, 28.0, 42.0, 42.0, 37.0, 57.0, 40.0, 53.0, 1063.0, 33.0, 48.0, 49.0, 35.0, 41.0, 31.0, 36.0, 28.0, 31.0, 38.0, 24.0, 21.0, 7.0, 13.0, 10.0, 11.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.52734375, -6.349609375, -6.171875, -5.994140625, -5.81640625, -5.638671875, -5.4609375, -5.283203125, -5.10546875, -4.927734375, -4.75, -4.572265625, -4.39453125, -4.216796875, -4.0390625, -3.861328125, -3.68359375, -3.505859375, -3.328125, -3.150390625, -2.97265625, -2.794921875, -2.6171875, -2.439453125, -2.26171875, -2.083984375, -1.90625, -1.728515625, -1.55078125, -1.373046875, -1.1953125, -1.017578125, -0.83984375, -0.662109375, -0.484375, -0.306640625, -0.12890625, 0.048828125, 0.2265625, 0.404296875, 0.58203125, 0.759765625, 0.9375, 1.115234375, 1.29296875, 1.470703125, 1.6484375, 1.826171875, 2.00390625, 2.181640625, 2.359375, 2.537109375, 2.71484375, 2.892578125, 3.0703125, 3.248046875, 3.42578125, 3.603515625, 3.78125, 3.958984375, 4.13671875, 4.314453125, 4.4921875, 4.669921875, 4.84765625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 6.0, 9.0, 14.0, 26.0, 33.0, 43.0, 60.0, 111.0, 139.0, 201.0, 337.0, 507.0, 794.0, 1308.0, 2183.0, 3978.0, 7812.0, 17794.0, 45869.0, 143948.0, 1074606.0, 609233.0, 117449.0, 39312.0, 15341.0, 7004.0, 3581.0, 2066.0, 1199.0, 751.0, 501.0, 277.0, 218.0, 137.0, 94.0, 46.0, 38.0, 34.0, 25.0, 13.0, 5.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.529296875, -1.478179931640625, -1.42706298828125, -1.375946044921875, -1.3248291015625, -1.273712158203125, -1.22259521484375, -1.171478271484375, -1.120361328125, -1.069244384765625, -1.01812744140625, -0.967010498046875, -0.9158935546875, -0.864776611328125, -0.81365966796875, -0.762542724609375, -0.71142578125, -0.660308837890625, -0.60919189453125, -0.558074951171875, -0.5069580078125, -0.455841064453125, -0.40472412109375, -0.353607177734375, -0.302490234375, -0.251373291015625, -0.20025634765625, -0.149139404296875, -0.0980224609375, -0.046905517578125, 0.00421142578125, 0.055328369140625, 0.1064453125, 0.157562255859375, 0.20867919921875, 0.259796142578125, 0.3109130859375, 0.362030029296875, 0.41314697265625, 0.464263916015625, 0.515380859375, 0.566497802734375, 0.61761474609375, 0.668731689453125, 0.7198486328125, 0.770965576171875, 0.82208251953125, 0.873199462890625, 0.92431640625, 0.975433349609375, 1.02655029296875, 1.077667236328125, 1.1287841796875, 1.179901123046875, 1.23101806640625, 1.282135009765625, 1.333251953125, 1.384368896484375, 1.43548583984375, 1.486602783203125, 1.5377197265625, 1.588836669921875, 1.63995361328125, 1.691070556640625, 1.7421875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 4.0, 12.0, 23.0, 88.0, 423.0, 309.0, 75.0, 25.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74267578125, -0.7116012573242188, -0.6805267333984375, -0.6494522094726562, -0.618377685546875, -0.5873031616210938, -0.5562286376953125, -0.5251541137695312, -0.49407958984375, -0.46300506591796875, -0.4319305419921875, -0.40085601806640625, -0.369781494140625, -0.33870697021484375, -0.3076324462890625, -0.27655792236328125, -0.2454833984375, -0.21440887451171875, -0.1833343505859375, -0.15225982666015625, -0.121185302734375, -0.09011077880859375, -0.0590362548828125, -0.02796173095703125, 0.00311279296875, 0.03418731689453125, 0.0652618408203125, 0.09633636474609375, 0.127410888671875, 0.15848541259765625, 0.1895599365234375, 0.22063446044921875, 0.251708984375, 0.28278350830078125, 0.3138580322265625, 0.34493255615234375, 0.376007080078125, 0.40708160400390625, 0.4381561279296875, 0.46923065185546875, 0.50030517578125, 0.5313796997070312, 0.5624542236328125, 0.5935287475585938, 0.624603271484375, 0.6556777954101562, 0.6867523193359375, 0.7178268432617188, 0.7489013671875, 0.7799758911132812, 0.8110504150390625, 0.8421249389648438, 0.873199462890625, 0.9042739868164062, 0.9353485107421875, 0.9664230346679688, 0.99749755859375, 1.0285720825195312, 1.0596466064453125, 1.0907211303710938, 1.121795654296875, 1.1528701782226562, 1.1839447021484375, 1.2150192260742188, 1.24609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 1.0, 4.0, 1.0, 6.0, 11.0, 10.0, 14.0, 43.0, 84.0, 420.0, 7333.0, 1036801.0, 3373.0, 299.0, 71.0, 24.0, 13.0, 7.0, 5.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.125, -22.5523681640625, -21.979736328125, -21.4071044921875, -20.83447265625, -20.2618408203125, -19.689208984375, -19.1165771484375, -18.5439453125, -17.9713134765625, -17.398681640625, -16.8260498046875, -16.25341796875, -15.6807861328125, -15.108154296875, -14.5355224609375, -13.962890625, -13.3902587890625, -12.817626953125, -12.2449951171875, -11.67236328125, -11.0997314453125, -10.527099609375, -9.9544677734375, -9.3818359375, -8.8092041015625, -8.236572265625, -7.6639404296875, -7.09130859375, -6.5186767578125, -5.946044921875, -5.3734130859375, -4.80078125, -4.2281494140625, -3.655517578125, -3.0828857421875, -2.51025390625, -1.9376220703125, -1.364990234375, -0.7923583984375, -0.2197265625, 0.3529052734375, 0.925537109375, 1.4981689453125, 2.07080078125, 2.6434326171875, 3.216064453125, 3.7886962890625, 4.361328125, 4.9339599609375, 5.506591796875, 6.0792236328125, 6.65185546875, 7.2244873046875, 7.797119140625, 8.3697509765625, 8.9423828125, 9.5150146484375, 10.087646484375, 10.6602783203125, 11.23291015625, 11.8055419921875, 12.378173828125, 12.9508056640625, 13.5234375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 19.0, 45.0, 119.0, 325.0, 311.0, 128.0, 40.0, 15.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9082821607589722, -1.8553962707519531, -1.802510380744934, -1.749624490737915, -1.6967384815216064, -1.6438525915145874, -1.5909667015075684, -1.5380808115005493, -1.4851949214935303, -1.4323090314865112, -1.3794231414794922, -1.3265371322631836, -1.2736512422561646, -1.2207653522491455, -1.1678794622421265, -1.1149935722351074, -1.0621075630187988, -1.0092216730117798, -0.956335723400116, -0.9034498333930969, -0.8505638837814331, -0.7976779937744141, -0.744792103767395, -0.691906213760376, -0.6390202641487122, -0.5861343741416931, -0.5332484245300293, -0.48036253452301025, -0.4274766147136688, -0.3745906949043274, -0.32170480489730835, -0.2688188850879669, -0.21593284606933594, -0.1630469262599945, -0.11016102135181427, -0.05727511644363403, -0.0043891966342926025, 0.04849672317504883, 0.10138261318206787, 0.1542685329914093, 0.20715445280075073, 0.26004037261009216, 0.3129262924194336, 0.36581218242645264, 0.41869810223579407, 0.4715840220451355, 0.5244699120521545, 0.5773558616638184, 0.6302417516708374, 0.6831276416778564, 0.7360135912895203, 0.7888994812965393, 0.8417854309082031, 0.8946713209152222, 0.9475572109222412, 1.0004431009292603, 1.0533289909362793, 1.1062148809432983, 1.1591007709503174, 1.211986780166626, 1.264872670173645, 1.317758560180664, 1.370644450187683, 1.4235303401947021, 1.4764163494110107]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 7.0, 3.0, 5.0, 7.0, 14.0, 11.0, 9.0, 18.0, 14.0, 17.0, 15.0, 28.0, 28.0, 22.0, 28.0, 29.0, 36.0, 36.0, 38.0, 42.0, 32.0, 36.0, 48.0, 31.0, 36.0, 24.0, 31.0, 28.0, 38.0, 29.0, 25.0, 22.0, 27.0, 21.0, 27.0, 16.0, 15.0, 15.0, 9.0, 13.0, 13.0, 9.0, 5.0, 5.0, 4.0, 5.0, 4.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.2979714274406433, -0.28837889432907104, -0.2787863612174988, -0.2691938281059265, -0.25960129499435425, -0.250008761882782, -0.24041621387004852, -0.23082368075847626, -0.221231147646904, -0.21163861453533173, -0.20204608142375946, -0.1924535483121872, -0.18286100029945374, -0.17326846718788147, -0.1636759340763092, -0.15408340096473694, -0.14449086785316467, -0.1348983347415924, -0.12530580163002014, -0.11571326106786728, -0.10612072795629501, -0.09652819484472275, -0.08693565428256989, -0.07734312117099762, -0.06775058805942535, -0.05815805494785309, -0.048565518110990524, -0.03897298127412796, -0.029380448162555695, -0.01978791505098343, -0.010195378214120865, -0.0006028413772583008, 0.008989691734313965, 0.01858222670853138, 0.028174761682748795, 0.03776729851961136, 0.047359831631183624, 0.05695236474275589, 0.06654490530490875, 0.07613743841648102, 0.08572997152805328, 0.09532250463962555, 0.10491503775119781, 0.11450757831335068, 0.12410011142492294, 0.1336926519870758, 0.14328518509864807, 0.15287771821022034, 0.1624702513217926, 0.17206278443336487, 0.18165531754493713, 0.1912478506565094, 0.20084038376808167, 0.21043291687965393, 0.2200254648923874, 0.22961799800395966, 0.23921053111553192, 0.2488030642271042, 0.25839561223983765, 0.2679881453514099, 0.2775806784629822, 0.28717321157455444, 0.2967657446861267, 0.306358277797699, 0.31595081090927124]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 7.0, 10.0, 1.0, 8.0, 6.0, 7.0, 19.0, 14.0, 21.0, 16.0, 16.0, 29.0, 29.0, 29.0, 37.0, 32.0, 33.0, 46.0, 47.0, 35.0, 57.0, 37.0, 41.0, 53.0, 46.0, 44.0, 30.0, 37.0, 39.0, 26.0, 15.0, 31.0, 16.0, 15.0, 8.0, 9.0, 8.0, 9.0, 7.0, 9.0, 5.0, 3.0, 5.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.13671875, -6.90692138671875, -6.6771240234375, -6.44732666015625, -6.217529296875, -5.98773193359375, -5.7579345703125, -5.52813720703125, -5.29833984375, -5.06854248046875, -4.8387451171875, -4.60894775390625, -4.379150390625, -4.14935302734375, -3.9195556640625, -3.68975830078125, -3.4599609375, -3.23016357421875, -3.0003662109375, -2.77056884765625, -2.540771484375, -2.31097412109375, -2.0811767578125, -1.85137939453125, -1.62158203125, -1.39178466796875, -1.1619873046875, -0.93218994140625, -0.702392578125, -0.47259521484375, -0.2427978515625, -0.01300048828125, 0.216796875, 0.44659423828125, 0.6763916015625, 0.90618896484375, 1.135986328125, 1.36578369140625, 1.5955810546875, 1.82537841796875, 2.05517578125, 2.28497314453125, 2.5147705078125, 2.74456787109375, 2.974365234375, 3.20416259765625, 3.4339599609375, 3.66375732421875, 3.8935546875, 4.12335205078125, 4.3531494140625, 4.58294677734375, 4.812744140625, 5.04254150390625, 5.2723388671875, 5.50213623046875, 5.73193359375, 5.96173095703125, 6.1915283203125, 6.42132568359375, 6.651123046875, 6.88092041015625, 7.1107177734375, 7.34051513671875, 7.5703125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 8.0, 11.0, 19.0, 17.0, 26.0, 30.0, 41.0, 52.0, 96.0, 102.0, 168.0, 278.0, 445.0, 724.0, 1356.0, 2749.0, 5697.0, 12637.0, 29003.0, 69201.0, 165482.0, 325345.0, 248244.0, 106743.0, 44413.0, 18820.0, 8457.0, 3865.0, 1930.0, 1017.0, 528.0, 332.0, 206.0, 126.0, 99.0, 67.0, 53.0, 34.0, 42.0, 15.0, 26.0, 12.0, 12.0, 4.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.921875, -8.6219482421875, -8.322021484375, -8.0220947265625, -7.72216796875, -7.4222412109375, -7.122314453125, -6.8223876953125, -6.5224609375, -6.2225341796875, -5.922607421875, -5.6226806640625, -5.32275390625, -5.0228271484375, -4.722900390625, -4.4229736328125, -4.123046875, -3.8231201171875, -3.523193359375, -3.2232666015625, -2.92333984375, -2.6234130859375, -2.323486328125, -2.0235595703125, -1.7236328125, -1.4237060546875, -1.123779296875, -0.8238525390625, -0.52392578125, -0.2239990234375, 0.075927734375, 0.3758544921875, 0.67578125, 0.9757080078125, 1.275634765625, 1.5755615234375, 1.87548828125, 2.1754150390625, 2.475341796875, 2.7752685546875, 3.0751953125, 3.3751220703125, 3.675048828125, 3.9749755859375, 4.27490234375, 4.5748291015625, 4.874755859375, 5.1746826171875, 5.474609375, 5.7745361328125, 6.074462890625, 6.3743896484375, 6.67431640625, 6.9742431640625, 7.274169921875, 7.5740966796875, 7.8740234375, 8.1739501953125, 8.473876953125, 8.7738037109375, 9.07373046875, 9.3736572265625, 9.673583984375, 9.9735107421875, 10.2734375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 10.0, 8.0, 9.0, 15.0, 24.0, 24.0, 39.0, 35.0, 48.0, 61.0, 92.0, 129.0, 212.0, 1397.0, 284.0, 185.0, 125.0, 77.0, 59.0, 55.0, 46.0, 25.0, 19.0, 9.0, 12.0, 10.0, 10.0, 7.0, 4.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-24.484375, -23.7138671875, -22.943359375, -22.1728515625, -21.40234375, -20.6318359375, -19.861328125, -19.0908203125, -18.3203125, -17.5498046875, -16.779296875, -16.0087890625, -15.23828125, -14.4677734375, -13.697265625, -12.9267578125, -12.15625, -11.3857421875, -10.615234375, -9.8447265625, -9.07421875, -8.3037109375, -7.533203125, -6.7626953125, -5.9921875, -5.2216796875, -4.451171875, -3.6806640625, -2.91015625, -2.1396484375, -1.369140625, -0.5986328125, 0.171875, 0.9423828125, 1.712890625, 2.4833984375, 3.25390625, 4.0244140625, 4.794921875, 5.5654296875, 6.3359375, 7.1064453125, 7.876953125, 8.6474609375, 9.41796875, 10.1884765625, 10.958984375, 11.7294921875, 12.5, 13.2705078125, 14.041015625, 14.8115234375, 15.58203125, 16.3525390625, 17.123046875, 17.8935546875, 18.6640625, 19.4345703125, 20.205078125, 20.9755859375, 21.74609375, 22.5166015625, 23.287109375, 24.0576171875, 24.828125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 11.0, 4.0, 13.0, 16.0, 19.0, 34.0, 39.0, 69.0, 90.0, 140.0, 208.0, 320.0, 643.0, 1724.0, 16363.0, 3101583.0, 20993.0, 1765.0, 690.0, 333.0, 205.0, 141.0, 89.0, 52.0, 43.0, 34.0, 25.0, 17.0, 13.0, 13.0, 7.0, 3.0, 0.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-82.0, -79.5537109375, -77.107421875, -74.6611328125, -72.21484375, -69.7685546875, -67.322265625, -64.8759765625, -62.4296875, -59.9833984375, -57.537109375, -55.0908203125, -52.64453125, -50.1982421875, -47.751953125, -45.3056640625, -42.859375, -40.4130859375, -37.966796875, -35.5205078125, -33.07421875, -30.6279296875, -28.181640625, -25.7353515625, -23.2890625, -20.8427734375, -18.396484375, -15.9501953125, -13.50390625, -11.0576171875, -8.611328125, -6.1650390625, -3.71875, -1.2724609375, 1.173828125, 3.6201171875, 6.06640625, 8.5126953125, 10.958984375, 13.4052734375, 15.8515625, 18.2978515625, 20.744140625, 23.1904296875, 25.63671875, 28.0830078125, 30.529296875, 32.9755859375, 35.421875, 37.8681640625, 40.314453125, 42.7607421875, 45.20703125, 47.6533203125, 50.099609375, 52.5458984375, 54.9921875, 57.4384765625, 59.884765625, 62.3310546875, 64.77734375, 67.2236328125, 69.669921875, 72.1162109375, 74.5625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 10.0, 27.0, 74.0, 184.0, 338.0, 247.0, 93.0, 24.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.49199676513672, -103.90157318115234, -98.31114196777344, -92.72071838378906, -87.13028717041016, -81.53986358642578, -75.94943237304688, -70.3590087890625, -64.76858520507812, -59.178157806396484, -53.587730407714844, -47.99730682373047, -42.40687561035156, -36.81645202636719, -31.226024627685547, -25.635597229003906, -20.045166015625, -14.45473861694336, -8.864312171936035, -3.273885726928711, 2.3165416717529297, 7.90696907043457, 13.497394561767578, 19.08782196044922, 24.67824935913086, 30.2686767578125, 35.85910415649414, 41.44953155517578, 47.039955139160156, 52.63038635253906, 58.22080993652344, 63.81123733520508, 69.40165710449219, 74.99208068847656, 80.58251190185547, 86.17293548583984, 91.76336669921875, 97.35379028320312, 102.9442138671875, 108.5346450805664, 114.12507629394531, 119.71549987792969, 125.3059310913086, 130.8963623046875, 136.48678588867188, 142.07720947265625, 147.66763305664062, 153.258056640625, 158.84848022460938, 164.43890380859375, 170.02932739257812, 175.61976623535156, 181.21018981933594, 186.8006134033203, 192.3910369873047, 197.98147583007812, 203.5718994140625, 209.16232299804688, 214.75274658203125, 220.3431854248047, 225.93360900878906, 231.52403259277344, 237.1144561767578, 242.70489501953125, 248.29531860351562]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 5.0, 12.0, 9.0, 8.0, 12.0, 19.0, 17.0, 21.0, 21.0, 25.0, 33.0, 16.0, 28.0, 25.0, 38.0, 37.0, 32.0, 36.0, 32.0, 39.0, 41.0, 37.0, 41.0, 42.0, 37.0, 36.0, 29.0, 33.0, 29.0, 29.0, 17.0, 24.0, 21.0, 14.0, 16.0, 16.0, 12.0, 8.0, 8.0, 8.0, 8.0, 4.0, 3.0, 0.0, 4.0, 1.0, 4.0, 2.0, 3.0], "bins": [-60.11222839355469, -58.45820236206055, -56.804176330566406, -55.150150299072266, -53.496124267578125, -51.84209442138672, -50.18806838989258, -48.53404235839844, -46.8800163269043, -45.225990295410156, -43.571964263916016, -41.917938232421875, -40.26390838623047, -38.609886169433594, -36.95585632324219, -35.30183029174805, -33.647804260253906, -31.993778228759766, -30.339752197265625, -28.68572425842285, -27.03169822692871, -25.37767219543457, -23.723644256591797, -22.069618225097656, -20.415592193603516, -18.761566162109375, -17.107540130615234, -15.453512191772461, -13.79948616027832, -12.14546012878418, -10.491433143615723, -8.837406158447266, -7.183376312255859, -5.5293498039245605, -3.8753232955932617, -2.221296787261963, -0.5672702789306641, 1.0867557525634766, 2.7407827377319336, 4.394809722900391, 6.048835754394531, 7.70286226272583, 9.356888771057129, 11.010915756225586, 12.664941787719727, 14.318967819213867, 15.972994804382324, 17.62702178955078, 19.281047821044922, 20.935073852539062, 22.589099884033203, 24.243127822875977, 25.897153854370117, 27.551179885864258, 29.20520782470703, 30.859233856201172, 32.51325988769531, 34.16728591918945, 35.821311950683594, 37.475337982177734, 39.129364013671875, 40.78339385986328, 42.43741989135742, 44.09144592285156, 45.7454719543457]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 5.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 6.0, 6.0, 7.0, 6.0, 13.0, 8.0, 12.0, 13.0, 19.0, 22.0, 19.0, 22.0, 37.0, 32.0, 38.0, 34.0, 38.0, 43.0, 45.0, 41.0, 36.0, 37.0, 34.0, 49.0, 40.0, 33.0, 35.0, 37.0, 26.0, 32.0, 20.0, 21.0, 30.0, 10.0, 11.0, 20.0, 8.0, 11.0, 10.0, 8.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0], "bins": [-7.26953125, -7.05224609375, -6.8349609375, -6.61767578125, -6.400390625, -6.18310546875, -5.9658203125, -5.74853515625, -5.53125, -5.31396484375, -5.0966796875, -4.87939453125, -4.662109375, -4.44482421875, -4.2275390625, -4.01025390625, -3.79296875, -3.57568359375, -3.3583984375, -3.14111328125, -2.923828125, -2.70654296875, -2.4892578125, -2.27197265625, -2.0546875, -1.83740234375, -1.6201171875, -1.40283203125, -1.185546875, -0.96826171875, -0.7509765625, -0.53369140625, -0.31640625, -0.09912109375, 0.1181640625, 0.33544921875, 0.552734375, 0.77001953125, 0.9873046875, 1.20458984375, 1.421875, 1.63916015625, 1.8564453125, 2.07373046875, 2.291015625, 2.50830078125, 2.7255859375, 2.94287109375, 3.16015625, 3.37744140625, 3.5947265625, 3.81201171875, 4.029296875, 4.24658203125, 4.4638671875, 4.68115234375, 4.8984375, 5.11572265625, 5.3330078125, 5.55029296875, 5.767578125, 5.98486328125, 6.2021484375, 6.41943359375, 6.63671875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 7.0, 23.0, 19.0, 42.0, 94.0, 165.0, 340.0, 750.0, 1980.0, 6817.0, 49741.0, 2712747.0, 1381576.0, 31642.0, 5281.0, 1746.0, 656.0, 302.0, 149.0, 84.0, 37.0, 28.0, 18.0, 11.0, 10.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.15625, -38.00146484375, -36.8466796875, -35.69189453125, -34.537109375, -33.38232421875, -32.2275390625, -31.07275390625, -29.91796875, -28.76318359375, -27.6083984375, -26.45361328125, -25.298828125, -24.14404296875, -22.9892578125, -21.83447265625, -20.6796875, -19.52490234375, -18.3701171875, -17.21533203125, -16.060546875, -14.90576171875, -13.7509765625, -12.59619140625, -11.44140625, -10.28662109375, -9.1318359375, -7.97705078125, -6.822265625, -5.66748046875, -4.5126953125, -3.35791015625, -2.203125, -1.04833984375, 0.1064453125, 1.26123046875, 2.416015625, 3.57080078125, 4.7255859375, 5.88037109375, 7.03515625, 8.18994140625, 9.3447265625, 10.49951171875, 11.654296875, 12.80908203125, 13.9638671875, 15.11865234375, 16.2734375, 17.42822265625, 18.5830078125, 19.73779296875, 20.892578125, 22.04736328125, 23.2021484375, 24.35693359375, 25.51171875, 26.66650390625, 27.8212890625, 28.97607421875, 30.130859375, 31.28564453125, 32.4404296875, 33.59521484375, 34.75]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 8.0, 4.0, 8.0, 9.0, 15.0, 25.0, 25.0, 32.0, 47.0, 54.0, 84.0, 115.0, 145.0, 211.0, 288.0, 388.0, 518.0, 527.0, 424.0, 287.0, 223.0, 140.0, 134.0, 79.0, 72.0, 53.0, 37.0, 32.0, 25.0, 13.0, 12.0, 12.0, 9.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.37744140625, -10.9970703125, -10.61669921875, -10.236328125, -9.85595703125, -9.4755859375, -9.09521484375, -8.71484375, -8.33447265625, -7.9541015625, -7.57373046875, -7.193359375, -6.81298828125, -6.4326171875, -6.05224609375, -5.671875, -5.29150390625, -4.9111328125, -4.53076171875, -4.150390625, -3.77001953125, -3.3896484375, -3.00927734375, -2.62890625, -2.24853515625, -1.8681640625, -1.48779296875, -1.107421875, -0.72705078125, -0.3466796875, 0.03369140625, 0.4140625, 0.79443359375, 1.1748046875, 1.55517578125, 1.935546875, 2.31591796875, 2.6962890625, 3.07666015625, 3.45703125, 3.83740234375, 4.2177734375, 4.59814453125, 4.978515625, 5.35888671875, 5.7392578125, 6.11962890625, 6.5, 6.88037109375, 7.2607421875, 7.64111328125, 8.021484375, 8.40185546875, 8.7822265625, 9.16259765625, 9.54296875, 9.92333984375, 10.3037109375, 10.68408203125, 11.064453125, 11.44482421875, 11.8251953125, 12.20556640625, 12.5859375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 12.0, 17.0, 30.0, 30.0, 57.0, 70.0, 152.0, 218.0, 296.0, 493.0, 793.0, 1349.0, 2648.0, 6444.0, 25066.0, 186356.0, 2621848.0, 1225325.0, 97167.0, 16097.0, 4799.0, 2036.0, 1126.0, 640.0, 399.0, 284.0, 171.0, 94.0, 75.0, 57.0, 35.0, 26.0, 22.0, 14.0, 8.0, 3.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.890625, -20.19091796875, -19.4912109375, -18.79150390625, -18.091796875, -17.39208984375, -16.6923828125, -15.99267578125, -15.29296875, -14.59326171875, -13.8935546875, -13.19384765625, -12.494140625, -11.79443359375, -11.0947265625, -10.39501953125, -9.6953125, -8.99560546875, -8.2958984375, -7.59619140625, -6.896484375, -6.19677734375, -5.4970703125, -4.79736328125, -4.09765625, -3.39794921875, -2.6982421875, -1.99853515625, -1.298828125, -0.59912109375, 0.1005859375, 0.80029296875, 1.5, 2.19970703125, 2.8994140625, 3.59912109375, 4.298828125, 4.99853515625, 5.6982421875, 6.39794921875, 7.09765625, 7.79736328125, 8.4970703125, 9.19677734375, 9.896484375, 10.59619140625, 11.2958984375, 11.99560546875, 12.6953125, 13.39501953125, 14.0947265625, 14.79443359375, 15.494140625, 16.19384765625, 16.8935546875, 17.59326171875, 18.29296875, 18.99267578125, 19.6923828125, 20.39208984375, 21.091796875, 21.79150390625, 22.4912109375, 23.19091796875, 23.890625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 46.0, 168.0, 358.0, 307.0, 103.0, 16.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.52845764160156, -113.49405670166016, -107.45966339111328, -101.42526245117188, -95.390869140625, -89.3564682006836, -83.32206726074219, -77.28767395019531, -71.2532730102539, -65.2188720703125, -59.184478759765625, -53.15007781982422, -47.11568069458008, -41.08128356933594, -35.04688262939453, -29.01248550415039, -22.97808837890625, -16.94369125366211, -10.909292221069336, -4.8748931884765625, 1.1595039367675781, 7.193901062011719, 13.228302001953125, 19.262699127197266, 25.297096252441406, 31.331493377685547, 37.36589050292969, 43.400291442871094, 49.434688568115234, 55.469085693359375, 61.50348663330078, 67.53788757324219, 73.57229614257812, 79.60669708251953, 85.6410903930664, 91.67549133300781, 97.70988464355469, 103.7442855834961, 109.7786865234375, 115.81307983398438, 121.84748077392578, 127.88188171386719, 133.91627502441406, 139.95068359375, 145.98507690429688, 152.01947021484375, 158.05386352539062, 164.08827209472656, 170.12266540527344, 176.1570587158203, 182.19146728515625, 188.22586059570312, 194.26025390625, 200.29464721679688, 206.3290557861328, 212.3634490966797, 218.39785766601562, 224.4322509765625, 230.46665954589844, 236.5010528564453, 242.5354461669922, 248.56985473632812, 254.604248046875, 260.6386413574219, 266.67303466796875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 5.0, 7.0, 9.0, 11.0, 9.0, 17.0, 17.0, 25.0, 24.0, 28.0, 26.0, 30.0, 36.0, 33.0, 39.0, 42.0, 47.0, 46.0, 56.0, 50.0, 37.0, 32.0, 44.0, 47.0, 24.0, 40.0, 28.0, 26.0, 25.0, 27.0, 20.0, 17.0, 13.0, 8.0, 11.0, 13.0, 9.0, 5.0, 3.0, 1.0, 7.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.992488861083984, -51.53632736206055, -50.080169677734375, -48.62400817871094, -47.1678466796875, -45.71168518066406, -44.25552749633789, -42.79936599731445, -41.34320831298828, -39.887046813964844, -38.43088912963867, -36.974727630615234, -35.5185661315918, -34.062408447265625, -32.60624694824219, -31.15008544921875, -29.693923950195312, -28.237764358520508, -26.78160285949707, -25.325443267822266, -23.869281768798828, -22.413122177124023, -20.95696258544922, -19.50080108642578, -18.044641494750977, -16.588481903076172, -15.132320404052734, -13.67616081237793, -12.220000267028809, -10.763839721679688, -9.307680130004883, -7.851519584655762, -6.395362854003906, -4.939202308654785, -3.4830422401428223, -2.0268821716308594, -0.5707216262817383, 0.8854389190673828, 2.3415985107421875, 3.7977590560913086, 5.25391960144043, 6.710080146789551, 8.166240692138672, 9.622400283813477, 11.078560829162598, 12.534721374511719, 13.990880966186523, 15.447041511535645, 16.903202056884766, 18.35936164855957, 19.815523147583008, 21.271682739257812, 22.72784423828125, 24.184003829956055, 25.64016342163086, 27.096324920654297, 28.5524845123291, 30.008644104003906, 31.464805603027344, 32.92096710205078, 34.37712478637695, 35.83328628540039, 37.28944396972656, 38.74560546875, 40.20176696777344]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 10.0, 8.0, 11.0, 11.0, 14.0, 18.0, 16.0, 18.0, 39.0, 23.0, 26.0, 35.0, 33.0, 43.0, 34.0, 43.0, 40.0, 39.0, 39.0, 46.0, 45.0, 45.0, 42.0, 24.0, 32.0, 25.0, 36.0, 32.0, 29.0, 30.0, 18.0, 9.0, 9.0, 15.0, 10.0, 8.0, 11.0, 3.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3671875, -6.16961669921875, -5.9720458984375, -5.77447509765625, -5.576904296875, -5.37933349609375, -5.1817626953125, -4.98419189453125, -4.78662109375, -4.58905029296875, -4.3914794921875, -4.19390869140625, -3.996337890625, -3.79876708984375, -3.6011962890625, -3.40362548828125, -3.2060546875, -3.00848388671875, -2.8109130859375, -2.61334228515625, -2.415771484375, -2.21820068359375, -2.0206298828125, -1.82305908203125, -1.62548828125, -1.42791748046875, -1.2303466796875, -1.03277587890625, -0.835205078125, -0.63763427734375, -0.4400634765625, -0.24249267578125, -0.044921875, 0.15264892578125, 0.3502197265625, 0.54779052734375, 0.745361328125, 0.94293212890625, 1.1405029296875, 1.33807373046875, 1.53564453125, 1.73321533203125, 1.9307861328125, 2.12835693359375, 2.325927734375, 2.52349853515625, 2.7210693359375, 2.91864013671875, 3.1162109375, 3.31378173828125, 3.5113525390625, 3.70892333984375, 3.906494140625, 4.10406494140625, 4.3016357421875, 4.49920654296875, 4.69677734375, 4.89434814453125, 5.0919189453125, 5.28948974609375, 5.487060546875, 5.68463134765625, 5.8822021484375, 6.07977294921875, 6.27734375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 4.0, 6.0, 6.0, 9.0, 16.0, 25.0, 34.0, 67.0, 98.0, 161.0, 230.0, 384.0, 611.0, 1034.0, 1678.0, 2696.0, 4568.0, 7986.0, 13672.0, 23964.0, 42787.0, 77219.0, 138741.0, 215579.0, 211537.0, 134235.0, 74769.0, 41367.0, 23106.0, 12997.0, 7557.0, 4493.0, 2689.0, 1547.0, 969.0, 673.0, 377.0, 242.0, 149.0, 91.0, 52.0, 43.0, 40.0, 9.0, 15.0, 9.0, 4.0, 1.0, 7.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.9951171875, -0.964935302734375, -0.93475341796875, -0.904571533203125, -0.8743896484375, -0.844207763671875, -0.81402587890625, -0.783843994140625, -0.753662109375, -0.723480224609375, -0.69329833984375, -0.663116455078125, -0.6329345703125, -0.602752685546875, -0.57257080078125, -0.542388916015625, -0.51220703125, -0.482025146484375, -0.45184326171875, -0.421661376953125, -0.3914794921875, -0.361297607421875, -0.33111572265625, -0.300933837890625, -0.270751953125, -0.240570068359375, -0.21038818359375, -0.180206298828125, -0.1500244140625, -0.119842529296875, -0.08966064453125, -0.059478759765625, -0.029296875, 0.000885009765625, 0.03106689453125, 0.061248779296875, 0.0914306640625, 0.121612548828125, 0.15179443359375, 0.181976318359375, 0.212158203125, 0.242340087890625, 0.27252197265625, 0.302703857421875, 0.3328857421875, 0.363067626953125, 0.39324951171875, 0.423431396484375, 0.45361328125, 0.483795166015625, 0.51397705078125, 0.544158935546875, 0.5743408203125, 0.604522705078125, 0.63470458984375, 0.664886474609375, 0.695068359375, 0.725250244140625, 0.75543212890625, 0.785614013671875, 0.8157958984375, 0.845977783203125, 0.87615966796875, 0.906341552734375, 0.9365234375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 10.0, 2.0, 7.0, 12.0, 11.0, 13.0, 20.0, 21.0, 15.0, 26.0, 34.0, 31.0, 32.0, 40.0, 36.0, 28.0, 32.0, 38.0, 36.0, 1072.0, 45.0, 48.0, 29.0, 32.0, 36.0, 28.0, 33.0, 32.0, 32.0, 23.0, 27.0, 31.0, 20.0, 12.0, 9.0, 13.0, 12.0, 8.0, 4.0, 7.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.23046875, -4.10003662109375, -3.9696044921875, -3.83917236328125, -3.708740234375, -3.57830810546875, -3.4478759765625, -3.31744384765625, -3.18701171875, -3.05657958984375, -2.9261474609375, -2.79571533203125, -2.665283203125, -2.53485107421875, -2.4044189453125, -2.27398681640625, -2.1435546875, -2.01312255859375, -1.8826904296875, -1.75225830078125, -1.621826171875, -1.49139404296875, -1.3609619140625, -1.23052978515625, -1.10009765625, -0.96966552734375, -0.8392333984375, -0.70880126953125, -0.578369140625, -0.44793701171875, -0.3175048828125, -0.18707275390625, -0.056640625, 0.07379150390625, 0.2042236328125, 0.33465576171875, 0.465087890625, 0.59552001953125, 0.7259521484375, 0.85638427734375, 0.98681640625, 1.11724853515625, 1.2476806640625, 1.37811279296875, 1.508544921875, 1.63897705078125, 1.7694091796875, 1.89984130859375, 2.0302734375, 2.16070556640625, 2.2911376953125, 2.42156982421875, 2.552001953125, 2.68243408203125, 2.8128662109375, 2.94329833984375, 3.07373046875, 3.20416259765625, 3.3345947265625, 3.46502685546875, 3.595458984375, 3.72589111328125, 3.8563232421875, 3.98675537109375, 4.1171875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 10.0, 10.0, 29.0, 27.0, 36.0, 65.0, 104.0, 173.0, 282.0, 498.0, 975.0, 1768.0, 3718.0, 7553.0, 16540.0, 37688.0, 88014.0, 229122.0, 1201425.0, 314063.0, 110076.0, 46416.0, 20151.0, 9354.0, 4383.0, 2161.0, 1069.0, 610.0, 347.0, 168.0, 106.0, 65.0, 41.0, 27.0, 20.0, 13.0, 11.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.828125, -0.7991943359375, -0.770263671875, -0.7413330078125, -0.71240234375, -0.6834716796875, -0.654541015625, -0.6256103515625, -0.5966796875, -0.5677490234375, -0.538818359375, -0.5098876953125, -0.48095703125, -0.4520263671875, -0.423095703125, -0.3941650390625, -0.365234375, -0.3363037109375, -0.307373046875, -0.2784423828125, -0.24951171875, -0.2205810546875, -0.191650390625, -0.1627197265625, -0.1337890625, -0.1048583984375, -0.075927734375, -0.0469970703125, -0.01806640625, 0.0108642578125, 0.039794921875, 0.0687255859375, 0.09765625, 0.1265869140625, 0.155517578125, 0.1844482421875, 0.21337890625, 0.2423095703125, 0.271240234375, 0.3001708984375, 0.3291015625, 0.3580322265625, 0.386962890625, 0.4158935546875, 0.44482421875, 0.4737548828125, 0.502685546875, 0.5316162109375, 0.560546875, 0.5894775390625, 0.618408203125, 0.6473388671875, 0.67626953125, 0.7052001953125, 0.734130859375, 0.7630615234375, 0.7919921875, 0.8209228515625, 0.849853515625, 0.8787841796875, 0.90771484375, 0.9366455078125, 0.965576171875, 0.9945068359375, 1.0234375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 3.0, 5.0, 3.0, 3.0, 11.0, 5.0, 9.0, 23.0, 11.0, 10.0, 30.0, 38.0, 64.0, 99.0, 176.0, 183.0, 105.0, 72.0, 33.0, 15.0, 10.0, 17.0, 10.0, 11.0, 7.0, 8.0, 6.0, 3.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2081298828125, -0.20067787170410156, -0.19322586059570312, -0.1857738494873047, -0.17832183837890625, -0.1708698272705078, -0.16341781616210938, -0.15596580505371094, -0.1485137939453125, -0.14106178283691406, -0.13360977172851562, -0.1261577606201172, -0.11870574951171875, -0.11125373840332031, -0.10380172729492188, -0.09634971618652344, -0.088897705078125, -0.08144569396972656, -0.07399368286132812, -0.06654167175292969, -0.05908966064453125, -0.05163764953613281, -0.044185638427734375, -0.03673362731933594, -0.0292816162109375, -0.021829605102539062, -0.014377593994140625, -0.0069255828857421875, 0.00052642822265625, 0.007978439331054688, 0.015430450439453125, 0.022882461547851562, 0.03033447265625, 0.03778648376464844, 0.045238494873046875, 0.05269050598144531, 0.06014251708984375, 0.06759452819824219, 0.07504653930664062, 0.08249855041503906, 0.0899505615234375, 0.09740257263183594, 0.10485458374023438, 0.11230659484863281, 0.11975860595703125, 0.1272106170654297, 0.13466262817382812, 0.14211463928222656, 0.149566650390625, 0.15701866149902344, 0.16447067260742188, 0.1719226837158203, 0.17937469482421875, 0.1868267059326172, 0.19427871704101562, 0.20173072814941406, 0.2091827392578125, 0.21663475036621094, 0.22408676147460938, 0.2315387725830078, 0.23899078369140625, 0.2464427947998047, 0.2538948059082031, 0.26134681701660156, 0.268798828125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 1.0, 8.0, 3.0, 4.0, 4.0, 10.0, 10.0, 14.0, 38.0, 34.0, 54.0, 83.0, 150.0, 356.0, 1603.0, 1007132.0, 37620.0, 724.0, 270.0, 132.0, 70.0, 71.0, 37.0, 32.0, 13.0, 10.0, 10.0, 9.0, 5.0, 7.0, 5.0, 7.0, 6.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0], "bins": [-5.8046875, -5.64697265625, -5.4892578125, -5.33154296875, -5.173828125, -5.01611328125, -4.8583984375, -4.70068359375, -4.54296875, -4.38525390625, -4.2275390625, -4.06982421875, -3.912109375, -3.75439453125, -3.5966796875, -3.43896484375, -3.28125, -3.12353515625, -2.9658203125, -2.80810546875, -2.650390625, -2.49267578125, -2.3349609375, -2.17724609375, -2.01953125, -1.86181640625, -1.7041015625, -1.54638671875, -1.388671875, -1.23095703125, -1.0732421875, -0.91552734375, -0.7578125, -0.60009765625, -0.4423828125, -0.28466796875, -0.126953125, 0.03076171875, 0.1884765625, 0.34619140625, 0.50390625, 0.66162109375, 0.8193359375, 0.97705078125, 1.134765625, 1.29248046875, 1.4501953125, 1.60791015625, 1.765625, 1.92333984375, 2.0810546875, 2.23876953125, 2.396484375, 2.55419921875, 2.7119140625, 2.86962890625, 3.02734375, 3.18505859375, 3.3427734375, 3.50048828125, 3.658203125, 3.81591796875, 3.9736328125, 4.13134765625, 4.2890625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 16.0, 46.0, 85.0, 157.0, 228.0, 194.0, 124.0, 70.0, 41.0, 24.0, 7.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5944207906723022, -0.5831496715545654, -0.5718786120414734, -0.5606074929237366, -0.5493364334106445, -0.5380653142929077, -0.5267942547798157, -0.5155231356620789, -0.5042520761489868, -0.4929809868335724, -0.48170989751815796, -0.47043880820274353, -0.4591677188873291, -0.4478965997695923, -0.43662554025650024, -0.4253544211387634, -0.4140833020210266, -0.4028122127056122, -0.39154112339019775, -0.3802700340747833, -0.3689989447593689, -0.3577278256416321, -0.34645676612854004, -0.3351856470108032, -0.3239145874977112, -0.31264349818229675, -0.3013724088668823, -0.2901013195514679, -0.27883023023605347, -0.26755911111831665, -0.2562880516052246, -0.2450169324874878, -0.23374585807323456, -0.22247476875782013, -0.2112036794424057, -0.19993257522583008, -0.18866148591041565, -0.17739039659500122, -0.1661193072795868, -0.15484821796417236, -0.14357712864875793, -0.1323060393333435, -0.12103494256734848, -0.10976385325193405, -0.09849275648593903, -0.0872216671705246, -0.07595057785511017, -0.06467948108911514, -0.05340838432312012, -0.04213729128241539, -0.030866200104355812, -0.019595108926296234, -0.008324015885591507, 0.00294707715511322, 0.014218166470527649, 0.025489263236522675, 0.0367603525519371, 0.04803144559264183, 0.05930253863334656, 0.07057362794876099, 0.08184471726417542, 0.09311581403017044, 0.10438690334558487, 0.1156580001115799, 0.12692908942699432]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 8.0, 6.0, 8.0, 8.0, 11.0, 14.0, 19.0, 15.0, 20.0, 32.0, 16.0, 26.0, 26.0, 29.0, 32.0, 40.0, 38.0, 45.0, 49.0, 43.0, 46.0, 41.0, 36.0, 26.0, 38.0, 22.0, 40.0, 42.0, 28.0, 25.0, 28.0, 24.0, 19.0, 18.0, 12.0, 11.0, 9.0, 14.0, 11.0, 6.0, 3.0, 8.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2128503918647766, -0.20623408257961273, -0.19961777329444885, -0.19300146400928497, -0.1863851547241211, -0.17976884543895721, -0.17315253615379333, -0.16653621196746826, -0.15991991758346558, -0.1533036082983017, -0.14668729901313782, -0.14007098972797394, -0.13345468044281006, -0.12683837115764618, -0.1202220544219017, -0.11360574513673782, -0.10698942840099335, -0.10037311911582947, -0.09375680983066559, -0.08714050054550171, -0.08052419126033783, -0.07390788197517395, -0.06729156523942947, -0.060675255954265594, -0.054058946669101715, -0.047442637383937836, -0.040826328098773956, -0.03421001508831978, -0.0275937058031559, -0.02097739651799202, -0.014361083507537842, -0.007744774222373962, -0.001128464937210083, 0.005487845279276371, 0.012104155495762825, 0.018720466643571854, 0.025336775928735733, 0.03195308521389961, 0.03856939822435379, 0.04518570750951767, 0.05180201679468155, 0.05841832607984543, 0.06503463536500931, 0.07165095210075378, 0.07826726138591766, 0.08488357067108154, 0.09149987995624542, 0.0981161892414093, 0.10473249852657318, 0.11134880781173706, 0.11796511709690094, 0.12458142638206482, 0.1311977356672287, 0.13781404495239258, 0.14443036913871765, 0.15104666352272034, 0.1576629877090454, 0.1642792969942093, 0.17089560627937317, 0.17751191556453705, 0.18412822484970093, 0.1907445341348648, 0.1973608434200287, 0.20397716760635376, 0.21059346199035645]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 6.0, 3.0, 3.0, 10.0, 13.0, 15.0, 11.0, 12.0, 23.0, 20.0, 31.0, 29.0, 32.0, 36.0, 44.0, 45.0, 38.0, 43.0, 55.0, 59.0, 50.0, 39.0, 45.0, 45.0, 33.0, 33.0, 34.0, 27.0, 26.0, 34.0, 19.0, 16.0, 10.0, 20.0, 9.0, 8.0, 3.0, 4.0, 7.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9140625, -6.69427490234375, -6.4744873046875, -6.25469970703125, -6.034912109375, -5.81512451171875, -5.5953369140625, -5.37554931640625, -5.15576171875, -4.93597412109375, -4.7161865234375, -4.49639892578125, -4.276611328125, -4.05682373046875, -3.8370361328125, -3.61724853515625, -3.3974609375, -3.17767333984375, -2.9578857421875, -2.73809814453125, -2.518310546875, -2.29852294921875, -2.0787353515625, -1.85894775390625, -1.63916015625, -1.41937255859375, -1.1995849609375, -0.97979736328125, -0.760009765625, -0.54022216796875, -0.3204345703125, -0.10064697265625, 0.119140625, 0.33892822265625, 0.5587158203125, 0.77850341796875, 0.998291015625, 1.21807861328125, 1.4378662109375, 1.65765380859375, 1.87744140625, 2.09722900390625, 2.3170166015625, 2.53680419921875, 2.756591796875, 2.97637939453125, 3.1961669921875, 3.41595458984375, 3.6357421875, 3.85552978515625, 4.0753173828125, 4.29510498046875, 4.514892578125, 4.73468017578125, 4.9544677734375, 5.17425537109375, 5.39404296875, 5.61383056640625, 5.8336181640625, 6.05340576171875, 6.273193359375, 6.49298095703125, 6.7127685546875, 6.93255615234375, 7.15234375]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 3.0, 10.0, 13.0, 10.0, 31.0, 38.0, 50.0, 73.0, 84.0, 135.0, 213.0, 276.0, 400.0, 690.0, 1110.0, 2070.0, 3920.0, 8509.0, 19021.0, 46472.0, 130425.0, 437748.0, 260383.0, 80439.0, 30559.0, 12936.0, 5844.0, 3000.0, 1536.0, 890.0, 573.0, 322.0, 210.0, 144.0, 102.0, 82.0, 56.0, 50.0, 27.0, 18.0, 25.0, 17.0, 12.0, 11.0, 11.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.765625, -10.4371337890625, -10.108642578125, -9.7801513671875, -9.45166015625, -9.1231689453125, -8.794677734375, -8.4661865234375, -8.1376953125, -7.8092041015625, -7.480712890625, -7.1522216796875, -6.82373046875, -6.4952392578125, -6.166748046875, -5.8382568359375, -5.509765625, -5.1812744140625, -4.852783203125, -4.5242919921875, -4.19580078125, -3.8673095703125, -3.538818359375, -3.2103271484375, -2.8818359375, -2.5533447265625, -2.224853515625, -1.8963623046875, -1.56787109375, -1.2393798828125, -0.910888671875, -0.5823974609375, -0.25390625, 0.0745849609375, 0.403076171875, 0.7315673828125, 1.06005859375, 1.3885498046875, 1.717041015625, 2.0455322265625, 2.3740234375, 2.7025146484375, 3.031005859375, 3.3594970703125, 3.68798828125, 4.0164794921875, 4.344970703125, 4.6734619140625, 5.001953125, 5.3304443359375, 5.658935546875, 5.9874267578125, 6.31591796875, 6.6444091796875, 6.972900390625, 7.3013916015625, 7.6298828125, 7.9583740234375, 8.286865234375, 8.6153564453125, 8.94384765625, 9.2723388671875, 9.600830078125, 9.9293212890625, 10.2578125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 5.0, 8.0, 8.0, 2.0, 15.0, 16.0, 11.0, 24.0, 16.0, 36.0, 36.0, 40.0, 46.0, 66.0, 69.0, 122.0, 170.0, 1317.0, 303.0, 192.0, 118.0, 114.0, 60.0, 43.0, 29.0, 31.0, 26.0, 20.0, 17.0, 15.0, 18.0, 8.0, 14.0, 4.0, 7.0, 7.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.078125, -15.522216796875, -14.96630859375, -14.410400390625, -13.8544921875, -13.298583984375, -12.74267578125, -12.186767578125, -11.630859375, -11.074951171875, -10.51904296875, -9.963134765625, -9.4072265625, -8.851318359375, -8.29541015625, -7.739501953125, -7.18359375, -6.627685546875, -6.07177734375, -5.515869140625, -4.9599609375, -4.404052734375, -3.84814453125, -3.292236328125, -2.736328125, -2.180419921875, -1.62451171875, -1.068603515625, -0.5126953125, 0.043212890625, 0.59912109375, 1.155029296875, 1.7109375, 2.266845703125, 2.82275390625, 3.378662109375, 3.9345703125, 4.490478515625, 5.04638671875, 5.602294921875, 6.158203125, 6.714111328125, 7.27001953125, 7.825927734375, 8.3818359375, 8.937744140625, 9.49365234375, 10.049560546875, 10.60546875, 11.161376953125, 11.71728515625, 12.273193359375, 12.8291015625, 13.385009765625, 13.94091796875, 14.496826171875, 15.052734375, 15.608642578125, 16.16455078125, 16.720458984375, 17.2763671875, 17.832275390625, 18.38818359375, 18.944091796875, 19.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 3.0, 5.0, 3.0, 5.0, 9.0, 10.0, 17.0, 12.0, 21.0, 32.0, 43.0, 58.0, 80.0, 103.0, 174.0, 288.0, 478.0, 966.0, 2263.0, 8378.0, 306322.0, 2803186.0, 17152.0, 3285.0, 1199.0, 599.0, 312.0, 197.0, 160.0, 77.0, 75.0, 40.0, 34.0, 32.0, 18.0, 12.0, 9.0, 8.0, 8.0, 6.0, 2.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0], "bins": [-59.875, -58.2197265625, -56.564453125, -54.9091796875, -53.25390625, -51.5986328125, -49.943359375, -48.2880859375, -46.6328125, -44.9775390625, -43.322265625, -41.6669921875, -40.01171875, -38.3564453125, -36.701171875, -35.0458984375, -33.390625, -31.7353515625, -30.080078125, -28.4248046875, -26.76953125, -25.1142578125, -23.458984375, -21.8037109375, -20.1484375, -18.4931640625, -16.837890625, -15.1826171875, -13.52734375, -11.8720703125, -10.216796875, -8.5615234375, -6.90625, -5.2509765625, -3.595703125, -1.9404296875, -0.28515625, 1.3701171875, 3.025390625, 4.6806640625, 6.3359375, 7.9912109375, 9.646484375, 11.3017578125, 12.95703125, 14.6123046875, 16.267578125, 17.9228515625, 19.578125, 21.2333984375, 22.888671875, 24.5439453125, 26.19921875, 27.8544921875, 29.509765625, 31.1650390625, 32.8203125, 34.4755859375, 36.130859375, 37.7861328125, 39.44140625, 41.0966796875, 42.751953125, 44.4072265625, 46.0625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 11.0, 12.0, 49.0, 89.0, 217.0, 302.0, 196.0, 83.0, 28.0, 15.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.4060516357422, -126.72715759277344, -119.04825592041016, -111.3693618774414, -103.69046020507812, -96.01156616210938, -88.33267211914062, -80.65377807617188, -72.9748764038086, -65.29598236083984, -57.61708068847656, -49.93818664550781, -42.2592887878418, -34.58039093017578, -26.90149688720703, -19.222599029541016, -11.543701171875, -3.864804267883301, 3.8140926361083984, 11.492988586425781, 19.171886444091797, 26.850784301757812, 34.52967834472656, 42.20857620239258, 49.887474060058594, 57.56637191772461, 65.24526977539062, 72.92416381835938, 80.60305786132812, 88.2819595336914, 95.96085357666016, 103.63975524902344, 111.31863403320312, 118.99752807617188, 126.67642974853516, 134.35531616210938, 142.0342254638672, 149.71311950683594, 157.3920135498047, 165.07090759277344, 172.74981689453125, 180.4287109375, 188.10760498046875, 195.7864990234375, 203.4654083251953, 211.14430236816406, 218.8231964111328, 226.50209045410156, 234.1809844970703, 241.85987854003906, 249.5387725830078, 257.2176818847656, 264.8965759277344, 272.5754699707031, 280.2543640136719, 287.9332580566406, 295.6121520996094, 303.2910461425781, 310.9699401855469, 318.6488342285156, 326.3277282714844, 334.00665283203125, 341.685546875, 349.36444091796875, 357.0433349609375]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 6.0, 9.0, 7.0, 10.0, 8.0, 14.0, 13.0, 14.0, 20.0, 19.0, 22.0, 29.0, 28.0, 23.0, 39.0, 36.0, 35.0, 37.0, 46.0, 42.0, 35.0, 30.0, 47.0, 35.0, 40.0, 37.0, 26.0, 32.0, 35.0, 33.0, 31.0, 18.0, 21.0, 17.0, 12.0, 15.0, 19.0, 16.0, 12.0, 8.0, 2.0, 8.0, 10.0, 6.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-58.33087158203125, -56.54862976074219, -54.766387939453125, -52.98414611816406, -51.201904296875, -49.41966247558594, -47.637420654296875, -45.85517883300781, -44.07293701171875, -42.29069519042969, -40.508453369140625, -38.72621154785156, -36.9439697265625, -35.16172790527344, -33.379486083984375, -31.597244262695312, -29.815004348754883, -28.03276252746582, -26.250520706176758, -24.468278884887695, -22.686037063598633, -20.903797149658203, -19.12155532836914, -17.339313507080078, -15.5570707321167, -13.774828910827637, -11.992587089538574, -10.210346221923828, -8.428104400634766, -6.645862579345703, -4.863620758056641, -3.081378936767578, -1.2991371154785156, 0.4831045866012573, 2.2653462886810303, 4.047587871551514, 5.829829692840576, 7.6120710372924805, 9.394312858581543, 11.176554679870605, 12.958796501159668, 14.74103832244873, 16.523279190063477, 18.30552101135254, 20.0877628326416, 21.870004653930664, 23.652246475219727, 25.43448829650879, 27.21673011779785, 28.998971939086914, 30.781213760375977, 32.563453674316406, 34.34569549560547, 36.12793731689453, 37.910179138183594, 39.692420959472656, 41.47466278076172, 43.25690460205078, 45.039146423339844, 46.821388244628906, 48.60363006591797, 50.38587188720703, 52.168113708496094, 53.950355529785156, 55.73259735107422]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 6.0, 6.0, 10.0, 8.0, 16.0, 18.0, 19.0, 22.0, 19.0, 21.0, 35.0, 39.0, 47.0, 45.0, 38.0, 57.0, 47.0, 53.0, 49.0, 39.0, 47.0, 45.0, 43.0, 35.0, 40.0, 38.0, 18.0, 36.0, 24.0, 18.0, 17.0, 9.0, 9.0, 6.0, 6.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.9609375, -7.71832275390625, -7.4757080078125, -7.23309326171875, -6.990478515625, -6.74786376953125, -6.5052490234375, -6.26263427734375, -6.02001953125, -5.77740478515625, -5.5347900390625, -5.29217529296875, -5.049560546875, -4.80694580078125, -4.5643310546875, -4.32171630859375, -4.0791015625, -3.83648681640625, -3.5938720703125, -3.35125732421875, -3.108642578125, -2.86602783203125, -2.6234130859375, -2.38079833984375, -2.13818359375, -1.89556884765625, -1.6529541015625, -1.41033935546875, -1.167724609375, -0.92510986328125, -0.6824951171875, -0.43988037109375, -0.197265625, 0.04534912109375, 0.2879638671875, 0.53057861328125, 0.773193359375, 1.01580810546875, 1.2584228515625, 1.50103759765625, 1.74365234375, 1.98626708984375, 2.2288818359375, 2.47149658203125, 2.714111328125, 2.95672607421875, 3.1993408203125, 3.44195556640625, 3.6845703125, 3.92718505859375, 4.1697998046875, 4.41241455078125, 4.655029296875, 4.89764404296875, 5.1402587890625, 5.38287353515625, 5.62548828125, 5.86810302734375, 6.1107177734375, 6.35333251953125, 6.595947265625, 6.83856201171875, 7.0811767578125, 7.32379150390625, 7.56640625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 6.0, 10.0, 16.0, 36.0, 50.0, 101.0, 213.0, 340.0, 625.0, 1265.0, 2800.0, 7883.0, 37499.0, 716910.0, 3191976.0, 205563.0, 19701.0, 5057.0, 2032.0, 994.0, 517.0, 307.0, 159.0, 97.0, 37.0, 32.0, 11.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-26.625, -25.80126953125, -24.9775390625, -24.15380859375, -23.330078125, -22.50634765625, -21.6826171875, -20.85888671875, -20.03515625, -19.21142578125, -18.3876953125, -17.56396484375, -16.740234375, -15.91650390625, -15.0927734375, -14.26904296875, -13.4453125, -12.62158203125, -11.7978515625, -10.97412109375, -10.150390625, -9.32666015625, -8.5029296875, -7.67919921875, -6.85546875, -6.03173828125, -5.2080078125, -4.38427734375, -3.560546875, -2.73681640625, -1.9130859375, -1.08935546875, -0.265625, 0.55810546875, 1.3818359375, 2.20556640625, 3.029296875, 3.85302734375, 4.6767578125, 5.50048828125, 6.32421875, 7.14794921875, 7.9716796875, 8.79541015625, 9.619140625, 10.44287109375, 11.2666015625, 12.09033203125, 12.9140625, 13.73779296875, 14.5615234375, 15.38525390625, 16.208984375, 17.03271484375, 17.8564453125, 18.68017578125, 19.50390625, 20.32763671875, 21.1513671875, 21.97509765625, 22.798828125, 23.62255859375, 24.4462890625, 25.27001953125, 26.09375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 8.0, 5.0, 9.0, 15.0, 16.0, 23.0, 31.0, 47.0, 56.0, 97.0, 112.0, 179.0, 235.0, 300.0, 422.0, 550.0, 528.0, 416.0, 294.0, 204.0, 165.0, 107.0, 80.0, 45.0, 37.0, 27.0, 21.0, 11.0, 9.0, 10.0, 5.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.203125, -11.7933349609375, -11.383544921875, -10.9737548828125, -10.56396484375, -10.1541748046875, -9.744384765625, -9.3345947265625, -8.9248046875, -8.5150146484375, -8.105224609375, -7.6954345703125, -7.28564453125, -6.8758544921875, -6.466064453125, -6.0562744140625, -5.646484375, -5.2366943359375, -4.826904296875, -4.4171142578125, -4.00732421875, -3.5975341796875, -3.187744140625, -2.7779541015625, -2.3681640625, -1.9583740234375, -1.548583984375, -1.1387939453125, -0.72900390625, -0.3192138671875, 0.090576171875, 0.5003662109375, 0.91015625, 1.3199462890625, 1.729736328125, 2.1395263671875, 2.54931640625, 2.9591064453125, 3.368896484375, 3.7786865234375, 4.1884765625, 4.5982666015625, 5.008056640625, 5.4178466796875, 5.82763671875, 6.2374267578125, 6.647216796875, 7.0570068359375, 7.466796875, 7.8765869140625, 8.286376953125, 8.6961669921875, 9.10595703125, 9.5157470703125, 9.925537109375, 10.3353271484375, 10.7451171875, 11.1549072265625, 11.564697265625, 11.9744873046875, 12.38427734375, 12.7940673828125, 13.203857421875, 13.6136474609375, 14.0234375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 6.0, 5.0, 13.0, 12.0, 10.0, 21.0, 23.0, 26.0, 37.0, 52.0, 81.0, 107.0, 214.0, 306.0, 512.0, 991.0, 2107.0, 5296.0, 19933.0, 187283.0, 3434187.0, 497211.0, 32969.0, 7409.0, 2641.0, 1153.0, 646.0, 340.0, 215.0, 140.0, 102.0, 58.0, 43.0, 38.0, 28.0, 22.0, 13.0, 10.0, 8.0, 4.0, 8.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.265625, -28.369140625, -27.47265625, -26.576171875, -25.6796875, -24.783203125, -23.88671875, -22.990234375, -22.09375, -21.197265625, -20.30078125, -19.404296875, -18.5078125, -17.611328125, -16.71484375, -15.818359375, -14.921875, -14.025390625, -13.12890625, -12.232421875, -11.3359375, -10.439453125, -9.54296875, -8.646484375, -7.75, -6.853515625, -5.95703125, -5.060546875, -4.1640625, -3.267578125, -2.37109375, -1.474609375, -0.578125, 0.318359375, 1.21484375, 2.111328125, 3.0078125, 3.904296875, 4.80078125, 5.697265625, 6.59375, 7.490234375, 8.38671875, 9.283203125, 10.1796875, 11.076171875, 11.97265625, 12.869140625, 13.765625, 14.662109375, 15.55859375, 16.455078125, 17.3515625, 18.248046875, 19.14453125, 20.041015625, 20.9375, 21.833984375, 22.73046875, 23.626953125, 24.5234375, 25.419921875, 26.31640625, 27.212890625, 28.109375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 7.0, 149.0, 743.0, 110.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-850.8346557617188, -834.6129760742188, -818.3912963867188, -802.169677734375, -785.947998046875, -769.726318359375, -753.504638671875, -737.282958984375, -721.0613403320312, -704.8396606445312, -688.6179809570312, -672.3963623046875, -656.1746826171875, -639.9530029296875, -623.7313232421875, -607.5096435546875, -591.2879638671875, -575.0662841796875, -558.8446044921875, -542.6229858398438, -526.4013061523438, -510.17962646484375, -493.95794677734375, -477.7362976074219, -461.5146484375, -445.29296875, -429.0713195800781, -412.8496398925781, -396.62799072265625, -380.40631103515625, -364.18463134765625, -347.9629821777344, -331.74139404296875, -315.51971435546875, -299.2980651855469, -283.0763854980469, -266.854736328125, -250.633056640625, -234.41139221191406, -218.18972778320312, -201.96804809570312, -185.7463836669922, -169.52471923828125, -153.30303955078125, -137.08139038085938, -120.8597183227539, -104.63804626464844, -88.4163818359375, -72.19471740722656, -55.973052978515625, -39.75138473510742, -23.52971649169922, -7.308052062988281, 8.913612365722656, 25.135284423828125, 41.35694885253906, 57.57861328125, 73.80027770996094, 90.02194213867188, 106.24361419677734, 122.46527862548828, 138.68695068359375, 154.9086151123047, 171.13027954101562, 187.35194396972656]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 5.0, 7.0, 11.0, 14.0, 28.0, 27.0, 31.0, 43.0, 32.0, 29.0, 44.0, 43.0, 60.0, 45.0, 51.0, 54.0, 54.0, 57.0, 50.0, 50.0, 34.0, 49.0, 38.0, 30.0, 22.0, 26.0, 8.0, 11.0, 7.0, 8.0, 9.0, 2.0, 5.0, 4.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.5804557800293, -61.82351303100586, -60.066566467285156, -58.30962371826172, -56.55268096923828, -54.795738220214844, -53.038795471191406, -51.2818489074707, -49.524906158447266, -47.76796340942383, -46.011016845703125, -44.25407409667969, -42.49713134765625, -40.74018859863281, -38.983245849609375, -37.22629928588867, -35.469356536865234, -33.7124137878418, -31.955469131469727, -30.198524475097656, -28.44158172607422, -26.68463897705078, -24.92769432067871, -23.17074966430664, -21.413806915283203, -19.656864166259766, -17.899919509887695, -16.142974853515625, -14.386032104492188, -12.629088401794434, -10.87214469909668, -9.115200996398926, -7.3582611083984375, -5.601317405700684, -3.8443737030029297, -2.087430000305176, -0.3304862976074219, 1.426457405090332, 3.183401107788086, 4.94034481048584, 6.697288513183594, 8.454232215881348, 10.211175918579102, 11.968119621276855, 13.72506332397461, 15.482007026672363, 17.238950729370117, 18.995895385742188, 20.752838134765625, 22.509780883789062, 24.266725540161133, 26.023670196533203, 27.78061294555664, 29.537555694580078, 31.29450035095215, 33.05144500732422, 34.808387756347656, 36.565330505371094, 38.32227325439453, 40.079219818115234, 41.83616256713867, 43.59310531616211, 45.35005187988281, 47.10699462890625, 48.86393737792969]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 2.0, 5.0, 8.0, 5.0, 10.0, 8.0, 6.0, 11.0, 13.0, 19.0, 17.0, 32.0, 28.0, 42.0, 35.0, 30.0, 31.0, 39.0, 27.0, 42.0, 38.0, 48.0, 42.0, 32.0, 41.0, 30.0, 37.0, 31.0, 31.0, 38.0, 25.0, 38.0, 20.0, 24.0, 22.0, 11.0, 11.0, 15.0, 12.0, 9.0, 7.0, 7.0, 5.0, 1.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.4140625, -6.23529052734375, -6.0565185546875, -5.87774658203125, -5.698974609375, -5.52020263671875, -5.3414306640625, -5.16265869140625, -4.98388671875, -4.80511474609375, -4.6263427734375, -4.44757080078125, -4.268798828125, -4.09002685546875, -3.9112548828125, -3.73248291015625, -3.5537109375, -3.37493896484375, -3.1961669921875, -3.01739501953125, -2.838623046875, -2.65985107421875, -2.4810791015625, -2.30230712890625, -2.12353515625, -1.94476318359375, -1.7659912109375, -1.58721923828125, -1.408447265625, -1.22967529296875, -1.0509033203125, -0.87213134765625, -0.693359375, -0.51458740234375, -0.3358154296875, -0.15704345703125, 0.021728515625, 0.20050048828125, 0.3792724609375, 0.55804443359375, 0.73681640625, 0.91558837890625, 1.0943603515625, 1.27313232421875, 1.451904296875, 1.63067626953125, 1.8094482421875, 1.98822021484375, 2.1669921875, 2.34576416015625, 2.5245361328125, 2.70330810546875, 2.882080078125, 3.06085205078125, 3.2396240234375, 3.41839599609375, 3.59716796875, 3.77593994140625, 3.9547119140625, 4.13348388671875, 4.312255859375, 4.49102783203125, 4.6697998046875, 4.84857177734375, 5.02734375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 6.0, 2.0, 9.0, 9.0, 18.0, 22.0, 25.0, 43.0, 65.0, 81.0, 105.0, 184.0, 309.0, 519.0, 979.0, 1955.0, 4515.0, 13742.0, 62913.0, 571479.0, 334288.0, 39802.0, 10215.0, 3593.0, 1621.0, 858.0, 450.0, 261.0, 159.0, 105.0, 69.0, 42.0, 41.0, 15.0, 17.0, 16.0, 10.0, 6.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.798828125, -3.671661376953125, -3.54449462890625, -3.417327880859375, -3.2901611328125, -3.162994384765625, -3.03582763671875, -2.908660888671875, -2.781494140625, -2.654327392578125, -2.52716064453125, -2.399993896484375, -2.2728271484375, -2.145660400390625, -2.01849365234375, -1.891326904296875, -1.76416015625, -1.636993408203125, -1.50982666015625, -1.382659912109375, -1.2554931640625, -1.128326416015625, -1.00115966796875, -0.873992919921875, -0.746826171875, -0.619659423828125, -0.49249267578125, -0.365325927734375, -0.2381591796875, -0.110992431640625, 0.01617431640625, 0.143341064453125, 0.2705078125, 0.397674560546875, 0.52484130859375, 0.652008056640625, 0.7791748046875, 0.906341552734375, 1.03350830078125, 1.160675048828125, 1.287841796875, 1.415008544921875, 1.54217529296875, 1.669342041015625, 1.7965087890625, 1.923675537109375, 2.05084228515625, 2.178009033203125, 2.30517578125, 2.432342529296875, 2.55950927734375, 2.686676025390625, 2.8138427734375, 2.941009521484375, 3.06817626953125, 3.195343017578125, 3.322509765625, 3.449676513671875, 3.57684326171875, 3.704010009765625, 3.8311767578125, 3.958343505859375, 4.08551025390625, 4.212677001953125, 4.33984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 10.0, 9.0, 12.0, 9.0, 18.0, 13.0, 20.0, 17.0, 22.0, 31.0, 32.0, 46.0, 37.0, 45.0, 36.0, 50.0, 37.0, 1064.0, 41.0, 53.0, 37.0, 41.0, 30.0, 35.0, 41.0, 31.0, 33.0, 17.0, 20.0, 25.0, 19.0, 17.0, 9.0, 13.0, 7.0, 10.0, 7.0, 7.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.89453125, -3.7547607421875, -3.614990234375, -3.4752197265625, -3.33544921875, -3.1956787109375, -3.055908203125, -2.9161376953125, -2.7763671875, -2.6365966796875, -2.496826171875, -2.3570556640625, -2.21728515625, -2.0775146484375, -1.937744140625, -1.7979736328125, -1.658203125, -1.5184326171875, -1.378662109375, -1.2388916015625, -1.09912109375, -0.9593505859375, -0.819580078125, -0.6798095703125, -0.5400390625, -0.4002685546875, -0.260498046875, -0.1207275390625, 0.01904296875, 0.1588134765625, 0.298583984375, 0.4383544921875, 0.578125, 0.7178955078125, 0.857666015625, 0.9974365234375, 1.13720703125, 1.2769775390625, 1.416748046875, 1.5565185546875, 1.6962890625, 1.8360595703125, 1.975830078125, 2.1156005859375, 2.25537109375, 2.3951416015625, 2.534912109375, 2.6746826171875, 2.814453125, 2.9542236328125, 3.093994140625, 3.2337646484375, 3.37353515625, 3.5133056640625, 3.653076171875, 3.7928466796875, 3.9326171875, 4.0723876953125, 4.212158203125, 4.3519287109375, 4.49169921875, 4.6314697265625, 4.771240234375, 4.9110107421875, 5.05078125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 12.0, 14.0, 18.0, 42.0, 34.0, 49.0, 62.0, 86.0, 155.0, 274.0, 432.0, 669.0, 1142.0, 2191.0, 4698.0, 12763.0, 57125.0, 888868.0, 1047063.0, 58280.0, 13099.0, 4781.0, 2225.0, 1190.0, 669.0, 427.0, 255.0, 167.0, 91.0, 64.0, 53.0, 32.0, 27.0, 23.0, 16.0, 12.0, 7.0, 5.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.92578125, -2.839752197265625, -2.75372314453125, -2.667694091796875, -2.5816650390625, -2.495635986328125, -2.40960693359375, -2.323577880859375, -2.237548828125, -2.151519775390625, -2.06549072265625, -1.979461669921875, -1.8934326171875, -1.807403564453125, -1.72137451171875, -1.635345458984375, -1.54931640625, -1.463287353515625, -1.37725830078125, -1.291229248046875, -1.2052001953125, -1.119171142578125, -1.03314208984375, -0.947113037109375, -0.861083984375, -0.775054931640625, -0.68902587890625, -0.602996826171875, -0.5169677734375, -0.430938720703125, -0.34490966796875, -0.258880615234375, -0.1728515625, -0.086822509765625, -0.00079345703125, 0.085235595703125, 0.1712646484375, 0.257293701171875, 0.34332275390625, 0.429351806640625, 0.515380859375, 0.601409912109375, 0.68743896484375, 0.773468017578125, 0.8594970703125, 0.945526123046875, 1.03155517578125, 1.117584228515625, 1.20361328125, 1.289642333984375, 1.37567138671875, 1.461700439453125, 1.5477294921875, 1.633758544921875, 1.71978759765625, 1.805816650390625, 1.891845703125, 1.977874755859375, 2.06390380859375, 2.149932861328125, 2.2359619140625, 2.321990966796875, 2.40802001953125, 2.494049072265625, 2.580078125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 11.0, 6.0, 6.0, 10.0, 47.0, 77.0, 179.0, 318.0, 146.0, 91.0, 39.0, 14.0, 11.0, 6.0, 5.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3583984375, -0.34799957275390625, -0.3376007080078125, -0.32720184326171875, -0.316802978515625, -0.30640411376953125, -0.2960052490234375, -0.28560638427734375, -0.27520751953125, -0.26480865478515625, -0.2544097900390625, -0.24401092529296875, -0.233612060546875, -0.22321319580078125, -0.2128143310546875, -0.20241546630859375, -0.1920166015625, -0.18161773681640625, -0.1712188720703125, -0.16082000732421875, -0.150421142578125, -0.14002227783203125, -0.1296234130859375, -0.11922454833984375, -0.10882568359375, -0.09842681884765625, -0.0880279541015625, -0.07762908935546875, -0.067230224609375, -0.05683135986328125, -0.0464324951171875, -0.03603363037109375, -0.025634765625, -0.01523590087890625, -0.0048370361328125, 0.00556182861328125, 0.015960693359375, 0.02635955810546875, 0.0367584228515625, 0.04715728759765625, 0.05755615234375, 0.06795501708984375, 0.0783538818359375, 0.08875274658203125, 0.099151611328125, 0.10955047607421875, 0.1199493408203125, 0.13034820556640625, 0.1407470703125, 0.15114593505859375, 0.1615447998046875, 0.17194366455078125, 0.182342529296875, 0.19274139404296875, 0.2031402587890625, 0.21353912353515625, 0.22393798828125, 0.23433685302734375, 0.2447357177734375, 0.25513458251953125, 0.265533447265625, 0.27593231201171875, 0.2863311767578125, 0.29673004150390625, 0.30712890625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 9.0, 7.0, 15.0, 11.0, 18.0, 16.0, 28.0, 43.0, 89.0, 215.0, 915.0, 6507.0, 1007919.0, 30116.0, 1938.0, 378.0, 111.0, 49.0, 30.0, 22.0, 16.0, 26.0, 21.0, 8.0, 2.0, 7.0, 4.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.75390625, -4.593994140625, -4.43408203125, -4.274169921875, -4.1142578125, -3.954345703125, -3.79443359375, -3.634521484375, -3.474609375, -3.314697265625, -3.15478515625, -2.994873046875, -2.8349609375, -2.675048828125, -2.51513671875, -2.355224609375, -2.1953125, -2.035400390625, -1.87548828125, -1.715576171875, -1.5556640625, -1.395751953125, -1.23583984375, -1.075927734375, -0.916015625, -0.756103515625, -0.59619140625, -0.436279296875, -0.2763671875, -0.116455078125, 0.04345703125, 0.203369140625, 0.36328125, 0.523193359375, 0.68310546875, 0.843017578125, 1.0029296875, 1.162841796875, 1.32275390625, 1.482666015625, 1.642578125, 1.802490234375, 1.96240234375, 2.122314453125, 2.2822265625, 2.442138671875, 2.60205078125, 2.761962890625, 2.921875, 3.081787109375, 3.24169921875, 3.401611328125, 3.5615234375, 3.721435546875, 3.88134765625, 4.041259765625, 4.201171875, 4.361083984375, 4.52099609375, 4.680908203125, 4.8408203125, 5.000732421875, 5.16064453125, 5.320556640625, 5.48046875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 12.0, 50.0, 181.0, 298.0, 274.0, 108.0, 50.0, 23.0, 9.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1471014022827148, -1.1257257461547852, -1.1043500900268555, -1.0829743146896362, -1.0615986585617065, -1.0402230024337769, -1.0188473463058472, -0.9974716305732727, -0.9760959148406982, -0.9547202587127686, -0.9333445429801941, -0.9119688868522644, -0.8905931711196899, -0.8692175149917603, -0.8478418588638306, -0.8264661431312561, -0.8050904870033264, -0.7837148308753967, -0.7623391151428223, -0.7409634590148926, -0.7195877432823181, -0.6982120871543884, -0.676836371421814, -0.6554607152938843, -0.6340850591659546, -0.6127094030380249, -0.5913336873054504, -0.5699580311775208, -0.5485823154449463, -0.5272066593170166, -0.5058310031890869, -0.48445528745651245, -0.4630795121192932, -0.44170382618904114, -0.42032814025878906, -0.3989524841308594, -0.3775767683982849, -0.3562011122703552, -0.33482542634010315, -0.3134497404098511, -0.2920740842819214, -0.2706983983516693, -0.24932271242141724, -0.22794704139232635, -0.20657135546207428, -0.1851956695318222, -0.16381999850273132, -0.14244431257247925, -0.12106861174106598, -0.0996929258108139, -0.07831724733114243, -0.05694156885147095, -0.03556588292121887, -0.014190196990966797, 0.0071854740381240845, 0.02856115996837616, 0.049936845898628235, 0.07131253182888031, 0.09268821030855179, 0.11406388878822327, 0.13543957471847534, 0.15681526064872742, 0.1781909316778183, 0.19956661760807037, 0.22094230353832245]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 6.0, 8.0, 8.0, 14.0, 9.0, 20.0, 28.0, 31.0, 34.0, 35.0, 32.0, 45.0, 57.0, 54.0, 55.0, 42.0, 45.0, 57.0, 54.0, 47.0, 42.0, 38.0, 31.0, 40.0, 24.0, 28.0, 29.0, 23.0, 12.0, 19.0, 8.0, 9.0, 9.0, 7.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21800941228866577, -0.2108687162399292, -0.20372800529003143, -0.19658729434013367, -0.1894465982913971, -0.18230590224266052, -0.17516519129276276, -0.168024480342865, -0.16088378429412842, -0.15374308824539185, -0.14660237729549408, -0.1394616663455963, -0.13232097029685974, -0.12518027424812317, -0.1180395632982254, -0.11089885979890823, -0.10375815629959106, -0.0966174528002739, -0.08947674930095673, -0.08233604580163956, -0.07519534230232239, -0.06805463880300522, -0.06091393530368805, -0.05377323180437088, -0.04663252830505371, -0.03949182480573654, -0.03235112130641937, -0.025210417807102203, -0.018069714307785034, -0.010929010808467865, -0.003788307309150696, 0.0033523961901664734, 0.010493099689483643, 0.017633803188800812, 0.02477450668811798, 0.03191521018743515, 0.03905591368675232, 0.04619661718606949, 0.05333732068538666, 0.06047802418470383, 0.067618727684021, 0.07475943118333817, 0.08190013468265533, 0.0890408381819725, 0.09618154168128967, 0.10332224518060684, 0.11046294867992401, 0.11760365217924118, 0.12474435567855835, 0.13188505172729492, 0.1390257626771927, 0.14616647362709045, 0.15330716967582703, 0.1604478657245636, 0.16758857667446136, 0.17472928762435913, 0.1818699836730957, 0.18901067972183228, 0.19615139067173004, 0.2032921016216278, 0.21043279767036438, 0.21757349371910095, 0.22471420466899872, 0.23185491561889648, 0.23899561166763306]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 8.0, 4.0, 10.0, 10.0, 6.0, 13.0, 19.0, 13.0, 14.0, 24.0, 20.0, 29.0, 43.0, 30.0, 39.0, 33.0, 38.0, 54.0, 36.0, 28.0, 45.0, 35.0, 45.0, 35.0, 36.0, 42.0, 44.0, 32.0, 30.0, 18.0, 27.0, 25.0, 26.0, 17.0, 17.0, 10.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-7.23828125, -7.0443115234375, -6.850341796875, -6.6563720703125, -6.46240234375, -6.2684326171875, -6.074462890625, -5.8804931640625, -5.6865234375, -5.4925537109375, -5.298583984375, -5.1046142578125, -4.91064453125, -4.7166748046875, -4.522705078125, -4.3287353515625, -4.134765625, -3.9407958984375, -3.746826171875, -3.5528564453125, -3.35888671875, -3.1649169921875, -2.970947265625, -2.7769775390625, -2.5830078125, -2.3890380859375, -2.195068359375, -2.0010986328125, -1.80712890625, -1.6131591796875, -1.419189453125, -1.2252197265625, -1.03125, -0.8372802734375, -0.643310546875, -0.4493408203125, -0.25537109375, -0.0614013671875, 0.132568359375, 0.3265380859375, 0.5205078125, 0.7144775390625, 0.908447265625, 1.1024169921875, 1.29638671875, 1.4903564453125, 1.684326171875, 1.8782958984375, 2.072265625, 2.2662353515625, 2.460205078125, 2.6541748046875, 2.84814453125, 3.0421142578125, 3.236083984375, 3.4300537109375, 3.6240234375, 3.8179931640625, 4.011962890625, 4.2059326171875, 4.39990234375, 4.5938720703125, 4.787841796875, 4.9818115234375, 5.17578125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 5.0, 10.0, 7.0, 16.0, 17.0, 21.0, 26.0, 31.0, 46.0, 55.0, 83.0, 127.0, 172.0, 224.0, 341.0, 426.0, 690.0, 1160.0, 2233.0, 4937.0, 12312.0, 37827.0, 151004.0, 500277.0, 248336.0, 57480.0, 17310.0, 6492.0, 2869.0, 1402.0, 792.0, 523.0, 389.0, 235.0, 183.0, 133.0, 116.0, 76.0, 42.0, 37.0, 24.0, 21.0, 15.0, 9.0, 6.0, 8.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.796875, -8.51904296875, -8.2412109375, -7.96337890625, -7.685546875, -7.40771484375, -7.1298828125, -6.85205078125, -6.57421875, -6.29638671875, -6.0185546875, -5.74072265625, -5.462890625, -5.18505859375, -4.9072265625, -4.62939453125, -4.3515625, -4.07373046875, -3.7958984375, -3.51806640625, -3.240234375, -2.96240234375, -2.6845703125, -2.40673828125, -2.12890625, -1.85107421875, -1.5732421875, -1.29541015625, -1.017578125, -0.73974609375, -0.4619140625, -0.18408203125, 0.09375, 0.37158203125, 0.6494140625, 0.92724609375, 1.205078125, 1.48291015625, 1.7607421875, 2.03857421875, 2.31640625, 2.59423828125, 2.8720703125, 3.14990234375, 3.427734375, 3.70556640625, 3.9833984375, 4.26123046875, 4.5390625, 4.81689453125, 5.0947265625, 5.37255859375, 5.650390625, 5.92822265625, 6.2060546875, 6.48388671875, 6.76171875, 7.03955078125, 7.3173828125, 7.59521484375, 7.873046875, 8.15087890625, 8.4287109375, 8.70654296875, 8.984375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 17.0, 7.0, 9.0, 19.0, 21.0, 24.0, 20.0, 22.0, 31.0, 51.0, 55.0, 64.0, 88.0, 153.0, 287.0, 1385.0, 208.0, 129.0, 76.0, 70.0, 59.0, 44.0, 35.0, 18.0, 22.0, 18.0, 21.0, 11.0, 15.0, 11.0, 7.0, 9.0, 3.0, 3.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-15.8125, -15.270751953125, -14.72900390625, -14.187255859375, -13.6455078125, -13.103759765625, -12.56201171875, -12.020263671875, -11.478515625, -10.936767578125, -10.39501953125, -9.853271484375, -9.3115234375, -8.769775390625, -8.22802734375, -7.686279296875, -7.14453125, -6.602783203125, -6.06103515625, -5.519287109375, -4.9775390625, -4.435791015625, -3.89404296875, -3.352294921875, -2.810546875, -2.268798828125, -1.72705078125, -1.185302734375, -0.6435546875, -0.101806640625, 0.43994140625, 0.981689453125, 1.5234375, 2.065185546875, 2.60693359375, 3.148681640625, 3.6904296875, 4.232177734375, 4.77392578125, 5.315673828125, 5.857421875, 6.399169921875, 6.94091796875, 7.482666015625, 8.0244140625, 8.566162109375, 9.10791015625, 9.649658203125, 10.19140625, 10.733154296875, 11.27490234375, 11.816650390625, 12.3583984375, 12.900146484375, 13.44189453125, 13.983642578125, 14.525390625, 15.067138671875, 15.60888671875, 16.150634765625, 16.6923828125, 17.234130859375, 17.77587890625, 18.317626953125, 18.859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 5.0, 2.0, 5.0, 9.0, 8.0, 18.0, 13.0, 16.0, 21.0, 37.0, 35.0, 44.0, 67.0, 88.0, 143.0, 219.0, 358.0, 714.0, 1955.0, 13512.0, 2626871.0, 491878.0, 6731.0, 1460.0, 561.0, 301.0, 172.0, 111.0, 82.0, 62.0, 53.0, 42.0, 24.0, 23.0, 16.0, 12.0, 14.0, 6.0, 4.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.71875, -31.752685546875, -30.78662109375, -29.820556640625, -28.8544921875, -27.888427734375, -26.92236328125, -25.956298828125, -24.990234375, -24.024169921875, -23.05810546875, -22.092041015625, -21.1259765625, -20.159912109375, -19.19384765625, -18.227783203125, -17.26171875, -16.295654296875, -15.32958984375, -14.363525390625, -13.3974609375, -12.431396484375, -11.46533203125, -10.499267578125, -9.533203125, -8.567138671875, -7.60107421875, -6.635009765625, -5.6689453125, -4.702880859375, -3.73681640625, -2.770751953125, -1.8046875, -0.838623046875, 0.12744140625, 1.093505859375, 2.0595703125, 3.025634765625, 3.99169921875, 4.957763671875, 5.923828125, 6.889892578125, 7.85595703125, 8.822021484375, 9.7880859375, 10.754150390625, 11.72021484375, 12.686279296875, 13.65234375, 14.618408203125, 15.58447265625, 16.550537109375, 17.5166015625, 18.482666015625, 19.44873046875, 20.414794921875, 21.380859375, 22.346923828125, 23.31298828125, 24.279052734375, 25.2451171875, 26.211181640625, 27.17724609375, 28.143310546875, 29.109375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 143.0, 849.0, 20.0, 0.0, 1.0, 0.0, 2.0], "bins": [-869.2963256835938, -854.3916625976562, -839.487060546875, -824.5823974609375, -809.677734375, -794.7730712890625, -779.8684692382812, -764.9638061523438, -750.0591430664062, -735.1544799804688, -720.2498779296875, -705.34521484375, -690.4405517578125, -675.535888671875, -660.6312866210938, -645.7266235351562, -630.8219604492188, -615.9172973632812, -601.0126953125, -586.1080322265625, -571.203369140625, -556.2987060546875, -541.3941040039062, -526.4894409179688, -511.5848083496094, -496.68017578125, -481.7755126953125, -466.8708801269531, -451.9662170410156, -437.06158447265625, -422.15692138671875, -407.2522888183594, -392.3476257324219, -377.4429931640625, -362.538330078125, -347.6336975097656, -332.7290344238281, -317.82440185546875, -302.91973876953125, -288.0151062011719, -273.1104736328125, -258.2058410644531, -243.30117797851562, -228.3965301513672, -213.49188232421875, -198.58724975585938, -183.68258666992188, -168.7779541015625, -153.873291015625, -138.96864318847656, -124.06399536132812, -109.15934753417969, -94.25469970703125, -79.35005950927734, -64.4454116821289, -49.54076385498047, -34.6361083984375, -19.731460571289062, -4.826814651489258, 10.077831268310547, 24.982479095458984, 39.887123107910156, 54.791770935058594, 69.69641876220703, 84.60106658935547]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 7.0, 4.0, 7.0, 4.0, 10.0, 8.0, 13.0, 21.0, 18.0, 19.0, 21.0, 23.0, 37.0, 25.0, 39.0, 28.0, 28.0, 44.0, 41.0, 41.0, 37.0, 35.0, 30.0, 41.0, 42.0, 39.0, 31.0, 35.0, 41.0, 32.0, 36.0, 19.0, 20.0, 16.0, 15.0, 17.0, 12.0, 13.0, 15.0, 12.0, 7.0, 7.0, 2.0, 1.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-56.94044876098633, -55.305442810058594, -53.670433044433594, -52.03542709350586, -50.40041732788086, -48.765411376953125, -47.130401611328125, -45.49539566040039, -43.860389709472656, -42.22538375854492, -40.59037399291992, -38.95536804199219, -37.32035827636719, -35.68535232543945, -34.05034637451172, -32.41533660888672, -30.78032684326172, -29.14531898498535, -27.510311126708984, -25.87530517578125, -24.24029541015625, -22.605289459228516, -20.97028160095215, -19.33527374267578, -17.700265884399414, -16.065258026123047, -14.43025016784668, -12.795243263244629, -11.160235404968262, -9.525227546691895, -7.890220642089844, -6.255212783813477, -4.620204925537109, -2.9851973056793213, -1.3501896858215332, 0.2848176956176758, 1.919825553894043, 3.55483341217041, 5.189840316772461, 6.824848175048828, 8.459856033325195, 10.094863891601562, 11.72987174987793, 13.36487865447998, 14.999886512756348, 16.63489532470703, 18.269901275634766, 19.904909133911133, 21.5399169921875, 23.174924850463867, 24.809932708740234, 26.44493865966797, 28.07994842529297, 29.714954376220703, 31.34996223449707, 32.98497009277344, 34.61997985839844, 36.25498580932617, 37.88999557495117, 39.525001525878906, 41.160011291503906, 42.79501724243164, 44.430023193359375, 46.065032958984375, 47.70003890991211]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 9.0, 8.0, 7.0, 9.0, 8.0, 10.0, 15.0, 28.0, 25.0, 25.0, 31.0, 30.0, 22.0, 36.0, 36.0, 38.0, 37.0, 46.0, 43.0, 56.0, 52.0, 45.0, 24.0, 46.0, 35.0, 43.0, 36.0, 27.0, 29.0, 24.0, 17.0, 19.0, 17.0, 15.0, 8.0, 4.0, 10.0, 5.0, 2.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-7.9921875, -7.765869140625, -7.53955078125, -7.313232421875, -7.0869140625, -6.860595703125, -6.63427734375, -6.407958984375, -6.181640625, -5.955322265625, -5.72900390625, -5.502685546875, -5.2763671875, -5.050048828125, -4.82373046875, -4.597412109375, -4.37109375, -4.144775390625, -3.91845703125, -3.692138671875, -3.4658203125, -3.239501953125, -3.01318359375, -2.786865234375, -2.560546875, -2.334228515625, -2.10791015625, -1.881591796875, -1.6552734375, -1.428955078125, -1.20263671875, -0.976318359375, -0.75, -0.523681640625, -0.29736328125, -0.071044921875, 0.1552734375, 0.381591796875, 0.60791015625, 0.834228515625, 1.060546875, 1.286865234375, 1.51318359375, 1.739501953125, 1.9658203125, 2.192138671875, 2.41845703125, 2.644775390625, 2.87109375, 3.097412109375, 3.32373046875, 3.550048828125, 3.7763671875, 4.002685546875, 4.22900390625, 4.455322265625, 4.681640625, 4.907958984375, 5.13427734375, 5.360595703125, 5.5869140625, 5.813232421875, 6.03955078125, 6.265869140625, 6.4921875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 7.0, 8.0, 12.0, 11.0, 13.0, 20.0, 34.0, 31.0, 61.0, 90.0, 121.0, 172.0, 252.0, 398.0, 581.0, 914.0, 1644.0, 3474.0, 11230.0, 60314.0, 884756.0, 2967052.0, 224850.0, 26462.0, 6170.0, 2277.0, 1173.0, 757.0, 456.0, 282.0, 204.0, 161.0, 91.0, 65.0, 46.0, 26.0, 12.0, 10.0, 10.0, 18.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-31.734375, -30.80859375, -29.8828125, -28.95703125, -28.03125, -27.10546875, -26.1796875, -25.25390625, -24.328125, -23.40234375, -22.4765625, -21.55078125, -20.625, -19.69921875, -18.7734375, -17.84765625, -16.921875, -15.99609375, -15.0703125, -14.14453125, -13.21875, -12.29296875, -11.3671875, -10.44140625, -9.515625, -8.58984375, -7.6640625, -6.73828125, -5.8125, -4.88671875, -3.9609375, -3.03515625, -2.109375, -1.18359375, -0.2578125, 0.66796875, 1.59375, 2.51953125, 3.4453125, 4.37109375, 5.296875, 6.22265625, 7.1484375, 8.07421875, 9.0, 9.92578125, 10.8515625, 11.77734375, 12.703125, 13.62890625, 14.5546875, 15.48046875, 16.40625, 17.33203125, 18.2578125, 19.18359375, 20.109375, 21.03515625, 21.9609375, 22.88671875, 23.8125, 24.73828125, 25.6640625, 26.58984375, 27.515625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 8.0, 13.0, 25.0, 30.0, 40.0, 56.0, 66.0, 95.0, 117.0, 164.0, 216.0, 315.0, 375.0, 468.0, 402.0, 389.0, 328.0, 236.0, 187.0, 118.0, 113.0, 86.0, 68.0, 45.0, 22.0, 13.0, 20.0, 11.0, 8.0, 5.0, 9.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.1397705078125, -8.724853515625, -8.3099365234375, -7.89501953125, -7.4801025390625, -7.065185546875, -6.6502685546875, -6.2353515625, -5.8204345703125, -5.405517578125, -4.9906005859375, -4.57568359375, -4.1607666015625, -3.745849609375, -3.3309326171875, -2.916015625, -2.5010986328125, -2.086181640625, -1.6712646484375, -1.25634765625, -0.8414306640625, -0.426513671875, -0.0115966796875, 0.4033203125, 0.8182373046875, 1.233154296875, 1.6480712890625, 2.06298828125, 2.4779052734375, 2.892822265625, 3.3077392578125, 3.72265625, 4.1375732421875, 4.552490234375, 4.9674072265625, 5.38232421875, 5.7972412109375, 6.212158203125, 6.6270751953125, 7.0419921875, 7.4569091796875, 7.871826171875, 8.2867431640625, 8.70166015625, 9.1165771484375, 9.531494140625, 9.9464111328125, 10.361328125, 10.7762451171875, 11.191162109375, 11.6060791015625, 12.02099609375, 12.4359130859375, 12.850830078125, 13.2657470703125, 13.6806640625, 14.0955810546875, 14.510498046875, 14.9254150390625, 15.34033203125, 15.7552490234375, 16.170166015625, 16.5850830078125, 17.0]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 12.0, 16.0, 22.0, 47.0, 92.0, 199.0, 419.0, 1123.0, 4895.0, 49074.0, 977336.0, 2974785.0, 170687.0, 12409.0, 1974.0, 645.0, 255.0, 138.0, 69.0, 34.0, 15.0, 9.0, 9.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.984375, -24.15771484375, -23.3310546875, -22.50439453125, -21.677734375, -20.85107421875, -20.0244140625, -19.19775390625, -18.37109375, -17.54443359375, -16.7177734375, -15.89111328125, -15.064453125, -14.23779296875, -13.4111328125, -12.58447265625, -11.7578125, -10.93115234375, -10.1044921875, -9.27783203125, -8.451171875, -7.62451171875, -6.7978515625, -5.97119140625, -5.14453125, -4.31787109375, -3.4912109375, -2.66455078125, -1.837890625, -1.01123046875, -0.1845703125, 0.64208984375, 1.46875, 2.29541015625, 3.1220703125, 3.94873046875, 4.775390625, 5.60205078125, 6.4287109375, 7.25537109375, 8.08203125, 8.90869140625, 9.7353515625, 10.56201171875, 11.388671875, 12.21533203125, 13.0419921875, 13.86865234375, 14.6953125, 15.52197265625, 16.3486328125, 17.17529296875, 18.001953125, 18.82861328125, 19.6552734375, 20.48193359375, 21.30859375, 22.13525390625, 22.9619140625, 23.78857421875, 24.615234375, 25.44189453125, 26.2685546875, 27.09521484375, 27.921875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 8.0, 6.0, 12.0, 12.0, 17.0, 26.0, 40.0, 52.0, 71.0, 81.0, 119.0, 97.0, 103.0, 89.0, 68.0, 53.0, 41.0, 23.0, 29.0, 19.0, 13.0, 10.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.03022003173828, -75.66656494140625, -72.30290985107422, -68.93925476074219, -65.57560729980469, -62.211952209472656, -58.848297119140625, -55.484642028808594, -52.12099075317383, -48.7573356628418, -45.39368438720703, -42.030029296875, -38.66637420654297, -35.3027229309082, -31.939067840576172, -28.575414657592773, -25.211761474609375, -21.848108291625977, -18.484455108642578, -15.120800018310547, -11.757146835327148, -8.39349365234375, -5.029838562011719, -1.6661853790283203, 1.6974678039550781, 5.061121463775635, 8.424775123596191, 11.788429260253906, 15.152082443237305, 18.515735626220703, 21.879390716552734, 25.243043899536133, 28.606704711914062, 31.97035789489746, 35.33401107788086, 38.69766616821289, 42.061317443847656, 45.42497253417969, 48.78862762451172, 52.15228271484375, 55.515933990478516, 58.87958908081055, 62.24324035644531, 65.60689544677734, 68.97055053710938, 72.33419799804688, 75.69786071777344, 79.06150817871094, 82.42516326904297, 85.788818359375, 89.15247344970703, 92.51612854003906, 95.87977600097656, 99.2434310913086, 102.60708618164062, 105.97074127197266, 109.33439636230469, 112.69805145263672, 116.06170654296875, 119.42535400390625, 122.78900909423828, 126.15266418457031, 129.51632690429688, 132.87997436523438, 136.24362182617188]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 7.0, 4.0, 10.0, 14.0, 3.0, 17.0, 11.0, 16.0, 18.0, 21.0, 27.0, 30.0, 30.0, 28.0, 45.0, 30.0, 39.0, 41.0, 48.0, 41.0, 45.0, 47.0, 41.0, 43.0, 40.0, 32.0, 43.0, 40.0, 21.0, 24.0, 24.0, 18.0, 23.0, 20.0, 15.0, 6.0, 8.0, 4.0, 8.0, 6.0, 3.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.854591369628906, -59.93022918701172, -58.00586700439453, -56.081504821777344, -54.15713882446289, -52.2327766418457, -50.308414459228516, -48.38405227661133, -46.459686279296875, -44.53532409667969, -42.6109619140625, -40.68659973144531, -38.76223373413086, -36.83787155151367, -34.913509368896484, -32.9891471862793, -31.06478500366211, -29.140422821044922, -27.2160587310791, -25.291696548461914, -23.367332458496094, -21.442970275878906, -19.51860809326172, -17.59424591064453, -15.669881820678711, -13.745518684387207, -11.821155548095703, -9.896793365478516, -7.972430229187012, -6.048067092895508, -4.12370491027832, -2.1993417739868164, -0.2749748229980469, 1.649388074874878, 3.5737509727478027, 5.498113632202148, 7.422476768493652, 9.346839904785156, 11.271202087402344, 13.195565223693848, 15.119928359985352, 17.04429054260254, 18.96865463256836, 20.893016815185547, 22.817378997802734, 24.741743087768555, 26.666105270385742, 28.590469360351562, 30.51483154296875, 32.43919372558594, 34.363555908203125, 36.28791809082031, 38.212284088134766, 40.13664627075195, 42.06100845336914, 43.98537063598633, 45.90973663330078, 47.83409881591797, 49.758460998535156, 51.682823181152344, 53.6071891784668, 55.531551361083984, 57.45591354370117, 59.38027572631836, 61.30463790893555]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 8.0, 7.0, 12.0, 14.0, 16.0, 13.0, 21.0, 26.0, 26.0, 34.0, 28.0, 34.0, 36.0, 23.0, 40.0, 36.0, 43.0, 45.0, 57.0, 33.0, 50.0, 50.0, 42.0, 40.0, 36.0, 23.0, 29.0, 29.0, 23.0, 22.0, 18.0, 21.0, 11.0, 8.0, 10.0, 4.0, 6.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-116.0625, -112.33203125, -108.6015625, -104.87109375, -101.140625, -97.41015625, -93.6796875, -89.94921875, -86.21875, -82.48828125, -78.7578125, -75.02734375, -71.296875, -67.56640625, -63.8359375, -60.10546875, -56.375, -52.64453125, -48.9140625, -45.18359375, -41.453125, -37.72265625, -33.9921875, -30.26171875, -26.53125, -22.80078125, -19.0703125, -15.33984375, -11.609375, -7.87890625, -4.1484375, -0.41796875, 3.3125, 7.04296875, 10.7734375, 14.50390625, 18.234375, 21.96484375, 25.6953125, 29.42578125, 33.15625, 36.88671875, 40.6171875, 44.34765625, 48.078125, 51.80859375, 55.5390625, 59.26953125, 63.0, 66.73046875, 70.4609375, 74.19140625, 77.921875, 81.65234375, 85.3828125, 89.11328125, 92.84375, 96.57421875, 100.3046875, 104.03515625, 107.765625, 111.49609375, 115.2265625, 118.95703125, 122.6875]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 17.0, 21.0, 25.0, 45.0, 51.0, 112.0, 175.0, 244.0, 402.0, 687.0, 1112.0, 1820.0, 3046.0, 5066.0, 8562.0, 15048.0, 26916.0, 49722.0, 98912.0, 199028.0, 276697.0, 175071.0, 85675.0, 43800.0, 23652.0, 13341.0, 7748.0, 4598.0, 2683.0, 1646.0, 1010.0, 616.0, 365.0, 223.0, 146.0, 103.0, 68.0, 34.0, 28.0, 17.0, 9.0, 10.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.931640625, -7.65234375, -7.373046875, -7.09375, -6.814453125, -6.53515625, -6.255859375, -5.9765625, -5.697265625, -5.41796875, -5.138671875, -4.859375, -4.580078125, -4.30078125, -4.021484375, -3.7421875, -3.462890625, -3.18359375, -2.904296875, -2.625, -2.345703125, -2.06640625, -1.787109375, -1.5078125, -1.228515625, -0.94921875, -0.669921875, -0.390625, -0.111328125, 0.16796875, 0.447265625, 0.7265625, 1.005859375, 1.28515625, 1.564453125, 1.84375, 2.123046875, 2.40234375, 2.681640625, 2.9609375, 3.240234375, 3.51953125, 3.798828125, 4.078125, 4.357421875, 4.63671875, 4.916015625, 5.1953125, 5.474609375, 5.75390625, 6.033203125, 6.3125, 6.591796875, 6.87109375, 7.150390625, 7.4296875, 7.708984375, 7.98828125, 8.267578125, 8.546875, 8.826171875, 9.10546875, 9.384765625, 9.6640625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 13.0, 15.0, 9.0, 24.0, 17.0, 25.0, 29.0, 25.0, 27.0, 39.0, 38.0, 43.0, 53.0, 56.0, 30.0, 40.0, 1076.0, 52.0, 43.0, 45.0, 35.0, 43.0, 45.0, 30.0, 15.0, 20.0, 18.0, 26.0, 18.0, 18.0, 12.0, 7.0, 4.0, 9.0, 3.0, 4.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.5, -71.095703125, -68.69140625, -66.287109375, -63.8828125, -61.478515625, -59.07421875, -56.669921875, -54.265625, -51.861328125, -49.45703125, -47.052734375, -44.6484375, -42.244140625, -39.83984375, -37.435546875, -35.03125, -32.626953125, -30.22265625, -27.818359375, -25.4140625, -23.009765625, -20.60546875, -18.201171875, -15.796875, -13.392578125, -10.98828125, -8.583984375, -6.1796875, -3.775390625, -1.37109375, 1.033203125, 3.4375, 5.841796875, 8.24609375, 10.650390625, 13.0546875, 15.458984375, 17.86328125, 20.267578125, 22.671875, 25.076171875, 27.48046875, 29.884765625, 32.2890625, 34.693359375, 37.09765625, 39.501953125, 41.90625, 44.310546875, 46.71484375, 49.119140625, 51.5234375, 53.927734375, 56.33203125, 58.736328125, 61.140625, 63.544921875, 65.94921875, 68.353515625, 70.7578125, 73.162109375, 75.56640625, 77.970703125, 80.375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 5.0, 6.0, 15.0, 18.0, 21.0, 34.0, 55.0, 87.0, 156.0, 226.0, 396.0, 542.0, 888.0, 1554.0, 2563.0, 4578.0, 7624.0, 13480.0, 24569.0, 44804.0, 85734.0, 177692.0, 1278300.0, 231857.0, 101778.0, 53328.0, 28559.0, 15890.0, 9200.0, 5366.0, 3058.0, 1869.0, 1153.0, 659.0, 373.0, 224.0, 174.0, 100.0, 70.0, 49.0, 31.0, 17.0, 9.0, 7.0, 9.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.46875, -8.1922607421875, -7.915771484375, -7.6392822265625, -7.36279296875, -7.0863037109375, -6.809814453125, -6.5333251953125, -6.2568359375, -5.9803466796875, -5.703857421875, -5.4273681640625, -5.15087890625, -4.8743896484375, -4.597900390625, -4.3214111328125, -4.044921875, -3.7684326171875, -3.491943359375, -3.2154541015625, -2.93896484375, -2.6624755859375, -2.385986328125, -2.1094970703125, -1.8330078125, -1.5565185546875, -1.280029296875, -1.0035400390625, -0.72705078125, -0.4505615234375, -0.174072265625, 0.1024169921875, 0.37890625, 0.6553955078125, 0.931884765625, 1.2083740234375, 1.48486328125, 1.7613525390625, 2.037841796875, 2.3143310546875, 2.5908203125, 2.8673095703125, 3.143798828125, 3.4202880859375, 3.69677734375, 3.9732666015625, 4.249755859375, 4.5262451171875, 4.802734375, 5.0792236328125, 5.355712890625, 5.6322021484375, 5.90869140625, 6.1851806640625, 6.461669921875, 6.7381591796875, 7.0146484375, 7.2911376953125, 7.567626953125, 7.8441162109375, 8.12060546875, 8.3970947265625, 8.673583984375, 8.9500732421875, 9.2265625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 9.0, 8.0, 9.0, 16.0, 12.0, 20.0, 28.0, 50.0, 43.0, 45.0, 65.0, 90.0, 85.0, 96.0, 84.0, 58.0, 43.0, 42.0, 31.0, 24.0, 22.0, 19.0, 16.0, 14.0, 10.0, 11.0, 7.0, 6.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.297607421875, -0.28797149658203125, -0.2783355712890625, -0.26869964599609375, -0.259063720703125, -0.24942779541015625, -0.2397918701171875, -0.23015594482421875, -0.22052001953125, -0.21088409423828125, -0.2012481689453125, -0.19161224365234375, -0.181976318359375, -0.17234039306640625, -0.1627044677734375, -0.15306854248046875, -0.1434326171875, -0.13379669189453125, -0.1241607666015625, -0.11452484130859375, -0.104888916015625, -0.09525299072265625, -0.0856170654296875, -0.07598114013671875, -0.06634521484375, -0.05670928955078125, -0.0470733642578125, -0.03743743896484375, -0.027801513671875, -0.01816558837890625, -0.0085296630859375, 0.00110626220703125, 0.0107421875, 0.02037811279296875, 0.0300140380859375, 0.03964996337890625, 0.049285888671875, 0.05892181396484375, 0.0685577392578125, 0.07819366455078125, 0.08782958984375, 0.09746551513671875, 0.1071014404296875, 0.11673736572265625, 0.126373291015625, 0.13600921630859375, 0.1456451416015625, 0.15528106689453125, 0.1649169921875, 0.17455291748046875, 0.1841888427734375, 0.19382476806640625, 0.203460693359375, 0.21309661865234375, 0.2227325439453125, 0.23236846923828125, 0.24200439453125, 0.25164031982421875, 0.2612762451171875, 0.27091217041015625, 0.280548095703125, 0.29018402099609375, 0.2998199462890625, 0.30945587158203125, 0.319091796875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 7.0, 13.0, 17.0, 10.0, 37.0, 28.0, 63.0, 59.0, 97.0, 131.0, 187.0, 263.0, 364.0, 550.0, 735.0, 1098.0, 1652.0, 2877.0, 5781.0, 13370.0, 37853.0, 165446.0, 574028.0, 176506.0, 39258.0, 13737.0, 6046.0, 2896.0, 1739.0, 1096.0, 766.0, 564.0, 352.0, 264.0, 200.0, 136.0, 88.0, 58.0, 45.0, 48.0, 33.0, 20.0, 13.0, 11.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-1.767578125, -1.71636962890625, -1.6651611328125, -1.61395263671875, -1.562744140625, -1.51153564453125, -1.4603271484375, -1.40911865234375, -1.35791015625, -1.30670166015625, -1.2554931640625, -1.20428466796875, -1.153076171875, -1.10186767578125, -1.0506591796875, -0.99945068359375, -0.9482421875, -0.89703369140625, -0.8458251953125, -0.79461669921875, -0.743408203125, -0.69219970703125, -0.6409912109375, -0.58978271484375, -0.53857421875, -0.48736572265625, -0.4361572265625, -0.38494873046875, -0.333740234375, -0.28253173828125, -0.2313232421875, -0.18011474609375, -0.12890625, -0.07769775390625, -0.0264892578125, 0.02471923828125, 0.075927734375, 0.12713623046875, 0.1783447265625, 0.22955322265625, 0.28076171875, 0.33197021484375, 0.3831787109375, 0.43438720703125, 0.485595703125, 0.53680419921875, 0.5880126953125, 0.63922119140625, 0.6904296875, 0.74163818359375, 0.7928466796875, 0.84405517578125, 0.895263671875, 0.94647216796875, 0.9976806640625, 1.04888916015625, 1.10009765625, 1.15130615234375, 1.2025146484375, 1.25372314453125, 1.304931640625, 1.35614013671875, 1.4073486328125, 1.45855712890625, 1.509765625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 9.0, 2.0, 7.0, 9.0, 17.0, 24.0, 32.0, 51.0, 77.0, 100.0, 124.0, 131.0, 125.0, 122.0, 62.0, 39.0, 28.0, 22.0, 11.0, 6.0, 1.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8307793140411377, -0.8086284399032593, -0.7864775657653809, -0.7643266916275024, -0.742175817489624, -0.7200250029563904, -0.697874128818512, -0.6757232546806335, -0.6535723805427551, -0.6314215064048767, -0.6092706322669983, -0.5871197581291199, -0.5649689435958862, -0.5428180694580078, -0.5206671953201294, -0.498516321182251, -0.47636544704437256, -0.45421457290649414, -0.4320636987686157, -0.4099128544330597, -0.3877619802951813, -0.36561110615730286, -0.3434602618217468, -0.3213093876838684, -0.29915851354599, -0.2770076394081116, -0.25485676527023315, -0.23270592093467712, -0.2105550467967987, -0.1884041726589203, -0.16625331342220306, -0.14410245418548584, -0.12195158004760742, -0.0998007133603096, -0.07764984667301178, -0.05549897998571396, -0.03334811329841614, -0.011197246611118317, 0.010953620076179504, 0.03310447931289673, 0.055255353450775146, 0.07740622013807297, 0.09955708682537079, 0.12170795351266861, 0.14385882019996643, 0.16600969433784485, 0.18816055357456207, 0.2103114128112793, 0.23246228694915771, 0.25461316108703613, 0.27676403522491455, 0.2989148795604706, 0.321065753698349, 0.3432166278362274, 0.36536747217178345, 0.38751834630966187, 0.4096692204475403, 0.4318200945854187, 0.4539709687232971, 0.47612181305885315, 0.49827268719673157, 0.5204235315322876, 0.542574405670166, 0.5647252798080444, 0.5868761539459229]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 8.0, 9.0, 11.0, 8.0, 12.0, 17.0, 13.0, 30.0, 23.0, 26.0, 27.0, 27.0, 34.0, 35.0, 33.0, 38.0, 54.0, 38.0, 40.0, 36.0, 50.0, 38.0, 39.0, 40.0, 33.0, 36.0, 17.0, 29.0, 23.0, 24.0, 24.0, 17.0, 13.0, 17.0, 19.0, 11.0, 12.0, 2.0, 8.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22672247886657715, -0.21937517821788788, -0.2120278775691986, -0.20468059182167053, -0.19733329117298126, -0.189985990524292, -0.18263868987560272, -0.17529138922691345, -0.16794410347938538, -0.1605968028306961, -0.15324950218200684, -0.14590221643447876, -0.1385549157857895, -0.13120761513710022, -0.12386031448841095, -0.11651301383972168, -0.10916571319103241, -0.10181841254234314, -0.09447111934423447, -0.0871238186955452, -0.07977652549743652, -0.07242922484874725, -0.06508192420005798, -0.05773462727665901, -0.05038733035326004, -0.04304003342986107, -0.0356927365064621, -0.028345435857772827, -0.020998138934373856, -0.013650842010974884, -0.006303541362285614, 0.0010437555611133575, 0.008391052484512329, 0.0157383494079113, 0.02308564819395542, 0.030432946979999542, 0.037780243903398514, 0.045127540826797485, 0.052474841475486755, 0.05982213839888573, 0.0671694353222847, 0.07451673597097397, 0.08186402916908264, 0.08921132981777191, 0.09655863046646118, 0.10390592366456985, 0.11125322431325912, 0.1186005175113678, 0.12594781816005707, 0.13329511880874634, 0.1406424194574356, 0.14798972010612488, 0.15533700585365295, 0.16268430650234222, 0.1700316071510315, 0.17737890779972076, 0.18472620844841003, 0.1920735090970993, 0.19942080974578857, 0.20676809549331665, 0.21411539614200592, 0.2214626967906952, 0.22880999743938446, 0.23615729808807373, 0.2435045838356018]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 4.0, 14.0, 6.0, 11.0, 11.0, 11.0, 14.0, 11.0, 21.0, 24.0, 19.0, 35.0, 35.0, 39.0, 36.0, 42.0, 30.0, 45.0, 42.0, 51.0, 46.0, 35.0, 52.0, 41.0, 47.0, 32.0, 33.0, 28.0, 20.0, 31.0, 30.0, 17.0, 13.0, 14.0, 10.0, 10.0, 6.0, 7.0, 6.0, 3.0, 2.0, 2.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.0625, -100.4365234375, -96.810546875, -93.1845703125, -89.55859375, -85.9326171875, -82.306640625, -78.6806640625, -75.0546875, -71.4287109375, -67.802734375, -64.1767578125, -60.55078125, -56.9248046875, -53.298828125, -49.6728515625, -46.046875, -42.4208984375, -38.794921875, -35.1689453125, -31.54296875, -27.9169921875, -24.291015625, -20.6650390625, -17.0390625, -13.4130859375, -9.787109375, -6.1611328125, -2.53515625, 1.0908203125, 4.716796875, 8.3427734375, 11.96875, 15.5947265625, 19.220703125, 22.8466796875, 26.47265625, 30.0986328125, 33.724609375, 37.3505859375, 40.9765625, 44.6025390625, 48.228515625, 51.8544921875, 55.48046875, 59.1064453125, 62.732421875, 66.3583984375, 69.984375, 73.6103515625, 77.236328125, 80.8623046875, 84.48828125, 88.1142578125, 91.740234375, 95.3662109375, 98.9921875, 102.6181640625, 106.244140625, 109.8701171875, 113.49609375, 117.1220703125, 120.748046875, 124.3740234375, 128.0]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0, 9.0, 11.0, 11.0, 8.0, 16.0, 16.0, 20.0, 36.0, 42.0, 55.0, 64.0, 94.0, 168.0, 264.0, 526.0, 1226.0, 4081.0, 21812.0, 208194.0, 683298.0, 109866.0, 13652.0, 2946.0, 979.0, 437.0, 214.0, 136.0, 91.0, 64.0, 55.0, 34.0, 25.0, 20.0, 20.0, 11.0, 8.0, 9.0, 4.0, 9.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.616455078125, -20.82666015625, -20.036865234375, -19.2470703125, -18.457275390625, -17.66748046875, -16.877685546875, -16.087890625, -15.298095703125, -14.50830078125, -13.718505859375, -12.9287109375, -12.138916015625, -11.34912109375, -10.559326171875, -9.76953125, -8.979736328125, -8.18994140625, -7.400146484375, -6.6103515625, -5.820556640625, -5.03076171875, -4.240966796875, -3.451171875, -2.661376953125, -1.87158203125, -1.081787109375, -0.2919921875, 0.497802734375, 1.28759765625, 2.077392578125, 2.8671875, 3.656982421875, 4.44677734375, 5.236572265625, 6.0263671875, 6.816162109375, 7.60595703125, 8.395751953125, 9.185546875, 9.975341796875, 10.76513671875, 11.554931640625, 12.3447265625, 13.134521484375, 13.92431640625, 14.714111328125, 15.50390625, 16.293701171875, 17.08349609375, 17.873291015625, 18.6630859375, 19.452880859375, 20.24267578125, 21.032470703125, 21.822265625, 22.612060546875, 23.40185546875, 24.191650390625, 24.9814453125, 25.771240234375, 26.56103515625, 27.350830078125, 28.140625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 3.0, 13.0, 10.0, 14.0, 21.0, 21.0, 27.0, 25.0, 38.0, 51.0, 56.0, 69.0, 62.0, 79.0, 2089.0, 68.0, 61.0, 58.0, 47.0, 50.0, 40.0, 31.0, 24.0, 20.0, 13.0, 16.0, 17.0, 12.0, 5.0, 1.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-177.5, -170.978515625, -164.45703125, -157.935546875, -151.4140625, -144.892578125, -138.37109375, -131.849609375, -125.328125, -118.806640625, -112.28515625, -105.763671875, -99.2421875, -92.720703125, -86.19921875, -79.677734375, -73.15625, -66.634765625, -60.11328125, -53.591796875, -47.0703125, -40.548828125, -34.02734375, -27.505859375, -20.984375, -14.462890625, -7.94140625, -1.419921875, 5.1015625, 11.623046875, 18.14453125, 24.666015625, 31.1875, 37.708984375, 44.23046875, 50.751953125, 57.2734375, 63.794921875, 70.31640625, 76.837890625, 83.359375, 89.880859375, 96.40234375, 102.923828125, 109.4453125, 115.966796875, 122.48828125, 129.009765625, 135.53125, 142.052734375, 148.57421875, 155.095703125, 161.6171875, 168.138671875, 174.66015625, 181.181640625, 187.703125, 194.224609375, 200.74609375, 207.267578125, 213.7890625, 220.310546875, 226.83203125, 233.353515625, 239.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 4.0, 9.0, 14.0, 16.0, 42.0, 45.0, 92.0, 125.0, 245.0, 445.0, 1147.0, 3703.0, 21451.0, 369963.0, 2701984.0, 38615.0, 5158.0, 1416.0, 586.0, 253.0, 146.0, 83.0, 57.0, 31.0, 25.0, 11.0, 8.0, 5.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.765625, -23.943359375, -23.12109375, -22.298828125, -21.4765625, -20.654296875, -19.83203125, -19.009765625, -18.1875, -17.365234375, -16.54296875, -15.720703125, -14.8984375, -14.076171875, -13.25390625, -12.431640625, -11.609375, -10.787109375, -9.96484375, -9.142578125, -8.3203125, -7.498046875, -6.67578125, -5.853515625, -5.03125, -4.208984375, -3.38671875, -2.564453125, -1.7421875, -0.919921875, -0.09765625, 0.724609375, 1.546875, 2.369140625, 3.19140625, 4.013671875, 4.8359375, 5.658203125, 6.48046875, 7.302734375, 8.125, 8.947265625, 9.76953125, 10.591796875, 11.4140625, 12.236328125, 13.05859375, 13.880859375, 14.703125, 15.525390625, 16.34765625, 17.169921875, 17.9921875, 18.814453125, 19.63671875, 20.458984375, 21.28125, 22.103515625, 22.92578125, 23.748046875, 24.5703125, 25.392578125, 26.21484375, 27.037109375, 27.859375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 6.0, 17.0, 30.0, 47.0, 61.0, 146.0, 197.0, 171.0, 129.0, 65.0, 40.0, 22.0, 14.0, 10.0, 9.0, 2.0, 5.0, 5.0, 3.0, 6.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-302.72509765625, -294.0524597167969, -285.3797912597656, -276.7071533203125, -268.03448486328125, -259.3618469238281, -250.68917846679688, -242.01654052734375, -233.3438720703125, -224.6712188720703, -215.99856567382812, -207.32591247558594, -198.65325927734375, -189.98060607910156, -181.30795288085938, -172.63531494140625, -163.96266174316406, -155.29000854492188, -146.6173553466797, -137.9447021484375, -129.2720489501953, -120.59939575195312, -111.92675018310547, -103.25409698486328, -94.5814437866211, -85.9087905883789, -77.23613739013672, -68.56349182128906, -59.89083480834961, -51.21818161010742, -42.5455322265625, -33.87287902832031, -25.200210571289062, -16.527557373046875, -7.85490608215332, 0.8177452087402344, 9.490398406982422, 18.16305160522461, 26.83570098876953, 35.50835418701172, 44.181007385253906, 52.853660583496094, 61.52631378173828, 70.19895935058594, 78.87161254882812, 87.54426574707031, 96.2169189453125, 104.88957214355469, 113.56222534179688, 122.23487854003906, 130.90753173828125, 139.58018493652344, 148.25283813476562, 156.9254913330078, 165.59814453125, 174.27078247070312, 182.94345092773438, 191.61610412597656, 200.28875732421875, 208.96141052246094, 217.63406372070312, 226.3067169189453, 234.9793701171875, 243.65200805664062, 252.3246612548828]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 5.0, 6.0, 2.0, 8.0, 10.0, 16.0, 10.0, 10.0, 14.0, 17.0, 25.0, 23.0, 25.0, 35.0, 43.0, 36.0, 42.0, 41.0, 38.0, 43.0, 45.0, 47.0, 38.0, 49.0, 38.0, 54.0, 42.0, 32.0, 27.0, 28.0, 32.0, 19.0, 17.0, 18.0, 16.0, 11.0, 5.0, 7.0, 5.0, 12.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-215.72418212890625, -208.71995544433594, -201.71572875976562, -194.71148681640625, -187.70726013183594, -180.70303344726562, -173.69879150390625, -166.69456481933594, -159.69033813476562, -152.6861114501953, -145.681884765625, -138.67764282226562, -131.6734161376953, -124.669189453125, -117.66495513916016, -110.66072082519531, -103.656494140625, -96.65226745605469, -89.64803314208984, -82.643798828125, -75.63957214355469, -68.63534545898438, -61.63111114501953, -54.62688064575195, -47.622650146484375, -40.6184196472168, -33.61418914794922, -26.60995864868164, -19.605728149414062, -12.601497650146484, -5.597267150878906, 1.4069633483886719, 8.411209106445312, 15.41543960571289, 22.41967010498047, 29.423900604248047, 36.428131103515625, 43.4323616027832, 50.43659210205078, 57.44082260131836, 64.44505310058594, 71.44927978515625, 78.4535140991211, 85.45774841308594, 92.46197509765625, 99.46620178222656, 106.4704360961914, 113.47467041015625, 120.47889709472656, 127.48312377929688, 134.48736572265625, 141.49159240722656, 148.49581909179688, 155.5000457763672, 162.5042724609375, 169.50851440429688, 176.5127410888672, 183.5169677734375, 190.52120971679688, 197.5254364013672, 204.5296630859375, 211.5338897705078, 218.53811645507812, 225.5423583984375, 232.5465850830078]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 6.0, 8.0, 4.0, 16.0, 13.0, 16.0, 25.0, 34.0, 49.0, 49.0, 68.0, 80.0, 116.0, 155.0, 190.0, 279.0, 426.0, 607.0, 1162.0, 2007.0, 4191.0, 8921.0, 1015063.0, 7125.0, 3360.0, 1669.0, 935.0, 563.0, 354.0, 268.0, 188.0, 134.0, 88.0, 84.0, 70.0, 58.0, 31.0, 35.0, 24.0, 25.0, 21.0, 10.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0], "bins": [-49.940921783447266, -48.34784698486328, -46.75477600097656, -45.16170120239258, -43.568626403808594, -41.975555419921875, -40.38248062133789, -38.789405822753906, -37.19633483886719, -35.6032600402832, -34.010189056396484, -32.4171142578125, -30.82404136657715, -29.230968475341797, -27.637893676757812, -26.04482078552246, -24.45174789428711, -22.858675003051758, -21.265602111816406, -19.672527313232422, -18.07945442199707, -16.48638153076172, -14.89330768585205, -13.300233840942383, -11.707160949707031, -10.11408805847168, -8.521014213562012, -6.927940845489502, -5.334867477416992, -3.7417941093444824, -2.1487207412719727, -0.5556468963623047, 1.0374298095703125, 2.6305031776428223, 4.223576545715332, 5.816649913787842, 7.409723281860352, 9.002796173095703, 10.595870018005371, 12.188943862915039, 13.78201675415039, 15.375089645385742, 16.968162536621094, 18.561237335205078, 20.15431022644043, 21.74738311767578, 23.340457916259766, 24.933530807495117, 26.52660369873047, 28.11967658996582, 29.712749481201172, 31.305824279785156, 32.898895263671875, 34.49197006225586, 36.085044860839844, 37.67811584472656, 39.27119064331055, 40.86426544189453, 42.45733642578125, 44.050411224365234, 45.64348602294922, 47.23655700683594, 48.82963180541992, 50.422706604003906, 52.015777587890625]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 5.0, 5.0, 4.0, 8.0, 4.0, 13.0, 14.0, 23.0, 29.0, 53.0, 180.0, 5312.0, 51455360.0, 1881.0, 131.0, 49.0, 33.0, 16.0, 12.0, 6.0, 5.0, 3.0, 7.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-897.4190063476562, -872.0631103515625, -846.7071533203125, -821.3511962890625, -795.9953002929688, -770.639404296875, -745.283447265625, -719.927490234375, -694.5715942382812, -669.2156982421875, -643.8597412109375, -618.5037841796875, -593.1478881835938, -567.7919921875, -542.43603515625, -517.080078125, -491.72418212890625, -466.3682556152344, -441.0123291015625, -415.6564025878906, -390.30047607421875, -364.9445495605469, -339.588623046875, -314.2326965332031, -288.87677001953125, -263.5208435058594, -238.1649169921875, -212.80899047851562, -187.45306396484375, -162.09713745117188, -136.7412109375, -111.38528442382812, -86.02935791015625, -60.673431396484375, -35.3175048828125, -9.961578369140625, 15.39434814453125, 40.750274658203125, 66.106201171875, 91.46212768554688, 116.81805419921875, 142.17398071289062, 167.5299072265625, 192.88583374023438, 218.24176025390625, 243.59768676757812, 268.95361328125, 294.3095397949219, 319.66546630859375, 345.0213928222656, 370.3773193359375, 395.7332458496094, 421.08917236328125, 446.4450988769531, 471.801025390625, 497.1569519042969, 522.5128784179688, 547.8687744140625, 573.2247314453125, 598.5806884765625, 623.9365844726562, 649.29248046875, 674.6484375, 700.00439453125, 725.3602905273438]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 8.0, 11.0, 13.0, 28.0, 51.0, 78.0, 87.0, 157.0, 237.0, 375.0, 577.0, 990.0, 1642.0, 2773.0, 4907.0, 8870.0, 16543.0, 32900.0, 69026.0, 159870.0, 420533.0, 1644468.0, 3003889.0, 551408.0, 202637.0, 85715.0, 39533.0, 19787.0, 10390.0, 5792.0, 3250.0, 1839.0, 1139.0, 684.0, 445.0, 277.0, 173.0, 113.0, 74.0, 39.0, 34.0, 25.0, 21.0, 7.0, 10.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-32.875, -31.8828125, -30.890625, -29.8984375, -28.90625, -27.9140625, -26.921875, -25.9296875, -24.9375, -23.9453125, -22.953125, -21.9609375, -20.96875, -19.9765625, -18.984375, -17.9921875, -17.0, -16.0078125, -15.015625, -14.0234375, -13.03125, -12.0390625, -11.046875, -10.0546875, -9.0625, -8.0703125, -7.078125, -6.0859375, -5.09375, -4.1015625, -3.109375, -2.1171875, -1.125, -0.1328125, 0.859375, 1.8515625, 2.84375, 3.8359375, 4.828125, 5.8203125, 6.8125, 7.8046875, 8.796875, 9.7890625, 10.78125, 11.7734375, 12.765625, 13.7578125, 14.75, 15.7421875, 16.734375, 17.7265625, 18.71875, 19.7109375, 20.703125, 21.6953125, 22.6875, 23.6796875, 24.671875, 25.6640625, 26.65625, 27.6484375, 28.640625, 29.6328125, 30.625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 3.0, 5.0, 11.0, 10.0, 11.0, 18.0, 16.0, 11.0, 25.0, 26.0, 23.0, 26.0, 27.0, 38.0, 33.0, 61.0, 54.0, 88.0, 133.0, 222.0, 364.0, 265.0, 102.0, 71.0, 36.0, 40.0, 37.0, 33.0, 34.0, 28.0, 21.0, 19.0, 21.0, 15.0, 17.0, 14.0, 11.0, 9.0, 8.0, 5.0, 7.0, 3.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-34.15625, -33.0751953125, -31.994140625, -30.9130859375, -29.83203125, -28.7509765625, -27.669921875, -26.5888671875, -25.5078125, -24.4267578125, -23.345703125, -22.2646484375, -21.18359375, -20.1025390625, -19.021484375, -17.9404296875, -16.859375, -15.7783203125, -14.697265625, -13.6162109375, -12.53515625, -11.4541015625, -10.373046875, -9.2919921875, -8.2109375, -7.1298828125, -6.048828125, -4.9677734375, -3.88671875, -2.8056640625, -1.724609375, -0.6435546875, 0.4375, 1.5185546875, 2.599609375, 3.6806640625, 4.76171875, 5.8427734375, 6.923828125, 8.0048828125, 9.0859375, 10.1669921875, 11.248046875, 12.3291015625, 13.41015625, 14.4912109375, 15.572265625, 16.6533203125, 17.734375, 18.8154296875, 19.896484375, 20.9775390625, 22.05859375, 23.1396484375, 24.220703125, 25.3017578125, 26.3828125, 27.4638671875, 28.544921875, 29.6259765625, 30.70703125, 31.7880859375, 32.869140625, 33.9501953125, 35.03125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [6.0, 6.0, 7.0, 11.0, 23.0, 37.0, 59.0, 82.0, 108.0, 185.0, 253.0, 373.0, 493.0, 777.0, 1042.0, 1573.0, 2316.0, 3340.0, 4770.0, 7088.0, 10999.0, 17356.0, 26704.0, 42972.0, 69220.0, 111773.0, 182478.0, 294768.0, 523525.0, 2453482.0, 1427437.0, 428126.0, 257382.0, 159093.0, 97405.0, 59926.0, 37336.0, 23766.0, 14989.0, 9900.0, 6644.0, 4404.0, 2905.0, 1935.0, 1355.0, 901.0, 675.0, 445.0, 319.0, 219.0, 163.0, 102.0, 63.0, 55.0, 32.0, 15.0, 13.0, 5.0, 9.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-9.453125, -9.136474609375, -8.81982421875, -8.503173828125, -8.1865234375, -7.869873046875, -7.55322265625, -7.236572265625, -6.919921875, -6.603271484375, -6.28662109375, -5.969970703125, -5.6533203125, -5.336669921875, -5.02001953125, -4.703369140625, -4.38671875, -4.070068359375, -3.75341796875, -3.436767578125, -3.1201171875, -2.803466796875, -2.48681640625, -2.170166015625, -1.853515625, -1.536865234375, -1.22021484375, -0.903564453125, -0.5869140625, -0.270263671875, 0.04638671875, 0.363037109375, 0.6796875, 0.996337890625, 1.31298828125, 1.629638671875, 1.9462890625, 2.262939453125, 2.57958984375, 2.896240234375, 3.212890625, 3.529541015625, 3.84619140625, 4.162841796875, 4.4794921875, 4.796142578125, 5.11279296875, 5.429443359375, 5.74609375, 6.062744140625, 6.37939453125, 6.696044921875, 7.0126953125, 7.329345703125, 7.64599609375, 7.962646484375, 8.279296875, 8.595947265625, 8.91259765625, 9.229248046875, 9.5458984375, 9.862548828125, 10.17919921875, 10.495849609375, 10.8125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 7.0, 12.0, 7.0, 12.0, 15.0, 11.0, 16.0, 21.0, 18.0, 30.0, 30.0, 36.0, 27.0, 42.0, 53.0, 56.0, 69.0, 115.0, 448.0, 452.0, 134.0, 52.0, 42.0, 38.0, 49.0, 28.0, 16.0, 30.0, 24.0, 17.0, 20.0, 17.0, 13.0, 12.0, 9.0, 8.0, 10.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.65625, -49.9892578125, -48.322265625, -46.6552734375, -44.98828125, -43.3212890625, -41.654296875, -39.9873046875, -38.3203125, -36.6533203125, -34.986328125, -33.3193359375, -31.65234375, -29.9853515625, -28.318359375, -26.6513671875, -24.984375, -23.3173828125, -21.650390625, -19.9833984375, -18.31640625, -16.6494140625, -14.982421875, -13.3154296875, -11.6484375, -9.9814453125, -8.314453125, -6.6474609375, -4.98046875, -3.3134765625, -1.646484375, 0.0205078125, 1.6875, 3.3544921875, 5.021484375, 6.6884765625, 8.35546875, 10.0224609375, 11.689453125, 13.3564453125, 15.0234375, 16.6904296875, 18.357421875, 20.0244140625, 21.69140625, 23.3583984375, 25.025390625, 26.6923828125, 28.359375, 30.0263671875, 31.693359375, 33.3603515625, 35.02734375, 36.6943359375, 38.361328125, 40.0283203125, 41.6953125, 43.3623046875, 45.029296875, 46.6962890625, 48.36328125, 50.0302734375, 51.697265625, 53.3642578125, 55.03125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 0.0, 7.0, 10.0, 8.0, 6.0, 9.0, 20.0, 23.0, 27.0, 29.0, 58.0, 83.0, 113.0, 134.0, 161.0, 238.0, 315.0, 433.0, 618.0, 997.0, 1620.0, 2949.0, 5579.0, 12426.0, 31712.0, 91881.0, 5487559.0, 516704.0, 84390.0, 29232.0, 11628.0, 5113.0, 2715.0, 1518.0, 901.0, 629.0, 392.0, 271.0, 200.0, 173.0, 139.0, 107.0, 87.0, 69.0, 52.0, 31.0, 17.0, 11.0, 14.0, 12.0, 12.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-62.65625, -60.63232421875, -58.6083984375, -56.58447265625, -54.560546875, -52.53662109375, -50.5126953125, -48.48876953125, -46.46484375, -44.44091796875, -42.4169921875, -40.39306640625, -38.369140625, -36.34521484375, -34.3212890625, -32.29736328125, -30.2734375, -28.24951171875, -26.2255859375, -24.20166015625, -22.177734375, -20.15380859375, -18.1298828125, -16.10595703125, -14.08203125, -12.05810546875, -10.0341796875, -8.01025390625, -5.986328125, -3.96240234375, -1.9384765625, 0.08544921875, 2.109375, 4.13330078125, 6.1572265625, 8.18115234375, 10.205078125, 12.22900390625, 14.2529296875, 16.27685546875, 18.30078125, 20.32470703125, 22.3486328125, 24.37255859375, 26.396484375, 28.42041015625, 30.4443359375, 32.46826171875, 34.4921875, 36.51611328125, 38.5400390625, 40.56396484375, 42.587890625, 44.61181640625, 46.6357421875, 48.65966796875, 50.68359375, 52.70751953125, 54.7314453125, 56.75537109375, 58.779296875, 60.80322265625, 62.8271484375, 64.85107421875, 66.875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 2.0, 6.0, 8.0, 11.0, 7.0, 14.0, 12.0, 17.0, 24.0, 19.0, 24.0, 27.0, 31.0, 25.0, 43.0, 33.0, 36.0, 46.0, 66.0, 279.0, 705.0, 130.0, 45.0, 37.0, 46.0, 44.0, 31.0, 32.0, 29.0, 34.0, 22.0, 24.0, 17.0, 16.0, 7.0, 17.0, 10.0, 10.0, 6.0, 7.0, 8.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-99.0, -96.025390625, -93.05078125, -90.076171875, -87.1015625, -84.126953125, -81.15234375, -78.177734375, -75.203125, -72.228515625, -69.25390625, -66.279296875, -63.3046875, -60.330078125, -57.35546875, -54.380859375, -51.40625, -48.431640625, -45.45703125, -42.482421875, -39.5078125, -36.533203125, -33.55859375, -30.583984375, -27.609375, -24.634765625, -21.66015625, -18.685546875, -15.7109375, -12.736328125, -9.76171875, -6.787109375, -3.8125, -0.837890625, 2.13671875, 5.111328125, 8.0859375, 11.060546875, 14.03515625, 17.009765625, 19.984375, 22.958984375, 25.93359375, 28.908203125, 31.8828125, 34.857421875, 37.83203125, 40.806640625, 43.78125, 46.755859375, 49.73046875, 52.705078125, 55.6796875, 58.654296875, 61.62890625, 64.603515625, 67.578125, 70.552734375, 73.52734375, 76.501953125, 79.4765625, 82.451171875, 85.42578125, 88.400390625, 91.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 20.0, 109.0, 750.0, 83.0, 15.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1551.8057861328125, -1513.3818359375, -1474.957763671875, -1436.5338134765625, -1398.10986328125, -1359.6859130859375, -1321.261962890625, -1282.837890625, -1244.4139404296875, -1205.989990234375, -1167.56591796875, -1129.1419677734375, -1090.718017578125, -1052.2940673828125, -1013.8700561523438, -975.446044921875, -937.0220947265625, -898.59814453125, -860.1741333007812, -821.7501220703125, -783.326171875, -744.9022216796875, -706.4782104492188, -668.05419921875, -629.6302490234375, -591.206298828125, -552.7822875976562, -514.3582763671875, -475.934326171875, -437.5103454589844, -399.08636474609375, -360.6623840332031, -322.238525390625, -283.8145446777344, -245.39056396484375, -206.96658325195312, -168.5426025390625, -130.11862182617188, -91.69464111328125, -53.270660400390625, -14.8466796875, 23.577301025390625, 62.00128173828125, 100.42526245117188, 138.8492431640625, 177.27322387695312, 215.69720458984375, 254.12118530273438, 292.545166015625, 330.9691467285156, 369.39312744140625, 407.8171081542969, 446.2410888671875, 484.6650695800781, 523.0890502929688, 561.5130615234375, 599.93701171875, 638.3609619140625, 676.7849731445312, 715.208984375, 753.6329345703125, 792.056884765625, 830.4808959960938, 868.9049072265625, 907.328857421875]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 6.0, 6.0, 9.0, 16.0, 17.0, 18.0, 26.0, 31.0, 76.0, 201.0, 243.0, 148.0, 72.0, 25.0, 19.0, 10.0, 13.0, 15.0, 10.0, 6.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-613.2197265625, -595.3973388671875, -577.574951171875, -559.7526245117188, -541.9302368164062, -524.1078491210938, -506.2854919433594, -488.463134765625, -470.6407470703125, -452.818359375, -434.9960021972656, -417.17364501953125, -399.35125732421875, -381.52886962890625, -363.7065124511719, -345.8841552734375, -328.061767578125, -310.2393798828125, -292.4170227050781, -274.59466552734375, -256.77227783203125, -238.9499053955078, -221.12753295898438, -203.30516052246094, -185.4827880859375, -167.66041564941406, -149.83804321289062, -132.0156707763672, -114.19329833984375, -96.37092590332031, -78.54855346679688, -60.72618103027344, -42.90380859375, -25.081436157226562, -7.259063720703125, 10.563308715820312, 28.38568115234375, 46.20805358886719, 64.03042602539062, 81.85279846191406, 99.6751708984375, 117.49754333496094, 135.31991577148438, 153.1422882080078, 170.96466064453125, 188.7870330810547, 206.60940551757812, 224.43177795410156, 242.254150390625, 260.0765380859375, 277.8988952636719, 295.72125244140625, 313.54364013671875, 331.36602783203125, 349.1883850097656, 367.0107421875, 384.8331298828125, 402.655517578125, 420.4778747558594, 438.30023193359375, 456.12261962890625, 473.94500732421875, 491.7673645019531, 509.5897216796875, 527.412109375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 6.0, 5.0, 8.0, 16.0, 13.0, 14.0, 19.0, 34.0, 28.0, 53.0, 58.0, 98.0, 160.0, 182.0, 278.0, 415.0, 585.0, 904.0, 1510.0, 2471.0, 4378.0, 8911.0, 24156.0, 217378.0, 3872781.0, 36909.0, 11135.0, 5067.0, 2731.0, 1518.0, 889.0, 523.0, 337.0, 238.0, 172.0, 95.0, 71.0, 36.0, 27.0, 21.0, 12.0, 12.0, 14.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0], "bins": [-4.3671875, -4.255645751953125, -4.14410400390625, -4.032562255859375, -3.9210205078125, -3.809478759765625, -3.69793701171875, -3.586395263671875, -3.474853515625, -3.363311767578125, -3.25177001953125, -3.140228271484375, -3.0286865234375, -2.917144775390625, -2.80560302734375, -2.694061279296875, -2.58251953125, -2.470977783203125, -2.35943603515625, -2.247894287109375, -2.1363525390625, -2.024810791015625, -1.91326904296875, -1.801727294921875, -1.690185546875, -1.578643798828125, -1.46710205078125, -1.355560302734375, -1.2440185546875, -1.132476806640625, -1.02093505859375, -0.909393310546875, -0.7978515625, -0.686309814453125, -0.57476806640625, -0.463226318359375, -0.3516845703125, -0.240142822265625, -0.12860107421875, -0.017059326171875, 0.094482421875, 0.206024169921875, 0.31756591796875, 0.429107666015625, 0.5406494140625, 0.652191162109375, 0.76373291015625, 0.875274658203125, 0.98681640625, 1.098358154296875, 1.20989990234375, 1.321441650390625, 1.4329833984375, 1.544525146484375, 1.65606689453125, 1.767608642578125, 1.879150390625, 1.990692138671875, 2.10223388671875, 2.213775634765625, 2.3253173828125, 2.436859130859375, 2.54840087890625, 2.659942626953125, 2.771484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 5.0, 3.0, 5.0, 4.0, 5.0, 8.0, 6.0, 5.0, 4.0, 10.0, 13.0, 13.0, 7.0, 13.0, 359.0, 425.0, 14.0, 9.0, 13.0, 16.0, 6.0, 8.0, 7.0, 6.0, 2.0, 6.0, 2.0, 6.0, 2.0, 2.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.59375, -1.5505523681640625, -1.507354736328125, -1.4641571044921875, -1.42095947265625, -1.3777618408203125, -1.334564208984375, -1.2913665771484375, -1.2481689453125, -1.2049713134765625, -1.161773681640625, -1.1185760498046875, -1.07537841796875, -1.0321807861328125, -0.988983154296875, -0.9457855224609375, -0.902587890625, -0.8593902587890625, -0.816192626953125, -0.7729949951171875, -0.72979736328125, -0.6865997314453125, -0.643402099609375, -0.6002044677734375, -0.5570068359375, -0.5138092041015625, -0.470611572265625, -0.4274139404296875, -0.38421630859375, -0.3410186767578125, -0.297821044921875, -0.2546234130859375, -0.21142578125, -0.1682281494140625, -0.125030517578125, -0.0818328857421875, -0.03863525390625, 0.0045623779296875, 0.047760009765625, 0.0909576416015625, 0.1341552734375, 0.1773529052734375, 0.220550537109375, 0.2637481689453125, 0.30694580078125, 0.3501434326171875, 0.393341064453125, 0.4365386962890625, 0.479736328125, 0.5229339599609375, 0.566131591796875, 0.6093292236328125, 0.65252685546875, 0.6957244873046875, 0.738922119140625, 0.7821197509765625, 0.8253173828125, 0.8685150146484375, 0.911712646484375, 0.9549102783203125, 0.99810791015625, 1.0413055419921875, 1.084503173828125, 1.1277008056640625, 1.1708984375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 7.0, 3.0, 20.0, 25.0, 38.0, 71.0, 93.0, 173.0, 299.0, 547.0, 1139.0, 2731.0, 8497.0, 35099.0, 365108.0, 3658598.0, 95696.0, 17398.0, 5059.0, 1890.0, 825.0, 380.0, 220.0, 135.0, 83.0, 52.0, 33.0, 20.0, 10.0, 11.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 2.0], "bins": [-8.4375, -8.21099853515625, -7.9844970703125, -7.75799560546875, -7.531494140625, -7.30499267578125, -7.0784912109375, -6.85198974609375, -6.62548828125, -6.39898681640625, -6.1724853515625, -5.94598388671875, -5.719482421875, -5.49298095703125, -5.2664794921875, -5.03997802734375, -4.8134765625, -4.58697509765625, -4.3604736328125, -4.13397216796875, -3.907470703125, -3.68096923828125, -3.4544677734375, -3.22796630859375, -3.00146484375, -2.77496337890625, -2.5484619140625, -2.32196044921875, -2.095458984375, -1.86895751953125, -1.6424560546875, -1.41595458984375, -1.189453125, -0.96295166015625, -0.7364501953125, -0.50994873046875, -0.283447265625, -0.05694580078125, 0.1695556640625, 0.39605712890625, 0.62255859375, 0.84906005859375, 1.0755615234375, 1.30206298828125, 1.528564453125, 1.75506591796875, 1.9815673828125, 2.20806884765625, 2.4345703125, 2.66107177734375, 2.8875732421875, 3.11407470703125, 3.340576171875, 3.56707763671875, 3.7935791015625, 4.02008056640625, 4.24658203125, 4.47308349609375, 4.6995849609375, 4.92608642578125, 5.152587890625, 5.37908935546875, 5.6055908203125, 5.83209228515625, 6.05859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 3.0, 12.0, 7.0, 14.0, 21.0, 30.0, 42.0, 69.0, 138.0, 308.0, 1779.0, 1027.0, 252.0, 119.0, 83.0, 56.0, 30.0, 19.0, 17.0, 9.0, 12.0, 7.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.65625, -2.584228515625, -2.51220703125, -2.440185546875, -2.3681640625, -2.296142578125, -2.22412109375, -2.152099609375, -2.080078125, -2.008056640625, -1.93603515625, -1.864013671875, -1.7919921875, -1.719970703125, -1.64794921875, -1.575927734375, -1.50390625, -1.431884765625, -1.35986328125, -1.287841796875, -1.2158203125, -1.143798828125, -1.07177734375, -0.999755859375, -0.927734375, -0.855712890625, -0.78369140625, -0.711669921875, -0.6396484375, -0.567626953125, -0.49560546875, -0.423583984375, -0.3515625, -0.279541015625, -0.20751953125, -0.135498046875, -0.0634765625, 0.008544921875, 0.08056640625, 0.152587890625, 0.224609375, 0.296630859375, 0.36865234375, 0.440673828125, 0.5126953125, 0.584716796875, 0.65673828125, 0.728759765625, 0.80078125, 0.872802734375, 0.94482421875, 1.016845703125, 1.0888671875, 1.160888671875, 1.23291015625, 1.304931640625, 1.376953125, 1.448974609375, 1.52099609375, 1.593017578125, 1.6650390625, 1.737060546875, 1.80908203125, 1.881103515625, 1.953125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 8.0, 18.0, 27.0, 51.0, 111.0, 225.0, 244.0, 161.0, 77.0, 33.0, 19.0, 10.0, 11.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.901721954345703, -11.459807395935059, -11.017892837524414, -10.575979232788086, -10.134064674377441, -9.692150115966797, -9.250235557556152, -8.808320999145508, -8.366406440734863, -7.924491882324219, -7.482577800750732, -7.040663242340088, -6.598748683929443, -6.156834602355957, -5.7149200439453125, -5.273005485534668, -4.831091403961182, -4.389176845550537, -3.9472625255584717, -3.5053482055664062, -3.0634336471557617, -2.6215193271636963, -2.179605007171631, -1.7376904487609863, -1.295776128768921, -0.8538616895675659, -0.4119473099708557, 0.029967069625854492, 0.4718815088272095, 0.9137959480285645, 1.3557102680206299, 1.7976248264312744, 2.23953914642334, 2.6814534664154053, 3.12336802482605, 3.5652823448181152, 4.00719690322876, 4.449110984802246, 4.891025543212891, 5.332940101623535, 5.77485466003418, 6.216769218444824, 6.6586833000183105, 7.100597858428955, 7.5425124168396, 7.984426498413086, 8.42634105682373, 8.868255615234375, 9.310169219970703, 9.752083778381348, 10.193998336791992, 10.63591194152832, 11.077826499938965, 11.51974105834961, 11.961655616760254, 12.403570175170898, 12.845484733581543, 13.287399291992188, 13.729313850402832, 14.171228408813477, 14.613142013549805, 15.05505657196045, 15.496971130371094, 15.938885688781738, 16.380800247192383]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 7.0, 6.0, 4.0, 9.0, 10.0, 11.0, 15.0, 19.0, 18.0, 26.0, 31.0, 48.0, 60.0, 53.0, 70.0, 56.0, 56.0, 68.0, 54.0, 50.0, 55.0, 45.0, 41.0, 42.0, 33.0, 26.0, 20.0, 18.0, 14.0, 14.0, 11.0, 9.0, 10.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.608412742614746, -5.394190311431885, -5.179967403411865, -4.965744972229004, -4.751522541046143, -4.537300109863281, -4.323077201843262, -4.1088547706604, -3.894632339477539, -3.6804096698760986, -3.4661872386932373, -3.251964569091797, -3.0377421379089355, -2.823519468307495, -2.6092967987060547, -2.3950743675231934, -2.180851697921753, -1.966629147529602, -1.7524065971374512, -1.5381839275360107, -1.3239614963531494, -1.109738826751709, -0.8955162763595581, -0.6812937259674072, -0.46707117557525635, -0.25284862518310547, -0.0386260449886322, 0.17559653520584106, 0.38981908559799194, 0.6040416955947876, 0.8182642459869385, 1.0324867963790894, 1.2467093467712402, 1.4609318971633911, 1.675154447555542, 1.8893771171569824, 2.1035995483398438, 2.317822217941284, 2.5320448875427246, 2.746267318725586, 2.9604897499084473, 3.1747124195098877, 3.388934850692749, 3.6031575202941895, 3.817379951477051, 4.03160285949707, 4.245825290679932, 4.460047721862793, 4.6742706298828125, 4.888493061065674, 5.102715969085693, 5.316938400268555, 5.531160831451416, 5.745383262634277, 5.959606170654297, 6.173828601837158, 6.3880510330200195, 6.602273464202881, 6.8164963722229, 7.030718803405762, 7.244941234588623, 7.459163665771484, 7.673386573791504, 7.887609004974365, 8.101831436157227]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 6.0, 7.0, 5.0, 11.0, 9.0, 19.0, 37.0, 44.0, 69.0, 89.0, 139.0, 206.0, 277.0, 450.0, 642.0, 965.0, 1627.0, 2458.0, 3771.0, 6410.0, 10569.0, 18903.0, 38092.0, 822589.0, 80870.0, 25236.0, 13774.0, 7921.0, 4802.0, 3043.0, 1899.0, 1193.0, 829.0, 519.0, 312.0, 242.0, 171.0, 105.0, 68.0, 54.0, 41.0, 26.0, 22.0, 4.0, 9.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.091796875, -2.98779296875, -2.8837890625, -2.77978515625, -2.67578125, -2.57177734375, -2.4677734375, -2.36376953125, -2.259765625, -2.15576171875, -2.0517578125, -1.94775390625, -1.84375, -1.73974609375, -1.6357421875, -1.53173828125, -1.427734375, -1.32373046875, -1.2197265625, -1.11572265625, -1.01171875, -0.90771484375, -0.8037109375, -0.69970703125, -0.595703125, -0.49169921875, -0.3876953125, -0.28369140625, -0.1796875, -0.07568359375, 0.0283203125, 0.13232421875, 0.236328125, 0.34033203125, 0.4443359375, 0.54833984375, 0.65234375, 0.75634765625, 0.8603515625, 0.96435546875, 1.068359375, 1.17236328125, 1.2763671875, 1.38037109375, 1.484375, 1.58837890625, 1.6923828125, 1.79638671875, 1.900390625, 2.00439453125, 2.1083984375, 2.21240234375, 2.31640625, 2.42041015625, 2.5244140625, 2.62841796875, 2.732421875, 2.83642578125, 2.9404296875, 3.04443359375, 3.1484375, 3.25244140625, 3.3564453125, 3.46044921875, 3.564453125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 1.0, 5.0, 8.0, 2.0, 5.0, 5.0, 8.0, 7.0, 10.0, 6.0, 13.0, 12.0, 20.0, 357.0, 407.0, 28.0, 13.0, 9.0, 11.0, 11.0, 10.0, 6.0, 7.0, 4.0, 4.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.7236328125, -1.67816162109375, -1.6326904296875, -1.58721923828125, -1.541748046875, -1.49627685546875, -1.4508056640625, -1.40533447265625, -1.35986328125, -1.31439208984375, -1.2689208984375, -1.22344970703125, -1.177978515625, -1.13250732421875, -1.0870361328125, -1.04156494140625, -0.99609375, -0.95062255859375, -0.9051513671875, -0.85968017578125, -0.814208984375, -0.76873779296875, -0.7232666015625, -0.67779541015625, -0.63232421875, -0.58685302734375, -0.5413818359375, -0.49591064453125, -0.450439453125, -0.40496826171875, -0.3594970703125, -0.31402587890625, -0.2685546875, -0.22308349609375, -0.1776123046875, -0.13214111328125, -0.086669921875, -0.04119873046875, 0.0042724609375, 0.04974365234375, 0.09521484375, 0.14068603515625, 0.1861572265625, 0.23162841796875, 0.277099609375, 0.32257080078125, 0.3680419921875, 0.41351318359375, 0.458984375, 0.50445556640625, 0.5499267578125, 0.59539794921875, 0.640869140625, 0.68634033203125, 0.7318115234375, 0.77728271484375, 0.82275390625, 0.86822509765625, 0.9136962890625, 0.95916748046875, 1.004638671875, 1.05010986328125, 1.0955810546875, 1.14105224609375, 1.1865234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 8.0, 4.0, 9.0, 11.0, 11.0, 19.0, 20.0, 28.0, 24.0, 37.0, 62.0, 75.0, 107.0, 125.0, 187.0, 285.0, 512.0, 988.0, 1820.0, 4015.0, 9121.0, 24217.0, 76149.0, 319819.0, 449685.0, 107714.0, 31950.0, 11698.0, 4796.0, 2157.0, 1111.0, 641.0, 327.0, 220.0, 153.0, 87.0, 81.0, 70.0, 51.0, 34.0, 29.0, 39.0, 19.0, 12.0, 7.0, 9.0, 6.0, 4.0, 3.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.43359375, -3.32330322265625, -3.2130126953125, -3.10272216796875, -2.992431640625, -2.88214111328125, -2.7718505859375, -2.66156005859375, -2.55126953125, -2.44097900390625, -2.3306884765625, -2.22039794921875, -2.110107421875, -1.99981689453125, -1.8895263671875, -1.77923583984375, -1.6689453125, -1.55865478515625, -1.4483642578125, -1.33807373046875, -1.227783203125, -1.11749267578125, -1.0072021484375, -0.89691162109375, -0.78662109375, -0.67633056640625, -0.5660400390625, -0.45574951171875, -0.345458984375, -0.23516845703125, -0.1248779296875, -0.01458740234375, 0.095703125, 0.20599365234375, 0.3162841796875, 0.42657470703125, 0.536865234375, 0.64715576171875, 0.7574462890625, 0.86773681640625, 0.97802734375, 1.08831787109375, 1.1986083984375, 1.30889892578125, 1.419189453125, 1.52947998046875, 1.6397705078125, 1.75006103515625, 1.8603515625, 1.97064208984375, 2.0809326171875, 2.19122314453125, 2.301513671875, 2.41180419921875, 2.5220947265625, 2.63238525390625, 2.74267578125, 2.85296630859375, 2.9632568359375, 3.07354736328125, 3.183837890625, 3.29412841796875, 3.4044189453125, 3.51470947265625, 3.625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 6.0, 9.0, 11.0, 14.0, 13.0, 15.0, 14.0, 26.0, 26.0, 26.0, 22.0, 36.0, 27.0, 50.0, 40.0, 33.0, 39.0, 34.0, 51.0, 40.0, 40.0, 35.0, 46.0, 31.0, 36.0, 27.0, 29.0, 38.0, 31.0, 29.0, 18.0, 14.0, 21.0, 12.0, 10.0, 9.0, 11.0, 11.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.99609375, -5.81610107421875, -5.6361083984375, -5.45611572265625, -5.276123046875, -5.09613037109375, -4.9161376953125, -4.73614501953125, -4.55615234375, -4.37615966796875, -4.1961669921875, -4.01617431640625, -3.836181640625, -3.65618896484375, -3.4761962890625, -3.29620361328125, -3.1162109375, -2.93621826171875, -2.7562255859375, -2.57623291015625, -2.396240234375, -2.21624755859375, -2.0362548828125, -1.85626220703125, -1.67626953125, -1.49627685546875, -1.3162841796875, -1.13629150390625, -0.956298828125, -0.77630615234375, -0.5963134765625, -0.41632080078125, -0.236328125, -0.05633544921875, 0.1236572265625, 0.30364990234375, 0.483642578125, 0.66363525390625, 0.8436279296875, 1.02362060546875, 1.20361328125, 1.38360595703125, 1.5635986328125, 1.74359130859375, 1.923583984375, 2.10357666015625, 2.2835693359375, 2.46356201171875, 2.6435546875, 2.82354736328125, 3.0035400390625, 3.18353271484375, 3.363525390625, 3.54351806640625, 3.7235107421875, 3.90350341796875, 4.08349609375, 4.26348876953125, 4.4434814453125, 4.62347412109375, 4.803466796875, 4.98345947265625, 5.1634521484375, 5.34344482421875, 5.5234375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 3.0, 5.0, 5.0, 4.0, 5.0, 10.0, 12.0, 24.0, 34.0, 57.0, 78.0, 93.0, 143.0, 235.0, 394.0, 633.0, 1179.0, 2302.0, 5090.0, 13431.0, 48191.0, 270333.0, 565702.0, 102408.0, 23333.0, 7880.0, 3249.0, 1570.0, 789.0, 474.0, 295.0, 167.0, 134.0, 79.0, 51.0, 50.0, 33.0, 23.0, 13.0, 12.0, 3.0, 8.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.642578125, -3.525970458984375, -3.40936279296875, -3.292755126953125, -3.1761474609375, -3.059539794921875, -2.94293212890625, -2.826324462890625, -2.709716796875, -2.593109130859375, -2.47650146484375, -2.359893798828125, -2.2432861328125, -2.126678466796875, -2.01007080078125, -1.893463134765625, -1.77685546875, -1.660247802734375, -1.54364013671875, -1.427032470703125, -1.3104248046875, -1.193817138671875, -1.07720947265625, -0.960601806640625, -0.843994140625, -0.727386474609375, -0.61077880859375, -0.494171142578125, -0.3775634765625, -0.260955810546875, -0.14434814453125, -0.027740478515625, 0.0888671875, 0.205474853515625, 0.32208251953125, 0.438690185546875, 0.5552978515625, 0.671905517578125, 0.78851318359375, 0.905120849609375, 1.021728515625, 1.138336181640625, 1.25494384765625, 1.371551513671875, 1.4881591796875, 1.604766845703125, 1.72137451171875, 1.837982177734375, 1.95458984375, 2.071197509765625, 2.18780517578125, 2.304412841796875, 2.4210205078125, 2.537628173828125, 2.65423583984375, 2.770843505859375, 2.887451171875, 3.004058837890625, 3.12066650390625, 3.237274169921875, 3.3538818359375, 3.470489501953125, 3.58709716796875, 3.703704833984375, 3.8203125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 4.0, 5.0, 8.0, 11.0, 12.0, 14.0, 24.0, 38.0, 34.0, 56.0, 65.0, 85.0, 79.0, 100.0, 115.0, 79.0, 76.0, 54.0, 31.0, 34.0, 21.0, 13.0, 19.0, 6.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002357959747314453, -0.00022902898490428925, -0.00022226199507713318, -0.0002154950052499771, -0.00020872801542282104, -0.00020196102559566498, -0.0001951940357685089, -0.00018842704594135284, -0.00018166005611419678, -0.0001748930662870407, -0.00016812607645988464, -0.00016135908663272858, -0.0001545920968055725, -0.00014782510697841644, -0.00014105811715126038, -0.0001342911273241043, -0.00012752413749694824, -0.00012075714766979218, -0.00011399015784263611, -0.00010722316801548004, -0.00010045617818832397, -9.368918836116791e-05, -8.692219853401184e-05, -8.015520870685577e-05, -7.338821887969971e-05, -6.662122905254364e-05, -5.985423922538757e-05, -5.3087249398231506e-05, -4.632025957107544e-05, -3.955326974391937e-05, -3.2786279916763306e-05, -2.601929008960724e-05, -1.9252300262451172e-05, -1.2485310435295105e-05, -5.718320608139038e-06, 1.0486692190170288e-06, 7.815659046173096e-06, 1.4582648873329163e-05, 2.134963870048523e-05, 2.8116628527641296e-05, 3.488361835479736e-05, 4.165060818195343e-05, 4.84175980091095e-05, 5.5184587836265564e-05, 6.195157766342163e-05, 6.87185674905777e-05, 7.548555731773376e-05, 8.225254714488983e-05, 8.90195369720459e-05, 9.578652679920197e-05, 0.00010255351662635803, 0.0001093205064535141, 0.00011608749628067017, 0.00012285448610782623, 0.0001296214759349823, 0.00013638846576213837, 0.00014315545558929443, 0.0001499224454164505, 0.00015668943524360657, 0.00016345642507076263, 0.0001702234148979187, 0.00017699040472507477, 0.00018375739455223083, 0.0001905243843793869, 0.00019729137420654297]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 4.0, 5.0, 5.0, 18.0, 33.0, 26.0, 41.0, 71.0, 111.0, 141.0, 268.0, 458.0, 823.0, 1585.0, 3690.0, 9222.0, 30927.0, 151174.0, 615077.0, 181762.0, 35064.0, 10134.0, 3962.0, 1788.0, 932.0, 462.0, 263.0, 166.0, 110.0, 73.0, 43.0, 34.0, 14.0, 20.0, 9.0, 8.0, 13.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0], "bins": [-4.15234375, -4.01641845703125, -3.8804931640625, -3.74456787109375, -3.608642578125, -3.47271728515625, -3.3367919921875, -3.20086669921875, -3.06494140625, -2.92901611328125, -2.7930908203125, -2.65716552734375, -2.521240234375, -2.38531494140625, -2.2493896484375, -2.11346435546875, -1.9775390625, -1.84161376953125, -1.7056884765625, -1.56976318359375, -1.433837890625, -1.29791259765625, -1.1619873046875, -1.02606201171875, -0.89013671875, -0.75421142578125, -0.6182861328125, -0.48236083984375, -0.346435546875, -0.21051025390625, -0.0745849609375, 0.06134033203125, 0.197265625, 0.33319091796875, 0.4691162109375, 0.60504150390625, 0.740966796875, 0.87689208984375, 1.0128173828125, 1.14874267578125, 1.28466796875, 1.42059326171875, 1.5565185546875, 1.69244384765625, 1.828369140625, 1.96429443359375, 2.1002197265625, 2.23614501953125, 2.3720703125, 2.50799560546875, 2.6439208984375, 2.77984619140625, 2.915771484375, 3.05169677734375, 3.1876220703125, 3.32354736328125, 3.45947265625, 3.59539794921875, 3.7313232421875, 3.86724853515625, 4.003173828125, 4.13909912109375, 4.2750244140625, 4.41094970703125, 4.546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 7.0, 4.0, 2.0, 1.0, 6.0, 6.0, 9.0, 12.0, 13.0, 27.0, 20.0, 33.0, 38.0, 61.0, 55.0, 78.0, 57.0, 82.0, 86.0, 77.0, 53.0, 63.0, 41.0, 41.0, 28.0, 31.0, 16.0, 16.0, 7.0, 8.0, 7.0, 3.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.377899169921875, -3.27142333984375, -3.164947509765625, -3.0584716796875, -2.951995849609375, -2.84552001953125, -2.739044189453125, -2.632568359375, -2.526092529296875, -2.41961669921875, -2.313140869140625, -2.2066650390625, -2.100189208984375, -1.99371337890625, -1.887237548828125, -1.78076171875, -1.674285888671875, -1.56781005859375, -1.461334228515625, -1.3548583984375, -1.248382568359375, -1.14190673828125, -1.035430908203125, -0.928955078125, -0.822479248046875, -0.71600341796875, -0.609527587890625, -0.5030517578125, -0.396575927734375, -0.29010009765625, -0.183624267578125, -0.0771484375, 0.029327392578125, 0.13580322265625, 0.242279052734375, 0.3487548828125, 0.455230712890625, 0.56170654296875, 0.668182373046875, 0.774658203125, 0.881134033203125, 0.98760986328125, 1.094085693359375, 1.2005615234375, 1.307037353515625, 1.41351318359375, 1.519989013671875, 1.62646484375, 1.732940673828125, 1.83941650390625, 1.945892333984375, 2.0523681640625, 2.158843994140625, 2.26531982421875, 2.371795654296875, 2.478271484375, 2.584747314453125, 2.69122314453125, 2.797698974609375, 2.9041748046875, 3.010650634765625, 3.11712646484375, 3.223602294921875, 3.330078125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 7.0, 8.0, 26.0, 76.0, 264.0, 383.0, 137.0, 50.0, 20.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-108.98988342285156, -106.40969848632812, -103.82950592041016, -101.24932098388672, -98.66912841796875, -96.08894348144531, -93.50875091552734, -90.9285659790039, -88.34837341308594, -85.7681884765625, -83.18799591064453, -80.6078109741211, -78.02761840820312, -75.44743347167969, -72.86724090576172, -70.28705596923828, -67.70687103271484, -65.1266860961914, -62.54649353027344, -59.966304779052734, -57.38611602783203, -54.805931091308594, -52.22574234008789, -49.64555358886719, -47.065364837646484, -44.48517608642578, -41.90498733520508, -39.324798583984375, -36.74461364746094, -34.16442108154297, -31.58423614501953, -29.004047393798828, -26.423851013183594, -23.84366226196289, -21.263473510742188, -18.683286666870117, -16.103097915649414, -13.522909164428711, -10.942721366882324, -8.362533569335938, -5.782344818115234, -3.2021565437316895, -0.6219682693481445, 1.9582200050354004, 4.538408279418945, 7.118597030639648, 9.698784828186035, 12.278972625732422, 14.859161376953125, 17.439350128173828, 20.01953887939453, 22.5997257232666, 25.179914474487305, 27.760103225708008, 30.340290069580078, 32.92047882080078, 35.500667572021484, 38.08085632324219, 40.66104507446289, 43.241233825683594, 45.82141876220703, 48.401611328125, 50.98179626464844, 53.56198501586914, 56.142173767089844]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 2.0, 4.0, 6.0, 6.0, 5.0, 7.0, 4.0, 13.0, 13.0, 14.0, 33.0, 61.0, 96.0, 111.0, 181.0, 151.0, 103.0, 49.0, 38.0, 27.0, 14.0, 13.0, 7.0, 7.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 2.0, 6.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-117.9508285522461, -114.4417953491211, -110.93275451660156, -107.42372131347656, -103.91468811035156, -100.40565490722656, -96.89661407470703, -93.38758087158203, -89.8785400390625, -86.3695068359375, -82.86046600341797, -79.35143280029297, -75.84239959716797, -72.33335876464844, -68.82432556152344, -65.31529235839844, -61.80625915527344, -58.29722213745117, -54.78818893432617, -51.279151916503906, -47.770118713378906, -44.26108169555664, -40.752044677734375, -37.243011474609375, -33.73397445678711, -30.224939346313477, -26.715904235839844, -23.206867218017578, -19.697832107543945, -16.188796997070312, -12.679759979248047, -9.170724868774414, -5.66168212890625, -2.152646541595459, 1.356389045715332, 4.865425109863281, 8.374460220336914, 11.883495330810547, 15.392532348632812, 18.901567459106445, 22.410602569580078, 25.91963768005371, 29.428672790527344, 32.93770980834961, 36.446746826171875, 39.955780029296875, 43.46481704711914, 46.973854064941406, 50.482887268066406, 53.99192428588867, 57.50095748901367, 61.00999450683594, 64.51902770996094, 68.02806091308594, 71.53710174560547, 75.04613494873047, 78.55517578125, 82.064208984375, 85.57324981689453, 89.08228302001953, 92.59131622314453, 96.10035705566406, 99.60939025878906, 103.11842346191406, 106.62745666503906]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 1.0, 4.0, 2.0, 7.0, 6.0, 10.0, 14.0, 18.0, 18.0, 28.0, 32.0, 50.0, 92.0, 133.0, 205.0, 321.0, 459.0, 826.0, 1204.0, 2034.0, 3607.0, 6870.0, 15675.0, 53143.0, 3891423.0, 173213.0, 25340.0, 9229.0, 4451.0, 2299.0, 1317.0, 871.0, 501.0, 316.0, 196.0, 112.0, 79.0, 50.0, 41.0, 30.0, 17.0, 9.0, 7.0, 9.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0], "bins": [-12.5625, -12.2381591796875, -11.913818359375, -11.5894775390625, -11.26513671875, -10.9407958984375, -10.616455078125, -10.2921142578125, -9.9677734375, -9.6434326171875, -9.319091796875, -8.9947509765625, -8.67041015625, -8.3460693359375, -8.021728515625, -7.6973876953125, -7.373046875, -7.0487060546875, -6.724365234375, -6.4000244140625, -6.07568359375, -5.7513427734375, -5.427001953125, -5.1026611328125, -4.7783203125, -4.4539794921875, -4.129638671875, -3.8052978515625, -3.48095703125, -3.1566162109375, -2.832275390625, -2.5079345703125, -2.18359375, -1.8592529296875, -1.534912109375, -1.2105712890625, -0.88623046875, -0.5618896484375, -0.237548828125, 0.0867919921875, 0.4111328125, 0.7354736328125, 1.059814453125, 1.3841552734375, 1.70849609375, 2.0328369140625, 2.357177734375, 2.6815185546875, 3.005859375, 3.3302001953125, 3.654541015625, 3.9788818359375, 4.30322265625, 4.6275634765625, 4.951904296875, 5.2762451171875, 5.6005859375, 5.9249267578125, 6.249267578125, 6.5736083984375, 6.89794921875, 7.2222900390625, 7.546630859375, 7.8709716796875, 8.1953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 7.0, 1.0, 9.0, 10.0, 14.0, 15.0, 34.0, 118.0, 303.0, 268.0, 91.0, 30.0, 19.0, 18.0, 12.0, 10.0, 5.0, 8.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.599609375, -1.557342529296875, -1.51507568359375, -1.472808837890625, -1.4305419921875, -1.388275146484375, -1.34600830078125, -1.303741455078125, -1.261474609375, -1.219207763671875, -1.17694091796875, -1.134674072265625, -1.0924072265625, -1.050140380859375, -1.00787353515625, -0.965606689453125, -0.92333984375, -0.881072998046875, -0.83880615234375, -0.796539306640625, -0.7542724609375, -0.712005615234375, -0.66973876953125, -0.627471923828125, -0.585205078125, -0.542938232421875, -0.50067138671875, -0.458404541015625, -0.4161376953125, -0.373870849609375, -0.33160400390625, -0.289337158203125, -0.2470703125, -0.204803466796875, -0.16253662109375, -0.120269775390625, -0.0780029296875, -0.035736083984375, 0.00653076171875, 0.048797607421875, 0.091064453125, 0.133331298828125, 0.17559814453125, 0.217864990234375, 0.2601318359375, 0.302398681640625, 0.34466552734375, 0.386932373046875, 0.42919921875, 0.471466064453125, 0.51373291015625, 0.555999755859375, 0.5982666015625, 0.640533447265625, 0.68280029296875, 0.725067138671875, 0.767333984375, 0.809600830078125, 0.85186767578125, 0.894134521484375, 0.9364013671875, 0.978668212890625, 1.02093505859375, 1.063201904296875, 1.10546875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 5.0, 5.0, 6.0, 15.0, 19.0, 39.0, 59.0, 86.0, 134.0, 253.0, 448.0, 835.0, 1773.0, 3754.0, 8830.0, 23859.0, 88629.0, 2599404.0, 1346608.0, 81207.0, 22474.0, 8545.0, 3673.0, 1717.0, 805.0, 424.0, 238.0, 153.0, 108.0, 40.0, 34.0, 30.0, 16.0, 12.0, 7.0, 5.0, 6.0, 5.0, 3.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.2890625, -8.02978515625, -7.7705078125, -7.51123046875, -7.251953125, -6.99267578125, -6.7333984375, -6.47412109375, -6.21484375, -5.95556640625, -5.6962890625, -5.43701171875, -5.177734375, -4.91845703125, -4.6591796875, -4.39990234375, -4.140625, -3.88134765625, -3.6220703125, -3.36279296875, -3.103515625, -2.84423828125, -2.5849609375, -2.32568359375, -2.06640625, -1.80712890625, -1.5478515625, -1.28857421875, -1.029296875, -0.77001953125, -0.5107421875, -0.25146484375, 0.0078125, 0.26708984375, 0.5263671875, 0.78564453125, 1.044921875, 1.30419921875, 1.5634765625, 1.82275390625, 2.08203125, 2.34130859375, 2.6005859375, 2.85986328125, 3.119140625, 3.37841796875, 3.6376953125, 3.89697265625, 4.15625, 4.41552734375, 4.6748046875, 4.93408203125, 5.193359375, 5.45263671875, 5.7119140625, 5.97119140625, 6.23046875, 6.48974609375, 6.7490234375, 7.00830078125, 7.267578125, 7.52685546875, 7.7861328125, 8.04541015625, 8.3046875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 3.0, 7.0, 5.0, 8.0, 15.0, 13.0, 13.0, 21.0, 28.0, 34.0, 52.0, 95.0, 99.0, 161.0, 376.0, 1479.0, 789.0, 273.0, 181.0, 121.0, 69.0, 54.0, 35.0, 27.0, 29.0, 15.0, 10.0, 13.0, 10.0, 11.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0068359375, -0.9731292724609375, -0.939422607421875, -0.9057159423828125, -0.87200927734375, -0.8383026123046875, -0.804595947265625, -0.7708892822265625, -0.7371826171875, -0.7034759521484375, -0.669769287109375, -0.6360626220703125, -0.60235595703125, -0.5686492919921875, -0.534942626953125, -0.5012359619140625, -0.467529296875, -0.4338226318359375, -0.400115966796875, -0.3664093017578125, -0.33270263671875, -0.2989959716796875, -0.265289306640625, -0.2315826416015625, -0.1978759765625, -0.1641693115234375, -0.130462646484375, -0.0967559814453125, -0.06304931640625, -0.0293426513671875, 0.004364013671875, 0.0380706787109375, 0.07177734375, 0.1054840087890625, 0.139190673828125, 0.1728973388671875, 0.20660400390625, 0.2403106689453125, 0.274017333984375, 0.3077239990234375, 0.3414306640625, 0.3751373291015625, 0.408843994140625, 0.4425506591796875, 0.47625732421875, 0.5099639892578125, 0.543670654296875, 0.5773773193359375, 0.611083984375, 0.6447906494140625, 0.678497314453125, 0.7122039794921875, 0.74591064453125, 0.7796173095703125, 0.813323974609375, 0.8470306396484375, 0.8807373046875, 0.9144439697265625, 0.948150634765625, 0.9818572998046875, 1.01556396484375, 1.0492706298828125, 1.082977294921875, 1.1166839599609375, 1.150390625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 8.0, 33.0, 123.0, 309.0, 333.0, 127.0, 34.0, 18.0, 10.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.074148178100586, -8.534034729003906, -7.993920803070068, -7.4538068771362305, -6.913693428039551, -6.373579978942871, -5.833466053009033, -5.293352127075195, -4.753238677978516, -4.213125228881836, -3.673011302947998, -3.1328976154327393, -2.5927839279174805, -2.0526702404022217, -1.512556552886963, -0.9724428653717041, -0.4323291778564453, 0.10778450965881348, 0.6478981971740723, 1.188011884689331, 1.7281255722045898, 2.2682392597198486, 2.8083529472351074, 3.348466634750366, 3.888580322265625, 4.428693771362305, 4.968807697296143, 5.5089216232299805, 6.04903507232666, 6.58914852142334, 7.129262447357178, 7.669376373291016, 8.209491729736328, 8.749605178833008, 9.289718627929688, 9.829833030700684, 10.369946479797363, 10.910059928894043, 11.450174331665039, 11.990287780761719, 12.530401229858398, 13.070514678955078, 13.610628128051758, 14.150742530822754, 14.690855979919434, 15.230969429016113, 15.77108383178711, 16.31119728088379, 16.85131072998047, 17.39142417907715, 17.931537628173828, 18.471651077270508, 19.011764526367188, 19.5518798828125, 20.09199333190918, 20.63210678100586, 21.17222023010254, 21.71233367919922, 22.2524471282959, 22.792560577392578, 23.33267593383789, 23.87278938293457, 24.41290283203125, 24.95301628112793, 25.49312973022461]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 10.0, 17.0, 18.0, 14.0, 21.0, 16.0, 30.0, 36.0, 33.0, 52.0, 53.0, 62.0, 52.0, 76.0, 60.0, 56.0, 50.0, 45.0, 43.0, 43.0, 29.0, 39.0, 33.0, 19.0, 19.0, 17.0, 12.0, 8.0, 8.0, 4.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.030237197875977, -4.88551664352417, -4.7407965660095215, -4.596076011657715, -4.451355934143066, -4.30663537979126, -4.161914825439453, -4.017194747924805, -3.872474193572998, -3.7277538776397705, -3.583033561706543, -3.4383130073547363, -3.293592691421509, -3.1488723754882812, -3.0041518211364746, -2.859431505203247, -2.7147111892700195, -2.569990873336792, -2.4252705574035645, -2.280550003051758, -2.1358296871185303, -1.9911093711853027, -1.8463889360427856, -1.7016685009002686, -1.556948184967041, -1.4122278690338135, -1.2675074338912964, -1.1227869987487793, -0.9780666828155518, -0.8333463072776794, -0.6886259317398071, -0.54390549659729, -0.3991847038269043, -0.254464328289032, -0.10974395275115967, 0.034976422786712646, 0.17969679832458496, 0.3244171738624573, 0.4691375494003296, 0.6138579845428467, 0.7585783004760742, 0.9032986760139465, 1.0480190515518188, 1.192739486694336, 1.3374598026275635, 1.482180118560791, 1.626900553703308, 1.7716209888458252, 1.9163413047790527, 2.0610616207122803, 2.205781936645508, 2.3505024909973145, 2.495222806930542, 2.6399431228637695, 2.784663677215576, 2.9293839931488037, 3.0741043090820312, 3.218824625015259, 3.3635449409484863, 3.508265495300293, 3.6529858112335205, 3.797706127166748, 3.9424266815185547, 4.087146759033203, 4.23186731338501]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 13.0, 8.0, 12.0, 20.0, 36.0, 58.0, 84.0, 113.0, 173.0, 259.0, 477.0, 714.0, 1437.0, 2643.0, 5942.0, 15444.0, 59571.0, 825146.0, 102349.0, 19642.0, 7307.0, 3262.0, 1586.0, 838.0, 514.0, 292.0, 185.0, 136.0, 87.0, 60.0, 32.0, 38.0, 18.0, 13.0, 14.0, 3.0, 1.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-8.5234375, -8.2620849609375, -8.000732421875, -7.7393798828125, -7.47802734375, -7.2166748046875, -6.955322265625, -6.6939697265625, -6.4326171875, -6.1712646484375, -5.909912109375, -5.6485595703125, -5.38720703125, -5.1258544921875, -4.864501953125, -4.6031494140625, -4.341796875, -4.0804443359375, -3.819091796875, -3.5577392578125, -3.29638671875, -3.0350341796875, -2.773681640625, -2.5123291015625, -2.2509765625, -1.9896240234375, -1.728271484375, -1.4669189453125, -1.20556640625, -0.9442138671875, -0.682861328125, -0.4215087890625, -0.16015625, 0.1011962890625, 0.362548828125, 0.6239013671875, 0.88525390625, 1.1466064453125, 1.407958984375, 1.6693115234375, 1.9306640625, 2.1920166015625, 2.453369140625, 2.7147216796875, 2.97607421875, 3.2374267578125, 3.498779296875, 3.7601318359375, 4.021484375, 4.2828369140625, 4.544189453125, 4.8055419921875, 5.06689453125, 5.3282470703125, 5.589599609375, 5.8509521484375, 6.1123046875, 6.3736572265625, 6.635009765625, 6.8963623046875, 7.15771484375, 7.4190673828125, 7.680419921875, 7.9417724609375, 8.203125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 4.0, 5.0, 5.0, 4.0, 8.0, 13.0, 8.0, 20.0, 31.0, 92.0, 221.0, 265.0, 145.0, 74.0, 24.0, 29.0, 10.0, 8.0, 7.0, 4.0, 6.0, 3.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5263671875, -1.4874725341796875, -1.448577880859375, -1.4096832275390625, -1.37078857421875, -1.3318939208984375, -1.292999267578125, -1.2541046142578125, -1.2152099609375, -1.1763153076171875, -1.137420654296875, -1.0985260009765625, -1.05963134765625, -1.0207366943359375, -0.981842041015625, -0.9429473876953125, -0.904052734375, -0.8651580810546875, -0.826263427734375, -0.7873687744140625, -0.74847412109375, -0.7095794677734375, -0.670684814453125, -0.6317901611328125, -0.5928955078125, -0.5540008544921875, -0.515106201171875, -0.4762115478515625, -0.43731689453125, -0.3984222412109375, -0.359527587890625, -0.3206329345703125, -0.28173828125, -0.2428436279296875, -0.203948974609375, -0.1650543212890625, -0.12615966796875, -0.0872650146484375, -0.048370361328125, -0.0094757080078125, 0.0294189453125, 0.0683135986328125, 0.107208251953125, 0.1461029052734375, 0.18499755859375, 0.2238922119140625, 0.262786865234375, 0.3016815185546875, 0.340576171875, 0.3794708251953125, 0.418365478515625, 0.4572601318359375, 0.49615478515625, 0.5350494384765625, 0.573944091796875, 0.6128387451171875, 0.6517333984375, 0.6906280517578125, 0.729522705078125, 0.7684173583984375, 0.80731201171875, 0.8462066650390625, 0.885101318359375, 0.9239959716796875, 0.962890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 8.0, 2.0, 8.0, 4.0, 11.0, 22.0, 27.0, 50.0, 78.0, 139.0, 247.0, 481.0, 1158.0, 3273.0, 12192.0, 88634.0, 783476.0, 135865.0, 16266.0, 3897.0, 1483.0, 601.0, 264.0, 137.0, 81.0, 54.0, 39.0, 23.0, 13.0, 7.0, 5.0, 3.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.83984375, -6.58245849609375, -6.3250732421875, -6.06768798828125, -5.810302734375, -5.55291748046875, -5.2955322265625, -5.03814697265625, -4.78076171875, -4.52337646484375, -4.2659912109375, -4.00860595703125, -3.751220703125, -3.49383544921875, -3.2364501953125, -2.97906494140625, -2.7216796875, -2.46429443359375, -2.2069091796875, -1.94952392578125, -1.692138671875, -1.43475341796875, -1.1773681640625, -0.91998291015625, -0.66259765625, -0.40521240234375, -0.1478271484375, 0.10955810546875, 0.366943359375, 0.62432861328125, 0.8817138671875, 1.13909912109375, 1.396484375, 1.65386962890625, 1.9112548828125, 2.16864013671875, 2.426025390625, 2.68341064453125, 2.9407958984375, 3.19818115234375, 3.45556640625, 3.71295166015625, 3.9703369140625, 4.22772216796875, 4.485107421875, 4.74249267578125, 4.9998779296875, 5.25726318359375, 5.5146484375, 5.77203369140625, 6.0294189453125, 6.28680419921875, 6.544189453125, 6.80157470703125, 7.0589599609375, 7.31634521484375, 7.57373046875, 7.83111572265625, 8.0885009765625, 8.34588623046875, 8.603271484375, 8.86065673828125, 9.1180419921875, 9.37542724609375, 9.6328125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 5.0, 12.0, 6.0, 15.0, 31.0, 28.0, 39.0, 33.0, 40.0, 48.0, 64.0, 68.0, 62.0, 65.0, 50.0, 75.0, 48.0, 56.0, 54.0, 48.0, 29.0, 23.0, 19.0, 23.0, 13.0, 11.0, 14.0, 3.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.943359375, -3.809234619140625, -3.67510986328125, -3.540985107421875, -3.4068603515625, -3.272735595703125, -3.13861083984375, -3.004486083984375, -2.870361328125, -2.736236572265625, -2.60211181640625, -2.467987060546875, -2.3338623046875, -2.199737548828125, -2.06561279296875, -1.931488037109375, -1.79736328125, -1.663238525390625, -1.52911376953125, -1.394989013671875, -1.2608642578125, -1.126739501953125, -0.99261474609375, -0.858489990234375, -0.724365234375, -0.590240478515625, -0.45611572265625, -0.321990966796875, -0.1878662109375, -0.053741455078125, 0.08038330078125, 0.214508056640625, 0.3486328125, 0.482757568359375, 0.61688232421875, 0.751007080078125, 0.8851318359375, 1.019256591796875, 1.15338134765625, 1.287506103515625, 1.421630859375, 1.555755615234375, 1.68988037109375, 1.824005126953125, 1.9581298828125, 2.092254638671875, 2.22637939453125, 2.360504150390625, 2.49462890625, 2.628753662109375, 2.76287841796875, 2.897003173828125, 3.0311279296875, 3.165252685546875, 3.29937744140625, 3.433502197265625, 3.567626953125, 3.701751708984375, 3.83587646484375, 3.970001220703125, 4.1041259765625, 4.238250732421875, 4.37237548828125, 4.506500244140625, 4.640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 6.0, 6.0, 2.0, 4.0, 12.0, 19.0, 33.0, 34.0, 77.0, 107.0, 195.0, 385.0, 727.0, 1527.0, 3769.0, 10591.0, 42710.0, 272366.0, 583087.0, 101689.0, 20491.0, 6094.0, 2402.0, 1039.0, 530.0, 269.0, 136.0, 99.0, 55.0, 30.0, 26.0, 17.0, 10.0, 7.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.76953125, -5.59063720703125, -5.4117431640625, -5.23284912109375, -5.053955078125, -4.87506103515625, -4.6961669921875, -4.51727294921875, -4.33837890625, -4.15948486328125, -3.9805908203125, -3.80169677734375, -3.622802734375, -3.44390869140625, -3.2650146484375, -3.08612060546875, -2.9072265625, -2.72833251953125, -2.5494384765625, -2.37054443359375, -2.191650390625, -2.01275634765625, -1.8338623046875, -1.65496826171875, -1.47607421875, -1.29718017578125, -1.1182861328125, -0.93939208984375, -0.760498046875, -0.58160400390625, -0.4027099609375, -0.22381591796875, -0.044921875, 0.13397216796875, 0.3128662109375, 0.49176025390625, 0.670654296875, 0.84954833984375, 1.0284423828125, 1.20733642578125, 1.38623046875, 1.56512451171875, 1.7440185546875, 1.92291259765625, 2.101806640625, 2.28070068359375, 2.4595947265625, 2.63848876953125, 2.8173828125, 2.99627685546875, 3.1751708984375, 3.35406494140625, 3.532958984375, 3.71185302734375, 3.8907470703125, 4.06964111328125, 4.24853515625, 4.42742919921875, 4.6063232421875, 4.78521728515625, 4.964111328125, 5.14300537109375, 5.3218994140625, 5.50079345703125, 5.6796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 3.0, 5.0, 5.0, 11.0, 9.0, 20.0, 26.0, 33.0, 32.0, 66.0, 89.0, 97.0, 130.0, 109.0, 110.0, 66.0, 53.0, 38.0, 13.0, 18.0, 16.0, 6.0, 7.0, 4.0, 4.0, 5.0, 6.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002789497375488281, -0.0002685077488422394, -0.00025806576013565063, -0.0002476237714290619, -0.00023718178272247314, -0.0002267397940158844, -0.00021629780530929565, -0.0002058558166027069, -0.00019541382789611816, -0.00018497183918952942, -0.00017452985048294067, -0.00016408786177635193, -0.00015364587306976318, -0.00014320388436317444, -0.0001327618956565857, -0.00012231990694999695, -0.0001118779182434082, -0.00010143592953681946, -9.099394083023071e-05, -8.055195212364197e-05, -7.010996341705322e-05, -5.966797471046448e-05, -4.922598600387573e-05, -3.878399729728699e-05, -2.8342008590698242e-05, -1.7900019884109497e-05, -7.458031177520752e-06, 2.983957529067993e-06, 1.3425946235656738e-05, 2.3867934942245483e-05, 3.430992364883423e-05, 4.4751912355422974e-05, 5.519390106201172e-05, 6.563588976860046e-05, 7.607787847518921e-05, 8.651986718177795e-05, 9.69618558883667e-05, 0.00010740384459495544, 0.00011784583330154419, 0.00012828782200813293, 0.00013872981071472168, 0.00014917179942131042, 0.00015961378812789917, 0.00017005577683448792, 0.00018049776554107666, 0.0001909397542476654, 0.00020138174295425415, 0.0002118237316608429, 0.00022226572036743164, 0.00023270770907402039, 0.00024314969778060913, 0.0002535916864871979, 0.0002640336751937866, 0.00027447566390037537, 0.0002849176526069641, 0.00029535964131355286, 0.0003058016300201416, 0.00031624361872673035, 0.0003266856074333191, 0.00033712759613990784, 0.0003475695848464966, 0.00035801157355308533, 0.00036845356225967407, 0.0003788955509662628, 0.00038933753967285156]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 7.0, 12.0, 7.0, 8.0, 17.0, 23.0, 42.0, 52.0, 86.0, 158.0, 262.0, 469.0, 868.0, 1783.0, 4409.0, 11566.0, 40547.0, 195024.0, 563822.0, 174199.0, 36377.0, 10949.0, 4114.0, 1784.0, 853.0, 456.0, 234.0, 131.0, 88.0, 59.0, 49.0, 29.0, 9.0, 16.0, 8.0, 9.0, 2.0, 4.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.61328125, -5.450439453125, -5.28759765625, -5.124755859375, -4.9619140625, -4.799072265625, -4.63623046875, -4.473388671875, -4.310546875, -4.147705078125, -3.98486328125, -3.822021484375, -3.6591796875, -3.496337890625, -3.33349609375, -3.170654296875, -3.0078125, -2.844970703125, -2.68212890625, -2.519287109375, -2.3564453125, -2.193603515625, -2.03076171875, -1.867919921875, -1.705078125, -1.542236328125, -1.37939453125, -1.216552734375, -1.0537109375, -0.890869140625, -0.72802734375, -0.565185546875, -0.40234375, -0.239501953125, -0.07666015625, 0.086181640625, 0.2490234375, 0.411865234375, 0.57470703125, 0.737548828125, 0.900390625, 1.063232421875, 1.22607421875, 1.388916015625, 1.5517578125, 1.714599609375, 1.87744140625, 2.040283203125, 2.203125, 2.365966796875, 2.52880859375, 2.691650390625, 2.8544921875, 3.017333984375, 3.18017578125, 3.343017578125, 3.505859375, 3.668701171875, 3.83154296875, 3.994384765625, 4.1572265625, 4.320068359375, 4.48291015625, 4.645751953125, 4.80859375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 4.0, 12.0, 14.0, 10.0, 20.0, 17.0, 28.0, 28.0, 33.0, 47.0, 51.0, 68.0, 78.0, 84.0, 70.0, 74.0, 68.0, 48.0, 50.0, 40.0, 47.0, 17.0, 23.0, 13.0, 13.0, 4.0, 5.0, 7.0, 8.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3828125, -2.29840087890625, -2.2139892578125, -2.12957763671875, -2.045166015625, -1.96075439453125, -1.8763427734375, -1.79193115234375, -1.70751953125, -1.62310791015625, -1.5386962890625, -1.45428466796875, -1.369873046875, -1.28546142578125, -1.2010498046875, -1.11663818359375, -1.0322265625, -0.94781494140625, -0.8634033203125, -0.77899169921875, -0.694580078125, -0.61016845703125, -0.5257568359375, -0.44134521484375, -0.35693359375, -0.27252197265625, -0.1881103515625, -0.10369873046875, -0.019287109375, 0.06512451171875, 0.1495361328125, 0.23394775390625, 0.318359375, 0.40277099609375, 0.4871826171875, 0.57159423828125, 0.656005859375, 0.74041748046875, 0.8248291015625, 0.90924072265625, 0.99365234375, 1.07806396484375, 1.1624755859375, 1.24688720703125, 1.331298828125, 1.41571044921875, 1.5001220703125, 1.58453369140625, 1.6689453125, 1.75335693359375, 1.8377685546875, 1.92218017578125, 2.006591796875, 2.09100341796875, 2.1754150390625, 2.25982666015625, 2.34423828125, 2.42864990234375, 2.5130615234375, 2.59747314453125, 2.681884765625, 2.76629638671875, 2.8507080078125, 2.93511962890625, 3.01953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 3.0, 17.0, 36.0, 325.0, 500.0, 105.0, 16.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.83599853515625, -166.70291137695312, -163.56983947753906, -160.43675231933594, -157.3036651611328, -154.17059326171875, -151.03750610351562, -147.9044189453125, -144.77133178710938, -141.63824462890625, -138.5051727294922, -135.37208557128906, -132.23899841308594, -129.10592651367188, -125.97283935546875, -122.83975219726562, -119.70668029785156, -116.57360076904297, -113.44051361083984, -110.30743408203125, -107.17434692382812, -104.04126739501953, -100.90818786621094, -97.77510070800781, -94.64201354980469, -91.5089340209961, -88.37584686279297, -85.24276733398438, -82.10968017578125, -78.97660064697266, -75.84352111816406, -72.71043395996094, -69.57735443115234, -66.44427490234375, -63.311187744140625, -60.17810821533203, -57.04502487182617, -53.91194152832031, -50.77885818481445, -47.645774841308594, -44.5126953125, -41.37961196899414, -38.24652862548828, -35.11344909667969, -31.980365753173828, -28.84728240966797, -25.71419906616211, -22.581117630004883, -19.448034286499023, -16.314950942993164, -13.181869506835938, -10.048786163330078, -6.915703773498535, -3.782621383666992, -0.6495380401611328, 2.4835433959960938, 5.616626739501953, 8.749709129333496, 11.882791519165039, 15.015874862670898, 18.148956298828125, 21.282039642333984, 24.415122985839844, 27.54820442199707, 30.68128776550293]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 11.0, 12.0, 11.0, 25.0, 35.0, 38.0, 47.0, 56.0, 63.0, 85.0, 81.0, 92.0, 71.0, 58.0, 78.0, 51.0, 47.0, 35.0, 23.0, 16.0, 14.0, 10.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.666648864746094, -30.57804298400879, -29.489437103271484, -28.40083122253418, -27.312225341796875, -26.22361946105957, -25.135013580322266, -24.046405792236328, -22.957801818847656, -21.86919593811035, -20.780590057373047, -19.691984176635742, -18.603378295898438, -17.514772415161133, -16.426166534423828, -15.337559700012207, -14.248952865600586, -13.160346984863281, -12.071741104125977, -10.983135223388672, -9.894529342651367, -8.805923461914062, -7.717316627502441, -6.628710746765137, -5.540104866027832, -4.451498985290527, -3.3628928661346436, -2.2742867469787598, -1.185680866241455, -0.09707498550415039, 0.9915313720703125, 2.080137252807617, 3.168743133544922, 4.257349014282227, 5.345954895019531, 6.434561252593994, 7.523167133331299, 8.611772537231445, 9.700379371643066, 10.788985252380371, 11.877591133117676, 12.96619701385498, 14.054802894592285, 15.143409729003906, 16.23201560974121, 17.320621490478516, 18.40922737121582, 19.497833251953125, 20.58643913269043, 21.675045013427734, 22.76365089416504, 23.852256774902344, 24.94086265563965, 26.029468536376953, 27.11807632446289, 28.206680297851562, 29.2952880859375, 30.383893966674805, 31.47249984741211, 32.56110763549805, 33.64971160888672, 34.738319396972656, 35.82692337036133, 36.915531158447266, 38.00413513183594]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 0.0, 4.0, 11.0, 6.0, 13.0, 9.0, 18.0, 16.0, 19.0, 26.0, 31.0, 30.0, 38.0, 45.0, 67.0, 94.0, 143.0, 203.0, 316.0, 474.0, 722.0, 1173.0, 2094.0, 4027.0, 9363.0, 31102.0, 489314.0, 3587874.0, 45418.0, 11666.0, 4644.0, 2206.0, 1163.0, 678.0, 407.0, 269.0, 158.0, 136.0, 81.0, 54.0, 45.0, 30.0, 29.0, 22.0, 11.0, 11.0, 10.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-17.109375, -16.6353759765625, -16.161376953125, -15.6873779296875, -15.21337890625, -14.7393798828125, -14.265380859375, -13.7913818359375, -13.3173828125, -12.8433837890625, -12.369384765625, -11.8953857421875, -11.42138671875, -10.9473876953125, -10.473388671875, -9.9993896484375, -9.525390625, -9.0513916015625, -8.577392578125, -8.1033935546875, -7.62939453125, -7.1553955078125, -6.681396484375, -6.2073974609375, -5.7333984375, -5.2593994140625, -4.785400390625, -4.3114013671875, -3.83740234375, -3.3634033203125, -2.889404296875, -2.4154052734375, -1.94140625, -1.4674072265625, -0.993408203125, -0.5194091796875, -0.04541015625, 0.4285888671875, 0.902587890625, 1.3765869140625, 1.8505859375, 2.3245849609375, 2.798583984375, 3.2725830078125, 3.74658203125, 4.2205810546875, 4.694580078125, 5.1685791015625, 5.642578125, 6.1165771484375, 6.590576171875, 7.0645751953125, 7.53857421875, 8.0125732421875, 8.486572265625, 8.9605712890625, 9.4345703125, 9.9085693359375, 10.382568359375, 10.8565673828125, 11.33056640625, 11.8045654296875, 12.278564453125, 12.7525634765625, 13.2265625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 9.0, 9.0, 20.0, 40.0, 76.0, 138.0, 199.0, 219.0, 125.0, 56.0, 26.0, 19.0, 14.0, 14.0, 7.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3583984375, -1.3225021362304688, -1.2866058349609375, -1.2507095336914062, -1.214813232421875, -1.1789169311523438, -1.1430206298828125, -1.1071243286132812, -1.07122802734375, -1.0353317260742188, -0.9994354248046875, -0.9635391235351562, -0.927642822265625, -0.8917465209960938, -0.8558502197265625, -0.8199539184570312, -0.7840576171875, -0.7481613159179688, -0.7122650146484375, -0.6763687133789062, -0.640472412109375, -0.6045761108398438, -0.5686798095703125, -0.5327835083007812, -0.49688720703125, -0.46099090576171875, -0.4250946044921875, -0.38919830322265625, -0.353302001953125, -0.31740570068359375, -0.2815093994140625, -0.24561309814453125, -0.209716796875, -0.17382049560546875, -0.1379241943359375, -0.10202789306640625, -0.066131591796875, -0.03023529052734375, 0.0056610107421875, 0.04155731201171875, 0.07745361328125, 0.11334991455078125, 0.1492462158203125, 0.18514251708984375, 0.221038818359375, 0.25693511962890625, 0.2928314208984375, 0.32872772216796875, 0.3646240234375, 0.40052032470703125, 0.4364166259765625, 0.47231292724609375, 0.508209228515625, 0.5441055297851562, 0.5800018310546875, 0.6158981323242188, 0.65179443359375, 0.6876907348632812, 0.7235870361328125, 0.7594833374023438, 0.795379638671875, 0.8312759399414062, 0.8671722412109375, 0.9030685424804688, 0.93896484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 5.0, 8.0, 10.0, 9.0, 9.0, 16.0, 34.0, 34.0, 42.0, 97.0, 183.0, 412.0, 810.0, 2034.0, 5979.0, 21926.0, 148376.0, 3757681.0, 218283.0, 27330.0, 6894.0, 2325.0, 883.0, 396.0, 202.0, 96.0, 68.0, 46.0, 16.0, 11.0, 18.0, 8.0, 10.0, 7.0, 8.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-14.34375, -13.87451171875, -13.4052734375, -12.93603515625, -12.466796875, -11.99755859375, -11.5283203125, -11.05908203125, -10.58984375, -10.12060546875, -9.6513671875, -9.18212890625, -8.712890625, -8.24365234375, -7.7744140625, -7.30517578125, -6.8359375, -6.36669921875, -5.8974609375, -5.42822265625, -4.958984375, -4.48974609375, -4.0205078125, -3.55126953125, -3.08203125, -2.61279296875, -2.1435546875, -1.67431640625, -1.205078125, -0.73583984375, -0.2666015625, 0.20263671875, 0.671875, 1.14111328125, 1.6103515625, 2.07958984375, 2.548828125, 3.01806640625, 3.4873046875, 3.95654296875, 4.42578125, 4.89501953125, 5.3642578125, 5.83349609375, 6.302734375, 6.77197265625, 7.2412109375, 7.71044921875, 8.1796875, 8.64892578125, 9.1181640625, 9.58740234375, 10.056640625, 10.52587890625, 10.9951171875, 11.46435546875, 11.93359375, 12.40283203125, 12.8720703125, 13.34130859375, 13.810546875, 14.27978515625, 14.7490234375, 15.21826171875, 15.6875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 6.0, 3.0, 7.0, 7.0, 9.0, 10.0, 8.0, 10.0, 17.0, 18.0, 38.0, 59.0, 89.0, 128.0, 228.0, 501.0, 1676.0, 510.0, 268.0, 137.0, 99.0, 70.0, 34.0, 32.0, 20.0, 16.0, 10.0, 10.0, 11.0, 8.0, 7.0, 8.0, 2.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.595703125, -1.5519561767578125, -1.508209228515625, -1.4644622802734375, -1.42071533203125, -1.3769683837890625, -1.333221435546875, -1.2894744873046875, -1.2457275390625, -1.2019805908203125, -1.158233642578125, -1.1144866943359375, -1.07073974609375, -1.0269927978515625, -0.983245849609375, -0.9394989013671875, -0.895751953125, -0.8520050048828125, -0.808258056640625, -0.7645111083984375, -0.72076416015625, -0.6770172119140625, -0.633270263671875, -0.5895233154296875, -0.5457763671875, -0.5020294189453125, -0.458282470703125, -0.4145355224609375, -0.37078857421875, -0.3270416259765625, -0.283294677734375, -0.2395477294921875, -0.19580078125, -0.1520538330078125, -0.108306884765625, -0.0645599365234375, -0.02081298828125, 0.0229339599609375, 0.066680908203125, 0.1104278564453125, 0.1541748046875, 0.1979217529296875, 0.241668701171875, 0.2854156494140625, 0.32916259765625, 0.3729095458984375, 0.416656494140625, 0.4604034423828125, 0.504150390625, 0.5478973388671875, 0.591644287109375, 0.6353912353515625, 0.67913818359375, 0.7228851318359375, 0.766632080078125, 0.8103790283203125, 0.8541259765625, 0.8978729248046875, 0.941619873046875, 0.9853668212890625, 1.02911376953125, 1.0728607177734375, 1.116607666015625, 1.1603546142578125, 1.2041015625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 14.0, 19.0, 40.0, 63.0, 126.0, 161.0, 202.0, 152.0, 92.0, 55.0, 32.0, 15.0, 10.0, 9.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.792753219604492, -14.404183387756348, -14.015613555908203, -13.627042770385742, -13.238472938537598, -12.849903106689453, -12.461333274841309, -12.072763442993164, -11.684192657470703, -11.295622825622559, -10.907052993774414, -10.518482208251953, -10.129912376403809, -9.741342544555664, -9.35277271270752, -8.964202880859375, -8.57563304901123, -8.187063217163086, -7.798492908477783, -7.409923076629639, -7.021352767944336, -6.632782936096191, -6.244213104248047, -5.855643272399902, -5.4670729637146, -5.078503131866455, -4.689932823181152, -4.301362991333008, -3.912792921066284, -3.5242228507995605, -3.135653018951416, -2.7470829486846924, -2.358513832092285, -1.9699437618255615, -1.5813738107681274, -1.1928038597106934, -0.8042337894439697, -0.4156637191772461, -0.027093887329101562, 0.36147618293762207, 0.7500462532043457, 1.1386163234710693, 1.5271862745285034, 1.9157562255859375, 2.304326295852661, 2.6928963661193848, 3.0814661979675293, 3.470036268234253, 3.8586063385009766, 4.247176170349121, 4.635746479034424, 5.024316310882568, 5.412886619567871, 5.801456451416016, 6.19002628326416, 6.578596115112305, 6.967166423797607, 7.355736255645752, 7.744306564331055, 8.1328763961792, 8.521446228027344, 8.910017013549805, 9.298585891723633, 9.687156677246094, 10.075726509094238]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 9.0, 8.0, 12.0, 9.0, 25.0, 24.0, 32.0, 35.0, 43.0, 48.0, 57.0, 49.0, 52.0, 60.0, 65.0, 63.0, 66.0, 66.0, 47.0, 41.0, 38.0, 32.0, 19.0, 23.0, 22.0, 16.0, 15.0, 12.0, 5.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.277908325195312, -8.062480926513672, -7.847053527832031, -7.631626129150391, -7.416199207305908, -7.200771808624268, -6.985344409942627, -6.769917011260986, -6.554490089416504, -6.339062690734863, -6.123635292053223, -5.908207893371582, -5.6927809715271, -5.477353572845459, -5.261926174163818, -5.046498775482178, -4.831071376800537, -4.6156439781188965, -4.400216579437256, -4.184789657592773, -3.969362258911133, -3.753934860229492, -3.5385074615478516, -3.323080062866211, -3.1076529026031494, -2.892225503921509, -2.6767983436584473, -2.4613709449768066, -2.245943546295166, -2.0305163860321045, -1.8150889873504639, -1.5996617078781128, -1.3842339515686035, -1.1688066720962524, -0.9533793330192566, -0.7379519939422607, -0.5225247144699097, -0.3070974349975586, -0.09167003631591797, 0.1237572431564331, 0.3391845226287842, 0.5546118021011353, 0.7700391411781311, 0.985466480255127, 1.200893759727478, 1.416321039199829, 1.6317484378814697, 1.8471757173538208, 2.062602996826172, 2.2780303955078125, 2.493457555770874, 2.7088849544525146, 2.924312114715576, 3.139739513397217, 3.3551669120788574, 3.570594310760498, 3.7860214710235596, 4.001448631286621, 4.216876029968262, 4.432303428649902, 4.647730827331543, 4.863158226013184, 5.078585624694824, 5.294012546539307, 5.509439945220947]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 11.0, 5.0, 5.0, 9.0, 11.0, 26.0, 17.0, 33.0, 54.0, 68.0, 98.0, 130.0, 180.0, 247.0, 396.0, 626.0, 1033.0, 1729.0, 3397.0, 7715.0, 22325.0, 104477.0, 647832.0, 203899.0, 34006.0, 10396.0, 4371.0, 2132.0, 1187.0, 677.0, 454.0, 274.0, 225.0, 152.0, 89.0, 70.0, 53.0, 39.0, 23.0, 21.0, 16.0, 14.0, 5.0, 9.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-9.296875, -9.01220703125, -8.7275390625, -8.44287109375, -8.158203125, -7.87353515625, -7.5888671875, -7.30419921875, -7.01953125, -6.73486328125, -6.4501953125, -6.16552734375, -5.880859375, -5.59619140625, -5.3115234375, -5.02685546875, -4.7421875, -4.45751953125, -4.1728515625, -3.88818359375, -3.603515625, -3.31884765625, -3.0341796875, -2.74951171875, -2.46484375, -2.18017578125, -1.8955078125, -1.61083984375, -1.326171875, -1.04150390625, -0.7568359375, -0.47216796875, -0.1875, 0.09716796875, 0.3818359375, 0.66650390625, 0.951171875, 1.23583984375, 1.5205078125, 1.80517578125, 2.08984375, 2.37451171875, 2.6591796875, 2.94384765625, 3.228515625, 3.51318359375, 3.7978515625, 4.08251953125, 4.3671875, 4.65185546875, 4.9365234375, 5.22119140625, 5.505859375, 5.79052734375, 6.0751953125, 6.35986328125, 6.64453125, 6.92919921875, 7.2138671875, 7.49853515625, 7.783203125, 8.06787109375, 8.3525390625, 8.63720703125, 8.921875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 4.0, 15.0, 22.0, 45.0, 72.0, 134.0, 166.0, 200.0, 137.0, 76.0, 52.0, 27.0, 17.0, 12.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3466796875, -1.310394287109375, -1.27410888671875, -1.237823486328125, -1.2015380859375, -1.165252685546875, -1.12896728515625, -1.092681884765625, -1.056396484375, -1.020111083984375, -0.98382568359375, -0.947540283203125, -0.9112548828125, -0.874969482421875, -0.83868408203125, -0.802398681640625, -0.76611328125, -0.729827880859375, -0.69354248046875, -0.657257080078125, -0.6209716796875, -0.584686279296875, -0.54840087890625, -0.512115478515625, -0.475830078125, -0.439544677734375, -0.40325927734375, -0.366973876953125, -0.3306884765625, -0.294403076171875, -0.25811767578125, -0.221832275390625, -0.185546875, -0.149261474609375, -0.11297607421875, -0.076690673828125, -0.0404052734375, -0.004119873046875, 0.03216552734375, 0.068450927734375, 0.104736328125, 0.141021728515625, 0.17730712890625, 0.213592529296875, 0.2498779296875, 0.286163330078125, 0.32244873046875, 0.358734130859375, 0.39501953125, 0.431304931640625, 0.46759033203125, 0.503875732421875, 0.5401611328125, 0.576446533203125, 0.61273193359375, 0.649017333984375, 0.685302734375, 0.721588134765625, 0.75787353515625, 0.794158935546875, 0.8304443359375, 0.866729736328125, 0.90301513671875, 0.939300537109375, 0.9755859375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 4.0, 12.0, 9.0, 22.0, 18.0, 27.0, 36.0, 52.0, 52.0, 72.0, 125.0, 152.0, 241.0, 312.0, 565.0, 956.0, 1928.0, 3796.0, 9406.0, 28042.0, 113378.0, 491614.0, 305284.0, 62064.0, 17507.0, 6447.0, 2792.0, 1465.0, 743.0, 464.0, 284.0, 189.0, 144.0, 95.0, 62.0, 61.0, 37.0, 31.0, 17.0, 11.0, 14.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0], "bins": [-9.0078125, -8.7413330078125, -8.474853515625, -8.2083740234375, -7.94189453125, -7.6754150390625, -7.408935546875, -7.1424560546875, -6.8759765625, -6.6094970703125, -6.343017578125, -6.0765380859375, -5.81005859375, -5.5435791015625, -5.277099609375, -5.0106201171875, -4.744140625, -4.4776611328125, -4.211181640625, -3.9447021484375, -3.67822265625, -3.4117431640625, -3.145263671875, -2.8787841796875, -2.6123046875, -2.3458251953125, -2.079345703125, -1.8128662109375, -1.54638671875, -1.2799072265625, -1.013427734375, -0.7469482421875, -0.48046875, -0.2139892578125, 0.052490234375, 0.3189697265625, 0.58544921875, 0.8519287109375, 1.118408203125, 1.3848876953125, 1.6513671875, 1.9178466796875, 2.184326171875, 2.4508056640625, 2.71728515625, 2.9837646484375, 3.250244140625, 3.5167236328125, 3.783203125, 4.0496826171875, 4.316162109375, 4.5826416015625, 4.84912109375, 5.1156005859375, 5.382080078125, 5.6485595703125, 5.9150390625, 6.1815185546875, 6.447998046875, 6.7144775390625, 6.98095703125, 7.2474365234375, 7.513916015625, 7.7803955078125, 8.046875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 9.0, 11.0, 10.0, 9.0, 15.0, 20.0, 18.0, 26.0, 36.0, 33.0, 42.0, 42.0, 36.0, 44.0, 36.0, 53.0, 67.0, 58.0, 72.0, 51.0, 50.0, 31.0, 35.0, 28.0, 38.0, 30.0, 16.0, 16.0, 14.0, 20.0, 12.0, 6.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.515350341796875, -3.39593505859375, -3.276519775390625, -3.1571044921875, -3.037689208984375, -2.91827392578125, -2.798858642578125, -2.679443359375, -2.560028076171875, -2.44061279296875, -2.321197509765625, -2.2017822265625, -2.082366943359375, -1.96295166015625, -1.843536376953125, -1.72412109375, -1.604705810546875, -1.48529052734375, -1.365875244140625, -1.2464599609375, -1.127044677734375, -1.00762939453125, -0.888214111328125, -0.768798828125, -0.649383544921875, -0.52996826171875, -0.410552978515625, -0.2911376953125, -0.171722412109375, -0.05230712890625, 0.067108154296875, 0.1865234375, 0.305938720703125, 0.42535400390625, 0.544769287109375, 0.6641845703125, 0.783599853515625, 0.90301513671875, 1.022430419921875, 1.141845703125, 1.261260986328125, 1.38067626953125, 1.500091552734375, 1.6195068359375, 1.738922119140625, 1.85833740234375, 1.977752685546875, 2.09716796875, 2.216583251953125, 2.33599853515625, 2.455413818359375, 2.5748291015625, 2.694244384765625, 2.81365966796875, 2.933074951171875, 3.052490234375, 3.171905517578125, 3.29132080078125, 3.410736083984375, 3.5301513671875, 3.649566650390625, 3.76898193359375, 3.888397216796875, 4.0078125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 5.0, 8.0, 13.0, 21.0, 23.0, 25.0, 25.0, 55.0, 66.0, 93.0, 184.0, 251.0, 417.0, 756.0, 1392.0, 2643.0, 5254.0, 12061.0, 30314.0, 89660.0, 298200.0, 398890.0, 134160.0, 43619.0, 16192.0, 6952.0, 3209.0, 1652.0, 911.0, 569.0, 336.0, 209.0, 122.0, 76.0, 67.0, 26.0, 26.0, 28.0, 11.0, 12.0, 5.0, 6.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.95513916015625, -3.8282470703125, -3.70135498046875, -3.574462890625, -3.44757080078125, -3.3206787109375, -3.19378662109375, -3.06689453125, -2.94000244140625, -2.8131103515625, -2.68621826171875, -2.559326171875, -2.43243408203125, -2.3055419921875, -2.17864990234375, -2.0517578125, -1.92486572265625, -1.7979736328125, -1.67108154296875, -1.544189453125, -1.41729736328125, -1.2904052734375, -1.16351318359375, -1.03662109375, -0.90972900390625, -0.7828369140625, -0.65594482421875, -0.529052734375, -0.40216064453125, -0.2752685546875, -0.14837646484375, -0.021484375, 0.10540771484375, 0.2322998046875, 0.35919189453125, 0.486083984375, 0.61297607421875, 0.7398681640625, 0.86676025390625, 0.99365234375, 1.12054443359375, 1.2474365234375, 1.37432861328125, 1.501220703125, 1.62811279296875, 1.7550048828125, 1.88189697265625, 2.0087890625, 2.13568115234375, 2.2625732421875, 2.38946533203125, 2.516357421875, 2.64324951171875, 2.7701416015625, 2.89703369140625, 3.02392578125, 3.15081787109375, 3.2777099609375, 3.40460205078125, 3.531494140625, 3.65838623046875, 3.7852783203125, 3.91217041015625, 4.0390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 8.0, 6.0, 9.0, 8.0, 13.0, 13.0, 22.0, 26.0, 32.0, 50.0, 82.0, 93.0, 98.0, 114.0, 90.0, 83.0, 71.0, 47.0, 28.0, 28.0, 17.0, 11.0, 8.0, 8.0, 5.0, 5.0, 4.0, 6.0, 2.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007767677307128906, -0.0007540881633758545, -0.0007314085960388184, -0.0007087290287017822, -0.0006860494613647461, -0.00066336989402771, -0.0006406903266906738, -0.0006180107593536377, -0.0005953311920166016, -0.0005726516246795654, -0.0005499720573425293, -0.0005272924900054932, -0.000504612922668457, -0.0004819333553314209, -0.00045925378799438477, -0.00043657422065734863, -0.0004138946533203125, -0.00039121508598327637, -0.00036853551864624023, -0.0003458559513092041, -0.00032317638397216797, -0.00030049681663513184, -0.0002778172492980957, -0.00025513768196105957, -0.00023245811462402344, -0.0002097785472869873, -0.00018709897994995117, -0.00016441941261291504, -0.0001417398452758789, -0.00011906027793884277, -9.638071060180664e-05, -7.370114326477051e-05, -5.1021575927734375e-05, -2.8342008590698242e-05, -5.662441253662109e-06, 1.7017126083374023e-05, 3.9696693420410156e-05, 6.237626075744629e-05, 8.505582809448242e-05, 0.00010773539543151855, 0.0001304149627685547, 0.00015309453010559082, 0.00017577409744262695, 0.00019845366477966309, 0.00022113323211669922, 0.00024381279945373535, 0.0002664923667907715, 0.0002891719341278076, 0.00031185150146484375, 0.0003345310688018799, 0.000357210636138916, 0.00037989020347595215, 0.0004025697708129883, 0.0004252493381500244, 0.00044792890548706055, 0.0004706084728240967, 0.0004932880401611328, 0.0005159676074981689, 0.0005386471748352051, 0.0005613267421722412, 0.0005840063095092773, 0.0006066858768463135, 0.0006293654441833496, 0.0006520450115203857, 0.0006747245788574219]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 4.0, 10.0, 12.0, 15.0, 13.0, 16.0, 29.0, 39.0, 39.0, 49.0, 104.0, 144.0, 258.0, 390.0, 644.0, 1154.0, 2246.0, 4887.0, 11629.0, 36183.0, 153370.0, 550359.0, 213792.0, 46761.0, 14639.0, 5868.0, 2639.0, 1350.0, 730.0, 399.0, 263.0, 165.0, 115.0, 64.0, 49.0, 33.0, 23.0, 9.0, 18.0, 10.0, 3.0, 9.0, 5.0, 2.0, 4.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-5.26171875, -5.09521484375, -4.9287109375, -4.76220703125, -4.595703125, -4.42919921875, -4.2626953125, -4.09619140625, -3.9296875, -3.76318359375, -3.5966796875, -3.43017578125, -3.263671875, -3.09716796875, -2.9306640625, -2.76416015625, -2.59765625, -2.43115234375, -2.2646484375, -2.09814453125, -1.931640625, -1.76513671875, -1.5986328125, -1.43212890625, -1.265625, -1.09912109375, -0.9326171875, -0.76611328125, -0.599609375, -0.43310546875, -0.2666015625, -0.10009765625, 0.06640625, 0.23291015625, 0.3994140625, 0.56591796875, 0.732421875, 0.89892578125, 1.0654296875, 1.23193359375, 1.3984375, 1.56494140625, 1.7314453125, 1.89794921875, 2.064453125, 2.23095703125, 2.3974609375, 2.56396484375, 2.73046875, 2.89697265625, 3.0634765625, 3.22998046875, 3.396484375, 3.56298828125, 3.7294921875, 3.89599609375, 4.0625, 4.22900390625, 4.3955078125, 4.56201171875, 4.728515625, 4.89501953125, 5.0615234375, 5.22802734375, 5.39453125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 6.0, 6.0, 10.0, 11.0, 19.0, 20.0, 22.0, 38.0, 34.0, 53.0, 52.0, 60.0, 68.0, 80.0, 76.0, 70.0, 70.0, 58.0, 51.0, 36.0, 30.0, 22.0, 19.0, 13.0, 14.0, 13.0, 4.0, 9.0, 10.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.498046875, -2.4229736328125, -2.347900390625, -2.2728271484375, -2.19775390625, -2.1226806640625, -2.047607421875, -1.9725341796875, -1.8974609375, -1.8223876953125, -1.747314453125, -1.6722412109375, -1.59716796875, -1.5220947265625, -1.447021484375, -1.3719482421875, -1.296875, -1.2218017578125, -1.146728515625, -1.0716552734375, -0.99658203125, -0.9215087890625, -0.846435546875, -0.7713623046875, -0.6962890625, -0.6212158203125, -0.546142578125, -0.4710693359375, -0.39599609375, -0.3209228515625, -0.245849609375, -0.1707763671875, -0.095703125, -0.0206298828125, 0.054443359375, 0.1295166015625, 0.20458984375, 0.2796630859375, 0.354736328125, 0.4298095703125, 0.5048828125, 0.5799560546875, 0.655029296875, 0.7301025390625, 0.80517578125, 0.8802490234375, 0.955322265625, 1.0303955078125, 1.10546875, 1.1805419921875, 1.255615234375, 1.3306884765625, 1.40576171875, 1.4808349609375, 1.555908203125, 1.6309814453125, 1.7060546875, 1.7811279296875, 1.856201171875, 1.9312744140625, 2.00634765625, 2.0814208984375, 2.156494140625, 2.2315673828125, 2.306640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 15.0, 55.0, 221.0, 386.0, 231.0, 63.0, 16.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.46278381347656, -139.41738891601562, -135.37200927734375, -131.3266143798828, -127.28123474121094, -123.23583984375, -119.1904525756836, -115.14506530761719, -111.09967803955078, -107.05429077148438, -103.00890350341797, -98.96351623535156, -94.91812133789062, -90.87274169921875, -86.82734680175781, -82.7819595336914, -78.736572265625, -74.6911849975586, -70.64579772949219, -66.60041046142578, -62.55501937866211, -58.5096321105957, -54.46424102783203, -50.418853759765625, -46.37346649169922, -42.32807922363281, -38.282691955566406, -34.237300872802734, -30.191913604736328, -26.146526336669922, -22.101137161254883, -18.055747985839844, -14.010353088378906, -9.964964866638184, -5.919576644897461, -1.8741884231567383, 2.1711997985839844, 6.216587066650391, 10.26197624206543, 14.307365417480469, 18.352752685546875, 22.39813995361328, 26.44352912902832, 30.48891830444336, 34.534305572509766, 38.57969284057617, 42.625083923339844, 46.67047119140625, 50.715858459472656, 54.76124572753906, 58.80663299560547, 62.85202407836914, 66.89741516113281, 70.94279479980469, 74.98818969726562, 79.03357696533203, 83.07896423339844, 87.12435150146484, 91.16973876953125, 95.21512603759766, 99.26051330566406, 103.305908203125, 107.3512954711914, 111.39668273925781, 115.44207000732422]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 12.0, 9.0, 20.0, 29.0, 20.0, 36.0, 38.0, 51.0, 47.0, 58.0, 75.0, 65.0, 67.0, 65.0, 61.0, 61.0, 61.0, 61.0, 32.0, 36.0, 20.0, 22.0, 14.0, 6.0, 5.0, 4.0, 10.0, 3.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.85041809082031, -40.723182678222656, -39.595951080322266, -38.46871566772461, -37.34148406982422, -36.21424865722656, -35.08701705932617, -33.959781646728516, -32.832550048828125, -31.7053165435791, -30.578083038330078, -29.450849533081055, -28.32361602783203, -27.196380615234375, -26.06914710998535, -24.941913604736328, -23.814678192138672, -22.68744468688965, -21.560211181640625, -20.4329776763916, -19.305744171142578, -18.178508758544922, -17.0512752532959, -15.924041748046875, -14.796808242797852, -13.669574737548828, -12.542341232299805, -11.415106773376465, -10.287873268127441, -9.160639762878418, -8.033405303955078, -6.906171798706055, -5.778934478759766, -4.651700973510742, -3.5244669914245605, -2.397233247756958, -1.2699995040893555, -0.14276599884033203, 0.9844679832458496, 2.1117019653320312, 3.2389354705810547, 4.366168975830078, 5.49340295791626, 6.620636940002441, 7.747870445251465, 8.875103950500488, 10.002338409423828, 11.129571914672852, 12.256805419921875, 13.384038925170898, 14.511272430419922, 15.638506889343262, 16.76573944091797, 17.892974853515625, 19.02020835876465, 20.147441864013672, 21.274675369262695, 22.40190887451172, 23.529142379760742, 24.656375885009766, 25.783611297607422, 26.910842895507812, 28.03807830810547, 29.165311813354492, 30.292545318603516]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 9.0, 6.0, 14.0, 9.0, 16.0, 36.0, 51.0, 90.0, 191.0, 328.0, 712.0, 2380.0, 13634.0, 3698185.0, 466129.0, 9915.0, 1734.0, 475.0, 200.0, 83.0, 47.0, 22.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.28125, -42.169189453125, -41.05712890625, -39.945068359375, -38.8330078125, -37.720947265625, -36.60888671875, -35.496826171875, -34.384765625, -33.272705078125, -32.16064453125, -31.048583984375, -29.9365234375, -28.824462890625, -27.71240234375, -26.600341796875, -25.48828125, -24.376220703125, -23.26416015625, -22.152099609375, -21.0400390625, -19.927978515625, -18.81591796875, -17.703857421875, -16.591796875, -15.479736328125, -14.36767578125, -13.255615234375, -12.1435546875, -11.031494140625, -9.91943359375, -8.807373046875, -7.6953125, -6.583251953125, -5.47119140625, -4.359130859375, -3.2470703125, -2.135009765625, -1.02294921875, 0.089111328125, 1.201171875, 2.313232421875, 3.42529296875, 4.537353515625, 5.6494140625, 6.761474609375, 7.87353515625, 8.985595703125, 10.09765625, 11.209716796875, 12.32177734375, 13.433837890625, 14.5458984375, 15.657958984375, 16.77001953125, 17.882080078125, 18.994140625, 20.106201171875, 21.21826171875, 22.330322265625, 23.4423828125, 24.554443359375, 25.66650390625, 26.778564453125, 27.890625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 8.0, 4.0, 6.0, 18.0, 27.0, 46.0, 89.0, 148.0, 180.0, 148.0, 114.0, 83.0, 57.0, 32.0, 11.0, 6.0, 11.0, 8.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.736328125, -1.692779541015625, -1.64923095703125, -1.605682373046875, -1.5621337890625, -1.518585205078125, -1.47503662109375, -1.431488037109375, -1.387939453125, -1.344390869140625, -1.30084228515625, -1.257293701171875, -1.2137451171875, -1.170196533203125, -1.12664794921875, -1.083099365234375, -1.03955078125, -0.996002197265625, -0.95245361328125, -0.908905029296875, -0.8653564453125, -0.821807861328125, -0.77825927734375, -0.734710693359375, -0.691162109375, -0.647613525390625, -0.60406494140625, -0.560516357421875, -0.5169677734375, -0.473419189453125, -0.42987060546875, -0.386322021484375, -0.3427734375, -0.299224853515625, -0.25567626953125, -0.212127685546875, -0.1685791015625, -0.125030517578125, -0.08148193359375, -0.037933349609375, 0.005615234375, 0.049163818359375, 0.09271240234375, 0.136260986328125, 0.1798095703125, 0.223358154296875, 0.26690673828125, 0.310455322265625, 0.35400390625, 0.397552490234375, 0.44110107421875, 0.484649658203125, 0.5281982421875, 0.571746826171875, 0.61529541015625, 0.658843994140625, 0.702392578125, 0.745941162109375, 0.78948974609375, 0.833038330078125, 0.8765869140625, 0.920135498046875, 0.96368408203125, 1.007232666015625, 1.05078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 6.0, 9.0, 12.0, 13.0, 8.0, 28.0, 48.0, 59.0, 91.0, 160.0, 215.0, 407.0, 731.0, 1399.0, 2944.0, 7627.0, 29298.0, 208603.0, 3649902.0, 245126.0, 33148.0, 8385.0, 3047.0, 1364.0, 677.0, 390.0, 237.0, 113.0, 81.0, 53.0, 32.0, 22.0, 17.0, 13.0, 7.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.625, -13.1787109375, -12.732421875, -12.2861328125, -11.83984375, -11.3935546875, -10.947265625, -10.5009765625, -10.0546875, -9.6083984375, -9.162109375, -8.7158203125, -8.26953125, -7.8232421875, -7.376953125, -6.9306640625, -6.484375, -6.0380859375, -5.591796875, -5.1455078125, -4.69921875, -4.2529296875, -3.806640625, -3.3603515625, -2.9140625, -2.4677734375, -2.021484375, -1.5751953125, -1.12890625, -0.6826171875, -0.236328125, 0.2099609375, 0.65625, 1.1025390625, 1.548828125, 1.9951171875, 2.44140625, 2.8876953125, 3.333984375, 3.7802734375, 4.2265625, 4.6728515625, 5.119140625, 5.5654296875, 6.01171875, 6.4580078125, 6.904296875, 7.3505859375, 7.796875, 8.2431640625, 8.689453125, 9.1357421875, 9.58203125, 10.0283203125, 10.474609375, 10.9208984375, 11.3671875, 11.8134765625, 12.259765625, 12.7060546875, 13.15234375, 13.5986328125, 14.044921875, 14.4912109375, 14.9375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 3.0, 3.0, 9.0, 9.0, 16.0, 31.0, 49.0, 66.0, 134.0, 214.0, 540.0, 1770.0, 662.0, 203.0, 107.0, 68.0, 46.0, 46.0, 27.0, 25.0, 13.0, 5.0, 2.0, 7.0, 2.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.955078125, -2.8719482421875, -2.788818359375, -2.7056884765625, -2.62255859375, -2.5394287109375, -2.456298828125, -2.3731689453125, -2.2900390625, -2.2069091796875, -2.123779296875, -2.0406494140625, -1.95751953125, -1.8743896484375, -1.791259765625, -1.7081298828125, -1.625, -1.5418701171875, -1.458740234375, -1.3756103515625, -1.29248046875, -1.2093505859375, -1.126220703125, -1.0430908203125, -0.9599609375, -0.8768310546875, -0.793701171875, -0.7105712890625, -0.62744140625, -0.5443115234375, -0.461181640625, -0.3780517578125, -0.294921875, -0.2117919921875, -0.128662109375, -0.0455322265625, 0.03759765625, 0.1207275390625, 0.203857421875, 0.2869873046875, 0.3701171875, 0.4532470703125, 0.536376953125, 0.6195068359375, 0.70263671875, 0.7857666015625, 0.868896484375, 0.9520263671875, 1.03515625, 1.1182861328125, 1.201416015625, 1.2845458984375, 1.36767578125, 1.4508056640625, 1.533935546875, 1.6170654296875, 1.7001953125, 1.7833251953125, 1.866455078125, 1.9495849609375, 2.03271484375, 2.1158447265625, 2.198974609375, 2.2821044921875, 2.365234375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 10.0, 15.0, 36.0, 70.0, 130.0, 201.0, 208.0, 168.0, 88.0, 39.0, 16.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.06146240234375, -26.35172462463379, -25.641986846923828, -24.932249069213867, -24.222511291503906, -23.512775421142578, -22.803035736083984, -22.093299865722656, -21.383562088012695, -20.673824310302734, -19.964086532592773, -19.254348754882812, -18.54461097717285, -17.83487319946289, -17.125137329101562, -16.4153995513916, -15.705660820007324, -14.995923042297363, -14.286185264587402, -13.576448440551758, -12.866710662841797, -12.156972885131836, -11.447235107421875, -10.737497329711914, -10.027759552001953, -9.318021774291992, -8.608283996582031, -7.8985466957092285, -7.188809394836426, -6.479071617126465, -5.769333839416504, -5.059596538543701, -4.349859237670898, -3.6401216983795166, -2.9303841590881348, -2.220646381378174, -1.510908842086792, -0.8011713027954102, -0.09143352508544922, 0.6183037757873535, 1.3280415534973145, 2.0377790927886963, 2.747516632080078, 3.457254409790039, 4.1669921875, 4.876729488372803, 5.586467266082764, 6.296204566955566, 7.005942344665527, 7.715680122375488, 8.42541790008545, 9.135154724121094, 9.844892501831055, 10.554630279541016, 11.264368057250977, 11.974105834960938, 12.683843612670898, 13.39358139038086, 14.10331916809082, 14.813056945800781, 15.522793769836426, 16.232532501220703, 16.94226837158203, 17.652006149291992, 18.361743927001953]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 4.0, 2.0, 7.0, 4.0, 5.0, 9.0, 15.0, 12.0, 11.0, 15.0, 23.0, 16.0, 25.0, 29.0, 35.0, 39.0, 27.0, 41.0, 37.0, 39.0, 44.0, 48.0, 49.0, 50.0, 39.0, 36.0, 52.0, 34.0, 37.0, 27.0, 26.0, 27.0, 22.0, 27.0, 18.0, 14.0, 9.0, 7.0, 7.0, 7.0, 7.0, 7.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0], "bins": [-8.621857643127441, -8.376824378967285, -8.131792068481445, -7.886758804321289, -7.641725540161133, -7.396692752838135, -7.151659965515137, -6.9066267013549805, -6.661593914031982, -6.416561126708984, -6.171527862548828, -5.92649507522583, -5.681462287902832, -5.436429023742676, -5.191396236419678, -4.94636344909668, -4.701330184936523, -4.456297397613525, -4.211264133453369, -3.966231346130371, -3.721198320388794, -3.476165294647217, -3.2311325073242188, -2.9860994815826416, -2.7410664558410645, -2.4960334300994873, -2.25100040435791, -2.005967617034912, -1.760934591293335, -1.5159015655517578, -1.2708686590194702, -1.0258357524871826, -0.7808027267456055, -0.5357697606086731, -0.2907367944717407, -0.04570382833480835, 0.19932913780212402, 0.44436216354370117, 0.6893950700759888, 0.9344279766082764, 1.1794610023498535, 1.4244940280914307, 1.6695269346237183, 1.9145598411560059, 2.159592866897583, 2.40462589263916, 2.649658679962158, 2.8946917057037354, 3.1397247314453125, 3.3847577571868896, 3.629790782928467, 3.874823570251465, 4.119856834411621, 4.364889621734619, 4.609922409057617, 4.854955673217773, 5.0999884605407715, 5.3450212478637695, 5.590054512023926, 5.835087299346924, 6.080120086669922, 6.325153350830078, 6.570186138153076, 6.815218925476074, 7.0602521896362305]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 14.0, 5.0, 21.0, 17.0, 25.0, 28.0, 48.0, 57.0, 78.0, 111.0, 203.0, 273.0, 432.0, 645.0, 1132.0, 2098.0, 4243.0, 9720.0, 28407.0, 118142.0, 507203.0, 286289.0, 58897.0, 16959.0, 6454.0, 3050.0, 1520.0, 889.0, 516.0, 328.0, 224.0, 117.0, 108.0, 82.0, 48.0, 50.0, 34.0, 22.0, 14.0, 16.0, 8.0, 3.0, 5.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-8.3046875, -8.05126953125, -7.7978515625, -7.54443359375, -7.291015625, -7.03759765625, -6.7841796875, -6.53076171875, -6.27734375, -6.02392578125, -5.7705078125, -5.51708984375, -5.263671875, -5.01025390625, -4.7568359375, -4.50341796875, -4.25, -3.99658203125, -3.7431640625, -3.48974609375, -3.236328125, -2.98291015625, -2.7294921875, -2.47607421875, -2.22265625, -1.96923828125, -1.7158203125, -1.46240234375, -1.208984375, -0.95556640625, -0.7021484375, -0.44873046875, -0.1953125, 0.05810546875, 0.3115234375, 0.56494140625, 0.818359375, 1.07177734375, 1.3251953125, 1.57861328125, 1.83203125, 2.08544921875, 2.3388671875, 2.59228515625, 2.845703125, 3.09912109375, 3.3525390625, 3.60595703125, 3.859375, 4.11279296875, 4.3662109375, 4.61962890625, 4.873046875, 5.12646484375, 5.3798828125, 5.63330078125, 5.88671875, 6.14013671875, 6.3935546875, 6.64697265625, 6.900390625, 7.15380859375, 7.4072265625, 7.66064453125, 7.9140625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 2.0, 8.0, 23.0, 31.0, 51.0, 59.0, 104.0, 119.0, 143.0, 108.0, 107.0, 78.0, 59.0, 45.0, 15.0, 17.0, 12.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.7158203125, -1.6736526489257812, -1.6314849853515625, -1.5893173217773438, -1.547149658203125, -1.5049819946289062, -1.4628143310546875, -1.4206466674804688, -1.37847900390625, -1.3363113403320312, -1.2941436767578125, -1.2519760131835938, -1.209808349609375, -1.1676406860351562, -1.1254730224609375, -1.0833053588867188, -1.0411376953125, -0.9989700317382812, -0.9568023681640625, -0.9146347045898438, -0.872467041015625, -0.8302993774414062, -0.7881317138671875, -0.7459640502929688, -0.70379638671875, -0.6616287231445312, -0.6194610595703125, -0.5772933959960938, -0.535125732421875, -0.49295806884765625, -0.4507904052734375, -0.40862274169921875, -0.366455078125, -0.32428741455078125, -0.2821197509765625, -0.23995208740234375, -0.197784423828125, -0.15561676025390625, -0.1134490966796875, -0.07128143310546875, -0.02911376953125, 0.01305389404296875, 0.0552215576171875, 0.09738922119140625, 0.139556884765625, 0.18172454833984375, 0.2238922119140625, 0.26605987548828125, 0.3082275390625, 0.35039520263671875, 0.3925628662109375, 0.43473052978515625, 0.476898193359375, 0.5190658569335938, 0.5612335205078125, 0.6034011840820312, 0.64556884765625, 0.6877365112304688, 0.7299041748046875, 0.7720718383789062, 0.814239501953125, 0.8564071655273438, 0.8985748291015625, 0.9407424926757812, 0.98291015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 7.0, 5.0, 6.0, 10.0, 17.0, 16.0, 30.0, 39.0, 53.0, 66.0, 96.0, 115.0, 171.0, 217.0, 324.0, 494.0, 825.0, 1394.0, 2634.0, 5356.0, 12699.0, 34510.0, 117190.0, 440508.0, 308330.0, 79078.0, 25108.0, 9559.0, 4283.0, 2027.0, 1155.0, 688.0, 459.0, 291.0, 200.0, 157.0, 111.0, 74.0, 62.0, 45.0, 37.0, 37.0, 16.0, 14.0, 13.0, 9.0, 7.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.03125, -7.779052734375, -7.52685546875, -7.274658203125, -7.0224609375, -6.770263671875, -6.51806640625, -6.265869140625, -6.013671875, -5.761474609375, -5.50927734375, -5.257080078125, -5.0048828125, -4.752685546875, -4.50048828125, -4.248291015625, -3.99609375, -3.743896484375, -3.49169921875, -3.239501953125, -2.9873046875, -2.735107421875, -2.48291015625, -2.230712890625, -1.978515625, -1.726318359375, -1.47412109375, -1.221923828125, -0.9697265625, -0.717529296875, -0.46533203125, -0.213134765625, 0.0390625, 0.291259765625, 0.54345703125, 0.795654296875, 1.0478515625, 1.300048828125, 1.55224609375, 1.804443359375, 2.056640625, 2.308837890625, 2.56103515625, 2.813232421875, 3.0654296875, 3.317626953125, 3.56982421875, 3.822021484375, 4.07421875, 4.326416015625, 4.57861328125, 4.830810546875, 5.0830078125, 5.335205078125, 5.58740234375, 5.839599609375, 6.091796875, 6.343994140625, 6.59619140625, 6.848388671875, 7.1005859375, 7.352783203125, 7.60498046875, 7.857177734375, 8.109375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 8.0, 8.0, 3.0, 7.0, 12.0, 4.0, 13.0, 14.0, 8.0, 15.0, 22.0, 22.0, 28.0, 34.0, 37.0, 28.0, 40.0, 38.0, 55.0, 41.0, 43.0, 41.0, 48.0, 35.0, 43.0, 40.0, 40.0, 37.0, 36.0, 26.0, 33.0, 22.0, 19.0, 12.0, 21.0, 12.0, 10.0, 9.0, 9.0, 2.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.59765625, -4.46270751953125, -4.3277587890625, -4.19281005859375, -4.057861328125, -3.92291259765625, -3.7879638671875, -3.65301513671875, -3.51806640625, -3.38311767578125, -3.2481689453125, -3.11322021484375, -2.978271484375, -2.84332275390625, -2.7083740234375, -2.57342529296875, -2.4384765625, -2.30352783203125, -2.1685791015625, -2.03363037109375, -1.898681640625, -1.76373291015625, -1.6287841796875, -1.49383544921875, -1.35888671875, -1.22393798828125, -1.0889892578125, -0.95404052734375, -0.819091796875, -0.68414306640625, -0.5491943359375, -0.41424560546875, -0.279296875, -0.14434814453125, -0.0093994140625, 0.12554931640625, 0.260498046875, 0.39544677734375, 0.5303955078125, 0.66534423828125, 0.80029296875, 0.93524169921875, 1.0701904296875, 1.20513916015625, 1.340087890625, 1.47503662109375, 1.6099853515625, 1.74493408203125, 1.8798828125, 2.01483154296875, 2.1497802734375, 2.28472900390625, 2.419677734375, 2.55462646484375, 2.6895751953125, 2.82452392578125, 2.95947265625, 3.09442138671875, 3.2293701171875, 3.36431884765625, 3.499267578125, 3.63421630859375, 3.7691650390625, 3.90411376953125, 4.0390625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 9.0, 4.0, 9.0, 11.0, 14.0, 15.0, 24.0, 35.0, 45.0, 87.0, 113.0, 195.0, 276.0, 432.0, 696.0, 1195.0, 2048.0, 3699.0, 7318.0, 16296.0, 41805.0, 129415.0, 444299.0, 272792.0, 76531.0, 27376.0, 11431.0, 5435.0, 2822.0, 1521.0, 995.0, 561.0, 363.0, 211.0, 144.0, 117.0, 64.0, 54.0, 27.0, 25.0, 19.0, 14.0, 6.0, 10.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.99609375, -4.860260009765625, -4.72442626953125, -4.588592529296875, -4.4527587890625, -4.316925048828125, -4.18109130859375, -4.045257568359375, -3.909423828125, -3.773590087890625, -3.63775634765625, -3.501922607421875, -3.3660888671875, -3.230255126953125, -3.09442138671875, -2.958587646484375, -2.82275390625, -2.686920166015625, -2.55108642578125, -2.415252685546875, -2.2794189453125, -2.143585205078125, -2.00775146484375, -1.871917724609375, -1.736083984375, -1.600250244140625, -1.46441650390625, -1.328582763671875, -1.1927490234375, -1.056915283203125, -0.92108154296875, -0.785247802734375, -0.6494140625, -0.513580322265625, -0.37774658203125, -0.241912841796875, -0.1060791015625, 0.029754638671875, 0.16558837890625, 0.301422119140625, 0.437255859375, 0.573089599609375, 0.70892333984375, 0.844757080078125, 0.9805908203125, 1.116424560546875, 1.25225830078125, 1.388092041015625, 1.52392578125, 1.659759521484375, 1.79559326171875, 1.931427001953125, 2.0672607421875, 2.203094482421875, 2.33892822265625, 2.474761962890625, 2.610595703125, 2.746429443359375, 2.88226318359375, 3.018096923828125, 3.1539306640625, 3.289764404296875, 3.42559814453125, 3.561431884765625, 3.697265625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 3.0, 9.0, 10.0, 16.0, 16.0, 28.0, 27.0, 27.0, 48.0, 44.0, 70.0, 103.0, 134.0, 109.0, 89.0, 55.0, 47.0, 26.0, 27.0, 18.0, 11.0, 14.0, 13.0, 15.0, 6.0, 5.0, 6.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0007486343383789062, -0.0007256194949150085, -0.0007026046514511108, -0.0006795898079872131, -0.0006565749645233154, -0.0006335601210594177, -0.00061054527759552, -0.0005875304341316223, -0.0005645155906677246, -0.0005415007472038269, -0.0005184859037399292, -0.0004954710602760315, -0.0004724562168121338, -0.0004494413733482361, -0.0004264265298843384, -0.0004034116864204407, -0.00038039684295654297, -0.00035738199949264526, -0.00033436715602874756, -0.00031135231256484985, -0.00028833746910095215, -0.00026532262563705444, -0.00024230778217315674, -0.00021929293870925903, -0.00019627809524536133, -0.00017326325178146362, -0.00015024840831756592, -0.0001272335648536682, -0.00010421872138977051, -8.12038779258728e-05, -5.81890344619751e-05, -3.517419099807739e-05, -1.2159347534179688e-05, 1.0855495929718018e-05, 3.387033939361572e-05, 5.688518285751343e-05, 7.990002632141113e-05, 0.00010291486978530884, 0.00012592971324920654, 0.00014894455671310425, 0.00017195940017700195, 0.00019497424364089966, 0.00021798908710479736, 0.00024100393056869507, 0.0002640187740325928, 0.0002870336174964905, 0.0003100484609603882, 0.0003330633044242859, 0.0003560781478881836, 0.0003790929913520813, 0.000402107834815979, 0.0004251226782798767, 0.0004481375217437744, 0.0004711523652076721, 0.0004941672086715698, 0.0005171820521354675, 0.0005401968955993652, 0.0005632117390632629, 0.0005862265825271606, 0.0006092414259910583, 0.0006322562694549561, 0.0006552711129188538, 0.0006782859563827515, 0.0007013007998466492, 0.0007243156433105469]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 10.0, 16.0, 18.0, 28.0, 44.0, 56.0, 90.0, 113.0, 238.0, 315.0, 620.0, 1166.0, 2493.0, 6210.0, 20075.0, 88619.0, 583678.0, 277204.0, 47051.0, 12197.0, 4333.0, 1844.0, 885.0, 472.0, 271.0, 163.0, 110.0, 80.0, 40.0, 34.0, 30.0, 11.0, 11.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-7.59375, -7.36907958984375, -7.1444091796875, -6.91973876953125, -6.695068359375, -6.47039794921875, -6.2457275390625, -6.02105712890625, -5.79638671875, -5.57171630859375, -5.3470458984375, -5.12237548828125, -4.897705078125, -4.67303466796875, -4.4483642578125, -4.22369384765625, -3.9990234375, -3.77435302734375, -3.5496826171875, -3.32501220703125, -3.100341796875, -2.87567138671875, -2.6510009765625, -2.42633056640625, -2.20166015625, -1.97698974609375, -1.7523193359375, -1.52764892578125, -1.302978515625, -1.07830810546875, -0.8536376953125, -0.62896728515625, -0.404296875, -0.17962646484375, 0.0450439453125, 0.26971435546875, 0.494384765625, 0.71905517578125, 0.9437255859375, 1.16839599609375, 1.39306640625, 1.61773681640625, 1.8424072265625, 2.06707763671875, 2.291748046875, 2.51641845703125, 2.7410888671875, 2.96575927734375, 3.1904296875, 3.41510009765625, 3.6397705078125, 3.86444091796875, 4.089111328125, 4.31378173828125, 4.5384521484375, 4.76312255859375, 4.98779296875, 5.21246337890625, 5.4371337890625, 5.66180419921875, 5.886474609375, 6.11114501953125, 6.3358154296875, 6.56048583984375, 6.78515625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 1.0, 6.0, 1.0, 5.0, 6.0, 7.0, 11.0, 16.0, 17.0, 18.0, 24.0, 31.0, 40.0, 41.0, 72.0, 97.0, 124.0, 96.0, 85.0, 62.0, 47.0, 36.0, 29.0, 25.0, 30.0, 16.0, 15.0, 8.0, 11.0, 6.0, 7.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.521484375, -3.4114990234375, -3.301513671875, -3.1915283203125, -3.08154296875, -2.9715576171875, -2.861572265625, -2.7515869140625, -2.6416015625, -2.5316162109375, -2.421630859375, -2.3116455078125, -2.20166015625, -2.0916748046875, -1.981689453125, -1.8717041015625, -1.76171875, -1.6517333984375, -1.541748046875, -1.4317626953125, -1.32177734375, -1.2117919921875, -1.101806640625, -0.9918212890625, -0.8818359375, -0.7718505859375, -0.661865234375, -0.5518798828125, -0.44189453125, -0.3319091796875, -0.221923828125, -0.1119384765625, -0.001953125, 0.1080322265625, 0.218017578125, 0.3280029296875, 0.43798828125, 0.5479736328125, 0.657958984375, 0.7679443359375, 0.8779296875, 0.9879150390625, 1.097900390625, 1.2078857421875, 1.31787109375, 1.4278564453125, 1.537841796875, 1.6478271484375, 1.7578125, 1.8677978515625, 1.977783203125, 2.0877685546875, 2.19775390625, 2.3077392578125, 2.417724609375, 2.5277099609375, 2.6376953125, 2.7476806640625, 2.857666015625, 2.9676513671875, 3.07763671875, 3.1876220703125, 3.297607421875, 3.4075927734375, 3.517578125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 10.0, 23.0, 30.0, 58.0, 87.0, 163.0, 195.0, 142.0, 109.0, 58.0, 46.0, 22.0, 18.0, 10.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.97011184692383, -50.0161247253418, -48.06214141845703, -46.108154296875, -44.15416717529297, -42.20018005371094, -40.24619674682617, -38.29220962524414, -36.338226318359375, -34.384239196777344, -32.43025588989258, -30.476268768310547, -28.522281646728516, -26.568296432495117, -24.61431121826172, -22.660324096679688, -20.706336975097656, -18.752351760864258, -16.798364639282227, -14.844379425048828, -12.890393257141113, -10.936407089233398, -8.982421875, -7.028435707092285, -5.07444953918457, -3.1204636096954346, -1.1664776802062988, 0.7875080108642578, 2.7414941787719727, 4.6954803466796875, 6.649465560913086, 8.6034517288208, 10.557441711425781, 12.511427879333496, 14.465414047241211, 16.41939926147461, 18.37338638305664, 20.32737159729004, 22.281356811523438, 24.23534393310547, 26.189329147338867, 28.143314361572266, 30.097301483154297, 32.05128479003906, 34.005271911621094, 35.959259033203125, 37.913246154785156, 39.86722946166992, 41.82121658325195, 43.775203704833984, 45.72918701171875, 47.68317413330078, 49.63716125488281, 51.591148376464844, 53.54513168334961, 55.49911880493164, 57.453102111816406, 59.40708923339844, 61.3610725402832, 63.315059661865234, 65.26904296875, 67.22303009033203, 69.17701721191406, 71.1310043334961, 73.08499145507812]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 7.0, 8.0, 6.0, 8.0, 19.0, 24.0, 16.0, 16.0, 17.0, 26.0, 30.0, 24.0, 28.0, 52.0, 55.0, 38.0, 46.0, 51.0, 47.0, 35.0, 41.0, 34.0, 40.0, 29.0, 34.0, 26.0, 35.0, 35.0, 22.0, 31.0, 18.0, 23.0, 13.0, 14.0, 9.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.17507553100586, -28.222301483154297, -27.269527435302734, -26.316753387451172, -25.363981246948242, -24.41120719909668, -23.458433151245117, -22.505659103393555, -21.552885055541992, -20.60011100769043, -19.647336959838867, -18.694564819335938, -17.741790771484375, -16.789016723632812, -15.83624267578125, -14.883468627929688, -13.930695533752441, -12.977921485900879, -12.025148391723633, -11.07237434387207, -10.119600296020508, -9.166826248168945, -8.2140531539917, -7.261279106140137, -6.308505535125732, -5.355731964111328, -4.402957916259766, -3.4501843452453613, -2.497410535812378, -1.5446367263793945, -0.5918631553649902, 0.36091089248657227, 1.3136844635009766, 2.26645827293396, 3.2192320823669434, 4.172005653381348, 5.12477970123291, 6.0775532722473145, 7.030326843261719, 7.983100891113281, 8.935874938964844, 9.888648986816406, 10.841422080993652, 11.794196128845215, 12.746970176696777, 13.699743270874023, 14.652517318725586, 15.605291366577148, 16.558063507080078, 17.51083755493164, 18.463611602783203, 19.416385650634766, 20.369157791137695, 21.321931838989258, 22.27470588684082, 23.227479934692383, 24.180253982543945, 25.133028030395508, 26.08580207824707, 27.03857421875, 27.991348266601562, 28.944122314453125, 29.896896362304688, 30.84967041015625, 31.802444458007812]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 4.0, 2.0, 6.0, 2.0, 8.0, 5.0, 7.0, 9.0, 14.0, 11.0, 12.0, 18.0, 33.0, 39.0, 52.0, 106.0, 116.0, 160.0, 260.0, 421.0, 616.0, 1204.0, 2449.0, 5741.0, 17776.0, 98953.0, 3834051.0, 192741.0, 25806.0, 7664.0, 2956.0, 1357.0, 714.0, 370.0, 202.0, 134.0, 96.0, 48.0, 40.0, 20.0, 19.0, 8.0, 8.0, 8.0, 11.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-14.21875, -13.8505859375, -13.482421875, -13.1142578125, -12.74609375, -12.3779296875, -12.009765625, -11.6416015625, -11.2734375, -10.9052734375, -10.537109375, -10.1689453125, -9.80078125, -9.4326171875, -9.064453125, -8.6962890625, -8.328125, -7.9599609375, -7.591796875, -7.2236328125, -6.85546875, -6.4873046875, -6.119140625, -5.7509765625, -5.3828125, -5.0146484375, -4.646484375, -4.2783203125, -3.91015625, -3.5419921875, -3.173828125, -2.8056640625, -2.4375, -2.0693359375, -1.701171875, -1.3330078125, -0.96484375, -0.5966796875, -0.228515625, 0.1396484375, 0.5078125, 0.8759765625, 1.244140625, 1.6123046875, 1.98046875, 2.3486328125, 2.716796875, 3.0849609375, 3.453125, 3.8212890625, 4.189453125, 4.5576171875, 4.92578125, 5.2939453125, 5.662109375, 6.0302734375, 6.3984375, 6.7666015625, 7.134765625, 7.5029296875, 7.87109375, 8.2392578125, 8.607421875, 8.9755859375, 9.34375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 8.0, 8.0, 13.0, 19.0, 24.0, 53.0, 72.0, 86.0, 95.0, 101.0, 93.0, 83.0, 73.0, 88.0, 56.0, 46.0, 30.0, 9.0, 11.0, 11.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.765625, -1.7216796875, -1.677734375, -1.6337890625, -1.58984375, -1.5458984375, -1.501953125, -1.4580078125, -1.4140625, -1.3701171875, -1.326171875, -1.2822265625, -1.23828125, -1.1943359375, -1.150390625, -1.1064453125, -1.0625, -1.0185546875, -0.974609375, -0.9306640625, -0.88671875, -0.8427734375, -0.798828125, -0.7548828125, -0.7109375, -0.6669921875, -0.623046875, -0.5791015625, -0.53515625, -0.4912109375, -0.447265625, -0.4033203125, -0.359375, -0.3154296875, -0.271484375, -0.2275390625, -0.18359375, -0.1396484375, -0.095703125, -0.0517578125, -0.0078125, 0.0361328125, 0.080078125, 0.1240234375, 0.16796875, 0.2119140625, 0.255859375, 0.2998046875, 0.34375, 0.3876953125, 0.431640625, 0.4755859375, 0.51953125, 0.5634765625, 0.607421875, 0.6513671875, 0.6953125, 0.7392578125, 0.783203125, 0.8271484375, 0.87109375, 0.9150390625, 0.958984375, 1.0029296875, 1.046875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 8.0, 11.0, 15.0, 20.0, 28.0, 61.0, 68.0, 109.0, 153.0, 260.0, 473.0, 732.0, 1274.0, 2446.0, 5119.0, 12774.0, 38913.0, 188046.0, 3380090.0, 466223.0, 64358.0, 18913.0, 7123.0, 3219.0, 1615.0, 925.0, 487.0, 281.0, 173.0, 112.0, 83.0, 58.0, 29.0, 20.0, 20.0, 9.0, 7.0, 6.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.796875, -8.54327392578125, -8.2896728515625, -8.03607177734375, -7.782470703125, -7.52886962890625, -7.2752685546875, -7.02166748046875, -6.76806640625, -6.51446533203125, -6.2608642578125, -6.00726318359375, -5.753662109375, -5.50006103515625, -5.2464599609375, -4.99285888671875, -4.7392578125, -4.48565673828125, -4.2320556640625, -3.97845458984375, -3.724853515625, -3.47125244140625, -3.2176513671875, -2.96405029296875, -2.71044921875, -2.45684814453125, -2.2032470703125, -1.94964599609375, -1.696044921875, -1.44244384765625, -1.1888427734375, -0.93524169921875, -0.681640625, -0.42803955078125, -0.1744384765625, 0.07916259765625, 0.332763671875, 0.58636474609375, 0.8399658203125, 1.09356689453125, 1.34716796875, 1.60076904296875, 1.8543701171875, 2.10797119140625, 2.361572265625, 2.61517333984375, 2.8687744140625, 3.12237548828125, 3.3759765625, 3.62957763671875, 3.8831787109375, 4.13677978515625, 4.390380859375, 4.64398193359375, 4.8975830078125, 5.15118408203125, 5.40478515625, 5.65838623046875, 5.9119873046875, 6.16558837890625, 6.419189453125, 6.67279052734375, 6.9263916015625, 7.17999267578125, 7.43359375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 6.0, 10.0, 6.0, 16.0, 20.0, 30.0, 33.0, 55.0, 89.0, 114.0, 224.0, 548.0, 1644.0, 624.0, 252.0, 120.0, 82.0, 48.0, 36.0, 25.0, 20.0, 18.0, 9.0, 13.0, 9.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.326171875, -2.262542724609375, -2.19891357421875, -2.135284423828125, -2.0716552734375, -2.008026123046875, -1.94439697265625, -1.880767822265625, -1.817138671875, -1.753509521484375, -1.68988037109375, -1.626251220703125, -1.5626220703125, -1.498992919921875, -1.43536376953125, -1.371734619140625, -1.30810546875, -1.244476318359375, -1.18084716796875, -1.117218017578125, -1.0535888671875, -0.989959716796875, -0.92633056640625, -0.862701416015625, -0.799072265625, -0.735443115234375, -0.67181396484375, -0.608184814453125, -0.5445556640625, -0.480926513671875, -0.41729736328125, -0.353668212890625, -0.2900390625, -0.226409912109375, -0.16278076171875, -0.099151611328125, -0.0355224609375, 0.028106689453125, 0.09173583984375, 0.155364990234375, 0.218994140625, 0.282623291015625, 0.34625244140625, 0.409881591796875, 0.4735107421875, 0.537139892578125, 0.60076904296875, 0.664398193359375, 0.72802734375, 0.791656494140625, 0.85528564453125, 0.918914794921875, 0.9825439453125, 1.046173095703125, 1.10980224609375, 1.173431396484375, 1.237060546875, 1.300689697265625, 1.36431884765625, 1.427947998046875, 1.4915771484375, 1.555206298828125, 1.61883544921875, 1.682464599609375, 1.74609375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 7.0, 10.0, 24.0, 91.0, 210.0, 323.0, 209.0, 86.0, 32.0, 12.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.86993408203125, -24.92953109741211, -23.989126205444336, -23.048723220825195, -22.108318328857422, -21.16791534423828, -20.227510452270508, -19.287107467651367, -18.346702575683594, -17.406299591064453, -16.46589469909668, -15.525490760803223, -14.585086822509766, -13.644683837890625, -12.704278945922852, -11.763875961303711, -10.823472023010254, -9.883068084716797, -8.94266414642334, -8.002260208129883, -7.061856269836426, -6.121452808380127, -5.18104887008667, -4.240644931793213, -3.300240993499756, -2.359837055206299, -1.4194332361221313, -0.47902941703796387, 0.46137452125549316, 1.401778221130371, 2.342182159423828, 3.282586097717285, 4.222990036010742, 5.163393974304199, 6.103797912597656, 7.044201850891113, 7.98460578918457, 8.925008773803711, 9.865413665771484, 10.805816650390625, 11.746221542358398, 12.686625480651855, 13.627029418945312, 14.56743335723877, 15.507837295532227, 16.448240280151367, 17.38864517211914, 18.32904815673828, 19.269451141357422, 20.209854125976562, 21.150259017944336, 22.090662002563477, 23.03106689453125, 23.97146987915039, 24.911874771118164, 25.852277755737305, 26.792682647705078, 27.73308563232422, 28.673490524291992, 29.613893508911133, 30.554298400878906, 31.494701385498047, 32.43510437011719, 33.375511169433594, 34.315914154052734]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 7.0, 9.0, 15.0, 13.0, 16.0, 24.0, 32.0, 21.0, 26.0, 30.0, 38.0, 40.0, 53.0, 47.0, 43.0, 59.0, 57.0, 48.0, 45.0, 56.0, 53.0, 39.0, 33.0, 33.0, 20.0, 31.0, 18.0, 19.0, 15.0, 8.0, 9.0, 5.0, 6.0, 6.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.428889274597168, -7.2026143074035645, -6.976339817047119, -6.750064849853516, -6.52379035949707, -6.297515392303467, -6.0712409019470215, -5.844965934753418, -5.618691444396973, -5.392416477203369, -5.166141986846924, -4.93986701965332, -4.713592529296875, -4.4873175621032715, -4.261043071746826, -4.034768104553223, -3.8084933757781982, -3.582218647003174, -3.3559439182281494, -3.129669189453125, -2.9033944606781006, -2.677119731903076, -2.4508447647094727, -2.2245702743530273, -1.9982954263687134, -1.772020697593689, -1.5457459688186646, -1.3194711208343506, -1.0931963920593262, -0.8669216632843018, -0.6406469345092773, -0.41437220573425293, -0.18809747695922852, 0.03817726671695709, 0.2644520103931427, 0.4907267689704895, 0.7170014977455139, 0.9432762861251831, 1.1695510149002075, 1.395825743675232, 1.6221004724502563, 1.8483752012252808, 2.0746500492095947, 2.300924777984619, 2.5271995067596436, 2.753474235534668, 2.9797489643096924, 3.206023693084717, 3.432298421859741, 3.6585731506347656, 3.88484787940979, 4.1111226081848145, 4.337397575378418, 4.563672065734863, 4.789947032928467, 5.016221523284912, 5.242496490478516, 5.468771457672119, 5.6950459480285645, 5.921320915222168, 6.147595405578613, 6.373870372772217, 6.600144863128662, 6.826419830322266, 7.052694320678711]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 10.0, 12.0, 9.0, 15.0, 18.0, 22.0, 18.0, 29.0, 43.0, 54.0, 68.0, 83.0, 97.0, 167.0, 286.0, 393.0, 709.0, 1067.0, 1922.0, 3557.0, 7408.0, 17448.0, 47829.0, 158336.0, 440516.0, 250044.0, 73208.0, 24670.0, 10009.0, 4560.0, 2344.0, 1258.0, 792.0, 489.0, 312.0, 212.0, 141.0, 85.0, 70.0, 50.0, 53.0, 27.0, 22.0, 22.0, 20.0, 11.0, 20.0, 7.0, 4.0, 1.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.8951416015625, -5.696533203125, -5.4979248046875, -5.29931640625, -5.1007080078125, -4.902099609375, -4.7034912109375, -4.5048828125, -4.3062744140625, -4.107666015625, -3.9090576171875, -3.71044921875, -3.5118408203125, -3.313232421875, -3.1146240234375, -2.916015625, -2.7174072265625, -2.518798828125, -2.3201904296875, -2.12158203125, -1.9229736328125, -1.724365234375, -1.5257568359375, -1.3271484375, -1.1285400390625, -0.929931640625, -0.7313232421875, -0.53271484375, -0.3341064453125, -0.135498046875, 0.0631103515625, 0.26171875, 0.4603271484375, 0.658935546875, 0.8575439453125, 1.05615234375, 1.2547607421875, 1.453369140625, 1.6519775390625, 1.8505859375, 2.0491943359375, 2.247802734375, 2.4464111328125, 2.64501953125, 2.8436279296875, 3.042236328125, 3.2408447265625, 3.439453125, 3.6380615234375, 3.836669921875, 4.0352783203125, 4.23388671875, 4.4324951171875, 4.631103515625, 4.8297119140625, 5.0283203125, 5.2269287109375, 5.425537109375, 5.6241455078125, 5.82275390625, 6.0213623046875, 6.219970703125, 6.4185791015625, 6.6171875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 8.0, 3.0, 5.0, 16.0, 24.0, 38.0, 47.0, 51.0, 66.0, 97.0, 85.0, 97.0, 87.0, 99.0, 75.0, 56.0, 41.0, 34.0, 27.0, 16.0, 9.0, 7.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.66796875, -1.625762939453125, -1.58355712890625, -1.541351318359375, -1.4991455078125, -1.456939697265625, -1.41473388671875, -1.372528076171875, -1.330322265625, -1.288116455078125, -1.24591064453125, -1.203704833984375, -1.1614990234375, -1.119293212890625, -1.07708740234375, -1.034881591796875, -0.99267578125, -0.950469970703125, -0.90826416015625, -0.866058349609375, -0.8238525390625, -0.781646728515625, -0.73944091796875, -0.697235107421875, -0.655029296875, -0.612823486328125, -0.57061767578125, -0.528411865234375, -0.4862060546875, -0.444000244140625, -0.40179443359375, -0.359588623046875, -0.3173828125, -0.275177001953125, -0.23297119140625, -0.190765380859375, -0.1485595703125, -0.106353759765625, -0.06414794921875, -0.021942138671875, 0.020263671875, 0.062469482421875, 0.10467529296875, 0.146881103515625, 0.1890869140625, 0.231292724609375, 0.27349853515625, 0.315704345703125, 0.35791015625, 0.400115966796875, 0.44232177734375, 0.484527587890625, 0.5267333984375, 0.568939208984375, 0.61114501953125, 0.653350830078125, 0.695556640625, 0.737762451171875, 0.77996826171875, 0.822174072265625, 0.8643798828125, 0.906585693359375, 0.94879150390625, 0.990997314453125, 1.033203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 11.0, 11.0, 17.0, 34.0, 39.0, 50.0, 57.0, 98.0, 129.0, 218.0, 326.0, 495.0, 759.0, 1397.0, 2684.0, 5743.0, 15036.0, 45496.0, 165205.0, 467496.0, 242262.0, 65672.0, 20252.0, 7560.0, 3356.0, 1576.0, 909.0, 546.0, 361.0, 241.0, 133.0, 114.0, 74.0, 63.0, 35.0, 26.0, 25.0, 12.0, 7.0, 8.0, 3.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.453125, -6.24920654296875, -6.0452880859375, -5.84136962890625, -5.637451171875, -5.43353271484375, -5.2296142578125, -5.02569580078125, -4.82177734375, -4.61785888671875, -4.4139404296875, -4.21002197265625, -4.006103515625, -3.80218505859375, -3.5982666015625, -3.39434814453125, -3.1904296875, -2.98651123046875, -2.7825927734375, -2.57867431640625, -2.374755859375, -2.17083740234375, -1.9669189453125, -1.76300048828125, -1.55908203125, -1.35516357421875, -1.1512451171875, -0.94732666015625, -0.743408203125, -0.53948974609375, -0.3355712890625, -0.13165283203125, 0.072265625, 0.27618408203125, 0.4801025390625, 0.68402099609375, 0.887939453125, 1.09185791015625, 1.2957763671875, 1.49969482421875, 1.70361328125, 1.90753173828125, 2.1114501953125, 2.31536865234375, 2.519287109375, 2.72320556640625, 2.9271240234375, 3.13104248046875, 3.3349609375, 3.53887939453125, 3.7427978515625, 3.94671630859375, 4.150634765625, 4.35455322265625, 4.5584716796875, 4.76239013671875, 4.96630859375, 5.17022705078125, 5.3741455078125, 5.57806396484375, 5.781982421875, 5.98590087890625, 6.1898193359375, 6.39373779296875, 6.59765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 3.0, 7.0, 8.0, 13.0, 10.0, 19.0, 25.0, 27.0, 27.0, 50.0, 50.0, 46.0, 63.0, 61.0, 67.0, 82.0, 63.0, 58.0, 59.0, 47.0, 46.0, 29.0, 29.0, 26.0, 18.0, 14.0, 15.0, 9.0, 6.0, 8.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.5594482421875, -4.376708984375, -4.1939697265625, -4.01123046875, -3.8284912109375, -3.645751953125, -3.4630126953125, -3.2802734375, -3.0975341796875, -2.914794921875, -2.7320556640625, -2.54931640625, -2.3665771484375, -2.183837890625, -2.0010986328125, -1.818359375, -1.6356201171875, -1.452880859375, -1.2701416015625, -1.08740234375, -0.9046630859375, -0.721923828125, -0.5391845703125, -0.3564453125, -0.1737060546875, 0.009033203125, 0.1917724609375, 0.37451171875, 0.5572509765625, 0.739990234375, 0.9227294921875, 1.10546875, 1.2882080078125, 1.470947265625, 1.6536865234375, 1.83642578125, 2.0191650390625, 2.201904296875, 2.3846435546875, 2.5673828125, 2.7501220703125, 2.932861328125, 3.1156005859375, 3.29833984375, 3.4810791015625, 3.663818359375, 3.8465576171875, 4.029296875, 4.2120361328125, 4.394775390625, 4.5775146484375, 4.76025390625, 4.9429931640625, 5.125732421875, 5.3084716796875, 5.4912109375, 5.6739501953125, 5.856689453125, 6.0394287109375, 6.22216796875, 6.4049072265625, 6.587646484375, 6.7703857421875, 6.953125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 6.0, 10.0, 14.0, 16.0, 24.0, 32.0, 33.0, 69.0, 138.0, 193.0, 356.0, 644.0, 1278.0, 2607.0, 6402.0, 18130.0, 65355.0, 301111.0, 479688.0, 124545.0, 30595.0, 9868.0, 3852.0, 1670.0, 797.0, 466.0, 226.0, 141.0, 93.0, 63.0, 42.0, 24.0, 22.0, 13.0, 15.0, 8.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.994140625, -2.895050048828125, -2.79595947265625, -2.696868896484375, -2.5977783203125, -2.498687744140625, -2.39959716796875, -2.300506591796875, -2.201416015625, -2.102325439453125, -2.00323486328125, -1.904144287109375, -1.8050537109375, -1.705963134765625, -1.60687255859375, -1.507781982421875, -1.40869140625, -1.309600830078125, -1.21051025390625, -1.111419677734375, -1.0123291015625, -0.913238525390625, -0.81414794921875, -0.715057373046875, -0.615966796875, -0.516876220703125, -0.41778564453125, -0.318695068359375, -0.2196044921875, -0.120513916015625, -0.02142333984375, 0.077667236328125, 0.1767578125, 0.275848388671875, 0.37493896484375, 0.474029541015625, 0.5731201171875, 0.672210693359375, 0.77130126953125, 0.870391845703125, 0.969482421875, 1.068572998046875, 1.16766357421875, 1.266754150390625, 1.3658447265625, 1.464935302734375, 1.56402587890625, 1.663116455078125, 1.76220703125, 1.861297607421875, 1.96038818359375, 2.059478759765625, 2.1585693359375, 2.257659912109375, 2.35675048828125, 2.455841064453125, 2.554931640625, 2.654022216796875, 2.75311279296875, 2.852203369140625, 2.9512939453125, 3.050384521484375, 3.14947509765625, 3.248565673828125, 3.34765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 7.0, 3.0, 2.0, 3.0, 7.0, 4.0, 9.0, 8.0, 6.0, 15.0, 21.0, 20.0, 34.0, 52.0, 49.0, 61.0, 71.0, 81.0, 88.0, 103.0, 68.0, 50.0, 59.0, 39.0, 30.0, 17.0, 21.0, 19.0, 12.0, 11.0, 9.0, 6.0, 3.0, 3.0, 2.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.0005655288696289062, -0.0005508400499820709, -0.0005361512303352356, -0.0005214624106884003, -0.0005067735910415649, -0.0004920847713947296, -0.0004773959517478943, -0.00046270713210105896, -0.00044801831245422363, -0.0004333294928073883, -0.000418640673160553, -0.00040395185351371765, -0.0003892630338668823, -0.000374574214220047, -0.00035988539457321167, -0.00034519657492637634, -0.000330507755279541, -0.0003158189356327057, -0.00030113011598587036, -0.00028644129633903503, -0.0002717524766921997, -0.0002570636570453644, -0.00024237483739852905, -0.00022768601775169373, -0.0002129971981048584, -0.00019830837845802307, -0.00018361955881118774, -0.00016893073916435242, -0.0001542419195175171, -0.00013955309987068176, -0.00012486428022384644, -0.00011017546057701111, -9.548664093017578e-05, -8.079782128334045e-05, -6.610900163650513e-05, -5.14201819896698e-05, -3.673136234283447e-05, -2.2042542695999146e-05, -7.353723049163818e-06, 7.335096597671509e-06, 2.2023916244506836e-05, 3.671273589134216e-05, 5.140155553817749e-05, 6.609037518501282e-05, 8.077919483184814e-05, 9.546801447868347e-05, 0.0001101568341255188, 0.00012484565377235413, 0.00013953447341918945, 0.00015422329306602478, 0.0001689121127128601, 0.00018360093235969543, 0.00019828975200653076, 0.0002129785716533661, 0.00022766739130020142, 0.00024235621094703674, 0.00025704503059387207, 0.0002717338502407074, 0.0002864226698875427, 0.00030111148953437805, 0.0003158003091812134, 0.0003304891288280487, 0.00034517794847488403, 0.00035986676812171936, 0.0003745555877685547]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 8.0, 7.0, 12.0, 12.0, 21.0, 25.0, 44.0, 54.0, 81.0, 111.0, 192.0, 289.0, 449.0, 837.0, 1610.0, 3553.0, 8610.0, 25865.0, 100688.0, 454615.0, 346907.0, 71466.0, 19916.0, 6954.0, 2948.0, 1393.0, 739.0, 413.0, 252.0, 174.0, 91.0, 60.0, 49.0, 25.0, 21.0, 15.0, 7.0, 12.0, 9.0, 5.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.890625, -2.783111572265625, -2.67559814453125, -2.568084716796875, -2.4605712890625, -2.353057861328125, -2.24554443359375, -2.138031005859375, -2.030517578125, -1.923004150390625, -1.81549072265625, -1.707977294921875, -1.6004638671875, -1.492950439453125, -1.38543701171875, -1.277923583984375, -1.17041015625, -1.062896728515625, -0.95538330078125, -0.847869873046875, -0.7403564453125, -0.632843017578125, -0.52532958984375, -0.417816162109375, -0.310302734375, -0.202789306640625, -0.09527587890625, 0.012237548828125, 0.1197509765625, 0.227264404296875, 0.33477783203125, 0.442291259765625, 0.5498046875, 0.657318115234375, 0.76483154296875, 0.872344970703125, 0.9798583984375, 1.087371826171875, 1.19488525390625, 1.302398681640625, 1.409912109375, 1.517425537109375, 1.62493896484375, 1.732452392578125, 1.8399658203125, 1.947479248046875, 2.05499267578125, 2.162506103515625, 2.27001953125, 2.377532958984375, 2.48504638671875, 2.592559814453125, 2.7000732421875, 2.807586669921875, 2.91510009765625, 3.022613525390625, 3.130126953125, 3.237640380859375, 3.34515380859375, 3.452667236328125, 3.5601806640625, 3.667694091796875, 3.77520751953125, 3.882720947265625, 3.990234375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 7.0, 18.0, 14.0, 16.0, 30.0, 43.0, 40.0, 40.0, 50.0, 52.0, 53.0, 65.0, 78.0, 56.0, 51.0, 68.0, 54.0, 43.0, 40.0, 31.0, 22.0, 19.0, 14.0, 15.0, 7.0, 13.0, 9.0, 7.0, 8.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.521484375, -1.464324951171875, -1.40716552734375, -1.350006103515625, -1.2928466796875, -1.235687255859375, -1.17852783203125, -1.121368408203125, -1.064208984375, -1.007049560546875, -0.94989013671875, -0.892730712890625, -0.8355712890625, -0.778411865234375, -0.72125244140625, -0.664093017578125, -0.60693359375, -0.549774169921875, -0.49261474609375, -0.435455322265625, -0.3782958984375, -0.321136474609375, -0.26397705078125, -0.206817626953125, -0.149658203125, -0.092498779296875, -0.03533935546875, 0.021820068359375, 0.0789794921875, 0.136138916015625, 0.19329833984375, 0.250457763671875, 0.3076171875, 0.364776611328125, 0.42193603515625, 0.479095458984375, 0.5362548828125, 0.593414306640625, 0.65057373046875, 0.707733154296875, 0.764892578125, 0.822052001953125, 0.87921142578125, 0.936370849609375, 0.9935302734375, 1.050689697265625, 1.10784912109375, 1.165008544921875, 1.22216796875, 1.279327392578125, 1.33648681640625, 1.393646240234375, 1.4508056640625, 1.507965087890625, 1.56512451171875, 1.622283935546875, 1.679443359375, 1.736602783203125, 1.79376220703125, 1.850921630859375, 1.9080810546875, 1.965240478515625, 2.02239990234375, 2.079559326171875, 2.13671875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 4.0, 8.0, 6.0, 22.0, 24.0, 49.0, 52.0, 98.0, 102.0, 130.0, 117.0, 130.0, 93.0, 63.0, 39.0, 21.0, 16.0, 6.0, 9.0, 6.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.254756927490234, -30.047578811645508, -28.84040069580078, -27.633222579956055, -26.426044464111328, -25.21886444091797, -24.011686325073242, -22.804508209228516, -21.59733009338379, -20.390151977539062, -19.182973861694336, -17.97579574584961, -16.76861572265625, -15.56143856048584, -14.354259490966797, -13.14708137512207, -11.939903259277344, -10.732725143432617, -9.52554702758789, -8.318367958068848, -7.111189842224121, -5.9040117263793945, -4.69683313369751, -3.489654541015625, -2.2824764251708984, -1.0752980709075928, 0.1318802833557129, 1.3390586376190186, 2.546236991882324, 3.753415107727051, 4.9605937004089355, 6.16777229309082, 7.374946594238281, 8.582124710083008, 9.789302825927734, 10.996481895446777, 12.203660011291504, 13.41083812713623, 14.618017196655273, 15.8251953125, 17.032373428344727, 18.239551544189453, 19.44672966003418, 20.653907775878906, 21.861087799072266, 23.06826400756836, 24.27544403076172, 25.482622146606445, 26.689800262451172, 27.8969783782959, 29.104156494140625, 30.31133460998535, 31.518512725830078, 32.72569274902344, 33.93286895751953, 35.14004898071289, 36.34722900390625, 37.55440902709961, 38.7615852355957, 39.96876525878906, 41.175941467285156, 42.383121490478516, 43.59029769897461, 44.79747772216797, 46.00465393066406]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 9.0, 8.0, 9.0, 12.0, 11.0, 10.0, 22.0, 15.0, 21.0, 29.0, 37.0, 25.0, 29.0, 46.0, 35.0, 37.0, 33.0, 52.0, 40.0, 51.0, 55.0, 46.0, 42.0, 36.0, 32.0, 34.0, 23.0, 28.0, 28.0, 25.0, 17.0, 17.0, 17.0, 18.0, 8.0, 5.0, 7.0, 2.0, 9.0, 6.0, 7.0, 3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.670129776000977, -22.955322265625, -22.240516662597656, -21.52570915222168, -20.810901641845703, -20.09609603881836, -19.381288528442383, -18.666481018066406, -17.951675415039062, -17.236867904663086, -16.522062301635742, -15.807254791259766, -15.092448234558105, -14.377641677856445, -13.662834167480469, -12.948027610778809, -12.233221054077148, -11.518414497375488, -10.803607940673828, -10.088800430297852, -9.373993873596191, -8.659187316894531, -7.944380283355713, -7.2295732498168945, -6.514766693115234, -5.799960136413574, -5.085153102874756, -4.3703460693359375, -3.6555395126342773, -2.940732717514038, -2.225925922393799, -1.5111188888549805, -0.7963104248046875, -0.08150362968444824, 0.633303165435791, 1.3481099605560303, 2.0629167556762695, 2.777723550796509, 3.492530345916748, 4.207337379455566, 4.922143936157227, 5.636950492858887, 6.351757526397705, 7.066564559936523, 7.781371116638184, 8.496177673339844, 9.21098518371582, 9.92579174041748, 10.64059829711914, 11.3554048538208, 12.070211410522461, 12.785018920898438, 13.499825477600098, 14.214632034301758, 14.929439544677734, 15.644246101379395, 16.359052658081055, 17.07386016845703, 17.788665771484375, 18.50347328186035, 19.218280792236328, 19.933086395263672, 20.64789390563965, 21.362701416015625, 22.07750701904297]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 8.0, 8.0, 17.0, 15.0, 16.0, 24.0, 37.0, 49.0, 89.0, 91.0, 138.0, 216.0, 403.0, 584.0, 1096.0, 2085.0, 4552.0, 11770.0, 44440.0, 1119618.0, 2935486.0, 50841.0, 12911.0, 4840.0, 2170.0, 1161.0, 633.0, 366.0, 199.0, 124.0, 97.0, 55.0, 42.0, 25.0, 18.0, 15.0, 6.0, 8.0, 8.0, 1.0, 2.0, 2.0, 5.0], "bins": [-12.3203125, -12.02001953125, -11.7197265625, -11.41943359375, -11.119140625, -10.81884765625, -10.5185546875, -10.21826171875, -9.91796875, -9.61767578125, -9.3173828125, -9.01708984375, -8.716796875, -8.41650390625, -8.1162109375, -7.81591796875, -7.515625, -7.21533203125, -6.9150390625, -6.61474609375, -6.314453125, -6.01416015625, -5.7138671875, -5.41357421875, -5.11328125, -4.81298828125, -4.5126953125, -4.21240234375, -3.912109375, -3.61181640625, -3.3115234375, -3.01123046875, -2.7109375, -2.41064453125, -2.1103515625, -1.81005859375, -1.509765625, -1.20947265625, -0.9091796875, -0.60888671875, -0.30859375, -0.00830078125, 0.2919921875, 0.59228515625, 0.892578125, 1.19287109375, 1.4931640625, 1.79345703125, 2.09375, 2.39404296875, 2.6943359375, 2.99462890625, 3.294921875, 3.59521484375, 3.8955078125, 4.19580078125, 4.49609375, 4.79638671875, 5.0966796875, 5.39697265625, 5.697265625, 5.99755859375, 6.2978515625, 6.59814453125, 6.8984375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 7.0, 2.0, 6.0, 12.0, 15.0, 20.0, 26.0, 43.0, 49.0, 52.0, 64.0, 82.0, 85.0, 101.0, 73.0, 78.0, 66.0, 60.0, 39.0, 36.0, 24.0, 19.0, 16.0, 7.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.626953125, -1.5865325927734375, -1.546112060546875, -1.5056915283203125, -1.46527099609375, -1.4248504638671875, -1.384429931640625, -1.3440093994140625, -1.3035888671875, -1.2631683349609375, -1.222747802734375, -1.1823272705078125, -1.14190673828125, -1.1014862060546875, -1.061065673828125, -1.0206451416015625, -0.980224609375, -0.9398040771484375, -0.899383544921875, -0.8589630126953125, -0.81854248046875, -0.7781219482421875, -0.737701416015625, -0.6972808837890625, -0.6568603515625, -0.6164398193359375, -0.576019287109375, -0.5355987548828125, -0.49517822265625, -0.4547576904296875, -0.414337158203125, -0.3739166259765625, -0.33349609375, -0.2930755615234375, -0.252655029296875, -0.2122344970703125, -0.17181396484375, -0.1313934326171875, -0.090972900390625, -0.0505523681640625, -0.0101318359375, 0.0302886962890625, 0.070709228515625, 0.1111297607421875, 0.15155029296875, 0.1919708251953125, 0.232391357421875, 0.2728118896484375, 0.313232421875, 0.3536529541015625, 0.394073486328125, 0.4344940185546875, 0.47491455078125, 0.5153350830078125, 0.555755615234375, 0.5961761474609375, 0.6365966796875, 0.6770172119140625, 0.717437744140625, 0.7578582763671875, 0.79827880859375, 0.8386993408203125, 0.879119873046875, 0.9195404052734375, 0.9599609375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 5.0, 5.0, 10.0, 12.0, 22.0, 34.0, 35.0, 55.0, 80.0, 121.0, 181.0, 266.0, 425.0, 620.0, 999.0, 1847.0, 3592.0, 7738.0, 21046.0, 80155.0, 1130053.0, 2803778.0, 101315.0, 24362.0, 8857.0, 3867.0, 1927.0, 1085.0, 641.0, 375.0, 249.0, 152.0, 113.0, 53.0, 52.0, 44.0, 30.0, 21.0, 15.0, 18.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.67578125, -6.43792724609375, -6.2000732421875, -5.96221923828125, -5.724365234375, -5.48651123046875, -5.2486572265625, -5.01080322265625, -4.77294921875, -4.53509521484375, -4.2972412109375, -4.05938720703125, -3.821533203125, -3.58367919921875, -3.3458251953125, -3.10797119140625, -2.8701171875, -2.63226318359375, -2.3944091796875, -2.15655517578125, -1.918701171875, -1.68084716796875, -1.4429931640625, -1.20513916015625, -0.96728515625, -0.72943115234375, -0.4915771484375, -0.25372314453125, -0.015869140625, 0.22198486328125, 0.4598388671875, 0.69769287109375, 0.935546875, 1.17340087890625, 1.4112548828125, 1.64910888671875, 1.886962890625, 2.12481689453125, 2.3626708984375, 2.60052490234375, 2.83837890625, 3.07623291015625, 3.3140869140625, 3.55194091796875, 3.789794921875, 4.02764892578125, 4.2655029296875, 4.50335693359375, 4.7412109375, 4.97906494140625, 5.2169189453125, 5.45477294921875, 5.692626953125, 5.93048095703125, 6.1683349609375, 6.40618896484375, 6.64404296875, 6.88189697265625, 7.1197509765625, 7.35760498046875, 7.595458984375, 7.83331298828125, 8.0711669921875, 8.30902099609375, 8.546875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 10.0, 14.0, 23.0, 36.0, 41.0, 60.0, 98.0, 182.0, 507.0, 2031.0, 527.0, 217.0, 101.0, 74.0, 36.0, 29.0, 14.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.13653564453125, -2.0640869140625, -1.99163818359375, -1.919189453125, -1.84674072265625, -1.7742919921875, -1.70184326171875, -1.62939453125, -1.55694580078125, -1.4844970703125, -1.41204833984375, -1.339599609375, -1.26715087890625, -1.1947021484375, -1.12225341796875, -1.0498046875, -0.97735595703125, -0.9049072265625, -0.83245849609375, -0.760009765625, -0.68756103515625, -0.6151123046875, -0.54266357421875, -0.47021484375, -0.39776611328125, -0.3253173828125, -0.25286865234375, -0.180419921875, -0.10797119140625, -0.0355224609375, 0.03692626953125, 0.109375, 0.18182373046875, 0.2542724609375, 0.32672119140625, 0.399169921875, 0.47161865234375, 0.5440673828125, 0.61651611328125, 0.68896484375, 0.76141357421875, 0.8338623046875, 0.90631103515625, 0.978759765625, 1.05120849609375, 1.1236572265625, 1.19610595703125, 1.2685546875, 1.34100341796875, 1.4134521484375, 1.48590087890625, 1.558349609375, 1.63079833984375, 1.7032470703125, 1.77569580078125, 1.84814453125, 1.92059326171875, 1.9930419921875, 2.06549072265625, 2.137939453125, 2.21038818359375, 2.2828369140625, 2.35528564453125, 2.427734375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 8.0, 9.0, 19.0, 28.0, 46.0, 67.0, 108.0, 145.0, 167.0, 130.0, 100.0, 67.0, 30.0, 23.0, 19.0, 16.0, 6.0, 7.0, 1.0, 7.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.134748458862305, -7.713335990905762, -7.291923522949219, -6.870511054992676, -6.449098110198975, -6.027685642242432, -5.606273174285889, -5.1848602294921875, -4.7634477615356445, -4.342035293579102, -3.9206225872039795, -3.4992101192474365, -3.0777974128723145, -2.6563849449157715, -2.2349724769592285, -1.8135597705841064, -1.3921475410461426, -0.9707349538803101, -0.5493224263191223, -0.12790989875793457, 0.29350268840789795, 0.7149152755737305, 1.1363277435302734, 1.5577404499053955, 1.9791529178619385, 2.4005653858184814, 2.8219780921936035, 3.2433905601501465, 3.6648030281066895, 4.086215972900391, 4.507628440856934, 4.929040908813477, 5.3504533767700195, 5.7718658447265625, 6.1932783126831055, 6.614690780639648, 7.03610372543335, 7.457516193389893, 7.8789286613464355, 8.300341606140137, 8.72175407409668, 9.143166542053223, 9.564579010009766, 9.985991477966309, 10.407403945922852, 10.828817367553711, 11.250228881835938, 11.671642303466797, 12.093053817749023, 12.514466285705566, 12.93587875366211, 13.357291221618652, 13.778703689575195, 14.200117111206055, 14.621528625488281, 15.04294204711914, 15.464354515075684, 15.885766983032227, 16.307180404663086, 16.728591918945312, 17.150005340576172, 17.5714168548584, 17.992830276489258, 18.414241790771484, 18.835655212402344]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 13.0, 3.0, 13.0, 10.0, 14.0, 18.0, 17.0, 20.0, 25.0, 28.0, 21.0, 30.0, 34.0, 29.0, 48.0, 43.0, 36.0, 25.0, 42.0, 37.0, 42.0, 53.0, 37.0, 38.0, 36.0, 51.0, 26.0, 29.0, 29.0, 34.0, 20.0, 26.0, 15.0, 7.0, 11.0, 11.0, 5.0, 5.0, 6.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.579960823059082, -6.375895023345947, -6.1718292236328125, -5.967763423919678, -5.763697624206543, -5.559631824493408, -5.355566024780273, -5.151500225067139, -4.947434425354004, -4.743368625640869, -4.539302825927734, -4.3352370262146, -4.131171226501465, -3.92710542678833, -3.7230396270751953, -3.5189738273620605, -3.314908027648926, -3.110842227935791, -2.9067764282226562, -2.7027106285095215, -2.4986448287963867, -2.294579029083252, -2.090513229370117, -1.8864474296569824, -1.6823816299438477, -1.478315830230713, -1.2742500305175781, -1.0701842308044434, -0.8661184310913086, -0.6620526313781738, -0.45798683166503906, -0.2539210319519043, -0.04985523223876953, 0.15421056747436523, 0.3582763671875, 0.5623421669006348, 0.7664079666137695, 0.9704737663269043, 1.174539566040039, 1.3786053657531738, 1.5826711654663086, 1.7867369651794434, 1.9908027648925781, 2.194868564605713, 2.3989343643188477, 2.6030001640319824, 2.807065963745117, 3.011131763458252, 3.2151975631713867, 3.4192633628845215, 3.6233291625976562, 3.827394962310791, 4.031460762023926, 4.2355265617370605, 4.439592361450195, 4.64365816116333, 4.847723960876465, 5.0517897605896, 5.255855560302734, 5.459921360015869, 5.663987159729004, 5.868052959442139, 6.072118759155273, 6.276184558868408, 6.480250358581543]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 14.0, 15.0, 15.0, 29.0, 35.0, 57.0, 92.0, 145.0, 213.0, 393.0, 764.0, 1614.0, 3626.0, 9666.0, 33948.0, 169727.0, 590626.0, 183690.0, 36188.0, 10309.0, 3866.0, 1624.0, 815.0, 437.0, 222.0, 140.0, 92.0, 64.0, 32.0, 21.0, 27.0, 13.0, 9.0, 13.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0546875, -7.7818603515625, -7.509033203125, -7.2362060546875, -6.96337890625, -6.6905517578125, -6.417724609375, -6.1448974609375, -5.8720703125, -5.5992431640625, -5.326416015625, -5.0535888671875, -4.78076171875, -4.5079345703125, -4.235107421875, -3.9622802734375, -3.689453125, -3.4166259765625, -3.143798828125, -2.8709716796875, -2.59814453125, -2.3253173828125, -2.052490234375, -1.7796630859375, -1.5068359375, -1.2340087890625, -0.961181640625, -0.6883544921875, -0.41552734375, -0.1427001953125, 0.130126953125, 0.4029541015625, 0.67578125, 0.9486083984375, 1.221435546875, 1.4942626953125, 1.76708984375, 2.0399169921875, 2.312744140625, 2.5855712890625, 2.8583984375, 3.1312255859375, 3.404052734375, 3.6768798828125, 3.94970703125, 4.2225341796875, 4.495361328125, 4.7681884765625, 5.041015625, 5.3138427734375, 5.586669921875, 5.8594970703125, 6.13232421875, 6.4051513671875, 6.677978515625, 6.9508056640625, 7.2236328125, 7.4964599609375, 7.769287109375, 8.0421142578125, 8.31494140625, 8.5877685546875, 8.860595703125, 9.1334228515625, 9.40625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 9.0, 9.0, 17.0, 23.0, 27.0, 29.0, 33.0, 47.0, 56.0, 57.0, 63.0, 70.0, 76.0, 78.0, 57.0, 77.0, 58.0, 42.0, 35.0, 36.0, 20.0, 22.0, 12.0, 15.0, 7.0, 3.0, 7.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.3837890625, -1.3478622436523438, -1.3119354248046875, -1.2760086059570312, -1.240081787109375, -1.2041549682617188, -1.1682281494140625, -1.1323013305664062, -1.09637451171875, -1.0604476928710938, -1.0245208740234375, -0.9885940551757812, -0.952667236328125, -0.9167404174804688, -0.8808135986328125, -0.8448867797851562, -0.8089599609375, -0.7730331420898438, -0.7371063232421875, -0.7011795043945312, -0.665252685546875, -0.6293258666992188, -0.5933990478515625, -0.5574722290039062, -0.52154541015625, -0.48561859130859375, -0.4496917724609375, -0.41376495361328125, -0.377838134765625, -0.34191131591796875, -0.3059844970703125, -0.27005767822265625, -0.234130859375, -0.19820404052734375, -0.1622772216796875, -0.12635040283203125, -0.090423583984375, -0.05449676513671875, -0.0185699462890625, 0.01735687255859375, 0.05328369140625, 0.08921051025390625, 0.1251373291015625, 0.16106414794921875, 0.196990966796875, 0.23291778564453125, 0.2688446044921875, 0.30477142333984375, 0.3406982421875, 0.37662506103515625, 0.4125518798828125, 0.44847869873046875, 0.484405517578125, 0.5203323364257812, 0.5562591552734375, 0.5921859741210938, 0.62811279296875, 0.6640396118164062, 0.6999664306640625, 0.7358932495117188, 0.771820068359375, 0.8077468872070312, 0.8436737060546875, 0.8796005249023438, 0.91552734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 7.0, 14.0, 7.0, 14.0, 11.0, 37.0, 41.0, 51.0, 74.0, 99.0, 136.0, 195.0, 295.0, 468.0, 727.0, 1248.0, 2361.0, 5417.0, 14731.0, 47507.0, 171464.0, 460993.0, 241985.0, 67052.0, 20023.0, 6821.0, 2912.0, 1416.0, 825.0, 489.0, 317.0, 240.0, 159.0, 100.0, 70.0, 54.0, 38.0, 43.0, 30.0, 19.0, 14.0, 16.0, 5.0, 6.0, 3.0, 5.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.90625, -5.73065185546875, -5.5550537109375, -5.37945556640625, -5.203857421875, -5.02825927734375, -4.8526611328125, -4.67706298828125, -4.50146484375, -4.32586669921875, -4.1502685546875, -3.97467041015625, -3.799072265625, -3.62347412109375, -3.4478759765625, -3.27227783203125, -3.0966796875, -2.92108154296875, -2.7454833984375, -2.56988525390625, -2.394287109375, -2.21868896484375, -2.0430908203125, -1.86749267578125, -1.69189453125, -1.51629638671875, -1.3406982421875, -1.16510009765625, -0.989501953125, -0.81390380859375, -0.6383056640625, -0.46270751953125, -0.287109375, -0.11151123046875, 0.0640869140625, 0.23968505859375, 0.415283203125, 0.59088134765625, 0.7664794921875, 0.94207763671875, 1.11767578125, 1.29327392578125, 1.4688720703125, 1.64447021484375, 1.820068359375, 1.99566650390625, 2.1712646484375, 2.34686279296875, 2.5224609375, 2.69805908203125, 2.8736572265625, 3.04925537109375, 3.224853515625, 3.40045166015625, 3.5760498046875, 3.75164794921875, 3.92724609375, 4.10284423828125, 4.2784423828125, 4.45404052734375, 4.629638671875, 4.80523681640625, 4.9808349609375, 5.15643310546875, 5.33203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 6.0, 4.0, 5.0, 3.0, 11.0, 17.0, 14.0, 12.0, 19.0, 22.0, 21.0, 21.0, 27.0, 34.0, 39.0, 34.0, 37.0, 45.0, 53.0, 48.0, 52.0, 47.0, 46.0, 33.0, 34.0, 32.0, 46.0, 35.0, 32.0, 32.0, 30.0, 13.0, 14.0, 14.0, 20.0, 10.0, 11.0, 14.0, 2.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.982421875, -3.861053466796875, -3.73968505859375, -3.618316650390625, -3.4969482421875, -3.375579833984375, -3.25421142578125, -3.132843017578125, -3.011474609375, -2.890106201171875, -2.76873779296875, -2.647369384765625, -2.5260009765625, -2.404632568359375, -2.28326416015625, -2.161895751953125, -2.04052734375, -1.919158935546875, -1.79779052734375, -1.676422119140625, -1.5550537109375, -1.433685302734375, -1.31231689453125, -1.190948486328125, -1.069580078125, -0.948211669921875, -0.82684326171875, -0.705474853515625, -0.5841064453125, -0.462738037109375, -0.34136962890625, -0.220001220703125, -0.0986328125, 0.022735595703125, 0.14410400390625, 0.265472412109375, 0.3868408203125, 0.508209228515625, 0.62957763671875, 0.750946044921875, 0.872314453125, 0.993682861328125, 1.11505126953125, 1.236419677734375, 1.3577880859375, 1.479156494140625, 1.60052490234375, 1.721893310546875, 1.84326171875, 1.964630126953125, 2.08599853515625, 2.207366943359375, 2.3287353515625, 2.450103759765625, 2.57147216796875, 2.692840576171875, 2.814208984375, 2.935577392578125, 3.05694580078125, 3.178314208984375, 3.2996826171875, 3.421051025390625, 3.54241943359375, 3.663787841796875, 3.78515625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 15.0, 8.0, 7.0, 12.0, 34.0, 38.0, 72.0, 118.0, 170.0, 324.0, 662.0, 1416.0, 3375.0, 9966.0, 40264.0, 286793.0, 586501.0, 91581.0, 17718.0, 5400.0, 2039.0, 895.0, 480.0, 280.0, 129.0, 100.0, 50.0, 30.0, 25.0, 13.0, 7.0, 3.0, 11.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.5, -4.3685302734375, -4.237060546875, -4.1055908203125, -3.97412109375, -3.8426513671875, -3.711181640625, -3.5797119140625, -3.4482421875, -3.3167724609375, -3.185302734375, -3.0538330078125, -2.92236328125, -2.7908935546875, -2.659423828125, -2.5279541015625, -2.396484375, -2.2650146484375, -2.133544921875, -2.0020751953125, -1.87060546875, -1.7391357421875, -1.607666015625, -1.4761962890625, -1.3447265625, -1.2132568359375, -1.081787109375, -0.9503173828125, -0.81884765625, -0.6873779296875, -0.555908203125, -0.4244384765625, -0.29296875, -0.1614990234375, -0.030029296875, 0.1014404296875, 0.23291015625, 0.3643798828125, 0.495849609375, 0.6273193359375, 0.7587890625, 0.8902587890625, 1.021728515625, 1.1531982421875, 1.28466796875, 1.4161376953125, 1.547607421875, 1.6790771484375, 1.810546875, 1.9420166015625, 2.073486328125, 2.2049560546875, 2.33642578125, 2.4678955078125, 2.599365234375, 2.7308349609375, 2.8623046875, 2.9937744140625, 3.125244140625, 3.2567138671875, 3.38818359375, 3.5196533203125, 3.651123046875, 3.7825927734375, 3.9140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 10.0, 8.0, 7.0, 12.0, 13.0, 19.0, 23.0, 24.0, 29.0, 46.0, 63.0, 83.0, 96.0, 113.0, 85.0, 75.0, 61.0, 46.0, 30.0, 25.0, 30.0, 17.0, 13.0, 13.0, 13.0, 7.0, 14.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.0005893707275390625, -0.000573623925447464, -0.0005578771233558655, -0.000542130321264267, -0.0005263835191726685, -0.00051063671708107, -0.0004948899149894714, -0.0004791431128978729, -0.0004633963108062744, -0.0004476495087146759, -0.0004319027066230774, -0.0004161559045314789, -0.00040040910243988037, -0.00038466230034828186, -0.00036891549825668335, -0.00035316869616508484, -0.00033742189407348633, -0.0003216750919818878, -0.0003059282898902893, -0.0002901814877986908, -0.0002744346857070923, -0.0002586878836154938, -0.00024294108152389526, -0.00022719427943229675, -0.00021144747734069824, -0.00019570067524909973, -0.00017995387315750122, -0.0001642070710659027, -0.0001484602689743042, -0.0001327134668827057, -0.00011696666479110718, -0.00010121986269950867, -8.547306060791016e-05, -6.972625851631165e-05, -5.3979456424713135e-05, -3.8232654333114624e-05, -2.2485852241516113e-05, -6.7390501499176025e-06, 9.007751941680908e-06, 2.475455403327942e-05, 4.050135612487793e-05, 5.624815821647644e-05, 7.199496030807495e-05, 8.774176239967346e-05, 0.00010348856449127197, 0.00011923536658287048, 0.000134982168674469, 0.0001507289707660675, 0.00016647577285766602, 0.00018222257494926453, 0.00019796937704086304, 0.00021371617913246155, 0.00022946298122406006, 0.00024520978331565857, 0.0002609565854072571, 0.0002767033874988556, 0.0002924501895904541, 0.0003081969916820526, 0.0003239437937736511, 0.00033969059586524963, 0.00035543739795684814, 0.00037118420004844666, 0.00038693100214004517, 0.0004026778042316437, 0.0004184246063232422]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 3.0, 2.0, 5.0, 4.0, 11.0, 14.0, 13.0, 14.0, 18.0, 36.0, 39.0, 56.0, 81.0, 112.0, 222.0, 304.0, 567.0, 981.0, 2066.0, 4879.0, 13773.0, 58647.0, 471523.0, 421228.0, 52128.0, 12876.0, 4600.0, 1923.0, 995.0, 526.0, 310.0, 190.0, 117.0, 83.0, 60.0, 36.0, 33.0, 9.0, 15.0, 14.0, 11.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.9453125, -3.81365966796875, -3.6820068359375, -3.55035400390625, -3.418701171875, -3.28704833984375, -3.1553955078125, -3.02374267578125, -2.89208984375, -2.76043701171875, -2.6287841796875, -2.49713134765625, -2.365478515625, -2.23382568359375, -2.1021728515625, -1.97052001953125, -1.8388671875, -1.70721435546875, -1.5755615234375, -1.44390869140625, -1.312255859375, -1.18060302734375, -1.0489501953125, -0.91729736328125, -0.78564453125, -0.65399169921875, -0.5223388671875, -0.39068603515625, -0.259033203125, -0.12738037109375, 0.0042724609375, 0.13592529296875, 0.267578125, 0.39923095703125, 0.5308837890625, 0.66253662109375, 0.794189453125, 0.92584228515625, 1.0574951171875, 1.18914794921875, 1.32080078125, 1.45245361328125, 1.5841064453125, 1.71575927734375, 1.847412109375, 1.97906494140625, 2.1107177734375, 2.24237060546875, 2.3740234375, 2.50567626953125, 2.6373291015625, 2.76898193359375, 2.900634765625, 3.03228759765625, 3.1639404296875, 3.29559326171875, 3.42724609375, 3.55889892578125, 3.6905517578125, 3.82220458984375, 3.953857421875, 4.08551025390625, 4.2171630859375, 4.34881591796875, 4.48046875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 7.0, 7.0, 10.0, 14.0, 24.0, 33.0, 40.0, 61.0, 80.0, 113.0, 116.0, 110.0, 92.0, 70.0, 68.0, 37.0, 30.0, 24.0, 18.0, 7.0, 7.0, 5.0, 8.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830078125, -2.74395751953125, -2.6578369140625, -2.57171630859375, -2.485595703125, -2.39947509765625, -2.3133544921875, -2.22723388671875, -2.14111328125, -2.05499267578125, -1.9688720703125, -1.88275146484375, -1.796630859375, -1.71051025390625, -1.6243896484375, -1.53826904296875, -1.4521484375, -1.36602783203125, -1.2799072265625, -1.19378662109375, -1.107666015625, -1.02154541015625, -0.9354248046875, -0.84930419921875, -0.76318359375, -0.67706298828125, -0.5909423828125, -0.50482177734375, -0.418701171875, -0.33258056640625, -0.2464599609375, -0.16033935546875, -0.07421875, 0.01190185546875, 0.0980224609375, 0.18414306640625, 0.270263671875, 0.35638427734375, 0.4425048828125, 0.52862548828125, 0.61474609375, 0.70086669921875, 0.7869873046875, 0.87310791015625, 0.959228515625, 1.04534912109375, 1.1314697265625, 1.21759033203125, 1.3037109375, 1.38983154296875, 1.4759521484375, 1.56207275390625, 1.648193359375, 1.73431396484375, 1.8204345703125, 1.90655517578125, 1.99267578125, 2.07879638671875, 2.1649169921875, 2.25103759765625, 2.337158203125, 2.42327880859375, 2.5093994140625, 2.59552001953125, 2.681640625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 12.0, 18.0, 44.0, 99.0, 150.0, 189.0, 181.0, 141.0, 76.0, 40.0, 25.0, 7.0, 10.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-66.99439239501953, -65.26271057128906, -63.53103256225586, -61.79935073852539, -60.06767272949219, -58.33599090576172, -56.604312896728516, -54.87263107299805, -53.140953063964844, -51.409271240234375, -49.67759323120117, -47.9459114074707, -46.2142333984375, -44.48255157470703, -42.75087356567383, -41.01919174194336, -39.287513732910156, -37.55583190917969, -35.824153900146484, -34.092472076416016, -32.36079406738281, -30.629112243652344, -28.89743423461914, -27.165752410888672, -25.434070587158203, -23.702390670776367, -21.97071075439453, -20.239030838012695, -18.50735092163086, -16.77566909790039, -15.043990135192871, -13.312310218811035, -11.580631256103516, -9.84895133972168, -8.117271423339844, -6.38559103012085, -4.653911113739014, -2.9222307205200195, -1.1905508041381836, 0.5411291122436523, 2.2728090286254883, 4.004488945007324, 5.73616886138916, 7.467849254608154, 9.199529647827148, 10.931209564208984, 12.66288948059082, 14.394569396972656, 16.126249313354492, 17.857929229736328, 19.589609146118164, 21.3212890625, 23.052968978881836, 24.784648895263672, 26.51633071899414, 28.248008728027344, 29.979690551757812, 31.71137046813965, 33.443050384521484, 35.17473220825195, 36.906410217285156, 38.638092041015625, 40.36977005004883, 42.1014518737793, 43.8331298828125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 6.0, 8.0, 8.0, 12.0, 8.0, 10.0, 21.0, 22.0, 22.0, 22.0, 29.0, 22.0, 33.0, 34.0, 35.0, 37.0, 39.0, 44.0, 40.0, 43.0, 43.0, 49.0, 42.0, 37.0, 35.0, 30.0, 29.0, 35.0, 22.0, 29.0, 19.0, 20.0, 20.0, 17.0, 18.0, 15.0, 9.0, 8.0, 9.0, 4.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.12846565246582, -20.500459671020508, -19.872453689575195, -19.244447708129883, -18.61644172668457, -17.988435745239258, -17.360429763793945, -16.732423782348633, -16.10441780090332, -15.476411819458008, -14.848405838012695, -14.220399856567383, -13.59239387512207, -12.964387893676758, -12.336381912231445, -11.708375930786133, -11.08036994934082, -10.452363967895508, -9.824357986450195, -9.196352005004883, -8.56834602355957, -7.940340042114258, -7.312334060668945, -6.684328079223633, -6.05632209777832, -5.428316116333008, -4.800310134887695, -4.172304153442383, -3.5442981719970703, -2.916292190551758, -2.2882862091064453, -1.6602802276611328, -1.0322761535644531, -0.4042701721191406, 0.22373580932617188, 0.8517417907714844, 1.4797477722167969, 2.1077537536621094, 2.735759735107422, 3.3637657165527344, 3.991771697998047, 4.619777679443359, 5.247783660888672, 5.875789642333984, 6.503795623779297, 7.131801605224609, 7.759807586669922, 8.387813568115234, 9.015819549560547, 9.64382553100586, 10.271831512451172, 10.899837493896484, 11.527843475341797, 12.15584945678711, 12.783855438232422, 13.411861419677734, 14.039867401123047, 14.66787338256836, 15.295879364013672, 15.923885345458984, 16.551891326904297, 17.17989730834961, 17.807903289794922, 18.435909271240234, 19.063915252685547]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 1.0, 4.0, 1.0, 4.0, 1.0, 5.0, 9.0, 11.0, 7.0, 13.0, 27.0, 23.0, 44.0, 49.0, 74.0, 110.0, 150.0, 222.0, 336.0, 566.0, 865.0, 1749.0, 3516.0, 8555.0, 26484.0, 145490.0, 3705347.0, 246953.0, 35362.0, 10281.0, 3971.0, 1854.0, 884.0, 508.0, 289.0, 188.0, 94.0, 81.0, 46.0, 33.0, 26.0, 13.0, 8.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 3.0], "bins": [-10.59375, -10.31195068359375, -10.0301513671875, -9.74835205078125, -9.466552734375, -9.18475341796875, -8.9029541015625, -8.62115478515625, -8.33935546875, -8.05755615234375, -7.7757568359375, -7.49395751953125, -7.212158203125, -6.93035888671875, -6.6485595703125, -6.36676025390625, -6.0849609375, -5.80316162109375, -5.5213623046875, -5.23956298828125, -4.957763671875, -4.67596435546875, -4.3941650390625, -4.11236572265625, -3.83056640625, -3.54876708984375, -3.2669677734375, -2.98516845703125, -2.703369140625, -2.42156982421875, -2.1397705078125, -1.85797119140625, -1.576171875, -1.29437255859375, -1.0125732421875, -0.73077392578125, -0.448974609375, -0.16717529296875, 0.1146240234375, 0.39642333984375, 0.67822265625, 0.96002197265625, 1.2418212890625, 1.52362060546875, 1.805419921875, 2.08721923828125, 2.3690185546875, 2.65081787109375, 2.9326171875, 3.21441650390625, 3.4962158203125, 3.77801513671875, 4.059814453125, 4.34161376953125, 4.6234130859375, 4.90521240234375, 5.18701171875, 5.46881103515625, 5.7506103515625, 6.03240966796875, 6.314208984375, 6.59600830078125, 6.8778076171875, 7.15960693359375, 7.44140625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 11.0, 7.0, 14.0, 13.0, 20.0, 23.0, 31.0, 43.0, 44.0, 46.0, 66.0, 68.0, 68.0, 76.0, 80.0, 53.0, 46.0, 66.0, 35.0, 39.0, 33.0, 28.0, 23.0, 12.0, 14.0, 12.0, 9.0, 3.0, 1.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.3359375, -1.3011856079101562, -1.2664337158203125, -1.2316818237304688, -1.196929931640625, -1.1621780395507812, -1.1274261474609375, -1.0926742553710938, -1.05792236328125, -1.0231704711914062, -0.9884185791015625, -0.9536666870117188, -0.918914794921875, -0.8841629028320312, -0.8494110107421875, -0.8146591186523438, -0.7799072265625, -0.7451553344726562, -0.7104034423828125, -0.6756515502929688, -0.640899658203125, -0.6061477661132812, -0.5713958740234375, -0.5366439819335938, -0.50189208984375, -0.46714019775390625, -0.4323883056640625, -0.39763641357421875, -0.362884521484375, -0.32813262939453125, -0.2933807373046875, -0.25862884521484375, -0.223876953125, -0.18912506103515625, -0.1543731689453125, -0.11962127685546875, -0.084869384765625, -0.05011749267578125, -0.0153656005859375, 0.01938629150390625, 0.05413818359375, 0.08889007568359375, 0.1236419677734375, 0.15839385986328125, 0.193145751953125, 0.22789764404296875, 0.2626495361328125, 0.29740142822265625, 0.3321533203125, 0.36690521240234375, 0.4016571044921875, 0.43640899658203125, 0.471160888671875, 0.5059127807617188, 0.5406646728515625, 0.5754165649414062, 0.61016845703125, 0.6449203491210938, 0.6796722412109375, 0.7144241333007812, 0.749176025390625, 0.7839279174804688, 0.8186798095703125, 0.8534317016601562, 0.88818359375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 0.0, 4.0, 4.0, 12.0, 18.0, 13.0, 20.0, 39.0, 44.0, 51.0, 109.0, 150.0, 232.0, 375.0, 555.0, 895.0, 1541.0, 2599.0, 5088.0, 10184.0, 21811.0, 53100.0, 167988.0, 1289679.0, 2306093.0, 218484.0, 63773.0, 25783.0, 11785.0, 5941.0, 3176.0, 1820.0, 1071.0, 602.0, 413.0, 253.0, 184.0, 118.0, 66.0, 62.0, 36.0, 28.0, 28.0, 16.0, 15.0, 5.0, 5.0, 10.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.0859375, -3.95013427734375, -3.8143310546875, -3.67852783203125, -3.542724609375, -3.40692138671875, -3.2711181640625, -3.13531494140625, -2.99951171875, -2.86370849609375, -2.7279052734375, -2.59210205078125, -2.456298828125, -2.32049560546875, -2.1846923828125, -2.04888916015625, -1.9130859375, -1.77728271484375, -1.6414794921875, -1.50567626953125, -1.369873046875, -1.23406982421875, -1.0982666015625, -0.96246337890625, -0.82666015625, -0.69085693359375, -0.5550537109375, -0.41925048828125, -0.283447265625, -0.14764404296875, -0.0118408203125, 0.12396240234375, 0.259765625, 0.39556884765625, 0.5313720703125, 0.66717529296875, 0.802978515625, 0.93878173828125, 1.0745849609375, 1.21038818359375, 1.34619140625, 1.48199462890625, 1.6177978515625, 1.75360107421875, 1.889404296875, 2.02520751953125, 2.1610107421875, 2.29681396484375, 2.4326171875, 2.56842041015625, 2.7042236328125, 2.84002685546875, 2.975830078125, 3.11163330078125, 3.2474365234375, 3.38323974609375, 3.51904296875, 3.65484619140625, 3.7906494140625, 3.92645263671875, 4.062255859375, 4.19805908203125, 4.3338623046875, 4.46966552734375, 4.60546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 6.0, 5.0, 11.0, 7.0, 12.0, 21.0, 25.0, 23.0, 43.0, 57.0, 100.0, 133.0, 249.0, 467.0, 1207.0, 779.0, 342.0, 186.0, 102.0, 71.0, 52.0, 37.0, 44.0, 26.0, 12.0, 9.0, 15.0, 9.0, 9.0, 4.0, 3.0, 6.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.470703125, -2.39752197265625, -2.3243408203125, -2.25115966796875, -2.177978515625, -2.10479736328125, -2.0316162109375, -1.95843505859375, -1.88525390625, -1.81207275390625, -1.7388916015625, -1.66571044921875, -1.592529296875, -1.51934814453125, -1.4461669921875, -1.37298583984375, -1.2998046875, -1.22662353515625, -1.1534423828125, -1.08026123046875, -1.007080078125, -0.93389892578125, -0.8607177734375, -0.78753662109375, -0.71435546875, -0.64117431640625, -0.5679931640625, -0.49481201171875, -0.421630859375, -0.34844970703125, -0.2752685546875, -0.20208740234375, -0.12890625, -0.05572509765625, 0.0174560546875, 0.09063720703125, 0.163818359375, 0.23699951171875, 0.3101806640625, 0.38336181640625, 0.45654296875, 0.52972412109375, 0.6029052734375, 0.67608642578125, 0.749267578125, 0.82244873046875, 0.8956298828125, 0.96881103515625, 1.0419921875, 1.11517333984375, 1.1883544921875, 1.26153564453125, 1.334716796875, 1.40789794921875, 1.4810791015625, 1.55426025390625, 1.62744140625, 1.70062255859375, 1.7738037109375, 1.84698486328125, 1.920166015625, 1.99334716796875, 2.0665283203125, 2.13970947265625, 2.212890625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 12.0, 29.0, 56.0, 86.0, 99.0, 155.0, 143.0, 126.0, 112.0, 54.0, 43.0, 26.0, 13.0, 10.0, 8.0, 3.0, 3.0, 5.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.913623809814453, -19.291202545166016, -18.668781280517578, -18.04636001586914, -17.423938751220703, -16.801517486572266, -16.179096221923828, -15.556674003601074, -14.934252738952637, -14.3118314743042, -13.689410209655762, -13.066988945007324, -12.44456672668457, -11.822145462036133, -11.199724197387695, -10.577302932739258, -9.95488166809082, -9.332460403442383, -8.710039138793945, -8.087617874145508, -7.465196132659912, -6.842774868011475, -6.220353126525879, -5.597931861877441, -4.975510597229004, -4.353089332580566, -3.73066782951355, -3.108246326446533, -2.4858250617980957, -1.8634037971496582, -1.2409822940826416, -0.618560791015625, 0.0038604736328125, 0.6262818574905396, 1.2487032413482666, 1.8711246252059937, 2.4935460090637207, 3.115967273712158, 3.738388776779175, 4.360810279846191, 4.983231544494629, 5.605652809143066, 6.228074073791504, 6.8504958152771, 7.472917079925537, 8.095338821411133, 8.71776008605957, 9.340181350708008, 9.962602615356445, 10.585023880004883, 11.20744514465332, 11.829866409301758, 12.452287673950195, 13.074708938598633, 13.697131156921387, 14.319552421569824, 14.941973686218262, 15.5643949508667, 16.186817169189453, 16.80923843383789, 17.431659698486328, 18.054080963134766, 18.676502227783203, 19.29892349243164, 19.921344757080078]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 1.0, 9.0, 5.0, 4.0, 8.0, 9.0, 9.0, 11.0, 12.0, 13.0, 17.0, 23.0, 21.0, 27.0, 29.0, 32.0, 36.0, 34.0, 34.0, 24.0, 42.0, 40.0, 35.0, 38.0, 36.0, 36.0, 38.0, 34.0, 43.0, 39.0, 29.0, 31.0, 30.0, 24.0, 22.0, 26.0, 14.0, 16.0, 17.0, 10.0, 8.0, 4.0, 9.0, 9.0, 4.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0], "bins": [-9.701818466186523, -9.444954872131348, -9.188092231750488, -8.931228637695312, -8.674365997314453, -8.417502403259277, -8.160638809204102, -7.903775691986084, -7.646912574768066, -7.390049457550049, -7.133186340332031, -6.8763227462768555, -6.619459629058838, -6.36259651184082, -6.1057329177856445, -5.848869800567627, -5.592006683349609, -5.335143566131592, -5.078280448913574, -4.821416854858398, -4.564553737640381, -4.307690620422363, -4.0508270263671875, -3.79396390914917, -3.5371007919311523, -3.2802376747131348, -3.023374319076538, -2.7665109634399414, -2.509647846221924, -2.2527847290039062, -1.9959213733673096, -1.7390581369400024, -1.4821958541870117, -1.2253326177597046, -0.9684693813323975, -0.7116061449050903, -0.4547429084777832, -0.19787967205047607, 0.058983564376831055, 0.3158468008041382, 0.5727100372314453, 0.8295732736587524, 1.0864365100860596, 1.3432997465133667, 1.6001629829406738, 1.857026219367981, 2.113889455795288, 2.3707528114318848, 2.6276159286499023, 2.88447904586792, 3.1413424015045166, 3.3982057571411133, 3.655068874359131, 3.9119319915771484, 4.168795585632324, 4.425658702850342, 4.682521820068359, 4.939384937286377, 5.1962480545043945, 5.45311164855957, 5.709974765777588, 5.9668378829956055, 6.223701477050781, 6.480564594268799, 6.737427711486816]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 6.0, 9.0, 8.0, 7.0, 16.0, 22.0, 18.0, 33.0, 39.0, 89.0, 132.0, 232.0, 411.0, 739.0, 1490.0, 3488.0, 10041.0, 34972.0, 192415.0, 640303.0, 125001.0, 25992.0, 7604.0, 2841.0, 1191.0, 602.0, 358.0, 171.0, 116.0, 80.0, 49.0, 31.0, 15.0, 13.0, 9.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.484375, -9.16162109375, -8.8388671875, -8.51611328125, -8.193359375, -7.87060546875, -7.5478515625, -7.22509765625, -6.90234375, -6.57958984375, -6.2568359375, -5.93408203125, -5.611328125, -5.28857421875, -4.9658203125, -4.64306640625, -4.3203125, -3.99755859375, -3.6748046875, -3.35205078125, -3.029296875, -2.70654296875, -2.3837890625, -2.06103515625, -1.73828125, -1.41552734375, -1.0927734375, -0.77001953125, -0.447265625, -0.12451171875, 0.1982421875, 0.52099609375, 0.84375, 1.16650390625, 1.4892578125, 1.81201171875, 2.134765625, 2.45751953125, 2.7802734375, 3.10302734375, 3.42578125, 3.74853515625, 4.0712890625, 4.39404296875, 4.716796875, 5.03955078125, 5.3623046875, 5.68505859375, 6.0078125, 6.33056640625, 6.6533203125, 6.97607421875, 7.298828125, 7.62158203125, 7.9443359375, 8.26708984375, 8.58984375, 8.91259765625, 9.2353515625, 9.55810546875, 9.880859375, 10.20361328125, 10.5263671875, 10.84912109375, 11.171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 4.0, 10.0, 6.0, 14.0, 18.0, 21.0, 23.0, 27.0, 52.0, 39.0, 55.0, 63.0, 63.0, 63.0, 69.0, 56.0, 75.0, 66.0, 48.0, 53.0, 35.0, 31.0, 21.0, 22.0, 15.0, 21.0, 6.0, 7.0, 4.0, 4.0, 5.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3525390625, -1.3174667358398438, -1.2823944091796875, -1.2473220825195312, -1.212249755859375, -1.1771774291992188, -1.1421051025390625, -1.1070327758789062, -1.07196044921875, -1.0368881225585938, -1.0018157958984375, -0.9667434692382812, -0.931671142578125, -0.8965988159179688, -0.8615264892578125, -0.8264541625976562, -0.7913818359375, -0.7563095092773438, -0.7212371826171875, -0.6861648559570312, -0.651092529296875, -0.6160202026367188, -0.5809478759765625, -0.5458755493164062, -0.51080322265625, -0.47573089599609375, -0.4406585693359375, -0.40558624267578125, -0.370513916015625, -0.33544158935546875, -0.3003692626953125, -0.26529693603515625, -0.230224609375, -0.19515228271484375, -0.1600799560546875, -0.12500762939453125, -0.089935302734375, -0.05486297607421875, -0.0197906494140625, 0.01528167724609375, 0.05035400390625, 0.08542633056640625, 0.1204986572265625, 0.15557098388671875, 0.190643310546875, 0.22571563720703125, 0.2607879638671875, 0.29586029052734375, 0.3309326171875, 0.36600494384765625, 0.4010772705078125, 0.43614959716796875, 0.471221923828125, 0.5062942504882812, 0.5413665771484375, 0.5764389038085938, 0.61151123046875, 0.6465835571289062, 0.6816558837890625, 0.7167282104492188, 0.751800537109375, 0.7868728637695312, 0.8219451904296875, 0.8570175170898438, 0.89208984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 9.0, 5.0, 7.0, 11.0, 24.0, 22.0, 30.0, 31.0, 33.0, 55.0, 89.0, 108.0, 173.0, 242.0, 375.0, 557.0, 960.0, 1657.0, 2940.0, 5916.0, 13559.0, 35435.0, 107598.0, 357515.0, 353294.0, 105449.0, 35685.0, 13467.0, 5858.0, 3041.0, 1615.0, 946.0, 591.0, 376.0, 273.0, 195.0, 116.0, 79.0, 64.0, 47.0, 37.0, 22.0, 19.0, 7.0, 8.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.4609375, -5.30029296875, -5.1396484375, -4.97900390625, -4.818359375, -4.65771484375, -4.4970703125, -4.33642578125, -4.17578125, -4.01513671875, -3.8544921875, -3.69384765625, -3.533203125, -3.37255859375, -3.2119140625, -3.05126953125, -2.890625, -2.72998046875, -2.5693359375, -2.40869140625, -2.248046875, -2.08740234375, -1.9267578125, -1.76611328125, -1.60546875, -1.44482421875, -1.2841796875, -1.12353515625, -0.962890625, -0.80224609375, -0.6416015625, -0.48095703125, -0.3203125, -0.15966796875, 0.0009765625, 0.16162109375, 0.322265625, 0.48291015625, 0.6435546875, 0.80419921875, 0.96484375, 1.12548828125, 1.2861328125, 1.44677734375, 1.607421875, 1.76806640625, 1.9287109375, 2.08935546875, 2.25, 2.41064453125, 2.5712890625, 2.73193359375, 2.892578125, 3.05322265625, 3.2138671875, 3.37451171875, 3.53515625, 3.69580078125, 3.8564453125, 4.01708984375, 4.177734375, 4.33837890625, 4.4990234375, 4.65966796875, 4.8203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 8.0, 10.0, 7.0, 6.0, 11.0, 11.0, 15.0, 23.0, 32.0, 36.0, 26.0, 27.0, 44.0, 41.0, 42.0, 37.0, 46.0, 47.0, 45.0, 41.0, 49.0, 48.0, 44.0, 35.0, 35.0, 41.0, 29.0, 31.0, 19.0, 30.0, 18.0, 12.0, 14.0, 12.0, 2.0, 10.0, 2.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.671875, -4.532470703125, -4.39306640625, -4.253662109375, -4.1142578125, -3.974853515625, -3.83544921875, -3.696044921875, -3.556640625, -3.417236328125, -3.27783203125, -3.138427734375, -2.9990234375, -2.859619140625, -2.72021484375, -2.580810546875, -2.44140625, -2.302001953125, -2.16259765625, -2.023193359375, -1.8837890625, -1.744384765625, -1.60498046875, -1.465576171875, -1.326171875, -1.186767578125, -1.04736328125, -0.907958984375, -0.7685546875, -0.629150390625, -0.48974609375, -0.350341796875, -0.2109375, -0.071533203125, 0.06787109375, 0.207275390625, 0.3466796875, 0.486083984375, 0.62548828125, 0.764892578125, 0.904296875, 1.043701171875, 1.18310546875, 1.322509765625, 1.4619140625, 1.601318359375, 1.74072265625, 1.880126953125, 2.01953125, 2.158935546875, 2.29833984375, 2.437744140625, 2.5771484375, 2.716552734375, 2.85595703125, 2.995361328125, 3.134765625, 3.274169921875, 3.41357421875, 3.552978515625, 3.6923828125, 3.831787109375, 3.97119140625, 4.110595703125, 4.25]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 15.0, 7.0, 14.0, 21.0, 38.0, 59.0, 155.0, 269.0, 844.0, 3180.0, 21316.0, 389610.0, 596297.0, 30907.0, 4139.0, 1018.0, 355.0, 128.0, 66.0, 32.0, 33.0, 18.0, 12.0, 4.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.212646484375, -7.96435546875, -7.716064453125, -7.4677734375, -7.219482421875, -6.97119140625, -6.722900390625, -6.474609375, -6.226318359375, -5.97802734375, -5.729736328125, -5.4814453125, -5.233154296875, -4.98486328125, -4.736572265625, -4.48828125, -4.239990234375, -3.99169921875, -3.743408203125, -3.4951171875, -3.246826171875, -2.99853515625, -2.750244140625, -2.501953125, -2.253662109375, -2.00537109375, -1.757080078125, -1.5087890625, -1.260498046875, -1.01220703125, -0.763916015625, -0.515625, -0.267333984375, -0.01904296875, 0.229248046875, 0.4775390625, 0.725830078125, 0.97412109375, 1.222412109375, 1.470703125, 1.718994140625, 1.96728515625, 2.215576171875, 2.4638671875, 2.712158203125, 2.96044921875, 3.208740234375, 3.45703125, 3.705322265625, 3.95361328125, 4.201904296875, 4.4501953125, 4.698486328125, 4.94677734375, 5.195068359375, 5.443359375, 5.691650390625, 5.93994140625, 6.188232421875, 6.4365234375, 6.684814453125, 6.93310546875, 7.181396484375, 7.4296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 5.0, 12.0, 9.0, 11.0, 16.0, 15.0, 34.0, 35.0, 57.0, 73.0, 112.0, 127.0, 128.0, 79.0, 58.0, 52.0, 32.0, 29.0, 17.0, 15.0, 19.0, 9.0, 8.0, 8.0, 6.0, 8.0, 1.0, 3.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007309913635253906, -0.0007122457027435303, -0.0006935000419616699, -0.0006747543811798096, -0.0006560087203979492, -0.0006372630596160889, -0.0006185173988342285, -0.0005997717380523682, -0.0005810260772705078, -0.0005622804164886475, -0.0005435347557067871, -0.0005247890949249268, -0.0005060434341430664, -0.00048729777336120605, -0.0004685521125793457, -0.00044980645179748535, -0.000431060791015625, -0.00041231513023376465, -0.0003935694694519043, -0.00037482380867004395, -0.0003560781478881836, -0.00033733248710632324, -0.0003185868263244629, -0.00029984116554260254, -0.0002810955047607422, -0.00026234984397888184, -0.00024360418319702148, -0.00022485852241516113, -0.00020611286163330078, -0.00018736720085144043, -0.00016862154006958008, -0.00014987587928771973, -0.00013113021850585938, -0.00011238455772399902, -9.363889694213867e-05, -7.489323616027832e-05, -5.614757537841797e-05, -3.740191459655762e-05, -1.8656253814697266e-05, 8.940696716308594e-08, 1.8835067749023438e-05, 3.758072853088379e-05, 5.632638931274414e-05, 7.507205009460449e-05, 9.381771087646484e-05, 0.0001125633716583252, 0.00013130903244018555, 0.0001500546932220459, 0.00016880035400390625, 0.0001875460147857666, 0.00020629167556762695, 0.0002250373363494873, 0.00024378299713134766, 0.000262528657913208, 0.00028127431869506836, 0.0003000199794769287, 0.00031876564025878906, 0.0003375113010406494, 0.00035625696182250977, 0.0003750026226043701, 0.00039374828338623047, 0.0004124939441680908, 0.00043123960494995117, 0.0004499852657318115, 0.0004687309265136719]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 11.0, 7.0, 11.0, 15.0, 35.0, 40.0, 85.0, 128.0, 250.0, 474.0, 970.0, 2459.0, 6960.0, 29828.0, 234692.0, 655304.0, 94610.0, 15145.0, 4333.0, 1616.0, 723.0, 333.0, 202.0, 107.0, 65.0, 47.0, 36.0, 14.0, 14.0, 5.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.4935302734375, -4.334716796875, -4.1759033203125, -4.01708984375, -3.8582763671875, -3.699462890625, -3.5406494140625, -3.3818359375, -3.2230224609375, -3.064208984375, -2.9053955078125, -2.74658203125, -2.5877685546875, -2.428955078125, -2.2701416015625, -2.111328125, -1.9525146484375, -1.793701171875, -1.6348876953125, -1.47607421875, -1.3172607421875, -1.158447265625, -0.9996337890625, -0.8408203125, -0.6820068359375, -0.523193359375, -0.3643798828125, -0.20556640625, -0.0467529296875, 0.112060546875, 0.2708740234375, 0.4296875, 0.5885009765625, 0.747314453125, 0.9061279296875, 1.06494140625, 1.2237548828125, 1.382568359375, 1.5413818359375, 1.7001953125, 1.8590087890625, 2.017822265625, 2.1766357421875, 2.33544921875, 2.4942626953125, 2.653076171875, 2.8118896484375, 2.970703125, 3.1295166015625, 3.288330078125, 3.4471435546875, 3.60595703125, 3.7647705078125, 3.923583984375, 4.0823974609375, 4.2412109375, 4.4000244140625, 4.558837890625, 4.7176513671875, 4.87646484375, 5.0352783203125, 5.194091796875, 5.3529052734375, 5.51171875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 8.0, 9.0, 7.0, 10.0, 8.0, 15.0, 19.0, 28.0, 23.0, 30.0, 46.0, 67.0, 72.0, 79.0, 86.0, 80.0, 87.0, 75.0, 53.0, 28.0, 21.0, 31.0, 23.0, 18.0, 15.0, 11.0, 12.0, 6.0, 11.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.16015625, -2.089691162109375, -2.01922607421875, -1.948760986328125, -1.8782958984375, -1.807830810546875, -1.73736572265625, -1.666900634765625, -1.596435546875, -1.525970458984375, -1.45550537109375, -1.385040283203125, -1.3145751953125, -1.244110107421875, -1.17364501953125, -1.103179931640625, -1.03271484375, -0.962249755859375, -0.89178466796875, -0.821319580078125, -0.7508544921875, -0.680389404296875, -0.60992431640625, -0.539459228515625, -0.468994140625, -0.398529052734375, -0.32806396484375, -0.257598876953125, -0.1871337890625, -0.116668701171875, -0.04620361328125, 0.024261474609375, 0.0947265625, 0.165191650390625, 0.23565673828125, 0.306121826171875, 0.3765869140625, 0.447052001953125, 0.51751708984375, 0.587982177734375, 0.658447265625, 0.728912353515625, 0.79937744140625, 0.869842529296875, 0.9403076171875, 1.010772705078125, 1.08123779296875, 1.151702880859375, 1.22216796875, 1.292633056640625, 1.36309814453125, 1.433563232421875, 1.5040283203125, 1.574493408203125, 1.64495849609375, 1.715423583984375, 1.785888671875, 1.856353759765625, 1.92681884765625, 1.997283935546875, 2.0677490234375, 2.138214111328125, 2.20867919921875, 2.279144287109375, 2.349609375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 3.0, 8.0, 7.0, 11.0, 15.0, 14.0, 23.0, 43.0, 45.0, 68.0, 82.0, 92.0, 98.0, 102.0, 73.0, 76.0, 83.0, 51.0, 30.0, 17.0, 13.0, 10.0, 11.0, 12.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.715721130371094, -25.685707092285156, -24.65569305419922, -23.62567901611328, -22.59566307067871, -21.565649032592773, -20.535634994506836, -19.5056209564209, -18.475605010986328, -17.44559097290039, -16.415576934814453, -15.3855619430542, -14.355546951293945, -13.325532913208008, -12.29551887512207, -11.265504837036133, -10.235490798950195, -9.205476760864258, -8.175461769104004, -7.145447731018066, -6.115433216094971, -5.085418701171875, -4.0554046630859375, -3.025390148162842, -1.995375633239746, -0.9653612375259399, 0.06465315818786621, 1.0946674346923828, 2.1246819496154785, 3.154696464538574, 4.184710502624512, 5.214725017547607, 6.244739532470703, 7.274754047393799, 8.304768562316895, 9.334782600402832, 10.364797592163086, 11.394811630249023, 12.424825668334961, 13.454839706420898, 14.484854698181152, 15.51486873626709, 16.544883728027344, 17.57489776611328, 18.60491180419922, 19.634925842285156, 20.664939880371094, 21.694955825805664, 22.7249698638916, 23.75498390197754, 24.784997940063477, 25.815013885498047, 26.845027923583984, 27.875041961669922, 28.90505599975586, 29.935070037841797, 30.965084075927734, 31.995098114013672, 33.02511215209961, 34.05512619018555, 35.085140228271484, 36.11515808105469, 37.145172119140625, 38.17518615722656, 39.2052001953125]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 7.0, 6.0, 15.0, 10.0, 9.0, 14.0, 20.0, 14.0, 19.0, 19.0, 17.0, 27.0, 34.0, 40.0, 34.0, 41.0, 41.0, 45.0, 30.0, 41.0, 32.0, 44.0, 40.0, 29.0, 35.0, 47.0, 41.0, 38.0, 33.0, 20.0, 19.0, 25.0, 24.0, 21.0, 19.0, 9.0, 13.0, 5.0, 7.0, 5.0, 5.0, 1.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-23.517778396606445, -22.787986755371094, -22.05819320678711, -21.328399658203125, -20.598608016967773, -19.868816375732422, -19.139022827148438, -18.409229278564453, -17.6794376373291, -16.94964599609375, -16.219852447509766, -15.490059852600098, -14.76026725769043, -14.030474662780762, -13.300682067871094, -12.570889472961426, -11.841096878051758, -11.11130428314209, -10.381511688232422, -9.651719093322754, -8.921926498413086, -8.192133903503418, -7.46234130859375, -6.732548713684082, -6.002756118774414, -5.272963523864746, -4.543170928955078, -3.81337833404541, -3.083585739135742, -2.353793144226074, -1.6240005493164062, -0.8942079544067383, -0.16441726684570312, 0.5653753280639648, 1.2951679229736328, 2.024960517883301, 2.7547531127929688, 3.4845457077026367, 4.214338302612305, 4.944130897521973, 5.673923492431641, 6.403716087341309, 7.133508682250977, 7.8633012771606445, 8.593093872070312, 9.32288646697998, 10.052679061889648, 10.782471656799316, 11.512264251708984, 12.242056846618652, 12.97184944152832, 13.701642036437988, 14.431434631347656, 15.161227226257324, 15.891019821166992, 16.620811462402344, 17.350605010986328, 18.080398559570312, 18.810190200805664, 19.539981842041016, 20.269775390625, 20.999568939208984, 21.729360580444336, 22.459152221679688, 23.188945770263672]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 7.0, 8.0, 7.0, 18.0, 18.0, 14.0, 25.0, 46.0, 68.0, 116.0, 178.0, 250.0, 473.0, 963.0, 2066.0, 5357.0, 17516.0, 121078.0, 3902390.0, 117223.0, 17646.0, 5017.0, 1947.0, 837.0, 445.0, 214.0, 141.0, 78.0, 48.0, 29.0, 26.0, 8.0, 8.0, 5.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.104248046875, -11.76318359375, -11.422119140625, -11.0810546875, -10.739990234375, -10.39892578125, -10.057861328125, -9.716796875, -9.375732421875, -9.03466796875, -8.693603515625, -8.3525390625, -8.011474609375, -7.67041015625, -7.329345703125, -6.98828125, -6.647216796875, -6.30615234375, -5.965087890625, -5.6240234375, -5.282958984375, -4.94189453125, -4.600830078125, -4.259765625, -3.918701171875, -3.57763671875, -3.236572265625, -2.8955078125, -2.554443359375, -2.21337890625, -1.872314453125, -1.53125, -1.190185546875, -0.84912109375, -0.508056640625, -0.1669921875, 0.174072265625, 0.51513671875, 0.856201171875, 1.197265625, 1.538330078125, 1.87939453125, 2.220458984375, 2.5615234375, 2.902587890625, 3.24365234375, 3.584716796875, 3.92578125, 4.266845703125, 4.60791015625, 4.948974609375, 5.2900390625, 5.631103515625, 5.97216796875, 6.313232421875, 6.654296875, 6.995361328125, 7.33642578125, 7.677490234375, 8.0185546875, 8.359619140625, 8.70068359375, 9.041748046875, 9.3828125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 9.0, 8.0, 15.0, 11.0, 21.0, 26.0, 34.0, 38.0, 38.0, 40.0, 51.0, 50.0, 43.0, 61.0, 56.0, 54.0, 53.0, 62.0, 49.0, 46.0, 37.0, 33.0, 31.0, 34.0, 18.0, 18.0, 14.0, 19.0, 4.0, 7.0, 8.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.25, -1.2160568237304688, -1.1821136474609375, -1.1481704711914062, -1.114227294921875, -1.0802841186523438, -1.0463409423828125, -1.0123977661132812, -0.97845458984375, -0.9445114135742188, -0.9105682373046875, -0.8766250610351562, -0.842681884765625, -0.8087387084960938, -0.7747955322265625, -0.7408523559570312, -0.7069091796875, -0.6729660034179688, -0.6390228271484375, -0.6050796508789062, -0.571136474609375, -0.5371932983398438, -0.5032501220703125, -0.46930694580078125, -0.43536376953125, -0.40142059326171875, -0.3674774169921875, -0.33353424072265625, -0.299591064453125, -0.26564788818359375, -0.2317047119140625, -0.19776153564453125, -0.163818359375, -0.12987518310546875, -0.0959320068359375, -0.06198883056640625, -0.028045654296875, 0.00589752197265625, 0.0398406982421875, 0.07378387451171875, 0.10772705078125, 0.14167022705078125, 0.1756134033203125, 0.20955657958984375, 0.243499755859375, 0.27744293212890625, 0.3113861083984375, 0.34532928466796875, 0.3792724609375, 0.41321563720703125, 0.4471588134765625, 0.48110198974609375, 0.515045166015625, 0.5489883422851562, 0.5829315185546875, 0.6168746948242188, 0.65081787109375, 0.6847610473632812, 0.7187042236328125, 0.7526473999023438, 0.786590576171875, 0.8205337524414062, 0.8544769287109375, 0.8884201049804688, 0.92236328125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 6.0, 3.0, 10.0, 10.0, 8.0, 19.0, 29.0, 28.0, 36.0, 60.0, 98.0, 112.0, 165.0, 247.0, 378.0, 551.0, 867.0, 1387.0, 2336.0, 4220.0, 8201.0, 17123.0, 42040.0, 131807.0, 1033434.0, 2667152.0, 187309.0, 53618.0, 21227.0, 9906.0, 4897.0, 2662.0, 1595.0, 960.0, 546.0, 396.0, 248.0, 171.0, 133.0, 87.0, 54.0, 41.0, 35.0, 20.0, 15.0, 14.0, 12.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.67578125, -4.53021240234375, -4.3846435546875, -4.23907470703125, -4.093505859375, -3.94793701171875, -3.8023681640625, -3.65679931640625, -3.51123046875, -3.36566162109375, -3.2200927734375, -3.07452392578125, -2.928955078125, -2.78338623046875, -2.6378173828125, -2.49224853515625, -2.3466796875, -2.20111083984375, -2.0555419921875, -1.90997314453125, -1.764404296875, -1.61883544921875, -1.4732666015625, -1.32769775390625, -1.18212890625, -1.03656005859375, -0.8909912109375, -0.74542236328125, -0.599853515625, -0.45428466796875, -0.3087158203125, -0.16314697265625, -0.017578125, 0.12799072265625, 0.2735595703125, 0.41912841796875, 0.564697265625, 0.71026611328125, 0.8558349609375, 1.00140380859375, 1.14697265625, 1.29254150390625, 1.4381103515625, 1.58367919921875, 1.729248046875, 1.87481689453125, 2.0203857421875, 2.16595458984375, 2.3115234375, 2.45709228515625, 2.6026611328125, 2.74822998046875, 2.893798828125, 3.03936767578125, 3.1849365234375, 3.33050537109375, 3.47607421875, 3.62164306640625, 3.7672119140625, 3.91278076171875, 4.058349609375, 4.20391845703125, 4.3494873046875, 4.49505615234375, 4.640625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 7.0, 4.0, 8.0, 14.0, 18.0, 17.0, 20.0, 47.0, 63.0, 78.0, 141.0, 250.0, 608.0, 1595.0, 573.0, 202.0, 107.0, 79.0, 56.0, 40.0, 28.0, 20.0, 15.0, 24.0, 13.0, 9.0, 6.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.355377197265625, -2.28692626953125, -2.218475341796875, -2.1500244140625, -2.081573486328125, -2.01312255859375, -1.944671630859375, -1.876220703125, -1.807769775390625, -1.73931884765625, -1.670867919921875, -1.6024169921875, -1.533966064453125, -1.46551513671875, -1.397064208984375, -1.32861328125, -1.260162353515625, -1.19171142578125, -1.123260498046875, -1.0548095703125, -0.986358642578125, -0.91790771484375, -0.849456787109375, -0.781005859375, -0.712554931640625, -0.64410400390625, -0.575653076171875, -0.5072021484375, -0.438751220703125, -0.37030029296875, -0.301849365234375, -0.2333984375, -0.164947509765625, -0.09649658203125, -0.028045654296875, 0.0404052734375, 0.108856201171875, 0.17730712890625, 0.245758056640625, 0.314208984375, 0.382659912109375, 0.45111083984375, 0.519561767578125, 0.5880126953125, 0.656463623046875, 0.72491455078125, 0.793365478515625, 0.86181640625, 0.930267333984375, 0.99871826171875, 1.067169189453125, 1.1356201171875, 1.204071044921875, 1.27252197265625, 1.340972900390625, 1.409423828125, 1.477874755859375, 1.54632568359375, 1.614776611328125, 1.6832275390625, 1.751678466796875, 1.82012939453125, 1.888580322265625, 1.95703125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 8.0, 10.0, 19.0, 44.0, 68.0, 120.0, 149.0, 177.0, 151.0, 102.0, 68.0, 32.0, 24.0, 10.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.70559310913086, -19.080358505249023, -18.455123901367188, -17.82988929748535, -17.204654693603516, -16.57942008972168, -15.95418643951416, -15.328951835632324, -14.703717231750488, -14.078482627868652, -13.453248023986816, -12.82801342010498, -12.202779769897461, -11.577545166015625, -10.952310562133789, -10.327075958251953, -9.701841354370117, -9.076606750488281, -8.451372146606445, -7.826138019561768, -7.200903415679932, -6.575668811798096, -5.950434684753418, -5.325200080871582, -4.699965476989746, -4.07473087310791, -3.4494965076446533, -2.8242621421813965, -2.1990275382995605, -1.5737929344177246, -0.9485585689544678, -0.32332420349121094, 0.3019123077392578, 0.9271467924118042, 1.5523812770843506, 2.1776156425476074, 2.8028502464294434, 3.4280848503112793, 4.053318977355957, 4.678553581237793, 5.303788185119629, 5.929022789001465, 6.554257392883301, 7.1794915199279785, 7.8047261238098145, 8.429960250854492, 9.055194854736328, 9.680429458618164, 10.3056640625, 10.930898666381836, 11.556133270263672, 12.181367874145508, 12.806602478027344, 13.43183708190918, 14.0570707321167, 14.682305335998535, 15.307539939880371, 15.932774543762207, 16.558008193969727, 17.183242797851562, 17.8084774017334, 18.433712005615234, 19.05894660949707, 19.684181213378906, 20.309415817260742]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 2.0, 1.0, 7.0, 4.0, 5.0, 8.0, 12.0, 20.0, 19.0, 23.0, 20.0, 21.0, 23.0, 29.0, 31.0, 45.0, 46.0, 38.0, 49.0, 41.0, 35.0, 43.0, 46.0, 45.0, 31.0, 44.0, 42.0, 31.0, 27.0, 38.0, 26.0, 26.0, 13.0, 20.0, 14.0, 17.0, 16.0, 6.0, 9.0, 8.0, 6.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.572405815124512, -7.335194110870361, -7.097982406616211, -6.8607707023620605, -6.62355899810791, -6.38634729385376, -6.149135589599609, -5.911923885345459, -5.674712181091309, -5.437500476837158, -5.200288772583008, -4.963077068328857, -4.725865364074707, -4.488653659820557, -4.251441955566406, -4.014230251312256, -3.7770187854766846, -3.539807081222534, -3.302595376968384, -3.0653836727142334, -2.828171968460083, -2.5909605026245117, -2.3537487983703613, -2.116537094116211, -1.879325270652771, -1.6421135663986206, -1.4049018621444702, -1.1676902770996094, -0.9304785132408142, -0.6932668685913086, -0.4560551643371582, -0.2188434600830078, 0.018368244171142578, 0.25557994842529297, 0.49279162287712097, 0.730003297328949, 0.9672150015830994, 1.204426646232605, 1.4416383504867554, 1.6788500547409058, 1.9160617589950562, 2.153273344039917, 2.3904850482940674, 2.6276967525482178, 2.864908456802368, 3.1021201610565186, 3.339331865310669, 3.5765435695648193, 3.8137552738189697, 4.050966739654541, 4.288178443908691, 4.525390148162842, 4.762601852416992, 4.999813556671143, 5.237025260925293, 5.474236965179443, 5.711448669433594, 5.948660373687744, 6.1858720779418945, 6.423083782196045, 6.660295486450195, 6.897507190704346, 7.134718894958496, 7.3719305992126465, 7.609142303466797]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 5.0, 17.0, 5.0, 15.0, 18.0, 41.0, 84.0, 101.0, 187.0, 265.0, 475.0, 883.0, 1607.0, 3428.0, 7546.0, 18496.0, 52062.0, 164334.0, 460287.0, 226767.0, 69799.0, 24176.0, 9457.0, 4148.0, 1957.0, 1027.0, 523.0, 334.0, 183.0, 106.0, 75.0, 45.0, 29.0, 24.0, 22.0, 9.0, 5.0, 4.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.1640625, -6.9510498046875, -6.738037109375, -6.5250244140625, -6.31201171875, -6.0989990234375, -5.885986328125, -5.6729736328125, -5.4599609375, -5.2469482421875, -5.033935546875, -4.8209228515625, -4.60791015625, -4.3948974609375, -4.181884765625, -3.9688720703125, -3.755859375, -3.5428466796875, -3.329833984375, -3.1168212890625, -2.90380859375, -2.6907958984375, -2.477783203125, -2.2647705078125, -2.0517578125, -1.8387451171875, -1.625732421875, -1.4127197265625, -1.19970703125, -0.9866943359375, -0.773681640625, -0.5606689453125, -0.34765625, -0.1346435546875, 0.078369140625, 0.2913818359375, 0.50439453125, 0.7174072265625, 0.930419921875, 1.1434326171875, 1.3564453125, 1.5694580078125, 1.782470703125, 1.9954833984375, 2.20849609375, 2.4215087890625, 2.634521484375, 2.8475341796875, 3.060546875, 3.2735595703125, 3.486572265625, 3.6995849609375, 3.91259765625, 4.1256103515625, 4.338623046875, 4.5516357421875, 4.7646484375, 4.9776611328125, 5.190673828125, 5.4036865234375, 5.61669921875, 5.8297119140625, 6.042724609375, 6.2557373046875, 6.46875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 8.0, 3.0, 5.0, 8.0, 8.0, 16.0, 21.0, 18.0, 39.0, 39.0, 40.0, 37.0, 48.0, 51.0, 52.0, 52.0, 54.0, 48.0, 46.0, 41.0, 46.0, 45.0, 53.0, 34.0, 39.0, 31.0, 21.0, 24.0, 18.0, 9.0, 16.0, 3.0, 4.0, 7.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.14453125, -1.11090087890625, -1.0772705078125, -1.04364013671875, -1.010009765625, -0.97637939453125, -0.9427490234375, -0.90911865234375, -0.87548828125, -0.84185791015625, -0.8082275390625, -0.77459716796875, -0.740966796875, -0.70733642578125, -0.6737060546875, -0.64007568359375, -0.6064453125, -0.57281494140625, -0.5391845703125, -0.50555419921875, -0.471923828125, -0.43829345703125, -0.4046630859375, -0.37103271484375, -0.33740234375, -0.30377197265625, -0.2701416015625, -0.23651123046875, -0.202880859375, -0.16925048828125, -0.1356201171875, -0.10198974609375, -0.068359375, -0.03472900390625, -0.0010986328125, 0.03253173828125, 0.066162109375, 0.09979248046875, 0.1334228515625, 0.16705322265625, 0.20068359375, 0.23431396484375, 0.2679443359375, 0.30157470703125, 0.335205078125, 0.36883544921875, 0.4024658203125, 0.43609619140625, 0.4697265625, 0.50335693359375, 0.5369873046875, 0.57061767578125, 0.604248046875, 0.63787841796875, 0.6715087890625, 0.70513916015625, 0.73876953125, 0.77239990234375, 0.8060302734375, 0.83966064453125, 0.873291015625, 0.90692138671875, 0.9405517578125, 0.97418212890625, 1.0078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 7.0, 8.0, 9.0, 3.0, 8.0, 23.0, 23.0, 27.0, 38.0, 52.0, 60.0, 77.0, 112.0, 151.0, 223.0, 356.0, 552.0, 1038.0, 2118.0, 5896.0, 22926.0, 110433.0, 520430.0, 305670.0, 57592.0, 13035.0, 3910.0, 1531.0, 779.0, 449.0, 315.0, 188.0, 143.0, 92.0, 81.0, 53.0, 38.0, 31.0, 19.0, 15.0, 13.0, 8.0, 6.0, 7.0, 5.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.8359375, -7.61077880859375, -7.3856201171875, -7.16046142578125, -6.935302734375, -6.71014404296875, -6.4849853515625, -6.25982666015625, -6.03466796875, -5.80950927734375, -5.5843505859375, -5.35919189453125, -5.134033203125, -4.90887451171875, -4.6837158203125, -4.45855712890625, -4.2333984375, -4.00823974609375, -3.7830810546875, -3.55792236328125, -3.332763671875, -3.10760498046875, -2.8824462890625, -2.65728759765625, -2.43212890625, -2.20697021484375, -1.9818115234375, -1.75665283203125, -1.531494140625, -1.30633544921875, -1.0811767578125, -0.85601806640625, -0.630859375, -0.40570068359375, -0.1805419921875, 0.04461669921875, 0.269775390625, 0.49493408203125, 0.7200927734375, 0.94525146484375, 1.17041015625, 1.39556884765625, 1.6207275390625, 1.84588623046875, 2.071044921875, 2.29620361328125, 2.5213623046875, 2.74652099609375, 2.9716796875, 3.19683837890625, 3.4219970703125, 3.64715576171875, 3.872314453125, 4.09747314453125, 4.3226318359375, 4.54779052734375, 4.77294921875, 4.99810791015625, 5.2232666015625, 5.44842529296875, 5.673583984375, 5.89874267578125, 6.1239013671875, 6.34906005859375, 6.57421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 5.0, 10.0, 12.0, 11.0, 16.0, 20.0, 17.0, 15.0, 24.0, 33.0, 51.0, 30.0, 41.0, 45.0, 50.0, 33.0, 55.0, 53.0, 53.0, 53.0, 57.0, 39.0, 41.0, 37.0, 36.0, 29.0, 24.0, 20.0, 17.0, 18.0, 13.0, 12.0, 9.0, 6.0, 7.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.62884521484375, -4.4803466796875, -4.33184814453125, -4.183349609375, -4.03485107421875, -3.8863525390625, -3.73785400390625, -3.58935546875, -3.44085693359375, -3.2923583984375, -3.14385986328125, -2.995361328125, -2.84686279296875, -2.6983642578125, -2.54986572265625, -2.4013671875, -2.25286865234375, -2.1043701171875, -1.95587158203125, -1.807373046875, -1.65887451171875, -1.5103759765625, -1.36187744140625, -1.21337890625, -1.06488037109375, -0.9163818359375, -0.76788330078125, -0.619384765625, -0.47088623046875, -0.3223876953125, -0.17388916015625, -0.025390625, 0.12310791015625, 0.2716064453125, 0.42010498046875, 0.568603515625, 0.71710205078125, 0.8656005859375, 1.01409912109375, 1.16259765625, 1.31109619140625, 1.4595947265625, 1.60809326171875, 1.756591796875, 1.90509033203125, 2.0535888671875, 2.20208740234375, 2.3505859375, 2.49908447265625, 2.6475830078125, 2.79608154296875, 2.944580078125, 3.09307861328125, 3.2415771484375, 3.39007568359375, 3.53857421875, 3.68707275390625, 3.8355712890625, 3.98406982421875, 4.132568359375, 4.28106689453125, 4.4295654296875, 4.57806396484375, 4.7265625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 8.0, 7.0, 19.0, 24.0, 32.0, 54.0, 96.0, 172.0, 293.0, 654.0, 1352.0, 3589.0, 12564.0, 87278.0, 788790.0, 130783.0, 15525.0, 4195.0, 1572.0, 684.0, 357.0, 214.0, 110.0, 75.0, 35.0, 21.0, 17.0, 10.0, 10.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.4296875, -9.197265625, -8.96484375, -8.732421875, -8.5, -8.267578125, -8.03515625, -7.802734375, -7.5703125, -7.337890625, -7.10546875, -6.873046875, -6.640625, -6.408203125, -6.17578125, -5.943359375, -5.7109375, -5.478515625, -5.24609375, -5.013671875, -4.78125, -4.548828125, -4.31640625, -4.083984375, -3.8515625, -3.619140625, -3.38671875, -3.154296875, -2.921875, -2.689453125, -2.45703125, -2.224609375, -1.9921875, -1.759765625, -1.52734375, -1.294921875, -1.0625, -0.830078125, -0.59765625, -0.365234375, -0.1328125, 0.099609375, 0.33203125, 0.564453125, 0.796875, 1.029296875, 1.26171875, 1.494140625, 1.7265625, 1.958984375, 2.19140625, 2.423828125, 2.65625, 2.888671875, 3.12109375, 3.353515625, 3.5859375, 3.818359375, 4.05078125, 4.283203125, 4.515625, 4.748046875, 4.98046875, 5.212890625, 5.4453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 5.0, 13.0, 7.0, 13.0, 18.0, 18.0, 17.0, 32.0, 26.0, 35.0, 47.0, 63.0, 76.0, 86.0, 111.0, 85.0, 76.0, 51.0, 37.0, 38.0, 33.0, 19.0, 14.0, 17.0, 11.0, 4.0, 7.0, 7.0, 4.0, 9.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004870891571044922, -0.0004704482853412628, -0.00045380741357803345, -0.0004371665418148041, -0.0004205256700515747, -0.00040388479828834534, -0.00038724392652511597, -0.0003706030547618866, -0.0003539621829986572, -0.00033732131123542786, -0.0003206804394721985, -0.0003040395677089691, -0.00028739869594573975, -0.0002707578241825104, -0.000254116952419281, -0.00023747608065605164, -0.00022083520889282227, -0.0002041943371295929, -0.00018755346536636353, -0.00017091259360313416, -0.00015427172183990479, -0.00013763085007667542, -0.00012098997831344604, -0.00010434910655021667, -8.77082347869873e-05, -7.106736302375793e-05, -5.4426491260528564e-05, -3.7785619497299194e-05, -2.1144747734069824e-05, -4.503875970840454e-06, 1.2136995792388916e-05, 2.8777867555618286e-05, 4.5418739318847656e-05, 6.205961108207703e-05, 7.87004828453064e-05, 9.534135460853577e-05, 0.00011198222637176514, 0.0001286230981349945, 0.00014526396989822388, 0.00016190484166145325, 0.00017854571342468262, 0.000195186585187912, 0.00021182745695114136, 0.00022846832871437073, 0.0002451092004776001, 0.00026175007224082947, 0.00027839094400405884, 0.0002950318157672882, 0.0003116726875305176, 0.00032831355929374695, 0.0003449544310569763, 0.0003615953028202057, 0.00037823617458343506, 0.00039487704634666443, 0.0004115179181098938, 0.00042815878987312317, 0.00044479966163635254, 0.0004614405333995819, 0.0004780814051628113, 0.0004947222769260406, 0.00051136314868927, 0.0005280040204524994, 0.0005446448922157288, 0.0005612857639789581, 0.0005779266357421875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 10.0, 5.0, 14.0, 11.0, 11.0, 22.0, 28.0, 41.0, 51.0, 73.0, 101.0, 191.0, 350.0, 727.0, 1884.0, 5565.0, 21218.0, 197750.0, 740807.0, 62466.0, 11278.0, 3320.0, 1322.0, 557.0, 289.0, 140.0, 98.0, 66.0, 44.0, 29.0, 23.0, 15.0, 18.0, 7.0, 1.0, 8.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.0546875, -5.84063720703125, -5.6265869140625, -5.41253662109375, -5.198486328125, -4.98443603515625, -4.7703857421875, -4.55633544921875, -4.34228515625, -4.12823486328125, -3.9141845703125, -3.70013427734375, -3.486083984375, -3.27203369140625, -3.0579833984375, -2.84393310546875, -2.6298828125, -2.41583251953125, -2.2017822265625, -1.98773193359375, -1.773681640625, -1.55963134765625, -1.3455810546875, -1.13153076171875, -0.91748046875, -0.70343017578125, -0.4893798828125, -0.27532958984375, -0.061279296875, 0.15277099609375, 0.3668212890625, 0.58087158203125, 0.794921875, 1.00897216796875, 1.2230224609375, 1.43707275390625, 1.651123046875, 1.86517333984375, 2.0792236328125, 2.29327392578125, 2.50732421875, 2.72137451171875, 2.9354248046875, 3.14947509765625, 3.363525390625, 3.57757568359375, 3.7916259765625, 4.00567626953125, 4.2197265625, 4.43377685546875, 4.6478271484375, 4.86187744140625, 5.075927734375, 5.28997802734375, 5.5040283203125, 5.71807861328125, 5.93212890625, 6.14617919921875, 6.3602294921875, 6.57427978515625, 6.788330078125, 7.00238037109375, 7.2164306640625, 7.43048095703125, 7.64453125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 5.0, 4.0, 6.0, 8.0, 9.0, 9.0, 12.0, 24.0, 40.0, 83.0, 125.0, 165.0, 162.0, 134.0, 76.0, 38.0, 39.0, 16.0, 16.0, 9.0, 8.0, 1.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7421875, -5.5823974609375, -5.422607421875, -5.2628173828125, -5.10302734375, -4.9432373046875, -4.783447265625, -4.6236572265625, -4.4638671875, -4.3040771484375, -4.144287109375, -3.9844970703125, -3.82470703125, -3.6649169921875, -3.505126953125, -3.3453369140625, -3.185546875, -3.0257568359375, -2.865966796875, -2.7061767578125, -2.54638671875, -2.3865966796875, -2.226806640625, -2.0670166015625, -1.9072265625, -1.7474365234375, -1.587646484375, -1.4278564453125, -1.26806640625, -1.1082763671875, -0.948486328125, -0.7886962890625, -0.62890625, -0.4691162109375, -0.309326171875, -0.1495361328125, 0.01025390625, 0.1700439453125, 0.329833984375, 0.4896240234375, 0.6494140625, 0.8092041015625, 0.968994140625, 1.1287841796875, 1.28857421875, 1.4483642578125, 1.608154296875, 1.7679443359375, 1.927734375, 2.0875244140625, 2.247314453125, 2.4071044921875, 2.56689453125, 2.7266845703125, 2.886474609375, 3.0462646484375, 3.2060546875, 3.3658447265625, 3.525634765625, 3.6854248046875, 3.84521484375, 4.0050048828125, 4.164794921875, 4.3245849609375, 4.484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 12.0, 23.0, 52.0, 134.0, 236.0, 251.0, 160.0, 71.0, 35.0, 12.0, 9.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.72313690185547, -62.26317596435547, -59.80321502685547, -57.34325408935547, -54.88329315185547, -52.42333221435547, -49.96337127685547, -47.50341033935547, -45.04344940185547, -42.58348846435547, -40.12352752685547, -37.66356658935547, -35.20360565185547, -32.74364471435547, -30.28368377685547, -27.82372283935547, -25.36376190185547, -22.90380096435547, -20.44384002685547, -17.98387908935547, -15.523918151855469, -13.063957214355469, -10.603996276855469, -8.144035339355469, -5.684074401855469, -3.2241134643554688, -0.7641525268554688, 1.6958084106445312, 4.155769348144531, 6.615730285644531, 9.075691223144531, 11.535652160644531, 13.995613098144531, 16.45557403564453, 18.91553497314453, 21.37549591064453, 23.83545684814453, 26.29541778564453, 28.75537872314453, 31.21533966064453, 33.67530059814453, 36.13526153564453, 38.59522247314453, 41.05518341064453, 43.51514434814453, 45.97510528564453, 48.43506622314453, 50.89502716064453, 53.35498809814453, 55.81494903564453, 58.27490997314453, 60.73487091064453, 63.19483184814453, 65.65479278564453, 68.11475372314453, 70.57471466064453, 73.03467559814453, 75.49463653564453, 77.95459747314453, 80.41455841064453, 82.87451934814453, 85.33448028564453, 87.79444122314453, 90.25440216064453, 92.71436309814453]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 5.0, 5.0, 8.0, 9.0, 17.0, 19.0, 19.0, 18.0, 25.0, 20.0, 25.0, 37.0, 36.0, 40.0, 28.0, 38.0, 35.0, 36.0, 43.0, 39.0, 53.0, 43.0, 41.0, 35.0, 43.0, 34.0, 31.0, 31.0, 24.0, 27.0, 23.0, 18.0, 9.0, 16.0, 12.0, 3.0, 8.0, 15.0, 10.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.24639320373535, -21.511661529541016, -20.77692985534668, -20.042198181152344, -19.307466506958008, -18.572734832763672, -17.83800506591797, -17.103271484375, -16.368541717529297, -15.633810043334961, -14.899078369140625, -14.164346694946289, -13.429615020751953, -12.694883346557617, -11.960152626037598, -11.225420951843262, -10.49068832397461, -9.755956649780273, -9.021224975585938, -8.286493301391602, -7.551762104034424, -6.817030429840088, -6.08229923248291, -5.347567558288574, -4.612835884094238, -3.8781042098999023, -3.1433727741241455, -2.4086413383483887, -1.6739096641540527, -0.9391779899597168, -0.20444679260253906, 0.5302848815917969, 1.2650184631347656, 1.999750018119812, 2.7344815731048584, 3.4692130088806152, 4.203944683074951, 4.938676357269287, 5.673407554626465, 6.408139228820801, 7.142870903015137, 7.877602577209473, 8.612334251403809, 9.347064971923828, 10.081796646118164, 10.8165283203125, 11.551259994506836, 12.285991668701172, 13.020723342895508, 13.755455017089844, 14.49018669128418, 15.224918365478516, 15.959650039672852, 16.694381713867188, 17.42911148071289, 18.16384506225586, 18.898574829101562, 19.6333065032959, 20.368038177490234, 21.10276985168457, 21.837501525878906, 22.572233200073242, 23.306964874267578, 24.04169464111328, 24.77642822265625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 3.0, 3.0, 2.0, 9.0, 9.0, 9.0, 18.0, 26.0, 34.0, 36.0, 55.0, 115.0, 128.0, 180.0, 286.0, 432.0, 729.0, 1170.0, 1957.0, 3575.0, 6885.0, 14554.0, 36514.0, 131398.0, 2799093.0, 1037753.0, 101923.0, 31032.0, 12574.0, 6044.0, 3083.0, 1832.0, 1046.0, 597.0, 359.0, 243.0, 176.0, 132.0, 73.0, 46.0, 51.0, 25.0, 23.0, 17.0, 11.0, 3.0, 4.0, 2.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-5.21484375, -5.056396484375, -4.89794921875, -4.739501953125, -4.5810546875, -4.422607421875, -4.26416015625, -4.105712890625, -3.947265625, -3.788818359375, -3.63037109375, -3.471923828125, -3.3134765625, -3.155029296875, -2.99658203125, -2.838134765625, -2.6796875, -2.521240234375, -2.36279296875, -2.204345703125, -2.0458984375, -1.887451171875, -1.72900390625, -1.570556640625, -1.412109375, -1.253662109375, -1.09521484375, -0.936767578125, -0.7783203125, -0.619873046875, -0.46142578125, -0.302978515625, -0.14453125, 0.013916015625, 0.17236328125, 0.330810546875, 0.4892578125, 0.647705078125, 0.80615234375, 0.964599609375, 1.123046875, 1.281494140625, 1.43994140625, 1.598388671875, 1.7568359375, 1.915283203125, 2.07373046875, 2.232177734375, 2.390625, 2.549072265625, 2.70751953125, 2.865966796875, 3.0244140625, 3.182861328125, 3.34130859375, 3.499755859375, 3.658203125, 3.816650390625, 3.97509765625, 4.133544921875, 4.2919921875, 4.450439453125, 4.60888671875, 4.767333984375, 4.92578125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 6.0, 11.0, 6.0, 17.0, 14.0, 10.0, 25.0, 29.0, 39.0, 39.0, 53.0, 35.0, 43.0, 54.0, 50.0, 53.0, 52.0, 62.0, 44.0, 47.0, 47.0, 37.0, 40.0, 29.0, 35.0, 30.0, 22.0, 11.0, 13.0, 9.0, 9.0, 8.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.19921875, -1.16302490234375, -1.1268310546875, -1.09063720703125, -1.054443359375, -1.01824951171875, -0.9820556640625, -0.94586181640625, -0.90966796875, -0.87347412109375, -0.8372802734375, -0.80108642578125, -0.764892578125, -0.72869873046875, -0.6925048828125, -0.65631103515625, -0.6201171875, -0.58392333984375, -0.5477294921875, -0.51153564453125, -0.475341796875, -0.43914794921875, -0.4029541015625, -0.36676025390625, -0.33056640625, -0.29437255859375, -0.2581787109375, -0.22198486328125, -0.185791015625, -0.14959716796875, -0.1134033203125, -0.07720947265625, -0.041015625, -0.00482177734375, 0.0313720703125, 0.06756591796875, 0.103759765625, 0.13995361328125, 0.1761474609375, 0.21234130859375, 0.24853515625, 0.28472900390625, 0.3209228515625, 0.35711669921875, 0.393310546875, 0.42950439453125, 0.4656982421875, 0.50189208984375, 0.5380859375, 0.57427978515625, 0.6104736328125, 0.64666748046875, 0.682861328125, 0.71905517578125, 0.7552490234375, 0.79144287109375, 0.82763671875, 0.86383056640625, 0.9000244140625, 0.93621826171875, 0.972412109375, 1.00860595703125, 1.0447998046875, 1.08099365234375, 1.1171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 16.0, 19.0, 21.0, 40.0, 70.0, 77.0, 135.0, 231.0, 371.0, 686.0, 1188.0, 2525.0, 5708.0, 15878.0, 60887.0, 474700.0, 3377492.0, 198694.0, 36212.0, 10919.0, 4062.0, 1885.0, 985.0, 588.0, 282.0, 204.0, 135.0, 75.0, 58.0, 46.0, 27.0, 16.0, 14.0, 6.0, 8.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30078125, -5.09149169921875, -4.8822021484375, -4.67291259765625, -4.463623046875, -4.25433349609375, -4.0450439453125, -3.83575439453125, -3.62646484375, -3.41717529296875, -3.2078857421875, -2.99859619140625, -2.789306640625, -2.58001708984375, -2.3707275390625, -2.16143798828125, -1.9521484375, -1.74285888671875, -1.5335693359375, -1.32427978515625, -1.114990234375, -0.90570068359375, -0.6964111328125, -0.48712158203125, -0.27783203125, -0.06854248046875, 0.1407470703125, 0.35003662109375, 0.559326171875, 0.76861572265625, 0.9779052734375, 1.18719482421875, 1.396484375, 1.60577392578125, 1.8150634765625, 2.02435302734375, 2.233642578125, 2.44293212890625, 2.6522216796875, 2.86151123046875, 3.07080078125, 3.28009033203125, 3.4893798828125, 3.69866943359375, 3.907958984375, 4.11724853515625, 4.3265380859375, 4.53582763671875, 4.7451171875, 4.95440673828125, 5.1636962890625, 5.37298583984375, 5.582275390625, 5.79156494140625, 6.0008544921875, 6.21014404296875, 6.41943359375, 6.62872314453125, 6.8380126953125, 7.04730224609375, 7.256591796875, 7.46588134765625, 7.6751708984375, 7.88446044921875, 8.09375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 4.0, 4.0, 14.0, 16.0, 13.0, 25.0, 37.0, 51.0, 81.0, 157.0, 236.0, 636.0, 1558.0, 614.0, 238.0, 129.0, 82.0, 49.0, 37.0, 18.0, 17.0, 13.0, 9.0, 12.0, 5.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.28515625, -2.19183349609375, -2.0985107421875, -2.00518798828125, -1.911865234375, -1.81854248046875, -1.7252197265625, -1.63189697265625, -1.53857421875, -1.44525146484375, -1.3519287109375, -1.25860595703125, -1.165283203125, -1.07196044921875, -0.9786376953125, -0.88531494140625, -0.7919921875, -0.69866943359375, -0.6053466796875, -0.51202392578125, -0.418701171875, -0.32537841796875, -0.2320556640625, -0.13873291015625, -0.04541015625, 0.04791259765625, 0.1412353515625, 0.23455810546875, 0.327880859375, 0.42120361328125, 0.5145263671875, 0.60784912109375, 0.701171875, 0.79449462890625, 0.8878173828125, 0.98114013671875, 1.074462890625, 1.16778564453125, 1.2611083984375, 1.35443115234375, 1.44775390625, 1.54107666015625, 1.6343994140625, 1.72772216796875, 1.821044921875, 1.91436767578125, 2.0076904296875, 2.10101318359375, 2.1943359375, 2.28765869140625, 2.3809814453125, 2.47430419921875, 2.567626953125, 2.66094970703125, 2.7542724609375, 2.84759521484375, 2.94091796875, 3.03424072265625, 3.1275634765625, 3.22088623046875, 3.314208984375, 3.40753173828125, 3.5008544921875, 3.59417724609375, 3.6875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 9.0, 9.0, 9.0, 28.0, 37.0, 43.0, 72.0, 98.0, 96.0, 147.0, 118.0, 105.0, 107.0, 51.0, 32.0, 12.0, 10.0, 13.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.24634552001953, -19.67736053466797, -19.108373641967773, -18.53938865661621, -17.97040367126465, -17.401418685913086, -16.83243179321289, -16.263446807861328, -15.694461822509766, -15.125475883483887, -14.556490898132324, -13.987504959106445, -13.418519973754883, -12.849534034729004, -12.280548095703125, -11.711563110351562, -11.142577171325684, -10.573591232299805, -10.004606246948242, -9.435620307922363, -8.8666353225708, -8.297649383544922, -7.728663921356201, -7.1596784591674805, -6.59069299697876, -6.021707534790039, -5.452722072601318, -4.883736610412598, -4.314750671386719, -3.745765447616577, -3.1767797470092773, -2.6077942848205566, -2.038808822631836, -1.4698233604431152, -0.900837779045105, -0.3318521976470947, 0.23713326454162598, 0.8061187267303467, 1.3751044273376465, 1.9440898895263672, 2.513075351715088, 3.0820608139038086, 3.6510462760925293, 4.22003173828125, 4.789017677307129, 5.358002662658691, 5.92698860168457, 6.495974063873291, 7.064959526062012, 7.633944988250732, 8.202930450439453, 8.771916389465332, 9.340901374816895, 9.909887313842773, 10.478872299194336, 11.047858238220215, 11.616844177246094, 12.185830116271973, 12.754815101623535, 13.323801040649414, 13.892786026000977, 14.461771965026855, 15.030757904052734, 15.599742889404297, 16.16872787475586]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 3.0, 8.0, 13.0, 10.0, 11.0, 7.0, 8.0, 19.0, 15.0, 27.0, 22.0, 35.0, 30.0, 42.0, 46.0, 49.0, 40.0, 40.0, 54.0, 39.0, 46.0, 55.0, 35.0, 46.0, 33.0, 43.0, 25.0, 29.0, 21.0, 19.0, 24.0, 19.0, 17.0, 13.0, 7.0, 16.0, 5.0, 6.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.278190612792969, -8.989839553833008, -8.70148754119873, -8.41313648223877, -8.124784469604492, -7.836432933807373, -7.548081398010254, -7.259730339050293, -6.971378326416016, -6.6830267906188965, -6.394675254821777, -6.106323719024658, -5.817972183227539, -5.52962064743042, -5.241269111633301, -4.95291805267334, -4.664566516876221, -4.376214981079102, -4.087863445281982, -3.7995119094848633, -3.511160373687744, -3.222808837890625, -2.934457540512085, -2.646106004714966, -2.3577544689178467, -2.0694029331207275, -1.7810513973236084, -1.4926999807357788, -1.2043484449386597, -0.9159969091415405, -0.6276454925537109, -0.3392939567565918, -0.050942420959472656, 0.2374090850353241, 0.5257605910301208, 0.8141120672225952, 1.1024636030197144, 1.3908151388168335, 1.679166555404663, 1.9675180912017822, 2.2558696269989014, 2.5442211627960205, 2.8325726985931396, 3.1209239959716797, 3.409275531768799, 3.697627067565918, 3.985978603363037, 4.274330139160156, 4.562681674957275, 4.8510332107543945, 5.139384746551514, 5.427736282348633, 5.716087818145752, 6.004439353942871, 6.292790412902832, 6.581142425537109, 6.86949348449707, 7.1578450202941895, 7.446196556091309, 7.734548091888428, 8.022899627685547, 8.311250686645508, 8.599602699279785, 8.887953758239746, 9.176305770874023]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 4.0, 11.0, 26.0, 30.0, 33.0, 47.0, 68.0, 120.0, 161.0, 285.0, 464.0, 791.0, 1302.0, 2275.0, 4217.0, 8657.0, 19114.0, 46770.0, 147216.0, 598489.0, 137082.0, 44708.0, 18527.0, 8523.0, 4209.0, 2254.0, 1236.0, 732.0, 413.0, 262.0, 158.0, 108.0, 91.0, 44.0, 32.0, 30.0, 19.0, 14.0, 9.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.72265625, -6.5218505859375, -6.321044921875, -6.1202392578125, -5.91943359375, -5.7186279296875, -5.517822265625, -5.3170166015625, -5.1162109375, -4.9154052734375, -4.714599609375, -4.5137939453125, -4.31298828125, -4.1121826171875, -3.911376953125, -3.7105712890625, -3.509765625, -3.3089599609375, -3.108154296875, -2.9073486328125, -2.70654296875, -2.5057373046875, -2.304931640625, -2.1041259765625, -1.9033203125, -1.7025146484375, -1.501708984375, -1.3009033203125, -1.10009765625, -0.8992919921875, -0.698486328125, -0.4976806640625, -0.296875, -0.0960693359375, 0.104736328125, 0.3055419921875, 0.50634765625, 0.7071533203125, 0.907958984375, 1.1087646484375, 1.3095703125, 1.5103759765625, 1.711181640625, 1.9119873046875, 2.11279296875, 2.3135986328125, 2.514404296875, 2.7152099609375, 2.916015625, 3.1168212890625, 3.317626953125, 3.5184326171875, 3.71923828125, 3.9200439453125, 4.120849609375, 4.3216552734375, 4.5224609375, 4.7232666015625, 4.924072265625, 5.1248779296875, 5.32568359375, 5.5264892578125, 5.727294921875, 5.9281005859375, 6.12890625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 4.0, 6.0, 8.0, 19.0, 21.0, 25.0, 21.0, 34.0, 21.0, 35.0, 39.0, 33.0, 45.0, 66.0, 45.0, 49.0, 48.0, 51.0, 42.0, 45.0, 39.0, 44.0, 38.0, 31.0, 34.0, 34.0, 27.0, 21.0, 16.0, 10.0, 12.0, 4.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.138671875, -1.103607177734375, -1.06854248046875, -1.033477783203125, -0.9984130859375, -0.963348388671875, -0.92828369140625, -0.893218994140625, -0.858154296875, -0.823089599609375, -0.78802490234375, -0.752960205078125, -0.7178955078125, -0.682830810546875, -0.64776611328125, -0.612701416015625, -0.57763671875, -0.542572021484375, -0.50750732421875, -0.472442626953125, -0.4373779296875, -0.402313232421875, -0.36724853515625, -0.332183837890625, -0.297119140625, -0.262054443359375, -0.22698974609375, -0.191925048828125, -0.1568603515625, -0.121795654296875, -0.08673095703125, -0.051666259765625, -0.0166015625, 0.018463134765625, 0.05352783203125, 0.088592529296875, 0.1236572265625, 0.158721923828125, 0.19378662109375, 0.228851318359375, 0.263916015625, 0.298980712890625, 0.33404541015625, 0.369110107421875, 0.4041748046875, 0.439239501953125, 0.47430419921875, 0.509368896484375, 0.54443359375, 0.579498291015625, 0.61456298828125, 0.649627685546875, 0.6846923828125, 0.719757080078125, 0.75482177734375, 0.789886474609375, 0.824951171875, 0.860015869140625, 0.89508056640625, 0.930145263671875, 0.9652099609375, 1.000274658203125, 1.03533935546875, 1.070404052734375, 1.10546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 15.0, 14.0, 29.0, 30.0, 51.0, 39.0, 90.0, 116.0, 162.0, 268.0, 391.0, 622.0, 1212.0, 2948.0, 9629.0, 43544.0, 388448.0, 531701.0, 51696.0, 11077.0, 3239.0, 1318.0, 697.0, 362.0, 260.0, 169.0, 109.0, 82.0, 53.0, 54.0, 33.0, 23.0, 18.0, 14.0, 11.0, 3.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.9921875, -9.69873046875, -9.4052734375, -9.11181640625, -8.818359375, -8.52490234375, -8.2314453125, -7.93798828125, -7.64453125, -7.35107421875, -7.0576171875, -6.76416015625, -6.470703125, -6.17724609375, -5.8837890625, -5.59033203125, -5.296875, -5.00341796875, -4.7099609375, -4.41650390625, -4.123046875, -3.82958984375, -3.5361328125, -3.24267578125, -2.94921875, -2.65576171875, -2.3623046875, -2.06884765625, -1.775390625, -1.48193359375, -1.1884765625, -0.89501953125, -0.6015625, -0.30810546875, -0.0146484375, 0.27880859375, 0.572265625, 0.86572265625, 1.1591796875, 1.45263671875, 1.74609375, 2.03955078125, 2.3330078125, 2.62646484375, 2.919921875, 3.21337890625, 3.5068359375, 3.80029296875, 4.09375, 4.38720703125, 4.6806640625, 4.97412109375, 5.267578125, 5.56103515625, 5.8544921875, 6.14794921875, 6.44140625, 6.73486328125, 7.0283203125, 7.32177734375, 7.615234375, 7.90869140625, 8.2021484375, 8.49560546875, 8.7890625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 1.0, 4.0, 3.0, 8.0, 8.0, 12.0, 11.0, 16.0, 23.0, 17.0, 25.0, 16.0, 28.0, 30.0, 31.0, 41.0, 40.0, 55.0, 56.0, 54.0, 36.0, 42.0, 52.0, 47.0, 49.0, 29.0, 34.0, 30.0, 34.0, 22.0, 28.0, 21.0, 15.0, 12.0, 18.0, 9.0, 8.0, 5.0, 3.0, 7.0, 1.0, 6.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5625, -4.41802978515625, -4.2735595703125, -4.12908935546875, -3.984619140625, -3.84014892578125, -3.6956787109375, -3.55120849609375, -3.40673828125, -3.26226806640625, -3.1177978515625, -2.97332763671875, -2.828857421875, -2.68438720703125, -2.5399169921875, -2.39544677734375, -2.2509765625, -2.10650634765625, -1.9620361328125, -1.81756591796875, -1.673095703125, -1.52862548828125, -1.3841552734375, -1.23968505859375, -1.09521484375, -0.95074462890625, -0.8062744140625, -0.66180419921875, -0.517333984375, -0.37286376953125, -0.2283935546875, -0.08392333984375, 0.060546875, 0.20501708984375, 0.3494873046875, 0.49395751953125, 0.638427734375, 0.78289794921875, 0.9273681640625, 1.07183837890625, 1.21630859375, 1.36077880859375, 1.5052490234375, 1.64971923828125, 1.794189453125, 1.93865966796875, 2.0831298828125, 2.22760009765625, 2.3720703125, 2.51654052734375, 2.6610107421875, 2.80548095703125, 2.949951171875, 3.09442138671875, 3.2388916015625, 3.38336181640625, 3.52783203125, 3.67230224609375, 3.8167724609375, 3.96124267578125, 4.105712890625, 4.25018310546875, 4.3946533203125, 4.53912353515625, 4.68359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 24.0, 26.0, 61.0, 102.0, 310.0, 745.0, 2763.0, 14421.0, 195981.0, 796946.0, 30700.0, 4517.0, 1189.0, 401.0, 155.0, 83.0, 43.0, 21.0, 16.0, 8.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.6015625, -11.305419921875, -11.00927734375, -10.713134765625, -10.4169921875, -10.120849609375, -9.82470703125, -9.528564453125, -9.232421875, -8.936279296875, -8.64013671875, -8.343994140625, -8.0478515625, -7.751708984375, -7.45556640625, -7.159423828125, -6.86328125, -6.567138671875, -6.27099609375, -5.974853515625, -5.6787109375, -5.382568359375, -5.08642578125, -4.790283203125, -4.494140625, -4.197998046875, -3.90185546875, -3.605712890625, -3.3095703125, -3.013427734375, -2.71728515625, -2.421142578125, -2.125, -1.828857421875, -1.53271484375, -1.236572265625, -0.9404296875, -0.644287109375, -0.34814453125, -0.052001953125, 0.244140625, 0.540283203125, 0.83642578125, 1.132568359375, 1.4287109375, 1.724853515625, 2.02099609375, 2.317138671875, 2.61328125, 2.909423828125, 3.20556640625, 3.501708984375, 3.7978515625, 4.093994140625, 4.39013671875, 4.686279296875, 4.982421875, 5.278564453125, 5.57470703125, 5.870849609375, 6.1669921875, 6.463134765625, 6.75927734375, 7.055419921875, 7.3515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 12.0, 11.0, 22.0, 32.0, 48.0, 179.0, 448.0, 99.0, 52.0, 36.0, 21.0, 12.0, 8.0, 4.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019092559814453125, -0.0018502622842788696, -0.0017912685871124268, -0.0017322748899459839, -0.001673281192779541, -0.0016142874956130981, -0.0015552937984466553, -0.0014963001012802124, -0.0014373064041137695, -0.0013783127069473267, -0.0013193190097808838, -0.001260325312614441, -0.001201331615447998, -0.0011423379182815552, -0.0010833442211151123, -0.0010243505239486694, -0.0009653568267822266, -0.0009063631296157837, -0.0008473694324493408, -0.000788375735282898, -0.0007293820381164551, -0.0006703883409500122, -0.0006113946437835693, -0.0005524009466171265, -0.0004934072494506836, -0.0004344135522842407, -0.00037541985511779785, -0.000316426157951355, -0.0002574324607849121, -0.00019843876361846924, -0.00013944506645202637, -8.04513692855835e-05, -2.1457672119140625e-05, 3.7536025047302246e-05, 9.652972221374512e-05, 0.000155523419380188, 0.00021451711654663086, 0.00027351081371307373, 0.0003325045108795166, 0.00039149820804595947, 0.00045049190521240234, 0.0005094856023788452, 0.0005684792995452881, 0.000627472996711731, 0.0006864666938781738, 0.0007454603910446167, 0.0008044540882110596, 0.0008634477853775024, 0.0009224414825439453, 0.0009814351797103882, 0.001040428876876831, 0.001099422574043274, 0.0011584162712097168, 0.0012174099683761597, 0.0012764036655426025, 0.0013353973627090454, 0.0013943910598754883, 0.0014533847570419312, 0.001512378454208374, 0.001571372151374817, 0.0016303658485412598, 0.0016893595457077026, 0.0017483532428741455, 0.0018073469400405884, 0.0018663406372070312]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 9.0, 12.0, 8.0, 18.0, 26.0, 42.0, 50.0, 77.0, 117.0, 204.0, 361.0, 737.0, 1800.0, 6168.0, 30783.0, 408389.0, 554271.0, 35270.0, 6534.0, 1904.0, 749.0, 408.0, 211.0, 150.0, 71.0, 55.0, 43.0, 26.0, 11.0, 11.0, 8.0, 8.0, 3.0, 2.0, 3.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.375, -7.17034912109375, -6.9656982421875, -6.76104736328125, -6.556396484375, -6.35174560546875, -6.1470947265625, -5.94244384765625, -5.73779296875, -5.53314208984375, -5.3284912109375, -5.12384033203125, -4.919189453125, -4.71453857421875, -4.5098876953125, -4.30523681640625, -4.1005859375, -3.89593505859375, -3.6912841796875, -3.48663330078125, -3.281982421875, -3.07733154296875, -2.8726806640625, -2.66802978515625, -2.46337890625, -2.25872802734375, -2.0540771484375, -1.84942626953125, -1.644775390625, -1.44012451171875, -1.2354736328125, -1.03082275390625, -0.826171875, -0.62152099609375, -0.4168701171875, -0.21221923828125, -0.007568359375, 0.19708251953125, 0.4017333984375, 0.60638427734375, 0.81103515625, 1.01568603515625, 1.2203369140625, 1.42498779296875, 1.629638671875, 1.83428955078125, 2.0389404296875, 2.24359130859375, 2.4482421875, 2.65289306640625, 2.8575439453125, 3.06219482421875, 3.266845703125, 3.47149658203125, 3.6761474609375, 3.88079833984375, 4.08544921875, 4.29010009765625, 4.4947509765625, 4.69940185546875, 4.904052734375, 5.10870361328125, 5.3133544921875, 5.51800537109375, 5.72265625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 10.0, 7.0, 11.0, 13.0, 22.0, 22.0, 34.0, 71.0, 138.0, 229.0, 194.0, 87.0, 50.0, 24.0, 16.0, 13.0, 19.0, 7.0, 7.0, 4.0, 1.0, 4.0, 6.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.39453125, -5.24761962890625, -5.1007080078125, -4.95379638671875, -4.806884765625, -4.65997314453125, -4.5130615234375, -4.36614990234375, -4.21923828125, -4.07232666015625, -3.9254150390625, -3.77850341796875, -3.631591796875, -3.48468017578125, -3.3377685546875, -3.19085693359375, -3.0439453125, -2.89703369140625, -2.7501220703125, -2.60321044921875, -2.456298828125, -2.30938720703125, -2.1624755859375, -2.01556396484375, -1.86865234375, -1.72174072265625, -1.5748291015625, -1.42791748046875, -1.281005859375, -1.13409423828125, -0.9871826171875, -0.84027099609375, -0.693359375, -0.54644775390625, -0.3995361328125, -0.25262451171875, -0.105712890625, 0.04119873046875, 0.1881103515625, 0.33502197265625, 0.48193359375, 0.62884521484375, 0.7757568359375, 0.92266845703125, 1.069580078125, 1.21649169921875, 1.3634033203125, 1.51031494140625, 1.6572265625, 1.80413818359375, 1.9510498046875, 2.09796142578125, 2.244873046875, 2.39178466796875, 2.5386962890625, 2.68560791015625, 2.83251953125, 2.97943115234375, 3.1263427734375, 3.27325439453125, 3.420166015625, 3.56707763671875, 3.7139892578125, 3.86090087890625, 4.0078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 12.0, 39.0, 97.0, 209.0, 259.0, 215.0, 109.0, 35.0, 21.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.82325744628906, -69.84823608398438, -66.87322235107422, -63.89820098876953, -60.92318344116211, -57.94816589355469, -54.97314453125, -51.99812698364258, -49.023109436035156, -46.048091888427734, -43.07307434082031, -40.098052978515625, -37.1230354309082, -34.14801788330078, -31.172998428344727, -28.197978973388672, -25.22296142578125, -22.247943878173828, -19.272924423217773, -16.29790496826172, -13.322887420654297, -10.347868919372559, -7.37285041809082, -4.397830963134766, -1.4228134155273438, 1.5522050857543945, 4.527223587036133, 7.502242088317871, 10.47726058959961, 13.452279090881348, 16.427297592163086, 19.40231704711914, 22.377342224121094, 25.352359771728516, 28.32737922668457, 31.302398681640625, 34.27741622924805, 37.25243377685547, 40.227455139160156, 43.20247268676758, 46.177490234375, 49.15250778198242, 52.127525329589844, 55.10254669189453, 58.07756423950195, 61.052581787109375, 64.02760314941406, 67.00262451171875, 69.9776382446289, 72.9526596069336, 75.92767333984375, 78.90269470214844, 81.87771606445312, 84.85272979736328, 87.82775115966797, 90.80276489257812, 93.77778625488281, 96.7528076171875, 99.72782135009766, 102.70284271240234, 105.6778564453125, 108.65287780761719, 111.62789916992188, 114.60292053222656, 117.57793426513672]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 3.0, 1.0, 8.0, 6.0, 7.0, 8.0, 12.0, 15.0, 15.0, 12.0, 9.0, 20.0, 29.0, 21.0, 30.0, 35.0, 31.0, 26.0, 38.0, 42.0, 45.0, 45.0, 44.0, 42.0, 31.0, 36.0, 36.0, 44.0, 24.0, 28.0, 24.0, 32.0, 33.0, 15.0, 18.0, 21.0, 21.0, 18.0, 15.0, 10.0, 12.0, 7.0, 8.0, 5.0, 10.0, 4.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.64881706237793, -21.933399200439453, -21.21798324584961, -20.502565383911133, -19.787147521972656, -19.071731567382812, -18.356313705444336, -17.64089584350586, -16.925479888916016, -16.21006202697754, -15.494645118713379, -14.779228210449219, -14.063810348510742, -13.348393440246582, -12.632976531982422, -11.917558670043945, -11.202140808105469, -10.486723899841309, -9.771306037902832, -9.055889129638672, -8.340471267700195, -7.625054359436035, -6.909637451171875, -6.194220066070557, -5.478802680969238, -4.76338529586792, -4.047967910766602, -3.3325510025024414, -2.617133617401123, -1.9017162322998047, -1.1862993240356445, -0.47088193893432617, 0.244537353515625, 0.9599546194076538, 1.6753718852996826, 2.390789031982422, 3.1062064170837402, 3.8216238021850586, 4.537040710449219, 5.252458095550537, 5.9678754806518555, 6.683292865753174, 7.398710250854492, 8.114127159118652, 8.829544067382812, 9.544961929321289, 10.26037883758545, 10.97579574584961, 11.691213607788086, 12.406630516052246, 13.122048377990723, 13.837465286254883, 14.55288314819336, 15.26830005645752, 15.98371696472168, 16.699134826660156, 17.41455078125, 18.129968643188477, 18.84538459777832, 19.560802459716797, 20.276220321655273, 20.99163818359375, 21.707054138183594, 22.42247200012207, 23.137889862060547]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 5.0, 15.0, 16.0, 26.0, 39.0, 76.0, 93.0, 146.0, 266.0, 456.0, 722.0, 1289.0, 2652.0, 5465.0, 13014.0, 37836.0, 207206.0, 3649163.0, 212744.0, 38661.0, 13147.0, 5496.0, 2663.0, 1290.0, 723.0, 418.0, 227.0, 147.0, 94.0, 59.0, 39.0, 29.0, 14.0, 12.0, 9.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.8359375, -7.615234375, -7.39453125, -7.173828125, -6.953125, -6.732421875, -6.51171875, -6.291015625, -6.0703125, -5.849609375, -5.62890625, -5.408203125, -5.1875, -4.966796875, -4.74609375, -4.525390625, -4.3046875, -4.083984375, -3.86328125, -3.642578125, -3.421875, -3.201171875, -2.98046875, -2.759765625, -2.5390625, -2.318359375, -2.09765625, -1.876953125, -1.65625, -1.435546875, -1.21484375, -0.994140625, -0.7734375, -0.552734375, -0.33203125, -0.111328125, 0.109375, 0.330078125, 0.55078125, 0.771484375, 0.9921875, 1.212890625, 1.43359375, 1.654296875, 1.875, 2.095703125, 2.31640625, 2.537109375, 2.7578125, 2.978515625, 3.19921875, 3.419921875, 3.640625, 3.861328125, 4.08203125, 4.302734375, 4.5234375, 4.744140625, 4.96484375, 5.185546875, 5.40625, 5.626953125, 5.84765625, 6.068359375, 6.2890625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 6.0, 4.0, 14.0, 6.0, 7.0, 13.0, 18.0, 16.0, 18.0, 20.0, 33.0, 24.0, 51.0, 34.0, 40.0, 29.0, 43.0, 44.0, 55.0, 36.0, 35.0, 37.0, 40.0, 51.0, 36.0, 44.0, 31.0, 30.0, 29.0, 28.0, 26.0, 17.0, 8.0, 14.0, 11.0, 10.0, 6.0, 8.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0], "bins": [-1.1650390625, -1.1313018798828125, -1.097564697265625, -1.0638275146484375, -1.03009033203125, -0.9963531494140625, -0.962615966796875, -0.9288787841796875, -0.8951416015625, -0.8614044189453125, -0.827667236328125, -0.7939300537109375, -0.76019287109375, -0.7264556884765625, -0.692718505859375, -0.6589813232421875, -0.625244140625, -0.5915069580078125, -0.557769775390625, -0.5240325927734375, -0.49029541015625, -0.4565582275390625, -0.422821044921875, -0.3890838623046875, -0.3553466796875, -0.3216094970703125, -0.287872314453125, -0.2541351318359375, -0.22039794921875, -0.1866607666015625, -0.152923583984375, -0.1191864013671875, -0.08544921875, -0.0517120361328125, -0.017974853515625, 0.0157623291015625, 0.04949951171875, 0.0832366943359375, 0.116973876953125, 0.1507110595703125, 0.1844482421875, 0.2181854248046875, 0.251922607421875, 0.2856597900390625, 0.31939697265625, 0.3531341552734375, 0.386871337890625, 0.4206085205078125, 0.454345703125, 0.4880828857421875, 0.521820068359375, 0.5555572509765625, 0.58929443359375, 0.6230316162109375, 0.656768798828125, 0.6905059814453125, 0.7242431640625, 0.7579803466796875, 0.791717529296875, 0.8254547119140625, 0.85919189453125, 0.8929290771484375, 0.926666259765625, 0.9604034423828125, 0.994140625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 8.0, 9.0, 14.0, 13.0, 17.0, 30.0, 56.0, 59.0, 96.0, 130.0, 178.0, 309.0, 489.0, 902.0, 1904.0, 4527.0, 13595.0, 52184.0, 508627.0, 3442933.0, 129386.0, 25334.0, 7699.0, 2849.0, 1221.0, 608.0, 339.0, 249.0, 177.0, 107.0, 70.0, 55.0, 40.0, 19.0, 16.0, 14.0, 6.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4765625, -8.22906494140625, -7.9815673828125, -7.73406982421875, -7.486572265625, -7.23907470703125, -6.9915771484375, -6.74407958984375, -6.49658203125, -6.24908447265625, -6.0015869140625, -5.75408935546875, -5.506591796875, -5.25909423828125, -5.0115966796875, -4.76409912109375, -4.5166015625, -4.26910400390625, -4.0216064453125, -3.77410888671875, -3.526611328125, -3.27911376953125, -3.0316162109375, -2.78411865234375, -2.53662109375, -2.28912353515625, -2.0416259765625, -1.79412841796875, -1.546630859375, -1.29913330078125, -1.0516357421875, -0.80413818359375, -0.556640625, -0.30914306640625, -0.0616455078125, 0.18585205078125, 0.433349609375, 0.68084716796875, 0.9283447265625, 1.17584228515625, 1.42333984375, 1.67083740234375, 1.9183349609375, 2.16583251953125, 2.413330078125, 2.66082763671875, 2.9083251953125, 3.15582275390625, 3.4033203125, 3.65081787109375, 3.8983154296875, 4.14581298828125, 4.393310546875, 4.64080810546875, 4.8883056640625, 5.13580322265625, 5.38330078125, 5.63079833984375, 5.8782958984375, 6.12579345703125, 6.373291015625, 6.62078857421875, 6.8682861328125, 7.11578369140625, 7.36328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 9.0, 15.0, 17.0, 25.0, 24.0, 55.0, 84.0, 207.0, 575.0, 2022.0, 579.0, 208.0, 91.0, 61.0, 45.0, 9.0, 20.0, 8.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.23046875, -4.114410400390625, -3.99835205078125, -3.882293701171875, -3.7662353515625, -3.650177001953125, -3.53411865234375, -3.418060302734375, -3.302001953125, -3.185943603515625, -3.06988525390625, -2.953826904296875, -2.8377685546875, -2.721710205078125, -2.60565185546875, -2.489593505859375, -2.37353515625, -2.257476806640625, -2.14141845703125, -2.025360107421875, -1.9093017578125, -1.793243408203125, -1.67718505859375, -1.561126708984375, -1.445068359375, -1.329010009765625, -1.21295166015625, -1.096893310546875, -0.9808349609375, -0.864776611328125, -0.74871826171875, -0.632659912109375, -0.5166015625, -0.400543212890625, -0.28448486328125, -0.168426513671875, -0.0523681640625, 0.063690185546875, 0.17974853515625, 0.295806884765625, 0.411865234375, 0.527923583984375, 0.64398193359375, 0.760040283203125, 0.8760986328125, 0.992156982421875, 1.10821533203125, 1.224273681640625, 1.34033203125, 1.456390380859375, 1.57244873046875, 1.688507080078125, 1.8045654296875, 1.920623779296875, 2.03668212890625, 2.152740478515625, 2.268798828125, 2.384857177734375, 2.50091552734375, 2.616973876953125, 2.7330322265625, 2.849090576171875, 2.96514892578125, 3.081207275390625, 3.197265625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 6.0, 12.0, 13.0, 13.0, 36.0, 49.0, 75.0, 107.0, 133.0, 114.0, 149.0, 105.0, 66.0, 45.0, 33.0, 21.0, 9.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.04202651977539, -22.510051727294922, -21.978076934814453, -21.446102142333984, -20.914127349853516, -20.38215446472168, -19.85017967224121, -19.318204879760742, -18.786230087280273, -18.254255294799805, -17.722280502319336, -17.190305709838867, -16.65833282470703, -16.126358032226562, -15.594383239746094, -15.062408447265625, -14.530433654785156, -13.998458862304688, -13.466484069824219, -12.934510231018066, -12.402535438537598, -11.870560646057129, -11.338586807250977, -10.806612014770508, -10.274637222290039, -9.74266242980957, -9.210687637329102, -8.67871379852295, -8.14673900604248, -7.614764213562012, -7.082789897918701, -6.550815582275391, -6.018838882446289, -5.48686408996582, -4.95488977432251, -4.422915458679199, -3.8909406661987305, -3.358966112136841, -2.826991558074951, -2.2950170040130615, -1.7630424499511719, -1.2310678958892822, -0.6990933418273926, -0.16711878776550293, 0.3648557662963867, 0.8968303203582764, 1.428804874420166, 1.9607794284820557, 2.4927539825439453, 3.024728536605835, 3.5567030906677246, 4.088677406311035, 4.620652198791504, 5.152626991271973, 5.684601306915283, 6.216575622558594, 6.7485504150390625, 7.280525207519531, 7.812499523162842, 8.344473838806152, 8.876448631286621, 9.40842342376709, 9.940397262573242, 10.472372055053711, 11.00434684753418]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 9.0, 8.0, 13.0, 11.0, 22.0, 15.0, 22.0, 16.0, 14.0, 17.0, 34.0, 22.0, 40.0, 34.0, 44.0, 36.0, 44.0, 44.0, 35.0, 50.0, 36.0, 41.0, 40.0, 30.0, 31.0, 37.0, 38.0, 27.0, 32.0, 15.0, 22.0, 20.0, 22.0, 14.0, 13.0, 13.0, 11.0, 6.0, 5.0, 6.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.785093784332275, -6.556012153625488, -6.326930522918701, -6.097848892211914, -5.868766784667969, -5.639685153961182, -5.4106035232543945, -5.181521892547607, -4.95244026184082, -4.723358631134033, -4.494277000427246, -4.265194892883301, -4.036113262176514, -3.8070316314697266, -3.5779500007629395, -3.3488683700561523, -3.119786262512207, -2.89070463180542, -2.6616227626800537, -2.4325411319732666, -2.2034592628479004, -1.9743776321411133, -1.7452960014343262, -1.5162142515182495, -1.2871325016021729, -1.0580507516860962, -0.8289690613746643, -0.5998873710632324, -0.37080562114715576, -0.1417238712310791, 0.08735775947570801, 0.31643950939178467, 0.5455207824707031, 0.7746025323867798, 1.0036842823028564, 1.2327659130096436, 1.4618476629257202, 1.6909294128417969, 1.920011043548584, 2.149092674255371, 2.3781745433807373, 2.6072561740875244, 2.8363380432128906, 3.0654196739196777, 3.294501304626465, 3.523583173751831, 3.752664804458618, 3.9817466735839844, 4.2108283042907715, 4.439909934997559, 4.668991565704346, 4.898073196411133, 5.127155303955078, 5.356236934661865, 5.585318565368652, 5.8144001960754395, 6.043481826782227, 6.272563457489014, 6.501645088195801, 6.730727195739746, 6.959808826446533, 7.18889045715332, 7.417972087860107, 7.6470537185668945, 7.87613582611084]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 6.0, 5.0, 12.0, 15.0, 13.0, 31.0, 33.0, 60.0, 80.0, 163.0, 268.0, 578.0, 1142.0, 2805.0, 7529.0, 21849.0, 77187.0, 522381.0, 331079.0, 56029.0, 17122.0, 5877.0, 2245.0, 991.0, 459.0, 232.0, 125.0, 89.0, 50.0, 35.0, 23.0, 14.0, 9.0, 7.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.953125, -6.720458984375, -6.48779296875, -6.255126953125, -6.0224609375, -5.789794921875, -5.55712890625, -5.324462890625, -5.091796875, -4.859130859375, -4.62646484375, -4.393798828125, -4.1611328125, -3.928466796875, -3.69580078125, -3.463134765625, -3.23046875, -2.997802734375, -2.76513671875, -2.532470703125, -2.2998046875, -2.067138671875, -1.83447265625, -1.601806640625, -1.369140625, -1.136474609375, -0.90380859375, -0.671142578125, -0.4384765625, -0.205810546875, 0.02685546875, 0.259521484375, 0.4921875, 0.724853515625, 0.95751953125, 1.190185546875, 1.4228515625, 1.655517578125, 1.88818359375, 2.120849609375, 2.353515625, 2.586181640625, 2.81884765625, 3.051513671875, 3.2841796875, 3.516845703125, 3.74951171875, 3.982177734375, 4.21484375, 4.447509765625, 4.68017578125, 4.912841796875, 5.1455078125, 5.378173828125, 5.61083984375, 5.843505859375, 6.076171875, 6.308837890625, 6.54150390625, 6.774169921875, 7.0068359375, 7.239501953125, 7.47216796875, 7.704833984375, 7.9375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 2.0, 3.0, 6.0, 7.0, 12.0, 9.0, 9.0, 21.0, 18.0, 14.0, 24.0, 31.0, 28.0, 40.0, 41.0, 33.0, 45.0, 41.0, 39.0, 37.0, 49.0, 48.0, 39.0, 49.0, 40.0, 37.0, 51.0, 30.0, 30.0, 24.0, 31.0, 20.0, 17.0, 12.0, 12.0, 14.0, 9.0, 10.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1796875, -1.1433258056640625, -1.106964111328125, -1.0706024169921875, -1.03424072265625, -0.9978790283203125, -0.961517333984375, -0.9251556396484375, -0.8887939453125, -0.8524322509765625, -0.816070556640625, -0.7797088623046875, -0.74334716796875, -0.7069854736328125, -0.670623779296875, -0.6342620849609375, -0.597900390625, -0.5615386962890625, -0.525177001953125, -0.4888153076171875, -0.45245361328125, -0.4160919189453125, -0.379730224609375, -0.3433685302734375, -0.3070068359375, -0.2706451416015625, -0.234283447265625, -0.1979217529296875, -0.16156005859375, -0.1251983642578125, -0.088836669921875, -0.0524749755859375, -0.01611328125, 0.0202484130859375, 0.056610107421875, 0.0929718017578125, 0.12933349609375, 0.1656951904296875, 0.202056884765625, 0.2384185791015625, 0.2747802734375, 0.3111419677734375, 0.347503662109375, 0.3838653564453125, 0.42022705078125, 0.4565887451171875, 0.492950439453125, 0.5293121337890625, 0.565673828125, 0.6020355224609375, 0.638397216796875, 0.6747589111328125, 0.71112060546875, 0.7474822998046875, 0.783843994140625, 0.8202056884765625, 0.8565673828125, 0.8929290771484375, 0.929290771484375, 0.9656524658203125, 1.00201416015625, 1.0383758544921875, 1.074737548828125, 1.1110992431640625, 1.1474609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 12.0, 12.0, 9.0, 15.0, 20.0, 45.0, 52.0, 87.0, 163.0, 218.0, 383.0, 739.0, 1739.0, 4629.0, 15018.0, 57573.0, 639398.0, 272988.0, 38471.0, 10741.0, 3415.0, 1338.0, 639.0, 343.0, 184.0, 108.0, 66.0, 53.0, 31.0, 24.0, 11.0, 6.0, 4.0, 9.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3671875, -7.082275390625, -6.79736328125, -6.512451171875, -6.2275390625, -5.942626953125, -5.65771484375, -5.372802734375, -5.087890625, -4.802978515625, -4.51806640625, -4.233154296875, -3.9482421875, -3.663330078125, -3.37841796875, -3.093505859375, -2.80859375, -2.523681640625, -2.23876953125, -1.953857421875, -1.6689453125, -1.384033203125, -1.09912109375, -0.814208984375, -0.529296875, -0.244384765625, 0.04052734375, 0.325439453125, 0.6103515625, 0.895263671875, 1.18017578125, 1.465087890625, 1.75, 2.034912109375, 2.31982421875, 2.604736328125, 2.8896484375, 3.174560546875, 3.45947265625, 3.744384765625, 4.029296875, 4.314208984375, 4.59912109375, 4.884033203125, 5.1689453125, 5.453857421875, 5.73876953125, 6.023681640625, 6.30859375, 6.593505859375, 6.87841796875, 7.163330078125, 7.4482421875, 7.733154296875, 8.01806640625, 8.302978515625, 8.587890625, 8.872802734375, 9.15771484375, 9.442626953125, 9.7275390625, 10.012451171875, 10.29736328125, 10.582275390625, 10.8671875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 6.0, 12.0, 16.0, 14.0, 21.0, 34.0, 38.0, 37.0, 55.0, 57.0, 71.0, 72.0, 81.0, 71.0, 52.0, 62.0, 57.0, 47.0, 38.0, 38.0, 27.0, 20.0, 12.0, 5.0, 10.0, 10.0, 5.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.8828125, -6.6414794921875, -6.400146484375, -6.1588134765625, -5.91748046875, -5.6761474609375, -5.434814453125, -5.1934814453125, -4.9521484375, -4.7108154296875, -4.469482421875, -4.2281494140625, -3.98681640625, -3.7454833984375, -3.504150390625, -3.2628173828125, -3.021484375, -2.7801513671875, -2.538818359375, -2.2974853515625, -2.05615234375, -1.8148193359375, -1.573486328125, -1.3321533203125, -1.0908203125, -0.8494873046875, -0.608154296875, -0.3668212890625, -0.12548828125, 0.1158447265625, 0.357177734375, 0.5985107421875, 0.83984375, 1.0811767578125, 1.322509765625, 1.5638427734375, 1.80517578125, 2.0465087890625, 2.287841796875, 2.5291748046875, 2.7705078125, 3.0118408203125, 3.253173828125, 3.4945068359375, 3.73583984375, 3.9771728515625, 4.218505859375, 4.4598388671875, 4.701171875, 4.9425048828125, 5.183837890625, 5.4251708984375, 5.66650390625, 5.9078369140625, 6.149169921875, 6.3905029296875, 6.6318359375, 6.8731689453125, 7.114501953125, 7.3558349609375, 7.59716796875, 7.8385009765625, 8.079833984375, 8.3211669921875, 8.5625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 13.0, 17.0, 32.0, 53.0, 78.0, 154.0, 254.0, 489.0, 947.0, 2026.0, 4805.0, 12329.0, 32944.0, 118666.0, 637778.0, 172125.0, 40798.0, 14614.0, 5680.0, 2461.0, 1050.0, 526.0, 287.0, 160.0, 106.0, 62.0, 34.0, 23.0, 15.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.65625, -2.55999755859375, -2.4637451171875, -2.36749267578125, -2.271240234375, -2.17498779296875, -2.0787353515625, -1.98248291015625, -1.88623046875, -1.78997802734375, -1.6937255859375, -1.59747314453125, -1.501220703125, -1.40496826171875, -1.3087158203125, -1.21246337890625, -1.1162109375, -1.01995849609375, -0.9237060546875, -0.82745361328125, -0.731201171875, -0.63494873046875, -0.5386962890625, -0.44244384765625, -0.34619140625, -0.24993896484375, -0.1536865234375, -0.05743408203125, 0.038818359375, 0.13507080078125, 0.2313232421875, 0.32757568359375, 0.423828125, 0.52008056640625, 0.6163330078125, 0.71258544921875, 0.808837890625, 0.90509033203125, 1.0013427734375, 1.09759521484375, 1.19384765625, 1.29010009765625, 1.3863525390625, 1.48260498046875, 1.578857421875, 1.67510986328125, 1.7713623046875, 1.86761474609375, 1.9638671875, 2.06011962890625, 2.1563720703125, 2.25262451171875, 2.348876953125, 2.44512939453125, 2.5413818359375, 2.63763427734375, 2.73388671875, 2.83013916015625, 2.9263916015625, 3.02264404296875, 3.118896484375, 3.21514892578125, 3.3114013671875, 3.40765380859375, 3.50390625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 8.0, 15.0, 9.0, 16.0, 22.0, 28.0, 80.0, 300.0, 305.0, 85.0, 38.0, 14.0, 15.0, 12.0, 9.0, 7.0, 5.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00139617919921875, -0.0013573914766311646, -0.001318603754043579, -0.0012798160314559937, -0.0012410283088684082, -0.0012022405862808228, -0.0011634528636932373, -0.0011246651411056519, -0.0010858774185180664, -0.001047089695930481, -0.0010083019733428955, -0.0009695142507553101, -0.0009307265281677246, -0.0008919388055801392, -0.0008531510829925537, -0.0008143633604049683, -0.0007755756378173828, -0.0007367879152297974, -0.0006980001926422119, -0.0006592124700546265, -0.000620424747467041, -0.0005816370248794556, -0.0005428493022918701, -0.0005040615797042847, -0.0004652738571166992, -0.00042648613452911377, -0.0003876984119415283, -0.00034891068935394287, -0.0003101229667663574, -0.00027133524417877197, -0.00023254752159118652, -0.00019375979900360107, -0.00015497207641601562, -0.00011618435382843018, -7.739663124084473e-05, -3.860890865325928e-05, 1.7881393432617188e-07, 3.896653652191162e-05, 7.775425910949707e-05, 0.00011654198169708252, 0.00015532970428466797, 0.00019411742687225342, 0.00023290514945983887, 0.0002716928720474243, 0.00031048059463500977, 0.0003492683172225952, 0.00038805603981018066, 0.0004268437623977661, 0.00046563148498535156, 0.000504419207572937, 0.0005432069301605225, 0.0005819946527481079, 0.0006207823753356934, 0.0006595700979232788, 0.0006983578205108643, 0.0007371455430984497, 0.0007759332656860352, 0.0008147209882736206, 0.0008535087108612061, 0.0008922964334487915, 0.000931084156036377, 0.0009698718786239624, 0.0010086596012115479, 0.0010474473237991333, 0.0010862350463867188]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 3.0, 6.0, 6.0, 4.0, 8.0, 13.0, 13.0, 20.0, 29.0, 38.0, 62.0, 90.0, 133.0, 219.0, 375.0, 665.0, 1278.0, 2572.0, 5755.0, 13693.0, 34474.0, 120705.0, 628399.0, 169885.0, 41326.0, 15890.0, 6668.0, 2891.0, 1444.0, 777.0, 413.0, 253.0, 144.0, 100.0, 76.0, 42.0, 26.0, 21.0, 8.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.154296875, -2.073272705078125, -1.99224853515625, -1.911224365234375, -1.8302001953125, -1.749176025390625, -1.66815185546875, -1.587127685546875, -1.506103515625, -1.425079345703125, -1.34405517578125, -1.263031005859375, -1.1820068359375, -1.100982666015625, -1.01995849609375, -0.938934326171875, -0.85791015625, -0.776885986328125, -0.69586181640625, -0.614837646484375, -0.5338134765625, -0.452789306640625, -0.37176513671875, -0.290740966796875, -0.209716796875, -0.128692626953125, -0.04766845703125, 0.033355712890625, 0.1143798828125, 0.195404052734375, 0.27642822265625, 0.357452392578125, 0.4384765625, 0.519500732421875, 0.60052490234375, 0.681549072265625, 0.7625732421875, 0.843597412109375, 0.92462158203125, 1.005645751953125, 1.086669921875, 1.167694091796875, 1.24871826171875, 1.329742431640625, 1.4107666015625, 1.491790771484375, 1.57281494140625, 1.653839111328125, 1.73486328125, 1.815887451171875, 1.89691162109375, 1.977935791015625, 2.0589599609375, 2.139984130859375, 2.22100830078125, 2.302032470703125, 2.383056640625, 2.464080810546875, 2.54510498046875, 2.626129150390625, 2.7071533203125, 2.788177490234375, 2.86920166015625, 2.950225830078125, 3.03125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 3.0, 5.0, 4.0, 3.0, 7.0, 1.0, 7.0, 7.0, 9.0, 11.0, 14.0, 11.0, 20.0, 20.0, 37.0, 49.0, 86.0, 114.0, 130.0, 119.0, 96.0, 67.0, 38.0, 23.0, 16.0, 17.0, 16.0, 17.0, 10.0, 4.0, 9.0, 4.0, 7.0, 3.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9208984375, -1.8563385009765625, -1.791778564453125, -1.7272186279296875, -1.66265869140625, -1.5980987548828125, -1.533538818359375, -1.4689788818359375, -1.4044189453125, -1.3398590087890625, -1.275299072265625, -1.2107391357421875, -1.14617919921875, -1.0816192626953125, -1.017059326171875, -0.9524993896484375, -0.887939453125, -0.8233795166015625, -0.758819580078125, -0.6942596435546875, -0.62969970703125, -0.5651397705078125, -0.500579833984375, -0.4360198974609375, -0.3714599609375, -0.3069000244140625, -0.242340087890625, -0.1777801513671875, -0.11322021484375, -0.0486602783203125, 0.015899658203125, 0.0804595947265625, 0.14501953125, 0.2095794677734375, 0.274139404296875, 0.3386993408203125, 0.40325927734375, 0.4678192138671875, 0.532379150390625, 0.5969390869140625, 0.6614990234375, 0.7260589599609375, 0.790618896484375, 0.8551788330078125, 0.91973876953125, 0.9842987060546875, 1.048858642578125, 1.1134185791015625, 1.177978515625, 1.2425384521484375, 1.307098388671875, 1.3716583251953125, 1.43621826171875, 1.5007781982421875, 1.565338134765625, 1.6298980712890625, 1.6944580078125, 1.7590179443359375, 1.823577880859375, 1.8881378173828125, 1.95269775390625, 2.0172576904296875, 2.081817626953125, 2.1463775634765625, 2.2109375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 10.0, 21.0, 29.0, 40.0, 63.0, 88.0, 130.0, 137.0, 104.0, 107.0, 83.0, 72.0, 47.0, 24.0, 17.0, 8.0, 10.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.31786346435547, -27.983177185058594, -26.64849090576172, -25.313804626464844, -23.9791202545166, -22.644433975219727, -21.30974769592285, -19.97506332397461, -18.640377044677734, -17.30569076538086, -15.9710054397583, -14.636319160461426, -13.301633834838867, -11.966947555541992, -10.632261276245117, -9.297575950622559, -7.962888717651367, -6.62820291519165, -5.293517112731934, -3.9588308334350586, -2.624145030975342, -1.289459228515625, 0.04522705078125, 1.3799123764038086, 2.7145986557006836, 4.0492844581604, 5.383970260620117, 6.718656539916992, 8.053342819213867, 9.388028144836426, 10.7227144241333, 12.05739974975586, 13.392086029052734, 14.72677230834961, 16.061458587646484, 17.39614486694336, 18.7308292388916, 20.065515518188477, 21.40020179748535, 22.734886169433594, 24.06957244873047, 25.404258728027344, 26.73894500732422, 28.073631286621094, 29.408315658569336, 30.74300193786621, 32.07769012451172, 33.41237258911133, 34.74706268310547, 36.081748962402344, 37.41643524169922, 38.751121520996094, 40.08580780029297, 41.420494079589844, 42.75518035888672, 44.08986282348633, 45.4245491027832, 46.75923538208008, 48.09392166137695, 49.42860794067383, 50.7632942199707, 52.09797668457031, 53.43266296386719, 54.76734924316406, 56.10203552246094]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 10.0, 6.0, 9.0, 10.0, 9.0, 7.0, 17.0, 19.0, 15.0, 25.0, 26.0, 27.0, 22.0, 24.0, 28.0, 33.0, 35.0, 40.0, 42.0, 41.0, 41.0, 50.0, 30.0, 45.0, 32.0, 41.0, 48.0, 28.0, 30.0, 29.0, 23.0, 18.0, 23.0, 21.0, 14.0, 18.0, 10.0, 9.0, 7.0, 4.0, 5.0, 4.0, 7.0, 10.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.662212371826172, -20.99093246459961, -20.319652557373047, -19.648372650146484, -18.977092742919922, -18.30581283569336, -17.634532928466797, -16.963253021240234, -16.291973114013672, -15.62069320678711, -14.949413299560547, -14.278133392333984, -13.606853485107422, -12.93557357788086, -12.264294624328613, -11.59301471710205, -10.921735763549805, -10.250455856323242, -9.57917594909668, -8.907896041870117, -8.236616134643555, -7.56533670425415, -6.894057273864746, -6.222777366638184, -5.551497459411621, -4.880217552185059, -4.208937644958496, -3.537658214569092, -2.8663783073425293, -2.195098400115967, -1.5238189697265625, -0.8525390625, -0.1812591552734375, 0.49002063274383545, 1.1613004207611084, 1.8325800895690918, 2.5038599967956543, 3.175139904022217, 3.846419334411621, 4.517699241638184, 5.188979148864746, 5.860259056091309, 6.531538963317871, 7.202818393707275, 7.874098300933838, 8.545377731323242, 9.216657638549805, 9.887937545776367, 10.55921745300293, 11.230497360229492, 11.901777267456055, 12.573057174682617, 13.24433708190918, 13.915616989135742, 14.586895942687988, 15.25817584991455, 15.929455757141113, 16.60073471069336, 17.272014617919922, 17.943294525146484, 18.614574432373047, 19.28585433959961, 19.957134246826172, 20.628414154052734, 21.299694061279297]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 4.0, 6.0, 11.0, 14.0, 25.0, 33.0, 32.0, 53.0, 117.0, 168.0, 288.0, 498.0, 852.0, 1595.0, 2881.0, 6498.0, 15591.0, 50177.0, 434826.0, 3531982.0, 105058.0, 25262.0, 9501.0, 4259.0, 1994.0, 1085.0, 558.0, 349.0, 202.0, 129.0, 81.0, 43.0, 33.0, 15.0, 15.0, 18.0, 11.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.26171875, -6.99493408203125, -6.7281494140625, -6.46136474609375, -6.194580078125, -5.92779541015625, -5.6610107421875, -5.39422607421875, -5.12744140625, -4.86065673828125, -4.5938720703125, -4.32708740234375, -4.060302734375, -3.79351806640625, -3.5267333984375, -3.25994873046875, -2.9931640625, -2.72637939453125, -2.4595947265625, -2.19281005859375, -1.926025390625, -1.65924072265625, -1.3924560546875, -1.12567138671875, -0.85888671875, -0.59210205078125, -0.3253173828125, -0.05853271484375, 0.208251953125, 0.47503662109375, 0.7418212890625, 1.00860595703125, 1.275390625, 1.54217529296875, 1.8089599609375, 2.07574462890625, 2.342529296875, 2.60931396484375, 2.8760986328125, 3.14288330078125, 3.40966796875, 3.67645263671875, 3.9432373046875, 4.21002197265625, 4.476806640625, 4.74359130859375, 5.0103759765625, 5.27716064453125, 5.5439453125, 5.81072998046875, 6.0775146484375, 6.34429931640625, 6.611083984375, 6.87786865234375, 7.1446533203125, 7.41143798828125, 7.67822265625, 7.94500732421875, 8.2117919921875, 8.47857666015625, 8.745361328125, 9.01214599609375, 9.2789306640625, 9.54571533203125, 9.8125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 4.0, 0.0, 4.0, 8.0, 8.0, 5.0, 13.0, 9.0, 11.0, 20.0, 13.0, 22.0, 24.0, 28.0, 24.0, 29.0, 30.0, 29.0, 36.0, 37.0, 45.0, 40.0, 37.0, 46.0, 36.0, 24.0, 40.0, 47.0, 45.0, 46.0, 34.0, 26.0, 14.0, 19.0, 29.0, 20.0, 20.0, 15.0, 13.0, 10.0, 7.0, 9.0, 8.0, 5.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.072265625, -1.0380859375, -1.00390625, -0.9697265625, -0.935546875, -0.9013671875, -0.8671875, -0.8330078125, -0.798828125, -0.7646484375, -0.73046875, -0.6962890625, -0.662109375, -0.6279296875, -0.59375, -0.5595703125, -0.525390625, -0.4912109375, -0.45703125, -0.4228515625, -0.388671875, -0.3544921875, -0.3203125, -0.2861328125, -0.251953125, -0.2177734375, -0.18359375, -0.1494140625, -0.115234375, -0.0810546875, -0.046875, -0.0126953125, 0.021484375, 0.0556640625, 0.08984375, 0.1240234375, 0.158203125, 0.1923828125, 0.2265625, 0.2607421875, 0.294921875, 0.3291015625, 0.36328125, 0.3974609375, 0.431640625, 0.4658203125, 0.5, 0.5341796875, 0.568359375, 0.6025390625, 0.63671875, 0.6708984375, 0.705078125, 0.7392578125, 0.7734375, 0.8076171875, 0.841796875, 0.8759765625, 0.91015625, 0.9443359375, 0.978515625, 1.0126953125, 1.046875, 1.0810546875, 1.115234375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 4.0, 7.0, 11.0, 16.0, 23.0, 31.0, 42.0, 60.0, 103.0, 123.0, 190.0, 282.0, 423.0, 747.0, 1092.0, 1804.0, 3010.0, 4952.0, 9298.0, 17681.0, 39534.0, 114630.0, 652570.0, 3020372.0, 213342.0, 60778.0, 24735.0, 12120.0, 6481.0, 3627.0, 2204.0, 1391.0, 912.0, 550.0, 364.0, 242.0, 149.0, 115.0, 80.0, 54.0, 40.0, 28.0, 31.0, 9.0, 7.0, 7.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.78515625, -5.61102294921875, -5.4368896484375, -5.26275634765625, -5.088623046875, -4.91448974609375, -4.7403564453125, -4.56622314453125, -4.39208984375, -4.21795654296875, -4.0438232421875, -3.86968994140625, -3.695556640625, -3.52142333984375, -3.3472900390625, -3.17315673828125, -2.9990234375, -2.82489013671875, -2.6507568359375, -2.47662353515625, -2.302490234375, -2.12835693359375, -1.9542236328125, -1.78009033203125, -1.60595703125, -1.43182373046875, -1.2576904296875, -1.08355712890625, -0.909423828125, -0.73529052734375, -0.5611572265625, -0.38702392578125, -0.212890625, -0.03875732421875, 0.1353759765625, 0.30950927734375, 0.483642578125, 0.65777587890625, 0.8319091796875, 1.00604248046875, 1.18017578125, 1.35430908203125, 1.5284423828125, 1.70257568359375, 1.876708984375, 2.05084228515625, 2.2249755859375, 2.39910888671875, 2.5732421875, 2.74737548828125, 2.9215087890625, 3.09564208984375, 3.269775390625, 3.44390869140625, 3.6180419921875, 3.79217529296875, 3.96630859375, 4.14044189453125, 4.3145751953125, 4.48870849609375, 4.662841796875, 4.83697509765625, 5.0111083984375, 5.18524169921875, 5.359375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 7.0, 12.0, 4.0, 13.0, 14.0, 23.0, 18.0, 26.0, 48.0, 92.0, 102.0, 177.0, 416.0, 1939.0, 552.0, 236.0, 100.0, 92.0, 48.0, 40.0, 25.0, 24.0, 15.0, 8.0, 8.0, 6.0, 5.0, 1.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.310546875, -3.2176513671875, -3.124755859375, -3.0318603515625, -2.93896484375, -2.8460693359375, -2.753173828125, -2.6602783203125, -2.5673828125, -2.4744873046875, -2.381591796875, -2.2886962890625, -2.19580078125, -2.1029052734375, -2.010009765625, -1.9171142578125, -1.82421875, -1.7313232421875, -1.638427734375, -1.5455322265625, -1.45263671875, -1.3597412109375, -1.266845703125, -1.1739501953125, -1.0810546875, -0.9881591796875, -0.895263671875, -0.8023681640625, -0.70947265625, -0.6165771484375, -0.523681640625, -0.4307861328125, -0.337890625, -0.2449951171875, -0.152099609375, -0.0592041015625, 0.03369140625, 0.1265869140625, 0.219482421875, 0.3123779296875, 0.4052734375, 0.4981689453125, 0.591064453125, 0.6839599609375, 0.77685546875, 0.8697509765625, 0.962646484375, 1.0555419921875, 1.1484375, 1.2413330078125, 1.334228515625, 1.4271240234375, 1.52001953125, 1.6129150390625, 1.705810546875, 1.7987060546875, 1.8916015625, 1.9844970703125, 2.077392578125, 2.1702880859375, 2.26318359375, 2.3560791015625, 2.448974609375, 2.5418701171875, 2.634765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 9.0, 24.0, 80.0, 175.0, 231.0, 234.0, 134.0, 78.0, 26.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.13190841674805, -40.93213653564453, -39.732364654541016, -38.5325927734375, -37.33282470703125, -36.133052825927734, -34.93328094482422, -33.7335090637207, -32.53373718261719, -31.333965301513672, -30.134193420410156, -28.934423446655273, -27.734651565551758, -26.534879684448242, -25.33510971069336, -24.135337829589844, -22.935565948486328, -21.735794067382812, -20.536022186279297, -19.336252212524414, -18.1364803314209, -16.936708450317383, -15.736937522888184, -14.537166595458984, -13.337394714355469, -12.137622833251953, -10.937851905822754, -9.738080978393555, -8.538309097290039, -7.338537693023682, -6.138766288757324, -4.938995361328125, -3.739227294921875, -2.5394558906555176, -1.3396844863891602, -0.13991308212280273, 1.0598583221435547, 2.259629726409912, 3.4594011306762695, 4.659172058105469, 5.858943939208984, 7.058715343475342, 8.2584867477417, 9.458257675170898, 10.658029556274414, 11.85780143737793, 13.057572364807129, 14.257343292236328, 15.457115173339844, 16.65688705444336, 17.856658935546875, 19.056428909301758, 20.256200790405273, 21.45597267150879, 22.655742645263672, 23.855514526367188, 25.055286407470703, 26.25505828857422, 27.454830169677734, 28.654600143432617, 29.854372024536133, 31.05414390563965, 32.25391387939453, 33.45368576049805, 34.65345764160156]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 8.0, 8.0, 9.0, 11.0, 4.0, 5.0, 14.0, 13.0, 17.0, 17.0, 17.0, 26.0, 14.0, 35.0, 41.0, 30.0, 37.0, 39.0, 45.0, 32.0, 45.0, 52.0, 41.0, 40.0, 37.0, 30.0, 41.0, 39.0, 28.0, 35.0, 31.0, 24.0, 20.0, 19.0, 19.0, 13.0, 15.0, 5.0, 10.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.676658630371094, -8.408642768859863, -8.140626907348633, -7.8726115226745605, -7.60459566116333, -7.336580276489258, -7.068564414978027, -6.800548553466797, -6.532532691955566, -6.264516830444336, -5.996501445770264, -5.728485584259033, -5.460469722747803, -5.1924543380737305, -4.9244384765625, -4.6564226150512695, -4.388407230377197, -4.120391368865967, -3.8523757457733154, -3.584360122680664, -3.3163442611694336, -3.0483286380767822, -2.780313014984131, -2.5122971534729004, -2.244281530380249, -1.976265788078308, -1.7082500457763672, -1.4402344226837158, -1.172218680381775, -0.904202938079834, -0.6361873149871826, -0.3681715726852417, -0.10015583038330078, 0.16785988211631775, 0.4358755946159363, 0.7038912773132324, 0.9719070196151733, 1.2399227619171143, 1.5079383850097656, 1.7759541273117065, 2.0439698696136475, 2.311985492706299, 2.5800013542175293, 2.8480169773101807, 3.116032600402832, 3.3840484619140625, 3.652064085006714, 3.9200797080993652, 4.188095569610596, 4.456111431121826, 4.724126815795898, 4.992142677307129, 5.260158538818359, 5.52817440032959, 5.796189785003662, 6.064205646514893, 6.332221031188965, 6.600236892700195, 6.868252277374268, 7.136268138885498, 7.4042840003967285, 7.672299385070801, 7.940315246582031, 8.208331108093262, 8.476346969604492]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 9.0, 18.0, 26.0, 31.0, 46.0, 80.0, 134.0, 199.0, 372.0, 479.0, 832.0, 1455.0, 2613.0, 4855.0, 9218.0, 18235.0, 35782.0, 70284.0, 133846.0, 285949.0, 244190.0, 115261.0, 60370.0, 30886.0, 15534.0, 8028.0, 4184.0, 2323.0, 1314.0, 765.0, 439.0, 280.0, 184.0, 105.0, 61.0, 43.0, 37.0, 21.0, 21.0, 8.0, 7.0, 7.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.777435302734375, -3.64666748046875, -3.515899658203125, -3.3851318359375, -3.254364013671875, -3.12359619140625, -2.992828369140625, -2.862060546875, -2.731292724609375, -2.60052490234375, -2.469757080078125, -2.3389892578125, -2.208221435546875, -2.07745361328125, -1.946685791015625, -1.81591796875, -1.685150146484375, -1.55438232421875, -1.423614501953125, -1.2928466796875, -1.162078857421875, -1.03131103515625, -0.900543212890625, -0.769775390625, -0.639007568359375, -0.50823974609375, -0.377471923828125, -0.2467041015625, -0.115936279296875, 0.01483154296875, 0.145599365234375, 0.2763671875, 0.407135009765625, 0.53790283203125, 0.668670654296875, 0.7994384765625, 0.930206298828125, 1.06097412109375, 1.191741943359375, 1.322509765625, 1.453277587890625, 1.58404541015625, 1.714813232421875, 1.8455810546875, 1.976348876953125, 2.10711669921875, 2.237884521484375, 2.36865234375, 2.499420166015625, 2.63018798828125, 2.760955810546875, 2.8917236328125, 3.022491455078125, 3.15325927734375, 3.284027099609375, 3.414794921875, 3.545562744140625, 3.67633056640625, 3.807098388671875, 3.9378662109375, 4.068634033203125, 4.19940185546875, 4.330169677734375, 4.4609375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 3.0, 9.0, 8.0, 8.0, 17.0, 20.0, 14.0, 15.0, 17.0, 27.0, 22.0, 33.0, 33.0, 30.0, 34.0, 39.0, 45.0, 29.0, 49.0, 41.0, 41.0, 37.0, 44.0, 41.0, 41.0, 36.0, 27.0, 26.0, 19.0, 22.0, 25.0, 22.0, 20.0, 9.0, 16.0, 16.0, 10.0, 4.0, 12.0, 5.0, 7.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-1.2607421875, -1.2244415283203125, -1.188140869140625, -1.1518402099609375, -1.11553955078125, -1.0792388916015625, -1.042938232421875, -1.0066375732421875, -0.9703369140625, -0.9340362548828125, -0.897735595703125, -0.8614349365234375, -0.82513427734375, -0.7888336181640625, -0.752532958984375, -0.7162322998046875, -0.679931640625, -0.6436309814453125, -0.607330322265625, -0.5710296630859375, -0.53472900390625, -0.4984283447265625, -0.462127685546875, -0.4258270263671875, -0.3895263671875, -0.3532257080078125, -0.316925048828125, -0.2806243896484375, -0.24432373046875, -0.2080230712890625, -0.171722412109375, -0.1354217529296875, -0.09912109375, -0.0628204345703125, -0.026519775390625, 0.0097808837890625, 0.04608154296875, 0.0823822021484375, 0.118682861328125, 0.1549835205078125, 0.1912841796875, 0.2275848388671875, 0.263885498046875, 0.3001861572265625, 0.33648681640625, 0.3727874755859375, 0.409088134765625, 0.4453887939453125, 0.481689453125, 0.5179901123046875, 0.554290771484375, 0.5905914306640625, 0.62689208984375, 0.6631927490234375, 0.699493408203125, 0.7357940673828125, 0.7720947265625, 0.8083953857421875, 0.844696044921875, 0.8809967041015625, 0.91729736328125, 0.9535980224609375, 0.989898681640625, 1.0261993408203125, 1.0625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 7.0, 11.0, 15.0, 28.0, 29.0, 44.0, 48.0, 96.0, 103.0, 138.0, 191.0, 229.0, 428.0, 675.0, 1281.0, 3487.0, 20995.0, 182026.0, 710484.0, 109486.0, 13183.0, 2642.0, 1089.0, 614.0, 356.0, 257.0, 169.0, 127.0, 80.0, 68.0, 46.0, 34.0, 25.0, 20.0, 17.0, 11.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.015625, -12.6370849609375, -12.258544921875, -11.8800048828125, -11.50146484375, -11.1229248046875, -10.744384765625, -10.3658447265625, -9.9873046875, -9.6087646484375, -9.230224609375, -8.8516845703125, -8.47314453125, -8.0946044921875, -7.716064453125, -7.3375244140625, -6.958984375, -6.5804443359375, -6.201904296875, -5.8233642578125, -5.44482421875, -5.0662841796875, -4.687744140625, -4.3092041015625, -3.9306640625, -3.5521240234375, -3.173583984375, -2.7950439453125, -2.41650390625, -2.0379638671875, -1.659423828125, -1.2808837890625, -0.90234375, -0.5238037109375, -0.145263671875, 0.2332763671875, 0.61181640625, 0.9903564453125, 1.368896484375, 1.7474365234375, 2.1259765625, 2.5045166015625, 2.883056640625, 3.2615966796875, 3.64013671875, 4.0186767578125, 4.397216796875, 4.7757568359375, 5.154296875, 5.5328369140625, 5.911376953125, 6.2899169921875, 6.66845703125, 7.0469970703125, 7.425537109375, 7.8040771484375, 8.1826171875, 8.5611572265625, 8.939697265625, 9.3182373046875, 9.69677734375, 10.0753173828125, 10.453857421875, 10.8323974609375, 11.2109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 4.0, 10.0, 8.0, 10.0, 17.0, 32.0, 26.0, 19.0, 28.0, 49.0, 41.0, 53.0, 51.0, 44.0, 56.0, 53.0, 64.0, 66.0, 42.0, 48.0, 40.0, 38.0, 40.0, 32.0, 27.0, 12.0, 22.0, 13.0, 9.0, 11.0, 7.0, 9.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.8125, -8.5684814453125, -8.324462890625, -8.0804443359375, -7.83642578125, -7.5924072265625, -7.348388671875, -7.1043701171875, -6.8603515625, -6.6163330078125, -6.372314453125, -6.1282958984375, -5.88427734375, -5.6402587890625, -5.396240234375, -5.1522216796875, -4.908203125, -4.6641845703125, -4.420166015625, -4.1761474609375, -3.93212890625, -3.6881103515625, -3.444091796875, -3.2000732421875, -2.9560546875, -2.7120361328125, -2.468017578125, -2.2239990234375, -1.97998046875, -1.7359619140625, -1.491943359375, -1.2479248046875, -1.00390625, -0.7598876953125, -0.515869140625, -0.2718505859375, -0.02783203125, 0.2161865234375, 0.460205078125, 0.7042236328125, 0.9482421875, 1.1922607421875, 1.436279296875, 1.6802978515625, 1.92431640625, 2.1683349609375, 2.412353515625, 2.6563720703125, 2.900390625, 3.1444091796875, 3.388427734375, 3.6324462890625, 3.87646484375, 4.1204833984375, 4.364501953125, 4.6085205078125, 4.8525390625, 5.0965576171875, 5.340576171875, 5.5845947265625, 5.82861328125, 6.0726318359375, 6.316650390625, 6.5606689453125, 6.8046875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 14.0, 23.0, 23.0, 36.0, 52.0, 80.0, 157.0, 295.0, 486.0, 949.0, 1997.0, 4605.0, 12729.0, 42528.0, 167582.0, 586392.0, 167157.0, 42381.0, 12431.0, 4519.0, 1934.0, 987.0, 498.0, 247.0, 148.0, 100.0, 69.0, 34.0, 30.0, 19.0, 14.0, 7.0, 10.0, 3.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7578125, -3.62115478515625, -3.4844970703125, -3.34783935546875, -3.211181640625, -3.07452392578125, -2.9378662109375, -2.80120849609375, -2.66455078125, -2.52789306640625, -2.3912353515625, -2.25457763671875, -2.117919921875, -1.98126220703125, -1.8446044921875, -1.70794677734375, -1.5712890625, -1.43463134765625, -1.2979736328125, -1.16131591796875, -1.024658203125, -0.88800048828125, -0.7513427734375, -0.61468505859375, -0.47802734375, -0.34136962890625, -0.2047119140625, -0.06805419921875, 0.068603515625, 0.20526123046875, 0.3419189453125, 0.47857666015625, 0.615234375, 0.75189208984375, 0.8885498046875, 1.02520751953125, 1.161865234375, 1.29852294921875, 1.4351806640625, 1.57183837890625, 1.70849609375, 1.84515380859375, 1.9818115234375, 2.11846923828125, 2.255126953125, 2.39178466796875, 2.5284423828125, 2.66510009765625, 2.8017578125, 2.93841552734375, 3.0750732421875, 3.21173095703125, 3.348388671875, 3.48504638671875, 3.6217041015625, 3.75836181640625, 3.89501953125, 4.03167724609375, 4.1683349609375, 4.30499267578125, 4.441650390625, 4.57830810546875, 4.7149658203125, 4.85162353515625, 4.98828125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 7.0, 6.0, 8.0, 6.0, 11.0, 15.0, 21.0, 22.0, 30.0, 36.0, 53.0, 63.0, 72.0, 111.0, 156.0, 92.0, 64.0, 35.0, 41.0, 27.0, 22.0, 18.0, 20.0, 17.0, 9.0, 11.0, 3.0, 4.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008721351623535156, -0.000845007598400116, -0.0008178800344467163, -0.0007907524704933167, -0.000763624906539917, -0.0007364973425865173, -0.0007093697786331177, -0.000682242214679718, -0.0006551146507263184, -0.0006279870867729187, -0.000600859522819519, -0.0005737319588661194, -0.0005466043949127197, -0.0005194768309593201, -0.0004923492670059204, -0.00046522170305252075, -0.0004380941390991211, -0.00041096657514572144, -0.0003838390111923218, -0.0003567114472389221, -0.00032958388328552246, -0.0003024563193321228, -0.00027532875537872314, -0.0002482011914253235, -0.00022107362747192383, -0.00019394606351852417, -0.0001668184995651245, -0.00013969093561172485, -0.0001125633716583252, -8.543580770492554e-05, -5.830824375152588e-05, -3.118067979812622e-05, -4.0531158447265625e-06, 2.3074448108673096e-05, 5.0202012062072754e-05, 7.732957601547241e-05, 0.00010445713996887207, 0.00013158470392227173, 0.0001587122678756714, 0.00018583983182907104, 0.0002129673957824707, 0.00024009495973587036, 0.00026722252368927, 0.0002943500876426697, 0.00032147765159606934, 0.000348605215549469, 0.00037573277950286865, 0.0004028603434562683, 0.00042998790740966797, 0.0004571154713630676, 0.0004842430353164673, 0.0005113705992698669, 0.0005384981632232666, 0.0005656257271766663, 0.0005927532911300659, 0.0006198808550834656, 0.0006470084190368652, 0.0006741359829902649, 0.0007012635469436646, 0.0007283911108970642, 0.0007555186748504639, 0.0007826462388038635, 0.0008097738027572632, 0.0008369013667106628, 0.0008640289306640625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 7.0, 8.0, 16.0, 22.0, 31.0, 28.0, 42.0, 86.0, 128.0, 176.0, 367.0, 619.0, 1448.0, 4216.0, 19116.0, 168016.0, 736146.0, 99616.0, 12863.0, 3091.0, 1161.0, 541.0, 283.0, 160.0, 111.0, 71.0, 44.0, 31.0, 36.0, 16.0, 9.0, 10.0, 6.0, 6.0, 4.0, 6.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.3125, -6.09771728515625, -5.8829345703125, -5.66815185546875, -5.453369140625, -5.23858642578125, -5.0238037109375, -4.80902099609375, -4.59423828125, -4.37945556640625, -4.1646728515625, -3.94989013671875, -3.735107421875, -3.52032470703125, -3.3055419921875, -3.09075927734375, -2.8759765625, -2.66119384765625, -2.4464111328125, -2.23162841796875, -2.016845703125, -1.80206298828125, -1.5872802734375, -1.37249755859375, -1.15771484375, -0.94293212890625, -0.7281494140625, -0.51336669921875, -0.298583984375, -0.08380126953125, 0.1309814453125, 0.34576416015625, 0.560546875, 0.77532958984375, 0.9901123046875, 1.20489501953125, 1.419677734375, 1.63446044921875, 1.8492431640625, 2.06402587890625, 2.27880859375, 2.49359130859375, 2.7083740234375, 2.92315673828125, 3.137939453125, 3.35272216796875, 3.5675048828125, 3.78228759765625, 3.9970703125, 4.21185302734375, 4.4266357421875, 4.64141845703125, 4.856201171875, 5.07098388671875, 5.2857666015625, 5.50054931640625, 5.71533203125, 5.93011474609375, 6.1448974609375, 6.35968017578125, 6.574462890625, 6.78924560546875, 7.0040283203125, 7.21881103515625, 7.43359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 7.0, 7.0, 12.0, 11.0, 18.0, 23.0, 26.0, 40.0, 41.0, 57.0, 88.0, 107.0, 158.0, 97.0, 72.0, 54.0, 39.0, 38.0, 29.0, 17.0, 21.0, 6.0, 8.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40234375, -5.24957275390625, -5.0968017578125, -4.94403076171875, -4.791259765625, -4.63848876953125, -4.4857177734375, -4.33294677734375, -4.18017578125, -4.02740478515625, -3.8746337890625, -3.72186279296875, -3.569091796875, -3.41632080078125, -3.2635498046875, -3.11077880859375, -2.9580078125, -2.80523681640625, -2.6524658203125, -2.49969482421875, -2.346923828125, -2.19415283203125, -2.0413818359375, -1.88861083984375, -1.73583984375, -1.58306884765625, -1.4302978515625, -1.27752685546875, -1.124755859375, -0.97198486328125, -0.8192138671875, -0.66644287109375, -0.513671875, -0.36090087890625, -0.2081298828125, -0.05535888671875, 0.097412109375, 0.25018310546875, 0.4029541015625, 0.55572509765625, 0.70849609375, 0.86126708984375, 1.0140380859375, 1.16680908203125, 1.319580078125, 1.47235107421875, 1.6251220703125, 1.77789306640625, 1.9306640625, 2.08343505859375, 2.2362060546875, 2.38897705078125, 2.541748046875, 2.69451904296875, 2.8472900390625, 3.00006103515625, 3.15283203125, 3.30560302734375, 3.4583740234375, 3.61114501953125, 3.763916015625, 3.91668701171875, 4.0694580078125, 4.22222900390625, 4.375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 14.0, 16.0, 32.0, 95.0, 129.0, 187.0, 199.0, 134.0, 103.0, 53.0, 25.0, 3.0, 7.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.10092163085938, -75.42745971679688, -72.75399017333984, -70.08052825927734, -67.40705871582031, -64.73359680175781, -62.06013107299805, -59.38666534423828, -56.713199615478516, -54.03973388671875, -51.366268157958984, -48.69280242919922, -46.01934051513672, -43.34587097167969, -40.67240905761719, -37.99894332885742, -35.325477600097656, -32.65201187133789, -29.978546142578125, -27.305082321166992, -24.631616592407227, -21.95815086364746, -19.284687042236328, -16.611221313476562, -13.937755584716797, -11.264289855957031, -8.590825080871582, -5.917360305786133, -3.243894577026367, -0.5704288482666016, 2.1030349731445312, 4.776500701904297, 7.449974060058594, 10.12343978881836, 12.796904563903809, 15.470369338989258, 18.143835067749023, 20.81730079650879, 23.490764617919922, 26.164230346679688, 28.837696075439453, 31.51116180419922, 34.184627532958984, 36.85809326171875, 39.53155517578125, 42.20502471923828, 44.87848663330078, 47.55195236206055, 50.22541809082031, 52.89888381958008, 55.572349548339844, 58.245811462402344, 60.919281005859375, 63.592742919921875, 66.26620483398438, 68.9396743774414, 71.61314392089844, 74.28660583496094, 76.96007537841797, 79.63353729248047, 82.3070068359375, 84.98046875, 87.6539306640625, 90.32740020751953, 93.00086212158203]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 7.0, 11.0, 19.0, 14.0, 16.0, 19.0, 23.0, 25.0, 25.0, 29.0, 38.0, 37.0, 39.0, 42.0, 52.0, 51.0, 58.0, 48.0, 59.0, 42.0, 37.0, 45.0, 34.0, 40.0, 32.0, 28.0, 27.0, 16.0, 19.0, 18.0, 8.0, 4.0, 10.0, 3.0, 3.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.343772888183594, -36.130653381347656, -34.917537689208984, -33.70441818237305, -32.49129867553711, -31.278182983398438, -30.0650634765625, -28.851945877075195, -27.63882827758789, -26.425710678100586, -25.21259117126465, -23.999473571777344, -22.78635597229004, -21.573238372802734, -20.360118865966797, -19.147001266479492, -17.933881759643555, -16.72076416015625, -15.507645606994629, -14.294527053833008, -13.081409454345703, -11.868290901184082, -10.655172348022461, -9.442054748535156, -8.228936195373535, -7.015818119049072, -5.802700042724609, -4.589581489562988, -3.3764634132385254, -2.1633453369140625, -0.9502267837524414, 0.2628908157348633, 1.4760093688964844, 2.6891274452209473, 3.9022457599639893, 5.115364074707031, 6.328482151031494, 7.541600227355957, 8.754718780517578, 9.967836380004883, 11.180954933166504, 12.394073486328125, 13.60719108581543, 14.82030963897705, 16.033428192138672, 17.246545791625977, 18.45966339111328, 19.67278289794922, 20.885900497436523, 22.099018096923828, 23.312137603759766, 24.52525520324707, 25.738372802734375, 26.951492309570312, 28.164609909057617, 29.377727508544922, 30.59084701538086, 31.803964614868164, 33.01708221435547, 34.230201721191406, 35.443321228027344, 36.656436920166016, 37.86955642700195, 39.082672119140625, 40.29579162597656]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 10.0, 18.0, 17.0, 24.0, 32.0, 45.0, 69.0, 107.0, 175.0, 219.0, 377.0, 618.0, 1016.0, 1827.0, 3340.0, 6894.0, 16729.0, 54558.0, 362795.0, 3466188.0, 211866.0, 40833.0, 13847.0, 5947.0, 2946.0, 1518.0, 865.0, 491.0, 271.0, 232.0, 125.0, 83.0, 57.0, 47.0, 26.0, 23.0, 10.0, 7.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6484375, -8.389404296875, -8.13037109375, -7.871337890625, -7.6123046875, -7.353271484375, -7.09423828125, -6.835205078125, -6.576171875, -6.317138671875, -6.05810546875, -5.799072265625, -5.5400390625, -5.281005859375, -5.02197265625, -4.762939453125, -4.50390625, -4.244873046875, -3.98583984375, -3.726806640625, -3.4677734375, -3.208740234375, -2.94970703125, -2.690673828125, -2.431640625, -2.172607421875, -1.91357421875, -1.654541015625, -1.3955078125, -1.136474609375, -0.87744140625, -0.618408203125, -0.359375, -0.100341796875, 0.15869140625, 0.417724609375, 0.6767578125, 0.935791015625, 1.19482421875, 1.453857421875, 1.712890625, 1.971923828125, 2.23095703125, 2.489990234375, 2.7490234375, 3.008056640625, 3.26708984375, 3.526123046875, 3.78515625, 4.044189453125, 4.30322265625, 4.562255859375, 4.8212890625, 5.080322265625, 5.33935546875, 5.598388671875, 5.857421875, 6.116455078125, 6.37548828125, 6.634521484375, 6.8935546875, 7.152587890625, 7.41162109375, 7.670654296875, 7.9296875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 0.0, 1.0, 6.0, 7.0, 5.0, 6.0, 9.0, 12.0, 14.0, 19.0, 15.0, 19.0, 18.0, 23.0, 29.0, 26.0, 31.0, 27.0, 38.0, 38.0, 36.0, 41.0, 39.0, 40.0, 46.0, 36.0, 31.0, 27.0, 50.0, 48.0, 26.0, 28.0, 33.0, 26.0, 20.0, 23.0, 17.0, 25.0, 16.0, 8.0, 8.0, 12.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.2763671875, -1.235137939453125, -1.19390869140625, -1.152679443359375, -1.1114501953125, -1.070220947265625, -1.02899169921875, -0.987762451171875, -0.946533203125, -0.905303955078125, -0.86407470703125, -0.822845458984375, -0.7816162109375, -0.740386962890625, -0.69915771484375, -0.657928466796875, -0.61669921875, -0.575469970703125, -0.53424072265625, -0.493011474609375, -0.4517822265625, -0.410552978515625, -0.36932373046875, -0.328094482421875, -0.286865234375, -0.245635986328125, -0.20440673828125, -0.163177490234375, -0.1219482421875, -0.080718994140625, -0.03948974609375, 0.001739501953125, 0.04296875, 0.084197998046875, 0.12542724609375, 0.166656494140625, 0.2078857421875, 0.249114990234375, 0.29034423828125, 0.331573486328125, 0.372802734375, 0.414031982421875, 0.45526123046875, 0.496490478515625, 0.5377197265625, 0.578948974609375, 0.62017822265625, 0.661407470703125, 0.70263671875, 0.743865966796875, 0.78509521484375, 0.826324462890625, 0.8675537109375, 0.908782958984375, 0.95001220703125, 0.991241455078125, 1.032470703125, 1.073699951171875, 1.11492919921875, 1.156158447265625, 1.1973876953125, 1.238616943359375, 1.27984619140625, 1.321075439453125, 1.3623046875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 5.0, 9.0, 7.0, 10.0, 29.0, 46.0, 47.0, 75.0, 122.0, 177.0, 297.0, 429.0, 772.0, 1301.0, 2262.0, 4345.0, 8686.0, 19091.0, 48007.0, 162810.0, 1385308.0, 2276005.0, 190085.0, 53568.0, 20979.0, 9199.0, 4679.0, 2452.0, 1334.0, 744.0, 507.0, 326.0, 183.0, 115.0, 75.0, 54.0, 46.0, 21.0, 24.0, 16.0, 8.0, 7.0, 10.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-7.5859375, -7.3631591796875, -7.140380859375, -6.9176025390625, -6.69482421875, -6.4720458984375, -6.249267578125, -6.0264892578125, -5.8037109375, -5.5809326171875, -5.358154296875, -5.1353759765625, -4.91259765625, -4.6898193359375, -4.467041015625, -4.2442626953125, -4.021484375, -3.7987060546875, -3.575927734375, -3.3531494140625, -3.13037109375, -2.9075927734375, -2.684814453125, -2.4620361328125, -2.2392578125, -2.0164794921875, -1.793701171875, -1.5709228515625, -1.34814453125, -1.1253662109375, -0.902587890625, -0.6798095703125, -0.45703125, -0.2342529296875, -0.011474609375, 0.2113037109375, 0.43408203125, 0.6568603515625, 0.879638671875, 1.1024169921875, 1.3251953125, 1.5479736328125, 1.770751953125, 1.9935302734375, 2.21630859375, 2.4390869140625, 2.661865234375, 2.8846435546875, 3.107421875, 3.3302001953125, 3.552978515625, 3.7757568359375, 3.99853515625, 4.2213134765625, 4.444091796875, 4.6668701171875, 4.8896484375, 5.1124267578125, 5.335205078125, 5.5579833984375, 5.78076171875, 6.0035400390625, 6.226318359375, 6.4490966796875, 6.671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 8.0, 9.0, 9.0, 13.0, 21.0, 23.0, 35.0, 32.0, 62.0, 106.0, 163.0, 322.0, 876.0, 1339.0, 420.0, 201.0, 136.0, 74.0, 61.0, 40.0, 30.0, 25.0, 10.0, 12.0, 12.0, 9.0, 3.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.0447998046875, -3.906005859375, -3.7672119140625, -3.62841796875, -3.4896240234375, -3.350830078125, -3.2120361328125, -3.0732421875, -2.9344482421875, -2.795654296875, -2.6568603515625, -2.51806640625, -2.3792724609375, -2.240478515625, -2.1016845703125, -1.962890625, -1.8240966796875, -1.685302734375, -1.5465087890625, -1.40771484375, -1.2689208984375, -1.130126953125, -0.9913330078125, -0.8525390625, -0.7137451171875, -0.574951171875, -0.4361572265625, -0.29736328125, -0.1585693359375, -0.019775390625, 0.1190185546875, 0.2578125, 0.3966064453125, 0.535400390625, 0.6741943359375, 0.81298828125, 0.9517822265625, 1.090576171875, 1.2293701171875, 1.3681640625, 1.5069580078125, 1.645751953125, 1.7845458984375, 1.92333984375, 2.0621337890625, 2.200927734375, 2.3397216796875, 2.478515625, 2.6173095703125, 2.756103515625, 2.8948974609375, 3.03369140625, 3.1724853515625, 3.311279296875, 3.4500732421875, 3.5888671875, 3.7276611328125, 3.866455078125, 4.0052490234375, 4.14404296875, 4.2828369140625, 4.421630859375, 4.5604248046875, 4.69921875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 14.0, 33.0, 87.0, 110.0, 145.0, 182.0, 152.0, 113.0, 76.0, 45.0, 13.0, 11.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.29136657714844, -35.9809684753418, -34.67056655883789, -33.36016845703125, -32.049766540527344, -30.739368438720703, -29.428970336914062, -28.11857032775879, -26.808170318603516, -25.497770309448242, -24.18737030029297, -22.876972198486328, -21.566572189331055, -20.25617218017578, -18.94577407836914, -17.635374069213867, -16.324974060058594, -15.01457405090332, -13.704174995422363, -12.393775939941406, -11.083375930786133, -9.77297592163086, -8.462576866149902, -7.152177810668945, -5.841777801513672, -4.531378269195557, -3.2209787368774414, -1.9105792045593262, -0.6001796722412109, 0.7102198600769043, 2.0206193923950195, 3.3310184478759766, 4.64141845703125, 5.951817989349365, 7.2622175216674805, 8.572616577148438, 9.883016586303711, 11.193416595458984, 12.503815650939941, 13.814214706420898, 15.124614715576172, 16.435014724731445, 17.74541473388672, 19.05581283569336, 20.366212844848633, 21.676612854003906, 22.987010955810547, 24.29741096496582, 25.607810974121094, 26.918210983276367, 28.22861099243164, 29.53900909423828, 30.849409103393555, 32.15980911254883, 33.47020721435547, 34.780609130859375, 36.091007232666016, 37.401405334472656, 38.71180725097656, 40.0222053527832, 41.332603454589844, 42.64300537109375, 43.95340347290039, 45.26380157470703, 46.57420349121094]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 5.0, 16.0, 6.0, 18.0, 20.0, 16.0, 31.0, 34.0, 42.0, 33.0, 52.0, 32.0, 57.0, 46.0, 49.0, 59.0, 54.0, 54.0, 53.0, 56.0, 42.0, 36.0, 29.0, 41.0, 22.0, 16.0, 16.0, 12.0, 8.0, 16.0, 9.0, 5.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.120235443115234, -19.56670379638672, -19.013172149658203, -18.459638595581055, -17.90610694885254, -17.352575302124023, -16.799043655395508, -16.24551010131836, -15.691978454589844, -15.138446807861328, -14.584914207458496, -14.03138256072998, -13.477849960327148, -12.924318313598633, -12.370786666870117, -11.817254066467285, -11.26372241973877, -10.710190773010254, -10.156658172607422, -9.603126525878906, -9.049593925476074, -8.496062278747559, -7.942530155181885, -7.388998031616211, -6.835465908050537, -6.281933784484863, -5.7284016609191895, -5.174869537353516, -4.621337890625, -4.067805290222168, -3.5142736434936523, -2.9607415199279785, -2.407210350036621, -1.8536782264709473, -1.300146222114563, -0.7466142177581787, -0.19308209419250488, 0.36045002937316895, 0.9139819145202637, 1.4675140380859375, 2.0210461616516113, 2.574578285217285, 3.128110408782959, 3.6816422939300537, 4.235174179077148, 4.7887067794799805, 5.342238426208496, 5.89577054977417, 6.449302673339844, 7.002834796905518, 7.556366920471191, 8.109898567199707, 8.663431167602539, 9.216962814331055, 9.77049446105957, 10.324027061462402, 10.877559661865234, 11.43109130859375, 11.984623908996582, 12.538155555725098, 13.09168815612793, 13.645219802856445, 14.198751449584961, 14.752284049987793, 15.305815696716309]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 4.0, 3.0, 8.0, 9.0, 13.0, 13.0, 36.0, 49.0, 77.0, 124.0, 198.0, 345.0, 608.0, 1117.0, 2326.0, 4860.0, 11301.0, 26909.0, 68701.0, 172293.0, 325340.0, 252804.0, 108338.0, 41979.0, 17155.0, 7274.0, 3175.0, 1572.0, 833.0, 437.0, 250.0, 136.0, 95.0, 54.0, 28.0, 23.0, 18.0, 18.0, 7.0, 2.0, 5.0, 3.0, 2.0, 8.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.90625, -5.731201171875, -5.55615234375, -5.381103515625, -5.2060546875, -5.031005859375, -4.85595703125, -4.680908203125, -4.505859375, -4.330810546875, -4.15576171875, -3.980712890625, -3.8056640625, -3.630615234375, -3.45556640625, -3.280517578125, -3.10546875, -2.930419921875, -2.75537109375, -2.580322265625, -2.4052734375, -2.230224609375, -2.05517578125, -1.880126953125, -1.705078125, -1.530029296875, -1.35498046875, -1.179931640625, -1.0048828125, -0.829833984375, -0.65478515625, -0.479736328125, -0.3046875, -0.129638671875, 0.04541015625, 0.220458984375, 0.3955078125, 0.570556640625, 0.74560546875, 0.920654296875, 1.095703125, 1.270751953125, 1.44580078125, 1.620849609375, 1.7958984375, 1.970947265625, 2.14599609375, 2.321044921875, 2.49609375, 2.671142578125, 2.84619140625, 3.021240234375, 3.1962890625, 3.371337890625, 3.54638671875, 3.721435546875, 3.896484375, 4.071533203125, 4.24658203125, 4.421630859375, 4.5966796875, 4.771728515625, 4.94677734375, 5.121826171875, 5.296875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 7.0, 7.0, 7.0, 9.0, 6.0, 10.0, 16.0, 19.0, 23.0, 25.0, 22.0, 18.0, 26.0, 30.0, 29.0, 28.0, 39.0, 38.0, 40.0, 40.0, 50.0, 38.0, 39.0, 34.0, 30.0, 44.0, 35.0, 39.0, 36.0, 33.0, 27.0, 26.0, 20.0, 19.0, 20.0, 12.0, 12.0, 9.0, 9.0, 9.0, 7.0, 5.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.439453125, -1.3949432373046875, -1.350433349609375, -1.3059234619140625, -1.26141357421875, -1.2169036865234375, -1.172393798828125, -1.1278839111328125, -1.0833740234375, -1.0388641357421875, -0.994354248046875, -0.9498443603515625, -0.90533447265625, -0.8608245849609375, -0.816314697265625, -0.7718048095703125, -0.727294921875, -0.6827850341796875, -0.638275146484375, -0.5937652587890625, -0.54925537109375, -0.5047454833984375, -0.460235595703125, -0.4157257080078125, -0.3712158203125, -0.3267059326171875, -0.282196044921875, -0.2376861572265625, -0.19317626953125, -0.1486663818359375, -0.104156494140625, -0.0596466064453125, -0.01513671875, 0.0293731689453125, 0.073883056640625, 0.1183929443359375, 0.16290283203125, 0.2074127197265625, 0.251922607421875, 0.2964324951171875, 0.3409423828125, 0.3854522705078125, 0.429962158203125, 0.4744720458984375, 0.51898193359375, 0.5634918212890625, 0.608001708984375, 0.6525115966796875, 0.697021484375, 0.7415313720703125, 0.786041259765625, 0.8305511474609375, 0.87506103515625, 0.9195709228515625, 0.964080810546875, 1.0085906982421875, 1.0531005859375, 1.0976104736328125, 1.142120361328125, 1.1866302490234375, 1.23114013671875, 1.2756500244140625, 1.320159912109375, 1.3646697998046875, 1.4091796875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 8.0, 11.0, 10.0, 18.0, 20.0, 32.0, 37.0, 57.0, 76.0, 87.0, 124.0, 213.0, 335.0, 564.0, 956.0, 1907.0, 6294.0, 38882.0, 352895.0, 558770.0, 71820.0, 9866.0, 2661.0, 1095.0, 630.0, 385.0, 241.0, 178.0, 97.0, 85.0, 56.0, 44.0, 29.0, 18.0, 16.0, 13.0, 7.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-15.0390625, -14.6341552734375, -14.229248046875, -13.8243408203125, -13.41943359375, -13.0145263671875, -12.609619140625, -12.2047119140625, -11.7998046875, -11.3948974609375, -10.989990234375, -10.5850830078125, -10.18017578125, -9.7752685546875, -9.370361328125, -8.9654541015625, -8.560546875, -8.1556396484375, -7.750732421875, -7.3458251953125, -6.94091796875, -6.5360107421875, -6.131103515625, -5.7261962890625, -5.3212890625, -4.9163818359375, -4.511474609375, -4.1065673828125, -3.70166015625, -3.2967529296875, -2.891845703125, -2.4869384765625, -2.08203125, -1.6771240234375, -1.272216796875, -0.8673095703125, -0.46240234375, -0.0574951171875, 0.347412109375, 0.7523193359375, 1.1572265625, 1.5621337890625, 1.967041015625, 2.3719482421875, 2.77685546875, 3.1817626953125, 3.586669921875, 3.9915771484375, 4.396484375, 4.8013916015625, 5.206298828125, 5.6112060546875, 6.01611328125, 6.4210205078125, 6.825927734375, 7.2308349609375, 7.6357421875, 8.0406494140625, 8.445556640625, 8.8504638671875, 9.25537109375, 9.6602783203125, 10.065185546875, 10.4700927734375, 10.875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 6.0, 10.0, 7.0, 13.0, 19.0, 16.0, 26.0, 14.0, 24.0, 32.0, 27.0, 42.0, 53.0, 39.0, 55.0, 43.0, 50.0, 36.0, 36.0, 49.0, 52.0, 39.0, 39.0, 33.0, 22.0, 30.0, 33.0, 23.0, 18.0, 18.0, 17.0, 14.0, 12.0, 3.0, 9.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.3515625, -9.065673828125, -8.77978515625, -8.493896484375, -8.2080078125, -7.922119140625, -7.63623046875, -7.350341796875, -7.064453125, -6.778564453125, -6.49267578125, -6.206787109375, -5.9208984375, -5.635009765625, -5.34912109375, -5.063232421875, -4.77734375, -4.491455078125, -4.20556640625, -3.919677734375, -3.6337890625, -3.347900390625, -3.06201171875, -2.776123046875, -2.490234375, -2.204345703125, -1.91845703125, -1.632568359375, -1.3466796875, -1.060791015625, -0.77490234375, -0.489013671875, -0.203125, 0.082763671875, 0.36865234375, 0.654541015625, 0.9404296875, 1.226318359375, 1.51220703125, 1.798095703125, 2.083984375, 2.369873046875, 2.65576171875, 2.941650390625, 3.2275390625, 3.513427734375, 3.79931640625, 4.085205078125, 4.37109375, 4.656982421875, 4.94287109375, 5.228759765625, 5.5146484375, 5.800537109375, 6.08642578125, 6.372314453125, 6.658203125, 6.944091796875, 7.22998046875, 7.515869140625, 7.8017578125, 8.087646484375, 8.37353515625, 8.659423828125, 8.9453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 4.0, 3.0, 7.0, 8.0, 7.0, 9.0, 30.0, 37.0, 56.0, 90.0, 157.0, 303.0, 731.0, 1882.0, 6491.0, 28290.0, 152467.0, 541475.0, 255199.0, 46680.0, 9942.0, 2838.0, 942.0, 413.0, 204.0, 104.0, 63.0, 22.0, 43.0, 27.0, 12.0, 9.0, 3.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.86328125, -6.68572998046875, -6.5081787109375, -6.33062744140625, -6.153076171875, -5.97552490234375, -5.7979736328125, -5.62042236328125, -5.44287109375, -5.26531982421875, -5.0877685546875, -4.91021728515625, -4.732666015625, -4.55511474609375, -4.3775634765625, -4.20001220703125, -4.0224609375, -3.84490966796875, -3.6673583984375, -3.48980712890625, -3.312255859375, -3.13470458984375, -2.9571533203125, -2.77960205078125, -2.60205078125, -2.42449951171875, -2.2469482421875, -2.06939697265625, -1.891845703125, -1.71429443359375, -1.5367431640625, -1.35919189453125, -1.181640625, -1.00408935546875, -0.8265380859375, -0.64898681640625, -0.471435546875, -0.29388427734375, -0.1163330078125, 0.06121826171875, 0.23876953125, 0.41632080078125, 0.5938720703125, 0.77142333984375, 0.948974609375, 1.12652587890625, 1.3040771484375, 1.48162841796875, 1.6591796875, 1.83673095703125, 2.0142822265625, 2.19183349609375, 2.369384765625, 2.54693603515625, 2.7244873046875, 2.90203857421875, 3.07958984375, 3.25714111328125, 3.4346923828125, 3.61224365234375, 3.789794921875, 3.96734619140625, 4.1448974609375, 4.32244873046875, 4.5]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 11.0, 11.0, 14.0, 11.0, 17.0, 32.0, 31.0, 52.0, 59.0, 67.0, 75.0, 106.0, 91.0, 85.0, 70.0, 62.0, 44.0, 37.0, 29.0, 24.0, 17.0, 12.0, 16.0, 8.0, 5.0, 5.0, 3.0, 3.0, 0.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012073516845703125, -0.0011765360832214355, -0.0011457204818725586, -0.0011149048805236816, -0.0010840892791748047, -0.0010532736778259277, -0.0010224580764770508, -0.0009916424751281738, -0.0009608268737792969, -0.0009300112724304199, -0.000899195671081543, -0.000868380069732666, -0.0008375644683837891, -0.0008067488670349121, -0.0007759332656860352, -0.0007451176643371582, -0.0007143020629882812, -0.0006834864616394043, -0.0006526708602905273, -0.0006218552589416504, -0.0005910396575927734, -0.0005602240562438965, -0.0005294084548950195, -0.0004985928535461426, -0.0004677772521972656, -0.00043696165084838867, -0.0004061460494995117, -0.00037533044815063477, -0.0003445148468017578, -0.00031369924545288086, -0.0002828836441040039, -0.00025206804275512695, -0.00022125244140625, -0.00019043684005737305, -0.0001596212387084961, -0.00012880563735961914, -9.799003601074219e-05, -6.717443466186523e-05, -3.635883331298828e-05, -5.543231964111328e-06, 2.5272369384765625e-05, 5.608797073364258e-05, 8.690357208251953e-05, 0.00011771917343139648, 0.00014853477478027344, 0.0001793503761291504, 0.00021016597747802734, 0.0002409815788269043, 0.00027179718017578125, 0.0003026127815246582, 0.00033342838287353516, 0.0003642439842224121, 0.00039505958557128906, 0.000425875186920166, 0.00045669078826904297, 0.0004875063896179199, 0.0005183219909667969, 0.0005491375923156738, 0.0005799531936645508, 0.0006107687950134277, 0.0006415843963623047, 0.0006723999977111816, 0.0007032155990600586, 0.0007340312004089355, 0.0007648468017578125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 9.0, 9.0, 15.0, 22.0, 42.0, 55.0, 68.0, 118.0, 184.0, 338.0, 566.0, 1090.0, 2296.0, 6262.0, 26558.0, 156065.0, 559748.0, 240398.0, 40216.0, 8714.0, 2849.0, 1240.0, 651.0, 378.0, 232.0, 140.0, 83.0, 78.0, 31.0, 22.0, 14.0, 14.0, 6.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.1640625, -5.99102783203125, -5.8179931640625, -5.64495849609375, -5.471923828125, -5.29888916015625, -5.1258544921875, -4.95281982421875, -4.77978515625, -4.60675048828125, -4.4337158203125, -4.26068115234375, -4.087646484375, -3.91461181640625, -3.7415771484375, -3.56854248046875, -3.3955078125, -3.22247314453125, -3.0494384765625, -2.87640380859375, -2.703369140625, -2.53033447265625, -2.3572998046875, -2.18426513671875, -2.01123046875, -1.83819580078125, -1.6651611328125, -1.49212646484375, -1.319091796875, -1.14605712890625, -0.9730224609375, -0.79998779296875, -0.626953125, -0.45391845703125, -0.2808837890625, -0.10784912109375, 0.065185546875, 0.23822021484375, 0.4112548828125, 0.58428955078125, 0.75732421875, 0.93035888671875, 1.1033935546875, 1.27642822265625, 1.449462890625, 1.62249755859375, 1.7955322265625, 1.96856689453125, 2.1416015625, 2.31463623046875, 2.4876708984375, 2.66070556640625, 2.833740234375, 3.00677490234375, 3.1798095703125, 3.35284423828125, 3.52587890625, 3.69891357421875, 3.8719482421875, 4.04498291015625, 4.218017578125, 4.39105224609375, 4.5640869140625, 4.73712158203125, 4.91015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 9.0, 12.0, 12.0, 24.0, 29.0, 32.0, 61.0, 54.0, 76.0, 80.0, 84.0, 87.0, 73.0, 81.0, 68.0, 55.0, 35.0, 34.0, 20.0, 16.0, 21.0, 6.0, 8.0, 5.0, 2.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65625, -4.515380859375, -4.37451171875, -4.233642578125, -4.0927734375, -3.951904296875, -3.81103515625, -3.670166015625, -3.529296875, -3.388427734375, -3.24755859375, -3.106689453125, -2.9658203125, -2.824951171875, -2.68408203125, -2.543212890625, -2.40234375, -2.261474609375, -2.12060546875, -1.979736328125, -1.8388671875, -1.697998046875, -1.55712890625, -1.416259765625, -1.275390625, -1.134521484375, -0.99365234375, -0.852783203125, -0.7119140625, -0.571044921875, -0.43017578125, -0.289306640625, -0.1484375, -0.007568359375, 0.13330078125, 0.274169921875, 0.4150390625, 0.555908203125, 0.69677734375, 0.837646484375, 0.978515625, 1.119384765625, 1.26025390625, 1.401123046875, 1.5419921875, 1.682861328125, 1.82373046875, 1.964599609375, 2.10546875, 2.246337890625, 2.38720703125, 2.528076171875, 2.6689453125, 2.809814453125, 2.95068359375, 3.091552734375, 3.232421875, 3.373291015625, 3.51416015625, 3.655029296875, 3.7958984375, 3.936767578125, 4.07763671875, 4.218505859375, 4.359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 44.0, 114.0, 212.0, 261.0, 204.0, 113.0, 35.0, 7.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.90145874023438, -152.48587036132812, -148.07029724121094, -143.6547088623047, -139.2391357421875, -134.82354736328125, -130.407958984375, -125.99237823486328, -121.57679748535156, -117.16121673583984, -112.74563598632812, -108.33004760742188, -103.91446685791016, -99.49888610839844, -95.08329772949219, -90.66771697998047, -86.25213623046875, -81.83655548095703, -77.42097473144531, -73.00538635253906, -68.58980560302734, -64.17422485351562, -59.75864028930664, -55.343055725097656, -50.92747497558594, -46.51189422607422, -42.096309661865234, -37.68072509765625, -33.26514434814453, -28.84956169128418, -24.433979034423828, -20.018396377563477, -15.602813720703125, -11.187231063842773, -6.771648406982422, -2.3560657501220703, 2.0595169067382812, 6.475099563598633, 10.890682220458984, 15.306264877319336, 19.721847534179688, 24.13743019104004, 28.55301284790039, 32.968597412109375, 37.384178161621094, 41.79975891113281, 46.2153434753418, 50.63092803955078, 55.0465087890625, 59.46208953857422, 63.8776741027832, 68.29325866699219, 72.7088394165039, 77.12442016601562, 81.54000854492188, 85.9555892944336, 90.37117004394531, 94.78675079345703, 99.20233154296875, 103.617919921875, 108.03350067138672, 112.44908142089844, 116.86466979980469, 121.2802505493164, 125.69583129882812]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 6.0, 6.0, 8.0, 12.0, 7.0, 10.0, 9.0, 18.0, 16.0, 22.0, 27.0, 23.0, 38.0, 33.0, 34.0, 37.0, 44.0, 50.0, 46.0, 35.0, 46.0, 54.0, 50.0, 40.0, 49.0, 32.0, 36.0, 25.0, 21.0, 29.0, 16.0, 26.0, 17.0, 11.0, 11.0, 12.0, 12.0, 3.0, 11.0, 5.0, 5.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-51.0140380859375, -49.59974670410156, -48.18545150756836, -46.77116012573242, -45.35686492919922, -43.94257354736328, -42.528282165527344, -41.11398696899414, -39.69969177246094, -38.285400390625, -36.8711051940918, -35.45681381225586, -34.042518615722656, -32.62822723388672, -31.21393394470215, -29.799640655517578, -28.38534927368164, -26.97105598449707, -25.5567626953125, -24.142471313476562, -22.72817611694336, -21.313884735107422, -19.89959144592285, -18.48529815673828, -17.07100486755371, -15.65671157836914, -14.24241828918457, -12.828125953674316, -11.413832664489746, -9.999539375305176, -8.585247039794922, -7.170953750610352, -5.756660461425781, -4.342367172241211, -2.928074359893799, -1.5137815475463867, -0.0994882583618164, 1.314805030822754, 2.729097366333008, 4.143390655517578, 5.557683944702148, 6.971977233886719, 8.386270523071289, 9.800562858581543, 11.214856147766113, 12.629149436950684, 14.043441772460938, 15.457735061645508, 16.872028350830078, 18.28632164001465, 19.70061492919922, 21.114906311035156, 22.52920150756836, 23.943492889404297, 25.357786178588867, 26.772079467773438, 28.186372756958008, 29.600666046142578, 31.01495933532715, 32.42925262451172, 33.843544006347656, 35.25783920288086, 36.6721305847168, 38.08642578125, 39.50071716308594]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 8.0, 5.0, 6.0, 5.0, 5.0, 10.0, 18.0, 23.0, 26.0, 33.0, 37.0, 47.0, 68.0, 98.0, 149.0, 189.0, 298.0, 496.0, 995.0, 2139.0, 5790.0, 29592.0, 3968563.0, 164557.0, 13992.0, 3625.0, 1502.0, 779.0, 395.0, 232.0, 165.0, 104.0, 90.0, 47.0, 52.0, 35.0, 22.0, 19.0, 23.0, 18.0, 9.0, 9.0, 8.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.125, -13.616943359375, -13.10888671875, -12.600830078125, -12.0927734375, -11.584716796875, -11.07666015625, -10.568603515625, -10.060546875, -9.552490234375, -9.04443359375, -8.536376953125, -8.0283203125, -7.520263671875, -7.01220703125, -6.504150390625, -5.99609375, -5.488037109375, -4.97998046875, -4.471923828125, -3.9638671875, -3.455810546875, -2.94775390625, -2.439697265625, -1.931640625, -1.423583984375, -0.91552734375, -0.407470703125, 0.1005859375, 0.608642578125, 1.11669921875, 1.624755859375, 2.1328125, 2.640869140625, 3.14892578125, 3.656982421875, 4.1650390625, 4.673095703125, 5.18115234375, 5.689208984375, 6.197265625, 6.705322265625, 7.21337890625, 7.721435546875, 8.2294921875, 8.737548828125, 9.24560546875, 9.753662109375, 10.26171875, 10.769775390625, 11.27783203125, 11.785888671875, 12.2939453125, 12.802001953125, 13.31005859375, 13.818115234375, 14.326171875, 14.834228515625, 15.34228515625, 15.850341796875, 16.3583984375, 16.866455078125, 17.37451171875, 17.882568359375, 18.390625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 6.0, 9.0, 11.0, 9.0, 13.0, 17.0, 17.0, 17.0, 22.0, 32.0, 35.0, 38.0, 32.0, 39.0, 45.0, 50.0, 44.0, 49.0, 40.0, 39.0, 34.0, 51.0, 33.0, 37.0, 37.0, 42.0, 33.0, 30.0, 16.0, 21.0, 21.0, 16.0, 5.0, 15.0, 10.0, 3.0, 7.0, 3.0, 2.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.751953125, -1.6958160400390625, -1.639678955078125, -1.5835418701171875, -1.52740478515625, -1.4712677001953125, -1.415130615234375, -1.3589935302734375, -1.3028564453125, -1.2467193603515625, -1.190582275390625, -1.1344451904296875, -1.07830810546875, -1.0221710205078125, -0.966033935546875, -0.9098968505859375, -0.853759765625, -0.7976226806640625, -0.741485595703125, -0.6853485107421875, -0.62921142578125, -0.5730743408203125, -0.516937255859375, -0.4608001708984375, -0.4046630859375, -0.3485260009765625, -0.292388916015625, -0.2362518310546875, -0.18011474609375, -0.1239776611328125, -0.067840576171875, -0.0117034912109375, 0.04443359375, 0.1005706787109375, 0.156707763671875, 0.2128448486328125, 0.26898193359375, 0.3251190185546875, 0.381256103515625, 0.4373931884765625, 0.4935302734375, 0.5496673583984375, 0.605804443359375, 0.6619415283203125, 0.71807861328125, 0.7742156982421875, 0.830352783203125, 0.8864898681640625, 0.942626953125, 0.9987640380859375, 1.054901123046875, 1.1110382080078125, 1.16717529296875, 1.2233123779296875, 1.279449462890625, 1.3355865478515625, 1.3917236328125, 1.4478607177734375, 1.503997802734375, 1.5601348876953125, 1.61627197265625, 1.6724090576171875, 1.728546142578125, 1.7846832275390625, 1.8408203125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 8.0, 5.0, 10.0, 10.0, 15.0, 14.0, 22.0, 32.0, 45.0, 51.0, 78.0, 116.0, 172.0, 271.0, 454.0, 903.0, 2026.0, 6745.0, 56093.0, 4082111.0, 35922.0, 5416.0, 1752.0, 795.0, 407.0, 243.0, 154.0, 117.0, 90.0, 56.0, 39.0, 24.0, 25.0, 16.0, 15.0, 12.0, 1.0, 7.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.90625, -27.095703125, -26.28515625, -25.474609375, -24.6640625, -23.853515625, -23.04296875, -22.232421875, -21.421875, -20.611328125, -19.80078125, -18.990234375, -18.1796875, -17.369140625, -16.55859375, -15.748046875, -14.9375, -14.126953125, -13.31640625, -12.505859375, -11.6953125, -10.884765625, -10.07421875, -9.263671875, -8.453125, -7.642578125, -6.83203125, -6.021484375, -5.2109375, -4.400390625, -3.58984375, -2.779296875, -1.96875, -1.158203125, -0.34765625, 0.462890625, 1.2734375, 2.083984375, 2.89453125, 3.705078125, 4.515625, 5.326171875, 6.13671875, 6.947265625, 7.7578125, 8.568359375, 9.37890625, 10.189453125, 11.0, 11.810546875, 12.62109375, 13.431640625, 14.2421875, 15.052734375, 15.86328125, 16.673828125, 17.484375, 18.294921875, 19.10546875, 19.916015625, 20.7265625, 21.537109375, 22.34765625, 23.158203125, 23.96875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 9.0, 4.0, 12.0, 19.0, 33.0, 85.0, 586.0, 3103.0, 143.0, 38.0, 15.0, 13.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.46875, -5.3323974609375, -5.196044921875, -5.0596923828125, -4.92333984375, -4.7869873046875, -4.650634765625, -4.5142822265625, -4.3779296875, -4.2415771484375, -4.105224609375, -3.9688720703125, -3.83251953125, -3.6961669921875, -3.559814453125, -3.4234619140625, -3.287109375, -3.1507568359375, -3.014404296875, -2.8780517578125, -2.74169921875, -2.6053466796875, -2.468994140625, -2.3326416015625, -2.1962890625, -2.0599365234375, -1.923583984375, -1.7872314453125, -1.65087890625, -1.5145263671875, -1.378173828125, -1.2418212890625, -1.10546875, -0.9691162109375, -0.832763671875, -0.6964111328125, -0.56005859375, -0.4237060546875, -0.287353515625, -0.1510009765625, -0.0146484375, 0.1217041015625, 0.258056640625, 0.3944091796875, 0.53076171875, 0.6671142578125, 0.803466796875, 0.9398193359375, 1.076171875, 1.2125244140625, 1.348876953125, 1.4852294921875, 1.62158203125, 1.7579345703125, 1.894287109375, 2.0306396484375, 2.1669921875, 2.3033447265625, 2.439697265625, 2.5760498046875, 2.71240234375, 2.8487548828125, 2.985107421875, 3.1214599609375, 3.2578125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 2.0, 5.0, 2.0, 4.0, 10.0, 4.0, 5.0, 9.0, 7.0, 12.0, 16.0, 11.0, 28.0, 33.0, 64.0, 67.0, 92.0, 102.0, 120.0, 107.0, 95.0, 74.0, 38.0, 37.0, 28.0, 13.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.764802932739258, -12.39647102355957, -12.028138160705566, -11.659806251525879, -11.291474342346191, -10.923141479492188, -10.5548095703125, -10.186477661132812, -9.818144798278809, -9.449812889099121, -9.081480026245117, -8.71314811706543, -8.344816207885742, -7.976483345031738, -7.608151435852051, -7.239819049835205, -6.871487140655518, -6.503154754638672, -6.134822845458984, -5.766490459442139, -5.398158073425293, -5.0298261642456055, -4.66149377822876, -4.293161392211914, -3.9248292446136475, -3.556497097015381, -3.188164710998535, -2.8198325634002686, -2.451500415802002, -2.0831680297851562, -1.7148358821868896, -1.346503496170044, -0.9781713485717773, -0.6098390817642212, -0.24150687456130981, 0.12682533264160156, 0.4951575994491577, 0.8634898662567139, 1.2318220138549805, 1.6001543998718262, 1.9684865474700928, 2.3368186950683594, 2.705151081085205, 3.0734832286834717, 3.4418153762817383, 3.810147762298584, 4.17848014831543, 4.546812057495117, 4.915144443511963, 5.283476829528809, 5.651808738708496, 6.020141124725342, 6.3884735107421875, 6.756805419921875, 7.125137805938721, 7.493470191955566, 7.861802101135254, 8.230134010314941, 8.598466873168945, 8.966798782348633, 9.33513069152832, 9.703463554382324, 10.071795463562012, 10.440128326416016, 10.808460235595703]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 5.0, 12.0, 8.0, 6.0, 16.0, 14.0, 12.0, 11.0, 24.0, 23.0, 30.0, 27.0, 38.0, 44.0, 47.0, 49.0, 43.0, 50.0, 41.0, 42.0, 53.0, 52.0, 51.0, 35.0, 40.0, 38.0, 39.0, 11.0, 28.0, 22.0, 13.0, 19.0, 4.0, 12.0, 4.0, 8.0, 6.0, 3.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0], "bins": [-8.845468521118164, -8.60477066040039, -8.364072799682617, -8.123374938964844, -7.882676601409912, -7.6419782638549805, -7.401280403137207, -7.160582542419434, -6.91988468170166, -6.679186820983887, -6.438488483428955, -6.197790622711182, -5.957092761993408, -5.716394424438477, -5.475696563720703, -5.23499870300293, -4.994300365447998, -4.753602504730225, -4.512904167175293, -4.2722063064575195, -4.031508445739746, -3.7908103466033936, -3.550112247467041, -3.3094143867492676, -3.068716287612915, -2.8280181884765625, -2.587320327758789, -2.3466222286224365, -2.105924129486084, -1.8652262687683105, -1.624528169631958, -1.383830189704895, -1.1431326866149902, -0.9024347066879272, -0.6617366671562195, -0.4210386276245117, -0.18034064769744873, 0.06035733222961426, 0.3010554313659668, 0.5417534112930298, 0.7824513912200928, 1.0231493711471558, 1.2638473510742188, 1.5045454502105713, 1.7452434301376343, 1.9859414100646973, 2.22663950920105, 2.4673376083374023, 2.708035469055176, 2.9487335681915283, 3.1894314289093018, 3.4301295280456543, 3.6708273887634277, 3.9115254878997803, 4.152223587036133, 4.392921447753906, 4.63361930847168, 4.874317169189453, 5.115015506744385, 5.355713367462158, 5.596411228179932, 5.837109565734863, 6.077807426452637, 6.31850528717041, 6.559203624725342]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 10.0, 21.0, 18.0, 17.0, 38.0, 54.0, 66.0, 102.0, 215.0, 409.0, 888.0, 1923.0, 4656.0, 12158.0, 32324.0, 85912.0, 206074.0, 326035.0, 222988.0, 95473.0, 36137.0, 13625.0, 5288.0, 2116.0, 917.0, 466.0, 224.0, 125.0, 76.0, 47.0, 38.0, 30.0, 16.0, 15.0, 8.0, 5.0, 6.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.82421875, -5.6396484375, -5.455078125, -5.2705078125, -5.0859375, -4.9013671875, -4.716796875, -4.5322265625, -4.34765625, -4.1630859375, -3.978515625, -3.7939453125, -3.609375, -3.4248046875, -3.240234375, -3.0556640625, -2.87109375, -2.6865234375, -2.501953125, -2.3173828125, -2.1328125, -1.9482421875, -1.763671875, -1.5791015625, -1.39453125, -1.2099609375, -1.025390625, -0.8408203125, -0.65625, -0.4716796875, -0.287109375, -0.1025390625, 0.08203125, 0.2666015625, 0.451171875, 0.6357421875, 0.8203125, 1.0048828125, 1.189453125, 1.3740234375, 1.55859375, 1.7431640625, 1.927734375, 2.1123046875, 2.296875, 2.4814453125, 2.666015625, 2.8505859375, 3.03515625, 3.2197265625, 3.404296875, 3.5888671875, 3.7734375, 3.9580078125, 4.142578125, 4.3271484375, 4.51171875, 4.6962890625, 4.880859375, 5.0654296875, 5.25, 5.4345703125, 5.619140625, 5.8037109375, 5.98828125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 2.0, 6.0, 5.0, 9.0, 16.0, 14.0, 14.0, 18.0, 22.0, 22.0, 25.0, 37.0, 44.0, 37.0, 45.0, 51.0, 45.0, 43.0, 46.0, 52.0, 47.0, 53.0, 43.0, 39.0, 41.0, 38.0, 26.0, 32.0, 20.0, 24.0, 17.0, 15.0, 10.0, 11.0, 6.0, 2.0, 9.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.1846923828125, -2.115478515625, -2.0462646484375, -1.97705078125, -1.9078369140625, -1.838623046875, -1.7694091796875, -1.7001953125, -1.6309814453125, -1.561767578125, -1.4925537109375, -1.42333984375, -1.3541259765625, -1.284912109375, -1.2156982421875, -1.146484375, -1.0772705078125, -1.008056640625, -0.9388427734375, -0.86962890625, -0.8004150390625, -0.731201171875, -0.6619873046875, -0.5927734375, -0.5235595703125, -0.454345703125, -0.3851318359375, -0.31591796875, -0.2467041015625, -0.177490234375, -0.1082763671875, -0.0390625, 0.0301513671875, 0.099365234375, 0.1685791015625, 0.23779296875, 0.3070068359375, 0.376220703125, 0.4454345703125, 0.5146484375, 0.5838623046875, 0.653076171875, 0.7222900390625, 0.79150390625, 0.8607177734375, 0.929931640625, 0.9991455078125, 1.068359375, 1.1375732421875, 1.206787109375, 1.2760009765625, 1.34521484375, 1.4144287109375, 1.483642578125, 1.5528564453125, 1.6220703125, 1.6912841796875, 1.760498046875, 1.8297119140625, 1.89892578125, 1.9681396484375, 2.037353515625, 2.1065673828125, 2.17578125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 9.0, 8.0, 17.0, 16.0, 33.0, 29.0, 56.0, 80.0, 123.0, 187.0, 275.0, 435.0, 809.0, 1753.0, 5829.0, 48308.0, 611235.0, 347237.0, 25164.0, 3858.0, 1328.0, 630.0, 403.0, 245.0, 173.0, 91.0, 71.0, 45.0, 28.0, 16.0, 15.0, 16.0, 11.0, 2.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.8046875, -15.3087158203125, -14.812744140625, -14.3167724609375, -13.82080078125, -13.3248291015625, -12.828857421875, -12.3328857421875, -11.8369140625, -11.3409423828125, -10.844970703125, -10.3489990234375, -9.85302734375, -9.3570556640625, -8.861083984375, -8.3651123046875, -7.869140625, -7.3731689453125, -6.877197265625, -6.3812255859375, -5.88525390625, -5.3892822265625, -4.893310546875, -4.3973388671875, -3.9013671875, -3.4053955078125, -2.909423828125, -2.4134521484375, -1.91748046875, -1.4215087890625, -0.925537109375, -0.4295654296875, 0.06640625, 0.5623779296875, 1.058349609375, 1.5543212890625, 2.05029296875, 2.5462646484375, 3.042236328125, 3.5382080078125, 4.0341796875, 4.5301513671875, 5.026123046875, 5.5220947265625, 6.01806640625, 6.5140380859375, 7.010009765625, 7.5059814453125, 8.001953125, 8.4979248046875, 8.993896484375, 9.4898681640625, 9.98583984375, 10.4818115234375, 10.977783203125, 11.4737548828125, 11.9697265625, 12.4656982421875, 12.961669921875, 13.4576416015625, 13.95361328125, 14.4495849609375, 14.945556640625, 15.4415283203125, 15.9375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 12.0, 8.0, 9.0, 16.0, 15.0, 27.0, 26.0, 30.0, 30.0, 35.0, 38.0, 45.0, 34.0, 57.0, 50.0, 56.0, 56.0, 45.0, 49.0, 54.0, 43.0, 40.0, 42.0, 30.0, 25.0, 24.0, 15.0, 22.0, 12.0, 14.0, 4.0, 6.0, 7.0, 7.0, 4.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.4375, -14.0411376953125, -13.644775390625, -13.2484130859375, -12.85205078125, -12.4556884765625, -12.059326171875, -11.6629638671875, -11.2666015625, -10.8702392578125, -10.473876953125, -10.0775146484375, -9.68115234375, -9.2847900390625, -8.888427734375, -8.4920654296875, -8.095703125, -7.6993408203125, -7.302978515625, -6.9066162109375, -6.51025390625, -6.1138916015625, -5.717529296875, -5.3211669921875, -4.9248046875, -4.5284423828125, -4.132080078125, -3.7357177734375, -3.33935546875, -2.9429931640625, -2.546630859375, -2.1502685546875, -1.75390625, -1.3575439453125, -0.961181640625, -0.5648193359375, -0.16845703125, 0.2279052734375, 0.624267578125, 1.0206298828125, 1.4169921875, 1.8133544921875, 2.209716796875, 2.6060791015625, 3.00244140625, 3.3988037109375, 3.795166015625, 4.1915283203125, 4.587890625, 4.9842529296875, 5.380615234375, 5.7769775390625, 6.17333984375, 6.5697021484375, 6.966064453125, 7.3624267578125, 7.7587890625, 8.1551513671875, 8.551513671875, 8.9478759765625, 9.34423828125, 9.7406005859375, 10.136962890625, 10.5333251953125, 10.9296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 9.0, 4.0, 7.0, 12.0, 7.0, 27.0, 49.0, 121.0, 169.0, 336.0, 774.0, 1882.0, 5900.0, 25663.0, 167466.0, 623996.0, 184106.0, 28100.0, 6330.0, 2014.0, 797.0, 365.0, 176.0, 107.0, 64.0, 30.0, 21.0, 10.0, 7.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.91558837890625, -3.7491455078125, -3.58270263671875, -3.416259765625, -3.24981689453125, -3.0833740234375, -2.91693115234375, -2.75048828125, -2.58404541015625, -2.4176025390625, -2.25115966796875, -2.084716796875, -1.91827392578125, -1.7518310546875, -1.58538818359375, -1.4189453125, -1.25250244140625, -1.0860595703125, -0.91961669921875, -0.753173828125, -0.58673095703125, -0.4202880859375, -0.25384521484375, -0.08740234375, 0.07904052734375, 0.2454833984375, 0.41192626953125, 0.578369140625, 0.74481201171875, 0.9112548828125, 1.07769775390625, 1.244140625, 1.41058349609375, 1.5770263671875, 1.74346923828125, 1.909912109375, 2.07635498046875, 2.2427978515625, 2.40924072265625, 2.57568359375, 2.74212646484375, 2.9085693359375, 3.07501220703125, 3.241455078125, 3.40789794921875, 3.5743408203125, 3.74078369140625, 3.9072265625, 4.07366943359375, 4.2401123046875, 4.40655517578125, 4.572998046875, 4.73944091796875, 4.9058837890625, 5.07232666015625, 5.23876953125, 5.40521240234375, 5.5716552734375, 5.73809814453125, 5.904541015625, 6.07098388671875, 6.2374267578125, 6.40386962890625, 6.5703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 2.0, 4.0, 7.0, 6.0, 7.0, 7.0, 15.0, 10.0, 12.0, 25.0, 30.0, 33.0, 39.0, 47.0, 56.0, 66.0, 65.0, 69.0, 64.0, 50.0, 51.0, 49.0, 39.0, 37.0, 40.0, 32.0, 34.0, 24.0, 19.0, 12.0, 13.0, 7.0, 7.0, 9.0, 4.0, 6.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0006237030029296875, -0.0006044954061508179, -0.0005852878093719482, -0.0005660802125930786, -0.000546872615814209, -0.0005276650190353394, -0.0005084574222564697, -0.0004892498254776001, -0.00047004222869873047, -0.00045083463191986084, -0.0004316270351409912, -0.0004124194383621216, -0.00039321184158325195, -0.0003740042448043823, -0.0003547966480255127, -0.00033558905124664307, -0.00031638145446777344, -0.0002971738576889038, -0.0002779662609100342, -0.00025875866413116455, -0.00023955106735229492, -0.0002203434705734253, -0.00020113587379455566, -0.00018192827701568604, -0.0001627206802368164, -0.00014351308345794678, -0.00012430548667907715, -0.00010509788990020752, -8.589029312133789e-05, -6.668269634246826e-05, -4.747509956359863e-05, -2.8267502784729004e-05, -9.059906005859375e-06, 1.0147690773010254e-05, 2.9355287551879883e-05, 4.856288433074951e-05, 6.777048110961914e-05, 8.697807788848877e-05, 0.0001061856746673584, 0.00012539327144622803, 0.00014460086822509766, 0.00016380846500396729, 0.00018301606178283691, 0.00020222365856170654, 0.00022143125534057617, 0.0002406388521194458, 0.00025984644889831543, 0.00027905404567718506, 0.0002982616424560547, 0.0003174692392349243, 0.00033667683601379395, 0.0003558844327926636, 0.0003750920295715332, 0.00039429962635040283, 0.00041350722312927246, 0.0004327148199081421, 0.0004519224166870117, 0.00047113001346588135, 0.000490337610244751, 0.0005095452070236206, 0.0005287528038024902, 0.0005479604005813599, 0.0005671679973602295, 0.0005863755941390991, 0.0006055831909179688]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 7.0, 11.0, 12.0, 16.0, 27.0, 48.0, 64.0, 106.0, 188.0, 340.0, 684.0, 1840.0, 5515.0, 34148.0, 451007.0, 506532.0, 38616.0, 5961.0, 1827.0, 734.0, 370.0, 201.0, 109.0, 62.0, 46.0, 30.0, 18.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.8297119140625, -6.616455078125, -6.4031982421875, -6.18994140625, -5.9766845703125, -5.763427734375, -5.5501708984375, -5.3369140625, -5.1236572265625, -4.910400390625, -4.6971435546875, -4.48388671875, -4.2706298828125, -4.057373046875, -3.8441162109375, -3.630859375, -3.4176025390625, -3.204345703125, -2.9910888671875, -2.77783203125, -2.5645751953125, -2.351318359375, -2.1380615234375, -1.9248046875, -1.7115478515625, -1.498291015625, -1.2850341796875, -1.07177734375, -0.8585205078125, -0.645263671875, -0.4320068359375, -0.21875, -0.0054931640625, 0.207763671875, 0.4210205078125, 0.63427734375, 0.8475341796875, 1.060791015625, 1.2740478515625, 1.4873046875, 1.7005615234375, 1.913818359375, 2.1270751953125, 2.34033203125, 2.5535888671875, 2.766845703125, 2.9801025390625, 3.193359375, 3.4066162109375, 3.619873046875, 3.8331298828125, 4.04638671875, 4.2596435546875, 4.472900390625, 4.6861572265625, 4.8994140625, 5.1126708984375, 5.325927734375, 5.5391845703125, 5.75244140625, 5.9656982421875, 6.178955078125, 6.3922119140625, 6.60546875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 10.0, 15.0, 9.0, 21.0, 23.0, 22.0, 42.0, 59.0, 67.0, 68.0, 90.0, 97.0, 89.0, 66.0, 71.0, 52.0, 43.0, 30.0, 32.0, 29.0, 15.0, 12.0, 8.0, 5.0, 6.0, 4.0, 3.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.720703125, -3.580535888671875, -3.44036865234375, -3.300201416015625, -3.1600341796875, -3.019866943359375, -2.87969970703125, -2.739532470703125, -2.599365234375, -2.459197998046875, -2.31903076171875, -2.178863525390625, -2.0386962890625, -1.898529052734375, -1.75836181640625, -1.618194580078125, -1.47802734375, -1.337860107421875, -1.19769287109375, -1.057525634765625, -0.9173583984375, -0.777191162109375, -0.63702392578125, -0.496856689453125, -0.356689453125, -0.216522216796875, -0.07635498046875, 0.063812255859375, 0.2039794921875, 0.344146728515625, 0.48431396484375, 0.624481201171875, 0.7646484375, 0.904815673828125, 1.04498291015625, 1.185150146484375, 1.3253173828125, 1.465484619140625, 1.60565185546875, 1.745819091796875, 1.885986328125, 2.026153564453125, 2.16632080078125, 2.306488037109375, 2.4466552734375, 2.586822509765625, 2.72698974609375, 2.867156982421875, 3.00732421875, 3.147491455078125, 3.28765869140625, 3.427825927734375, 3.5679931640625, 3.708160400390625, 3.84832763671875, 3.988494873046875, 4.128662109375, 4.268829345703125, 4.40899658203125, 4.549163818359375, 4.6893310546875, 4.829498291015625, 4.96966552734375, 5.109832763671875, 5.25]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 10.0, 13.0, 42.0, 117.0, 157.0, 193.0, 209.0, 137.0, 77.0, 25.0, 14.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-195.56956481933594, -191.56192016601562, -187.55426025390625, -183.54661560058594, -179.53897094726562, -175.53131103515625, -171.52366638183594, -167.51600646972656, -163.50836181640625, -159.50071716308594, -155.49305725097656, -151.48541259765625, -147.47775268554688, -143.47010803222656, -139.46246337890625, -135.45480346679688, -131.44715881347656, -127.43950653076172, -123.43185424804688, -119.42420959472656, -115.41655731201172, -111.40890502929688, -107.40126037597656, -103.39360809326172, -99.38595581054688, -95.37830352783203, -91.37065124511719, -87.36300659179688, -83.35535430908203, -79.34770202636719, -75.34005737304688, -71.33240509033203, -67.32474517822266, -63.31709289550781, -59.309444427490234, -55.301795959472656, -51.29414367675781, -47.28649139404297, -43.27884292602539, -39.27119445800781, -35.26354217529297, -31.255891799926758, -27.248241424560547, -23.240591049194336, -19.232940673828125, -15.225290298461914, -11.217639923095703, -7.209989547729492, -3.2023391723632812, 0.8053112030029297, 4.812961578369141, 8.820611953735352, 12.828262329101562, 16.835912704467773, 20.843563079833984, 24.851213455200195, 28.858863830566406, 32.86651611328125, 36.87416458129883, 40.881813049316406, 44.88946533203125, 48.897117614746094, 52.90476608276367, 56.91241455078125, 60.920066833496094]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 3.0, 4.0, 7.0, 8.0, 10.0, 14.0, 11.0, 15.0, 13.0, 23.0, 21.0, 26.0, 32.0, 26.0, 36.0, 40.0, 39.0, 59.0, 52.0, 51.0, 41.0, 45.0, 58.0, 43.0, 45.0, 34.0, 37.0, 37.0, 24.0, 32.0, 19.0, 23.0, 14.0, 14.0, 9.0, 5.0, 7.0, 5.0, 7.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-63.24349594116211, -61.334815979003906, -59.4261360168457, -57.517452239990234, -55.60877227783203, -53.70009231567383, -51.791412353515625, -49.882728576660156, -47.97404861450195, -46.06536865234375, -44.15668869018555, -42.24800491333008, -40.339324951171875, -38.43064498901367, -36.52196502685547, -34.61328125, -32.70460510253906, -30.79592514038086, -28.887243270874023, -26.97856330871582, -25.069881439208984, -23.16120147705078, -21.252521514892578, -19.343839645385742, -17.435157775878906, -15.526476860046387, -13.617795944213867, -11.709115982055664, -9.800434112548828, -7.891754150390625, -5.9830732345581055, -4.074392318725586, -2.16571044921875, -0.25702965259552, 1.65165114402771, 3.5603318214416504, 5.46901273727417, 7.377693176269531, 9.28637409210205, 11.19505500793457, 13.10373592376709, 15.01241683959961, 16.921096801757812, 18.82977867126465, 20.73845863342285, 22.647140502929688, 24.55582046508789, 26.464500427246094, 28.37318229675293, 30.281862258911133, 32.19054412841797, 34.09922409057617, 36.007904052734375, 37.916587829589844, 39.82526779174805, 41.73394775390625, 43.64262771606445, 45.551307678222656, 47.45998764038086, 49.36867141723633, 51.27735137939453, 53.186031341552734, 55.09471130371094, 57.003395080566406, 58.91207504272461]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 9.0, 10.0, 12.0, 15.0, 14.0, 20.0, 31.0, 32.0, 51.0, 50.0, 105.0, 121.0, 151.0, 210.0, 323.0, 521.0, 789.0, 1240.0, 2353.0, 4933.0, 13878.0, 66065.0, 3908739.0, 158010.0, 22304.0, 6869.0, 2957.0, 1553.0, 946.0, 588.0, 381.0, 231.0, 215.0, 148.0, 94.0, 86.0, 39.0, 44.0, 43.0, 19.0, 21.0, 16.0, 11.0, 11.0, 5.0, 6.0, 4.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.984375, -9.6788330078125, -9.373291015625, -9.0677490234375, -8.76220703125, -8.4566650390625, -8.151123046875, -7.8455810546875, -7.5400390625, -7.2344970703125, -6.928955078125, -6.6234130859375, -6.31787109375, -6.0123291015625, -5.706787109375, -5.4012451171875, -5.095703125, -4.7901611328125, -4.484619140625, -4.1790771484375, -3.87353515625, -3.5679931640625, -3.262451171875, -2.9569091796875, -2.6513671875, -2.3458251953125, -2.040283203125, -1.7347412109375, -1.42919921875, -1.1236572265625, -0.818115234375, -0.5125732421875, -0.20703125, 0.0985107421875, 0.404052734375, 0.7095947265625, 1.01513671875, 1.3206787109375, 1.626220703125, 1.9317626953125, 2.2373046875, 2.5428466796875, 2.848388671875, 3.1539306640625, 3.45947265625, 3.7650146484375, 4.070556640625, 4.3760986328125, 4.681640625, 4.9871826171875, 5.292724609375, 5.5982666015625, 5.90380859375, 6.2093505859375, 6.514892578125, 6.8204345703125, 7.1259765625, 7.4315185546875, 7.737060546875, 8.0426025390625, 8.34814453125, 8.6536865234375, 8.959228515625, 9.2647705078125, 9.5703125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 4.0, 4.0, 8.0, 6.0, 8.0, 12.0, 11.0, 15.0, 17.0, 21.0, 16.0, 28.0, 34.0, 31.0, 46.0, 41.0, 55.0, 54.0, 62.0, 50.0, 55.0, 35.0, 45.0, 52.0, 37.0, 36.0, 48.0, 33.0, 38.0, 19.0, 12.0, 14.0, 9.0, 8.0, 6.0, 5.0, 6.0, 5.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.099609375, -2.02862548828125, -1.9576416015625, -1.88665771484375, -1.815673828125, -1.74468994140625, -1.6737060546875, -1.60272216796875, -1.53173828125, -1.46075439453125, -1.3897705078125, -1.31878662109375, -1.247802734375, -1.17681884765625, -1.1058349609375, -1.03485107421875, -0.9638671875, -0.89288330078125, -0.8218994140625, -0.75091552734375, -0.679931640625, -0.60894775390625, -0.5379638671875, -0.46697998046875, -0.39599609375, -0.32501220703125, -0.2540283203125, -0.18304443359375, -0.112060546875, -0.04107666015625, 0.0299072265625, 0.10089111328125, 0.171875, 0.24285888671875, 0.3138427734375, 0.38482666015625, 0.455810546875, 0.52679443359375, 0.5977783203125, 0.66876220703125, 0.73974609375, 0.81072998046875, 0.8817138671875, 0.95269775390625, 1.023681640625, 1.09466552734375, 1.1656494140625, 1.23663330078125, 1.3076171875, 1.37860107421875, 1.4495849609375, 1.52056884765625, 1.591552734375, 1.66253662109375, 1.7335205078125, 1.80450439453125, 1.87548828125, 1.94647216796875, 2.0174560546875, 2.08843994140625, 2.159423828125, 2.23040771484375, 2.3013916015625, 2.37237548828125, 2.443359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 5.0, 11.0, 12.0, 13.0, 19.0, 31.0, 34.0, 49.0, 61.0, 107.0, 114.0, 167.0, 208.0, 316.0, 438.0, 636.0, 921.0, 1553.0, 2748.0, 5291.0, 12994.0, 48045.0, 855638.0, 3185841.0, 52206.0, 13578.0, 5548.0, 2789.0, 1584.0, 1050.0, 667.0, 418.0, 313.0, 224.0, 158.0, 137.0, 96.0, 79.0, 46.0, 34.0, 26.0, 18.0, 13.0, 11.0, 8.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.9609375, -9.64990234375, -9.3388671875, -9.02783203125, -8.716796875, -8.40576171875, -8.0947265625, -7.78369140625, -7.47265625, -7.16162109375, -6.8505859375, -6.53955078125, -6.228515625, -5.91748046875, -5.6064453125, -5.29541015625, -4.984375, -4.67333984375, -4.3623046875, -4.05126953125, -3.740234375, -3.42919921875, -3.1181640625, -2.80712890625, -2.49609375, -2.18505859375, -1.8740234375, -1.56298828125, -1.251953125, -0.94091796875, -0.6298828125, -0.31884765625, -0.0078125, 0.30322265625, 0.6142578125, 0.92529296875, 1.236328125, 1.54736328125, 1.8583984375, 2.16943359375, 2.48046875, 2.79150390625, 3.1025390625, 3.41357421875, 3.724609375, 4.03564453125, 4.3466796875, 4.65771484375, 4.96875, 5.27978515625, 5.5908203125, 5.90185546875, 6.212890625, 6.52392578125, 6.8349609375, 7.14599609375, 7.45703125, 7.76806640625, 8.0791015625, 8.39013671875, 8.701171875, 9.01220703125, 9.3232421875, 9.63427734375, 9.9453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 7.0, 1.0, 4.0, 7.0, 14.0, 22.0, 37.0, 72.0, 163.0, 2689.0, 710.0, 156.0, 79.0, 33.0, 21.0, 17.0, 9.0, 6.0, 9.0, 1.0, 5.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.663787841796875, -2.57171630859375, -2.479644775390625, -2.3875732421875, -2.295501708984375, -2.20343017578125, -2.111358642578125, -2.019287109375, -1.927215576171875, -1.83514404296875, -1.743072509765625, -1.6510009765625, -1.558929443359375, -1.46685791015625, -1.374786376953125, -1.28271484375, -1.190643310546875, -1.09857177734375, -1.006500244140625, -0.9144287109375, -0.822357177734375, -0.73028564453125, -0.638214111328125, -0.546142578125, -0.454071044921875, -0.36199951171875, -0.269927978515625, -0.1778564453125, -0.085784912109375, 0.00628662109375, 0.098358154296875, 0.1904296875, 0.282501220703125, 0.37457275390625, 0.466644287109375, 0.5587158203125, 0.650787353515625, 0.74285888671875, 0.834930419921875, 0.927001953125, 1.019073486328125, 1.11114501953125, 1.203216552734375, 1.2952880859375, 1.387359619140625, 1.47943115234375, 1.571502685546875, 1.66357421875, 1.755645751953125, 1.84771728515625, 1.939788818359375, 2.0318603515625, 2.123931884765625, 2.21600341796875, 2.308074951171875, 2.400146484375, 2.492218017578125, 2.58428955078125, 2.676361083984375, 2.7684326171875, 2.860504150390625, 2.95257568359375, 3.044647216796875, 3.13671875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 6.0, 10.0, 24.0, 24.0, 18.0, 36.0, 65.0, 63.0, 63.0, 74.0, 72.0, 72.0, 66.0, 73.0, 59.0, 60.0, 43.0, 50.0, 26.0, 18.0, 15.0, 12.0, 8.0, 5.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.847022533416748, -6.5972065925598145, -6.347391128540039, -6.0975751876831055, -5.84775972366333, -5.5979437828063965, -5.348128318786621, -5.0983123779296875, -4.848496437072754, -4.59868049621582, -4.348865032196045, -4.099049091339111, -3.849233627319336, -3.5994176864624023, -3.349601984024048, -3.0997862815856934, -2.849970817565918, -2.6001551151275635, -2.350339412689209, -2.1005234718322754, -1.8507078886032104, -1.600892186164856, -1.351076364517212, -1.1012606620788574, -0.8514449596405029, -0.6016292572021484, -0.35181349515914917, -0.1019977331161499, 0.1478179693222046, 0.3976336717605591, 0.6474494934082031, 0.8972651958465576, 1.147080421447754, 1.3968961238861084, 1.646711826324463, 1.896527647972107, 2.146343231201172, 2.3961591720581055, 2.64597487449646, 2.8957905769348145, 3.145606279373169, 3.3954219818115234, 3.645237684249878, 3.8950533866882324, 4.144869327545166, 4.394684791564941, 4.644500732421875, 4.894316673278809, 5.144132137298584, 5.393948078155518, 5.643763542175293, 5.893579483032227, 6.143394947052002, 6.3932108879089355, 6.643026351928711, 6.8928422927856445, 7.142658233642578, 7.392474174499512, 7.642289638519287, 7.892105579376221, 8.141921043395996, 8.39173698425293, 8.641552925109863, 8.891368865966797, 9.141183853149414]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 1.0, 0.0, 4.0, 6.0, 3.0, 9.0, 6.0, 11.0, 6.0, 13.0, 10.0, 13.0, 13.0, 22.0, 22.0, 12.0, 20.0, 35.0, 29.0, 46.0, 31.0, 35.0, 33.0, 46.0, 44.0, 37.0, 51.0, 42.0, 43.0, 44.0, 28.0, 32.0, 37.0, 36.0, 32.0, 25.0, 25.0, 15.0, 12.0, 14.0, 10.0, 11.0, 8.0, 7.0, 7.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.495150566101074, -5.3013596534729, -5.107568740844727, -4.913777828216553, -4.719986915588379, -4.526196002960205, -4.332405090332031, -4.138614177703857, -3.9448232650756836, -3.7510323524475098, -3.557241439819336, -3.363450527191162, -3.1696596145629883, -2.9758687019348145, -2.7820777893066406, -2.588286876678467, -2.394496202468872, -2.2007052898406982, -2.0069143772125244, -1.8131234645843506, -1.6193325519561768, -1.425541639328003, -1.2317508459091187, -1.0379599332809448, -0.844169020652771, -0.6503781080245972, -0.4565872251987457, -0.2627963423728943, -0.06900542974472046, 0.12478548288345337, 0.3185763359069824, 0.5123672485351562, 0.7061581611633301, 0.8999490737915039, 1.0937399864196777, 1.2875308990478516, 1.4813218116760254, 1.6751127243041992, 1.8689035177230835, 2.062694549560547, 2.2564854621887207, 2.4502763748168945, 2.6440672874450684, 2.837858200073242, 3.031649112701416, 3.22544002532959, 3.4192309379577637, 3.6130218505859375, 3.8068125247955322, 4.000603199005127, 4.194394111633301, 4.388185024261475, 4.581975936889648, 4.775766849517822, 4.969557762145996, 5.16334867477417, 5.357139587402344, 5.550930500030518, 5.744721412658691, 5.938512325286865, 6.132303237915039, 6.326094150543213, 6.519885063171387, 6.7136759757995605, 6.907466888427734]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 9.0, 13.0, 8.0, 29.0, 42.0, 56.0, 80.0, 143.0, 200.0, 350.0, 590.0, 1028.0, 1968.0, 3638.0, 7057.0, 14257.0, 29514.0, 59607.0, 116387.0, 195707.0, 235772.0, 178090.0, 101864.0, 51479.0, 25041.0, 12424.0, 6113.0, 3066.0, 1765.0, 920.0, 517.0, 274.0, 193.0, 122.0, 68.0, 46.0, 34.0, 21.0, 13.0, 12.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.279296875, -3.167724609375, -3.05615234375, -2.944580078125, -2.8330078125, -2.721435546875, -2.60986328125, -2.498291015625, -2.38671875, -2.275146484375, -2.16357421875, -2.052001953125, -1.9404296875, -1.828857421875, -1.71728515625, -1.605712890625, -1.494140625, -1.382568359375, -1.27099609375, -1.159423828125, -1.0478515625, -0.936279296875, -0.82470703125, -0.713134765625, -0.6015625, -0.489990234375, -0.37841796875, -0.266845703125, -0.1552734375, -0.043701171875, 0.06787109375, 0.179443359375, 0.291015625, 0.402587890625, 0.51416015625, 0.625732421875, 0.7373046875, 0.848876953125, 0.96044921875, 1.072021484375, 1.18359375, 1.295166015625, 1.40673828125, 1.518310546875, 1.6298828125, 1.741455078125, 1.85302734375, 1.964599609375, 2.076171875, 2.187744140625, 2.29931640625, 2.410888671875, 2.5224609375, 2.634033203125, 2.74560546875, 2.857177734375, 2.96875, 3.080322265625, 3.19189453125, 3.303466796875, 3.4150390625, 3.526611328125, 3.63818359375, 3.749755859375, 3.861328125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 1.0, 7.0, 4.0, 6.0, 8.0, 7.0, 7.0, 11.0, 8.0, 18.0, 30.0, 26.0, 25.0, 47.0, 41.0, 50.0, 52.0, 54.0, 64.0, 52.0, 58.0, 53.0, 62.0, 47.0, 46.0, 33.0, 37.0, 31.0, 22.0, 21.0, 18.0, 13.0, 9.0, 3.0, 12.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.552734375, -2.471893310546875, -2.39105224609375, -2.310211181640625, -2.2293701171875, -2.148529052734375, -2.06768798828125, -1.986846923828125, -1.906005859375, -1.825164794921875, -1.74432373046875, -1.663482666015625, -1.5826416015625, -1.501800537109375, -1.42095947265625, -1.340118408203125, -1.25927734375, -1.178436279296875, -1.09759521484375, -1.016754150390625, -0.9359130859375, -0.855072021484375, -0.77423095703125, -0.693389892578125, -0.612548828125, -0.531707763671875, -0.45086669921875, -0.370025634765625, -0.2891845703125, -0.208343505859375, -0.12750244140625, -0.046661376953125, 0.0341796875, 0.115020751953125, 0.19586181640625, 0.276702880859375, 0.3575439453125, 0.438385009765625, 0.51922607421875, 0.600067138671875, 0.680908203125, 0.761749267578125, 0.84259033203125, 0.923431396484375, 1.0042724609375, 1.085113525390625, 1.16595458984375, 1.246795654296875, 1.32763671875, 1.408477783203125, 1.48931884765625, 1.570159912109375, 1.6510009765625, 1.731842041015625, 1.81268310546875, 1.893524169921875, 1.974365234375, 2.055206298828125, 2.13604736328125, 2.216888427734375, 2.2977294921875, 2.378570556640625, 2.45941162109375, 2.540252685546875, 2.62109375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 2.0, 4.0, 3.0, 12.0, 9.0, 10.0, 31.0, 34.0, 55.0, 62.0, 79.0, 137.0, 177.0, 298.0, 479.0, 774.0, 1549.0, 3642.0, 17898.0, 228068.0, 707991.0, 73425.0, 8429.0, 2423.0, 1149.0, 616.0, 387.0, 264.0, 164.0, 126.0, 63.0, 59.0, 38.0, 24.0, 19.0, 15.0, 14.0, 4.0, 7.0, 3.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4453125, -11.0675048828125, -10.689697265625, -10.3118896484375, -9.93408203125, -9.5562744140625, -9.178466796875, -8.8006591796875, -8.4228515625, -8.0450439453125, -7.667236328125, -7.2894287109375, -6.91162109375, -6.5338134765625, -6.156005859375, -5.7781982421875, -5.400390625, -5.0225830078125, -4.644775390625, -4.2669677734375, -3.88916015625, -3.5113525390625, -3.133544921875, -2.7557373046875, -2.3779296875, -2.0001220703125, -1.622314453125, -1.2445068359375, -0.86669921875, -0.4888916015625, -0.111083984375, 0.2667236328125, 0.64453125, 1.0223388671875, 1.400146484375, 1.7779541015625, 2.15576171875, 2.5335693359375, 2.911376953125, 3.2891845703125, 3.6669921875, 4.0447998046875, 4.422607421875, 4.8004150390625, 5.17822265625, 5.5560302734375, 5.933837890625, 6.3116455078125, 6.689453125, 7.0672607421875, 7.445068359375, 7.8228759765625, 8.20068359375, 8.5784912109375, 8.956298828125, 9.3341064453125, 9.7119140625, 10.0897216796875, 10.467529296875, 10.8453369140625, 11.22314453125, 11.6009521484375, 11.978759765625, 12.3565673828125, 12.734375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 5.0, 3.0, 11.0, 8.0, 17.0, 20.0, 20.0, 19.0, 30.0, 33.0, 38.0, 37.0, 38.0, 44.0, 54.0, 56.0, 48.0, 58.0, 45.0, 51.0, 38.0, 59.0, 52.0, 25.0, 30.0, 21.0, 25.0, 29.0, 19.0, 19.0, 9.0, 4.0, 12.0, 5.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0625, -10.6676025390625, -10.272705078125, -9.8778076171875, -9.48291015625, -9.0880126953125, -8.693115234375, -8.2982177734375, -7.9033203125, -7.5084228515625, -7.113525390625, -6.7186279296875, -6.32373046875, -5.9288330078125, -5.533935546875, -5.1390380859375, -4.744140625, -4.3492431640625, -3.954345703125, -3.5594482421875, -3.16455078125, -2.7696533203125, -2.374755859375, -1.9798583984375, -1.5849609375, -1.1900634765625, -0.795166015625, -0.4002685546875, -0.00537109375, 0.3895263671875, 0.784423828125, 1.1793212890625, 1.57421875, 1.9691162109375, 2.364013671875, 2.7589111328125, 3.15380859375, 3.5487060546875, 3.943603515625, 4.3385009765625, 4.7333984375, 5.1282958984375, 5.523193359375, 5.9180908203125, 6.31298828125, 6.7078857421875, 7.102783203125, 7.4976806640625, 7.892578125, 8.2874755859375, 8.682373046875, 9.0772705078125, 9.47216796875, 9.8670654296875, 10.261962890625, 10.6568603515625, 11.0517578125, 11.4466552734375, 11.841552734375, 12.2364501953125, 12.63134765625, 13.0262451171875, 13.421142578125, 13.8160400390625, 14.2109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 8.0, 12.0, 13.0, 34.0, 78.0, 168.0, 400.0, 1144.0, 5026.0, 84291.0, 869117.0, 81401.0, 5062.0, 1116.0, 353.0, 154.0, 78.0, 37.0, 30.0, 9.0, 6.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9375, -8.67840576171875, -8.4193115234375, -8.16021728515625, -7.901123046875, -7.64202880859375, -7.3829345703125, -7.12384033203125, -6.86474609375, -6.60565185546875, -6.3465576171875, -6.08746337890625, -5.828369140625, -5.56927490234375, -5.3101806640625, -5.05108642578125, -4.7919921875, -4.53289794921875, -4.2738037109375, -4.01470947265625, -3.755615234375, -3.49652099609375, -3.2374267578125, -2.97833251953125, -2.71923828125, -2.46014404296875, -2.2010498046875, -1.94195556640625, -1.682861328125, -1.42376708984375, -1.1646728515625, -0.90557861328125, -0.646484375, -0.38739013671875, -0.1282958984375, 0.13079833984375, 0.389892578125, 0.64898681640625, 0.9080810546875, 1.16717529296875, 1.42626953125, 1.68536376953125, 1.9444580078125, 2.20355224609375, 2.462646484375, 2.72174072265625, 2.9808349609375, 3.23992919921875, 3.4990234375, 3.75811767578125, 4.0172119140625, 4.27630615234375, 4.535400390625, 4.79449462890625, 5.0535888671875, 5.31268310546875, 5.57177734375, 5.83087158203125, 6.0899658203125, 6.34906005859375, 6.608154296875, 6.86724853515625, 7.1263427734375, 7.38543701171875, 7.64453125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 8.0, 5.0, 10.0, 17.0, 13.0, 17.0, 16.0, 30.0, 41.0, 48.0, 47.0, 51.0, 76.0, 62.0, 66.0, 71.0, 66.0, 66.0, 55.0, 32.0, 40.0, 29.0, 35.0, 22.0, 17.0, 14.0, 9.0, 9.0, 5.0, 6.0, 8.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005311965942382812, -0.0005119740962982178, -0.0004927515983581543, -0.0004735291004180908, -0.00045430660247802734, -0.00043508410453796387, -0.0004158616065979004, -0.0003966391086578369, -0.00037741661071777344, -0.00035819411277770996, -0.0003389716148376465, -0.000319749116897583, -0.00030052661895751953, -0.00028130412101745605, -0.0002620816230773926, -0.0002428591251373291, -0.00022363662719726562, -0.00020441412925720215, -0.00018519163131713867, -0.0001659691333770752, -0.00014674663543701172, -0.00012752413749694824, -0.00010830163955688477, -8.907914161682129e-05, -6.985664367675781e-05, -5.0634145736694336e-05, -3.141164779663086e-05, -1.2189149856567383e-05, 7.033348083496094e-06, 2.625584602355957e-05, 4.547834396362305e-05, 6.470084190368652e-05, 8.392333984375e-05, 0.00010314583778381348, 0.00012236833572387695, 0.00014159083366394043, 0.0001608133316040039, 0.00018003582954406738, 0.00019925832748413086, 0.00021848082542419434, 0.0002377033233642578, 0.0002569258213043213, 0.00027614831924438477, 0.00029537081718444824, 0.0003145933151245117, 0.0003338158130645752, 0.00035303831100463867, 0.00037226080894470215, 0.0003914833068847656, 0.0004107058048248291, 0.0004299283027648926, 0.00044915080070495605, 0.00046837329864501953, 0.000487595796585083, 0.0005068182945251465, 0.00052604079246521, 0.0005452632904052734, 0.0005644857883453369, 0.0005837082862854004, 0.0006029307842254639, 0.0006221532821655273, 0.0006413757801055908, 0.0006605982780456543, 0.0006798207759857178, 0.0006990432739257812]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 20.0, 21.0, 24.0, 64.0, 116.0, 267.0, 667.0, 2124.0, 11219.0, 274633.0, 724976.0, 29257.0, 3449.0, 997.0, 385.0, 148.0, 74.0, 34.0, 22.0, 18.0, 7.0, 8.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34765625, -6.08514404296875, -5.8226318359375, -5.56011962890625, -5.297607421875, -5.03509521484375, -4.7725830078125, -4.51007080078125, -4.24755859375, -3.98504638671875, -3.7225341796875, -3.46002197265625, -3.197509765625, -2.93499755859375, -2.6724853515625, -2.40997314453125, -2.1474609375, -1.88494873046875, -1.6224365234375, -1.35992431640625, -1.097412109375, -0.83489990234375, -0.5723876953125, -0.30987548828125, -0.04736328125, 0.21514892578125, 0.4776611328125, 0.74017333984375, 1.002685546875, 1.26519775390625, 1.5277099609375, 1.79022216796875, 2.052734375, 2.31524658203125, 2.5777587890625, 2.84027099609375, 3.102783203125, 3.36529541015625, 3.6278076171875, 3.89031982421875, 4.15283203125, 4.41534423828125, 4.6778564453125, 4.94036865234375, 5.202880859375, 5.46539306640625, 5.7279052734375, 5.99041748046875, 6.2529296875, 6.51544189453125, 6.7779541015625, 7.04046630859375, 7.302978515625, 7.56549072265625, 7.8280029296875, 8.09051513671875, 8.35302734375, 8.61553955078125, 8.8780517578125, 9.14056396484375, 9.403076171875, 9.66558837890625, 9.9281005859375, 10.19061279296875, 10.453125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 11.0, 7.0, 20.0, 41.0, 63.0, 93.0, 135.0, 135.0, 131.0, 99.0, 96.0, 62.0, 39.0, 26.0, 17.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1484375, -7.92816162109375, -7.7078857421875, -7.48760986328125, -7.267333984375, -7.04705810546875, -6.8267822265625, -6.60650634765625, -6.38623046875, -6.16595458984375, -5.9456787109375, -5.72540283203125, -5.505126953125, -5.28485107421875, -5.0645751953125, -4.84429931640625, -4.6240234375, -4.40374755859375, -4.1834716796875, -3.96319580078125, -3.742919921875, -3.52264404296875, -3.3023681640625, -3.08209228515625, -2.86181640625, -2.64154052734375, -2.4212646484375, -2.20098876953125, -1.980712890625, -1.76043701171875, -1.5401611328125, -1.31988525390625, -1.099609375, -0.87933349609375, -0.6590576171875, -0.43878173828125, -0.218505859375, 0.00177001953125, 0.2220458984375, 0.44232177734375, 0.66259765625, 0.88287353515625, 1.1031494140625, 1.32342529296875, 1.543701171875, 1.76397705078125, 1.9842529296875, 2.20452880859375, 2.4248046875, 2.64508056640625, 2.8653564453125, 3.08563232421875, 3.305908203125, 3.52618408203125, 3.7464599609375, 3.96673583984375, 4.18701171875, 4.40728759765625, 4.6275634765625, 4.84783935546875, 5.068115234375, 5.28839111328125, 5.5086669921875, 5.72894287109375, 5.94921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 13.0, 18.0, 95.0, 258.0, 319.0, 206.0, 67.0, 22.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.9571762084961, -115.7615966796875, -110.5660171508789, -105.37043762207031, -100.17485046386719, -94.97927856445312, -89.78369140625, -84.5881118774414, -79.39253234863281, -74.19695281982422, -69.00137329101562, -63.805789947509766, -58.61021041870117, -53.41463088989258, -48.21904754638672, -43.023468017578125, -37.82788848876953, -32.63230895996094, -27.43672752380371, -22.241146087646484, -17.04556655883789, -11.849987030029297, -6.65440559387207, -1.4588241577148438, 3.73675537109375, 8.93233585357666, 14.12791633605957, 19.323497772216797, 24.51907730102539, 29.714656829833984, 34.910240173339844, 40.10581970214844, 45.3013916015625, 50.496971130371094, 55.69255065917969, 60.88813400268555, 66.08370971679688, 71.279296875, 76.4748764038086, 81.67045593261719, 86.86603546142578, 92.06161499023438, 97.25719451904297, 102.45277404785156, 107.64836120605469, 112.84393310546875, 118.03952026367188, 123.23509979248047, 128.43067932128906, 133.6262664794922, 138.82183837890625, 144.01742553710938, 149.21299743652344, 154.40858459472656, 159.60415649414062, 164.79974365234375, 169.99533081054688, 175.19091796875, 180.38648986816406, 185.5820770263672, 190.77764892578125, 195.97323608398438, 201.16880798339844, 206.36439514160156, 211.55996704101562]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 8.0, 6.0, 9.0, 9.0, 17.0, 23.0, 17.0, 21.0, 20.0, 34.0, 27.0, 36.0, 42.0, 38.0, 40.0, 55.0, 43.0, 49.0, 49.0, 53.0, 67.0, 36.0, 45.0, 35.0, 39.0, 32.0, 24.0, 17.0, 18.0, 16.0, 17.0, 11.0, 13.0, 8.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.229698181152344, -54.52511978149414, -52.82054138183594, -51.115962982177734, -49.41138458251953, -47.70680618286133, -46.002227783203125, -44.29765319824219, -42.59307098388672, -40.888492584228516, -39.18391418457031, -37.47933578491211, -35.774757385253906, -34.0701789855957, -32.3656005859375, -30.66102409362793, -28.95644760131836, -27.251869201660156, -25.547290802001953, -23.84271240234375, -22.138134002685547, -20.433555603027344, -18.728979110717773, -17.02440071105957, -15.319822311401367, -13.615243911743164, -11.910665512084961, -10.206088066101074, -8.501509666442871, -6.796931266784668, -5.092353820800781, -3.387775421142578, -1.683197021484375, 0.021381139755249023, 1.725959300994873, 3.430537223815918, 5.135115623474121, 6.839694023132324, 8.544271469116211, 10.248849868774414, 11.953428268432617, 13.65800666809082, 15.362585067749023, 17.067161560058594, 18.771739959716797, 20.476318359375, 22.180896759033203, 23.885475158691406, 25.59005355834961, 27.294631958007812, 28.999210357666016, 30.70378875732422, 32.40836715698242, 34.112945556640625, 35.81752014160156, 37.52210235595703, 39.22667694091797, 40.93125534057617, 42.635833740234375, 44.34041213989258, 46.04499053955078, 47.749568939208984, 49.45414733886719, 51.158721923828125, 52.863304138183594]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 4.0, 6.0, 11.0, 7.0, 16.0, 21.0, 36.0, 35.0, 64.0, 74.0, 95.0, 111.0, 166.0, 340.0, 699.0, 1876.0, 6646.0, 49203.0, 4097653.0, 29279.0, 4956.0, 1446.0, 645.0, 291.0, 138.0, 109.0, 81.0, 88.0, 33.0, 38.0, 28.0, 23.0, 18.0, 11.0, 8.0, 11.0, 2.0, 4.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.8125, -18.23193359375, -17.6513671875, -17.07080078125, -16.490234375, -15.90966796875, -15.3291015625, -14.74853515625, -14.16796875, -13.58740234375, -13.0068359375, -12.42626953125, -11.845703125, -11.26513671875, -10.6845703125, -10.10400390625, -9.5234375, -8.94287109375, -8.3623046875, -7.78173828125, -7.201171875, -6.62060546875, -6.0400390625, -5.45947265625, -4.87890625, -4.29833984375, -3.7177734375, -3.13720703125, -2.556640625, -1.97607421875, -1.3955078125, -0.81494140625, -0.234375, 0.34619140625, 0.9267578125, 1.50732421875, 2.087890625, 2.66845703125, 3.2490234375, 3.82958984375, 4.41015625, 4.99072265625, 5.5712890625, 6.15185546875, 6.732421875, 7.31298828125, 7.8935546875, 8.47412109375, 9.0546875, 9.63525390625, 10.2158203125, 10.79638671875, 11.376953125, 11.95751953125, 12.5380859375, 13.11865234375, 13.69921875, 14.27978515625, 14.8603515625, 15.44091796875, 16.021484375, 16.60205078125, 17.1826171875, 17.76318359375, 18.34375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 10.0, 18.0, 23.0, 17.0, 38.0, 25.0, 41.0, 48.0, 60.0, 63.0, 67.0, 54.0, 75.0, 59.0, 57.0, 45.0, 55.0, 50.0, 34.0, 35.0, 28.0, 16.0, 23.0, 7.0, 7.0, 5.0, 8.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.15625, -3.06396484375, -2.9716796875, -2.87939453125, -2.787109375, -2.69482421875, -2.6025390625, -2.51025390625, -2.41796875, -2.32568359375, -2.2333984375, -2.14111328125, -2.048828125, -1.95654296875, -1.8642578125, -1.77197265625, -1.6796875, -1.58740234375, -1.4951171875, -1.40283203125, -1.310546875, -1.21826171875, -1.1259765625, -1.03369140625, -0.94140625, -0.84912109375, -0.7568359375, -0.66455078125, -0.572265625, -0.47998046875, -0.3876953125, -0.29541015625, -0.203125, -0.11083984375, -0.0185546875, 0.07373046875, 0.166015625, 0.25830078125, 0.3505859375, 0.44287109375, 0.53515625, 0.62744140625, 0.7197265625, 0.81201171875, 0.904296875, 0.99658203125, 1.0888671875, 1.18115234375, 1.2734375, 1.36572265625, 1.4580078125, 1.55029296875, 1.642578125, 1.73486328125, 1.8271484375, 1.91943359375, 2.01171875, 2.10400390625, 2.1962890625, 2.28857421875, 2.380859375, 2.47314453125, 2.5654296875, 2.65771484375, 2.75]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 7.0, 12.0, 11.0, 16.0, 16.0, 35.0, 38.0, 58.0, 71.0, 127.0, 175.0, 282.0, 524.0, 1433.0, 5554.0, 48256.0, 4087979.0, 41639.0, 5240.0, 1316.0, 580.0, 284.0, 197.0, 130.0, 93.0, 59.0, 42.0, 29.0, 16.0, 15.0, 13.0, 5.0, 6.0, 3.0, 10.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.4375, -17.83251953125, -17.2275390625, -16.62255859375, -16.017578125, -15.41259765625, -14.8076171875, -14.20263671875, -13.59765625, -12.99267578125, -12.3876953125, -11.78271484375, -11.177734375, -10.57275390625, -9.9677734375, -9.36279296875, -8.7578125, -8.15283203125, -7.5478515625, -6.94287109375, -6.337890625, -5.73291015625, -5.1279296875, -4.52294921875, -3.91796875, -3.31298828125, -2.7080078125, -2.10302734375, -1.498046875, -0.89306640625, -0.2880859375, 0.31689453125, 0.921875, 1.52685546875, 2.1318359375, 2.73681640625, 3.341796875, 3.94677734375, 4.5517578125, 5.15673828125, 5.76171875, 6.36669921875, 6.9716796875, 7.57666015625, 8.181640625, 8.78662109375, 9.3916015625, 9.99658203125, 10.6015625, 11.20654296875, 11.8115234375, 12.41650390625, 13.021484375, 13.62646484375, 14.2314453125, 14.83642578125, 15.44140625, 16.04638671875, 16.6513671875, 17.25634765625, 17.861328125, 18.46630859375, 19.0712890625, 19.67626953125, 20.28125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 5.0, 15.0, 24.0, 38.0, 85.0, 526.0, 3173.0, 99.0, 52.0, 14.0, 15.0, 5.0, 6.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8443145751953125, -1.736480712890625, -1.6286468505859375, -1.52081298828125, -1.4129791259765625, -1.305145263671875, -1.1973114013671875, -1.0894775390625, -0.9816436767578125, -0.873809814453125, -0.7659759521484375, -0.65814208984375, -0.5503082275390625, -0.442474365234375, -0.3346405029296875, -0.226806640625, -0.1189727783203125, -0.011138916015625, 0.0966949462890625, 0.20452880859375, 0.3123626708984375, 0.420196533203125, 0.5280303955078125, 0.6358642578125, 0.7436981201171875, 0.851531982421875, 0.9593658447265625, 1.06719970703125, 1.1750335693359375, 1.282867431640625, 1.3907012939453125, 1.49853515625, 1.6063690185546875, 1.714202880859375, 1.8220367431640625, 1.92987060546875, 2.0377044677734375, 2.145538330078125, 2.2533721923828125, 2.3612060546875, 2.4690399169921875, 2.576873779296875, 2.6847076416015625, 2.79254150390625, 2.9003753662109375, 3.008209228515625, 3.1160430908203125, 3.223876953125, 3.3317108154296875, 3.439544677734375, 3.5473785400390625, 3.65521240234375, 3.7630462646484375, 3.870880126953125, 3.9787139892578125, 4.0865478515625, 4.1943817138671875, 4.302215576171875, 4.4100494384765625, 4.51788330078125, 4.6257171630859375, 4.733551025390625, 4.8413848876953125, 4.94921875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 10.0, 7.0, 30.0, 33.0, 36.0, 54.0, 75.0, 83.0, 113.0, 108.0, 79.0, 87.0, 65.0, 54.0, 40.0, 29.0, 23.0, 19.0, 10.0, 6.0, 3.0, 8.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-10.107322692871094, -9.82966136932373, -9.55199909210205, -9.274337768554688, -8.996676445007324, -8.719014167785645, -8.441352844238281, -8.163691520690918, -7.886029243469238, -7.608367443084717, -7.3307061195373535, -7.053044319152832, -6.7753825187683105, -6.497720718383789, -6.220059394836426, -5.942397594451904, -5.664736270904541, -5.3870744705200195, -5.109413146972656, -4.831751346588135, -4.554089546203613, -4.27642822265625, -3.9987664222717285, -3.721104621887207, -3.4434430599212646, -3.1657814979553223, -2.888119697570801, -2.6104581356048584, -2.332796573638916, -2.0551347732543945, -1.7774732112884521, -1.4998115301132202, -1.22214937210083, -0.9444876909255981, -0.666826069355011, -0.38916444778442383, -0.1115027666091919, 0.16615891456604004, 0.4438204765319824, 0.7214821577072144, 0.9991438388824463, 1.2768055200576782, 1.5544672012329102, 1.8321287631988525, 2.109790325164795, 2.3874521255493164, 2.665113687515259, 2.942775249481201, 3.2204370498657227, 3.498098611831665, 3.7757604122161865, 4.053421974182129, 4.33108377456665, 4.608745574951172, 4.886406898498535, 5.164068698883057, 5.441730499267578, 5.7193922996521, 5.997053623199463, 6.274715423583984, 6.552377223968506, 6.830039024353027, 7.107700347900391, 7.385362148284912, 7.663023471832275]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 8.0, 7.0, 2.0, 10.0, 11.0, 12.0, 19.0, 15.0, 17.0, 18.0, 27.0, 18.0, 19.0, 30.0, 29.0, 33.0, 43.0, 45.0, 38.0, 37.0, 42.0, 39.0, 41.0, 38.0, 43.0, 40.0, 32.0, 37.0, 31.0, 29.0, 24.0, 28.0, 16.0, 17.0, 22.0, 16.0, 12.0, 9.0, 9.0, 10.0, 10.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.144894123077393, -4.985811710357666, -4.8267292976379395, -4.667646408081055, -4.508563995361328, -4.349481582641602, -4.190399169921875, -4.031316757202148, -3.8722341060638428, -3.713151693344116, -3.5540690422058105, -3.394986629486084, -3.2359042167663574, -3.0768215656280518, -2.917739152908325, -2.7586565017700195, -2.599574089050293, -2.4404916763305664, -2.2814090251922607, -2.122326612472534, -1.963244080543518, -1.804161548614502, -1.6450791358947754, -1.4859966039657593, -1.3269140720367432, -1.167831540107727, -1.008749008178711, -0.8496665954589844, -0.6905840635299683, -0.5315015316009521, -0.3724190592765808, -0.21333658695220947, -0.054253578186035156, 0.10482892394065857, 0.2639114260673523, 0.422993928194046, 0.5820764303207397, 0.7411589622497559, 0.9002414345741272, 1.0593239068984985, 1.2184064388275146, 1.3774889707565308, 1.5365715026855469, 1.6956539154052734, 1.8547364473342896, 2.0138189792633057, 2.1729013919830322, 2.331984043121338, 2.4910664558410645, 2.650148868560791, 2.8092315196990967, 2.9683139324188232, 3.127396583557129, 3.2864789962768555, 3.445561408996582, 3.6046438217163086, 3.7637264728546143, 3.922808885574341, 4.0818915367126465, 4.240973949432373, 4.4000563621521, 4.559139251708984, 4.718221664428711, 4.8773040771484375, 5.036386489868164]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 13.0, 11.0, 16.0, 33.0, 39.0, 66.0, 159.0, 234.0, 376.0, 677.0, 1376.0, 2826.0, 6547.0, 17018.0, 48810.0, 144522.0, 368967.0, 294414.0, 104473.0, 35726.0, 12553.0, 5117.0, 2139.0, 1068.0, 587.0, 306.0, 197.0, 106.0, 61.0, 44.0, 22.0, 16.0, 14.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.09375, -5.92376708984375, -5.7537841796875, -5.58380126953125, -5.413818359375, -5.24383544921875, -5.0738525390625, -4.90386962890625, -4.73388671875, -4.56390380859375, -4.3939208984375, -4.22393798828125, -4.053955078125, -3.88397216796875, -3.7139892578125, -3.54400634765625, -3.3740234375, -3.20404052734375, -3.0340576171875, -2.86407470703125, -2.694091796875, -2.52410888671875, -2.3541259765625, -2.18414306640625, -2.01416015625, -1.84417724609375, -1.6741943359375, -1.50421142578125, -1.334228515625, -1.16424560546875, -0.9942626953125, -0.82427978515625, -0.654296875, -0.48431396484375, -0.3143310546875, -0.14434814453125, 0.025634765625, 0.19561767578125, 0.3656005859375, 0.53558349609375, 0.70556640625, 0.87554931640625, 1.0455322265625, 1.21551513671875, 1.385498046875, 1.55548095703125, 1.7254638671875, 1.89544677734375, 2.0654296875, 2.23541259765625, 2.4053955078125, 2.57537841796875, 2.745361328125, 2.91534423828125, 3.0853271484375, 3.25531005859375, 3.42529296875, 3.59527587890625, 3.7652587890625, 3.93524169921875, 4.105224609375, 4.27520751953125, 4.4451904296875, 4.61517333984375, 4.78515625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 3.0, 6.0, 15.0, 5.0, 31.0, 26.0, 30.0, 37.0, 45.0, 49.0, 61.0, 61.0, 74.0, 63.0, 67.0, 63.0, 58.0, 50.0, 49.0, 33.0, 35.0, 41.0, 19.0, 23.0, 8.0, 12.0, 11.0, 3.0, 9.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.953125, -3.848724365234375, -3.74432373046875, -3.639923095703125, -3.5355224609375, -3.431121826171875, -3.32672119140625, -3.222320556640625, -3.117919921875, -3.013519287109375, -2.90911865234375, -2.804718017578125, -2.7003173828125, -2.595916748046875, -2.49151611328125, -2.387115478515625, -2.28271484375, -2.178314208984375, -2.07391357421875, -1.969512939453125, -1.8651123046875, -1.760711669921875, -1.65631103515625, -1.551910400390625, -1.447509765625, -1.343109130859375, -1.23870849609375, -1.134307861328125, -1.0299072265625, -0.925506591796875, -0.82110595703125, -0.716705322265625, -0.6123046875, -0.507904052734375, -0.40350341796875, -0.299102783203125, -0.1947021484375, -0.090301513671875, 0.01409912109375, 0.118499755859375, 0.222900390625, 0.327301025390625, 0.43170166015625, 0.536102294921875, 0.6405029296875, 0.744903564453125, 0.84930419921875, 0.953704833984375, 1.05810546875, 1.162506103515625, 1.26690673828125, 1.371307373046875, 1.4757080078125, 1.580108642578125, 1.68450927734375, 1.788909912109375, 1.893310546875, 1.997711181640625, 2.10211181640625, 2.206512451171875, 2.3109130859375, 2.415313720703125, 2.51971435546875, 2.624114990234375, 2.728515625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 12.0, 18.0, 18.0, 15.0, 29.0, 41.0, 55.0, 71.0, 99.0, 143.0, 206.0, 267.0, 388.0, 579.0, 927.0, 1618.0, 3942.0, 16831.0, 136294.0, 717344.0, 143325.0, 17595.0, 4152.0, 1762.0, 930.0, 590.0, 371.0, 271.0, 181.0, 110.0, 91.0, 76.0, 60.0, 36.0, 20.0, 24.0, 10.0, 16.0, 12.0, 7.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7890625, -7.515869140625, -7.24267578125, -6.969482421875, -6.6962890625, -6.423095703125, -6.14990234375, -5.876708984375, -5.603515625, -5.330322265625, -5.05712890625, -4.783935546875, -4.5107421875, -4.237548828125, -3.96435546875, -3.691162109375, -3.41796875, -3.144775390625, -2.87158203125, -2.598388671875, -2.3251953125, -2.052001953125, -1.77880859375, -1.505615234375, -1.232421875, -0.959228515625, -0.68603515625, -0.412841796875, -0.1396484375, 0.133544921875, 0.40673828125, 0.679931640625, 0.953125, 1.226318359375, 1.49951171875, 1.772705078125, 2.0458984375, 2.319091796875, 2.59228515625, 2.865478515625, 3.138671875, 3.411865234375, 3.68505859375, 3.958251953125, 4.2314453125, 4.504638671875, 4.77783203125, 5.051025390625, 5.32421875, 5.597412109375, 5.87060546875, 6.143798828125, 6.4169921875, 6.690185546875, 6.96337890625, 7.236572265625, 7.509765625, 7.782958984375, 8.05615234375, 8.329345703125, 8.6025390625, 8.875732421875, 9.14892578125, 9.422119140625, 9.6953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 6.0, 5.0, 13.0, 15.0, 13.0, 18.0, 16.0, 15.0, 30.0, 28.0, 30.0, 35.0, 32.0, 34.0, 37.0, 47.0, 36.0, 40.0, 33.0, 43.0, 38.0, 41.0, 36.0, 36.0, 38.0, 27.0, 35.0, 30.0, 22.0, 24.0, 13.0, 18.0, 14.0, 16.0, 14.0, 15.0, 10.0, 11.0, 4.0, 7.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-10.78125, -10.46484375, -10.1484375, -9.83203125, -9.515625, -9.19921875, -8.8828125, -8.56640625, -8.25, -7.93359375, -7.6171875, -7.30078125, -6.984375, -6.66796875, -6.3515625, -6.03515625, -5.71875, -5.40234375, -5.0859375, -4.76953125, -4.453125, -4.13671875, -3.8203125, -3.50390625, -3.1875, -2.87109375, -2.5546875, -2.23828125, -1.921875, -1.60546875, -1.2890625, -0.97265625, -0.65625, -0.33984375, -0.0234375, 0.29296875, 0.609375, 0.92578125, 1.2421875, 1.55859375, 1.875, 2.19140625, 2.5078125, 2.82421875, 3.140625, 3.45703125, 3.7734375, 4.08984375, 4.40625, 4.72265625, 5.0390625, 5.35546875, 5.671875, 5.98828125, 6.3046875, 6.62109375, 6.9375, 7.25390625, 7.5703125, 7.88671875, 8.203125, 8.51953125, 8.8359375, 9.15234375, 9.46875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 11.0, 6.0, 22.0, 18.0, 34.0, 73.0, 104.0, 236.0, 461.0, 1294.0, 5228.0, 59021.0, 898215.0, 75406.0, 6000.0, 1457.0, 451.0, 213.0, 115.0, 76.0, 42.0, 21.0, 11.0, 9.0, 5.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.8125, -9.557861328125, -9.30322265625, -9.048583984375, -8.7939453125, -8.539306640625, -8.28466796875, -8.030029296875, -7.775390625, -7.520751953125, -7.26611328125, -7.011474609375, -6.7568359375, -6.502197265625, -6.24755859375, -5.992919921875, -5.73828125, -5.483642578125, -5.22900390625, -4.974365234375, -4.7197265625, -4.465087890625, -4.21044921875, -3.955810546875, -3.701171875, -3.446533203125, -3.19189453125, -2.937255859375, -2.6826171875, -2.427978515625, -2.17333984375, -1.918701171875, -1.6640625, -1.409423828125, -1.15478515625, -0.900146484375, -0.6455078125, -0.390869140625, -0.13623046875, 0.118408203125, 0.373046875, 0.627685546875, 0.88232421875, 1.136962890625, 1.3916015625, 1.646240234375, 1.90087890625, 2.155517578125, 2.41015625, 2.664794921875, 2.91943359375, 3.174072265625, 3.4287109375, 3.683349609375, 3.93798828125, 4.192626953125, 4.447265625, 4.701904296875, 4.95654296875, 5.211181640625, 5.4658203125, 5.720458984375, 5.97509765625, 6.229736328125, 6.484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 15.0, 15.0, 17.0, 28.0, 39.0, 47.0, 60.0, 88.0, 107.0, 120.0, 95.0, 91.0, 65.0, 43.0, 35.0, 32.0, 21.0, 17.0, 19.0, 9.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005316734313964844, -0.0005080774426460266, -0.00048448145389556885, -0.0004608854651451111, -0.0004372894763946533, -0.00041369348764419556, -0.0003900974988937378, -0.00036650151014328003, -0.00034290552139282227, -0.0003193095326423645, -0.00029571354389190674, -0.000272117555141449, -0.0002485215663909912, -0.00022492557764053345, -0.00020132958889007568, -0.00017773360013961792, -0.00015413761138916016, -0.0001305416226387024, -0.00010694563388824463, -8.334964513778687e-05, -5.97536563873291e-05, -3.615766763687134e-05, -1.2561678886413574e-05, 1.103430986404419e-05, 3.463029861450195e-05, 5.822628736495972e-05, 8.182227611541748e-05, 0.00010541826486587524, 0.000129014253616333, 0.00015261024236679077, 0.00017620623111724854, 0.0001998022198677063, 0.00022339820861816406, 0.0002469941973686218, 0.0002705901861190796, 0.00029418617486953735, 0.0003177821636199951, 0.0003413781523704529, 0.00036497414112091064, 0.0003885701298713684, 0.00041216611862182617, 0.00043576210737228394, 0.0004593580961227417, 0.00048295408487319946, 0.0005065500736236572, 0.000530146062374115, 0.0005537420511245728, 0.0005773380398750305, 0.0006009340286254883, 0.000624530017375946, 0.0006481260061264038, 0.0006717219948768616, 0.0006953179836273193, 0.0007189139723777771, 0.0007425099611282349, 0.0007661059498786926, 0.0007897019386291504, 0.0008132979273796082, 0.0008368939161300659, 0.0008604899048805237, 0.0008840858936309814, 0.0009076818823814392, 0.000931277871131897, 0.0009548738598823547, 0.0009784698486328125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 13.0, 9.0, 6.0, 13.0, 21.0, 35.0, 29.0, 44.0, 71.0, 102.0, 156.0, 236.0, 414.0, 711.0, 1387.0, 3028.0, 8404.0, 36805.0, 274599.0, 609525.0, 88228.0, 15769.0, 4611.0, 1873.0, 963.0, 562.0, 317.0, 181.0, 129.0, 89.0, 57.0, 38.0, 34.0, 19.0, 16.0, 10.0, 6.0, 7.0, 4.0, 3.0, 5.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.3203125, -4.186279296875, -4.05224609375, -3.918212890625, -3.7841796875, -3.650146484375, -3.51611328125, -3.382080078125, -3.248046875, -3.114013671875, -2.97998046875, -2.845947265625, -2.7119140625, -2.577880859375, -2.44384765625, -2.309814453125, -2.17578125, -2.041748046875, -1.90771484375, -1.773681640625, -1.6396484375, -1.505615234375, -1.37158203125, -1.237548828125, -1.103515625, -0.969482421875, -0.83544921875, -0.701416015625, -0.5673828125, -0.433349609375, -0.29931640625, -0.165283203125, -0.03125, 0.102783203125, 0.23681640625, 0.370849609375, 0.5048828125, 0.638916015625, 0.77294921875, 0.906982421875, 1.041015625, 1.175048828125, 1.30908203125, 1.443115234375, 1.5771484375, 1.711181640625, 1.84521484375, 1.979248046875, 2.11328125, 2.247314453125, 2.38134765625, 2.515380859375, 2.6494140625, 2.783447265625, 2.91748046875, 3.051513671875, 3.185546875, 3.319580078125, 3.45361328125, 3.587646484375, 3.7216796875, 3.855712890625, 3.98974609375, 4.123779296875, 4.2578125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 7.0, 11.0, 14.0, 10.0, 26.0, 54.0, 49.0, 68.0, 64.0, 106.0, 98.0, 90.0, 90.0, 84.0, 72.0, 63.0, 18.0, 17.0, 9.0, 9.0, 9.0, 10.0, 7.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.03125, -5.8720703125, -5.712890625, -5.5537109375, -5.39453125, -5.2353515625, -5.076171875, -4.9169921875, -4.7578125, -4.5986328125, -4.439453125, -4.2802734375, -4.12109375, -3.9619140625, -3.802734375, -3.6435546875, -3.484375, -3.3251953125, -3.166015625, -3.0068359375, -2.84765625, -2.6884765625, -2.529296875, -2.3701171875, -2.2109375, -2.0517578125, -1.892578125, -1.7333984375, -1.57421875, -1.4150390625, -1.255859375, -1.0966796875, -0.9375, -0.7783203125, -0.619140625, -0.4599609375, -0.30078125, -0.1416015625, 0.017578125, 0.1767578125, 0.3359375, 0.4951171875, 0.654296875, 0.8134765625, 0.97265625, 1.1318359375, 1.291015625, 1.4501953125, 1.609375, 1.7685546875, 1.927734375, 2.0869140625, 2.24609375, 2.4052734375, 2.564453125, 2.7236328125, 2.8828125, 3.0419921875, 3.201171875, 3.3603515625, 3.51953125, 3.6787109375, 3.837890625, 3.9970703125, 4.15625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 19.0, 106.0, 339.0, 342.0, 137.0, 38.0, 12.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-161.54248046875, -155.76971435546875, -149.99693298339844, -144.2241668701172, -138.45138549804688, -132.67861938476562, -126.90584564208984, -121.13307189941406, -115.36029815673828, -109.5875244140625, -103.81475067138672, -98.04197692871094, -92.26921081542969, -86.49642944335938, -80.72366333007812, -74.95088958740234, -69.17811584472656, -63.40534210205078, -57.632568359375, -51.859798431396484, -46.0870246887207, -40.31425094604492, -34.541481018066406, -28.768707275390625, -22.995933532714844, -17.223159790039062, -11.450387954711914, -5.677616119384766, 0.09515762329101562, 5.867931365966797, 11.640701293945312, 17.413475036621094, 23.186248779296875, 28.959022521972656, 34.73179626464844, 40.50456619262695, 46.277339935302734, 52.050113677978516, 57.82288360595703, 63.59565734863281, 69.3684310913086, 75.14120483398438, 80.91397857666016, 86.68675231933594, 92.45951843261719, 98.2322998046875, 104.00506591796875, 109.77783966064453, 115.55061340332031, 121.3233871459961, 127.09616088867188, 132.86892700195312, 138.64170837402344, 144.4144744873047, 150.187255859375, 155.96002197265625, 161.7327880859375, 167.50555419921875, 173.27833557128906, 179.0511016845703, 184.82388305664062, 190.59664916992188, 196.36941528320312, 202.14219665527344, 207.91497802734375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 13.0, 7.0, 10.0, 12.0, 17.0, 31.0, 25.0, 34.0, 29.0, 34.0, 42.0, 37.0, 49.0, 53.0, 55.0, 52.0, 57.0, 54.0, 59.0, 49.0, 31.0, 37.0, 34.0, 26.0, 32.0, 21.0, 19.0, 14.0, 16.0, 7.0, 10.0, 7.0, 3.0, 6.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0], "bins": [-64.94923400878906, -63.23587417602539, -61.522518157958984, -59.80915832519531, -58.095802307128906, -56.382442474365234, -54.66908264160156, -52.955726623535156, -51.242366790771484, -49.52900695800781, -47.815650939941406, -46.102291107177734, -44.38893508911133, -42.675575256347656, -40.96221923828125, -39.24885940551758, -37.535499572753906, -35.822139739990234, -34.10878372192383, -32.395423889160156, -30.682065963745117, -28.968708038330078, -27.25535011291504, -25.5419921875, -23.828636169433594, -22.115278244018555, -20.401920318603516, -18.688560485839844, -16.975202560424805, -15.261844635009766, -13.548486709594727, -11.835127830505371, -10.121768951416016, -8.408411026000977, -6.695052146911621, -4.981694221496582, -3.2683358192443848, -1.5549774169921875, 0.15838050842285156, 1.871739387512207, 3.585097312927246, 5.298455715179443, 7.011814117431641, 8.72517204284668, 10.438529968261719, 12.151888847351074, 13.865246772766113, 15.578605651855469, 17.291963577270508, 19.005321502685547, 20.718679428100586, 22.432037353515625, 24.145397186279297, 25.858755111694336, 27.572113037109375, 29.285472869873047, 30.998828887939453, 32.712188720703125, 34.42554473876953, 36.1389045715332, 37.85226058959961, 39.56562042236328, 41.27897644042969, 42.99233627319336, 44.70569610595703]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 11.0, 14.0, 19.0, 19.0, 25.0, 38.0, 49.0, 79.0, 84.0, 188.0, 289.0, 547.0, 1215.0, 3433.0, 14126.0, 177643.0, 3953466.0, 33324.0, 6027.0, 1876.0, 809.0, 370.0, 202.0, 124.0, 82.0, 61.0, 42.0, 39.0, 25.0, 14.0, 14.0, 9.0, 3.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-15.3203125, -14.8726806640625, -14.425048828125, -13.9774169921875, -13.52978515625, -13.0821533203125, -12.634521484375, -12.1868896484375, -11.7392578125, -11.2916259765625, -10.843994140625, -10.3963623046875, -9.94873046875, -9.5010986328125, -9.053466796875, -8.6058349609375, -8.158203125, -7.7105712890625, -7.262939453125, -6.8153076171875, -6.36767578125, -5.9200439453125, -5.472412109375, -5.0247802734375, -4.5771484375, -4.1295166015625, -3.681884765625, -3.2342529296875, -2.78662109375, -2.3389892578125, -1.891357421875, -1.4437255859375, -0.99609375, -0.5484619140625, -0.100830078125, 0.3468017578125, 0.79443359375, 1.2420654296875, 1.689697265625, 2.1373291015625, 2.5849609375, 3.0325927734375, 3.480224609375, 3.9278564453125, 4.37548828125, 4.8231201171875, 5.270751953125, 5.7183837890625, 6.166015625, 6.6136474609375, 7.061279296875, 7.5089111328125, 7.95654296875, 8.4041748046875, 8.851806640625, 9.2994384765625, 9.7470703125, 10.1947021484375, 10.642333984375, 11.0899658203125, 11.53759765625, 11.9852294921875, 12.432861328125, 12.8804931640625, 13.328125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 7.0, 6.0, 13.0, 17.0, 18.0, 32.0, 28.0, 29.0, 46.0, 43.0, 71.0, 57.0, 56.0, 59.0, 64.0, 68.0, 57.0, 50.0, 37.0, 45.0, 40.0, 35.0, 31.0, 25.0, 17.0, 16.0, 8.0, 4.0, 11.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.548828125, -3.455780029296875, -3.36273193359375, -3.269683837890625, -3.1766357421875, -3.083587646484375, -2.99053955078125, -2.897491455078125, -2.804443359375, -2.711395263671875, -2.61834716796875, -2.525299072265625, -2.4322509765625, -2.339202880859375, -2.24615478515625, -2.153106689453125, -2.06005859375, -1.967010498046875, -1.87396240234375, -1.780914306640625, -1.6878662109375, -1.594818115234375, -1.50177001953125, -1.408721923828125, -1.315673828125, -1.222625732421875, -1.12957763671875, -1.036529541015625, -0.9434814453125, -0.850433349609375, -0.75738525390625, -0.664337158203125, -0.5712890625, -0.478240966796875, -0.38519287109375, -0.292144775390625, -0.1990966796875, -0.106048583984375, -0.01300048828125, 0.080047607421875, 0.173095703125, 0.266143798828125, 0.35919189453125, 0.452239990234375, 0.5452880859375, 0.638336181640625, 0.73138427734375, 0.824432373046875, 0.91748046875, 1.010528564453125, 1.10357666015625, 1.196624755859375, 1.2896728515625, 1.382720947265625, 1.47576904296875, 1.568817138671875, 1.661865234375, 1.754913330078125, 1.84796142578125, 1.941009521484375, 2.0340576171875, 2.127105712890625, 2.22015380859375, 2.313201904296875, 2.40625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 9.0, 12.0, 14.0, 14.0, 21.0, 23.0, 27.0, 55.0, 79.0, 96.0, 169.0, 214.0, 427.0, 793.0, 1702.0, 4541.0, 16407.0, 135545.0, 3925303.0, 88555.0, 13085.0, 3889.0, 1510.0, 699.0, 390.0, 219.0, 149.0, 115.0, 63.0, 41.0, 28.0, 23.0, 19.0, 14.0, 12.0, 12.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.625, -11.2664794921875, -10.907958984375, -10.5494384765625, -10.19091796875, -9.8323974609375, -9.473876953125, -9.1153564453125, -8.7568359375, -8.3983154296875, -8.039794921875, -7.6812744140625, -7.32275390625, -6.9642333984375, -6.605712890625, -6.2471923828125, -5.888671875, -5.5301513671875, -5.171630859375, -4.8131103515625, -4.45458984375, -4.0960693359375, -3.737548828125, -3.3790283203125, -3.0205078125, -2.6619873046875, -2.303466796875, -1.9449462890625, -1.58642578125, -1.2279052734375, -0.869384765625, -0.5108642578125, -0.15234375, 0.2061767578125, 0.564697265625, 0.9232177734375, 1.28173828125, 1.6402587890625, 1.998779296875, 2.3572998046875, 2.7158203125, 3.0743408203125, 3.432861328125, 3.7913818359375, 4.14990234375, 4.5084228515625, 4.866943359375, 5.2254638671875, 5.583984375, 5.9425048828125, 6.301025390625, 6.6595458984375, 7.01806640625, 7.3765869140625, 7.735107421875, 8.0936279296875, 8.4521484375, 8.8106689453125, 9.169189453125, 9.5277099609375, 9.88623046875, 10.2447509765625, 10.603271484375, 10.9617919921875, 11.3203125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 13.0, 28.0, 33.0, 75.0, 153.0, 1025.0, 2402.0, 184.0, 66.0, 37.0, 22.0, 9.0, 10.0, 8.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -5.26788330078125, -5.0865478515625, -4.90521240234375, -4.723876953125, -4.54254150390625, -4.3612060546875, -4.17987060546875, -3.99853515625, -3.81719970703125, -3.6358642578125, -3.45452880859375, -3.273193359375, -3.09185791015625, -2.9105224609375, -2.72918701171875, -2.5478515625, -2.36651611328125, -2.1851806640625, -2.00384521484375, -1.822509765625, -1.64117431640625, -1.4598388671875, -1.27850341796875, -1.09716796875, -0.91583251953125, -0.7344970703125, -0.55316162109375, -0.371826171875, -0.19049072265625, -0.0091552734375, 0.17218017578125, 0.353515625, 0.53485107421875, 0.7161865234375, 0.89752197265625, 1.078857421875, 1.26019287109375, 1.4415283203125, 1.62286376953125, 1.80419921875, 1.98553466796875, 2.1668701171875, 2.34820556640625, 2.529541015625, 2.71087646484375, 2.8922119140625, 3.07354736328125, 3.2548828125, 3.43621826171875, 3.6175537109375, 3.79888916015625, 3.980224609375, 4.16156005859375, 4.3428955078125, 4.52423095703125, 4.70556640625, 4.88690185546875, 5.0682373046875, 5.24957275390625, 5.430908203125, 5.61224365234375, 5.7935791015625, 5.97491455078125, 6.15625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 9.0, 9.0, 8.0, 17.0, 9.0, 16.0, 20.0, 39.0, 45.0, 54.0, 65.0, 85.0, 74.0, 97.0, 93.0, 90.0, 69.0, 45.0, 48.0, 31.0, 21.0, 10.0, 2.0, 7.0, 4.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.569573402404785, -10.201430320739746, -9.833288192749023, -9.465145111083984, -9.097002029418945, -8.728859901428223, -8.360716819763184, -7.992574214935303, -7.624431610107422, -7.256289005279541, -6.888145923614502, -6.520003318786621, -6.15186071395874, -5.783718109130859, -5.41557502746582, -5.0474324226379395, -4.6792893409729, -4.3111467361450195, -3.9430038928985596, -3.5748610496520996, -3.2067184448242188, -2.838575601577759, -2.470432758331299, -2.102290153503418, -1.734147310256958, -1.3660045862197876, -0.9978618025779724, -0.6297190189361572, -0.2615762948989868, 0.1065664291381836, 0.47470927238464355, 0.8428518772125244, 1.2109947204589844, 1.5791374444961548, 1.9472801685333252, 2.315423011779785, 2.683565616607666, 3.051708459854126, 3.419851303100586, 3.787993907928467, 4.156136512756348, 4.5242791175842285, 4.892422199249268, 5.260564804077148, 5.628707408905029, 5.99685001373291, 6.364993095397949, 6.73313570022583, 7.101278781890869, 7.46942138671875, 7.837564468383789, 8.205707550048828, 8.57384967803955, 8.94199275970459, 9.310134887695312, 9.678277969360352, 10.04642105102539, 10.41456413269043, 10.782706260681152, 11.150849342346191, 11.51899242401123, 11.887134552001953, 12.255277633666992, 12.623420715332031, 12.991562843322754]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 6.0, 8.0, 2.0, 7.0, 12.0, 10.0, 14.0, 17.0, 12.0, 31.0, 18.0, 31.0, 22.0, 24.0, 30.0, 35.0, 36.0, 32.0, 39.0, 44.0, 32.0, 38.0, 36.0, 46.0, 46.0, 40.0, 29.0, 23.0, 33.0, 25.0, 28.0, 26.0, 17.0, 20.0, 18.0, 26.0, 17.0, 13.0, 4.0, 11.0, 9.0, 6.0, 5.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-10.026663780212402, -9.740232467651367, -9.453801155090332, -9.167369842529297, -8.880938529968262, -8.594507217407227, -8.308075904846191, -8.021644592285156, -7.735213756561279, -7.448782444000244, -7.162351131439209, -6.875919818878174, -6.589488983154297, -6.303057670593262, -6.016626358032227, -5.730195045471191, -5.443763732910156, -5.157332420349121, -4.870901107788086, -4.584469795227051, -4.298038482666016, -4.0116071701049805, -3.7251763343811035, -3.4387450218200684, -3.152313709259033, -2.865882396697998, -2.579451084136963, -2.293020009994507, -2.0065886974334717, -1.7201573848724365, -1.433726191520691, -1.1472949981689453, -0.8608627319335938, -0.5744314789772034, -0.288000226020813, -0.0015689730644226074, 0.2848622798919678, 0.5712935924530029, 0.8577247858047485, 1.1441559791564941, 1.4305872917175293, 1.7170186042785645, 2.0034499168395996, 2.2898809909820557, 2.576312303543091, 2.862743616104126, 3.149174690246582, 3.435606002807617, 3.7220373153686523, 4.0084686279296875, 4.294899940490723, 4.581331253051758, 4.867762565612793, 5.154193878173828, 5.440624713897705, 5.72705602645874, 6.013487339019775, 6.2999186515808105, 6.586349964141846, 6.872781276702881, 7.159212112426758, 7.445643424987793, 7.732074737548828, 8.018506050109863, 8.304937362670898]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 13.0, 11.0, 16.0, 24.0, 29.0, 35.0, 53.0, 87.0, 107.0, 157.0, 267.0, 383.0, 648.0, 1114.0, 2193.0, 4545.0, 10869.0, 28020.0, 75785.0, 213372.0, 429625.0, 175640.0, 64363.0, 23455.0, 9074.0, 3993.0, 1942.0, 1042.0, 629.0, 319.0, 217.0, 149.0, 110.0, 73.0, 59.0, 33.0, 27.0, 21.0, 17.0, 14.0, 2.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.20703125, -6.0029296875, -5.798828125, -5.5947265625, -5.390625, -5.1865234375, -4.982421875, -4.7783203125, -4.57421875, -4.3701171875, -4.166015625, -3.9619140625, -3.7578125, -3.5537109375, -3.349609375, -3.1455078125, -2.94140625, -2.7373046875, -2.533203125, -2.3291015625, -2.125, -1.9208984375, -1.716796875, -1.5126953125, -1.30859375, -1.1044921875, -0.900390625, -0.6962890625, -0.4921875, -0.2880859375, -0.083984375, 0.1201171875, 0.32421875, 0.5283203125, 0.732421875, 0.9365234375, 1.140625, 1.3447265625, 1.548828125, 1.7529296875, 1.95703125, 2.1611328125, 2.365234375, 2.5693359375, 2.7734375, 2.9775390625, 3.181640625, 3.3857421875, 3.58984375, 3.7939453125, 3.998046875, 4.2021484375, 4.40625, 4.6103515625, 4.814453125, 5.0185546875, 5.22265625, 5.4267578125, 5.630859375, 5.8349609375, 6.0390625, 6.2431640625, 6.447265625, 6.6513671875, 6.85546875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 8.0, 6.0, 14.0, 13.0, 24.0, 24.0, 31.0, 44.0, 37.0, 48.0, 57.0, 62.0, 68.0, 66.0, 65.0, 53.0, 56.0, 39.0, 46.0, 33.0, 47.0, 31.0, 18.0, 20.0, 23.0, 10.0, 12.0, 11.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.744140625, -3.64990234375, -3.5556640625, -3.46142578125, -3.3671875, -3.27294921875, -3.1787109375, -3.08447265625, -2.990234375, -2.89599609375, -2.8017578125, -2.70751953125, -2.61328125, -2.51904296875, -2.4248046875, -2.33056640625, -2.236328125, -2.14208984375, -2.0478515625, -1.95361328125, -1.859375, -1.76513671875, -1.6708984375, -1.57666015625, -1.482421875, -1.38818359375, -1.2939453125, -1.19970703125, -1.10546875, -1.01123046875, -0.9169921875, -0.82275390625, -0.728515625, -0.63427734375, -0.5400390625, -0.44580078125, -0.3515625, -0.25732421875, -0.1630859375, -0.06884765625, 0.025390625, 0.11962890625, 0.2138671875, 0.30810546875, 0.40234375, 0.49658203125, 0.5908203125, 0.68505859375, 0.779296875, 0.87353515625, 0.9677734375, 1.06201171875, 1.15625, 1.25048828125, 1.3447265625, 1.43896484375, 1.533203125, 1.62744140625, 1.7216796875, 1.81591796875, 1.91015625, 2.00439453125, 2.0986328125, 2.19287109375, 2.287109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 9.0, 7.0, 11.0, 8.0, 33.0, 31.0, 40.0, 63.0, 100.0, 124.0, 189.0, 321.0, 416.0, 721.0, 1250.0, 2492.0, 6664.0, 33924.0, 341985.0, 589775.0, 54742.0, 9145.0, 2930.0, 1421.0, 806.0, 470.0, 300.0, 197.0, 117.0, 92.0, 55.0, 35.0, 28.0, 13.0, 15.0, 9.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.4232177734375, -10.065185546875, -9.7071533203125, -9.34912109375, -8.9910888671875, -8.633056640625, -8.2750244140625, -7.9169921875, -7.5589599609375, -7.200927734375, -6.8428955078125, -6.48486328125, -6.1268310546875, -5.768798828125, -5.4107666015625, -5.052734375, -4.6947021484375, -4.336669921875, -3.9786376953125, -3.62060546875, -3.2625732421875, -2.904541015625, -2.5465087890625, -2.1884765625, -1.8304443359375, -1.472412109375, -1.1143798828125, -0.75634765625, -0.3983154296875, -0.040283203125, 0.3177490234375, 0.67578125, 1.0338134765625, 1.391845703125, 1.7498779296875, 2.10791015625, 2.4659423828125, 2.823974609375, 3.1820068359375, 3.5400390625, 3.8980712890625, 4.256103515625, 4.6141357421875, 4.97216796875, 5.3302001953125, 5.688232421875, 6.0462646484375, 6.404296875, 6.7623291015625, 7.120361328125, 7.4783935546875, 7.83642578125, 8.1944580078125, 8.552490234375, 8.9105224609375, 9.2685546875, 9.6265869140625, 9.984619140625, 10.3426513671875, 10.70068359375, 11.0587158203125, 11.416748046875, 11.7747802734375, 12.1328125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 2.0, 4.0, 4.0, 4.0, 6.0, 19.0, 12.0, 15.0, 26.0, 16.0, 19.0, 34.0, 43.0, 24.0, 40.0, 47.0, 46.0, 48.0, 54.0, 67.0, 52.0, 58.0, 30.0, 42.0, 43.0, 41.0, 36.0, 29.0, 33.0, 17.0, 13.0, 9.0, 15.0, 8.0, 9.0, 15.0, 5.0, 5.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-12.78125, -12.421875, -12.0625, -11.703125, -11.34375, -10.984375, -10.625, -10.265625, -9.90625, -9.546875, -9.1875, -8.828125, -8.46875, -8.109375, -7.75, -7.390625, -7.03125, -6.671875, -6.3125, -5.953125, -5.59375, -5.234375, -4.875, -4.515625, -4.15625, -3.796875, -3.4375, -3.078125, -2.71875, -2.359375, -2.0, -1.640625, -1.28125, -0.921875, -0.5625, -0.203125, 0.15625, 0.515625, 0.875, 1.234375, 1.59375, 1.953125, 2.3125, 2.671875, 3.03125, 3.390625, 3.75, 4.109375, 4.46875, 4.828125, 5.1875, 5.546875, 5.90625, 6.265625, 6.625, 6.984375, 7.34375, 7.703125, 8.0625, 8.421875, 8.78125, 9.140625, 9.5, 9.859375, 10.21875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 1.0, 8.0, 11.0, 9.0, 19.0, 24.0, 42.0, 49.0, 101.0, 130.0, 212.0, 364.0, 686.0, 1275.0, 2814.0, 6715.0, 19998.0, 74010.0, 341192.0, 467184.0, 94411.0, 24648.0, 8120.0, 3199.0, 1449.0, 765.0, 401.0, 248.0, 156.0, 104.0, 55.0, 35.0, 37.0, 23.0, 17.0, 12.0, 8.0, 10.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.759765625, -2.670989990234375, -2.58221435546875, -2.493438720703125, -2.4046630859375, -2.315887451171875, -2.22711181640625, -2.138336181640625, -2.049560546875, -1.960784912109375, -1.87200927734375, -1.783233642578125, -1.6944580078125, -1.605682373046875, -1.51690673828125, -1.428131103515625, -1.33935546875, -1.250579833984375, -1.16180419921875, -1.073028564453125, -0.9842529296875, -0.895477294921875, -0.80670166015625, -0.717926025390625, -0.629150390625, -0.540374755859375, -0.45159912109375, -0.362823486328125, -0.2740478515625, -0.185272216796875, -0.09649658203125, -0.007720947265625, 0.0810546875, 0.169830322265625, 0.25860595703125, 0.347381591796875, 0.4361572265625, 0.524932861328125, 0.61370849609375, 0.702484130859375, 0.791259765625, 0.880035400390625, 0.96881103515625, 1.057586669921875, 1.1463623046875, 1.235137939453125, 1.32391357421875, 1.412689208984375, 1.50146484375, 1.590240478515625, 1.67901611328125, 1.767791748046875, 1.8565673828125, 1.945343017578125, 2.03411865234375, 2.122894287109375, 2.211669921875, 2.300445556640625, 2.38922119140625, 2.477996826171875, 2.5667724609375, 2.655548095703125, 2.74432373046875, 2.833099365234375, 2.921875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 12.0, 13.0, 12.0, 12.0, 13.0, 27.0, 16.0, 26.0, 31.0, 27.0, 48.0, 51.0, 62.0, 91.0, 121.0, 106.0, 57.0, 40.0, 37.0, 21.0, 36.0, 21.0, 18.0, 11.0, 10.0, 11.0, 15.0, 3.0, 8.0, 3.0, 6.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0007367134094238281, -0.0007132813334465027, -0.0006898492574691772, -0.0006664171814918518, -0.0006429851055145264, -0.0006195530295372009, -0.0005961209535598755, -0.00057268887758255, -0.0005492568016052246, -0.0005258247256278992, -0.0005023926496505737, -0.0004789605736732483, -0.00045552849769592285, -0.0004320964217185974, -0.00040866434574127197, -0.00038523226976394653, -0.0003618001937866211, -0.00033836811780929565, -0.0003149360418319702, -0.0002915039658546448, -0.00026807188987731934, -0.0002446398138999939, -0.00022120773792266846, -0.00019777566194534302, -0.00017434358596801758, -0.00015091150999069214, -0.0001274794340133667, -0.00010404735803604126, -8.061528205871582e-05, -5.718320608139038e-05, -3.375113010406494e-05, -1.0319054126739502e-05, 1.3113021850585938e-05, 3.654509782791138e-05, 5.9977173805236816e-05, 8.340924978256226e-05, 0.0001068413257598877, 0.00013027340173721313, 0.00015370547771453857, 0.00017713755369186401, 0.00020056962966918945, 0.0002240017056465149, 0.00024743378162384033, 0.00027086585760116577, 0.0002942979335784912, 0.00031773000955581665, 0.0003411620855331421, 0.00036459416151046753, 0.00038802623748779297, 0.0004114583134651184, 0.00043489038944244385, 0.0004583224654197693, 0.0004817545413970947, 0.0005051866173744202, 0.0005286186933517456, 0.000552050769329071, 0.0005754828453063965, 0.0005989149212837219, 0.0006223469972610474, 0.0006457790732383728, 0.0006692111492156982, 0.0006926432251930237, 0.0007160753011703491, 0.0007395073771476746, 0.000762939453125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 9.0, 12.0, 10.0, 17.0, 21.0, 20.0, 48.0, 50.0, 90.0, 168.0, 236.0, 425.0, 791.0, 1752.0, 4828.0, 20836.0, 154290.0, 710322.0, 128934.0, 18082.0, 4165.0, 1656.0, 752.0, 414.0, 224.0, 155.0, 84.0, 49.0, 44.0, 16.0, 15.0, 10.0, 10.0, 10.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.91796875, -4.79010009765625, -4.6622314453125, -4.53436279296875, -4.406494140625, -4.27862548828125, -4.1507568359375, -4.02288818359375, -3.89501953125, -3.76715087890625, -3.6392822265625, -3.51141357421875, -3.383544921875, -3.25567626953125, -3.1278076171875, -2.99993896484375, -2.8720703125, -2.74420166015625, -2.6163330078125, -2.48846435546875, -2.360595703125, -2.23272705078125, -2.1048583984375, -1.97698974609375, -1.84912109375, -1.72125244140625, -1.5933837890625, -1.46551513671875, -1.337646484375, -1.20977783203125, -1.0819091796875, -0.95404052734375, -0.826171875, -0.69830322265625, -0.5704345703125, -0.44256591796875, -0.314697265625, -0.18682861328125, -0.0589599609375, 0.06890869140625, 0.19677734375, 0.32464599609375, 0.4525146484375, 0.58038330078125, 0.708251953125, 0.83612060546875, 0.9639892578125, 1.09185791015625, 1.2197265625, 1.34759521484375, 1.4754638671875, 1.60333251953125, 1.731201171875, 1.85906982421875, 1.9869384765625, 2.11480712890625, 2.24267578125, 2.37054443359375, 2.4984130859375, 2.62628173828125, 2.754150390625, 2.88201904296875, 3.0098876953125, 3.13775634765625, 3.265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 11.0, 15.0, 12.0, 13.0, 16.0, 16.0, 29.0, 29.0, 48.0, 52.0, 75.0, 88.0, 85.0, 85.0, 86.0, 77.0, 65.0, 45.0, 36.0, 28.0, 23.0, 13.0, 16.0, 13.0, 6.0, 5.0, 9.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.54296875, -4.43560791015625, -4.3282470703125, -4.22088623046875, -4.113525390625, -4.00616455078125, -3.8988037109375, -3.79144287109375, -3.68408203125, -3.57672119140625, -3.4693603515625, -3.36199951171875, -3.254638671875, -3.14727783203125, -3.0399169921875, -2.93255615234375, -2.8251953125, -2.71783447265625, -2.6104736328125, -2.50311279296875, -2.395751953125, -2.28839111328125, -2.1810302734375, -2.07366943359375, -1.96630859375, -1.85894775390625, -1.7515869140625, -1.64422607421875, -1.536865234375, -1.42950439453125, -1.3221435546875, -1.21478271484375, -1.107421875, -1.00006103515625, -0.8927001953125, -0.78533935546875, -0.677978515625, -0.57061767578125, -0.4632568359375, -0.35589599609375, -0.24853515625, -0.14117431640625, -0.0338134765625, 0.07354736328125, 0.180908203125, 0.28826904296875, 0.3956298828125, 0.50299072265625, 0.6103515625, 0.71771240234375, 0.8250732421875, 0.93243408203125, 1.039794921875, 1.14715576171875, 1.2545166015625, 1.36187744140625, 1.46923828125, 1.57659912109375, 1.6839599609375, 1.79132080078125, 1.898681640625, 2.00604248046875, 2.1134033203125, 2.22076416015625, 2.328125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 15.0, 19.0, 35.0, 48.0, 74.0, 91.0, 113.0, 123.0, 110.0, 100.0, 81.0, 59.0, 43.0, 24.0, 18.0, 14.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-64.60453033447266, -62.79473114013672, -60.98493576049805, -59.17513656616211, -57.36534118652344, -55.5555419921875, -53.74574279785156, -51.93594741821289, -50.12615203857422, -48.31635284423828, -46.50655746459961, -44.69675827026367, -42.886962890625, -41.07716369628906, -39.267364501953125, -37.45756912231445, -35.647769927978516, -33.83797073364258, -32.028175354003906, -30.21837615966797, -28.408580780029297, -26.59878158569336, -24.788984298706055, -22.97918701171875, -21.169389724731445, -19.35959243774414, -17.549795150756836, -15.739996910095215, -13.93019962310791, -12.120402336120605, -10.310604095458984, -8.50080680847168, -6.691009521484375, -4.88121223449707, -3.0714144706726074, -1.2616167068481445, 0.5481805801391602, 2.357977867126465, 4.167776107788086, 5.977573394775391, 7.787370681762695, 9.59716796875, 11.406965255737305, 13.216763496398926, 15.02656078338623, 16.83635711669922, 18.646156311035156, 20.45595359802246, 22.265750885009766, 24.07554817199707, 25.885345458984375, 27.695144653320312, 29.504940032958984, 31.314739227294922, 33.124534606933594, 34.93433380126953, 36.74413299560547, 38.553932189941406, 40.36372756958008, 42.173526763916016, 43.98332214355469, 45.793121337890625, 47.60292053222656, 49.412715911865234, 51.222511291503906]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 8.0, 5.0, 9.0, 10.0, 12.0, 13.0, 16.0, 24.0, 30.0, 27.0, 36.0, 28.0, 55.0, 37.0, 32.0, 45.0, 65.0, 60.0, 57.0, 51.0, 44.0, 46.0, 52.0, 47.0, 29.0, 25.0, 21.0, 14.0, 18.0, 16.0, 16.0, 10.0, 5.0, 7.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-54.771141052246094, -53.17585754394531, -51.5805778503418, -49.985294342041016, -48.390010833740234, -46.79473114013672, -45.19944763183594, -43.604164123535156, -42.008880615234375, -40.413597106933594, -38.81831741333008, -37.2230339050293, -35.627750396728516, -34.032470703125, -32.43718719482422, -30.841903686523438, -29.246623992919922, -27.651342391967773, -26.056058883666992, -24.460777282714844, -22.865493774414062, -21.270212173461914, -19.674930572509766, -18.079647064208984, -16.484365463256836, -14.889082908630371, -13.293800354003906, -11.698518753051758, -10.103236198425293, -8.507953643798828, -6.91267204284668, -5.317389488220215, -3.72210693359375, -2.1268246173858643, -0.5315423011779785, 1.0637397766113281, 2.659022331237793, 4.254304885864258, 5.849586486816406, 7.444869041442871, 9.040151596069336, 10.6354341506958, 12.230716705322266, 13.825998306274414, 15.421280860900879, 17.016563415527344, 18.611845016479492, 20.20712661743164, 21.802410125732422, 23.39769172668457, 24.99297523498535, 26.5882568359375, 28.18354034423828, 29.77882194519043, 31.374103546142578, 32.96938705444336, 34.564666748046875, 36.159950256347656, 37.75522994995117, 39.35051345825195, 40.945796966552734, 42.54107666015625, 44.13636016845703, 45.73164367675781, 47.326927185058594]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 5.0, 9.0, 9.0, 19.0, 14.0, 18.0, 27.0, 42.0, 69.0, 100.0, 144.0, 253.0, 350.0, 596.0, 1064.0, 1830.0, 3354.0, 6988.0, 16220.0, 46969.0, 220244.0, 2678325.0, 1050765.0, 113437.0, 30639.0, 11521.0, 5262.0, 2581.0, 1350.0, 798.0, 453.0, 303.0, 170.0, 113.0, 59.0, 63.0, 32.0, 17.0, 15.0, 18.0, 8.0, 7.0, 8.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0], "bins": [-5.90234375, -5.74200439453125, -5.5816650390625, -5.42132568359375, -5.260986328125, -5.10064697265625, -4.9403076171875, -4.77996826171875, -4.61962890625, -4.45928955078125, -4.2989501953125, -4.13861083984375, -3.978271484375, -3.81793212890625, -3.6575927734375, -3.49725341796875, -3.3369140625, -3.17657470703125, -3.0162353515625, -2.85589599609375, -2.695556640625, -2.53521728515625, -2.3748779296875, -2.21453857421875, -2.05419921875, -1.89385986328125, -1.7335205078125, -1.57318115234375, -1.412841796875, -1.25250244140625, -1.0921630859375, -0.93182373046875, -0.771484375, -0.61114501953125, -0.4508056640625, -0.29046630859375, -0.130126953125, 0.03021240234375, 0.1905517578125, 0.35089111328125, 0.51123046875, 0.67156982421875, 0.8319091796875, 0.99224853515625, 1.152587890625, 1.31292724609375, 1.4732666015625, 1.63360595703125, 1.7939453125, 1.95428466796875, 2.1146240234375, 2.27496337890625, 2.435302734375, 2.59564208984375, 2.7559814453125, 2.91632080078125, 3.07666015625, 3.23699951171875, 3.3973388671875, 3.55767822265625, 3.718017578125, 3.87835693359375, 4.0386962890625, 4.19903564453125, 4.359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 8.0, 8.0, 12.0, 9.0, 10.0, 25.0, 25.0, 35.0, 41.0, 41.0, 57.0, 79.0, 75.0, 63.0, 75.0, 75.0, 63.0, 52.0, 55.0, 42.0, 35.0, 35.0, 27.0, 16.0, 14.0, 11.0, 6.0, 2.0, 5.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.37109375, -4.269775390625, -4.16845703125, -4.067138671875, -3.9658203125, -3.864501953125, -3.76318359375, -3.661865234375, -3.560546875, -3.459228515625, -3.35791015625, -3.256591796875, -3.1552734375, -3.053955078125, -2.95263671875, -2.851318359375, -2.75, -2.648681640625, -2.54736328125, -2.446044921875, -2.3447265625, -2.243408203125, -2.14208984375, -2.040771484375, -1.939453125, -1.838134765625, -1.73681640625, -1.635498046875, -1.5341796875, -1.432861328125, -1.33154296875, -1.230224609375, -1.12890625, -1.027587890625, -0.92626953125, -0.824951171875, -0.7236328125, -0.622314453125, -0.52099609375, -0.419677734375, -0.318359375, -0.217041015625, -0.11572265625, -0.014404296875, 0.0869140625, 0.188232421875, 0.28955078125, 0.390869140625, 0.4921875, 0.593505859375, 0.69482421875, 0.796142578125, 0.8974609375, 0.998779296875, 1.10009765625, 1.201416015625, 1.302734375, 1.404052734375, 1.50537109375, 1.606689453125, 1.7080078125, 1.809326171875, 1.91064453125, 2.011962890625, 2.11328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 3.0, 15.0, 11.0, 24.0, 30.0, 40.0, 77.0, 116.0, 191.0, 376.0, 713.0, 1493.0, 3838.0, 10299.0, 35318.0, 190776.0, 3139995.0, 710413.0, 71911.0, 18073.0, 5994.0, 2301.0, 1054.0, 512.0, 267.0, 140.0, 99.0, 64.0, 42.0, 14.0, 19.0, 21.0, 15.0, 4.0, 5.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.578125, -7.353515625, -7.12890625, -6.904296875, -6.6796875, -6.455078125, -6.23046875, -6.005859375, -5.78125, -5.556640625, -5.33203125, -5.107421875, -4.8828125, -4.658203125, -4.43359375, -4.208984375, -3.984375, -3.759765625, -3.53515625, -3.310546875, -3.0859375, -2.861328125, -2.63671875, -2.412109375, -2.1875, -1.962890625, -1.73828125, -1.513671875, -1.2890625, -1.064453125, -0.83984375, -0.615234375, -0.390625, -0.166015625, 0.05859375, 0.283203125, 0.5078125, 0.732421875, 0.95703125, 1.181640625, 1.40625, 1.630859375, 1.85546875, 2.080078125, 2.3046875, 2.529296875, 2.75390625, 2.978515625, 3.203125, 3.427734375, 3.65234375, 3.876953125, 4.1015625, 4.326171875, 4.55078125, 4.775390625, 5.0, 5.224609375, 5.44921875, 5.673828125, 5.8984375, 6.123046875, 6.34765625, 6.572265625, 6.796875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 6.0, 8.0, 2.0, 8.0, 15.0, 11.0, 14.0, 29.0, 33.0, 38.0, 63.0, 110.0, 162.0, 280.0, 488.0, 823.0, 825.0, 458.0, 241.0, 135.0, 103.0, 56.0, 36.0, 32.0, 24.0, 14.0, 10.0, 11.0, 10.0, 6.0, 7.0, 2.0, 6.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.11676025390625, -5.8975830078125, -5.67840576171875, -5.459228515625, -5.24005126953125, -5.0208740234375, -4.80169677734375, -4.58251953125, -4.36334228515625, -4.1441650390625, -3.92498779296875, -3.705810546875, -3.48663330078125, -3.2674560546875, -3.04827880859375, -2.8291015625, -2.60992431640625, -2.3907470703125, -2.17156982421875, -1.952392578125, -1.73321533203125, -1.5140380859375, -1.29486083984375, -1.07568359375, -0.85650634765625, -0.6373291015625, -0.41815185546875, -0.198974609375, 0.02020263671875, 0.2393798828125, 0.45855712890625, 0.677734375, 0.89691162109375, 1.1160888671875, 1.33526611328125, 1.554443359375, 1.77362060546875, 1.9927978515625, 2.21197509765625, 2.43115234375, 2.65032958984375, 2.8695068359375, 3.08868408203125, 3.307861328125, 3.52703857421875, 3.7462158203125, 3.96539306640625, 4.1845703125, 4.40374755859375, 4.6229248046875, 4.84210205078125, 5.061279296875, 5.28045654296875, 5.4996337890625, 5.71881103515625, 5.93798828125, 6.15716552734375, 6.3763427734375, 6.59552001953125, 6.814697265625, 7.03387451171875, 7.2530517578125, 7.47222900390625, 7.69140625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 10.0, 14.0, 22.0, 53.0, 76.0, 133.0, 168.0, 174.0, 126.0, 101.0, 51.0, 23.0, 14.0, 10.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-52.672786712646484, -50.492698669433594, -48.31261444091797, -46.13252639770508, -43.95243835449219, -41.7723503112793, -39.592262268066406, -37.41217803955078, -35.23208999633789, -33.052001953125, -30.871915817260742, -28.691829681396484, -26.511741638183594, -24.331653594970703, -22.151567459106445, -19.971481323242188, -17.791393280029297, -15.611306190490723, -13.431219100952148, -11.251132011413574, -9.071044921875, -6.890957832336426, -4.710870742797852, -2.5307836532592773, -0.3506965637207031, 1.829390525817871, 4.009477615356445, 6.1895647048950195, 8.369651794433594, 10.549738883972168, 12.729825973510742, 14.909913063049316, 17.089996337890625, 19.270084381103516, 21.450170516967773, 23.63025665283203, 25.810344696044922, 27.990432739257812, 30.17051887512207, 32.35060501098633, 34.53069305419922, 36.71078109741211, 38.890869140625, 41.070953369140625, 43.251041412353516, 45.431129455566406, 47.61121368408203, 49.79130172729492, 51.97138977050781, 54.1514778137207, 56.331565856933594, 58.51165008544922, 60.69173812866211, 62.871826171875, 65.05191040039062, 67.23200225830078, 69.4120864868164, 71.59217071533203, 73.77226257324219, 75.95234680175781, 78.13243103027344, 80.3125228881836, 82.49260711669922, 84.67269897460938, 86.852783203125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 6.0, 7.0, 11.0, 12.0, 21.0, 19.0, 12.0, 31.0, 17.0, 37.0, 32.0, 34.0, 59.0, 42.0, 39.0, 44.0, 37.0, 44.0, 50.0, 48.0, 40.0, 42.0, 49.0, 30.0, 30.0, 30.0, 33.0, 24.0, 27.0, 23.0, 8.0, 16.0, 11.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.845794677734375, -27.835613250732422, -26.825429916381836, -25.81524658203125, -24.805065155029297, -23.794883728027344, -22.784700393676758, -21.774517059326172, -20.76433563232422, -19.754154205322266, -18.74397087097168, -17.733787536621094, -16.72360610961914, -15.713423728942871, -14.703241348266602, -13.693058967590332, -12.682876586914062, -11.672694206237793, -10.662511825561523, -9.652329444885254, -8.642147064208984, -7.631964683532715, -6.621782302856445, -5.611599922180176, -4.601417541503906, -3.5912351608276367, -2.581052780151367, -1.5708703994750977, -0.5606880187988281, 0.4494943618774414, 1.459676742553711, 2.4698591232299805, 3.4800453186035156, 4.490227699279785, 5.500410079956055, 6.510592460632324, 7.520774841308594, 8.530957221984863, 9.541139602661133, 10.551321983337402, 11.561504364013672, 12.571686744689941, 13.581869125366211, 14.59205150604248, 15.60223388671875, 16.612415313720703, 17.62259864807129, 18.632781982421875, 19.642963409423828, 20.65314483642578, 21.663328170776367, 22.673511505126953, 23.683692932128906, 24.69387435913086, 25.704057693481445, 26.71424102783203, 27.724422454833984, 28.734603881835938, 29.744787216186523, 30.75497055053711, 31.765151977539062, 32.775333404541016, 33.78551483154297, 34.79570007324219, 35.80588150024414]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 17.0, 23.0, 34.0, 69.0, 78.0, 113.0, 150.0, 244.0, 393.0, 600.0, 995.0, 1541.0, 2594.0, 4661.0, 8018.0, 15337.0, 29188.0, 61649.0, 151619.0, 380180.0, 225738.0, 83726.0, 38378.0, 19186.0, 10114.0, 5618.0, 3188.0, 1903.0, 1157.0, 700.0, 401.0, 280.0, 230.0, 126.0, 86.0, 74.0, 44.0, 33.0, 17.0, 17.0, 6.0, 7.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.8515625, -4.703125, -4.5546875, -4.40625, -4.2578125, -4.109375, -3.9609375, -3.8125, -3.6640625, -3.515625, -3.3671875, -3.21875, -3.0703125, -2.921875, -2.7734375, -2.625, -2.4765625, -2.328125, -2.1796875, -2.03125, -1.8828125, -1.734375, -1.5859375, -1.4375, -1.2890625, -1.140625, -0.9921875, -0.84375, -0.6953125, -0.546875, -0.3984375, -0.25, -0.1015625, 0.046875, 0.1953125, 0.34375, 0.4921875, 0.640625, 0.7890625, 0.9375, 1.0859375, 1.234375, 1.3828125, 1.53125, 1.6796875, 1.828125, 1.9765625, 2.125, 2.2734375, 2.421875, 2.5703125, 2.71875, 2.8671875, 3.015625, 3.1640625, 3.3125, 3.4609375, 3.609375, 3.7578125, 3.90625, 4.0546875, 4.203125, 4.3515625, 4.5]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 4.0, 10.0, 10.0, 15.0, 16.0, 15.0, 24.0, 23.0, 29.0, 29.0, 14.0, 43.0, 39.0, 49.0, 42.0, 46.0, 53.0, 54.0, 44.0, 36.0, 40.0, 38.0, 38.0, 33.0, 40.0, 30.0, 28.0, 13.0, 26.0, 18.0, 11.0, 15.0, 14.0, 9.0, 14.0, 6.0, 8.0, 8.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.314453125, -2.249755859375, -2.18505859375, -2.120361328125, -2.0556640625, -1.990966796875, -1.92626953125, -1.861572265625, -1.796875, -1.732177734375, -1.66748046875, -1.602783203125, -1.5380859375, -1.473388671875, -1.40869140625, -1.343994140625, -1.279296875, -1.214599609375, -1.14990234375, -1.085205078125, -1.0205078125, -0.955810546875, -0.89111328125, -0.826416015625, -0.76171875, -0.697021484375, -0.63232421875, -0.567626953125, -0.5029296875, -0.438232421875, -0.37353515625, -0.308837890625, -0.244140625, -0.179443359375, -0.11474609375, -0.050048828125, 0.0146484375, 0.079345703125, 0.14404296875, 0.208740234375, 0.2734375, 0.338134765625, 0.40283203125, 0.467529296875, 0.5322265625, 0.596923828125, 0.66162109375, 0.726318359375, 0.791015625, 0.855712890625, 0.92041015625, 0.985107421875, 1.0498046875, 1.114501953125, 1.17919921875, 1.243896484375, 1.30859375, 1.373291015625, 1.43798828125, 1.502685546875, 1.5673828125, 1.632080078125, 1.69677734375, 1.761474609375, 1.826171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 10.0, 12.0, 26.0, 24.0, 35.0, 59.0, 107.0, 132.0, 231.0, 339.0, 592.0, 1050.0, 2193.0, 6637.0, 32034.0, 426117.0, 531768.0, 35208.0, 6879.0, 2363.0, 1124.0, 567.0, 344.0, 237.0, 144.0, 95.0, 69.0, 52.0, 27.0, 24.0, 11.0, 13.0, 12.0, 11.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1484375, -10.7642822265625, -10.380126953125, -9.9959716796875, -9.61181640625, -9.2276611328125, -8.843505859375, -8.4593505859375, -8.0751953125, -7.6910400390625, -7.306884765625, -6.9227294921875, -6.53857421875, -6.1544189453125, -5.770263671875, -5.3861083984375, -5.001953125, -4.6177978515625, -4.233642578125, -3.8494873046875, -3.46533203125, -3.0811767578125, -2.697021484375, -2.3128662109375, -1.9287109375, -1.5445556640625, -1.160400390625, -0.7762451171875, -0.39208984375, -0.0079345703125, 0.376220703125, 0.7603759765625, 1.14453125, 1.5286865234375, 1.912841796875, 2.2969970703125, 2.68115234375, 3.0653076171875, 3.449462890625, 3.8336181640625, 4.2177734375, 4.6019287109375, 4.986083984375, 5.3702392578125, 5.75439453125, 6.1385498046875, 6.522705078125, 6.9068603515625, 7.291015625, 7.6751708984375, 8.059326171875, 8.4434814453125, 8.82763671875, 9.2117919921875, 9.595947265625, 9.9801025390625, 10.3642578125, 10.7484130859375, 11.132568359375, 11.5167236328125, 11.90087890625, 12.2850341796875, 12.669189453125, 13.0533447265625, 13.4375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 4.0, 8.0, 8.0, 14.0, 10.0, 4.0, 12.0, 16.0, 18.0, 32.0, 29.0, 35.0, 30.0, 33.0, 30.0, 45.0, 50.0, 53.0, 53.0, 49.0, 37.0, 39.0, 47.0, 41.0, 41.0, 34.0, 27.0, 26.0, 29.0, 20.0, 24.0, 21.0, 12.0, 17.0, 9.0, 9.0, 8.0, 4.0, 11.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.484375, -8.185546875, -7.88671875, -7.587890625, -7.2890625, -6.990234375, -6.69140625, -6.392578125, -6.09375, -5.794921875, -5.49609375, -5.197265625, -4.8984375, -4.599609375, -4.30078125, -4.001953125, -3.703125, -3.404296875, -3.10546875, -2.806640625, -2.5078125, -2.208984375, -1.91015625, -1.611328125, -1.3125, -1.013671875, -0.71484375, -0.416015625, -0.1171875, 0.181640625, 0.48046875, 0.779296875, 1.078125, 1.376953125, 1.67578125, 1.974609375, 2.2734375, 2.572265625, 2.87109375, 3.169921875, 3.46875, 3.767578125, 4.06640625, 4.365234375, 4.6640625, 4.962890625, 5.26171875, 5.560546875, 5.859375, 6.158203125, 6.45703125, 6.755859375, 7.0546875, 7.353515625, 7.65234375, 7.951171875, 8.25, 8.548828125, 8.84765625, 9.146484375, 9.4453125, 9.744140625, 10.04296875, 10.341796875, 10.640625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 5.0, 5.0, 8.0, 13.0, 12.0, 19.0, 45.0, 75.0, 118.0, 224.0, 470.0, 1097.0, 3009.0, 10424.0, 52804.0, 604432.0, 326431.0, 37333.0, 7866.0, 2436.0, 890.0, 391.0, 192.0, 96.0, 48.0, 40.0, 31.0, 8.0, 16.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.22869873046875, -4.0823974609375, -3.93609619140625, -3.789794921875, -3.64349365234375, -3.4971923828125, -3.35089111328125, -3.20458984375, -3.05828857421875, -2.9119873046875, -2.76568603515625, -2.619384765625, -2.47308349609375, -2.3267822265625, -2.18048095703125, -2.0341796875, -1.88787841796875, -1.7415771484375, -1.59527587890625, -1.448974609375, -1.30267333984375, -1.1563720703125, -1.01007080078125, -0.86376953125, -0.71746826171875, -0.5711669921875, -0.42486572265625, -0.278564453125, -0.13226318359375, 0.0140380859375, 0.16033935546875, 0.306640625, 0.45294189453125, 0.5992431640625, 0.74554443359375, 0.891845703125, 1.03814697265625, 1.1844482421875, 1.33074951171875, 1.47705078125, 1.62335205078125, 1.7696533203125, 1.91595458984375, 2.062255859375, 2.20855712890625, 2.3548583984375, 2.50115966796875, 2.6474609375, 2.79376220703125, 2.9400634765625, 3.08636474609375, 3.232666015625, 3.37896728515625, 3.5252685546875, 3.67156982421875, 3.81787109375, 3.96417236328125, 4.1104736328125, 4.25677490234375, 4.403076171875, 4.54937744140625, 4.6956787109375, 4.84197998046875, 4.98828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 9.0, 10.0, 10.0, 22.0, 24.0, 20.0, 34.0, 50.0, 78.0, 172.0, 176.0, 127.0, 77.0, 35.0, 36.0, 28.0, 15.0, 14.0, 7.0, 14.0, 12.0, 2.0, 7.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012636184692382812, -0.0012267082929611206, -0.00118979811668396, -0.0011528879404067993, -0.0011159777641296387, -0.001079067587852478, -0.0010421574115753174, -0.0010052472352981567, -0.0009683370590209961, -0.0009314268827438354, -0.0008945167064666748, -0.0008576065301895142, -0.0008206963539123535, -0.0007837861776351929, -0.0007468760013580322, -0.0007099658250808716, -0.0006730556488037109, -0.0006361454725265503, -0.0005992352962493896, -0.000562325119972229, -0.0005254149436950684, -0.0004885047674179077, -0.00045159459114074707, -0.0004146844148635864, -0.0003777742385864258, -0.00034086406230926514, -0.0003039538860321045, -0.00026704370975494385, -0.0002301335334777832, -0.00019322335720062256, -0.00015631318092346191, -0.00011940300464630127, -8.249282836914062e-05, -4.558265209197998e-05, -8.672475814819336e-06, 2.823770046234131e-05, 6.514787673950195e-05, 0.0001020580530166626, 0.00013896822929382324, 0.0001758784055709839, 0.00021278858184814453, 0.0002496987581253052, 0.0002866089344024658, 0.00032351911067962646, 0.0003604292869567871, 0.00039733946323394775, 0.0004342496395111084, 0.00047115981578826904, 0.0005080699920654297, 0.0005449801683425903, 0.000581890344619751, 0.0006188005208969116, 0.0006557106971740723, 0.0006926208734512329, 0.0007295310497283936, 0.0007664412260055542, 0.0008033514022827148, 0.0008402615785598755, 0.0008771717548370361, 0.0009140819311141968, 0.0009509921073913574, 0.000987902283668518, 0.0010248124599456787, 0.0010617226362228394, 0.0010986328125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 4.0, 8.0, 16.0, 24.0, 34.0, 55.0, 64.0, 103.0, 169.0, 316.0, 449.0, 827.0, 1736.0, 3942.0, 12170.0, 56930.0, 503435.0, 398520.0, 51186.0, 11181.0, 3657.0, 1627.0, 834.0, 449.0, 271.0, 185.0, 119.0, 75.0, 43.0, 37.0, 29.0, 12.0, 17.0, 8.0, 5.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.3359375, -4.211944580078125, -4.08795166015625, -3.963958740234375, -3.8399658203125, -3.715972900390625, -3.59197998046875, -3.467987060546875, -3.343994140625, -3.220001220703125, -3.09600830078125, -2.972015380859375, -2.8480224609375, -2.724029541015625, -2.60003662109375, -2.476043701171875, -2.35205078125, -2.228057861328125, -2.10406494140625, -1.980072021484375, -1.8560791015625, -1.732086181640625, -1.60809326171875, -1.484100341796875, -1.360107421875, -1.236114501953125, -1.11212158203125, -0.988128662109375, -0.8641357421875, -0.740142822265625, -0.61614990234375, -0.492156982421875, -0.3681640625, -0.244171142578125, -0.12017822265625, 0.003814697265625, 0.1278076171875, 0.251800537109375, 0.37579345703125, 0.499786376953125, 0.623779296875, 0.747772216796875, 0.87176513671875, 0.995758056640625, 1.1197509765625, 1.243743896484375, 1.36773681640625, 1.491729736328125, 1.61572265625, 1.739715576171875, 1.86370849609375, 1.987701416015625, 2.1116943359375, 2.235687255859375, 2.35968017578125, 2.483673095703125, 2.607666015625, 2.731658935546875, 2.85565185546875, 2.979644775390625, 3.1036376953125, 3.227630615234375, 3.35162353515625, 3.475616455078125, 3.599609375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 7.0, 3.0, 5.0, 7.0, 10.0, 10.0, 16.0, 14.0, 14.0, 22.0, 26.0, 27.0, 28.0, 42.0, 50.0, 46.0, 70.0, 71.0, 87.0, 62.0, 68.0, 52.0, 59.0, 34.0, 41.0, 29.0, 17.0, 19.0, 10.0, 8.0, 13.0, 8.0, 8.0, 5.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.68328857421875, -2.5970458984375, -2.51080322265625, -2.424560546875, -2.33831787109375, -2.2520751953125, -2.16583251953125, -2.07958984375, -1.99334716796875, -1.9071044921875, -1.82086181640625, -1.734619140625, -1.64837646484375, -1.5621337890625, -1.47589111328125, -1.3896484375, -1.30340576171875, -1.2171630859375, -1.13092041015625, -1.044677734375, -0.95843505859375, -0.8721923828125, -0.78594970703125, -0.69970703125, -0.61346435546875, -0.5272216796875, -0.44097900390625, -0.354736328125, -0.26849365234375, -0.1822509765625, -0.09600830078125, -0.009765625, 0.07647705078125, 0.1627197265625, 0.24896240234375, 0.335205078125, 0.42144775390625, 0.5076904296875, 0.59393310546875, 0.68017578125, 0.76641845703125, 0.8526611328125, 0.93890380859375, 1.025146484375, 1.11138916015625, 1.1976318359375, 1.28387451171875, 1.3701171875, 1.45635986328125, 1.5426025390625, 1.62884521484375, 1.715087890625, 1.80133056640625, 1.8875732421875, 1.97381591796875, 2.06005859375, 2.14630126953125, 2.2325439453125, 2.31878662109375, 2.405029296875, 2.49127197265625, 2.5775146484375, 2.66375732421875, 2.75]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 13.0, 22.0, 39.0, 88.0, 122.0, 182.0, 187.0, 127.0, 88.0, 58.0, 22.0, 17.0, 8.0, 7.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-88.24029541015625, -85.86024475097656, -83.48018646240234, -81.10013580322266, -78.72007751464844, -76.34002685546875, -73.95996856689453, -71.57991790771484, -69.19985961914062, -66.81980895996094, -64.43975067138672, -62.059696197509766, -59.67964172363281, -57.29958724975586, -54.919532775878906, -52.53948211669922, -50.159427642822266, -47.77937316894531, -45.39931869506836, -43.019264221191406, -40.63920974731445, -38.2591552734375, -35.87910461425781, -33.499046325683594, -31.118993759155273, -28.73893928527832, -26.358884811401367, -23.978832244873047, -21.598777770996094, -19.21872329711914, -16.838668823242188, -14.458614349365234, -12.078559875488281, -9.698505401611328, -7.318451404571533, -4.938397407531738, -2.558342933654785, -0.17828845977783203, 2.2017650604248047, 4.581819534301758, 6.961874008178711, 9.341928482055664, 11.721982955932617, 14.102036476135254, 16.48208999633789, 18.862144470214844, 21.242198944091797, 23.62225341796875, 26.002307891845703, 28.382362365722656, 30.76241683959961, 33.14247131347656, 35.522525787353516, 37.90258026123047, 40.282630920410156, 42.662689208984375, 45.04273986816406, 47.422794342041016, 49.80284881591797, 52.18290328979492, 54.562957763671875, 56.94301223754883, 59.32306671142578, 61.70311737060547, 64.08317565917969]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 5.0, 9.0, 7.0, 13.0, 11.0, 18.0, 13.0, 25.0, 30.0, 27.0, 32.0, 41.0, 24.0, 50.0, 48.0, 48.0, 55.0, 57.0, 70.0, 44.0, 39.0, 34.0, 31.0, 27.0, 37.0, 44.0, 28.0, 19.0, 22.0, 16.0, 19.0, 12.0, 5.0, 6.0, 9.0, 11.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.08901023864746, -29.91200828552246, -28.735004425048828, -27.558002471923828, -26.381000518798828, -25.203998565673828, -24.026994705200195, -22.849992752075195, -21.672988891601562, -20.495986938476562, -19.31898307800293, -18.14198112487793, -16.96497917175293, -15.787976264953613, -14.610973358154297, -13.433971405029297, -12.256969451904297, -11.07996654510498, -9.90296459197998, -8.725961685180664, -7.548959255218506, -6.371956825256348, -5.194953918457031, -4.017951965332031, -2.840949058532715, -1.663946509361267, -0.48694396018981934, 0.690058708190918, 1.8670611381530762, 3.0440635681152344, 4.221066474914551, 5.398068428039551, 6.575069427490234, 7.752071857452393, 8.92907428741455, 10.106077194213867, 11.283079147338867, 12.460082054138184, 13.6370849609375, 14.8140869140625, 15.991089820861816, 17.168092727661133, 18.345094680786133, 19.522098541259766, 20.699100494384766, 21.876102447509766, 23.053104400634766, 24.230106353759766, 25.4071102142334, 26.5841121673584, 27.76111602783203, 28.93811798095703, 30.11511993408203, 31.29212188720703, 32.46912384033203, 33.64612579345703, 34.8231315612793, 36.0001335144043, 37.1771354675293, 38.35414123535156, 39.53114318847656, 40.70814514160156, 41.88514709472656, 43.06214904785156, 44.23915100097656]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 8.0, 7.0, 17.0, 16.0, 30.0, 42.0, 61.0, 90.0, 173.0, 464.0, 2495.0, 44708.0, 4074510.0, 67563.0, 3063.0, 542.0, 167.0, 101.0, 60.0, 55.0, 32.0, 10.0, 17.0, 17.0, 8.0, 7.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0625, -14.4951171875, -13.927734375, -13.3603515625, -12.79296875, -12.2255859375, -11.658203125, -11.0908203125, -10.5234375, -9.9560546875, -9.388671875, -8.8212890625, -8.25390625, -7.6865234375, -7.119140625, -6.5517578125, -5.984375, -5.4169921875, -4.849609375, -4.2822265625, -3.71484375, -3.1474609375, -2.580078125, -2.0126953125, -1.4453125, -0.8779296875, -0.310546875, 0.2568359375, 0.82421875, 1.3916015625, 1.958984375, 2.5263671875, 3.09375, 3.6611328125, 4.228515625, 4.7958984375, 5.36328125, 5.9306640625, 6.498046875, 7.0654296875, 7.6328125, 8.2001953125, 8.767578125, 9.3349609375, 9.90234375, 10.4697265625, 11.037109375, 11.6044921875, 12.171875, 12.7392578125, 13.306640625, 13.8740234375, 14.44140625, 15.0087890625, 15.576171875, 16.1435546875, 16.7109375, 17.2783203125, 17.845703125, 18.4130859375, 18.98046875, 19.5478515625, 20.115234375, 20.6826171875, 21.25]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 3.0, 8.0, 17.0, 15.0, 13.0, 16.0, 21.0, 27.0, 23.0, 34.0, 44.0, 46.0, 51.0, 46.0, 44.0, 51.0, 49.0, 39.0, 50.0, 43.0, 44.0, 45.0, 27.0, 48.0, 29.0, 24.0, 26.0, 18.0, 17.0, 15.0, 11.0, 8.0, 10.0, 1.0, 6.0, 8.0, 1.0, 5.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.974609375, -1.90997314453125, -1.8453369140625, -1.78070068359375, -1.716064453125, -1.65142822265625, -1.5867919921875, -1.52215576171875, -1.45751953125, -1.39288330078125, -1.3282470703125, -1.26361083984375, -1.198974609375, -1.13433837890625, -1.0697021484375, -1.00506591796875, -0.9404296875, -0.87579345703125, -0.8111572265625, -0.74652099609375, -0.681884765625, -0.61724853515625, -0.5526123046875, -0.48797607421875, -0.42333984375, -0.35870361328125, -0.2940673828125, -0.22943115234375, -0.164794921875, -0.10015869140625, -0.0355224609375, 0.02911376953125, 0.09375, 0.15838623046875, 0.2230224609375, 0.28765869140625, 0.352294921875, 0.41693115234375, 0.4815673828125, 0.54620361328125, 0.61083984375, 0.67547607421875, 0.7401123046875, 0.80474853515625, 0.869384765625, 0.93402099609375, 0.9986572265625, 1.06329345703125, 1.1279296875, 1.19256591796875, 1.2572021484375, 1.32183837890625, 1.386474609375, 1.45111083984375, 1.5157470703125, 1.58038330078125, 1.64501953125, 1.70965576171875, 1.7742919921875, 1.83892822265625, 1.903564453125, 1.96820068359375, 2.0328369140625, 2.09747314453125, 2.162109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 9.0, 21.0, 29.0, 49.0, 72.0, 91.0, 154.0, 247.0, 439.0, 718.0, 1313.0, 2576.0, 5543.0, 12706.0, 35388.0, 132802.0, 902178.0, 2604078.0, 382208.0, 73571.0, 22520.0, 8968.0, 4040.0, 1944.0, 1063.0, 615.0, 327.0, 241.0, 115.0, 93.0, 42.0, 29.0, 27.0, 15.0, 14.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.853515625, -3.707000732421875, -3.56048583984375, -3.413970947265625, -3.2674560546875, -3.120941162109375, -2.97442626953125, -2.827911376953125, -2.681396484375, -2.534881591796875, -2.38836669921875, -2.241851806640625, -2.0953369140625, -1.948822021484375, -1.80230712890625, -1.655792236328125, -1.50927734375, -1.362762451171875, -1.21624755859375, -1.069732666015625, -0.9232177734375, -0.776702880859375, -0.63018798828125, -0.483673095703125, -0.337158203125, -0.190643310546875, -0.04412841796875, 0.102386474609375, 0.2489013671875, 0.395416259765625, 0.54193115234375, 0.688446044921875, 0.8349609375, 0.981475830078125, 1.12799072265625, 1.274505615234375, 1.4210205078125, 1.567535400390625, 1.71405029296875, 1.860565185546875, 2.007080078125, 2.153594970703125, 2.30010986328125, 2.446624755859375, 2.5931396484375, 2.739654541015625, 2.88616943359375, 3.032684326171875, 3.17919921875, 3.325714111328125, 3.47222900390625, 3.618743896484375, 3.7652587890625, 3.911773681640625, 4.05828857421875, 4.204803466796875, 4.351318359375, 4.497833251953125, 4.64434814453125, 4.790863037109375, 4.9373779296875, 5.083892822265625, 5.23040771484375, 5.376922607421875, 5.5234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 5.0, 3.0, 6.0, 16.0, 24.0, 24.0, 28.0, 72.0, 93.0, 146.0, 273.0, 441.0, 794.0, 841.0, 567.0, 304.0, 152.0, 100.0, 63.0, 39.0, 19.0, 18.0, 12.0, 11.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.87109375, -7.6468505859375, -7.422607421875, -7.1983642578125, -6.97412109375, -6.7498779296875, -6.525634765625, -6.3013916015625, -6.0771484375, -5.8529052734375, -5.628662109375, -5.4044189453125, -5.18017578125, -4.9559326171875, -4.731689453125, -4.5074462890625, -4.283203125, -4.0589599609375, -3.834716796875, -3.6104736328125, -3.38623046875, -3.1619873046875, -2.937744140625, -2.7135009765625, -2.4892578125, -2.2650146484375, -2.040771484375, -1.8165283203125, -1.59228515625, -1.3680419921875, -1.143798828125, -0.9195556640625, -0.6953125, -0.4710693359375, -0.246826171875, -0.0225830078125, 0.20166015625, 0.4259033203125, 0.650146484375, 0.8743896484375, 1.0986328125, 1.3228759765625, 1.547119140625, 1.7713623046875, 1.99560546875, 2.2198486328125, 2.444091796875, 2.6683349609375, 2.892578125, 3.1168212890625, 3.341064453125, 3.5653076171875, 3.78955078125, 4.0137939453125, 4.238037109375, 4.4622802734375, 4.6865234375, 4.9107666015625, 5.135009765625, 5.3592529296875, 5.58349609375, 5.8077392578125, 6.031982421875, 6.2562255859375, 6.48046875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 11.0, 20.0, 61.0, 87.0, 153.0, 195.0, 207.0, 134.0, 60.0, 30.0, 13.0, 12.0, 5.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-91.51319885253906, -89.37858581542969, -87.24397277832031, -85.10935974121094, -82.97474670410156, -80.84013366699219, -78.70552062988281, -76.57090759277344, -74.43629455566406, -72.30168151855469, -70.16706848144531, -68.03245544433594, -65.89784240722656, -63.76322937011719, -61.62861251831055, -59.49399948120117, -57.35938262939453, -55.224769592285156, -53.09015655517578, -50.955543518066406, -48.82093048095703, -46.686317443847656, -44.551700592041016, -42.41708755493164, -40.282474517822266, -38.14786148071289, -36.013248443603516, -33.87863540649414, -31.744020462036133, -29.609407424926758, -27.47479248046875, -25.340179443359375, -23.205562591552734, -21.07094955444336, -18.936336517333984, -16.801721572875977, -14.667108535766602, -12.532495498657227, -10.397881507873535, -8.263267517089844, -6.128654479980469, -3.9940409660339355, -1.8594274520874023, 0.27518606185913086, 2.409799575805664, 4.544412612915039, 6.6790266036987305, 8.813640594482422, 10.948253631591797, 13.082866668701172, 15.217480659484863, 17.352094650268555, 19.48670768737793, 21.621320724487305, 23.755935668945312, 25.890548706054688, 28.025161743164062, 30.159774780273438, 32.29438781738281, 34.42900085449219, 36.56361389160156, 38.69822692871094, 40.83284378051758, 42.96745681762695, 45.10206985473633]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 4.0, 7.0, 6.0, 6.0, 7.0, 13.0, 10.0, 11.0, 23.0, 25.0, 38.0, 27.0, 29.0, 35.0, 41.0, 43.0, 23.0, 31.0, 51.0, 35.0, 43.0, 43.0, 41.0, 35.0, 37.0, 29.0, 28.0, 30.0, 33.0, 29.0, 27.0, 24.0, 17.0, 21.0, 17.0, 14.0, 15.0, 5.0, 11.0, 11.0, 7.0, 2.0, 5.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-23.235137939453125, -22.518321990966797, -21.80150604248047, -21.08469009399414, -20.367874145507812, -19.651058197021484, -18.934242248535156, -18.217426300048828, -17.5006103515625, -16.783794403076172, -16.066978454589844, -15.350162506103516, -14.633346557617188, -13.91653060913086, -13.199714660644531, -12.482898712158203, -11.766083717346191, -11.049267768859863, -10.332451820373535, -9.615635871887207, -8.898819923400879, -8.18200397491455, -7.465188503265381, -6.748372554779053, -6.031556606292725, -5.3147406578063965, -4.597924709320068, -3.8811089992523193, -3.164293050765991, -2.447477102279663, -1.730661392211914, -1.013845443725586, -0.2970294952392578, 0.41978639364242554, 1.1366022825241089, 1.8534181118011475, 2.5702340602874756, 3.2870500087738037, 4.003865718841553, 4.720681667327881, 5.437497615814209, 6.154313564300537, 6.871129512786865, 7.587944984436035, 8.304760932922363, 9.021576881408691, 9.73839282989502, 10.455208778381348, 11.172024726867676, 11.888840675354004, 12.605656623840332, 13.32247257232666, 14.039288520812988, 14.756104469299316, 15.472919464111328, 16.189735412597656, 16.906551361083984, 17.623367309570312, 18.34018325805664, 19.05699920654297, 19.773815155029297, 20.490631103515625, 21.207447052001953, 21.92426300048828, 22.64107894897461]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 2.0, 7.0, 16.0, 22.0, 29.0, 37.0, 55.0, 89.0, 105.0, 161.0, 252.0, 348.0, 534.0, 844.0, 1235.0, 1959.0, 3458.0, 6013.0, 10491.0, 19899.0, 40448.0, 99584.0, 307719.0, 346652.0, 113853.0, 45320.0, 21970.0, 11451.0, 6395.0, 3624.0, 2135.0, 1279.0, 865.0, 530.0, 371.0, 233.0, 151.0, 118.0, 90.0, 61.0, 43.0, 35.0, 21.0, 16.0, 17.0, 7.0, 5.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.63671875, -4.5006103515625, -4.364501953125, -4.2283935546875, -4.09228515625, -3.9561767578125, -3.820068359375, -3.6839599609375, -3.5478515625, -3.4117431640625, -3.275634765625, -3.1395263671875, -3.00341796875, -2.8673095703125, -2.731201171875, -2.5950927734375, -2.458984375, -2.3228759765625, -2.186767578125, -2.0506591796875, -1.91455078125, -1.7784423828125, -1.642333984375, -1.5062255859375, -1.3701171875, -1.2340087890625, -1.097900390625, -0.9617919921875, -0.82568359375, -0.6895751953125, -0.553466796875, -0.4173583984375, -0.28125, -0.1451416015625, -0.009033203125, 0.1270751953125, 0.26318359375, 0.3992919921875, 0.535400390625, 0.6715087890625, 0.8076171875, 0.9437255859375, 1.079833984375, 1.2159423828125, 1.35205078125, 1.4881591796875, 1.624267578125, 1.7603759765625, 1.896484375, 2.0325927734375, 2.168701171875, 2.3048095703125, 2.44091796875, 2.5770263671875, 2.713134765625, 2.8492431640625, 2.9853515625, 3.1214599609375, 3.257568359375, 3.3936767578125, 3.52978515625, 3.6658935546875, 3.802001953125, 3.9381103515625, 4.07421875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 5.0, 6.0, 10.0, 12.0, 13.0, 11.0, 15.0, 18.0, 22.0, 34.0, 24.0, 43.0, 30.0, 43.0, 35.0, 41.0, 47.0, 34.0, 51.0, 44.0, 33.0, 54.0, 51.0, 51.0, 30.0, 27.0, 34.0, 27.0, 34.0, 20.0, 22.0, 20.0, 10.0, 8.0, 5.0, 7.0, 6.0, 5.0, 4.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.060546875, -1.995880126953125, -1.93121337890625, -1.866546630859375, -1.8018798828125, -1.737213134765625, -1.67254638671875, -1.607879638671875, -1.543212890625, -1.478546142578125, -1.41387939453125, -1.349212646484375, -1.2845458984375, -1.219879150390625, -1.15521240234375, -1.090545654296875, -1.02587890625, -0.961212158203125, -0.89654541015625, -0.831878662109375, -0.7672119140625, -0.702545166015625, -0.63787841796875, -0.573211669921875, -0.508544921875, -0.443878173828125, -0.37921142578125, -0.314544677734375, -0.2498779296875, -0.185211181640625, -0.12054443359375, -0.055877685546875, 0.0087890625, 0.073455810546875, 0.13812255859375, 0.202789306640625, 0.2674560546875, 0.332122802734375, 0.39678955078125, 0.461456298828125, 0.526123046875, 0.590789794921875, 0.65545654296875, 0.720123291015625, 0.7847900390625, 0.849456787109375, 0.91412353515625, 0.978790283203125, 1.04345703125, 1.108123779296875, 1.17279052734375, 1.237457275390625, 1.3021240234375, 1.366790771484375, 1.43145751953125, 1.496124267578125, 1.560791015625, 1.625457763671875, 1.69012451171875, 1.754791259765625, 1.8194580078125, 1.884124755859375, 1.94879150390625, 2.013458251953125, 2.078125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 14.0, 17.0, 18.0, 31.0, 26.0, 54.0, 57.0, 97.0, 147.0, 205.0, 303.0, 501.0, 868.0, 1592.0, 3809.0, 9981.0, 34224.0, 196820.0, 687042.0, 81041.0, 19613.0, 6410.0, 2627.0, 1236.0, 665.0, 398.0, 227.0, 152.0, 95.0, 68.0, 62.0, 40.0, 23.0, 24.0, 16.0, 8.0, 7.0, 7.0, 7.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.03125, -8.767822265625, -8.50439453125, -8.240966796875, -7.9775390625, -7.714111328125, -7.45068359375, -7.187255859375, -6.923828125, -6.660400390625, -6.39697265625, -6.133544921875, -5.8701171875, -5.606689453125, -5.34326171875, -5.079833984375, -4.81640625, -4.552978515625, -4.28955078125, -4.026123046875, -3.7626953125, -3.499267578125, -3.23583984375, -2.972412109375, -2.708984375, -2.445556640625, -2.18212890625, -1.918701171875, -1.6552734375, -1.391845703125, -1.12841796875, -0.864990234375, -0.6015625, -0.338134765625, -0.07470703125, 0.188720703125, 0.4521484375, 0.715576171875, 0.97900390625, 1.242431640625, 1.505859375, 1.769287109375, 2.03271484375, 2.296142578125, 2.5595703125, 2.822998046875, 3.08642578125, 3.349853515625, 3.61328125, 3.876708984375, 4.14013671875, 4.403564453125, 4.6669921875, 4.930419921875, 5.19384765625, 5.457275390625, 5.720703125, 5.984130859375, 6.24755859375, 6.510986328125, 6.7744140625, 7.037841796875, 7.30126953125, 7.564697265625, 7.828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 3.0, 1.0, 5.0, 8.0, 6.0, 11.0, 17.0, 23.0, 22.0, 21.0, 29.0, 32.0, 44.0, 62.0, 60.0, 56.0, 52.0, 47.0, 75.0, 69.0, 58.0, 48.0, 45.0, 31.0, 39.0, 35.0, 24.0, 14.0, 21.0, 11.0, 8.0, 13.0, 8.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1328125, -8.7930908203125, -8.453369140625, -8.1136474609375, -7.77392578125, -7.4342041015625, -7.094482421875, -6.7547607421875, -6.4150390625, -6.0753173828125, -5.735595703125, -5.3958740234375, -5.05615234375, -4.7164306640625, -4.376708984375, -4.0369873046875, -3.697265625, -3.3575439453125, -3.017822265625, -2.6781005859375, -2.33837890625, -1.9986572265625, -1.658935546875, -1.3192138671875, -0.9794921875, -0.6397705078125, -0.300048828125, 0.0396728515625, 0.37939453125, 0.7191162109375, 1.058837890625, 1.3985595703125, 1.73828125, 2.0780029296875, 2.417724609375, 2.7574462890625, 3.09716796875, 3.4368896484375, 3.776611328125, 4.1163330078125, 4.4560546875, 4.7957763671875, 5.135498046875, 5.4752197265625, 5.81494140625, 6.1546630859375, 6.494384765625, 6.8341064453125, 7.173828125, 7.5135498046875, 7.853271484375, 8.1929931640625, 8.53271484375, 8.8724365234375, 9.212158203125, 9.5518798828125, 9.8916015625, 10.2313232421875, 10.571044921875, 10.9107666015625, 11.25048828125, 11.5902099609375, 11.929931640625, 12.2696533203125, 12.609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 8.0, 7.0, 15.0, 26.0, 42.0, 103.0, 163.0, 416.0, 1171.0, 4255.0, 23096.0, 255871.0, 704706.0, 48333.0, 7467.0, 1789.0, 561.0, 244.0, 119.0, 43.0, 38.0, 19.0, 11.0, 15.0, 6.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.765625, -6.57861328125, -6.3916015625, -6.20458984375, -6.017578125, -5.83056640625, -5.6435546875, -5.45654296875, -5.26953125, -5.08251953125, -4.8955078125, -4.70849609375, -4.521484375, -4.33447265625, -4.1474609375, -3.96044921875, -3.7734375, -3.58642578125, -3.3994140625, -3.21240234375, -3.025390625, -2.83837890625, -2.6513671875, -2.46435546875, -2.27734375, -2.09033203125, -1.9033203125, -1.71630859375, -1.529296875, -1.34228515625, -1.1552734375, -0.96826171875, -0.78125, -0.59423828125, -0.4072265625, -0.22021484375, -0.033203125, 0.15380859375, 0.3408203125, 0.52783203125, 0.71484375, 0.90185546875, 1.0888671875, 1.27587890625, 1.462890625, 1.64990234375, 1.8369140625, 2.02392578125, 2.2109375, 2.39794921875, 2.5849609375, 2.77197265625, 2.958984375, 3.14599609375, 3.3330078125, 3.52001953125, 3.70703125, 3.89404296875, 4.0810546875, 4.26806640625, 4.455078125, 4.64208984375, 4.8291015625, 5.01611328125, 5.203125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 8.0, 6.0, 17.0, 20.0, 28.0, 29.0, 43.0, 93.0, 220.0, 231.0, 131.0, 66.0, 28.0, 22.0, 27.0, 12.0, 7.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000850677490234375, -0.0007981956005096436, -0.0007457137107849121, -0.0006932318210601807, -0.0006407499313354492, -0.0005882680416107178, -0.0005357861518859863, -0.0004833042621612549, -0.00043082237243652344, -0.000378340482711792, -0.00032585859298706055, -0.0002733767032623291, -0.00022089481353759766, -0.0001684129238128662, -0.00011593103408813477, -6.344914436340332e-05, -1.0967254638671875e-05, 4.151463508605957e-05, 9.399652481079102e-05, 0.00014647841453552246, 0.0001989603042602539, 0.00025144219398498535, 0.0003039240837097168, 0.00035640597343444824, 0.0004088878631591797, 0.00046136975288391113, 0.0005138516426086426, 0.000566333532333374, 0.0006188154220581055, 0.0006712973117828369, 0.0007237792015075684, 0.0007762610912322998, 0.0008287429809570312, 0.0008812248706817627, 0.0009337067604064941, 0.0009861886501312256, 0.001038670539855957, 0.0010911524295806885, 0.00114363431930542, 0.0011961162090301514, 0.0012485980987548828, 0.0013010799884796143, 0.0013535618782043457, 0.0014060437679290771, 0.0014585256576538086, 0.00151100754737854, 0.0015634894371032715, 0.001615971326828003, 0.0016684532165527344, 0.0017209351062774658, 0.0017734169960021973, 0.0018258988857269287, 0.0018783807754516602, 0.0019308626651763916, 0.001983344554901123, 0.0020358264446258545, 0.002088308334350586, 0.0021407902240753174, 0.002193272113800049, 0.0022457540035247803, 0.0022982358932495117, 0.002350717782974243, 0.0024031996726989746, 0.002455681562423706, 0.0025081634521484375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 13.0, 12.0, 14.0, 25.0, 36.0, 56.0, 108.0, 160.0, 286.0, 536.0, 1217.0, 2912.0, 9421.0, 41700.0, 288685.0, 605147.0, 75599.0, 15224.0, 4254.0, 1551.0, 730.0, 404.0, 189.0, 108.0, 57.0, 40.0, 23.0, 16.0, 12.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.51953125, -3.39459228515625, -3.2696533203125, -3.14471435546875, -3.019775390625, -2.89483642578125, -2.7698974609375, -2.64495849609375, -2.52001953125, -2.39508056640625, -2.2701416015625, -2.14520263671875, -2.020263671875, -1.89532470703125, -1.7703857421875, -1.64544677734375, -1.5205078125, -1.39556884765625, -1.2706298828125, -1.14569091796875, -1.020751953125, -0.89581298828125, -0.7708740234375, -0.64593505859375, -0.52099609375, -0.39605712890625, -0.2711181640625, -0.14617919921875, -0.021240234375, 0.10369873046875, 0.2286376953125, 0.35357666015625, 0.478515625, 0.60345458984375, 0.7283935546875, 0.85333251953125, 0.978271484375, 1.10321044921875, 1.2281494140625, 1.35308837890625, 1.47802734375, 1.60296630859375, 1.7279052734375, 1.85284423828125, 1.977783203125, 2.10272216796875, 2.2276611328125, 2.35260009765625, 2.4775390625, 2.60247802734375, 2.7274169921875, 2.85235595703125, 2.977294921875, 3.10223388671875, 3.2271728515625, 3.35211181640625, 3.47705078125, 3.60198974609375, 3.7269287109375, 3.85186767578125, 3.976806640625, 4.10174560546875, 4.2266845703125, 4.35162353515625, 4.4765625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 2.0, 5.0, 3.0, 6.0, 6.0, 8.0, 9.0, 9.0, 18.0, 22.0, 34.0, 27.0, 41.0, 44.0, 70.0, 58.0, 93.0, 89.0, 87.0, 69.0, 63.0, 62.0, 32.0, 22.0, 27.0, 19.0, 18.0, 13.0, 12.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.27734375, -3.175628662109375, -3.07391357421875, -2.972198486328125, -2.8704833984375, -2.768768310546875, -2.66705322265625, -2.565338134765625, -2.463623046875, -2.361907958984375, -2.26019287109375, -2.158477783203125, -2.0567626953125, -1.955047607421875, -1.85333251953125, -1.751617431640625, -1.64990234375, -1.548187255859375, -1.44647216796875, -1.344757080078125, -1.2430419921875, -1.141326904296875, -1.03961181640625, -0.937896728515625, -0.836181640625, -0.734466552734375, -0.63275146484375, -0.531036376953125, -0.4293212890625, -0.327606201171875, -0.22589111328125, -0.124176025390625, -0.0224609375, 0.079254150390625, 0.18096923828125, 0.282684326171875, 0.3843994140625, 0.486114501953125, 0.58782958984375, 0.689544677734375, 0.791259765625, 0.892974853515625, 0.99468994140625, 1.096405029296875, 1.1981201171875, 1.299835205078125, 1.40155029296875, 1.503265380859375, 1.60498046875, 1.706695556640625, 1.80841064453125, 1.910125732421875, 2.0118408203125, 2.113555908203125, 2.21527099609375, 2.316986083984375, 2.418701171875, 2.520416259765625, 2.62213134765625, 2.723846435546875, 2.8255615234375, 2.927276611328125, 3.02899169921875, 3.130706787109375, 3.232421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 6.0, 18.0, 46.0, 98.0, 178.0, 291.0, 179.0, 107.0, 41.0, 15.0, 7.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-109.37437438964844, -106.30702209472656, -103.23966217041016, -100.17230987548828, -97.10494995117188, -94.03759765625, -90.9702377319336, -87.90288543701172, -84.83552551269531, -81.76817321777344, -78.70081329345703, -75.63346099853516, -72.56610107421875, -69.49874877929688, -66.43138885498047, -63.364036560058594, -60.29668045043945, -57.22932434082031, -54.16196823120117, -51.09461212158203, -48.02725601196289, -44.95989990234375, -41.892547607421875, -38.82518768310547, -35.757835388183594, -32.69047927856445, -29.623123168945312, -26.555767059326172, -23.48841094970703, -20.42105484008789, -17.353700637817383, -14.286344528198242, -11.218986511230469, -8.151630401611328, -5.084274768829346, -2.0169191360473633, 1.0504369735717773, 4.117793083190918, 7.185148239135742, 10.252504348754883, 13.319860458374023, 16.387216567993164, 19.454572677612305, 22.521926879882812, 25.589282989501953, 28.656639099121094, 31.723995208740234, 34.791351318359375, 37.858707427978516, 40.926063537597656, 43.9934196472168, 47.06077575683594, 50.12813186645508, 53.19548797607422, 56.262840270996094, 59.3302001953125, 62.397552490234375, 65.46490478515625, 68.53226470947266, 71.59961700439453, 74.66697692871094, 77.73432922363281, 80.80168914794922, 83.8690414428711, 86.9364013671875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 14.0, 18.0, 11.0, 18.0, 14.0, 16.0, 26.0, 26.0, 26.0, 49.0, 39.0, 49.0, 52.0, 63.0, 77.0, 79.0, 72.0, 60.0, 41.0, 54.0, 20.0, 38.0, 25.0, 29.0, 24.0, 21.0, 11.0, 8.0, 7.0, 4.0, 2.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.405670166015625, -39.97478485107422, -38.54389953613281, -37.113014221191406, -35.68212890625, -34.251243591308594, -32.82035827636719, -31.38947296142578, -29.958587646484375, -28.52770233154297, -27.096817016601562, -25.665931701660156, -24.23504638671875, -22.804161071777344, -21.373275756835938, -19.94239044189453, -18.511505126953125, -17.08061981201172, -15.649734497070312, -14.218849182128906, -12.7879638671875, -11.357078552246094, -9.926193237304688, -8.495307922363281, -7.064422607421875, -5.633537292480469, -4.2026519775390625, -2.7717666625976562, -1.34088134765625, 0.09000396728515625, 1.5208892822265625, 2.9517745971679688, 4.382656097412109, 5.813541412353516, 7.244426727294922, 8.675312042236328, 10.106197357177734, 11.53708267211914, 12.967967987060547, 14.398853302001953, 15.82973861694336, 17.260623931884766, 18.691509246826172, 20.122394561767578, 21.553279876708984, 22.98416519165039, 24.415050506591797, 25.845935821533203, 27.27682113647461, 28.707706451416016, 30.138591766357422, 31.569477081298828, 33.000362396240234, 34.43124771118164, 35.86213302612305, 37.29301834106445, 38.72390365600586, 40.154788970947266, 41.58567428588867, 43.01655960083008, 44.447444915771484, 45.87833023071289, 47.3092155456543, 48.7401008605957, 50.17098617553711]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 10.0, 12.0, 15.0, 15.0, 36.0, 27.0, 55.0, 75.0, 113.0, 197.0, 270.0, 469.0, 743.0, 1259.0, 2244.0, 4158.0, 7944.0, 15306.0, 32828.0, 75001.0, 208145.0, 746128.0, 1862283.0, 849579.0, 234531.0, 82598.0, 35150.0, 16628.0, 8341.0, 4359.0, 2300.0, 1376.0, 783.0, 441.0, 289.0, 164.0, 134.0, 80.0, 68.0, 30.0, 26.0, 20.0, 12.0, 19.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.375, -2.29180908203125, -2.2086181640625, -2.12542724609375, -2.042236328125, -1.95904541015625, -1.8758544921875, -1.79266357421875, -1.70947265625, -1.62628173828125, -1.5430908203125, -1.45989990234375, -1.376708984375, -1.29351806640625, -1.2103271484375, -1.12713623046875, -1.0439453125, -0.96075439453125, -0.8775634765625, -0.79437255859375, -0.711181640625, -0.62799072265625, -0.5447998046875, -0.46160888671875, -0.37841796875, -0.29522705078125, -0.2120361328125, -0.12884521484375, -0.045654296875, 0.03753662109375, 0.1207275390625, 0.20391845703125, 0.287109375, 0.37030029296875, 0.4534912109375, 0.53668212890625, 0.619873046875, 0.70306396484375, 0.7862548828125, 0.86944580078125, 0.95263671875, 1.03582763671875, 1.1190185546875, 1.20220947265625, 1.285400390625, 1.36859130859375, 1.4517822265625, 1.53497314453125, 1.6181640625, 1.70135498046875, 1.7845458984375, 1.86773681640625, 1.950927734375, 2.03411865234375, 2.1173095703125, 2.20050048828125, 2.28369140625, 2.36688232421875, 2.4500732421875, 2.53326416015625, 2.616455078125, 2.69964599609375, 2.7828369140625, 2.86602783203125, 2.94921875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 13.0, 21.0, 18.0, 31.0, 35.0, 53.0, 50.0, 73.0, 82.0, 89.0, 109.0, 81.0, 68.0, 60.0, 51.0, 46.0, 36.0, 29.0, 20.0, 13.0, 5.0, 9.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.30181884765625, -2.1934814453125, -2.08514404296875, -1.976806640625, -1.86846923828125, -1.7601318359375, -1.65179443359375, -1.54345703125, -1.43511962890625, -1.3267822265625, -1.21844482421875, -1.110107421875, -1.00177001953125, -0.8934326171875, -0.78509521484375, -0.6767578125, -0.56842041015625, -0.4600830078125, -0.35174560546875, -0.243408203125, -0.13507080078125, -0.0267333984375, 0.08160400390625, 0.18994140625, 0.29827880859375, 0.4066162109375, 0.51495361328125, 0.623291015625, 0.73162841796875, 0.8399658203125, 0.94830322265625, 1.056640625, 1.16497802734375, 1.2733154296875, 1.38165283203125, 1.489990234375, 1.59832763671875, 1.7066650390625, 1.81500244140625, 1.92333984375, 2.03167724609375, 2.1400146484375, 2.24835205078125, 2.356689453125, 2.46502685546875, 2.5733642578125, 2.68170166015625, 2.7900390625, 2.89837646484375, 3.0067138671875, 3.11505126953125, 3.223388671875, 3.33172607421875, 3.4400634765625, 3.54840087890625, 3.65673828125, 3.76507568359375, 3.8734130859375, 3.98175048828125, 4.090087890625, 4.19842529296875, 4.3067626953125, 4.41510009765625, 4.5234375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 8.0, 5.0, 13.0, 8.0, 7.0, 22.0, 61.0, 62.0, 117.0, 209.0, 359.0, 698.0, 1380.0, 3160.0, 7962.0, 24274.0, 91664.0, 527442.0, 2726170.0, 664821.0, 105906.0, 25943.0, 8190.0, 3088.0, 1270.0, 616.0, 293.0, 221.0, 108.0, 64.0, 47.0, 29.0, 20.0, 18.0, 10.0, 8.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.875, -5.7049560546875, -5.534912109375, -5.3648681640625, -5.19482421875, -5.0247802734375, -4.854736328125, -4.6846923828125, -4.5146484375, -4.3446044921875, -4.174560546875, -4.0045166015625, -3.83447265625, -3.6644287109375, -3.494384765625, -3.3243408203125, -3.154296875, -2.9842529296875, -2.814208984375, -2.6441650390625, -2.47412109375, -2.3040771484375, -2.134033203125, -1.9639892578125, -1.7939453125, -1.6239013671875, -1.453857421875, -1.2838134765625, -1.11376953125, -0.9437255859375, -0.773681640625, -0.6036376953125, -0.43359375, -0.2635498046875, -0.093505859375, 0.0765380859375, 0.24658203125, 0.4166259765625, 0.586669921875, 0.7567138671875, 0.9267578125, 1.0968017578125, 1.266845703125, 1.4368896484375, 1.60693359375, 1.7769775390625, 1.947021484375, 2.1170654296875, 2.287109375, 2.4571533203125, 2.627197265625, 2.7972412109375, 2.96728515625, 3.1373291015625, 3.307373046875, 3.4774169921875, 3.6474609375, 3.8175048828125, 3.987548828125, 4.1575927734375, 4.32763671875, 4.4976806640625, 4.667724609375, 4.8377685546875, 5.0078125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 3.0, 5.0, 12.0, 3.0, 11.0, 17.0, 17.0, 26.0, 35.0, 40.0, 60.0, 81.0, 110.0, 157.0, 224.0, 325.0, 411.0, 577.0, 507.0, 439.0, 266.0, 224.0, 171.0, 83.0, 80.0, 41.0, 38.0, 29.0, 14.0, 17.0, 12.0, 10.0, 7.0, 5.0, 5.0, 0.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.125, -5.93829345703125, -5.7515869140625, -5.56488037109375, -5.378173828125, -5.19146728515625, -5.0047607421875, -4.81805419921875, -4.63134765625, -4.44464111328125, -4.2579345703125, -4.07122802734375, -3.884521484375, -3.69781494140625, -3.5111083984375, -3.32440185546875, -3.1376953125, -2.95098876953125, -2.7642822265625, -2.57757568359375, -2.390869140625, -2.20416259765625, -2.0174560546875, -1.83074951171875, -1.64404296875, -1.45733642578125, -1.2706298828125, -1.08392333984375, -0.897216796875, -0.71051025390625, -0.5238037109375, -0.33709716796875, -0.150390625, 0.03631591796875, 0.2230224609375, 0.40972900390625, 0.596435546875, 0.78314208984375, 0.9698486328125, 1.15655517578125, 1.34326171875, 1.52996826171875, 1.7166748046875, 1.90338134765625, 2.090087890625, 2.27679443359375, 2.4635009765625, 2.65020751953125, 2.8369140625, 3.02362060546875, 3.2103271484375, 3.39703369140625, 3.583740234375, 3.77044677734375, 3.9571533203125, 4.14385986328125, 4.33056640625, 4.51727294921875, 4.7039794921875, 4.89068603515625, 5.077392578125, 5.26409912109375, 5.4508056640625, 5.63751220703125, 5.82421875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 9.0, 16.0, 14.0, 54.0, 107.0, 198.0, 212.0, 180.0, 107.0, 51.0, 23.0, 13.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-88.04563903808594, -85.15619659423828, -82.26675415039062, -79.3773193359375, -76.48787689208984, -73.59843444824219, -70.70899200439453, -67.81954956054688, -64.93010711669922, -62.04066467285156, -59.15122604370117, -56.261783599853516, -53.37234115600586, -50.48290252685547, -47.59346008300781, -44.704017639160156, -41.814579010009766, -38.92513656616211, -36.03569793701172, -33.14625549316406, -30.256813049316406, -27.367372512817383, -24.47793197631836, -21.588489532470703, -18.69904899597168, -15.80960750579834, -12.920166015625, -10.030725479125977, -7.141283988952637, -4.251842498779297, -1.3624019622802734, 1.5270404815673828, 4.416481018066406, 7.305922508239746, 10.195363998413086, 13.08480453491211, 15.97424602508545, 18.86368751525879, 21.753128051757812, 24.64257049560547, 27.532011032104492, 30.421451568603516, 33.31089401245117, 36.20033264160156, 39.08977508544922, 41.979217529296875, 44.86865997314453, 47.75810241699219, 50.64754104614258, 53.536983489990234, 56.426422119140625, 59.31586456298828, 62.20530700683594, 65.0947494506836, 67.98419189453125, 70.87362670898438, 73.76306915283203, 76.65251159667969, 79.54195404052734, 82.431396484375, 85.32083129882812, 88.21027374267578, 91.09971618652344, 93.9891586303711, 96.87860107421875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 9.0, 7.0, 6.0, 8.0, 17.0, 12.0, 25.0, 22.0, 24.0, 19.0, 27.0, 26.0, 44.0, 27.0, 43.0, 38.0, 49.0, 45.0, 48.0, 43.0, 58.0, 52.0, 37.0, 36.0, 28.0, 37.0, 15.0, 21.0, 30.0, 28.0, 20.0, 13.0, 15.0, 11.0, 13.0, 7.0, 18.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.65509033203125, -31.727840423583984, -30.80059051513672, -29.873340606689453, -28.946088790893555, -28.01883888244629, -27.091588973999023, -26.164339065551758, -25.23708724975586, -24.309837341308594, -23.382587432861328, -22.455337524414062, -21.528085708618164, -20.6008358001709, -19.673585891723633, -18.746335983276367, -17.8190860748291, -16.891836166381836, -15.964585304260254, -15.037335395812988, -14.110084533691406, -13.18283462524414, -12.255584716796875, -11.32833480834961, -10.401083946228027, -9.473834037780762, -8.54658317565918, -7.619333267211914, -6.69208288192749, -5.764832496643066, -4.837582588195801, -3.910332202911377, -2.983081817626953, -2.0558314323425293, -1.1285812854766846, -0.20133113861083984, 0.725919246673584, 1.6531696319580078, 2.5804195404052734, 3.5076699256896973, 4.434920310974121, 5.362170696258545, 6.289421081542969, 7.216670989990234, 8.1439208984375, 9.071171760559082, 9.998421669006348, 10.92567253112793, 11.852922439575195, 12.780172348022461, 13.707423210144043, 14.634673118591309, 15.56192398071289, 16.489173889160156, 17.416423797607422, 18.343673706054688, 19.270923614501953, 20.19817352294922, 21.125423431396484, 22.05267333984375, 22.97992515563965, 23.907175064086914, 24.83442497253418, 25.761674880981445, 26.688926696777344]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 6.0, 3.0, 8.0, 6.0, 14.0, 15.0, 19.0, 26.0, 44.0, 70.0, 84.0, 115.0, 136.0, 248.0, 341.0, 532.0, 774.0, 1346.0, 1988.0, 3350.0, 5462.0, 8953.0, 15286.0, 26157.0, 45825.0, 82787.0, 166069.0, 289536.0, 187738.0, 91060.0, 49892.0, 28729.0, 16610.0, 9688.0, 5890.0, 3479.0, 2219.0, 1342.0, 871.0, 592.0, 387.0, 261.0, 176.0, 119.0, 91.0, 66.0, 37.0, 27.0, 23.0, 19.0, 15.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-3.583984375, -3.470489501953125, -3.35699462890625, -3.243499755859375, -3.1300048828125, -3.016510009765625, -2.90301513671875, -2.789520263671875, -2.676025390625, -2.562530517578125, -2.44903564453125, -2.335540771484375, -2.2220458984375, -2.108551025390625, -1.99505615234375, -1.881561279296875, -1.76806640625, -1.654571533203125, -1.54107666015625, -1.427581787109375, -1.3140869140625, -1.200592041015625, -1.08709716796875, -0.973602294921875, -0.860107421875, -0.746612548828125, -0.63311767578125, -0.519622802734375, -0.4061279296875, -0.292633056640625, -0.17913818359375, -0.065643310546875, 0.0478515625, 0.161346435546875, 0.27484130859375, 0.388336181640625, 0.5018310546875, 0.615325927734375, 0.72882080078125, 0.842315673828125, 0.955810546875, 1.069305419921875, 1.18280029296875, 1.296295166015625, 1.4097900390625, 1.523284912109375, 1.63677978515625, 1.750274658203125, 1.86376953125, 1.977264404296875, 2.09075927734375, 2.204254150390625, 2.3177490234375, 2.431243896484375, 2.54473876953125, 2.658233642578125, 2.771728515625, 2.885223388671875, 2.99871826171875, 3.112213134765625, 3.2257080078125, 3.339202880859375, 3.45269775390625, 3.566192626953125, 3.6796875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 1.0, 7.0, 2.0, 0.0, 10.0, 10.0, 16.0, 7.0, 13.0, 11.0, 11.0, 19.0, 23.0, 26.0, 32.0, 27.0, 40.0, 33.0, 20.0, 40.0, 41.0, 47.0, 49.0, 44.0, 35.0, 41.0, 41.0, 39.0, 34.0, 33.0, 36.0, 40.0, 27.0, 15.0, 29.0, 21.0, 6.0, 9.0, 13.0, 7.0, 7.0, 10.0, 6.0, 4.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6533203125, -1.596893310546875, -1.54046630859375, -1.484039306640625, -1.4276123046875, -1.371185302734375, -1.31475830078125, -1.258331298828125, -1.201904296875, -1.145477294921875, -1.08905029296875, -1.032623291015625, -0.9761962890625, -0.919769287109375, -0.86334228515625, -0.806915283203125, -0.75048828125, -0.694061279296875, -0.63763427734375, -0.581207275390625, -0.5247802734375, -0.468353271484375, -0.41192626953125, -0.355499267578125, -0.299072265625, -0.242645263671875, -0.18621826171875, -0.129791259765625, -0.0733642578125, -0.016937255859375, 0.03948974609375, 0.095916748046875, 0.15234375, 0.208770751953125, 0.26519775390625, 0.321624755859375, 0.3780517578125, 0.434478759765625, 0.49090576171875, 0.547332763671875, 0.603759765625, 0.660186767578125, 0.71661376953125, 0.773040771484375, 0.8294677734375, 0.885894775390625, 0.94232177734375, 0.998748779296875, 1.05517578125, 1.111602783203125, 1.16802978515625, 1.224456787109375, 1.2808837890625, 1.337310791015625, 1.39373779296875, 1.450164794921875, 1.506591796875, 1.563018798828125, 1.61944580078125, 1.675872802734375, 1.7322998046875, 1.788726806640625, 1.84515380859375, 1.901580810546875, 1.9580078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 9.0, 18.0, 10.0, 21.0, 23.0, 35.0, 43.0, 60.0, 109.0, 104.0, 154.0, 241.0, 327.0, 443.0, 737.0, 1199.0, 1931.0, 3968.0, 10495.0, 38369.0, 215093.0, 660645.0, 82799.0, 18854.0, 6046.0, 2631.0, 1519.0, 852.0, 570.0, 366.0, 250.0, 184.0, 119.0, 102.0, 61.0, 48.0, 36.0, 24.0, 17.0, 15.0, 10.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.9609375, -8.6646728515625, -8.368408203125, -8.0721435546875, -7.77587890625, -7.4796142578125, -7.183349609375, -6.8870849609375, -6.5908203125, -6.2945556640625, -5.998291015625, -5.7020263671875, -5.40576171875, -5.1094970703125, -4.813232421875, -4.5169677734375, -4.220703125, -3.9244384765625, -3.628173828125, -3.3319091796875, -3.03564453125, -2.7393798828125, -2.443115234375, -2.1468505859375, -1.8505859375, -1.5543212890625, -1.258056640625, -0.9617919921875, -0.66552734375, -0.3692626953125, -0.072998046875, 0.2232666015625, 0.51953125, 0.8157958984375, 1.112060546875, 1.4083251953125, 1.70458984375, 2.0008544921875, 2.297119140625, 2.5933837890625, 2.8896484375, 3.1859130859375, 3.482177734375, 3.7784423828125, 4.07470703125, 4.3709716796875, 4.667236328125, 4.9635009765625, 5.259765625, 5.5560302734375, 5.852294921875, 6.1485595703125, 6.44482421875, 6.7410888671875, 7.037353515625, 7.3336181640625, 7.6298828125, 7.9261474609375, 8.222412109375, 8.5186767578125, 8.81494140625, 9.1112060546875, 9.407470703125, 9.7037353515625, 10.0]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 7.0, 10.0, 11.0, 12.0, 15.0, 19.0, 13.0, 33.0, 44.0, 34.0, 27.0, 46.0, 30.0, 58.0, 59.0, 49.0, 57.0, 62.0, 51.0, 51.0, 44.0, 37.0, 35.0, 30.0, 27.0, 23.0, 20.0, 18.0, 16.0, 10.0, 12.0, 6.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.710205078125, -8.40478515625, -8.099365234375, -7.7939453125, -7.488525390625, -7.18310546875, -6.877685546875, -6.572265625, -6.266845703125, -5.96142578125, -5.656005859375, -5.3505859375, -5.045166015625, -4.73974609375, -4.434326171875, -4.12890625, -3.823486328125, -3.51806640625, -3.212646484375, -2.9072265625, -2.601806640625, -2.29638671875, -1.990966796875, -1.685546875, -1.380126953125, -1.07470703125, -0.769287109375, -0.4638671875, -0.158447265625, 0.14697265625, 0.452392578125, 0.7578125, 1.063232421875, 1.36865234375, 1.674072265625, 1.9794921875, 2.284912109375, 2.59033203125, 2.895751953125, 3.201171875, 3.506591796875, 3.81201171875, 4.117431640625, 4.4228515625, 4.728271484375, 5.03369140625, 5.339111328125, 5.64453125, 5.949951171875, 6.25537109375, 6.560791015625, 6.8662109375, 7.171630859375, 7.47705078125, 7.782470703125, 8.087890625, 8.393310546875, 8.69873046875, 9.004150390625, 9.3095703125, 9.614990234375, 9.92041015625, 10.225830078125, 10.53125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 2.0, 8.0, 10.0, 17.0, 25.0, 38.0, 58.0, 85.0, 155.0, 242.0, 370.0, 778.0, 1523.0, 3387.0, 8966.0, 27615.0, 96247.0, 577506.0, 243538.0, 59312.0, 17811.0, 5887.0, 2366.0, 1151.0, 592.0, 333.0, 193.0, 113.0, 78.0, 52.0, 25.0, 19.0, 12.0, 15.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.955078125, -3.844635009765625, -3.73419189453125, -3.623748779296875, -3.5133056640625, -3.402862548828125, -3.29241943359375, -3.181976318359375, -3.071533203125, -2.961090087890625, -2.85064697265625, -2.740203857421875, -2.6297607421875, -2.519317626953125, -2.40887451171875, -2.298431396484375, -2.18798828125, -2.077545166015625, -1.96710205078125, -1.856658935546875, -1.7462158203125, -1.635772705078125, -1.52532958984375, -1.414886474609375, -1.304443359375, -1.194000244140625, -1.08355712890625, -0.973114013671875, -0.8626708984375, -0.752227783203125, -0.64178466796875, -0.531341552734375, -0.4208984375, -0.310455322265625, -0.20001220703125, -0.089569091796875, 0.0208740234375, 0.131317138671875, 0.24176025390625, 0.352203369140625, 0.462646484375, 0.573089599609375, 0.68353271484375, 0.793975830078125, 0.9044189453125, 1.014862060546875, 1.12530517578125, 1.235748291015625, 1.34619140625, 1.456634521484375, 1.56707763671875, 1.677520751953125, 1.7879638671875, 1.898406982421875, 2.00885009765625, 2.119293212890625, 2.229736328125, 2.340179443359375, 2.45062255859375, 2.561065673828125, 2.6715087890625, 2.781951904296875, 2.89239501953125, 3.002838134765625, 3.11328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 8.0, 4.0, 11.0, 4.0, 4.0, 9.0, 9.0, 12.0, 14.0, 16.0, 17.0, 21.0, 30.0, 37.0, 43.0, 57.0, 84.0, 101.0, 117.0, 81.0, 51.0, 51.0, 23.0, 36.0, 23.0, 24.0, 13.0, 14.0, 11.0, 13.0, 11.0, 8.0, 8.0, 5.0, 4.0, 6.0, 4.0, 1.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010080337524414062, -0.0009756982326507568, -0.0009433627128601074, -0.000911027193069458, -0.0008786916732788086, -0.0008463561534881592, -0.0008140206336975098, -0.0007816851139068604, -0.0007493495941162109, -0.0007170140743255615, -0.0006846785545349121, -0.0006523430347442627, -0.0006200075149536133, -0.0005876719951629639, -0.0005553364753723145, -0.000523000955581665, -0.0004906654357910156, -0.0004583299160003662, -0.0004259943962097168, -0.0003936588764190674, -0.00036132335662841797, -0.00032898783683776855, -0.00029665231704711914, -0.0002643167972564697, -0.0002319812774658203, -0.0001996457576751709, -0.00016731023788452148, -0.00013497471809387207, -0.00010263919830322266, -7.030367851257324e-05, -3.796815872192383e-05, -5.632638931274414e-06, 2.6702880859375e-05, 5.9038400650024414e-05, 9.137392044067383e-05, 0.00012370944023132324, 0.00015604496002197266, 0.00018838047981262207, 0.00022071599960327148, 0.0002530515193939209, 0.0002853870391845703, 0.0003177225589752197, 0.00035005807876586914, 0.00038239359855651855, 0.00041472911834716797, 0.0004470646381378174, 0.0004794001579284668, 0.0005117356777191162, 0.0005440711975097656, 0.000576406717300415, 0.0006087422370910645, 0.0006410777568817139, 0.0006734132766723633, 0.0007057487964630127, 0.0007380843162536621, 0.0007704198360443115, 0.0008027553558349609, 0.0008350908756256104, 0.0008674263954162598, 0.0008997619152069092, 0.0009320974349975586, 0.000964432954788208, 0.0009967684745788574, 0.0010291039943695068, 0.0010614395141601562]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 8.0, 2.0, 5.0, 18.0, 14.0, 20.0, 34.0, 41.0, 76.0, 107.0, 174.0, 263.0, 451.0, 796.0, 1450.0, 3172.0, 8386.0, 31141.0, 155257.0, 674087.0, 131655.0, 27472.0, 7559.0, 3006.0, 1416.0, 714.0, 443.0, 276.0, 180.0, 117.0, 84.0, 45.0, 29.0, 20.0, 11.0, 7.0, 10.0, 8.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19140625, -4.07318115234375, -3.9549560546875, -3.83673095703125, -3.718505859375, -3.60028076171875, -3.4820556640625, -3.36383056640625, -3.24560546875, -3.12738037109375, -3.0091552734375, -2.89093017578125, -2.772705078125, -2.65447998046875, -2.5362548828125, -2.41802978515625, -2.2998046875, -2.18157958984375, -2.0633544921875, -1.94512939453125, -1.826904296875, -1.70867919921875, -1.5904541015625, -1.47222900390625, -1.35400390625, -1.23577880859375, -1.1175537109375, -0.99932861328125, -0.881103515625, -0.76287841796875, -0.6446533203125, -0.52642822265625, -0.408203125, -0.28997802734375, -0.1717529296875, -0.05352783203125, 0.064697265625, 0.18292236328125, 0.3011474609375, 0.41937255859375, 0.53759765625, 0.65582275390625, 0.7740478515625, 0.89227294921875, 1.010498046875, 1.12872314453125, 1.2469482421875, 1.36517333984375, 1.4833984375, 1.60162353515625, 1.7198486328125, 1.83807373046875, 1.956298828125, 2.07452392578125, 2.1927490234375, 2.31097412109375, 2.42919921875, 2.54742431640625, 2.6656494140625, 2.78387451171875, 2.902099609375, 3.02032470703125, 3.1385498046875, 3.25677490234375, 3.375]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 12.0, 13.0, 16.0, 12.0, 19.0, 25.0, 34.0, 35.0, 54.0, 57.0, 59.0, 70.0, 104.0, 82.0, 58.0, 70.0, 50.0, 38.0, 37.0, 32.0, 23.0, 18.0, 14.0, 9.0, 12.0, 7.0, 8.0, 9.0, 3.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.00390625, -2.886962890625, -2.77001953125, -2.653076171875, -2.5361328125, -2.419189453125, -2.30224609375, -2.185302734375, -2.068359375, -1.951416015625, -1.83447265625, -1.717529296875, -1.6005859375, -1.483642578125, -1.36669921875, -1.249755859375, -1.1328125, -1.015869140625, -0.89892578125, -0.781982421875, -0.6650390625, -0.548095703125, -0.43115234375, -0.314208984375, -0.197265625, -0.080322265625, 0.03662109375, 0.153564453125, 0.2705078125, 0.387451171875, 0.50439453125, 0.621337890625, 0.73828125, 0.855224609375, 0.97216796875, 1.089111328125, 1.2060546875, 1.322998046875, 1.43994140625, 1.556884765625, 1.673828125, 1.790771484375, 1.90771484375, 2.024658203125, 2.1416015625, 2.258544921875, 2.37548828125, 2.492431640625, 2.609375, 2.726318359375, 2.84326171875, 2.960205078125, 3.0771484375, 3.194091796875, 3.31103515625, 3.427978515625, 3.544921875, 3.661865234375, 3.77880859375, 3.895751953125, 4.0126953125, 4.129638671875, 4.24658203125, 4.363525390625, 4.48046875]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 5.0, 4.0, 10.0, 27.0, 37.0, 62.0, 89.0, 149.0, 248.0, 179.0, 85.0, 50.0, 21.0, 16.0, 7.0, 5.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-108.04973602294922, -105.3194808959961, -102.58921813964844, -99.85896301269531, -97.12870788574219, -94.39845275878906, -91.66819763183594, -88.93793487548828, -86.20767974853516, -83.47742462158203, -80.74716186523438, -78.01690673828125, -75.28665161132812, -72.556396484375, -69.82614135742188, -67.09587860107422, -64.3656234741211, -61.63536834716797, -58.90510940551758, -56.17485046386719, -53.44459533691406, -50.71434020996094, -47.98408126831055, -45.253822326660156, -42.52356719970703, -39.793312072753906, -37.063053131103516, -34.332794189453125, -31.6025390625, -28.872282028198242, -26.142024993896484, -23.411767959594727, -20.681503295898438, -17.95124626159668, -15.220989227294922, -12.490732192993164, -9.760475158691406, -7.030218124389648, -4.299961090087891, -1.5697040557861328, 1.160552978515625, 3.890810012817383, 6.621067047119141, 9.351324081420898, 12.081581115722656, 14.811838150024414, 17.542095184326172, 20.27235221862793, 23.002609252929688, 25.732866287231445, 28.463123321533203, 31.19338035583496, 33.92363739013672, 36.653892517089844, 39.384151458740234, 42.114410400390625, 44.84466552734375, 47.574920654296875, 50.305179595947266, 53.035438537597656, 55.76569366455078, 58.495948791503906, 61.2262077331543, 63.95646667480469, 66.68672180175781]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 4.0, 11.0, 4.0, 10.0, 8.0, 15.0, 16.0, 14.0, 22.0, 24.0, 23.0, 32.0, 31.0, 38.0, 32.0, 41.0, 52.0, 83.0, 83.0, 70.0, 49.0, 42.0, 34.0, 35.0, 37.0, 32.0, 19.0, 24.0, 19.0, 25.0, 18.0, 12.0, 12.0, 11.0, 7.0, 4.0, 1.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.337371826171875, -44.09278106689453, -42.84818649291992, -41.60359573364258, -40.35900115966797, -39.114410400390625, -37.869815826416016, -36.62522506713867, -35.38063049316406, -34.13603973388672, -32.89144515991211, -31.646852493286133, -30.402259826660156, -29.157669067382812, -27.913076400756836, -26.66848373413086, -25.423892974853516, -24.17930030822754, -22.934707641601562, -21.690114974975586, -20.44552230834961, -19.200931549072266, -17.95633888244629, -16.711746215820312, -15.467153549194336, -14.22256088256836, -12.977968215942383, -11.733376502990723, -10.488783836364746, -9.24419116973877, -7.999598979949951, -6.755006790161133, -5.510414123535156, -4.26582145690918, -3.0212292671203613, -1.7766368389129639, -0.5320444107055664, 0.7125482559204102, 1.9571404457092285, 3.201732635498047, 4.446325302124023, 5.69091796875, 6.935510158538818, 8.180102348327637, 9.424695014953613, 10.66928768157959, 11.91387939453125, 13.158472061157227, 14.403064727783203, 15.64765739440918, 16.892250061035156, 18.136842727661133, 19.38143539428711, 20.626026153564453, 21.87061882019043, 23.115211486816406, 24.359804153442383, 25.60439682006836, 26.848989486694336, 28.093582153320312, 29.338172912597656, 30.582767486572266, 31.82735824584961, 33.07195281982422, 34.31654357910156]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 5.0, 3.0, 8.0, 18.0, 24.0, 30.0, 46.0, 78.0, 121.0, 168.0, 308.0, 613.0, 1076.0, 2081.0, 4190.0, 8619.0, 19775.0, 50629.0, 151727.0, 616475.0, 2034945.0, 965451.0, 222083.0, 68878.0, 25837.0, 11003.0, 4969.0, 2398.0, 1225.0, 671.0, 335.0, 193.0, 129.0, 61.0, 39.0, 22.0, 17.0, 13.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.90625, -2.8114013671875, -2.716552734375, -2.6217041015625, -2.52685546875, -2.4320068359375, -2.337158203125, -2.2423095703125, -2.1474609375, -2.0526123046875, -1.957763671875, -1.8629150390625, -1.76806640625, -1.6732177734375, -1.578369140625, -1.4835205078125, -1.388671875, -1.2938232421875, -1.198974609375, -1.1041259765625, -1.00927734375, -0.9144287109375, -0.819580078125, -0.7247314453125, -0.6298828125, -0.5350341796875, -0.440185546875, -0.3453369140625, -0.25048828125, -0.1556396484375, -0.060791015625, 0.0340576171875, 0.12890625, 0.2237548828125, 0.318603515625, 0.4134521484375, 0.50830078125, 0.6031494140625, 0.697998046875, 0.7928466796875, 0.8876953125, 0.9825439453125, 1.077392578125, 1.1722412109375, 1.26708984375, 1.3619384765625, 1.456787109375, 1.5516357421875, 1.646484375, 1.7413330078125, 1.836181640625, 1.9310302734375, 2.02587890625, 2.1207275390625, 2.215576171875, 2.3104248046875, 2.4052734375, 2.5001220703125, 2.594970703125, 2.6898193359375, 2.78466796875, 2.8795166015625, 2.974365234375, 3.0692138671875, 3.1640625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 3.0, 6.0, 4.0, 7.0, 15.0, 12.0, 13.0, 37.0, 30.0, 45.0, 46.0, 52.0, 58.0, 51.0, 64.0, 67.0, 69.0, 72.0, 65.0, 47.0, 53.0, 41.0, 37.0, 21.0, 16.0, 18.0, 12.0, 20.0, 10.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.99078369140625, -2.8995361328125, -2.80828857421875, -2.717041015625, -2.62579345703125, -2.5345458984375, -2.44329833984375, -2.35205078125, -2.26080322265625, -2.1695556640625, -2.07830810546875, -1.987060546875, -1.89581298828125, -1.8045654296875, -1.71331787109375, -1.6220703125, -1.53082275390625, -1.4395751953125, -1.34832763671875, -1.257080078125, -1.16583251953125, -1.0745849609375, -0.98333740234375, -0.89208984375, -0.80084228515625, -0.7095947265625, -0.61834716796875, -0.527099609375, -0.43585205078125, -0.3446044921875, -0.25335693359375, -0.162109375, -0.07086181640625, 0.0203857421875, 0.11163330078125, 0.202880859375, 0.29412841796875, 0.3853759765625, 0.47662353515625, 0.56787109375, 0.65911865234375, 0.7503662109375, 0.84161376953125, 0.932861328125, 1.02410888671875, 1.1153564453125, 1.20660400390625, 1.2978515625, 1.38909912109375, 1.4803466796875, 1.57159423828125, 1.662841796875, 1.75408935546875, 1.8453369140625, 1.93658447265625, 2.02783203125, 2.11907958984375, 2.2103271484375, 2.30157470703125, 2.392822265625, 2.48406982421875, 2.5753173828125, 2.66656494140625, 2.7578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 4.0, 4.0, 10.0, 26.0, 48.0, 57.0, 157.0, 304.0, 734.0, 2117.0, 8906.0, 55252.0, 702516.0, 3131792.0, 252305.0, 30516.0, 6116.0, 1884.0, 693.0, 347.0, 209.0, 109.0, 77.0, 39.0, 25.0, 17.0, 9.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.76171875, -7.50567626953125, -7.2496337890625, -6.99359130859375, -6.737548828125, -6.48150634765625, -6.2254638671875, -5.96942138671875, -5.71337890625, -5.45733642578125, -5.2012939453125, -4.94525146484375, -4.689208984375, -4.43316650390625, -4.1771240234375, -3.92108154296875, -3.6650390625, -3.40899658203125, -3.1529541015625, -2.89691162109375, -2.640869140625, -2.38482666015625, -2.1287841796875, -1.87274169921875, -1.61669921875, -1.36065673828125, -1.1046142578125, -0.84857177734375, -0.592529296875, -0.33648681640625, -0.0804443359375, 0.17559814453125, 0.431640625, 0.68768310546875, 0.9437255859375, 1.19976806640625, 1.455810546875, 1.71185302734375, 1.9678955078125, 2.22393798828125, 2.47998046875, 2.73602294921875, 2.9920654296875, 3.24810791015625, 3.504150390625, 3.76019287109375, 4.0162353515625, 4.27227783203125, 4.5283203125, 4.78436279296875, 5.0404052734375, 5.29644775390625, 5.552490234375, 5.80853271484375, 6.0645751953125, 6.32061767578125, 6.57666015625, 6.83270263671875, 7.0887451171875, 7.34478759765625, 7.600830078125, 7.85687255859375, 8.1129150390625, 8.36895751953125, 8.625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 8.0, 16.0, 17.0, 44.0, 40.0, 67.0, 122.0, 165.0, 229.0, 413.0, 578.0, 667.0, 559.0, 373.0, 235.0, 186.0, 92.0, 77.0, 51.0, 35.0, 25.0, 24.0, 8.0, 6.0, 8.0, 4.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.015625, -4.7803955078125, -4.545166015625, -4.3099365234375, -4.07470703125, -3.8394775390625, -3.604248046875, -3.3690185546875, -3.1337890625, -2.8985595703125, -2.663330078125, -2.4281005859375, -2.19287109375, -1.9576416015625, -1.722412109375, -1.4871826171875, -1.251953125, -1.0167236328125, -0.781494140625, -0.5462646484375, -0.31103515625, -0.0758056640625, 0.159423828125, 0.3946533203125, 0.6298828125, 0.8651123046875, 1.100341796875, 1.3355712890625, 1.57080078125, 1.8060302734375, 2.041259765625, 2.2764892578125, 2.51171875, 2.7469482421875, 2.982177734375, 3.2174072265625, 3.45263671875, 3.6878662109375, 3.923095703125, 4.1583251953125, 4.3935546875, 4.6287841796875, 4.864013671875, 5.0992431640625, 5.33447265625, 5.5697021484375, 5.804931640625, 6.0401611328125, 6.275390625, 6.5106201171875, 6.745849609375, 6.9810791015625, 7.21630859375, 7.4515380859375, 7.686767578125, 7.9219970703125, 8.1572265625, 8.3924560546875, 8.627685546875, 8.8629150390625, 9.09814453125, 9.3333740234375, 9.568603515625, 9.8038330078125, 10.0390625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 16.0, 27.0, 53.0, 74.0, 125.0, 132.0, 174.0, 134.0, 97.0, 62.0, 34.0, 10.0, 15.0, 8.0, 4.0, 4.0, 6.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.03895568847656, -31.859479904174805, -29.680004119873047, -27.500526428222656, -25.32105255126953, -23.14157485961914, -20.962099075317383, -18.782623291015625, -16.603147506713867, -14.42367172241211, -12.244195938110352, -10.064719200134277, -7.8852434158325195, -5.705767631530762, -3.5262908935546875, -1.3468151092529297, 0.8326606750488281, 3.012136697769165, 5.191612720489502, 7.371088981628418, 9.550564765930176, 11.730040550231934, 13.909517288208008, 16.088993072509766, 18.268468856811523, 20.44794464111328, 22.62742042541504, 24.806896209716797, 26.986373901367188, 29.165847778320312, 31.345325469970703, 33.524803161621094, 35.70427703857422, 37.88375473022461, 40.063228607177734, 42.242706298828125, 44.42218017578125, 46.60165786743164, 48.78113555908203, 50.960609436035156, 53.14008331298828, 55.31956100463867, 57.4990348815918, 59.67851257324219, 61.85798645019531, 64.03746032714844, 66.2169418334961, 68.39641571044922, 70.57589721679688, 72.75537109375, 74.93485260009766, 77.11432647705078, 79.2938003540039, 81.47327423095703, 83.65275573730469, 85.83222961425781, 88.01170349121094, 90.19117736816406, 92.37065887451172, 94.55013275146484, 96.72960662841797, 98.9090805053711, 101.08856201171875, 103.26803588867188, 105.447509765625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 8.0, 6.0, 7.0, 8.0, 12.0, 27.0, 15.0, 26.0, 31.0, 30.0, 34.0, 51.0, 54.0, 33.0, 50.0, 41.0, 45.0, 47.0, 49.0, 45.0, 46.0, 33.0, 43.0, 32.0, 36.0, 38.0, 29.0, 21.0, 15.0, 9.0, 18.0, 16.0, 13.0, 7.0, 8.0, 5.0, 10.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-42.47863006591797, -41.298622131347656, -40.118614196777344, -38.93860626220703, -37.75859832763672, -36.578590393066406, -35.398582458496094, -34.21857452392578, -33.03856658935547, -31.858558654785156, -30.678550720214844, -29.49854278564453, -28.31853485107422, -27.138526916503906, -25.95851707458496, -24.77850914001465, -23.598499298095703, -22.41849136352539, -21.238483428955078, -20.058475494384766, -18.878467559814453, -17.69845962524414, -16.518449783325195, -15.338441848754883, -14.15843391418457, -12.978425979614258, -11.798418045043945, -10.618409156799316, -9.438401222229004, -8.258393287658691, -7.078384876251221, -5.89837646484375, -4.718372344970703, -3.5383641719818115, -2.35835599899292, -1.1783478260040283, 0.0016603469848632812, 1.1816682815551758, 2.3616766929626465, 3.541685104370117, 4.72169303894043, 5.901700973510742, 7.081709384918213, 8.261717796325684, 9.441725730895996, 10.621733665466309, 11.801742553710938, 12.98175048828125, 14.161758422851562, 15.341766357421875, 16.521774291992188, 17.7017822265625, 18.881790161132812, 20.061798095703125, 21.24180793762207, 22.421815872192383, 23.601823806762695, 24.781831741333008, 25.96183967590332, 27.141847610473633, 28.321857452392578, 29.50186538696289, 30.681873321533203, 31.861881256103516, 33.04188919067383]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 7.0, 11.0, 11.0, 15.0, 29.0, 35.0, 39.0, 79.0, 121.0, 184.0, 283.0, 406.0, 601.0, 1029.0, 1672.0, 2683.0, 4747.0, 8503.0, 16928.0, 35158.0, 82822.0, 239504.0, 383029.0, 156662.0, 58266.0, 25890.0, 13044.0, 6960.0, 3800.0, 2287.0, 1343.0, 849.0, 552.0, 337.0, 223.0, 162.0, 89.0, 62.0, 39.0, 36.0, 17.0, 12.0, 11.0, 7.0, 4.0, 2.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.72265625, -4.57647705078125, -4.4302978515625, -4.28411865234375, -4.137939453125, -3.99176025390625, -3.8455810546875, -3.69940185546875, -3.55322265625, -3.40704345703125, -3.2608642578125, -3.11468505859375, -2.968505859375, -2.82232666015625, -2.6761474609375, -2.52996826171875, -2.3837890625, -2.23760986328125, -2.0914306640625, -1.94525146484375, -1.799072265625, -1.65289306640625, -1.5067138671875, -1.36053466796875, -1.21435546875, -1.06817626953125, -0.9219970703125, -0.77581787109375, -0.629638671875, -0.48345947265625, -0.3372802734375, -0.19110107421875, -0.044921875, 0.10125732421875, 0.2474365234375, 0.39361572265625, 0.539794921875, 0.68597412109375, 0.8321533203125, 0.97833251953125, 1.12451171875, 1.27069091796875, 1.4168701171875, 1.56304931640625, 1.709228515625, 1.85540771484375, 2.0015869140625, 2.14776611328125, 2.2939453125, 2.44012451171875, 2.5863037109375, 2.73248291015625, 2.878662109375, 3.02484130859375, 3.1710205078125, 3.31719970703125, 3.46337890625, 3.60955810546875, 3.7557373046875, 3.90191650390625, 4.048095703125, 4.19427490234375, 4.3404541015625, 4.48663330078125, 4.6328125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 11.0, 8.0, 13.0, 19.0, 12.0, 24.0, 25.0, 27.0, 26.0, 49.0, 38.0, 53.0, 43.0, 36.0, 51.0, 53.0, 46.0, 46.0, 56.0, 61.0, 44.0, 34.0, 40.0, 35.0, 17.0, 25.0, 17.0, 20.0, 9.0, 10.0, 9.0, 10.0, 5.0, 4.0, 8.0, 5.0, 0.0, 1.0, 4.0, 1.0, 2.0], "bins": [-2.904296875, -2.82928466796875, -2.7542724609375, -2.67926025390625, -2.604248046875, -2.52923583984375, -2.4542236328125, -2.37921142578125, -2.30419921875, -2.22918701171875, -2.1541748046875, -2.07916259765625, -2.004150390625, -1.92913818359375, -1.8541259765625, -1.77911376953125, -1.7041015625, -1.62908935546875, -1.5540771484375, -1.47906494140625, -1.404052734375, -1.32904052734375, -1.2540283203125, -1.17901611328125, -1.10400390625, -1.02899169921875, -0.9539794921875, -0.87896728515625, -0.803955078125, -0.72894287109375, -0.6539306640625, -0.57891845703125, -0.50390625, -0.42889404296875, -0.3538818359375, -0.27886962890625, -0.203857421875, -0.12884521484375, -0.0538330078125, 0.02117919921875, 0.09619140625, 0.17120361328125, 0.2462158203125, 0.32122802734375, 0.396240234375, 0.47125244140625, 0.5462646484375, 0.62127685546875, 0.6962890625, 0.77130126953125, 0.8463134765625, 0.92132568359375, 0.996337890625, 1.07135009765625, 1.1463623046875, 1.22137451171875, 1.29638671875, 1.37139892578125, 1.4464111328125, 1.52142333984375, 1.596435546875, 1.67144775390625, 1.7464599609375, 1.82147216796875, 1.896484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 2.0, 1.0, 5.0, 10.0, 10.0, 7.0, 16.0, 27.0, 41.0, 47.0, 67.0, 81.0, 109.0, 140.0, 236.0, 358.0, 495.0, 878.0, 1588.0, 3382.0, 8582.0, 26607.0, 124691.0, 705523.0, 131297.0, 27611.0, 8891.0, 3583.0, 1661.0, 915.0, 537.0, 341.0, 234.0, 156.0, 119.0, 85.0, 51.0, 46.0, 30.0, 23.0, 16.0, 16.0, 7.0, 7.0, 8.0, 6.0, 5.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.0703125, -7.796875, -7.5234375, -7.25, -6.9765625, -6.703125, -6.4296875, -6.15625, -5.8828125, -5.609375, -5.3359375, -5.0625, -4.7890625, -4.515625, -4.2421875, -3.96875, -3.6953125, -3.421875, -3.1484375, -2.875, -2.6015625, -2.328125, -2.0546875, -1.78125, -1.5078125, -1.234375, -0.9609375, -0.6875, -0.4140625, -0.140625, 0.1328125, 0.40625, 0.6796875, 0.953125, 1.2265625, 1.5, 1.7734375, 2.046875, 2.3203125, 2.59375, 2.8671875, 3.140625, 3.4140625, 3.6875, 3.9609375, 4.234375, 4.5078125, 4.78125, 5.0546875, 5.328125, 5.6015625, 5.875, 6.1484375, 6.421875, 6.6953125, 6.96875, 7.2421875, 7.515625, 7.7890625, 8.0625, 8.3359375, 8.609375, 8.8828125, 9.15625, 9.4296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 4.0, 11.0, 11.0, 19.0, 29.0, 20.0, 34.0, 35.0, 32.0, 40.0, 53.0, 50.0, 58.0, 41.0, 59.0, 64.0, 49.0, 57.0, 44.0, 39.0, 39.0, 31.0, 36.0, 18.0, 28.0, 23.0, 18.0, 11.0, 10.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6640625, -9.328857421875, -8.99365234375, -8.658447265625, -8.3232421875, -7.988037109375, -7.65283203125, -7.317626953125, -6.982421875, -6.647216796875, -6.31201171875, -5.976806640625, -5.6416015625, -5.306396484375, -4.97119140625, -4.635986328125, -4.30078125, -3.965576171875, -3.63037109375, -3.295166015625, -2.9599609375, -2.624755859375, -2.28955078125, -1.954345703125, -1.619140625, -1.283935546875, -0.94873046875, -0.613525390625, -0.2783203125, 0.056884765625, 0.39208984375, 0.727294921875, 1.0625, 1.397705078125, 1.73291015625, 2.068115234375, 2.4033203125, 2.738525390625, 3.07373046875, 3.408935546875, 3.744140625, 4.079345703125, 4.41455078125, 4.749755859375, 5.0849609375, 5.420166015625, 5.75537109375, 6.090576171875, 6.42578125, 6.760986328125, 7.09619140625, 7.431396484375, 7.7666015625, 8.101806640625, 8.43701171875, 8.772216796875, 9.107421875, 9.442626953125, 9.77783203125, 10.113037109375, 10.4482421875, 10.783447265625, 11.11865234375, 11.453857421875, 11.7890625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 2.0, 3.0, 6.0, 5.0, 15.0, 8.0, 20.0, 30.0, 34.0, 61.0, 82.0, 116.0, 207.0, 337.0, 606.0, 1210.0, 2510.0, 6351.0, 18461.0, 57999.0, 246656.0, 573589.0, 95750.0, 28075.0, 9488.0, 3665.0, 1427.0, 771.0, 381.0, 229.0, 118.0, 107.0, 70.0, 54.0, 26.0, 22.0, 17.0, 9.0, 16.0, 4.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.46875, -3.37017822265625, -3.2716064453125, -3.17303466796875, -3.074462890625, -2.97589111328125, -2.8773193359375, -2.77874755859375, -2.68017578125, -2.58160400390625, -2.4830322265625, -2.38446044921875, -2.285888671875, -2.18731689453125, -2.0887451171875, -1.99017333984375, -1.8916015625, -1.79302978515625, -1.6944580078125, -1.59588623046875, -1.497314453125, -1.39874267578125, -1.3001708984375, -1.20159912109375, -1.10302734375, -1.00445556640625, -0.9058837890625, -0.80731201171875, -0.708740234375, -0.61016845703125, -0.5115966796875, -0.41302490234375, -0.314453125, -0.21588134765625, -0.1173095703125, -0.01873779296875, 0.079833984375, 0.17840576171875, 0.2769775390625, 0.37554931640625, 0.47412109375, 0.57269287109375, 0.6712646484375, 0.76983642578125, 0.868408203125, 0.96697998046875, 1.0655517578125, 1.16412353515625, 1.2626953125, 1.36126708984375, 1.4598388671875, 1.55841064453125, 1.656982421875, 1.75555419921875, 1.8541259765625, 1.95269775390625, 2.05126953125, 2.14984130859375, 2.2484130859375, 2.34698486328125, 2.445556640625, 2.54412841796875, 2.6427001953125, 2.74127197265625, 2.83984375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 11.0, 0.0, 7.0, 8.0, 10.0, 8.0, 15.0, 27.0, 27.0, 30.0, 45.0, 72.0, 86.0, 153.0, 137.0, 122.0, 63.0, 45.0, 33.0, 31.0, 12.0, 18.0, 9.0, 8.0, 10.0, 6.0, 7.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0013294219970703125, -0.0012905895709991455, -0.0012517571449279785, -0.0012129247188568115, -0.0011740922927856445, -0.0011352598667144775, -0.0010964274406433105, -0.0010575950145721436, -0.0010187625885009766, -0.0009799301624298096, -0.0009410977363586426, -0.0009022653102874756, -0.0008634328842163086, -0.0008246004581451416, -0.0007857680320739746, -0.0007469356060028076, -0.0007081031799316406, -0.0006692707538604736, -0.0006304383277893066, -0.0005916059017181396, -0.0005527734756469727, -0.0005139410495758057, -0.00047510862350463867, -0.0004362761974334717, -0.0003974437713623047, -0.0003586113452911377, -0.0003197789192199707, -0.0002809464931488037, -0.00024211406707763672, -0.00020328164100646973, -0.00016444921493530273, -0.00012561678886413574, -8.678436279296875e-05, -4.795193672180176e-05, -9.119510650634766e-06, 2.9712915420532227e-05, 6.854534149169922e-05, 0.00010737776756286621, 0.0001462101936340332, 0.0001850426197052002, 0.0002238750457763672, 0.0002627074718475342, 0.00030153989791870117, 0.00034037232398986816, 0.00037920475006103516, 0.00041803717613220215, 0.00045686960220336914, 0.0004957020282745361, 0.0005345344543457031, 0.0005733668804168701, 0.0006121993064880371, 0.0006510317325592041, 0.0006898641586303711, 0.0007286965847015381, 0.0007675290107727051, 0.0008063614368438721, 0.0008451938629150391, 0.0008840262889862061, 0.000922858715057373, 0.00096169114112854, 0.001000523567199707, 0.001039355993270874, 0.001078188419342041, 0.001117020845413208, 0.001155853271484375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 11.0, 13.0, 19.0, 24.0, 36.0, 56.0, 90.0, 120.0, 177.0, 319.0, 468.0, 794.0, 1332.0, 2657.0, 5861.0, 16292.0, 55920.0, 243693.0, 577764.0, 99163.0, 26766.0, 8963.0, 3729.0, 1784.0, 964.0, 556.0, 345.0, 234.0, 127.0, 95.0, 66.0, 43.0, 34.0, 14.0, 16.0, 6.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.005859375, -2.91534423828125, -2.8248291015625, -2.73431396484375, -2.643798828125, -2.55328369140625, -2.4627685546875, -2.37225341796875, -2.28173828125, -2.19122314453125, -2.1007080078125, -2.01019287109375, -1.919677734375, -1.82916259765625, -1.7386474609375, -1.64813232421875, -1.5576171875, -1.46710205078125, -1.3765869140625, -1.28607177734375, -1.195556640625, -1.10504150390625, -1.0145263671875, -0.92401123046875, -0.83349609375, -0.74298095703125, -0.6524658203125, -0.56195068359375, -0.471435546875, -0.38092041015625, -0.2904052734375, -0.19989013671875, -0.109375, -0.01885986328125, 0.0716552734375, 0.16217041015625, 0.252685546875, 0.34320068359375, 0.4337158203125, 0.52423095703125, 0.61474609375, 0.70526123046875, 0.7957763671875, 0.88629150390625, 0.976806640625, 1.06732177734375, 1.1578369140625, 1.24835205078125, 1.3388671875, 1.42938232421875, 1.5198974609375, 1.61041259765625, 1.700927734375, 1.79144287109375, 1.8819580078125, 1.97247314453125, 2.06298828125, 2.15350341796875, 2.2440185546875, 2.33453369140625, 2.425048828125, 2.51556396484375, 2.6060791015625, 2.69659423828125, 2.787109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 8.0, 13.0, 7.0, 6.0, 18.0, 16.0, 25.0, 36.0, 31.0, 63.0, 68.0, 101.0, 89.0, 96.0, 98.0, 86.0, 46.0, 42.0, 39.0, 26.0, 20.0, 14.0, 10.0, 11.0, 6.0, 4.0, 6.0, 4.0, 1.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01953125, -2.91845703125, -2.8173828125, -2.71630859375, -2.615234375, -2.51416015625, -2.4130859375, -2.31201171875, -2.2109375, -2.10986328125, -2.0087890625, -1.90771484375, -1.806640625, -1.70556640625, -1.6044921875, -1.50341796875, -1.40234375, -1.30126953125, -1.2001953125, -1.09912109375, -0.998046875, -0.89697265625, -0.7958984375, -0.69482421875, -0.59375, -0.49267578125, -0.3916015625, -0.29052734375, -0.189453125, -0.08837890625, 0.0126953125, 0.11376953125, 0.21484375, 0.31591796875, 0.4169921875, 0.51806640625, 0.619140625, 0.72021484375, 0.8212890625, 0.92236328125, 1.0234375, 1.12451171875, 1.2255859375, 1.32666015625, 1.427734375, 1.52880859375, 1.6298828125, 1.73095703125, 1.83203125, 1.93310546875, 2.0341796875, 2.13525390625, 2.236328125, 2.33740234375, 2.4384765625, 2.53955078125, 2.640625, 2.74169921875, 2.8427734375, 2.94384765625, 3.044921875, 3.14599609375, 3.2470703125, 3.34814453125, 3.44921875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 8.0, 16.0, 34.0, 76.0, 175.0, 332.0, 186.0, 80.0, 43.0, 12.0, 11.0, 8.0, 2.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.56970977783203, -83.31324005126953, -80.05677032470703, -76.80030059814453, -73.54383087158203, -70.28736114501953, -67.03089904785156, -63.7744255065918, -60.5179557800293, -57.2614860534668, -54.0050163269043, -50.74855041503906, -47.49208068847656, -44.23561096191406, -40.97914123535156, -37.72267150878906, -34.46620178222656, -31.209732055664062, -27.953262329101562, -24.696794509887695, -21.440324783325195, -18.183855056762695, -14.927387237548828, -11.670917510986328, -8.414447784423828, -5.157978534698486, -1.9015092849731445, 1.354959487915039, 4.611429214477539, 7.867898941040039, 11.124366760253906, 14.380836486816406, 17.637298583984375, 20.893768310546875, 24.150238037109375, 27.406705856323242, 30.663175582885742, 33.919647216796875, 37.17611312866211, 40.43258285522461, 43.68905258178711, 46.94552230834961, 50.20199203491211, 53.458457946777344, 56.714927673339844, 59.971397399902344, 63.227867126464844, 66.48433685302734, 69.74080657958984, 72.99727630615234, 76.25374603271484, 79.51021575927734, 82.76668548583984, 86.02315521240234, 89.27961730957031, 92.53608703613281, 95.79255676269531, 99.04902648925781, 102.30549621582031, 105.56196594238281, 108.81843566894531, 112.07490539550781, 115.33137512207031, 118.58784484863281, 121.84431457519531]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 9.0, 10.0, 7.0, 14.0, 10.0, 16.0, 25.0, 22.0, 20.0, 33.0, 21.0, 34.0, 35.0, 34.0, 54.0, 69.0, 79.0, 57.0, 54.0, 46.0, 47.0, 28.0, 38.0, 41.0, 22.0, 31.0, 25.0, 15.0, 16.0, 18.0, 12.0, 10.0, 4.0, 13.0, 11.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.468772888183594, -39.158447265625, -37.848121643066406, -36.53779220581055, -35.22746658325195, -33.91714096069336, -32.606815338134766, -31.296489715576172, -29.986162185668945, -28.67583656311035, -27.365509033203125, -26.05518341064453, -24.744857788085938, -23.43453025817871, -22.124204635620117, -20.81387710571289, -19.503551483154297, -18.193225860595703, -16.882898330688477, -15.572572708129883, -14.262246131896973, -12.951919555664062, -11.641593933105469, -10.331267356872559, -9.020940780639648, -7.710614204406738, -6.400288105010986, -5.089962005615234, -3.779635429382324, -2.469308853149414, -1.158982753753662, 0.15134334564208984, 1.4616737365722656, 2.7720000743865967, 4.082326412200928, 5.39265251159668, 6.70297908782959, 8.0133056640625, 9.323631286621094, 10.633957862854004, 11.944284439086914, 13.254611015319824, 14.564937591552734, 15.875263214111328, 17.185588836669922, 18.49591636657715, 19.806241989135742, 21.11656951904297, 22.426895141601562, 23.737220764160156, 25.047548294067383, 26.357873916625977, 27.668201446533203, 28.978527069091797, 30.28885269165039, 31.599178314208984, 32.909507751464844, 34.21983337402344, 35.53015899658203, 36.84048843383789, 38.150814056396484, 39.46113967895508, 40.77146530151367, 42.081790924072266, 43.39211654663086]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 8.0, 14.0, 21.0, 22.0, 33.0, 44.0, 59.0, 95.0, 105.0, 194.0, 327.0, 478.0, 860.0, 1565.0, 2888.0, 5645.0, 11858.0, 27483.0, 73475.0, 270085.0, 1364618.0, 1869566.0, 403136.0, 98454.0, 34210.0, 14534.0, 6696.0, 3354.0, 1799.0, 973.0, 597.0, 363.0, 226.0, 159.0, 79.0, 73.0, 42.0, 37.0, 30.0, 19.0, 11.0, 9.0, 6.0, 7.0, 5.0, 4.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.615234375, -2.52545166015625, -2.4356689453125, -2.34588623046875, -2.256103515625, -2.16632080078125, -2.0765380859375, -1.98675537109375, -1.89697265625, -1.80718994140625, -1.7174072265625, -1.62762451171875, -1.537841796875, -1.44805908203125, -1.3582763671875, -1.26849365234375, -1.1787109375, -1.08892822265625, -0.9991455078125, -0.90936279296875, -0.819580078125, -0.72979736328125, -0.6400146484375, -0.55023193359375, -0.46044921875, -0.37066650390625, -0.2808837890625, -0.19110107421875, -0.101318359375, -0.01153564453125, 0.0782470703125, 0.16802978515625, 0.2578125, 0.34759521484375, 0.4373779296875, 0.52716064453125, 0.616943359375, 0.70672607421875, 0.7965087890625, 0.88629150390625, 0.97607421875, 1.06585693359375, 1.1556396484375, 1.24542236328125, 1.335205078125, 1.42498779296875, 1.5147705078125, 1.60455322265625, 1.6943359375, 1.78411865234375, 1.8739013671875, 1.96368408203125, 2.053466796875, 2.14324951171875, 2.2330322265625, 2.32281494140625, 2.41259765625, 2.50238037109375, 2.5921630859375, 2.68194580078125, 2.771728515625, 2.86151123046875, 2.9512939453125, 3.04107666015625, 3.130859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 8.0, 8.0, 10.0, 23.0, 25.0, 20.0, 24.0, 44.0, 23.0, 36.0, 38.0, 52.0, 40.0, 69.0, 73.0, 66.0, 43.0, 60.0, 72.0, 43.0, 43.0, 32.0, 33.0, 15.0, 26.0, 14.0, 12.0, 11.0, 14.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.125, -2.042877197265625, -1.96075439453125, -1.878631591796875, -1.7965087890625, -1.714385986328125, -1.63226318359375, -1.550140380859375, -1.468017578125, -1.385894775390625, -1.30377197265625, -1.221649169921875, -1.1395263671875, -1.057403564453125, -0.97528076171875, -0.893157958984375, -0.81103515625, -0.728912353515625, -0.64678955078125, -0.564666748046875, -0.4825439453125, -0.400421142578125, -0.31829833984375, -0.236175537109375, -0.154052734375, -0.071929931640625, 0.01019287109375, 0.092315673828125, 0.1744384765625, 0.256561279296875, 0.33868408203125, 0.420806884765625, 0.5029296875, 0.585052490234375, 0.66717529296875, 0.749298095703125, 0.8314208984375, 0.913543701171875, 0.99566650390625, 1.077789306640625, 1.159912109375, 1.242034912109375, 1.32415771484375, 1.406280517578125, 1.4884033203125, 1.570526123046875, 1.65264892578125, 1.734771728515625, 1.81689453125, 1.899017333984375, 1.98114013671875, 2.063262939453125, 2.1453857421875, 2.227508544921875, 2.30963134765625, 2.391754150390625, 2.473876953125, 2.555999755859375, 2.63812255859375, 2.720245361328125, 2.8023681640625, 2.884490966796875, 2.96661376953125, 3.048736572265625, 3.130859375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 5.0, 12.0, 9.0, 13.0, 17.0, 26.0, 33.0, 47.0, 77.0, 129.0, 188.0, 364.0, 739.0, 1854.0, 5155.0, 18306.0, 84704.0, 831358.0, 2933262.0, 261103.0, 41012.0, 10159.0, 3243.0, 1155.0, 565.0, 277.0, 162.0, 95.0, 60.0, 41.0, 33.0, 20.0, 16.0, 13.0, 16.0, 2.0, 7.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.31719970703125, -5.1148681640625, -4.91253662109375, -4.710205078125, -4.50787353515625, -4.3055419921875, -4.10321044921875, -3.90087890625, -3.69854736328125, -3.4962158203125, -3.29388427734375, -3.091552734375, -2.88922119140625, -2.6868896484375, -2.48455810546875, -2.2822265625, -2.07989501953125, -1.8775634765625, -1.67523193359375, -1.472900390625, -1.27056884765625, -1.0682373046875, -0.86590576171875, -0.66357421875, -0.46124267578125, -0.2589111328125, -0.05657958984375, 0.145751953125, 0.34808349609375, 0.5504150390625, 0.75274658203125, 0.955078125, 1.15740966796875, 1.3597412109375, 1.56207275390625, 1.764404296875, 1.96673583984375, 2.1690673828125, 2.37139892578125, 2.57373046875, 2.77606201171875, 2.9783935546875, 3.18072509765625, 3.383056640625, 3.58538818359375, 3.7877197265625, 3.99005126953125, 4.1923828125, 4.39471435546875, 4.5970458984375, 4.79937744140625, 5.001708984375, 5.20404052734375, 5.4063720703125, 5.60870361328125, 5.81103515625, 6.01336669921875, 6.2156982421875, 6.41802978515625, 6.620361328125, 6.82269287109375, 7.0250244140625, 7.22735595703125, 7.4296875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 6.0, 7.0, 3.0, 11.0, 15.0, 11.0, 20.0, 21.0, 25.0, 24.0, 37.0, 55.0, 74.0, 89.0, 133.0, 193.0, 298.0, 347.0, 489.0, 504.0, 460.0, 343.0, 229.0, 182.0, 116.0, 90.0, 59.0, 53.0, 40.0, 32.0, 23.0, 18.0, 18.0, 9.0, 8.0, 9.0, 8.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.8359375, -4.686279296875, -4.53662109375, -4.386962890625, -4.2373046875, -4.087646484375, -3.93798828125, -3.788330078125, -3.638671875, -3.489013671875, -3.33935546875, -3.189697265625, -3.0400390625, -2.890380859375, -2.74072265625, -2.591064453125, -2.44140625, -2.291748046875, -2.14208984375, -1.992431640625, -1.8427734375, -1.693115234375, -1.54345703125, -1.393798828125, -1.244140625, -1.094482421875, -0.94482421875, -0.795166015625, -0.6455078125, -0.495849609375, -0.34619140625, -0.196533203125, -0.046875, 0.102783203125, 0.25244140625, 0.402099609375, 0.5517578125, 0.701416015625, 0.85107421875, 1.000732421875, 1.150390625, 1.300048828125, 1.44970703125, 1.599365234375, 1.7490234375, 1.898681640625, 2.04833984375, 2.197998046875, 2.34765625, 2.497314453125, 2.64697265625, 2.796630859375, 2.9462890625, 3.095947265625, 3.24560546875, 3.395263671875, 3.544921875, 3.694580078125, 3.84423828125, 3.993896484375, 4.1435546875, 4.293212890625, 4.44287109375, 4.592529296875, 4.7421875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 7.0, 11.0, 27.0, 52.0, 94.0, 166.0, 185.0, 170.0, 109.0, 89.0, 36.0, 17.0, 9.0, 3.0, 6.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-74.386962890625, -72.24458312988281, -70.10221099853516, -67.95983123779297, -65.81745910644531, -63.675079345703125, -61.5327033996582, -59.39032745361328, -57.247947692871094, -55.10557174682617, -52.96319580078125, -50.82081604003906, -48.67844009399414, -46.53606414794922, -44.3936882019043, -42.251312255859375, -40.10893630981445, -37.96656036376953, -35.82418441772461, -33.68180847167969, -31.5394287109375, -29.397052764892578, -27.254676818847656, -25.112300872802734, -22.96992301940918, -20.827547073364258, -18.685169219970703, -16.54279327392578, -14.400416374206543, -12.258039474487305, -10.115663528442383, -7.9732866287231445, -5.830905914306641, -3.6885292530059814, -1.5461525917053223, 0.5962238311767578, 2.738600730895996, 4.880977630615234, 7.023353576660156, 9.165730476379395, 11.308107376098633, 13.450484275817871, 15.59286117553711, 17.73523712158203, 19.877613067626953, 22.019990921020508, 24.16236686706543, 26.304744720458984, 28.447120666503906, 30.589496612548828, 32.73187255859375, 34.87425231933594, 37.01662826538086, 39.15900421142578, 41.3013801574707, 43.443756103515625, 45.58613586425781, 47.728511810302734, 49.870887756347656, 52.013267517089844, 54.155643463134766, 56.29801940917969, 58.44039535522461, 60.58277130126953, 62.72514724731445]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 10.0, 1.0, 6.0, 9.0, 9.0, 17.0, 20.0, 15.0, 23.0, 31.0, 37.0, 35.0, 33.0, 46.0, 46.0, 58.0, 45.0, 60.0, 55.0, 35.0, 48.0, 48.0, 45.0, 29.0, 38.0, 26.0, 41.0, 27.0, 26.0, 22.0, 11.0, 12.0, 13.0, 8.0, 6.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.262693405151367, -30.378803253173828, -29.494915008544922, -28.611024856567383, -27.727134704589844, -26.843246459960938, -25.9593563079834, -25.07546615600586, -24.191577911376953, -23.307687759399414, -22.423799514770508, -21.53990936279297, -20.65601921081543, -19.77212905883789, -18.888240814208984, -18.004350662231445, -17.120460510253906, -16.236570358276367, -15.352681159973145, -14.468791961669922, -13.584901809692383, -12.70101261138916, -11.817123413085938, -10.933233261108398, -10.049344062805176, -9.165454864501953, -8.281564712524414, -7.397675514221191, -6.5137858390808105, -5.62989616394043, -4.746006965637207, -3.862117290496826, -2.978229522705078, -2.0943398475646973, -1.2104504108428955, -0.32656097412109375, 0.5573287010192871, 1.441218376159668, 2.3251075744628906, 3.2089972496032715, 4.092886924743652, 4.976776599884033, 5.860666275024414, 6.744555473327637, 7.628445148468018, 8.512334823608398, 9.396224021911621, 10.280113220214844, 11.164003372192383, 12.047892570495605, 12.931782722473145, 13.815671920776367, 14.699562072753906, 15.583451271057129, 16.46734046936035, 17.35123062133789, 18.235118865966797, 19.119009017944336, 20.002897262573242, 20.88678741455078, 21.77067756652832, 22.65456771850586, 23.538455963134766, 24.422346115112305, 25.306236267089844]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 14.0, 15.0, 31.0, 57.0, 91.0, 187.0, 331.0, 661.0, 1428.0, 3143.0, 8369.0, 28468.0, 135205.0, 501997.0, 288391.0, 57033.0, 14189.0, 4964.0, 2008.0, 940.0, 496.0, 231.0, 121.0, 71.0, 39.0, 28.0, 14.0, 14.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.015625, -5.8472900390625, -5.678955078125, -5.5106201171875, -5.34228515625, -5.1739501953125, -5.005615234375, -4.8372802734375, -4.6689453125, -4.5006103515625, -4.332275390625, -4.1639404296875, -3.99560546875, -3.8272705078125, -3.658935546875, -3.4906005859375, -3.322265625, -3.1539306640625, -2.985595703125, -2.8172607421875, -2.64892578125, -2.4805908203125, -2.312255859375, -2.1439208984375, -1.9755859375, -1.8072509765625, -1.638916015625, -1.4705810546875, -1.30224609375, -1.1339111328125, -0.965576171875, -0.7972412109375, -0.62890625, -0.4605712890625, -0.292236328125, -0.1239013671875, 0.04443359375, 0.2127685546875, 0.381103515625, 0.5494384765625, 0.7177734375, 0.8861083984375, 1.054443359375, 1.2227783203125, 1.39111328125, 1.5594482421875, 1.727783203125, 1.8961181640625, 2.064453125, 2.2327880859375, 2.401123046875, 2.5694580078125, 2.73779296875, 2.9061279296875, 3.074462890625, 3.2427978515625, 3.4111328125, 3.5794677734375, 3.747802734375, 3.9161376953125, 4.08447265625, 4.2528076171875, 4.421142578125, 4.5894775390625, 4.7578125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 11.0, 14.0, 11.0, 15.0, 18.0, 16.0, 30.0, 30.0, 28.0, 43.0, 32.0, 40.0, 50.0, 48.0, 50.0, 46.0, 49.0, 61.0, 47.0, 52.0, 45.0, 46.0, 34.0, 24.0, 38.0, 21.0, 17.0, 15.0, 18.0, 13.0, 7.0, 8.0, 4.0, 7.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.033172607421875, -1.95501708984375, -1.876861572265625, -1.7987060546875, -1.720550537109375, -1.64239501953125, -1.564239501953125, -1.486083984375, -1.407928466796875, -1.32977294921875, -1.251617431640625, -1.1734619140625, -1.095306396484375, -1.01715087890625, -0.938995361328125, -0.86083984375, -0.782684326171875, -0.70452880859375, -0.626373291015625, -0.5482177734375, -0.470062255859375, -0.39190673828125, -0.313751220703125, -0.235595703125, -0.157440185546875, -0.07928466796875, -0.001129150390625, 0.0770263671875, 0.155181884765625, 0.23333740234375, 0.311492919921875, 0.3896484375, 0.467803955078125, 0.54595947265625, 0.624114990234375, 0.7022705078125, 0.780426025390625, 0.85858154296875, 0.936737060546875, 1.014892578125, 1.093048095703125, 1.17120361328125, 1.249359130859375, 1.3275146484375, 1.405670166015625, 1.48382568359375, 1.561981201171875, 1.64013671875, 1.718292236328125, 1.79644775390625, 1.874603271484375, 1.9527587890625, 2.030914306640625, 2.10906982421875, 2.187225341796875, 2.265380859375, 2.343536376953125, 2.42169189453125, 2.499847412109375, 2.5780029296875, 2.656158447265625, 2.73431396484375, 2.812469482421875, 2.890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 6.0, 6.0, 4.0, 7.0, 9.0, 11.0, 21.0, 25.0, 41.0, 65.0, 103.0, 174.0, 336.0, 725.0, 1603.0, 3992.0, 13877.0, 82835.0, 677201.0, 226891.0, 29452.0, 6712.0, 2414.0, 945.0, 481.0, 269.0, 131.0, 79.0, 39.0, 32.0, 22.0, 13.0, 12.0, 5.0, 5.0, 2.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.359375, -5.151123046875, -4.94287109375, -4.734619140625, -4.5263671875, -4.318115234375, -4.10986328125, -3.901611328125, -3.693359375, -3.485107421875, -3.27685546875, -3.068603515625, -2.8603515625, -2.652099609375, -2.44384765625, -2.235595703125, -2.02734375, -1.819091796875, -1.61083984375, -1.402587890625, -1.1943359375, -0.986083984375, -0.77783203125, -0.569580078125, -0.361328125, -0.153076171875, 0.05517578125, 0.263427734375, 0.4716796875, 0.679931640625, 0.88818359375, 1.096435546875, 1.3046875, 1.512939453125, 1.72119140625, 1.929443359375, 2.1376953125, 2.345947265625, 2.55419921875, 2.762451171875, 2.970703125, 3.178955078125, 3.38720703125, 3.595458984375, 3.8037109375, 4.011962890625, 4.22021484375, 4.428466796875, 4.63671875, 4.844970703125, 5.05322265625, 5.261474609375, 5.4697265625, 5.677978515625, 5.88623046875, 6.094482421875, 6.302734375, 6.510986328125, 6.71923828125, 6.927490234375, 7.1357421875, 7.343994140625, 7.55224609375, 7.760498046875, 7.96875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 8.0, 6.0, 7.0, 4.0, 9.0, 17.0, 23.0, 22.0, 21.0, 33.0, 38.0, 45.0, 37.0, 48.0, 52.0, 41.0, 61.0, 58.0, 58.0, 51.0, 51.0, 51.0, 47.0, 43.0, 24.0, 30.0, 20.0, 18.0, 9.0, 18.0, 4.0, 12.0, 9.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.546875, -8.2684326171875, -7.989990234375, -7.7115478515625, -7.43310546875, -7.1546630859375, -6.876220703125, -6.5977783203125, -6.3193359375, -6.0408935546875, -5.762451171875, -5.4840087890625, -5.20556640625, -4.9271240234375, -4.648681640625, -4.3702392578125, -4.091796875, -3.8133544921875, -3.534912109375, -3.2564697265625, -2.97802734375, -2.6995849609375, -2.421142578125, -2.1427001953125, -1.8642578125, -1.5858154296875, -1.307373046875, -1.0289306640625, -0.75048828125, -0.4720458984375, -0.193603515625, 0.0848388671875, 0.36328125, 0.6417236328125, 0.920166015625, 1.1986083984375, 1.47705078125, 1.7554931640625, 2.033935546875, 2.3123779296875, 2.5908203125, 2.8692626953125, 3.147705078125, 3.4261474609375, 3.70458984375, 3.9830322265625, 4.261474609375, 4.5399169921875, 4.818359375, 5.0968017578125, 5.375244140625, 5.6536865234375, 5.93212890625, 6.2105712890625, 6.489013671875, 6.7674560546875, 7.0458984375, 7.3243408203125, 7.602783203125, 7.8812255859375, 8.15966796875, 8.4381103515625, 8.716552734375, 8.9949951171875, 9.2734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 9.0, 9.0, 19.0, 30.0, 38.0, 67.0, 80.0, 197.0, 387.0, 723.0, 1460.0, 3341.0, 8208.0, 23355.0, 81306.0, 317609.0, 483039.0, 88180.0, 25075.0, 8683.0, 3526.0, 1612.0, 734.0, 373.0, 179.0, 106.0, 75.0, 40.0, 34.0, 16.0, 14.0, 7.0, 9.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.919921875, -1.855987548828125, -1.79205322265625, -1.728118896484375, -1.6641845703125, -1.600250244140625, -1.53631591796875, -1.472381591796875, -1.408447265625, -1.344512939453125, -1.28057861328125, -1.216644287109375, -1.1527099609375, -1.088775634765625, -1.02484130859375, -0.960906982421875, -0.89697265625, -0.833038330078125, -0.76910400390625, -0.705169677734375, -0.6412353515625, -0.577301025390625, -0.51336669921875, -0.449432373046875, -0.385498046875, -0.321563720703125, -0.25762939453125, -0.193695068359375, -0.1297607421875, -0.065826416015625, -0.00189208984375, 0.062042236328125, 0.1259765625, 0.189910888671875, 0.25384521484375, 0.317779541015625, 0.3817138671875, 0.445648193359375, 0.50958251953125, 0.573516845703125, 0.637451171875, 0.701385498046875, 0.76531982421875, 0.829254150390625, 0.8931884765625, 0.957122802734375, 1.02105712890625, 1.084991455078125, 1.14892578125, 1.212860107421875, 1.27679443359375, 1.340728759765625, 1.4046630859375, 1.468597412109375, 1.53253173828125, 1.596466064453125, 1.660400390625, 1.724334716796875, 1.78826904296875, 1.852203369140625, 1.9161376953125, 1.980072021484375, 2.04400634765625, 2.107940673828125, 2.171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 11.0, 4.0, 12.0, 16.0, 17.0, 29.0, 49.0, 87.0, 116.0, 155.0, 126.0, 131.0, 84.0, 55.0, 35.0, 23.0, 16.0, 10.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008730888366699219, -0.0008431300520896912, -0.0008131712675094604, -0.0007832124829292297, -0.000753253698348999, -0.0007232949137687683, -0.0006933361291885376, -0.0006633773446083069, -0.0006334185600280762, -0.0006034597754478455, -0.0005735009908676147, -0.000543542206287384, -0.0005135834217071533, -0.0004836246371269226, -0.0004536658525466919, -0.0004237070679664612, -0.00039374828338623047, -0.00036378949880599976, -0.00033383071422576904, -0.00030387192964553833, -0.0002739131450653076, -0.0002439543604850769, -0.0002139955759048462, -0.00018403679132461548, -0.00015407800674438477, -0.00012411922216415405, -9.416043758392334e-05, -6.420165300369263e-05, -3.4242868423461914e-05, -4.284083843231201e-06, 2.5674700736999512e-05, 5.5633485317230225e-05, 8.559226989746094e-05, 0.00011555105447769165, 0.00014550983905792236, 0.00017546862363815308, 0.0002054274082183838, 0.0002353861927986145, 0.0002653449773788452, 0.00029530376195907593, 0.00032526254653930664, 0.00035522133111953735, 0.00038518011569976807, 0.0004151389002799988, 0.0004450976848602295, 0.0004750564694404602, 0.0005050152540206909, 0.0005349740386009216, 0.0005649328231811523, 0.0005948916077613831, 0.0006248503923416138, 0.0006548091769218445, 0.0006847679615020752, 0.0007147267460823059, 0.0007446855306625366, 0.0007746443152427673, 0.000804603099822998, 0.0008345618844032288, 0.0008645206689834595, 0.0008944794535636902, 0.0009244382381439209, 0.0009543970227241516, 0.0009843558073043823, 0.001014314591884613, 0.0010442733764648438]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 9.0, 5.0, 14.0, 11.0, 36.0, 35.0, 58.0, 99.0, 180.0, 322.0, 603.0, 1247.0, 2648.0, 6230.0, 16642.0, 53704.0, 197351.0, 560248.0, 145656.0, 40734.0, 13305.0, 5043.0, 2159.0, 995.0, 504.0, 300.0, 145.0, 85.0, 61.0, 34.0, 25.0, 20.0, 8.0, 6.0, 7.0, 3.0, 4.0, 6.0, 1.0, 5.0, 2.0, 0.0, 1.0], "bins": [-2.48046875, -2.4158477783203125, -2.351226806640625, -2.2866058349609375, -2.22198486328125, -2.1573638916015625, -2.092742919921875, -2.0281219482421875, -1.9635009765625, -1.8988800048828125, -1.834259033203125, -1.7696380615234375, -1.70501708984375, -1.6403961181640625, -1.575775146484375, -1.5111541748046875, -1.446533203125, -1.3819122314453125, -1.317291259765625, -1.2526702880859375, -1.18804931640625, -1.1234283447265625, -1.058807373046875, -0.9941864013671875, -0.9295654296875, -0.8649444580078125, -0.800323486328125, -0.7357025146484375, -0.67108154296875, -0.6064605712890625, -0.541839599609375, -0.4772186279296875, -0.41259765625, -0.3479766845703125, -0.283355712890625, -0.2187347412109375, -0.15411376953125, -0.0894927978515625, -0.024871826171875, 0.0397491455078125, 0.1043701171875, 0.1689910888671875, 0.233612060546875, 0.2982330322265625, 0.36285400390625, 0.4274749755859375, 0.492095947265625, 0.5567169189453125, 0.621337890625, 0.6859588623046875, 0.750579833984375, 0.8152008056640625, 0.87982177734375, 0.9444427490234375, 1.009063720703125, 1.0736846923828125, 1.1383056640625, 1.2029266357421875, 1.267547607421875, 1.3321685791015625, 1.39678955078125, 1.4614105224609375, 1.526031494140625, 1.5906524658203125, 1.6552734375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 3.0, 7.0, 5.0, 8.0, 6.0, 13.0, 19.0, 24.0, 23.0, 20.0, 33.0, 35.0, 37.0, 50.0, 60.0, 56.0, 80.0, 61.0, 66.0, 60.0, 50.0, 68.0, 37.0, 32.0, 32.0, 22.0, 16.0, 11.0, 12.0, 6.0, 7.0, 5.0, 7.0, 7.0, 7.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.794921875, -1.7410125732421875, -1.687103271484375, -1.6331939697265625, -1.57928466796875, -1.5253753662109375, -1.471466064453125, -1.4175567626953125, -1.3636474609375, -1.3097381591796875, -1.255828857421875, -1.2019195556640625, -1.14801025390625, -1.0941009521484375, -1.040191650390625, -0.9862823486328125, -0.932373046875, -0.8784637451171875, -0.824554443359375, -0.7706451416015625, -0.71673583984375, -0.6628265380859375, -0.608917236328125, -0.5550079345703125, -0.5010986328125, -0.4471893310546875, -0.393280029296875, -0.3393707275390625, -0.28546142578125, -0.2315521240234375, -0.177642822265625, -0.1237335205078125, -0.06982421875, -0.0159149169921875, 0.037994384765625, 0.0919036865234375, 0.14581298828125, 0.1997222900390625, 0.253631591796875, 0.3075408935546875, 0.3614501953125, 0.4153594970703125, 0.469268798828125, 0.5231781005859375, 0.57708740234375, 0.6309967041015625, 0.684906005859375, 0.7388153076171875, 0.792724609375, 0.8466339111328125, 0.900543212890625, 0.9544525146484375, 1.00836181640625, 1.0622711181640625, 1.116180419921875, 1.1700897216796875, 1.2239990234375, 1.2779083251953125, 1.331817626953125, 1.3857269287109375, 1.43963623046875, 1.4935455322265625, 1.547454833984375, 1.6013641357421875, 1.6552734375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 10.0, 16.0, 34.0, 61.0, 133.0, 226.0, 187.0, 142.0, 76.0, 33.0, 32.0, 15.0, 5.0, 3.0, 1.0, 1.0, 8.0, 0.0, 9.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.842132568359375, -42.143985748291016, -40.44583511352539, -38.74768829345703, -37.049537658691406, -35.35139083862305, -33.65324401855469, -31.955095291137695, -30.256946563720703, -28.55879783630371, -26.86064910888672, -25.16250228881836, -23.464353561401367, -21.766204833984375, -20.068058013916016, -18.369909286499023, -16.67176055908203, -14.973611831665039, -13.275464057922363, -11.577316284179688, -9.879167556762695, -8.181018829345703, -6.482871055603027, -4.784723281860352, -3.0865745544433594, -1.3884263038635254, 0.3097219467163086, 2.0078701972961426, 3.7060184478759766, 5.404167175292969, 7.1023149490356445, 8.80046272277832, 10.498611450195312, 12.196760177612305, 13.89490795135498, 15.593055725097656, 17.29120445251465, 18.98935317993164, 20.6875, 22.385648727416992, 24.083797454833984, 25.781946182250977, 27.48009490966797, 29.178241729736328, 30.87639045715332, 32.57453918457031, 34.27268600463867, 35.97083282470703, 37.668983459472656, 39.367130279541016, 41.06528091430664, 42.763427734375, 44.461578369140625, 46.159725189208984, 47.857872009277344, 49.55602264404297, 51.25416946411133, 52.95231628417969, 54.65046691894531, 56.34861373901367, 58.04676055908203, 59.744911193847656, 61.443058013916016, 63.141204833984375, 64.83935546875]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 4.0, 5.0, 2.0, 11.0, 5.0, 9.0, 8.0, 12.0, 14.0, 19.0, 21.0, 22.0, 20.0, 24.0, 32.0, 34.0, 29.0, 44.0, 59.0, 67.0, 81.0, 80.0, 64.0, 47.0, 48.0, 35.0, 30.0, 29.0, 33.0, 14.0, 19.0, 12.0, 14.0, 12.0, 8.0, 8.0, 5.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.29172897338867, -35.244815826416016, -34.19790267944336, -33.1509895324707, -32.10407638549805, -31.05716323852539, -30.0102481842041, -28.963335037231445, -27.91642189025879, -26.869508743286133, -25.822595596313477, -24.77568244934082, -23.72876739501953, -22.681854248046875, -21.63494110107422, -20.588027954101562, -19.541114807128906, -18.49420166015625, -17.447288513183594, -16.400375366210938, -15.353461265563965, -14.306548118591309, -13.259634017944336, -12.21272087097168, -11.165807723999023, -10.118894577026367, -9.071981430053711, -8.025067329406738, -6.978154182434082, -5.931241035461426, -4.884327411651611, -3.837413787841797, -2.7905006408691406, -1.7435872554779053, -0.6966738700866699, 0.35023951530456543, 1.3971529006958008, 2.444066047668457, 3.4909796714782715, 4.537893295288086, 5.584806442260742, 6.631719589233398, 7.678633213043213, 8.725546836853027, 9.772459983825684, 10.81937313079834, 11.866287231445312, 12.913200378417969, 13.960113525390625, 15.007026672363281, 16.053939819335938, 17.100852966308594, 18.14776611328125, 19.194679260253906, 20.241594314575195, 21.28850746154785, 22.335420608520508, 23.382333755493164, 24.42924690246582, 25.476160049438477, 26.523075103759766, 27.569988250732422, 28.616901397705078, 29.663814544677734, 30.71072769165039]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 15.0, 16.0, 36.0, 79.0, 122.0, 233.0, 418.0, 835.0, 1788.0, 4246.0, 11790.0, 38542.0, 172556.0, 1401551.0, 2210711.0, 273742.0, 52624.0, 15257.0, 5465.0, 2149.0, 1037.0, 502.0, 253.0, 131.0, 71.0, 42.0, 28.0, 15.0, 7.0, 8.0, 5.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46484375, -4.344573974609375, -4.22430419921875, -4.104034423828125, -3.9837646484375, -3.863494873046875, -3.74322509765625, -3.622955322265625, -3.502685546875, -3.382415771484375, -3.26214599609375, -3.141876220703125, -3.0216064453125, -2.901336669921875, -2.78106689453125, -2.660797119140625, -2.54052734375, -2.420257568359375, -2.29998779296875, -2.179718017578125, -2.0594482421875, -1.939178466796875, -1.81890869140625, -1.698638916015625, -1.578369140625, -1.458099365234375, -1.33782958984375, -1.217559814453125, -1.0972900390625, -0.977020263671875, -0.85675048828125, -0.736480712890625, -0.6162109375, -0.495941162109375, -0.37567138671875, -0.255401611328125, -0.1351318359375, -0.014862060546875, 0.10540771484375, 0.225677490234375, 0.345947265625, 0.466217041015625, 0.58648681640625, 0.706756591796875, 0.8270263671875, 0.947296142578125, 1.06756591796875, 1.187835693359375, 1.30810546875, 1.428375244140625, 1.54864501953125, 1.668914794921875, 1.7891845703125, 1.909454345703125, 2.02972412109375, 2.149993896484375, 2.270263671875, 2.390533447265625, 2.51080322265625, 2.631072998046875, 2.7513427734375, 2.871612548828125, 2.99188232421875, 3.112152099609375, 3.232421875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 5.0, 1.0, 9.0, 6.0, 2.0, 15.0, 16.0, 13.0, 17.0, 33.0, 31.0, 21.0, 40.0, 36.0, 37.0, 32.0, 39.0, 45.0, 47.0, 51.0, 42.0, 44.0, 40.0, 49.0, 43.0, 38.0, 30.0, 30.0, 34.0, 28.0, 26.0, 19.0, 11.0, 20.0, 7.0, 10.0, 12.0, 3.0, 4.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.15625, -2.0888671875, -2.021484375, -1.9541015625, -1.88671875, -1.8193359375, -1.751953125, -1.6845703125, -1.6171875, -1.5498046875, -1.482421875, -1.4150390625, -1.34765625, -1.2802734375, -1.212890625, -1.1455078125, -1.078125, -1.0107421875, -0.943359375, -0.8759765625, -0.80859375, -0.7412109375, -0.673828125, -0.6064453125, -0.5390625, -0.4716796875, -0.404296875, -0.3369140625, -0.26953125, -0.2021484375, -0.134765625, -0.0673828125, 0.0, 0.0673828125, 0.134765625, 0.2021484375, 0.26953125, 0.3369140625, 0.404296875, 0.4716796875, 0.5390625, 0.6064453125, 0.673828125, 0.7412109375, 0.80859375, 0.8759765625, 0.943359375, 1.0107421875, 1.078125, 1.1455078125, 1.212890625, 1.2802734375, 1.34765625, 1.4150390625, 1.482421875, 1.5498046875, 1.6171875, 1.6845703125, 1.751953125, 1.8193359375, 1.88671875, 1.9541015625, 2.021484375, 2.0888671875, 2.15625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 4.0, 3.0, 4.0, 5.0, 3.0, 10.0, 16.0, 16.0, 29.0, 33.0, 56.0, 80.0, 138.0, 299.0, 721.0, 1718.0, 5771.0, 23904.0, 161146.0, 2732349.0, 1162828.0, 83934.0, 14981.0, 4005.0, 1212.0, 481.0, 186.0, 132.0, 70.0, 26.0, 30.0, 22.0, 19.0, 11.0, 14.0, 3.0, 5.0, 2.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5703125, -6.364013671875, -6.15771484375, -5.951416015625, -5.7451171875, -5.538818359375, -5.33251953125, -5.126220703125, -4.919921875, -4.713623046875, -4.50732421875, -4.301025390625, -4.0947265625, -3.888427734375, -3.68212890625, -3.475830078125, -3.26953125, -3.063232421875, -2.85693359375, -2.650634765625, -2.4443359375, -2.238037109375, -2.03173828125, -1.825439453125, -1.619140625, -1.412841796875, -1.20654296875, -1.000244140625, -0.7939453125, -0.587646484375, -0.38134765625, -0.175048828125, 0.03125, 0.237548828125, 0.44384765625, 0.650146484375, 0.8564453125, 1.062744140625, 1.26904296875, 1.475341796875, 1.681640625, 1.887939453125, 2.09423828125, 2.300537109375, 2.5068359375, 2.713134765625, 2.91943359375, 3.125732421875, 3.33203125, 3.538330078125, 3.74462890625, 3.950927734375, 4.1572265625, 4.363525390625, 4.56982421875, 4.776123046875, 4.982421875, 5.188720703125, 5.39501953125, 5.601318359375, 5.8076171875, 6.013916015625, 6.22021484375, 6.426513671875, 6.6328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 9.0, 8.0, 6.0, 22.0, 24.0, 27.0, 40.0, 56.0, 68.0, 81.0, 141.0, 168.0, 267.0, 429.0, 595.0, 582.0, 437.0, 307.0, 233.0, 147.0, 120.0, 63.0, 55.0, 36.0, 32.0, 25.0, 7.0, 13.0, 16.0, 10.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-5.3515625, -5.20367431640625, -5.0557861328125, -4.90789794921875, -4.760009765625, -4.61212158203125, -4.4642333984375, -4.31634521484375, -4.16845703125, -4.02056884765625, -3.8726806640625, -3.72479248046875, -3.576904296875, -3.42901611328125, -3.2811279296875, -3.13323974609375, -2.9853515625, -2.83746337890625, -2.6895751953125, -2.54168701171875, -2.393798828125, -2.24591064453125, -2.0980224609375, -1.95013427734375, -1.80224609375, -1.65435791015625, -1.5064697265625, -1.35858154296875, -1.210693359375, -1.06280517578125, -0.9149169921875, -0.76702880859375, -0.619140625, -0.47125244140625, -0.3233642578125, -0.17547607421875, -0.027587890625, 0.12030029296875, 0.2681884765625, 0.41607666015625, 0.56396484375, 0.71185302734375, 0.8597412109375, 1.00762939453125, 1.155517578125, 1.30340576171875, 1.4512939453125, 1.59918212890625, 1.7470703125, 1.89495849609375, 2.0428466796875, 2.19073486328125, 2.338623046875, 2.48651123046875, 2.6343994140625, 2.78228759765625, 2.93017578125, 3.07806396484375, 3.2259521484375, 3.37384033203125, 3.521728515625, 3.66961669921875, 3.8175048828125, 3.96539306640625, 4.11328125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 10.0, 15.0, 28.0, 77.0, 147.0, 233.0, 214.0, 156.0, 65.0, 29.0, 18.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-118.6193618774414, -116.09321594238281, -113.56706237792969, -111.04090881347656, -108.51476287841797, -105.98861694335938, -103.46246337890625, -100.93630981445312, -98.41016387939453, -95.88401794433594, -93.35786437988281, -90.83171081542969, -88.3055648803711, -85.7794189453125, -83.25326538085938, -80.72711181640625, -78.20096588134766, -75.67481994628906, -73.14866638183594, -70.62251281738281, -68.09636688232422, -65.57022094726562, -63.0440673828125, -60.51791763305664, -57.99176788330078, -55.46561813354492, -52.93946838378906, -50.4133186340332, -47.887168884277344, -45.361019134521484, -42.834869384765625, -40.308719635009766, -37.78256607055664, -35.25641632080078, -32.73026657104492, -30.204116821289062, -27.677967071533203, -25.151817321777344, -22.625667572021484, -20.099517822265625, -17.573368072509766, -15.047218322753906, -12.521068572998047, -9.994918823242188, -7.468769073486328, -4.942619323730469, -2.4164695739746094, 0.10968017578125, 2.6358299255371094, 5.161979675292969, 7.688129425048828, 10.214279174804688, 12.740428924560547, 15.266578674316406, 17.792728424072266, 20.318878173828125, 22.845027923583984, 25.371177673339844, 27.897327423095703, 30.423477172851562, 32.94962692260742, 35.47577667236328, 38.00192642211914, 40.528076171875, 43.05422592163086]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 2.0, 6.0, 14.0, 8.0, 8.0, 11.0, 11.0, 15.0, 22.0, 20.0, 15.0, 24.0, 34.0, 26.0, 32.0, 38.0, 36.0, 31.0, 55.0, 50.0, 57.0, 56.0, 52.0, 48.0, 41.0, 43.0, 28.0, 30.0, 19.0, 23.0, 18.0, 21.0, 15.0, 16.0, 15.0, 14.0, 8.0, 6.0, 2.0, 7.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-24.950990676879883, -24.231101989746094, -23.511215209960938, -22.79132652282715, -22.07143783569336, -21.351551055908203, -20.631662368774414, -19.911773681640625, -19.19188690185547, -18.47199821472168, -17.752111434936523, -17.032222747802734, -16.312335968017578, -15.592447280883789, -14.87255859375, -14.152670860290527, -13.432783126831055, -12.712895393371582, -11.99300765991211, -11.27311897277832, -10.553231239318848, -9.833343505859375, -9.113454818725586, -8.393567085266113, -7.673679351806641, -6.953791618347168, -6.233903408050537, -5.514015197753906, -4.794127464294434, -4.074239730834961, -3.35435152053833, -2.634463310241699, -1.9145736694335938, -1.194685697555542, -0.47479772567749023, 0.24509024620056152, 0.9649782180786133, 1.684866189956665, 2.404754161834717, 3.1246423721313477, 3.8445301055908203, 4.564417839050293, 5.284306049346924, 6.004194259643555, 6.724081993103027, 7.4439697265625, 8.163858413696289, 8.883746147155762, 9.603633880615234, 10.323521614074707, 11.04340934753418, 11.763298034667969, 12.483185768127441, 13.203073501586914, 13.922962188720703, 14.642849922180176, 15.362737655639648, 16.082626342773438, 16.802513122558594, 17.522401809692383, 18.242290496826172, 18.962177276611328, 19.682065963745117, 20.401954650878906, 21.121841430664062]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 11.0, 18.0, 28.0, 41.0, 75.0, 131.0, 181.0, 339.0, 632.0, 1233.0, 2283.0, 5424.0, 13611.0, 40381.0, 142091.0, 435471.0, 288407.0, 77921.0, 24149.0, 8669.0, 3661.0, 1697.0, 893.0, 496.0, 291.0, 157.0, 81.0, 67.0, 32.0, 30.0, 19.0, 11.0, 8.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58203125, -4.45025634765625, -4.3184814453125, -4.18670654296875, -4.054931640625, -3.92315673828125, -3.7913818359375, -3.65960693359375, -3.52783203125, -3.39605712890625, -3.2642822265625, -3.13250732421875, -3.000732421875, -2.86895751953125, -2.7371826171875, -2.60540771484375, -2.4736328125, -2.34185791015625, -2.2100830078125, -2.07830810546875, -1.946533203125, -1.81475830078125, -1.6829833984375, -1.55120849609375, -1.41943359375, -1.28765869140625, -1.1558837890625, -1.02410888671875, -0.892333984375, -0.76055908203125, -0.6287841796875, -0.49700927734375, -0.365234375, -0.23345947265625, -0.1016845703125, 0.03009033203125, 0.161865234375, 0.29364013671875, 0.4254150390625, 0.55718994140625, 0.68896484375, 0.82073974609375, 0.9525146484375, 1.08428955078125, 1.216064453125, 1.34783935546875, 1.4796142578125, 1.61138916015625, 1.7431640625, 1.87493896484375, 2.0067138671875, 2.13848876953125, 2.270263671875, 2.40203857421875, 2.5338134765625, 2.66558837890625, 2.79736328125, 2.92913818359375, 3.0609130859375, 3.19268798828125, 3.324462890625, 3.45623779296875, 3.5880126953125, 3.71978759765625, 3.8515625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 11.0, 12.0, 9.0, 13.0, 15.0, 18.0, 10.0, 17.0, 19.0, 24.0, 29.0, 33.0, 32.0, 30.0, 40.0, 33.0, 33.0, 35.0, 45.0, 33.0, 39.0, 54.0, 34.0, 45.0, 33.0, 33.0, 38.0, 26.0, 15.0, 35.0, 27.0, 19.0, 15.0, 12.0, 10.0, 8.0, 9.0, 6.0, 9.0, 0.0, 7.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.19140625, -2.1271514892578125, -2.062896728515625, -1.9986419677734375, -1.93438720703125, -1.8701324462890625, -1.805877685546875, -1.7416229248046875, -1.6773681640625, -1.6131134033203125, -1.548858642578125, -1.4846038818359375, -1.42034912109375, -1.3560943603515625, -1.291839599609375, -1.2275848388671875, -1.163330078125, -1.0990753173828125, -1.034820556640625, -0.9705657958984375, -0.90631103515625, -0.8420562744140625, -0.777801513671875, -0.7135467529296875, -0.6492919921875, -0.5850372314453125, -0.520782470703125, -0.4565277099609375, -0.39227294921875, -0.3280181884765625, -0.263763427734375, -0.1995086669921875, -0.13525390625, -0.0709991455078125, -0.006744384765625, 0.0575103759765625, 0.12176513671875, 0.1860198974609375, 0.250274658203125, 0.3145294189453125, 0.3787841796875, 0.4430389404296875, 0.507293701171875, 0.5715484619140625, 0.63580322265625, 0.7000579833984375, 0.764312744140625, 0.8285675048828125, 0.892822265625, 0.9570770263671875, 1.021331787109375, 1.0855865478515625, 1.14984130859375, 1.2140960693359375, 1.278350830078125, 1.3426055908203125, 1.4068603515625, 1.4711151123046875, 1.535369873046875, 1.5996246337890625, 1.66387939453125, 1.7281341552734375, 1.792388916015625, 1.8566436767578125, 1.9208984375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 10.0, 8.0, 10.0, 11.0, 15.0, 16.0, 24.0, 34.0, 62.0, 94.0, 159.0, 185.0, 274.0, 500.0, 955.0, 2219.0, 6404.0, 24608.0, 146958.0, 714797.0, 119852.0, 21487.0, 5718.0, 2083.0, 843.0, 457.0, 244.0, 157.0, 113.0, 80.0, 55.0, 36.0, 21.0, 15.0, 11.0, 17.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.08807373046875, -4.9027099609375, -4.71734619140625, -4.531982421875, -4.34661865234375, -4.1612548828125, -3.97589111328125, -3.79052734375, -3.60516357421875, -3.4197998046875, -3.23443603515625, -3.049072265625, -2.86370849609375, -2.6783447265625, -2.49298095703125, -2.3076171875, -2.12225341796875, -1.9368896484375, -1.75152587890625, -1.566162109375, -1.38079833984375, -1.1954345703125, -1.01007080078125, -0.82470703125, -0.63934326171875, -0.4539794921875, -0.26861572265625, -0.083251953125, 0.10211181640625, 0.2874755859375, 0.47283935546875, 0.658203125, 0.84356689453125, 1.0289306640625, 1.21429443359375, 1.399658203125, 1.58502197265625, 1.7703857421875, 1.95574951171875, 2.14111328125, 2.32647705078125, 2.5118408203125, 2.69720458984375, 2.882568359375, 3.06793212890625, 3.2532958984375, 3.43865966796875, 3.6240234375, 3.80938720703125, 3.9947509765625, 4.18011474609375, 4.365478515625, 4.55084228515625, 4.7362060546875, 4.92156982421875, 5.10693359375, 5.29229736328125, 5.4776611328125, 5.66302490234375, 5.848388671875, 6.03375244140625, 6.2191162109375, 6.40447998046875, 6.58984375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 11.0, 7.0, 3.0, 11.0, 12.0, 13.0, 11.0, 15.0, 29.0, 25.0, 39.0, 49.0, 54.0, 61.0, 67.0, 66.0, 71.0, 70.0, 60.0, 42.0, 37.0, 47.0, 33.0, 35.0, 20.0, 22.0, 24.0, 14.0, 15.0, 9.0, 5.0, 5.0, 1.0, 2.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-12.484375, -12.1336669921875, -11.782958984375, -11.4322509765625, -11.08154296875, -10.7308349609375, -10.380126953125, -10.0294189453125, -9.6787109375, -9.3280029296875, -8.977294921875, -8.6265869140625, -8.27587890625, -7.9251708984375, -7.574462890625, -7.2237548828125, -6.873046875, -6.5223388671875, -6.171630859375, -5.8209228515625, -5.47021484375, -5.1195068359375, -4.768798828125, -4.4180908203125, -4.0673828125, -3.7166748046875, -3.365966796875, -3.0152587890625, -2.66455078125, -2.3138427734375, -1.963134765625, -1.6124267578125, -1.26171875, -0.9110107421875, -0.560302734375, -0.2095947265625, 0.14111328125, 0.4918212890625, 0.842529296875, 1.1932373046875, 1.5439453125, 1.8946533203125, 2.245361328125, 2.5960693359375, 2.94677734375, 3.2974853515625, 3.648193359375, 3.9989013671875, 4.349609375, 4.7003173828125, 5.051025390625, 5.4017333984375, 5.75244140625, 6.1031494140625, 6.453857421875, 6.8045654296875, 7.1552734375, 7.5059814453125, 7.856689453125, 8.2073974609375, 8.55810546875, 8.9088134765625, 9.259521484375, 9.6102294921875, 9.9609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 7.0, 11.0, 22.0, 22.0, 34.0, 51.0, 66.0, 107.0, 166.0, 290.0, 448.0, 835.0, 1458.0, 2816.0, 5856.0, 13142.0, 35510.0, 118790.0, 628696.0, 163732.0, 45449.0, 16707.0, 7122.0, 3270.0, 1654.0, 884.0, 510.0, 322.0, 185.0, 128.0, 74.0, 53.0, 33.0, 24.0, 20.0, 11.0, 12.0, 8.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0], "bins": [-2.06640625, -2.0099639892578125, -1.953521728515625, -1.8970794677734375, -1.84063720703125, -1.7841949462890625, -1.727752685546875, -1.6713104248046875, -1.6148681640625, -1.5584259033203125, -1.501983642578125, -1.4455413818359375, -1.38909912109375, -1.3326568603515625, -1.276214599609375, -1.2197723388671875, -1.163330078125, -1.1068878173828125, -1.050445556640625, -0.9940032958984375, -0.93756103515625, -0.8811187744140625, -0.824676513671875, -0.7682342529296875, -0.7117919921875, -0.6553497314453125, -0.598907470703125, -0.5424652099609375, -0.48602294921875, -0.4295806884765625, -0.373138427734375, -0.3166961669921875, -0.26025390625, -0.2038116455078125, -0.147369384765625, -0.0909271240234375, -0.03448486328125, 0.0219573974609375, 0.078399658203125, 0.1348419189453125, 0.1912841796875, 0.2477264404296875, 0.304168701171875, 0.3606109619140625, 0.41705322265625, 0.4734954833984375, 0.529937744140625, 0.5863800048828125, 0.642822265625, 0.6992645263671875, 0.755706787109375, 0.8121490478515625, 0.86859130859375, 0.9250335693359375, 0.981475830078125, 1.0379180908203125, 1.0943603515625, 1.1508026123046875, 1.207244873046875, 1.2636871337890625, 1.32012939453125, 1.3765716552734375, 1.433013916015625, 1.4894561767578125, 1.5458984375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 6.0, 15.0, 13.0, 19.0, 23.0, 19.0, 29.0, 48.0, 48.0, 71.0, 110.0, 101.0, 114.0, 95.0, 64.0, 49.0, 43.0, 21.0, 30.0, 18.0, 10.0, 8.0, 9.0, 4.0, 4.0, 7.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0007658004760742188, -0.0007460415363311768, -0.0007262825965881348, -0.0007065236568450928, -0.0006867647171020508, -0.0006670057773590088, -0.0006472468376159668, -0.0006274878978729248, -0.0006077289581298828, -0.0005879700183868408, -0.0005682110786437988, -0.0005484521389007568, -0.0005286931991577148, -0.0005089342594146729, -0.0004891753196716309, -0.00046941637992858887, -0.0004496574401855469, -0.0004298985004425049, -0.0004101395606994629, -0.0003903806209564209, -0.0003706216812133789, -0.0003508627414703369, -0.0003311038017272949, -0.00031134486198425293, -0.00029158592224121094, -0.00027182698249816895, -0.00025206804275512695, -0.00023230910301208496, -0.00021255016326904297, -0.00019279122352600098, -0.00017303228378295898, -0.000153273344039917, -0.000133514404296875, -0.00011375546455383301, -9.399652481079102e-05, -7.423758506774902e-05, -5.447864532470703e-05, -3.471970558166504e-05, -1.4960765838623047e-05, 4.798173904418945e-06, 2.4557113647460938e-05, 4.431605339050293e-05, 6.407499313354492e-05, 8.383393287658691e-05, 0.0001035928726196289, 0.0001233518123626709, 0.0001431107521057129, 0.00016286969184875488, 0.00018262863159179688, 0.00020238757133483887, 0.00022214651107788086, 0.00024190545082092285, 0.00026166439056396484, 0.00028142333030700684, 0.00030118227005004883, 0.0003209412097930908, 0.0003407001495361328, 0.0003604590892791748, 0.0003802180290222168, 0.0003999769687652588, 0.0004197359085083008, 0.0004394948482513428, 0.00045925378799438477, 0.00047901272773742676, 0.0004987716674804688]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 3.0, 3.0, 6.0, 7.0, 14.0, 25.0, 47.0, 75.0, 104.0, 231.0, 373.0, 709.0, 1695.0, 4361.0, 13216.0, 51809.0, 348527.0, 550171.0, 55013.0, 14125.0, 4633.0, 1765.0, 740.0, 385.0, 226.0, 111.0, 59.0, 40.0, 26.0, 22.0, 9.0, 8.0, 5.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.77734375, -2.695709228515625, -2.61407470703125, -2.532440185546875, -2.4508056640625, -2.369171142578125, -2.28753662109375, -2.205902099609375, -2.124267578125, -2.042633056640625, -1.96099853515625, -1.879364013671875, -1.7977294921875, -1.716094970703125, -1.63446044921875, -1.552825927734375, -1.47119140625, -1.389556884765625, -1.30792236328125, -1.226287841796875, -1.1446533203125, -1.063018798828125, -0.98138427734375, -0.899749755859375, -0.818115234375, -0.736480712890625, -0.65484619140625, -0.573211669921875, -0.4915771484375, -0.409942626953125, -0.32830810546875, -0.246673583984375, -0.1650390625, -0.083404541015625, -0.00177001953125, 0.079864501953125, 0.1614990234375, 0.243133544921875, 0.32476806640625, 0.406402587890625, 0.488037109375, 0.569671630859375, 0.65130615234375, 0.732940673828125, 0.8145751953125, 0.896209716796875, 0.97784423828125, 1.059478759765625, 1.14111328125, 1.222747802734375, 1.30438232421875, 1.386016845703125, 1.4676513671875, 1.549285888671875, 1.63092041015625, 1.712554931640625, 1.794189453125, 1.875823974609375, 1.95745849609375, 2.039093017578125, 2.1207275390625, 2.202362060546875, 2.28399658203125, 2.365631103515625, 2.447265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 2.0, 5.0, 3.0, 3.0, 4.0, 7.0, 5.0, 9.0, 11.0, 24.0, 27.0, 25.0, 34.0, 60.0, 73.0, 119.0, 102.0, 121.0, 109.0, 63.0, 48.0, 40.0, 26.0, 18.0, 15.0, 9.0, 8.0, 9.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.586090087890625, -2.50225830078125, -2.418426513671875, -2.3345947265625, -2.250762939453125, -2.16693115234375, -2.083099365234375, -1.999267578125, -1.915435791015625, -1.83160400390625, -1.747772216796875, -1.6639404296875, -1.580108642578125, -1.49627685546875, -1.412445068359375, -1.32861328125, -1.244781494140625, -1.16094970703125, -1.077117919921875, -0.9932861328125, -0.909454345703125, -0.82562255859375, -0.741790771484375, -0.657958984375, -0.574127197265625, -0.49029541015625, -0.406463623046875, -0.3226318359375, -0.238800048828125, -0.15496826171875, -0.071136474609375, 0.0126953125, 0.096527099609375, 0.18035888671875, 0.264190673828125, 0.3480224609375, 0.431854248046875, 0.51568603515625, 0.599517822265625, 0.683349609375, 0.767181396484375, 0.85101318359375, 0.934844970703125, 1.0186767578125, 1.102508544921875, 1.18634033203125, 1.270172119140625, 1.35400390625, 1.437835693359375, 1.52166748046875, 1.605499267578125, 1.6893310546875, 1.773162841796875, 1.85699462890625, 1.940826416015625, 2.024658203125, 2.108489990234375, 2.19232177734375, 2.276153564453125, 2.3599853515625, 2.443817138671875, 2.52764892578125, 2.611480712890625, 2.6953125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 8.0, 14.0, 29.0, 56.0, 107.0, 235.0, 282.0, 123.0, 80.0, 23.0, 16.0, 7.0, 11.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.64256286621094, -57.44483184814453, -55.24709701538086, -53.04936599731445, -50.85163497924805, -48.653900146484375, -46.45616912841797, -44.25843811035156, -42.060707092285156, -39.86297607421875, -37.66524124145508, -35.46751022338867, -33.269779205322266, -31.072046279907227, -28.874313354492188, -26.67658233642578, -24.47884750366211, -22.28111457824707, -20.083383560180664, -17.885650634765625, -15.687918663024902, -13.49018669128418, -11.29245376586914, -9.094721794128418, -6.896989822387695, -4.699257850646973, -2.501525402069092, -0.30379295349121094, 1.8939390182495117, 4.091670989990234, 6.289403915405273, 8.487135887145996, 10.684867858886719, 12.882599830627441, 15.080331802368164, 17.278064727783203, 19.47579574584961, 21.67352867126465, 23.871261596679688, 26.068992614746094, 28.266725540161133, 30.464458465576172, 32.66218948364258, 34.85992431640625, 37.057655334472656, 39.25538635253906, 41.45311737060547, 43.65085220336914, 45.84858322143555, 48.04631423950195, 50.244049072265625, 52.44178009033203, 54.63951110839844, 56.837242126464844, 59.034976959228516, 61.23270797729492, 63.430442810058594, 65.628173828125, 67.8259048461914, 70.02363586425781, 72.22137451171875, 74.41910552978516, 76.61683654785156, 78.81456756591797, 81.01229858398438]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 4.0, 7.0, 12.0, 6.0, 7.0, 11.0, 11.0, 14.0, 22.0, 34.0, 17.0, 19.0, 23.0, 40.0, 38.0, 42.0, 48.0, 69.0, 89.0, 84.0, 78.0, 45.0, 31.0, 42.0, 27.0, 29.0, 26.0, 18.0, 13.0, 15.0, 21.0, 12.0, 11.0, 8.0, 6.0, 7.0, 4.0, 4.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.689926147460938, -29.546859741210938, -28.403793334960938, -27.260726928710938, -26.117660522460938, -24.974594116210938, -23.831527709960938, -22.688461303710938, -21.545394897460938, -20.402328491210938, -19.259262084960938, -18.116195678710938, -16.973129272460938, -15.830062866210938, -14.686995506286621, -13.543929100036621, -12.400861740112305, -11.257795333862305, -10.114728927612305, -8.971662521362305, -7.8285956382751465, -6.6855292320251465, -5.542462348937988, -4.399395942687988, -3.2563295364379883, -2.1132631301879883, -0.9701964855194092, 0.17287015914916992, 1.31593656539917, 2.45900297164917, 3.602069854736328, 4.745136260986328, 5.888202667236328, 7.031269073486328, 8.174335479736328, 9.317401885986328, 10.460468292236328, 11.603534698486328, 12.746602058410645, 13.889668464660645, 15.032734870910645, 16.17580223083496, 17.31886863708496, 18.46193504333496, 19.60500144958496, 20.74806785583496, 21.89113426208496, 23.03420066833496, 24.17726707458496, 25.32033348083496, 26.46339988708496, 27.60646629333496, 28.74953269958496, 29.89259910583496, 31.035667419433594, 32.178733825683594, 33.321800231933594, 34.464866638183594, 35.607933044433594, 36.750999450683594, 37.894065856933594, 39.037132263183594, 40.180198669433594, 41.323265075683594, 42.466331481933594]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 3.0, 10.0, 7.0, 12.0, 15.0, 35.0, 53.0, 71.0, 119.0, 217.0, 345.0, 646.0, 1125.0, 2118.0, 4211.0, 8771.0, 20424.0, 54142.0, 180406.0, 809558.0, 2186837.0, 681986.0, 158836.0, 48650.0, 18778.0, 8297.0, 4048.0, 2050.0, 1055.0, 604.0, 337.0, 213.0, 112.0, 74.0, 42.0, 28.0, 16.0, 9.0, 9.0, 9.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.3125, -3.216339111328125, -3.12017822265625, -3.024017333984375, -2.9278564453125, -2.831695556640625, -2.73553466796875, -2.639373779296875, -2.543212890625, -2.447052001953125, -2.35089111328125, -2.254730224609375, -2.1585693359375, -2.062408447265625, -1.96624755859375, -1.870086669921875, -1.77392578125, -1.677764892578125, -1.58160400390625, -1.485443115234375, -1.3892822265625, -1.293121337890625, -1.19696044921875, -1.100799560546875, -1.004638671875, -0.908477783203125, -0.81231689453125, -0.716156005859375, -0.6199951171875, -0.523834228515625, -0.42767333984375, -0.331512451171875, -0.2353515625, -0.139190673828125, -0.04302978515625, 0.053131103515625, 0.1492919921875, 0.245452880859375, 0.34161376953125, 0.437774658203125, 0.533935546875, 0.630096435546875, 0.72625732421875, 0.822418212890625, 0.9185791015625, 1.014739990234375, 1.11090087890625, 1.207061767578125, 1.30322265625, 1.399383544921875, 1.49554443359375, 1.591705322265625, 1.6878662109375, 1.784027099609375, 1.88018798828125, 1.976348876953125, 2.072509765625, 2.168670654296875, 2.26483154296875, 2.360992431640625, 2.4571533203125, 2.553314208984375, 2.64947509765625, 2.745635986328125, 2.841796875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 2.0, 4.0, 6.0, 11.0, 7.0, 14.0, 20.0, 16.0, 12.0, 20.0, 27.0, 31.0, 44.0, 36.0, 42.0, 44.0, 49.0, 50.0, 48.0, 59.0, 43.0, 52.0, 39.0, 41.0, 42.0, 28.0, 32.0, 23.0, 34.0, 23.0, 19.0, 16.0, 11.0, 14.0, 9.0, 11.0, 4.0, 6.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.578125, -2.5, -2.421875, -2.34375, -2.265625, -2.1875, -2.109375, -2.03125, -1.953125, -1.875, -1.796875, -1.71875, -1.640625, -1.5625, -1.484375, -1.40625, -1.328125, -1.25, -1.171875, -1.09375, -1.015625, -0.9375, -0.859375, -0.78125, -0.703125, -0.625, -0.546875, -0.46875, -0.390625, -0.3125, -0.234375, -0.15625, -0.078125, 0.0, 0.078125, 0.15625, 0.234375, 0.3125, 0.390625, 0.46875, 0.546875, 0.625, 0.703125, 0.78125, 0.859375, 0.9375, 1.015625, 1.09375, 1.171875, 1.25, 1.328125, 1.40625, 1.484375, 1.5625, 1.640625, 1.71875, 1.796875, 1.875, 1.953125, 2.03125, 2.109375, 2.1875, 2.265625, 2.34375, 2.421875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 8.0, 6.0, 16.0, 18.0, 17.0, 15.0, 38.0, 68.0, 104.0, 179.0, 521.0, 1488.0, 5562.0, 33388.0, 620613.0, 3393410.0, 121047.0, 13278.0, 2921.0, 898.0, 302.0, 155.0, 78.0, 59.0, 24.0, 20.0, 12.0, 15.0, 6.0, 6.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90234375, -7.61248779296875, -7.3226318359375, -7.03277587890625, -6.742919921875, -6.45306396484375, -6.1632080078125, -5.87335205078125, -5.58349609375, -5.29364013671875, -5.0037841796875, -4.71392822265625, -4.424072265625, -4.13421630859375, -3.8443603515625, -3.55450439453125, -3.2646484375, -2.97479248046875, -2.6849365234375, -2.39508056640625, -2.105224609375, -1.81536865234375, -1.5255126953125, -1.23565673828125, -0.94580078125, -0.65594482421875, -0.3660888671875, -0.07623291015625, 0.213623046875, 0.50347900390625, 0.7933349609375, 1.08319091796875, 1.373046875, 1.66290283203125, 1.9527587890625, 2.24261474609375, 2.532470703125, 2.82232666015625, 3.1121826171875, 3.40203857421875, 3.69189453125, 3.98175048828125, 4.2716064453125, 4.56146240234375, 4.851318359375, 5.14117431640625, 5.4310302734375, 5.72088623046875, 6.0107421875, 6.30059814453125, 6.5904541015625, 6.88031005859375, 7.170166015625, 7.46002197265625, 7.7498779296875, 8.03973388671875, 8.32958984375, 8.61944580078125, 8.9093017578125, 9.19915771484375, 9.489013671875, 9.77886962890625, 10.0687255859375, 10.35858154296875, 10.6484375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 3.0, 7.0, 4.0, 12.0, 16.0, 14.0, 24.0, 30.0, 47.0, 84.0, 111.0, 150.0, 215.0, 340.0, 566.0, 671.0, 622.0, 395.0, 236.0, 154.0, 119.0, 67.0, 52.0, 31.0, 25.0, 16.0, 16.0, 8.0, 13.0, 4.0, 3.0, 3.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.875, -5.6768798828125, -5.478759765625, -5.2806396484375, -5.08251953125, -4.8843994140625, -4.686279296875, -4.4881591796875, -4.2900390625, -4.0919189453125, -3.893798828125, -3.6956787109375, -3.49755859375, -3.2994384765625, -3.101318359375, -2.9031982421875, -2.705078125, -2.5069580078125, -2.308837890625, -2.1107177734375, -1.91259765625, -1.7144775390625, -1.516357421875, -1.3182373046875, -1.1201171875, -0.9219970703125, -0.723876953125, -0.5257568359375, -0.32763671875, -0.1295166015625, 0.068603515625, 0.2667236328125, 0.46484375, 0.6629638671875, 0.861083984375, 1.0592041015625, 1.25732421875, 1.4554443359375, 1.653564453125, 1.8516845703125, 2.0498046875, 2.2479248046875, 2.446044921875, 2.6441650390625, 2.84228515625, 3.0404052734375, 3.238525390625, 3.4366455078125, 3.634765625, 3.8328857421875, 4.031005859375, 4.2291259765625, 4.42724609375, 4.6253662109375, 4.823486328125, 5.0216064453125, 5.2197265625, 5.4178466796875, 5.615966796875, 5.8140869140625, 6.01220703125, 6.2103271484375, 6.408447265625, 6.6065673828125, 6.8046875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 12.0, 51.0, 141.0, 352.0, 281.0, 109.0, 35.0, 13.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-214.80784606933594, -210.74838256835938, -206.6889190673828, -202.62945556640625, -198.5699920654297, -194.51052856445312, -190.45106506347656, -186.3916015625, -182.3321533203125, -178.27268981933594, -174.21322631835938, -170.1537628173828, -166.09429931640625, -162.0348358154297, -157.97537231445312, -153.91592407226562, -149.8564453125, -145.79698181152344, -141.73751831054688, -137.6780548095703, -133.61859130859375, -129.5591278076172, -125.49967193603516, -121.4402084350586, -117.38074493408203, -113.32128143310547, -109.2618179321289, -105.20235443115234, -101.14289855957031, -97.08343505859375, -93.02397155761719, -88.96450805664062, -84.905029296875, -80.84556579589844, -76.78610229492188, -72.72663879394531, -68.66717529296875, -64.60771179199219, -60.548255920410156, -56.488792419433594, -52.42932891845703, -48.36986541748047, -44.310401916503906, -40.25094223022461, -36.19147872924805, -32.132015228271484, -28.072553634643555, -24.013092041015625, -19.953628540039062, -15.894165992736816, -11.83470344543457, -7.775240898132324, -3.715778350830078, 0.3436851501464844, 4.403146743774414, 8.462608337402344, 12.522071838378906, 16.58153533935547, 20.6409969329834, 24.700458526611328, 28.75992202758789, 32.81938552856445, 36.87884521484375, 40.93830871582031, 44.997772216796875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 8.0, 6.0, 9.0, 19.0, 13.0, 30.0, 23.0, 26.0, 30.0, 29.0, 36.0, 41.0, 49.0, 55.0, 45.0, 53.0, 50.0, 63.0, 41.0, 45.0, 41.0, 39.0, 39.0, 30.0, 33.0, 27.0, 18.0, 18.0, 20.0, 17.0, 16.0, 12.0, 8.0, 5.0, 5.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.557758331298828, -28.66191864013672, -27.76607894897461, -26.8702392578125, -25.974401473999023, -25.078561782836914, -24.182722091674805, -23.286882400512695, -22.39104461669922, -21.49520492553711, -20.599365234375, -19.70352554321289, -18.807687759399414, -17.911848068237305, -17.016008377075195, -16.120168685913086, -15.224328994750977, -14.328489303588867, -13.432650566101074, -12.536810874938965, -11.640972137451172, -10.745132446289062, -9.849292755126953, -8.953453063964844, -8.05761432647705, -7.1617751121521, -6.265935897827148, -5.370096206665039, -4.474256992340088, -3.5784177780151367, -2.6825780868530273, -1.7867388725280762, -0.8908977508544922, 0.004941582679748535, 0.9007809162139893, 1.7966203689575195, 2.6924595832824707, 3.588298797607422, 4.484138488769531, 5.379977703094482, 6.275816917419434, 7.171656131744385, 8.067495346069336, 8.963335037231445, 9.859174728393555, 10.755013465881348, 11.650853157043457, 12.54669189453125, 13.44253158569336, 14.338371276855469, 15.234210014343262, 16.130050659179688, 17.025888442993164, 17.921728134155273, 18.817567825317383, 19.713407516479492, 20.60924530029297, 21.505084991455078, 22.400924682617188, 23.296764373779297, 24.192602157592773, 25.088441848754883, 25.984281539916992, 26.8801212310791, 27.77596092224121]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 13.0, 23.0, 28.0, 31.0, 59.0, 90.0, 139.0, 202.0, 299.0, 549.0, 1029.0, 2002.0, 4312.0, 10166.0, 26421.0, 80029.0, 284324.0, 430535.0, 138528.0, 42209.0, 15347.0, 6234.0, 2765.0, 1338.0, 750.0, 416.0, 240.0, 147.0, 105.0, 60.0, 41.0, 39.0, 22.0, 15.0, 11.0, 6.0, 6.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2265625, -4.0911865234375, -3.955810546875, -3.8204345703125, -3.68505859375, -3.5496826171875, -3.414306640625, -3.2789306640625, -3.1435546875, -3.0081787109375, -2.872802734375, -2.7374267578125, -2.60205078125, -2.4666748046875, -2.331298828125, -2.1959228515625, -2.060546875, -1.9251708984375, -1.789794921875, -1.6544189453125, -1.51904296875, -1.3836669921875, -1.248291015625, -1.1129150390625, -0.9775390625, -0.8421630859375, -0.706787109375, -0.5714111328125, -0.43603515625, -0.3006591796875, -0.165283203125, -0.0299072265625, 0.10546875, 0.2408447265625, 0.376220703125, 0.5115966796875, 0.64697265625, 0.7823486328125, 0.917724609375, 1.0531005859375, 1.1884765625, 1.3238525390625, 1.459228515625, 1.5946044921875, 1.72998046875, 1.8653564453125, 2.000732421875, 2.1361083984375, 2.271484375, 2.4068603515625, 2.542236328125, 2.6776123046875, 2.81298828125, 2.9483642578125, 3.083740234375, 3.2191162109375, 3.3544921875, 3.4898681640625, 3.625244140625, 3.7606201171875, 3.89599609375, 4.0313720703125, 4.166748046875, 4.3021240234375, 4.4375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 6.0, 9.0, 7.0, 10.0, 4.0, 8.0, 19.0, 22.0, 16.0, 18.0, 25.0, 23.0, 35.0, 31.0, 41.0, 42.0, 42.0, 51.0, 37.0, 34.0, 37.0, 41.0, 59.0, 45.0, 44.0, 34.0, 26.0, 37.0, 38.0, 23.0, 21.0, 21.0, 13.0, 15.0, 10.0, 14.0, 5.0, 10.0, 7.0, 2.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-2.89453125, -2.81591796875, -2.7373046875, -2.65869140625, -2.580078125, -2.50146484375, -2.4228515625, -2.34423828125, -2.265625, -2.18701171875, -2.1083984375, -2.02978515625, -1.951171875, -1.87255859375, -1.7939453125, -1.71533203125, -1.63671875, -1.55810546875, -1.4794921875, -1.40087890625, -1.322265625, -1.24365234375, -1.1650390625, -1.08642578125, -1.0078125, -0.92919921875, -0.8505859375, -0.77197265625, -0.693359375, -0.61474609375, -0.5361328125, -0.45751953125, -0.37890625, -0.30029296875, -0.2216796875, -0.14306640625, -0.064453125, 0.01416015625, 0.0927734375, 0.17138671875, 0.25, 0.32861328125, 0.4072265625, 0.48583984375, 0.564453125, 0.64306640625, 0.7216796875, 0.80029296875, 0.87890625, 0.95751953125, 1.0361328125, 1.11474609375, 1.193359375, 1.27197265625, 1.3505859375, 1.42919921875, 1.5078125, 1.58642578125, 1.6650390625, 1.74365234375, 1.822265625, 1.90087890625, 1.9794921875, 2.05810546875, 2.13671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 7.0, 7.0, 17.0, 15.0, 25.0, 32.0, 43.0, 53.0, 79.0, 108.0, 144.0, 287.0, 431.0, 816.0, 1663.0, 3653.0, 10252.0, 39513.0, 246470.0, 659117.0, 62408.0, 14197.0, 4684.0, 2023.0, 1001.0, 532.0, 327.0, 193.0, 126.0, 96.0, 57.0, 37.0, 32.0, 24.0, 13.0, 16.0, 18.0, 7.0, 6.0, 7.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.54296875, -5.34600830078125, -5.1490478515625, -4.95208740234375, -4.755126953125, -4.55816650390625, -4.3612060546875, -4.16424560546875, -3.96728515625, -3.77032470703125, -3.5733642578125, -3.37640380859375, -3.179443359375, -2.98248291015625, -2.7855224609375, -2.58856201171875, -2.3916015625, -2.19464111328125, -1.9976806640625, -1.80072021484375, -1.603759765625, -1.40679931640625, -1.2098388671875, -1.01287841796875, -0.81591796875, -0.61895751953125, -0.4219970703125, -0.22503662109375, -0.028076171875, 0.16888427734375, 0.3658447265625, 0.56280517578125, 0.759765625, 0.95672607421875, 1.1536865234375, 1.35064697265625, 1.547607421875, 1.74456787109375, 1.9415283203125, 2.13848876953125, 2.33544921875, 2.53240966796875, 2.7293701171875, 2.92633056640625, 3.123291015625, 3.32025146484375, 3.5172119140625, 3.71417236328125, 3.9111328125, 4.10809326171875, 4.3050537109375, 4.50201416015625, 4.698974609375, 4.89593505859375, 5.0928955078125, 5.28985595703125, 5.48681640625, 5.68377685546875, 5.8807373046875, 6.07769775390625, 6.274658203125, 6.47161865234375, 6.6685791015625, 6.86553955078125, 7.0625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 11.0, 7.0, 5.0, 15.0, 16.0, 17.0, 20.0, 18.0, 33.0, 31.0, 33.0, 41.0, 55.0, 55.0, 59.0, 69.0, 53.0, 77.0, 53.0, 49.0, 48.0, 44.0, 29.0, 32.0, 21.0, 24.0, 14.0, 10.0, 8.0, 14.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.546875, -9.19482421875, -8.8427734375, -8.49072265625, -8.138671875, -7.78662109375, -7.4345703125, -7.08251953125, -6.73046875, -6.37841796875, -6.0263671875, -5.67431640625, -5.322265625, -4.97021484375, -4.6181640625, -4.26611328125, -3.9140625, -3.56201171875, -3.2099609375, -2.85791015625, -2.505859375, -2.15380859375, -1.8017578125, -1.44970703125, -1.09765625, -0.74560546875, -0.3935546875, -0.04150390625, 0.310546875, 0.66259765625, 1.0146484375, 1.36669921875, 1.71875, 2.07080078125, 2.4228515625, 2.77490234375, 3.126953125, 3.47900390625, 3.8310546875, 4.18310546875, 4.53515625, 4.88720703125, 5.2392578125, 5.59130859375, 5.943359375, 6.29541015625, 6.6474609375, 6.99951171875, 7.3515625, 7.70361328125, 8.0556640625, 8.40771484375, 8.759765625, 9.11181640625, 9.4638671875, 9.81591796875, 10.16796875, 10.52001953125, 10.8720703125, 11.22412109375, 11.576171875, 11.92822265625, 12.2802734375, 12.63232421875, 12.984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 14.0, 12.0, 36.0, 46.0, 66.0, 89.0, 168.0, 346.0, 566.0, 1207.0, 2600.0, 6432.0, 18254.0, 61884.0, 370304.0, 493532.0, 62310.0, 18709.0, 6587.0, 2683.0, 1277.0, 599.0, 349.0, 193.0, 100.0, 46.0, 36.0, 27.0, 22.0, 11.0, 13.0, 4.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.642578125, -1.589599609375, -1.53662109375, -1.483642578125, -1.4306640625, -1.377685546875, -1.32470703125, -1.271728515625, -1.21875, -1.165771484375, -1.11279296875, -1.059814453125, -1.0068359375, -0.953857421875, -0.90087890625, -0.847900390625, -0.794921875, -0.741943359375, -0.68896484375, -0.635986328125, -0.5830078125, -0.530029296875, -0.47705078125, -0.424072265625, -0.37109375, -0.318115234375, -0.26513671875, -0.212158203125, -0.1591796875, -0.106201171875, -0.05322265625, -0.000244140625, 0.052734375, 0.105712890625, 0.15869140625, 0.211669921875, 0.2646484375, 0.317626953125, 0.37060546875, 0.423583984375, 0.4765625, 0.529541015625, 0.58251953125, 0.635498046875, 0.6884765625, 0.741455078125, 0.79443359375, 0.847412109375, 0.900390625, 0.953369140625, 1.00634765625, 1.059326171875, 1.1123046875, 1.165283203125, 1.21826171875, 1.271240234375, 1.32421875, 1.377197265625, 1.43017578125, 1.483154296875, 1.5361328125, 1.589111328125, 1.64208984375, 1.695068359375, 1.748046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 8.0, 2.0, 3.0, 6.0, 0.0, 7.0, 5.0, 8.0, 12.0, 11.0, 15.0, 21.0, 29.0, 49.0, 64.0, 92.0, 130.0, 152.0, 108.0, 69.0, 62.0, 40.0, 27.0, 23.0, 16.0, 10.0, 11.0, 6.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006480216979980469, -0.0006274133920669556, -0.0006068050861358643, -0.000586196780204773, -0.0005655884742736816, -0.0005449801683425903, -0.000524371862411499, -0.0005037635564804077, -0.0004831552505493164, -0.0004625469446182251, -0.0004419386386871338, -0.0004213303327560425, -0.00040072202682495117, -0.00038011372089385986, -0.00035950541496276855, -0.00033889710903167725, -0.00031828880310058594, -0.00029768049716949463, -0.0002770721912384033, -0.000256463885307312, -0.0002358555793762207, -0.0002152472734451294, -0.00019463896751403809, -0.00017403066158294678, -0.00015342235565185547, -0.00013281404972076416, -0.00011220574378967285, -9.159743785858154e-05, -7.098913192749023e-05, -5.0380825996398926e-05, -2.9772520065307617e-05, -9.164214134216309e-06, 1.1444091796875e-05, 3.205239772796631e-05, 5.266070365905762e-05, 7.326900959014893e-05, 9.387731552124023e-05, 0.00011448562145233154, 0.00013509392738342285, 0.00015570223331451416, 0.00017631053924560547, 0.00019691884517669678, 0.00021752715110778809, 0.0002381354570388794, 0.0002587437629699707, 0.000279352068901062, 0.0002999603748321533, 0.00032056868076324463, 0.00034117698669433594, 0.00036178529262542725, 0.00038239359855651855, 0.00040300190448760986, 0.00042361021041870117, 0.0004442185163497925, 0.0004648268222808838, 0.0004854351282119751, 0.0005060434341430664, 0.0005266517400741577, 0.000547260046005249, 0.0005678683519363403, 0.0005884766578674316, 0.000609084963798523, 0.0006296932697296143, 0.0006503015756607056, 0.0006709098815917969]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 9.0, 20.0, 27.0, 22.0, 36.0, 78.0, 107.0, 179.0, 264.0, 547.0, 1066.0, 2074.0, 4906.0, 12711.0, 37768.0, 126861.0, 644505.0, 149617.0, 43105.0, 14356.0, 5466.0, 2368.0, 1095.0, 531.0, 318.0, 192.0, 112.0, 70.0, 43.0, 33.0, 21.0, 19.0, 4.0, 10.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.6943359375, -1.6453094482421875, -1.596282958984375, -1.5472564697265625, -1.49822998046875, -1.4492034912109375, -1.400177001953125, -1.3511505126953125, -1.3021240234375, -1.2530975341796875, -1.204071044921875, -1.1550445556640625, -1.10601806640625, -1.0569915771484375, -1.007965087890625, -0.9589385986328125, -0.909912109375, -0.8608856201171875, -0.811859130859375, -0.7628326416015625, -0.71380615234375, -0.6647796630859375, -0.615753173828125, -0.5667266845703125, -0.5177001953125, -0.4686737060546875, -0.419647216796875, -0.3706207275390625, -0.32159423828125, -0.2725677490234375, -0.223541259765625, -0.1745147705078125, -0.12548828125, -0.0764617919921875, -0.027435302734375, 0.0215911865234375, 0.07061767578125, 0.1196441650390625, 0.168670654296875, 0.2176971435546875, 0.2667236328125, 0.3157501220703125, 0.364776611328125, 0.4138031005859375, 0.46282958984375, 0.5118560791015625, 0.560882568359375, 0.6099090576171875, 0.658935546875, 0.7079620361328125, 0.756988525390625, 0.8060150146484375, 0.85504150390625, 0.9040679931640625, 0.953094482421875, 1.0021209716796875, 1.0511474609375, 1.1001739501953125, 1.149200439453125, 1.1982269287109375, 1.24725341796875, 1.2962799072265625, 1.345306396484375, 1.3943328857421875, 1.443359375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 9.0, 9.0, 15.0, 9.0, 17.0, 13.0, 21.0, 21.0, 34.0, 34.0, 39.0, 36.0, 53.0, 83.0, 81.0, 58.0, 83.0, 47.0, 46.0, 48.0, 39.0, 35.0, 29.0, 21.0, 23.0, 13.0, 16.0, 9.0, 13.0, 11.0, 6.0, 2.0, 0.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.826171875, -1.775390625, -1.724609375, -1.673828125, -1.623046875, -1.572265625, -1.521484375, -1.470703125, -1.419921875, -1.369140625, -1.318359375, -1.267578125, -1.216796875, -1.166015625, -1.115234375, -1.064453125, -1.013671875, -0.962890625, -0.912109375, -0.861328125, -0.810546875, -0.759765625, -0.708984375, -0.658203125, -0.607421875, -0.556640625, -0.505859375, -0.455078125, -0.404296875, -0.353515625, -0.302734375, -0.251953125, -0.201171875, -0.150390625, -0.099609375, -0.048828125, 0.001953125, 0.052734375, 0.103515625, 0.154296875, 0.205078125, 0.255859375, 0.306640625, 0.357421875, 0.408203125, 0.458984375, 0.509765625, 0.560546875, 0.611328125, 0.662109375, 0.712890625, 0.763671875, 0.814453125, 0.865234375, 0.916015625, 0.966796875, 1.017578125, 1.068359375, 1.119140625, 1.169921875, 1.220703125, 1.271484375, 1.322265625, 1.373046875, 1.423828125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 4.0, 8.0, 6.0, 7.0, 10.0, 24.0, 27.0, 44.0, 70.0, 106.0, 210.0, 201.0, 92.0, 63.0, 45.0, 23.0, 18.0, 9.0, 5.0, 8.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.154144287109375, -24.8507137298584, -23.547283172607422, -22.243852615356445, -20.94042205810547, -19.636993408203125, -18.33356285095215, -17.030132293701172, -15.726701736450195, -14.423271179199219, -13.119840621948242, -11.816411018371582, -10.512980461120605, -9.209549903869629, -7.9061198234558105, -6.602689743041992, -5.299259185791016, -3.995828866958618, -2.6923985481262207, -1.3889682292938232, -0.08553791046142578, 1.2178926467895508, 2.521322727203369, 3.8247528076171875, 5.128183364868164, 6.431613922119141, 7.735044002532959, 9.038474082946777, 10.341904640197754, 11.64533519744873, 12.94876480102539, 14.252195358276367, 15.555625915527344, 16.85905647277832, 18.162487030029297, 19.465917587280273, 20.76934814453125, 22.072776794433594, 23.37620735168457, 24.679637908935547, 25.983068466186523, 27.2864990234375, 28.589929580688477, 29.893360137939453, 31.196788787841797, 32.500221252441406, 33.80364990234375, 35.107078552246094, 36.4105110168457, 37.71393966674805, 39.017372131347656, 40.32080078125, 41.62423324584961, 42.92766189575195, 44.23109436035156, 45.534523010253906, 46.83795166015625, 48.141380310058594, 49.4448127746582, 50.74824142456055, 52.051673889160156, 53.3551025390625, 54.65853500366211, 55.96196365356445, 57.26539611816406]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 8.0, 15.0, 16.0, 19.0, 23.0, 16.0, 17.0, 17.0, 25.0, 33.0, 29.0, 35.0, 59.0, 95.0, 143.0, 87.0, 60.0, 49.0, 25.0, 28.0, 24.0, 25.0, 22.0, 15.0, 11.0, 8.0, 5.0, 10.0, 4.0, 13.0, 6.0, 10.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 4.0, 2.0], "bins": [-46.954917907714844, -45.70467758178711, -44.454437255859375, -43.20419692993164, -41.953956604003906, -40.70371627807617, -39.45347595214844, -38.2032356262207, -36.95299530029297, -35.702754974365234, -34.4525146484375, -33.202274322509766, -31.95203399658203, -30.701793670654297, -29.451553344726562, -28.201313018798828, -26.951072692871094, -25.70083236694336, -24.450592041015625, -23.20035171508789, -21.950111389160156, -20.699871063232422, -19.449630737304688, -18.199390411376953, -16.94915008544922, -15.698909759521484, -14.44866943359375, -13.198429107666016, -11.948188781738281, -10.697948455810547, -9.447708129882812, -8.197467803955078, -6.947227478027344, -5.696987152099609, -4.446746826171875, -3.1965065002441406, -1.9462661743164062, -0.6960258483886719, 0.5542144775390625, 1.8044548034667969, 3.0546951293945312, 4.304935455322266, 5.55517578125, 6.805416107177734, 8.055656433105469, 9.305896759033203, 10.556137084960938, 11.806377410888672, 13.056617736816406, 14.30685806274414, 15.557098388671875, 16.80733871459961, 18.057579040527344, 19.307819366455078, 20.558059692382812, 21.808300018310547, 23.05854034423828, 24.308780670166016, 25.55902099609375, 26.809261322021484, 28.05950164794922, 29.309741973876953, 30.559982299804688, 31.810222625732422, 33.060462951660156]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 4.0, 6.0, 10.0, 18.0, 20.0, 21.0, 36.0, 60.0, 99.0, 144.0, 252.0, 459.0, 748.0, 1301.0, 2397.0, 4535.0, 9537.0, 21482.0, 53730.0, 160585.0, 550772.0, 1627078.0, 1212423.0, 366627.0, 110837.0, 39281.0, 15966.0, 7531.0, 3665.0, 1932.0, 1119.0, 639.0, 374.0, 229.0, 131.0, 88.0, 47.0, 46.0, 16.0, 18.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.705078125, -3.580902099609375, -3.45672607421875, -3.332550048828125, -3.2083740234375, -3.084197998046875, -2.96002197265625, -2.835845947265625, -2.711669921875, -2.587493896484375, -2.46331787109375, -2.339141845703125, -2.2149658203125, -2.090789794921875, -1.96661376953125, -1.842437744140625, -1.71826171875, -1.594085693359375, -1.46990966796875, -1.345733642578125, -1.2215576171875, -1.097381591796875, -0.97320556640625, -0.849029541015625, -0.724853515625, -0.600677490234375, -0.47650146484375, -0.352325439453125, -0.2281494140625, -0.103973388671875, 0.02020263671875, 0.144378662109375, 0.2685546875, 0.392730712890625, 0.51690673828125, 0.641082763671875, 0.7652587890625, 0.889434814453125, 1.01361083984375, 1.137786865234375, 1.261962890625, 1.386138916015625, 1.51031494140625, 1.634490966796875, 1.7586669921875, 1.882843017578125, 2.00701904296875, 2.131195068359375, 2.25537109375, 2.379547119140625, 2.50372314453125, 2.627899169921875, 2.7520751953125, 2.876251220703125, 3.00042724609375, 3.124603271484375, 3.248779296875, 3.372955322265625, 3.49713134765625, 3.621307373046875, 3.7454833984375, 3.869659423828125, 3.99383544921875, 4.118011474609375, 4.2421875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 6.0, 6.0, 7.0, 8.0, 18.0, 8.0, 18.0, 16.0, 22.0, 22.0, 24.0, 29.0, 31.0, 40.0, 35.0, 29.0, 39.0, 38.0, 50.0, 45.0, 40.0, 48.0, 43.0, 32.0, 37.0, 32.0, 43.0, 36.0, 33.0, 30.0, 24.0, 10.0, 20.0, 16.0, 13.0, 8.0, 10.0, 8.0, 5.0, 3.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-2.5546875, -2.48236083984375, -2.4100341796875, -2.33770751953125, -2.265380859375, -2.19305419921875, -2.1207275390625, -2.04840087890625, -1.97607421875, -1.90374755859375, -1.8314208984375, -1.75909423828125, -1.686767578125, -1.61444091796875, -1.5421142578125, -1.46978759765625, -1.3974609375, -1.32513427734375, -1.2528076171875, -1.18048095703125, -1.108154296875, -1.03582763671875, -0.9635009765625, -0.89117431640625, -0.81884765625, -0.74652099609375, -0.6741943359375, -0.60186767578125, -0.529541015625, -0.45721435546875, -0.3848876953125, -0.31256103515625, -0.240234375, -0.16790771484375, -0.0955810546875, -0.02325439453125, 0.049072265625, 0.12139892578125, 0.1937255859375, 0.26605224609375, 0.33837890625, 0.41070556640625, 0.4830322265625, 0.55535888671875, 0.627685546875, 0.70001220703125, 0.7723388671875, 0.84466552734375, 0.9169921875, 0.98931884765625, 1.0616455078125, 1.13397216796875, 1.206298828125, 1.27862548828125, 1.3509521484375, 1.42327880859375, 1.49560546875, 1.56793212890625, 1.6402587890625, 1.71258544921875, 1.784912109375, 1.85723876953125, 1.9295654296875, 2.00189208984375, 2.07421875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 4.0, 8.0, 14.0, 26.0, 31.0, 45.0, 95.0, 156.0, 287.0, 571.0, 1484.0, 7358.0, 194405.0, 3933135.0, 50492.0, 4177.0, 1018.0, 387.0, 237.0, 124.0, 75.0, 49.0, 31.0, 19.0, 14.0, 9.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-28.609375, -27.91748046875, -27.2255859375, -26.53369140625, -25.841796875, -25.14990234375, -24.4580078125, -23.76611328125, -23.07421875, -22.38232421875, -21.6904296875, -20.99853515625, -20.306640625, -19.61474609375, -18.9228515625, -18.23095703125, -17.5390625, -16.84716796875, -16.1552734375, -15.46337890625, -14.771484375, -14.07958984375, -13.3876953125, -12.69580078125, -12.00390625, -11.31201171875, -10.6201171875, -9.92822265625, -9.236328125, -8.54443359375, -7.8525390625, -7.16064453125, -6.46875, -5.77685546875, -5.0849609375, -4.39306640625, -3.701171875, -3.00927734375, -2.3173828125, -1.62548828125, -0.93359375, -0.24169921875, 0.4501953125, 1.14208984375, 1.833984375, 2.52587890625, 3.2177734375, 3.90966796875, 4.6015625, 5.29345703125, 5.9853515625, 6.67724609375, 7.369140625, 8.06103515625, 8.7529296875, 9.44482421875, 10.13671875, 10.82861328125, 11.5205078125, 12.21240234375, 12.904296875, 13.59619140625, 14.2880859375, 14.97998046875, 15.671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 2.0, 4.0, 8.0, 5.0, 9.0, 10.0, 10.0, 24.0, 27.0, 43.0, 37.0, 63.0, 77.0, 106.0, 153.0, 201.0, 286.0, 323.0, 480.0, 476.0, 411.0, 349.0, 240.0, 181.0, 139.0, 100.0, 94.0, 58.0, 40.0, 26.0, 26.0, 14.0, 15.0, 9.0, 4.0, 7.0, 8.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.23828125, -6.99298095703125, -6.7476806640625, -6.50238037109375, -6.257080078125, -6.01177978515625, -5.7664794921875, -5.52117919921875, -5.27587890625, -5.03057861328125, -4.7852783203125, -4.53997802734375, -4.294677734375, -4.04937744140625, -3.8040771484375, -3.55877685546875, -3.3134765625, -3.06817626953125, -2.8228759765625, -2.57757568359375, -2.332275390625, -2.08697509765625, -1.8416748046875, -1.59637451171875, -1.35107421875, -1.10577392578125, -0.8604736328125, -0.61517333984375, -0.369873046875, -0.12457275390625, 0.1207275390625, 0.36602783203125, 0.611328125, 0.85662841796875, 1.1019287109375, 1.34722900390625, 1.592529296875, 1.83782958984375, 2.0831298828125, 2.32843017578125, 2.57373046875, 2.81903076171875, 3.0643310546875, 3.30963134765625, 3.554931640625, 3.80023193359375, 4.0455322265625, 4.29083251953125, 4.5361328125, 4.78143310546875, 5.0267333984375, 5.27203369140625, 5.517333984375, 5.76263427734375, 6.0079345703125, 6.25323486328125, 6.49853515625, 6.74383544921875, 6.9891357421875, 7.23443603515625, 7.479736328125, 7.72503662109375, 7.9703369140625, 8.21563720703125, 8.4609375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 11.0, 20.0, 17.0, 28.0, 43.0, 73.0, 111.0, 150.0, 174.0, 125.0, 92.0, 44.0, 38.0, 19.0, 11.0, 10.0, 5.0, 2.0, 4.0, 4.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.85687255859375, -117.5990219116211, -114.34117126464844, -111.08331298828125, -107.8254623413086, -104.56761169433594, -101.30976104736328, -98.05191040039062, -94.79405212402344, -91.53620147705078, -88.27835083007812, -85.02049255371094, -81.76264190673828, -78.50479125976562, -75.24694061279297, -71.98908996582031, -68.73123931884766, -65.473388671875, -62.21553421020508, -58.95768356323242, -55.6998291015625, -52.441978454589844, -49.18412780761719, -45.92627716064453, -42.66842269897461, -39.41057205200195, -36.15271759033203, -32.894866943359375, -29.637014389038086, -26.379161834716797, -23.12131118774414, -19.86345863342285, -16.605613708496094, -13.347761154174805, -10.089909553527832, -6.832057952880859, -3.5742053985595703, -0.31635284423828125, 2.941497802734375, 6.199350357055664, 9.457202911376953, 12.715055465698242, 15.972907066345215, 19.230758666992188, 22.488611221313477, 25.746463775634766, 29.004314422607422, 32.262168884277344, 35.52001953125, 38.777870178222656, 42.03572463989258, 45.293575286865234, 48.551429748535156, 51.80928039550781, 55.06713104248047, 58.324981689453125, 61.58283615112305, 64.84069061279297, 68.09854125976562, 71.35639190673828, 74.61424255371094, 77.87210083007812, 81.12994384765625, 84.38780212402344, 87.6456527709961]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 5.0, 6.0, 10.0, 13.0, 10.0, 6.0, 15.0, 14.0, 16.0, 25.0, 28.0, 26.0, 22.0, 33.0, 44.0, 31.0, 45.0, 40.0, 55.0, 53.0, 59.0, 53.0, 50.0, 30.0, 40.0, 35.0, 28.0, 41.0, 27.0, 24.0, 25.0, 19.0, 19.0, 15.0, 11.0, 8.0, 4.0, 3.0, 3.0, 5.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.165245056152344, -39.78171157836914, -38.39817810058594, -37.01464080810547, -35.631107330322266, -34.24757385253906, -32.86404037475586, -31.480506896972656, -30.09697151184082, -28.713438034057617, -27.32990264892578, -25.946369171142578, -24.562835693359375, -23.17930030822754, -21.795766830444336, -20.4122314453125, -19.028697967529297, -17.645164489746094, -16.261629104614258, -14.878095626831055, -13.494561195373535, -12.111026763916016, -10.727493286132812, -9.343958854675293, -7.960424423217773, -6.576889991760254, -5.193356037139893, -3.8098220825195312, -2.4262876510620117, -1.0427532196044922, 0.34078025817871094, 1.7243146896362305, 3.10784912109375, 4.4913835525512695, 5.874917507171631, 7.258451461791992, 8.641985893249512, 10.025520324707031, 11.409053802490234, 12.792588233947754, 14.176122665405273, 15.559657096862793, 16.943191528320312, 18.326725006103516, 19.71025848388672, 21.093793869018555, 22.477327346801758, 23.860862731933594, 25.244396209716797, 26.6279296875, 28.011465072631836, 29.39499855041504, 30.778533935546875, 32.16206741333008, 33.54560089111328, 34.929134368896484, 36.31266784667969, 37.69620132446289, 39.079734802246094, 40.46327209472656, 41.846805572509766, 43.23033905029297, 44.61387252807617, 45.997406005859375, 47.380943298339844]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 10.0, 9.0, 19.0, 28.0, 49.0, 53.0, 97.0, 142.0, 220.0, 379.0, 581.0, 1035.0, 1929.0, 3910.0, 8619.0, 22182.0, 69182.0, 299989.0, 489106.0, 99425.0, 30289.0, 11108.0, 4825.0, 2309.0, 1215.0, 731.0, 423.0, 254.0, 147.0, 103.0, 51.0, 38.0, 22.0, 20.0, 17.0, 8.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.81640625, -4.67108154296875, -4.5257568359375, -4.38043212890625, -4.235107421875, -4.08978271484375, -3.9444580078125, -3.79913330078125, -3.65380859375, -3.50848388671875, -3.3631591796875, -3.21783447265625, -3.072509765625, -2.92718505859375, -2.7818603515625, -2.63653564453125, -2.4912109375, -2.34588623046875, -2.2005615234375, -2.05523681640625, -1.909912109375, -1.76458740234375, -1.6192626953125, -1.47393798828125, -1.32861328125, -1.18328857421875, -1.0379638671875, -0.89263916015625, -0.747314453125, -0.60198974609375, -0.4566650390625, -0.31134033203125, -0.166015625, -0.02069091796875, 0.1246337890625, 0.26995849609375, 0.415283203125, 0.56060791015625, 0.7059326171875, 0.85125732421875, 0.99658203125, 1.14190673828125, 1.2872314453125, 1.43255615234375, 1.577880859375, 1.72320556640625, 1.8685302734375, 2.01385498046875, 2.1591796875, 2.30450439453125, 2.4498291015625, 2.59515380859375, 2.740478515625, 2.88580322265625, 3.0311279296875, 3.17645263671875, 3.32177734375, 3.46710205078125, 3.6124267578125, 3.75775146484375, 3.903076171875, 4.04840087890625, 4.1937255859375, 4.33905029296875, 4.484375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 4.0, 4.0, 5.0, 14.0, 9.0, 15.0, 13.0, 22.0, 18.0, 25.0, 19.0, 30.0, 37.0, 29.0, 33.0, 43.0, 40.0, 40.0, 52.0, 53.0, 57.0, 43.0, 43.0, 31.0, 42.0, 43.0, 40.0, 35.0, 35.0, 22.0, 17.0, 18.0, 10.0, 10.0, 17.0, 8.0, 5.0, 10.0, 3.0, 0.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.75390625, -3.6519775390625, -3.550048828125, -3.4481201171875, -3.34619140625, -3.2442626953125, -3.142333984375, -3.0404052734375, -2.9384765625, -2.8365478515625, -2.734619140625, -2.6326904296875, -2.53076171875, -2.4288330078125, -2.326904296875, -2.2249755859375, -2.123046875, -2.0211181640625, -1.919189453125, -1.8172607421875, -1.71533203125, -1.6134033203125, -1.511474609375, -1.4095458984375, -1.3076171875, -1.2056884765625, -1.103759765625, -1.0018310546875, -0.89990234375, -0.7979736328125, -0.696044921875, -0.5941162109375, -0.4921875, -0.3902587890625, -0.288330078125, -0.1864013671875, -0.08447265625, 0.0174560546875, 0.119384765625, 0.2213134765625, 0.3232421875, 0.4251708984375, 0.527099609375, 0.6290283203125, 0.73095703125, 0.8328857421875, 0.934814453125, 1.0367431640625, 1.138671875, 1.2406005859375, 1.342529296875, 1.4444580078125, 1.54638671875, 1.6483154296875, 1.750244140625, 1.8521728515625, 1.9541015625, 2.0560302734375, 2.157958984375, 2.2598876953125, 2.36181640625, 2.4637451171875, 2.565673828125, 2.6676025390625, 2.76953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 10.0, 10.0, 8.0, 15.0, 19.0, 24.0, 36.0, 67.0, 105.0, 145.0, 210.0, 355.0, 688.0, 1402.0, 3529.0, 12128.0, 66453.0, 867013.0, 76273.0, 13190.0, 3706.0, 1431.0, 679.0, 361.0, 234.0, 140.0, 84.0, 69.0, 46.0, 29.0, 19.0, 24.0, 10.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75390625, -5.53704833984375, -5.3201904296875, -5.10333251953125, -4.886474609375, -4.66961669921875, -4.4527587890625, -4.23590087890625, -4.01904296875, -3.80218505859375, -3.5853271484375, -3.36846923828125, -3.151611328125, -2.93475341796875, -2.7178955078125, -2.50103759765625, -2.2841796875, -2.06732177734375, -1.8504638671875, -1.63360595703125, -1.416748046875, -1.19989013671875, -0.9830322265625, -0.76617431640625, -0.54931640625, -0.33245849609375, -0.1156005859375, 0.10125732421875, 0.318115234375, 0.53497314453125, 0.7518310546875, 0.96868896484375, 1.185546875, 1.40240478515625, 1.6192626953125, 1.83612060546875, 2.052978515625, 2.26983642578125, 2.4866943359375, 2.70355224609375, 2.92041015625, 3.13726806640625, 3.3541259765625, 3.57098388671875, 3.787841796875, 4.00469970703125, 4.2215576171875, 4.43841552734375, 4.6552734375, 4.87213134765625, 5.0889892578125, 5.30584716796875, 5.522705078125, 5.73956298828125, 5.9564208984375, 6.17327880859375, 6.39013671875, 6.60699462890625, 6.8238525390625, 7.04071044921875, 7.257568359375, 7.47442626953125, 7.6912841796875, 7.90814208984375, 8.125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 4.0, 2.0, 6.0, 5.0, 4.0, 5.0, 11.0, 14.0, 16.0, 17.0, 19.0, 21.0, 30.0, 17.0, 29.0, 48.0, 48.0, 52.0, 80.0, 83.0, 84.0, 70.0, 67.0, 41.0, 47.0, 39.0, 20.0, 22.0, 20.0, 15.0, 15.0, 10.0, 9.0, 6.0, 5.0, 5.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.3917236328125, -11.947509765625, -11.5032958984375, -11.05908203125, -10.6148681640625, -10.170654296875, -9.7264404296875, -9.2822265625, -8.8380126953125, -8.393798828125, -7.9495849609375, -7.50537109375, -7.0611572265625, -6.616943359375, -6.1727294921875, -5.728515625, -5.2843017578125, -4.840087890625, -4.3958740234375, -3.95166015625, -3.5074462890625, -3.063232421875, -2.6190185546875, -2.1748046875, -1.7305908203125, -1.286376953125, -0.8421630859375, -0.39794921875, 0.0462646484375, 0.490478515625, 0.9346923828125, 1.37890625, 1.8231201171875, 2.267333984375, 2.7115478515625, 3.15576171875, 3.5999755859375, 4.044189453125, 4.4884033203125, 4.9326171875, 5.3768310546875, 5.821044921875, 6.2652587890625, 6.70947265625, 7.1536865234375, 7.597900390625, 8.0421142578125, 8.486328125, 8.9305419921875, 9.374755859375, 9.8189697265625, 10.26318359375, 10.7073974609375, 11.151611328125, 11.5958251953125, 12.0400390625, 12.4842529296875, 12.928466796875, 13.3726806640625, 13.81689453125, 14.2611083984375, 14.705322265625, 15.1495361328125, 15.59375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 12.0, 26.0, 21.0, 30.0, 50.0, 83.0, 155.0, 217.0, 377.0, 646.0, 1096.0, 2287.0, 4857.0, 11807.0, 33697.0, 147796.0, 747601.0, 63997.0, 19349.0, 7438.0, 3355.0, 1563.0, 786.0, 463.0, 286.0, 193.0, 107.0, 82.0, 50.0, 26.0, 21.0, 19.0, 10.0, 10.0, 3.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.107421875, -1.0741119384765625, -1.040802001953125, -1.0074920654296875, -0.97418212890625, -0.9408721923828125, -0.907562255859375, -0.8742523193359375, -0.8409423828125, -0.8076324462890625, -0.774322509765625, -0.7410125732421875, -0.70770263671875, -0.6743927001953125, -0.641082763671875, -0.6077728271484375, -0.574462890625, -0.5411529541015625, -0.507843017578125, -0.4745330810546875, -0.44122314453125, -0.4079132080078125, -0.374603271484375, -0.3412933349609375, -0.3079833984375, -0.2746734619140625, -0.241363525390625, -0.2080535888671875, -0.17474365234375, -0.1414337158203125, -0.108123779296875, -0.0748138427734375, -0.04150390625, -0.0081939697265625, 0.025115966796875, 0.0584259033203125, 0.09173583984375, 0.1250457763671875, 0.158355712890625, 0.1916656494140625, 0.2249755859375, 0.2582855224609375, 0.291595458984375, 0.3249053955078125, 0.35821533203125, 0.3915252685546875, 0.424835205078125, 0.4581451416015625, 0.491455078125, 0.5247650146484375, 0.558074951171875, 0.5913848876953125, 0.62469482421875, 0.6580047607421875, 0.691314697265625, 0.7246246337890625, 0.7579345703125, 0.7912445068359375, 0.824554443359375, 0.8578643798828125, 0.89117431640625, 0.9244842529296875, 0.957794189453125, 0.9911041259765625, 1.0244140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 5.0, 4.0, 3.0, 5.0, 7.0, 12.0, 13.0, 16.0, 21.0, 24.0, 34.0, 53.0, 94.0, 119.0, 130.0, 122.0, 98.0, 55.0, 46.0, 28.0, 21.0, 16.0, 8.0, 10.0, 9.0, 7.0, 8.0, 4.0, 3.0, 4.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004742145538330078, -0.000458691269159317, -0.0004431679844856262, -0.0004276446998119354, -0.00041212141513824463, -0.00039659813046455383, -0.00038107484579086304, -0.00036555156111717224, -0.00035002827644348145, -0.00033450499176979065, -0.00031898170709609985, -0.00030345842242240906, -0.00028793513774871826, -0.00027241185307502747, -0.00025688856840133667, -0.00024136528372764587, -0.00022584199905395508, -0.00021031871438026428, -0.00019479542970657349, -0.0001792721450328827, -0.0001637488603591919, -0.0001482255756855011, -0.0001327022910118103, -0.00011717900633811951, -0.00010165572166442871, -8.613243699073792e-05, -7.060915231704712e-05, -5.508586764335632e-05, -3.956258296966553e-05, -2.403929829597473e-05, -8.516013622283936e-06, 7.00727105140686e-06, 2.2530555725097656e-05, 3.805384039878845e-05, 5.357712507247925e-05, 6.910040974617004e-05, 8.462369441986084e-05, 0.00010014697909355164, 0.00011567026376724243, 0.00013119354844093323, 0.00014671683311462402, 0.00016224011778831482, 0.00017776340246200562, 0.0001932866871356964, 0.0002088099718093872, 0.000224333256483078, 0.0002398565411567688, 0.0002553798258304596, 0.0002709031105041504, 0.0002864263951778412, 0.000301949679851532, 0.0003174729645252228, 0.0003329962491989136, 0.00034851953387260437, 0.00036404281854629517, 0.00037956610321998596, 0.00039508938789367676, 0.00041061267256736755, 0.00042613595724105835, 0.00044165924191474915, 0.00045718252658843994, 0.00047270581126213074, 0.00048822909593582153, 0.0005037523806095123, 0.0005192756652832031]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 7.0, 11.0, 11.0, 10.0, 18.0, 36.0, 66.0, 93.0, 144.0, 293.0, 612.0, 1184.0, 2804.0, 6785.0, 18589.0, 69467.0, 785523.0, 119939.0, 27041.0, 9225.0, 3603.0, 1477.0, 722.0, 409.0, 194.0, 123.0, 70.0, 37.0, 21.0, 17.0, 6.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.580078125, -1.53448486328125, -1.4888916015625, -1.44329833984375, -1.397705078125, -1.35211181640625, -1.3065185546875, -1.26092529296875, -1.21533203125, -1.16973876953125, -1.1241455078125, -1.07855224609375, -1.032958984375, -0.98736572265625, -0.9417724609375, -0.89617919921875, -0.8505859375, -0.80499267578125, -0.7593994140625, -0.71380615234375, -0.668212890625, -0.62261962890625, -0.5770263671875, -0.53143310546875, -0.48583984375, -0.44024658203125, -0.3946533203125, -0.34906005859375, -0.303466796875, -0.25787353515625, -0.2122802734375, -0.16668701171875, -0.12109375, -0.07550048828125, -0.0299072265625, 0.01568603515625, 0.061279296875, 0.10687255859375, 0.1524658203125, 0.19805908203125, 0.24365234375, 0.28924560546875, 0.3348388671875, 0.38043212890625, 0.426025390625, 0.47161865234375, 0.5172119140625, 0.56280517578125, 0.6083984375, 0.65399169921875, 0.6995849609375, 0.74517822265625, 0.790771484375, 0.83636474609375, 0.8819580078125, 0.92755126953125, 0.97314453125, 1.01873779296875, 1.0643310546875, 1.10992431640625, 1.155517578125, 1.20111083984375, 1.2467041015625, 1.29229736328125, 1.337890625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 8.0, 2.0, 7.0, 5.0, 12.0, 22.0, 20.0, 36.0, 47.0, 87.0, 83.0, 127.0, 120.0, 83.0, 76.0, 76.0, 32.0, 27.0, 29.0, 20.0, 12.0, 10.0, 9.0, 4.0, 6.0, 7.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.71875, -1.67254638671875, -1.6263427734375, -1.58013916015625, -1.533935546875, -1.48773193359375, -1.4415283203125, -1.39532470703125, -1.34912109375, -1.30291748046875, -1.2567138671875, -1.21051025390625, -1.164306640625, -1.11810302734375, -1.0718994140625, -1.02569580078125, -0.9794921875, -0.93328857421875, -0.8870849609375, -0.84088134765625, -0.794677734375, -0.74847412109375, -0.7022705078125, -0.65606689453125, -0.60986328125, -0.56365966796875, -0.5174560546875, -0.47125244140625, -0.425048828125, -0.37884521484375, -0.3326416015625, -0.28643798828125, -0.240234375, -0.19403076171875, -0.1478271484375, -0.10162353515625, -0.055419921875, -0.00921630859375, 0.0369873046875, 0.08319091796875, 0.12939453125, 0.17559814453125, 0.2218017578125, 0.26800537109375, 0.314208984375, 0.36041259765625, 0.4066162109375, 0.45281982421875, 0.4990234375, 0.54522705078125, 0.5914306640625, 0.63763427734375, 0.683837890625, 0.73004150390625, 0.7762451171875, 0.82244873046875, 0.86865234375, 0.91485595703125, 0.9610595703125, 1.00726318359375, 1.053466796875, 1.09967041015625, 1.1458740234375, 1.19207763671875, 1.23828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 3.0, 8.0, 19.0, 28.0, 54.0, 138.0, 399.0, 180.0, 70.0, 32.0, 34.0, 16.0, 6.0, 3.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.836883544921875, -42.853431701660156, -40.86997985839844, -38.88652801513672, -36.903076171875, -34.91962432861328, -32.93617248535156, -30.952722549438477, -28.969270706176758, -26.98581886291504, -25.00236701965332, -23.018917083740234, -21.035465240478516, -19.052013397216797, -17.068561553955078, -15.08510971069336, -13.10165786743164, -11.118206024169922, -9.134754180908203, -7.151303291320801, -5.167851448059082, -3.1843996047973633, -1.200948715209961, 0.7825031280517578, 2.7659549713134766, 4.749406814575195, 6.732858180999756, 8.716309547424316, 10.699761390686035, 12.683213233947754, 14.666664123535156, 16.650115966796875, 18.633567810058594, 20.617019653320312, 22.60047149658203, 24.58392333984375, 26.56737518310547, 28.550827026367188, 30.534276962280273, 32.517730712890625, 34.501182556152344, 36.48463439941406, 38.46808624267578, 40.4515380859375, 42.43498992919922, 44.41844177246094, 46.401893615722656, 48.385345458984375, 50.36879348754883, 52.35224533081055, 54.335697174072266, 56.319149017333984, 58.3026008605957, 60.28605270385742, 62.269500732421875, 64.2529525756836, 66.23640441894531, 68.21985626220703, 70.20330810546875, 72.18675994873047, 74.17021179199219, 76.1536636352539, 78.13711547851562, 80.12056732177734, 82.10401916503906]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 9.0, 4.0, 9.0, 14.0, 12.0, 10.0, 17.0, 21.0, 19.0, 11.0, 16.0, 20.0, 26.0, 38.0, 73.0, 101.0, 104.0, 116.0, 109.0, 64.0, 40.0, 20.0, 17.0, 10.0, 23.0, 24.0, 19.0, 11.0, 10.0, 5.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.46061325073242, -34.2375373840332, -33.014461517333984, -31.7913875579834, -30.56831169128418, -29.34523582458496, -28.122161865234375, -26.899085998535156, -25.676010131835938, -24.45293426513672, -23.2298583984375, -22.006784439086914, -20.783708572387695, -19.560632705688477, -18.33755874633789, -17.114482879638672, -15.891407012939453, -14.668331146240234, -13.445256233215332, -12.22218132019043, -10.999105453491211, -9.776029586791992, -8.55295467376709, -7.3298797607421875, -6.106803894042969, -4.883728504180908, -3.6606531143188477, -2.437577724456787, -1.2145023345947266, 0.008573055267333984, 1.2316484451293945, 2.454723358154297, 3.67779541015625, 4.9008708000183105, 6.123946189880371, 7.347021579742432, 8.570096969604492, 9.793172836303711, 11.016247749328613, 12.239322662353516, 13.462398529052734, 14.685474395751953, 15.908549308776855, 17.131624221801758, 18.354700088500977, 19.577775955200195, 20.80084991455078, 22.02392578125, 23.24700164794922, 24.470077514648438, 25.693153381347656, 26.916227340698242, 28.13930320739746, 29.36237907409668, 30.585453033447266, 31.808528900146484, 33.0316047668457, 34.25468063354492, 35.47775650024414, 36.70083236694336, 37.92390441894531, 39.14698028564453, 40.37005615234375, 41.59313201904297, 42.81620788574219]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 11.0, 11.0, 6.0, 19.0, 18.0, 14.0, 13.0, 22.0, 30.0, 26.0, 37.0, 41.0, 29.0, 78.0, 174.0, 110.0, 67.0, 35.0, 26.0, 30.0, 21.0, 24.0, 23.0, 21.0, 24.0, 12.0, 14.0, 11.0, 9.0, 6.0, 8.0, 4.0, 3.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37109375, -3.26806640625, -3.1650390625, -3.06201171875, -2.958984375, -2.85595703125, -2.7529296875, -2.64990234375, -2.546875, -2.44384765625, -2.3408203125, -2.23779296875, -2.134765625, -2.03173828125, -1.9287109375, -1.82568359375, -1.72265625, -1.61962890625, -1.5166015625, -1.41357421875, -1.310546875, -1.20751953125, -1.1044921875, -1.00146484375, -0.8984375, -0.79541015625, -0.6923828125, -0.58935546875, -0.486328125, -0.38330078125, -0.2802734375, -0.17724609375, -0.07421875, 0.02880859375, 0.1318359375, 0.23486328125, 0.337890625, 0.44091796875, 0.5439453125, 0.64697265625, 0.75, 0.85302734375, 0.9560546875, 1.05908203125, 1.162109375, 1.26513671875, 1.3681640625, 1.47119140625, 1.57421875, 1.67724609375, 1.7802734375, 1.88330078125, 1.986328125, 2.08935546875, 2.1923828125, 2.29541015625, 2.3984375, 2.50146484375, 2.6044921875, 2.70751953125, 2.810546875, 2.91357421875, 3.0166015625, 3.11962890625, 3.22265625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 7.0, 9.0, 10.0, 13.0, 15.0, 36.0, 46.0, 124.0, 209.0, 713.0, 3524.0, 48867.0, 8326156.0, 6920.0, 1251.0, 379.0, 126.0, 74.0, 25.0, 21.0, 4.0, 6.0, 14.0, 16.0, 16.0, 3.0, 0.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-37.74658966064453, -36.452911376953125, -35.15923309326172, -33.86555480957031, -32.571876525878906, -31.278196334838867, -29.98451805114746, -28.690837860107422, -27.397159576416016, -26.10348129272461, -24.809803009033203, -23.516124725341797, -22.222444534301758, -20.92876625061035, -19.635087966918945, -18.341407775878906, -17.047731399536133, -15.754053115844727, -14.460373878479004, -13.166695594787598, -11.873016357421875, -10.579338073730469, -9.285659790039062, -7.99198055267334, -6.698302268981934, -5.404623508453369, -4.110944747924805, -2.8172664642333984, -1.523587703704834, -0.22990894317626953, 1.0637693405151367, 2.3574485778808594, 3.6511268615722656, 4.94480562210083, 6.2384843826293945, 7.532162666320801, 8.825841903686523, 10.11952018737793, 11.413198471069336, 12.706877708435059, 14.000555992126465, 15.294234275817871, 16.587913513183594, 17.881591796875, 19.175270080566406, 20.468948364257812, 21.76262664794922, 23.056306838989258, 24.349985122680664, 25.64366340637207, 26.937341690063477, 28.231021881103516, 29.524700164794922, 30.818378448486328, 32.112056732177734, 33.40573501586914, 34.69941329956055, 35.99309158325195, 37.28676986694336, 38.580448150634766, 39.87412643432617, 41.167808532714844, 42.46148681640625, 43.755165100097656, 45.04884338378906]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 3.0, 2.0, 7.0, 4.0, 3.0, 3.0, 1.0, 9.0, 5.0, 8.0, 4.0, 8.0, 7.0, 3.0, 4.0, 4.0, 4.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.25182342529297, -41.656986236572266, -40.06214904785156, -38.46731185913086, -36.872474670410156, -35.27763748168945, -33.68280029296875, -32.08796310424805, -30.493125915527344, -28.89828872680664, -27.303451538085938, -25.708614349365234, -24.11377716064453, -22.518939971923828, -20.924102783203125, -19.329265594482422, -17.73443031311035, -16.13959312438965, -14.544755935668945, -12.949918746948242, -11.355081558227539, -9.760244369506836, -8.16540813446045, -6.570570945739746, -4.975733757019043, -3.38089656829834, -1.7860596179962158, -0.1912226676940918, 1.4036145210266113, 2.9984517097473145, 4.593288421630859, 6.1881256103515625, 7.782962799072266, 9.377799987792969, 10.972637176513672, 12.567474365234375, 14.162311553955078, 15.757148742675781, 17.351985931396484, 18.946823120117188, 20.54166030883789, 22.136497497558594, 23.731334686279297, 25.326171875, 26.921009063720703, 28.515846252441406, 30.11068344116211, 31.705520629882812, 33.30035400390625, 34.89519119262695, 36.490028381347656, 38.08486557006836, 39.67970275878906, 41.274539947509766, 42.86937713623047, 44.46421432495117, 46.059051513671875, 47.65388870239258, 49.24872589111328, 50.843563079833984, 52.43840026855469, 54.03323745727539, 55.628074645996094, 57.2229118347168, 58.8177490234375]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 8.0, 3.0, 8.0, 10.0, 12.0, 15.0, 20.0, 19.0, 11.0, 31.0, 37.0, 52.0, 51.0, 52.0, 62.0, 67.0, 73.0, 64.0, 60.0, 65.0, 42.0, 49.0, 42.0, 34.0, 32.0, 24.0, 12.0, 17.0, 9.0, 2.0, 5.0, 1.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.302734375, -2.2191162109375, -2.135498046875, -2.0518798828125, -1.96826171875, -1.8846435546875, -1.801025390625, -1.7174072265625, -1.6337890625, -1.5501708984375, -1.466552734375, -1.3829345703125, -1.29931640625, -1.2156982421875, -1.132080078125, -1.0484619140625, -0.96484375, -0.8812255859375, -0.797607421875, -0.7139892578125, -0.63037109375, -0.5467529296875, -0.463134765625, -0.3795166015625, -0.2958984375, -0.2122802734375, -0.128662109375, -0.0450439453125, 0.03857421875, 0.1221923828125, 0.205810546875, 0.2894287109375, 0.373046875, 0.4566650390625, 0.540283203125, 0.6239013671875, 0.70751953125, 0.7911376953125, 0.874755859375, 0.9583740234375, 1.0419921875, 1.1256103515625, 1.209228515625, 1.2928466796875, 1.37646484375, 1.4600830078125, 1.543701171875, 1.6273193359375, 1.7109375, 1.7945556640625, 1.878173828125, 1.9617919921875, 2.04541015625, 2.1290283203125, 2.212646484375, 2.2962646484375, 2.3798828125, 2.4635009765625, 2.547119140625, 2.6307373046875, 2.71435546875, 2.7979736328125, 2.881591796875, 2.9652099609375, 3.048828125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 11.0, 13.0, 18.0, 39.0, 50.0, 80.0, 128.0, 183.0, 322.0, 579.0, 999.0, 2125.0, 4394.0, 9784.0, 22821.0, 53473.0, 119309.0, 157101.0, 86699.0, 36838.0, 15587.0, 6905.0, 3197.0, 1588.0, 823.0, 457.0, 264.0, 171.0, 102.0, 64.0, 50.0, 25.0, 18.0, 11.0, 9.0, 8.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.328125, -18.68994140625, -18.0517578125, -17.41357421875, -16.775390625, -16.13720703125, -15.4990234375, -14.86083984375, -14.22265625, -13.58447265625, -12.9462890625, -12.30810546875, -11.669921875, -11.03173828125, -10.3935546875, -9.75537109375, -9.1171875, -8.47900390625, -7.8408203125, -7.20263671875, -6.564453125, -5.92626953125, -5.2880859375, -4.64990234375, -4.01171875, -3.37353515625, -2.7353515625, -2.09716796875, -1.458984375, -0.82080078125, -0.1826171875, 0.45556640625, 1.09375, 1.73193359375, 2.3701171875, 3.00830078125, 3.646484375, 4.28466796875, 4.9228515625, 5.56103515625, 6.19921875, 6.83740234375, 7.4755859375, 8.11376953125, 8.751953125, 9.39013671875, 10.0283203125, 10.66650390625, 11.3046875, 11.94287109375, 12.5810546875, 13.21923828125, 13.857421875, 14.49560546875, 15.1337890625, 15.77197265625, 16.41015625, 17.04833984375, 17.6865234375, 18.32470703125, 18.962890625, 19.60107421875, 20.2392578125, 20.87744140625, 21.515625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 5.0, 5.0, 4.0, 3.0, 15.0, 9.0, 16.0, 17.0, 17.0, 23.0, 24.0, 21.0, 35.0, 28.0, 35.0, 46.0, 50.0, 48.0, 53.0, 46.0, 47.0, 64.0, 50.0, 47.0, 34.0, 28.0, 39.0, 27.0, 23.0, 21.0, 23.0, 23.0, 19.0, 5.0, 9.0, 9.0, 5.0, 8.0, 5.0, 4.0, 3.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.08648681640625, -2.9893798828125, -2.89227294921875, -2.795166015625, -2.69805908203125, -2.6009521484375, -2.50384521484375, -2.40673828125, -2.30963134765625, -2.2125244140625, -2.11541748046875, -2.018310546875, -1.92120361328125, -1.8240966796875, -1.72698974609375, -1.6298828125, -1.53277587890625, -1.4356689453125, -1.33856201171875, -1.241455078125, -1.14434814453125, -1.0472412109375, -0.95013427734375, -0.85302734375, -0.75592041015625, -0.6588134765625, -0.56170654296875, -0.464599609375, -0.36749267578125, -0.2703857421875, -0.17327880859375, -0.076171875, 0.02093505859375, 0.1180419921875, 0.21514892578125, 0.312255859375, 0.40936279296875, 0.5064697265625, 0.60357666015625, 0.70068359375, 0.79779052734375, 0.8948974609375, 0.99200439453125, 1.089111328125, 1.18621826171875, 1.2833251953125, 1.38043212890625, 1.4775390625, 1.57464599609375, 1.6717529296875, 1.76885986328125, 1.865966796875, 1.96307373046875, 2.0601806640625, 2.15728759765625, 2.25439453125, 2.35150146484375, 2.4486083984375, 2.54571533203125, 2.642822265625, 2.73992919921875, 2.8370361328125, 2.93414306640625, 3.03125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 10.0, 21.0, 25.0, 62.0, 105.0, 105.0, 61.0, 31.0, 16.0, 4.0, 3.0, 4.0, 6.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.659820556640625, -30.639490127563477, -29.619159698486328, -28.598827362060547, -27.5784969329834, -26.55816650390625, -25.5378360748291, -24.517505645751953, -23.497173309326172, -22.476842880249023, -21.456512451171875, -20.436180114746094, -19.415849685668945, -18.395519256591797, -17.37518882751465, -16.3548583984375, -15.334527969360352, -14.314197540283203, -13.293866157531738, -12.27353572845459, -11.253204345703125, -10.232873916625977, -9.212543487548828, -8.19221305847168, -7.171881675720215, -6.151550769805908, -5.131219863891602, -4.110889434814453, -3.0905585289001465, -2.07022762298584, -1.0498971939086914, -0.029566287994384766, 0.9907646179199219, 2.0110955238342285, 3.031426191329956, 4.051756858825684, 5.07208776473999, 6.092418670654297, 7.112749099731445, 8.133079528808594, 9.153410911560059, 10.173741340637207, 11.194072723388672, 12.21440315246582, 13.234733581542969, 14.255064964294434, 15.275395393371582, 16.295726776123047, 17.316057205200195, 18.336387634277344, 19.356718063354492, 20.37704849243164, 21.397380828857422, 22.41771125793457, 23.43804168701172, 24.458372116088867, 25.478702545166016, 26.499032974243164, 27.519363403320312, 28.539695739746094, 29.560026168823242, 30.58035659790039, 31.60068702697754, 32.62101745605469, 33.64134979248047]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 5.0, 7.0, 9.0, 8.0, 9.0, 16.0, 21.0, 32.0, 58.0, 55.0, 72.0, 45.0, 27.0, 27.0, 18.0, 11.0, 7.0, 10.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.537559509277344, -15.982501029968262, -15.42744255065918, -14.872384071350098, -14.317325592041016, -13.76226806640625, -13.207209587097168, -12.652151107788086, -12.097092628479004, -11.542034149169922, -10.98697566986084, -10.431917190551758, -9.876859664916992, -9.321800231933594, -8.766742706298828, -8.211684226989746, -7.656625747680664, -7.101567268371582, -6.5465087890625, -5.991450786590576, -5.436392307281494, -4.881333827972412, -4.326275825500488, -3.7712173461914062, -3.216158866882324, -2.661100387573242, -2.1060421466827393, -1.5509837865829468, -0.9959254264831543, -0.44086694717407227, 0.11419129371643066, 0.6692495346069336, 1.2243061065673828, 1.7793644666671753, 2.3344228267669678, 2.8894810676574707, 3.4445395469665527, 3.9995980262756348, 4.554656028747559, 5.109714508056641, 5.664772987365723, 6.219831466674805, 6.774889945983887, 7.3299479484558105, 7.885006427764893, 8.440065383911133, 8.995122909545898, 9.55018138885498, 10.105239868164062, 10.660298347473145, 11.215356826782227, 11.770415306091309, 12.32547378540039, 12.880531311035156, 13.435589790344238, 13.99064826965332, 14.545706748962402, 15.100765228271484, 15.655823707580566, 16.21088218688965, 16.765939712524414, 17.320999145507812, 17.876056671142578, 18.431114196777344, 18.986173629760742]}, "eval/loss": 1.8941514492034912, "eval/wer": 1.1062871876239588, "eval/runtime": 910.08, "eval/samples_per_second": 2.903, "eval/steps_per_second": 0.364} \ No newline at end of file +{"train/loss": 0.2736, "train/learning_rate": 6.142517814726841e-05, "train/epoch": 8.41, "train/global_step": 7500, "_runtime": 47750, "_timestamp": 1647641627, "_step": 7502, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 10.0, 35.0, 72.0, 109.0, 179.0, 202.0, 164.0, 126.0, 62.0, 28.0, 10.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.8568115234375, -106.24176788330078, -103.62672424316406, -101.01168060302734, -98.39663696289062, -95.78160095214844, -93.16654968261719, -90.551513671875, -87.93647003173828, -85.32142639160156, -82.70638275146484, -80.09133911132812, -77.4762954711914, -74.86125183105469, -72.2462158203125, -69.63117218017578, -67.01612854003906, -64.40108489990234, -61.786041259765625, -59.170997619628906, -56.55595779418945, -53.940914154052734, -51.325870513916016, -48.71083068847656, -46.09577941894531, -43.480735778808594, -40.865692138671875, -38.250648498535156, -35.6356086730957, -33.020565032958984, -30.405521392822266, -27.79047966003418, -25.175434112548828, -22.56039047241211, -19.945348739624023, -17.330305099487305, -14.715262413024902, -12.1002197265625, -9.485176086425781, -6.870134353637695, -4.255090713500977, -1.6400477886199951, 0.9749951362609863, 3.590038299560547, 6.205080986022949, 8.820123672485352, 11.43516731262207, 14.050209045410156, 16.665252685546875, 19.280296325683594, 21.89533805847168, 24.5103816986084, 27.125423431396484, 29.740467071533203, 32.35551071166992, 34.970550537109375, 37.585594177246094, 40.20063781738281, 42.81568145751953, 45.43072509765625, 48.0457649230957, 50.66080856323242, 53.27585220336914, 55.890892028808594, 58.50593948364258]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 7.0, 5.0, 9.0, 9.0, 15.0, 16.0, 21.0, 25.0, 27.0, 42.0, 38.0, 47.0, 52.0, 78.0, 65.0, 68.0, 50.0, 74.0, 64.0, 46.0, 37.0, 39.0, 33.0, 35.0, 18.0, 25.0, 12.0, 10.0, 9.0, 7.0, 6.0, 7.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.08191680908203, -37.88005828857422, -36.67820358276367, -35.476348876953125, -34.27449035644531, -33.0726318359375, -31.870777130126953, -30.668920516967773, -29.467063903808594, -28.265207290649414, -27.063350677490234, -25.861494064331055, -24.659637451171875, -23.457780838012695, -22.255924224853516, -21.054067611694336, -19.852210998535156, -18.650354385375977, -17.448497772216797, -16.246641159057617, -15.044784545898438, -13.842927932739258, -12.641071319580078, -11.439214706420898, -10.237358093261719, -9.035501480102539, -7.833644866943359, -6.63178825378418, -5.429931640625, -4.22807502746582, -3.0262184143066406, -1.824361801147461, -0.6225013732910156, 0.5793552398681641, 1.7812118530273438, 2.9830684661865234, 4.184925079345703, 5.386781692504883, 6.5886383056640625, 7.790494918823242, 8.992351531982422, 10.194208145141602, 11.396064758300781, 12.597921371459961, 13.79977798461914, 15.00163459777832, 16.2034912109375, 17.40534782409668, 18.60720443725586, 19.80906105041504, 21.01091766357422, 22.2127742767334, 23.414630889892578, 24.616487503051758, 25.818344116210938, 27.020200729370117, 28.222057342529297, 29.423913955688477, 30.625770568847656, 31.827627182006836, 33.029483795166016, 34.23133850097656, 35.433197021484375, 36.63505554199219, 37.836910247802734]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 6.0, 8.0, 11.0, 10.0, 19.0, 20.0, 14.0, 21.0, 17.0, 26.0, 30.0, 26.0, 29.0, 39.0, 41.0, 47.0, 55.0, 48.0, 49.0, 48.0, 38.0, 51.0, 30.0, 38.0, 36.0, 37.0, 30.0, 24.0, 21.0, 19.0, 17.0, 15.0, 12.0, 11.0, 11.0, 7.0, 7.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-2.52734375, -2.458892822265625, -2.39044189453125, -2.321990966796875, -2.2535400390625, -2.185089111328125, -2.11663818359375, -2.048187255859375, -1.979736328125, -1.911285400390625, -1.84283447265625, -1.774383544921875, -1.7059326171875, -1.637481689453125, -1.56903076171875, -1.500579833984375, -1.43212890625, -1.363677978515625, -1.29522705078125, -1.226776123046875, -1.1583251953125, -1.089874267578125, -1.02142333984375, -0.952972412109375, -0.884521484375, -0.816070556640625, -0.74761962890625, -0.679168701171875, -0.6107177734375, -0.542266845703125, -0.47381591796875, -0.405364990234375, -0.3369140625, -0.268463134765625, -0.20001220703125, -0.131561279296875, -0.0631103515625, 0.005340576171875, 0.07379150390625, 0.142242431640625, 0.210693359375, 0.279144287109375, 0.34759521484375, 0.416046142578125, 0.4844970703125, 0.552947998046875, 0.62139892578125, 0.689849853515625, 0.75830078125, 0.826751708984375, 0.89520263671875, 0.963653564453125, 1.0321044921875, 1.100555419921875, 1.16900634765625, 1.237457275390625, 1.305908203125, 1.374359130859375, 1.44281005859375, 1.511260986328125, 1.5797119140625, 1.648162841796875, 1.71661376953125, 1.785064697265625, 1.853515625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 8.0, 20.0, 19.0, 21.0, 38.0, 28.0, 44.0, 56.0, 71.0, 95.0, 135.0, 167.0, 224.0, 345.0, 609.0, 1172.0, 2719.0, 7357.0, 26879.0, 149824.0, 2475900.0, 1387590.0, 111694.0, 20432.0, 5181.0, 1642.0, 727.0, 342.0, 233.0, 171.0, 108.0, 102.0, 78.0, 53.0, 55.0, 33.0, 33.0, 13.0, 18.0, 8.0, 7.0, 5.0, 7.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.84375, -20.263427734375, -19.68310546875, -19.102783203125, -18.5224609375, -17.942138671875, -17.36181640625, -16.781494140625, -16.201171875, -15.620849609375, -15.04052734375, -14.460205078125, -13.8798828125, -13.299560546875, -12.71923828125, -12.138916015625, -11.55859375, -10.978271484375, -10.39794921875, -9.817626953125, -9.2373046875, -8.656982421875, -8.07666015625, -7.496337890625, -6.916015625, -6.335693359375, -5.75537109375, -5.175048828125, -4.5947265625, -4.014404296875, -3.43408203125, -2.853759765625, -2.2734375, -1.693115234375, -1.11279296875, -0.532470703125, 0.0478515625, 0.628173828125, 1.20849609375, 1.788818359375, 2.369140625, 2.949462890625, 3.52978515625, 4.110107421875, 4.6904296875, 5.270751953125, 5.85107421875, 6.431396484375, 7.01171875, 7.592041015625, 8.17236328125, 8.752685546875, 9.3330078125, 9.913330078125, 10.49365234375, 11.073974609375, 11.654296875, 12.234619140625, 12.81494140625, 13.395263671875, 13.9755859375, 14.555908203125, 15.13623046875, 15.716552734375, 16.296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 6.0, 8.0, 14.0, 20.0, 44.0, 66.0, 101.0, 172.0, 253.0, 439.0, 790.0, 868.0, 523.0, 299.0, 190.0, 117.0, 54.0, 48.0, 31.0, 12.0, 8.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7578125, -9.2733154296875, -8.788818359375, -8.3043212890625, -7.81982421875, -7.3353271484375, -6.850830078125, -6.3663330078125, -5.8818359375, -5.3973388671875, -4.912841796875, -4.4283447265625, -3.94384765625, -3.4593505859375, -2.974853515625, -2.4903564453125, -2.005859375, -1.5213623046875, -1.036865234375, -0.5523681640625, -0.06787109375, 0.4166259765625, 0.901123046875, 1.3856201171875, 1.8701171875, 2.3546142578125, 2.839111328125, 3.3236083984375, 3.80810546875, 4.2926025390625, 4.777099609375, 5.2615966796875, 5.74609375, 6.2305908203125, 6.715087890625, 7.1995849609375, 7.68408203125, 8.1685791015625, 8.653076171875, 9.1375732421875, 9.6220703125, 10.1065673828125, 10.591064453125, 11.0755615234375, 11.56005859375, 12.0445556640625, 12.529052734375, 13.0135498046875, 13.498046875, 13.9825439453125, 14.467041015625, 14.9515380859375, 15.43603515625, 15.9205322265625, 16.405029296875, 16.8895263671875, 17.3740234375, 17.8585205078125, 18.343017578125, 18.8275146484375, 19.31201171875, 19.7965087890625, 20.281005859375, 20.7655029296875, 21.25]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 19.0, 25.0, 49.0, 106.0, 226.0, 555.0, 1826.0, 12465.0, 304147.0, 3719872.0, 144573.0, 8203.0, 1431.0, 414.0, 182.0, 93.0, 42.0, 29.0, 12.0, 6.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.21875, -48.31689453125, -46.4150390625, -44.51318359375, -42.611328125, -40.70947265625, -38.8076171875, -36.90576171875, -35.00390625, -33.10205078125, -31.2001953125, -29.29833984375, -27.396484375, -25.49462890625, -23.5927734375, -21.69091796875, -19.7890625, -17.88720703125, -15.9853515625, -14.08349609375, -12.181640625, -10.27978515625, -8.3779296875, -6.47607421875, -4.57421875, -2.67236328125, -0.7705078125, 1.13134765625, 3.033203125, 4.93505859375, 6.8369140625, 8.73876953125, 10.640625, 12.54248046875, 14.4443359375, 16.34619140625, 18.248046875, 20.14990234375, 22.0517578125, 23.95361328125, 25.85546875, 27.75732421875, 29.6591796875, 31.56103515625, 33.462890625, 35.36474609375, 37.2666015625, 39.16845703125, 41.0703125, 42.97216796875, 44.8740234375, 46.77587890625, 48.677734375, 50.57958984375, 52.4814453125, 54.38330078125, 56.28515625, 58.18701171875, 60.0888671875, 61.99072265625, 63.892578125, 65.79443359375, 67.6962890625, 69.59814453125, 71.5]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 3.0, 12.0, 8.0, 21.0, 35.0, 43.0, 62.0, 54.0, 84.0, 81.0, 78.0, 100.0, 95.0, 67.0, 70.0, 57.0, 34.0, 30.0, 17.0, 17.0, 12.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.74275207519531, -48.39180374145508, -47.040855407714844, -45.68990707397461, -44.338958740234375, -42.988006591796875, -41.637062072753906, -40.286109924316406, -38.93516159057617, -37.58421325683594, -36.2332649230957, -34.88231658935547, -33.531368255615234, -32.180419921875, -30.829469680786133, -29.478519439697266, -28.127573013305664, -26.77662467956543, -25.425676345825195, -24.074726104736328, -22.723777770996094, -21.37282943725586, -20.021881103515625, -18.67093276977539, -17.319984436035156, -15.969036102294922, -14.618086814880371, -13.267138481140137, -11.916189193725586, -10.565240859985352, -9.214292526245117, -7.863343238830566, -6.512393951416016, -5.161445140838623, -3.8104965686798096, -2.459547996520996, -1.1085991859436035, 0.24234962463378906, 1.5932979583740234, 2.944247245788574, 4.295195579528809, 5.646144390106201, 6.997093200683594, 8.348041534423828, 9.698989868164062, 11.049939155578613, 12.400887489318848, 13.751836776733398, 15.102785110473633, 16.453733444213867, 17.8046817779541, 19.15563201904297, 20.506580352783203, 21.857528686523438, 23.208477020263672, 24.559425354003906, 25.91037368774414, 27.261322021484375, 28.61227035522461, 29.963218688964844, 31.31416893005371, 32.66511535644531, 34.01606750488281, 35.36701583862305, 36.71796417236328]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 6.0, 3.0, 5.0, 5.0, 10.0, 13.0, 9.0, 6.0, 12.0, 23.0, 19.0, 27.0, 28.0, 29.0, 23.0, 33.0, 35.0, 38.0, 42.0, 36.0, 41.0, 49.0, 44.0, 37.0, 34.0, 46.0, 40.0, 26.0, 37.0, 18.0, 40.0, 31.0, 29.0, 23.0, 20.0, 18.0, 15.0, 11.0, 9.0, 10.0, 4.0, 6.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-34.79730987548828, -33.73090362548828, -32.66450119018555, -31.59809684753418, -30.531692504882812, -29.465288162231445, -28.398883819580078, -27.332477569580078, -26.266075134277344, -25.199670791625977, -24.13326644897461, -23.066862106323242, -22.000457763671875, -20.934053421020508, -19.86764907836914, -18.80124282836914, -17.734838485717773, -16.668434143066406, -15.602029800415039, -14.535625457763672, -13.469221115112305, -12.402816772460938, -11.336411476135254, -10.270007133483887, -9.20360279083252, -8.137198448181152, -7.070794105529785, -6.00438928604126, -4.937984943389893, -3.8715806007385254, -2.80517578125, -1.7387714385986328, -0.6723670959472656, 0.3940373659133911, 1.4604418277740479, 2.526846408843994, 3.5932507514953613, 4.6596550941467285, 5.726059913635254, 6.792464256286621, 7.858868598937988, 8.925272941589355, 9.991677284240723, 11.058082580566406, 12.124486923217773, 13.19089126586914, 14.257295608520508, 15.323699951171875, 16.390104293823242, 17.45650863647461, 18.522912979125977, 19.589317321777344, 20.65572166442871, 21.722126007080078, 22.788532257080078, 23.854934692382812, 24.921340942382812, 25.98774528503418, 27.054149627685547, 28.120553970336914, 29.18695831298828, 30.25336265563965, 31.319766998291016, 32.386173248291016, 33.45257568359375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 5.0, 3.0, 8.0, 10.0, 11.0, 12.0, 12.0, 11.0, 17.0, 19.0, 26.0, 22.0, 32.0, 35.0, 38.0, 37.0, 41.0, 44.0, 39.0, 37.0, 52.0, 47.0, 36.0, 41.0, 34.0, 42.0, 49.0, 37.0, 31.0, 31.0, 19.0, 22.0, 11.0, 21.0, 13.0, 9.0, 7.0, 5.0, 5.0, 6.0, 2.0, 3.0, 7.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.71484375, -2.63330078125, -2.5517578125, -2.47021484375, -2.388671875, -2.30712890625, -2.2255859375, -2.14404296875, -2.0625, -1.98095703125, -1.8994140625, -1.81787109375, -1.736328125, -1.65478515625, -1.5732421875, -1.49169921875, -1.41015625, -1.32861328125, -1.2470703125, -1.16552734375, -1.083984375, -1.00244140625, -0.9208984375, -0.83935546875, -0.7578125, -0.67626953125, -0.5947265625, -0.51318359375, -0.431640625, -0.35009765625, -0.2685546875, -0.18701171875, -0.10546875, -0.02392578125, 0.0576171875, 0.13916015625, 0.220703125, 0.30224609375, 0.3837890625, 0.46533203125, 0.546875, 0.62841796875, 0.7099609375, 0.79150390625, 0.873046875, 0.95458984375, 1.0361328125, 1.11767578125, 1.19921875, 1.28076171875, 1.3623046875, 1.44384765625, 1.525390625, 1.60693359375, 1.6884765625, 1.77001953125, 1.8515625, 1.93310546875, 2.0146484375, 2.09619140625, 2.177734375, 2.25927734375, 2.3408203125, 2.42236328125, 2.50390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 11.0, 16.0, 22.0, 29.0, 47.0, 63.0, 93.0, 131.0, 208.0, 332.0, 437.0, 747.0, 1179.0, 2039.0, 3443.0, 5795.0, 10326.0, 19415.0, 37523.0, 81532.0, 248397.0, 412673.0, 117569.0, 50286.0, 24900.0, 13139.0, 7431.0, 4211.0, 2496.0, 1508.0, 905.0, 536.0, 336.0, 235.0, 172.0, 105.0, 62.0, 59.0, 44.0, 25.0, 17.0, 14.0, 10.0, 9.0, 4.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7421875, -4.57977294921875, -4.4173583984375, -4.25494384765625, -4.092529296875, -3.93011474609375, -3.7677001953125, -3.60528564453125, -3.44287109375, -3.28045654296875, -3.1180419921875, -2.95562744140625, -2.793212890625, -2.63079833984375, -2.4683837890625, -2.30596923828125, -2.1435546875, -1.98114013671875, -1.8187255859375, -1.65631103515625, -1.493896484375, -1.33148193359375, -1.1690673828125, -1.00665283203125, -0.84423828125, -0.68182373046875, -0.5194091796875, -0.35699462890625, -0.194580078125, -0.03216552734375, 0.1302490234375, 0.29266357421875, 0.455078125, 0.61749267578125, 0.7799072265625, 0.94232177734375, 1.104736328125, 1.26715087890625, 1.4295654296875, 1.59197998046875, 1.75439453125, 1.91680908203125, 2.0792236328125, 2.24163818359375, 2.404052734375, 2.56646728515625, 2.7288818359375, 2.89129638671875, 3.0537109375, 3.21612548828125, 3.3785400390625, 3.54095458984375, 3.703369140625, 3.86578369140625, 4.0281982421875, 4.19061279296875, 4.35302734375, 4.51544189453125, 4.6778564453125, 4.84027099609375, 5.002685546875, 5.16510009765625, 5.3275146484375, 5.48992919921875, 5.65234375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 2.0, 0.0, 3.0, 2.0, 7.0, 10.0, 11.0, 15.0, 14.0, 15.0, 15.0, 19.0, 19.0, 26.0, 30.0, 28.0, 30.0, 28.0, 36.0, 39.0, 29.0, 50.0, 26.0, 1065.0, 45.0, 29.0, 40.0, 41.0, 33.0, 32.0, 32.0, 38.0, 27.0, 29.0, 23.0, 20.0, 18.0, 17.0, 11.0, 10.0, 18.0, 11.0, 6.0, 4.0, 8.0, 5.0, 4.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.318359375, -2.24517822265625, -2.1719970703125, -2.09881591796875, -2.025634765625, -1.95245361328125, -1.8792724609375, -1.80609130859375, -1.73291015625, -1.65972900390625, -1.5865478515625, -1.51336669921875, -1.440185546875, -1.36700439453125, -1.2938232421875, -1.22064208984375, -1.1474609375, -1.07427978515625, -1.0010986328125, -0.92791748046875, -0.854736328125, -0.78155517578125, -0.7083740234375, -0.63519287109375, -0.56201171875, -0.48883056640625, -0.4156494140625, -0.34246826171875, -0.269287109375, -0.19610595703125, -0.1229248046875, -0.04974365234375, 0.0234375, 0.09661865234375, 0.1697998046875, 0.24298095703125, 0.316162109375, 0.38934326171875, 0.4625244140625, 0.53570556640625, 0.60888671875, 0.68206787109375, 0.7552490234375, 0.82843017578125, 0.901611328125, 0.97479248046875, 1.0479736328125, 1.12115478515625, 1.1943359375, 1.26751708984375, 1.3406982421875, 1.41387939453125, 1.487060546875, 1.56024169921875, 1.6334228515625, 1.70660400390625, 1.77978515625, 1.85296630859375, 1.9261474609375, 1.99932861328125, 2.072509765625, 2.14569091796875, 2.2188720703125, 2.29205322265625, 2.365234375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 9.0, 16.0, 24.0, 30.0, 45.0, 62.0, 106.0, 175.0, 243.0, 353.0, 601.0, 973.0, 1582.0, 2621.0, 4514.0, 7688.0, 13863.0, 25491.0, 51992.0, 120474.0, 411906.0, 1066896.0, 223326.0, 80719.0, 37906.0, 19466.0, 10817.0, 6018.0, 3651.0, 2072.0, 1291.0, 800.0, 486.0, 301.0, 207.0, 137.0, 77.0, 52.0, 54.0, 28.0, 23.0, 7.0, 5.0, 10.0, 6.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.083984375, -2.0249176025390625, -1.965850830078125, -1.9067840576171875, -1.84771728515625, -1.7886505126953125, -1.729583740234375, -1.6705169677734375, -1.6114501953125, -1.5523834228515625, -1.493316650390625, -1.4342498779296875, -1.37518310546875, -1.3161163330078125, -1.257049560546875, -1.1979827880859375, -1.138916015625, -1.0798492431640625, -1.020782470703125, -0.9617156982421875, -0.90264892578125, -0.8435821533203125, -0.784515380859375, -0.7254486083984375, -0.6663818359375, -0.6073150634765625, -0.548248291015625, -0.4891815185546875, -0.43011474609375, -0.3710479736328125, -0.311981201171875, -0.2529144287109375, -0.19384765625, -0.1347808837890625, -0.075714111328125, -0.0166473388671875, 0.04241943359375, 0.1014862060546875, 0.160552978515625, 0.2196197509765625, 0.2786865234375, 0.3377532958984375, 0.396820068359375, 0.4558868408203125, 0.51495361328125, 0.5740203857421875, 0.633087158203125, 0.6921539306640625, 0.751220703125, 0.8102874755859375, 0.869354248046875, 0.9284210205078125, 0.98748779296875, 1.0465545654296875, 1.105621337890625, 1.1646881103515625, 1.2237548828125, 1.2828216552734375, 1.341888427734375, 1.4009552001953125, 1.46002197265625, 1.5190887451171875, 1.578155517578125, 1.6372222900390625, 1.6962890625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 2.0, 3.0, 7.0, 3.0, 5.0, 5.0, 14.0, 9.0, 10.0, 9.0, 9.0, 12.0, 15.0, 22.0, 26.0, 34.0, 61.0, 113.0, 261.0, 124.0, 61.0, 43.0, 24.0, 18.0, 14.0, 7.0, 14.0, 9.0, 10.0, 6.0, 8.0, 7.0, 5.0, 4.0, 2.0, 7.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3291015625, -1.2840423583984375, -1.238983154296875, -1.1939239501953125, -1.14886474609375, -1.1038055419921875, -1.058746337890625, -1.0136871337890625, -0.9686279296875, -0.9235687255859375, -0.878509521484375, -0.8334503173828125, -0.78839111328125, -0.7433319091796875, -0.698272705078125, -0.6532135009765625, -0.608154296875, -0.5630950927734375, -0.518035888671875, -0.4729766845703125, -0.42791748046875, -0.3828582763671875, -0.337799072265625, -0.2927398681640625, -0.2476806640625, -0.2026214599609375, -0.157562255859375, -0.1125030517578125, -0.06744384765625, -0.0223846435546875, 0.022674560546875, 0.0677337646484375, 0.11279296875, 0.1578521728515625, 0.202911376953125, 0.2479705810546875, 0.29302978515625, 0.3380889892578125, 0.383148193359375, 0.4282073974609375, 0.4732666015625, 0.5183258056640625, 0.563385009765625, 0.6084442138671875, 0.65350341796875, 0.6985626220703125, 0.743621826171875, 0.7886810302734375, 0.833740234375, 0.8787994384765625, 0.923858642578125, 0.9689178466796875, 1.01397705078125, 1.0590362548828125, 1.104095458984375, 1.1491546630859375, 1.1942138671875, 1.2392730712890625, 1.284332275390625, 1.3293914794921875, 1.37445068359375, 1.4195098876953125, 1.464569091796875, 1.5096282958984375, 1.5546875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 2.0, 6.0, 3.0, 0.0, 1.0, 6.0, 6.0, 5.0, 11.0, 16.0, 19.0, 31.0, 55.0, 87.0, 107.0, 157.0, 359.0, 13060.0, 1019653.0, 14045.0, 412.0, 155.0, 85.0, 69.0, 56.0, 42.0, 30.0, 20.0, 7.0, 10.0, 10.0, 5.0, 0.0, 1.0, 5.0, 3.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-37.3125, -36.231201171875, -35.14990234375, -34.068603515625, -32.9873046875, -31.906005859375, -30.82470703125, -29.743408203125, -28.662109375, -27.580810546875, -26.49951171875, -25.418212890625, -24.3369140625, -23.255615234375, -22.17431640625, -21.093017578125, -20.01171875, -18.930419921875, -17.84912109375, -16.767822265625, -15.6865234375, -14.605224609375, -13.52392578125, -12.442626953125, -11.361328125, -10.280029296875, -9.19873046875, -8.117431640625, -7.0361328125, -5.954833984375, -4.87353515625, -3.792236328125, -2.7109375, -1.629638671875, -0.54833984375, 0.532958984375, 1.6142578125, 2.695556640625, 3.77685546875, 4.858154296875, 5.939453125, 7.020751953125, 8.10205078125, 9.183349609375, 10.2646484375, 11.345947265625, 12.42724609375, 13.508544921875, 14.58984375, 15.671142578125, 16.75244140625, 17.833740234375, 18.9150390625, 19.996337890625, 21.07763671875, 22.158935546875, 23.240234375, 24.321533203125, 25.40283203125, 26.484130859375, 27.5654296875, 28.646728515625, 29.72802734375, 30.809326171875, 31.890625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 57.0, 761.0, 183.0, 4.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.394366264343262, -12.485061645507812, -11.575757026672363, -10.666452407836914, -9.757148742675781, -8.847844123840332, -7.938539505004883, -7.029235363006592, -6.119930744171143, -5.210626125335693, -4.301321983337402, -3.392017364501953, -2.482712984085083, -1.573408603668213, -0.6641039848327637, 0.24520015716552734, 1.1545047760009766, 2.0638091564178467, 2.973113536834717, 3.882418155670166, 4.791722297668457, 5.701026916503906, 6.6103315353393555, 7.5196356773376465, 8.428939819335938, 9.338244438171387, 10.247549057006836, 11.156852722167969, 12.066157341003418, 12.975461959838867, 13.884766578674316, 14.794071197509766, 15.703374862670898, 16.61267852783203, 17.521984100341797, 18.43128776550293, 19.340593338012695, 20.249897003173828, 21.159202575683594, 22.068506240844727, 22.97780990600586, 23.887113571166992, 24.796419143676758, 25.70572280883789, 26.615028381347656, 27.52433204650879, 28.433635711669922, 29.342941284179688, 30.252246856689453, 31.161550521850586, 32.07085418701172, 32.980159759521484, 33.88946533203125, 34.79876708984375, 35.708072662353516, 36.61737823486328, 37.52667999267578, 38.43598556518555, 39.34528732299805, 40.25459289550781, 41.16389846801758, 42.073204040527344, 42.982505798339844, 43.89181137084961, 44.801116943359375]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 15.0, 7.0, 11.0, 25.0, 19.0, 26.0, 30.0, 37.0, 48.0, 77.0, 62.0, 70.0, 63.0, 62.0, 55.0, 64.0, 51.0, 48.0, 41.0, 36.0, 39.0, 27.0, 27.0, 10.0, 14.0, 8.0, 5.0, 12.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-4.737126350402832, -4.609360694885254, -4.481595039367676, -4.3538289070129395, -4.226063251495361, -4.098297595977783, -3.970531702041626, -3.8427658081054688, -3.7150001525878906, -3.5872344970703125, -3.4594686031341553, -3.331702709197998, -3.20393705368042, -3.076171398162842, -2.9484055042266846, -2.8206396102905273, -2.692873954772949, -2.565108299255371, -2.437342405319214, -2.3095765113830566, -2.1818108558654785, -2.0540452003479004, -1.9262793064117432, -1.7985135316848755, -1.6707477569580078, -1.5429819822311401, -1.4152162075042725, -1.2874504327774048, -1.159684658050537, -1.0319188833236694, -0.9041531085968018, -0.7763873338699341, -0.6486215591430664, -0.5208557844161987, -0.39309000968933105, -0.2653242349624634, -0.1375584602355957, -0.009792685508728027, 0.11797308921813965, 0.24573886394500732, 0.373504638671875, 0.5012704133987427, 0.6290361881256104, 0.756801962852478, 0.8845677375793457, 1.0123335123062134, 1.140099287033081, 1.2678650617599487, 1.3956308364868164, 1.523396611213684, 1.6511623859405518, 1.7789281606674194, 1.906693935394287, 2.0344595909118652, 2.1622254848480225, 2.2899913787841797, 2.417757034301758, 2.545522689819336, 2.673288583755493, 2.8010544776916504, 2.9288201332092285, 3.0565857887268066, 3.184351682662964, 3.312117576599121, 3.439883232116699]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 6.0, 3.0, 11.0, 8.0, 3.0, 17.0, 17.0, 14.0, 15.0, 15.0, 18.0, 21.0, 34.0, 22.0, 38.0, 46.0, 39.0, 37.0, 30.0, 35.0, 49.0, 51.0, 37.0, 36.0, 41.0, 44.0, 49.0, 37.0, 25.0, 31.0, 28.0, 25.0, 19.0, 15.0, 17.0, 13.0, 16.0, 7.0, 4.0, 5.0, 3.0, 5.0, 3.0, 5.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.6875, -2.608978271484375, -2.53045654296875, -2.451934814453125, -2.3734130859375, -2.294891357421875, -2.21636962890625, -2.137847900390625, -2.059326171875, -1.980804443359375, -1.90228271484375, -1.823760986328125, -1.7452392578125, -1.666717529296875, -1.58819580078125, -1.509674072265625, -1.43115234375, -1.352630615234375, -1.27410888671875, -1.195587158203125, -1.1170654296875, -1.038543701171875, -0.96002197265625, -0.881500244140625, -0.802978515625, -0.724456787109375, -0.64593505859375, -0.567413330078125, -0.4888916015625, -0.410369873046875, -0.33184814453125, -0.253326416015625, -0.1748046875, -0.096282958984375, -0.01776123046875, 0.060760498046875, 0.1392822265625, 0.217803955078125, 0.29632568359375, 0.374847412109375, 0.453369140625, 0.531890869140625, 0.61041259765625, 0.688934326171875, 0.7674560546875, 0.845977783203125, 0.92449951171875, 1.003021240234375, 1.08154296875, 1.160064697265625, 1.23858642578125, 1.317108154296875, 1.3956298828125, 1.474151611328125, 1.55267333984375, 1.631195068359375, 1.709716796875, 1.788238525390625, 1.86676025390625, 1.945281982421875, 2.0238037109375, 2.102325439453125, 2.18084716796875, 2.259368896484375, 2.337890625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 1.0, 6.0, 4.0, 11.0, 11.0, 21.0, 33.0, 57.0, 81.0, 160.0, 246.0, 476.0, 795.0, 1507.0, 2921.0, 5953.0, 13277.0, 31574.0, 83497.0, 213307.0, 344897.0, 210443.0, 82299.0, 31251.0, 13182.0, 6039.0, 3040.0, 1500.0, 847.0, 471.0, 247.0, 134.0, 90.0, 69.0, 41.0, 23.0, 22.0, 8.0, 8.0, 1.0, 9.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.671875, -6.4200439453125, -6.168212890625, -5.9163818359375, -5.66455078125, -5.4127197265625, -5.160888671875, -4.9090576171875, -4.6572265625, -4.4053955078125, -4.153564453125, -3.9017333984375, -3.64990234375, -3.3980712890625, -3.146240234375, -2.8944091796875, -2.642578125, -2.3907470703125, -2.138916015625, -1.8870849609375, -1.63525390625, -1.3834228515625, -1.131591796875, -0.8797607421875, -0.6279296875, -0.3760986328125, -0.124267578125, 0.1275634765625, 0.37939453125, 0.6312255859375, 0.883056640625, 1.1348876953125, 1.38671875, 1.6385498046875, 1.890380859375, 2.1422119140625, 2.39404296875, 2.6458740234375, 2.897705078125, 3.1495361328125, 3.4013671875, 3.6531982421875, 3.905029296875, 4.1568603515625, 4.40869140625, 4.6605224609375, 4.912353515625, 5.1641845703125, 5.416015625, 5.6678466796875, 5.919677734375, 6.1715087890625, 6.42333984375, 6.6751708984375, 6.927001953125, 7.1788330078125, 7.4306640625, 7.6824951171875, 7.934326171875, 8.1861572265625, 8.43798828125, 8.6898193359375, 8.941650390625, 9.1934814453125, 9.4453125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 6.0, 12.0, 7.0, 7.0, 7.0, 23.0, 24.0, 24.0, 20.0, 22.0, 20.0, 32.0, 36.0, 54.0, 61.0, 87.0, 122.0, 188.0, 1384.0, 249.0, 166.0, 88.0, 82.0, 52.0, 49.0, 33.0, 36.0, 33.0, 15.0, 15.0, 16.0, 16.0, 17.0, 7.0, 12.0, 6.0, 8.0, 8.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.859375, -9.549072265625, -9.23876953125, -8.928466796875, -8.6181640625, -8.307861328125, -7.99755859375, -7.687255859375, -7.376953125, -7.066650390625, -6.75634765625, -6.446044921875, -6.1357421875, -5.825439453125, -5.51513671875, -5.204833984375, -4.89453125, -4.584228515625, -4.27392578125, -3.963623046875, -3.6533203125, -3.343017578125, -3.03271484375, -2.722412109375, -2.412109375, -2.101806640625, -1.79150390625, -1.481201171875, -1.1708984375, -0.860595703125, -0.55029296875, -0.239990234375, 0.0703125, 0.380615234375, 0.69091796875, 1.001220703125, 1.3115234375, 1.621826171875, 1.93212890625, 2.242431640625, 2.552734375, 2.863037109375, 3.17333984375, 3.483642578125, 3.7939453125, 4.104248046875, 4.41455078125, 4.724853515625, 5.03515625, 5.345458984375, 5.65576171875, 5.966064453125, 6.2763671875, 6.586669921875, 6.89697265625, 7.207275390625, 7.517578125, 7.827880859375, 8.13818359375, 8.448486328125, 8.7587890625, 9.069091796875, 9.37939453125, 9.689697265625, 10.0]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 6.0, 7.0, 12.0, 10.0, 9.0, 12.0, 7.0, 19.0, 18.0, 22.0, 29.0, 30.0, 48.0, 58.0, 137.0, 280.0, 1554.0, 58338.0, 2927578.0, 154272.0, 2469.0, 349.0, 121.0, 74.0, 44.0, 32.0, 25.0, 21.0, 19.0, 11.0, 18.0, 20.0, 9.0, 13.0, 10.0, 6.0, 6.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.78125, -40.53759765625, -39.2939453125, -38.05029296875, -36.806640625, -35.56298828125, -34.3193359375, -33.07568359375, -31.83203125, -30.58837890625, -29.3447265625, -28.10107421875, -26.857421875, -25.61376953125, -24.3701171875, -23.12646484375, -21.8828125, -20.63916015625, -19.3955078125, -18.15185546875, -16.908203125, -15.66455078125, -14.4208984375, -13.17724609375, -11.93359375, -10.68994140625, -9.4462890625, -8.20263671875, -6.958984375, -5.71533203125, -4.4716796875, -3.22802734375, -1.984375, -0.74072265625, 0.5029296875, 1.74658203125, 2.990234375, 4.23388671875, 5.4775390625, 6.72119140625, 7.96484375, 9.20849609375, 10.4521484375, 11.69580078125, 12.939453125, 14.18310546875, 15.4267578125, 16.67041015625, 17.9140625, 19.15771484375, 20.4013671875, 21.64501953125, 22.888671875, 24.13232421875, 25.3759765625, 26.61962890625, 27.86328125, 29.10693359375, 30.3505859375, 31.59423828125, 32.837890625, 34.08154296875, 35.3251953125, 36.56884765625, 37.8125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 56.0, 474.0, 432.0, 47.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-110.408447265625, -106.14456176757812, -101.88067626953125, -97.61679077148438, -93.3529052734375, -89.08901977539062, -84.82514190673828, -80.5612564086914, -76.29737091064453, -72.03348541259766, -67.76959991455078, -63.50571823120117, -59.2418327331543, -54.97794723510742, -50.71406555175781, -46.45018005371094, -42.18629455566406, -37.92240905761719, -33.65852355957031, -29.394641876220703, -25.130756378173828, -20.866870880126953, -16.60298728942871, -12.339103698730469, -8.075218200683594, -3.811333656311035, 0.45255088806152344, 4.716435432434082, 8.98031997680664, 13.244205474853516, 17.508089065551758, 21.77197265625, 26.035858154296875, 30.29974365234375, 34.563629150390625, 38.827510833740234, 43.09139633178711, 47.355281829833984, 51.619163513183594, 55.88304901123047, 60.146934509277344, 64.41082000732422, 68.6747055053711, 72.93859100341797, 77.20246887207031, 81.46635437011719, 85.73023986816406, 89.99412536621094, 94.25801086425781, 98.52189636230469, 102.78578186035156, 107.04966735839844, 111.31355285644531, 115.57743835449219, 119.84131622314453, 124.1052017211914, 128.36907958984375, 132.63296508789062, 136.8968505859375, 141.16073608398438, 145.42462158203125, 149.68850708007812, 153.952392578125, 158.21627807617188, 162.48016357421875]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 5.0, 6.0, 8.0, 6.0, 8.0, 15.0, 16.0, 24.0, 20.0, 36.0, 26.0, 28.0, 26.0, 17.0, 28.0, 29.0, 38.0, 30.0, 28.0, 44.0, 42.0, 43.0, 48.0, 31.0, 41.0, 34.0, 33.0, 26.0, 27.0, 28.0, 23.0, 30.0, 17.0, 14.0, 19.0, 14.0, 7.0, 12.0, 9.0, 16.0, 10.0, 11.0, 3.0, 8.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-31.76959991455078, -30.880353927612305, -29.991107940673828, -29.10186195373535, -28.212615966796875, -27.32337188720703, -26.434125900268555, -25.544879913330078, -24.6556339263916, -23.766387939453125, -22.87714195251465, -21.987895965576172, -21.098651885986328, -20.20940399169922, -19.320159912109375, -18.4309139251709, -17.541667938232422, -16.652421951293945, -15.763175964355469, -14.873930931091309, -13.984684944152832, -13.095438957214355, -12.206193923950195, -11.316947937011719, -10.427701950073242, -9.538455963134766, -8.649209976196289, -7.759964942932129, -6.870718955993652, -5.981472969055176, -5.092227458953857, -4.202981948852539, -3.3137340545654297, -2.4244883060455322, -1.5352425575256348, -0.6459968090057373, 0.24324893951416016, 1.1324949264526367, 2.021740436553955, 2.9109859466552734, 3.80023193359375, 4.689477920532227, 5.578723430633545, 6.467968940734863, 7.35721492767334, 8.246460914611816, 9.135705947875977, 10.024951934814453, 10.91419792175293, 11.803443908691406, 12.692689895629883, 13.581934928894043, 14.47118091583252, 15.360426902770996, 16.249671936035156, 17.138917922973633, 18.02816390991211, 18.917409896850586, 19.806655883789062, 20.69590187072754, 21.585147857666016, 22.47439193725586, 23.363637924194336, 24.252883911132812, 25.14212989807129]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 11.0, 7.0, 10.0, 13.0, 15.0, 18.0, 26.0, 22.0, 31.0, 25.0, 27.0, 32.0, 39.0, 31.0, 36.0, 43.0, 41.0, 36.0, 43.0, 52.0, 25.0, 36.0, 29.0, 48.0, 43.0, 39.0, 23.0, 30.0, 14.0, 13.0, 19.0, 23.0, 12.0, 8.0, 11.0, 9.0, 11.0, 8.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.6015625, -2.52001953125, -2.4384765625, -2.35693359375, -2.275390625, -2.19384765625, -2.1123046875, -2.03076171875, -1.94921875, -1.86767578125, -1.7861328125, -1.70458984375, -1.623046875, -1.54150390625, -1.4599609375, -1.37841796875, -1.296875, -1.21533203125, -1.1337890625, -1.05224609375, -0.970703125, -0.88916015625, -0.8076171875, -0.72607421875, -0.64453125, -0.56298828125, -0.4814453125, -0.39990234375, -0.318359375, -0.23681640625, -0.1552734375, -0.07373046875, 0.0078125, 0.08935546875, 0.1708984375, 0.25244140625, 0.333984375, 0.41552734375, 0.4970703125, 0.57861328125, 0.66015625, 0.74169921875, 0.8232421875, 0.90478515625, 0.986328125, 1.06787109375, 1.1494140625, 1.23095703125, 1.3125, 1.39404296875, 1.4755859375, 1.55712890625, 1.638671875, 1.72021484375, 1.8017578125, 1.88330078125, 1.96484375, 2.04638671875, 2.1279296875, 2.20947265625, 2.291015625, 2.37255859375, 2.4541015625, 2.53564453125, 2.6171875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 0.0, 5.0, 2.0, 8.0, 13.0, 10.0, 15.0, 24.0, 31.0, 55.0, 59.0, 100.0, 136.0, 235.0, 383.0, 688.0, 1098.0, 2099.0, 3961.0, 8820.0, 21403.0, 62163.0, 235374.0, 1606615.0, 1864923.0, 276418.0, 69950.0, 22872.0, 8813.0, 3844.0, 1830.0, 979.0, 549.0, 313.0, 188.0, 111.0, 64.0, 46.0, 31.0, 17.0, 17.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.984375, -11.65185546875, -11.3193359375, -10.98681640625, -10.654296875, -10.32177734375, -9.9892578125, -9.65673828125, -9.32421875, -8.99169921875, -8.6591796875, -8.32666015625, -7.994140625, -7.66162109375, -7.3291015625, -6.99658203125, -6.6640625, -6.33154296875, -5.9990234375, -5.66650390625, -5.333984375, -5.00146484375, -4.6689453125, -4.33642578125, -4.00390625, -3.67138671875, -3.3388671875, -3.00634765625, -2.673828125, -2.34130859375, -2.0087890625, -1.67626953125, -1.34375, -1.01123046875, -0.6787109375, -0.34619140625, -0.013671875, 0.31884765625, 0.6513671875, 0.98388671875, 1.31640625, 1.64892578125, 1.9814453125, 2.31396484375, 2.646484375, 2.97900390625, 3.3115234375, 3.64404296875, 3.9765625, 4.30908203125, 4.6416015625, 4.97412109375, 5.306640625, 5.63916015625, 5.9716796875, 6.30419921875, 6.63671875, 6.96923828125, 7.3017578125, 7.63427734375, 7.966796875, 8.29931640625, 8.6318359375, 8.96435546875, 9.296875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 7.0, 6.0, 4.0, 10.0, 12.0, 18.0, 19.0, 23.0, 41.0, 50.0, 69.0, 84.0, 115.0, 137.0, 209.0, 296.0, 351.0, 517.0, 496.0, 408.0, 329.0, 204.0, 158.0, 128.0, 92.0, 83.0, 49.0, 44.0, 28.0, 13.0, 18.0, 14.0, 9.0, 8.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.171875, -9.845703125, -9.51953125, -9.193359375, -8.8671875, -8.541015625, -8.21484375, -7.888671875, -7.5625, -7.236328125, -6.91015625, -6.583984375, -6.2578125, -5.931640625, -5.60546875, -5.279296875, -4.953125, -4.626953125, -4.30078125, -3.974609375, -3.6484375, -3.322265625, -2.99609375, -2.669921875, -2.34375, -2.017578125, -1.69140625, -1.365234375, -1.0390625, -0.712890625, -0.38671875, -0.060546875, 0.265625, 0.591796875, 0.91796875, 1.244140625, 1.5703125, 1.896484375, 2.22265625, 2.548828125, 2.875, 3.201171875, 3.52734375, 3.853515625, 4.1796875, 4.505859375, 4.83203125, 5.158203125, 5.484375, 5.810546875, 6.13671875, 6.462890625, 6.7890625, 7.115234375, 7.44140625, 7.767578125, 8.09375, 8.419921875, 8.74609375, 9.072265625, 9.3984375, 9.724609375, 10.05078125, 10.376953125, 10.703125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 15.0, 24.0, 39.0, 63.0, 94.0, 152.0, 283.0, 411.0, 701.0, 1189.0, 2078.0, 3883.0, 7633.0, 16820.0, 41409.0, 123494.0, 465314.0, 1974284.0, 1166093.0, 260931.0, 76620.0, 28024.0, 11777.0, 5792.0, 3001.0, 1715.0, 948.0, 587.0, 357.0, 209.0, 133.0, 67.0, 55.0, 35.0, 23.0, 11.0, 12.0, 5.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.09375, -14.569580078125, -14.04541015625, -13.521240234375, -12.9970703125, -12.472900390625, -11.94873046875, -11.424560546875, -10.900390625, -10.376220703125, -9.85205078125, -9.327880859375, -8.8037109375, -8.279541015625, -7.75537109375, -7.231201171875, -6.70703125, -6.182861328125, -5.65869140625, -5.134521484375, -4.6103515625, -4.086181640625, -3.56201171875, -3.037841796875, -2.513671875, -1.989501953125, -1.46533203125, -0.941162109375, -0.4169921875, 0.107177734375, 0.63134765625, 1.155517578125, 1.6796875, 2.203857421875, 2.72802734375, 3.252197265625, 3.7763671875, 4.300537109375, 4.82470703125, 5.348876953125, 5.873046875, 6.397216796875, 6.92138671875, 7.445556640625, 7.9697265625, 8.493896484375, 9.01806640625, 9.542236328125, 10.06640625, 10.590576171875, 11.11474609375, 11.638916015625, 12.1630859375, 12.687255859375, 13.21142578125, 13.735595703125, 14.259765625, 14.783935546875, 15.30810546875, 15.832275390625, 16.3564453125, 16.880615234375, 17.40478515625, 17.928955078125, 18.453125]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 13.0, 14.0, 19.0, 41.0, 80.0, 107.0, 135.0, 164.0, 158.0, 94.0, 84.0, 42.0, 27.0, 18.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-124.5372085571289, -122.02279663085938, -119.50839233398438, -116.99398040771484, -114.47957611083984, -111.96516418457031, -109.45075988769531, -106.93634796142578, -104.42193603515625, -101.90752410888672, -99.39311981201172, -96.87870788574219, -94.36430358886719, -91.84989166259766, -89.33547973632812, -86.82107543945312, -84.30667114257812, -81.7922592163086, -79.2778549194336, -76.76344299316406, -74.24903869628906, -71.73462677001953, -69.22021484375, -66.705810546875, -64.19139862060547, -61.6769905090332, -59.16258239746094, -56.648170471191406, -54.13376235961914, -51.619354248046875, -49.10494613647461, -46.590538024902344, -44.07612609863281, -41.56171798706055, -39.04730987548828, -36.53289794921875, -34.018489837646484, -31.50408172607422, -28.989673614501953, -26.475263595581055, -23.96085548400879, -21.446447372436523, -18.932037353515625, -16.41762924194336, -13.903220176696777, -11.388811111450195, -8.87440299987793, -6.359992980957031, -3.8455848693847656, -1.3311760425567627, 1.1832327842712402, 3.697641372680664, 6.212050437927246, 8.726459503173828, 11.240867614746094, 13.755277633666992, 16.269685745239258, 18.784093856811523, 21.298503875732422, 23.812911987304688, 26.327320098876953, 28.84173011779785, 31.356138229370117, 33.870548248291016, 36.38495635986328]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 8.0, 9.0, 9.0, 7.0, 16.0, 16.0, 16.0, 27.0, 27.0, 24.0, 30.0, 43.0, 28.0, 41.0, 51.0, 46.0, 51.0, 45.0, 49.0, 58.0, 40.0, 31.0, 42.0, 41.0, 28.0, 28.0, 30.0, 27.0, 17.0, 16.0, 15.0, 14.0, 20.0, 12.0, 4.0, 8.0, 4.0, 5.0, 6.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-44.59584045410156, -43.37046813964844, -42.14509582519531, -40.91972351074219, -39.69435119628906, -38.46897888183594, -37.24360656738281, -36.01823043823242, -34.7928581237793, -33.56748580932617, -32.34211349487305, -31.116741180419922, -29.891366958618164, -28.66599464416504, -27.440622329711914, -26.215248107910156, -24.989877700805664, -23.76450538635254, -22.539133071899414, -21.313758850097656, -20.08838653564453, -18.863014221191406, -17.63764190673828, -16.412269592285156, -15.186896324157715, -13.96152400970459, -12.736150741577148, -11.510778427124023, -10.285406112670898, -9.060032844543457, -7.834660530090332, -6.609287261962891, -5.383914947509766, -4.158542156219482, -2.9331696033477783, -1.7077970504760742, -0.482424259185791, 0.7429485321044922, 1.9683208465576172, 3.1936941146850586, 4.419066429138184, 5.644439220428467, 6.86981201171875, 8.095184326171875, 9.320556640625, 10.545929908752441, 11.771302223205566, 12.996675491333008, 14.222047805786133, 15.447420120239258, 16.672792434692383, 17.89816665649414, 19.123538970947266, 20.34891128540039, 21.574283599853516, 22.79965591430664, 24.025028228759766, 25.25040054321289, 26.475772857666016, 27.70114517211914, 28.9265193939209, 30.151891708374023, 31.37726402282715, 32.602638244628906, 33.82801055908203]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 4.0, 7.0, 13.0, 19.0, 13.0, 14.0, 25.0, 17.0, 24.0, 34.0, 34.0, 36.0, 35.0, 33.0, 41.0, 52.0, 32.0, 53.0, 46.0, 50.0, 50.0, 46.0, 49.0, 40.0, 32.0, 28.0, 32.0, 25.0, 26.0, 15.0, 18.0, 14.0, 8.0, 9.0, 1.0, 6.0, 4.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0078125, -2.90277099609375, -2.7977294921875, -2.69268798828125, -2.587646484375, -2.48260498046875, -2.3775634765625, -2.27252197265625, -2.16748046875, -2.06243896484375, -1.9573974609375, -1.85235595703125, -1.747314453125, -1.64227294921875, -1.5372314453125, -1.43218994140625, -1.3271484375, -1.22210693359375, -1.1170654296875, -1.01202392578125, -0.906982421875, -0.80194091796875, -0.6968994140625, -0.59185791015625, -0.48681640625, -0.38177490234375, -0.2767333984375, -0.17169189453125, -0.066650390625, 0.03839111328125, 0.1434326171875, 0.24847412109375, 0.353515625, 0.45855712890625, 0.5635986328125, 0.66864013671875, 0.773681640625, 0.87872314453125, 0.9837646484375, 1.08880615234375, 1.19384765625, 1.29888916015625, 1.4039306640625, 1.50897216796875, 1.614013671875, 1.71905517578125, 1.8240966796875, 1.92913818359375, 2.0341796875, 2.13922119140625, 2.2442626953125, 2.34930419921875, 2.454345703125, 2.55938720703125, 2.6644287109375, 2.76947021484375, 2.87451171875, 2.97955322265625, 3.0845947265625, 3.18963623046875, 3.294677734375, 3.39971923828125, 3.5047607421875, 3.60980224609375, 3.71484375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 4.0, 3.0, 10.0, 9.0, 20.0, 24.0, 45.0, 78.0, 91.0, 162.0, 211.0, 370.0, 606.0, 1055.0, 1774.0, 2822.0, 4877.0, 8851.0, 17439.0, 41482.0, 136036.0, 497439.0, 227094.0, 59743.0, 22784.0, 10937.0, 5885.0, 3387.0, 2015.0, 1291.0, 760.0, 477.0, 274.0, 175.0, 119.0, 73.0, 46.0, 28.0, 26.0, 11.0, 5.0, 6.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.390625, -10.08203125, -9.7734375, -9.46484375, -9.15625, -8.84765625, -8.5390625, -8.23046875, -7.921875, -7.61328125, -7.3046875, -6.99609375, -6.6875, -6.37890625, -6.0703125, -5.76171875, -5.453125, -5.14453125, -4.8359375, -4.52734375, -4.21875, -3.91015625, -3.6015625, -3.29296875, -2.984375, -2.67578125, -2.3671875, -2.05859375, -1.75, -1.44140625, -1.1328125, -0.82421875, -0.515625, -0.20703125, 0.1015625, 0.41015625, 0.71875, 1.02734375, 1.3359375, 1.64453125, 1.953125, 2.26171875, 2.5703125, 2.87890625, 3.1875, 3.49609375, 3.8046875, 4.11328125, 4.421875, 4.73046875, 5.0390625, 5.34765625, 5.65625, 5.96484375, 6.2734375, 6.58203125, 6.890625, 7.19921875, 7.5078125, 7.81640625, 8.125, 8.43359375, 8.7421875, 9.05078125, 9.359375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 3.0, 9.0, 11.0, 11.0, 17.0, 12.0, 18.0, 12.0, 15.0, 19.0, 41.0, 27.0, 31.0, 25.0, 35.0, 45.0, 29.0, 43.0, 45.0, 1067.0, 36.0, 51.0, 31.0, 38.0, 38.0, 38.0, 23.0, 30.0, 33.0, 26.0, 33.0, 17.0, 18.0, 16.0, 15.0, 14.0, 13.0, 10.0, 7.0, 9.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.552734375, -2.4749755859375, -2.397216796875, -2.3194580078125, -2.24169921875, -2.1639404296875, -2.086181640625, -2.0084228515625, -1.9306640625, -1.8529052734375, -1.775146484375, -1.6973876953125, -1.61962890625, -1.5418701171875, -1.464111328125, -1.3863525390625, -1.30859375, -1.2308349609375, -1.153076171875, -1.0753173828125, -0.99755859375, -0.9197998046875, -0.842041015625, -0.7642822265625, -0.6865234375, -0.6087646484375, -0.531005859375, -0.4532470703125, -0.37548828125, -0.2977294921875, -0.219970703125, -0.1422119140625, -0.064453125, 0.0133056640625, 0.091064453125, 0.1688232421875, 0.24658203125, 0.3243408203125, 0.402099609375, 0.4798583984375, 0.5576171875, 0.6353759765625, 0.713134765625, 0.7908935546875, 0.86865234375, 0.9464111328125, 1.024169921875, 1.1019287109375, 1.1796875, 1.2574462890625, 1.335205078125, 1.4129638671875, 1.49072265625, 1.5684814453125, 1.646240234375, 1.7239990234375, 1.8017578125, 1.8795166015625, 1.957275390625, 2.0350341796875, 2.11279296875, 2.1905517578125, 2.268310546875, 2.3460693359375, 2.423828125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 5.0, 6.0, 4.0, 14.0, 23.0, 26.0, 46.0, 73.0, 76.0, 135.0, 186.0, 246.0, 401.0, 568.0, 1030.0, 1920.0, 4403.0, 16184.0, 149692.0, 1819296.0, 83214.0, 11819.0, 3703.0, 1692.0, 864.0, 501.0, 314.0, 198.0, 151.0, 96.0, 78.0, 46.0, 40.0, 23.0, 13.0, 14.0, 10.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.921875, -13.4921875, -13.0625, -12.6328125, -12.203125, -11.7734375, -11.34375, -10.9140625, -10.484375, -10.0546875, -9.625, -9.1953125, -8.765625, -8.3359375, -7.90625, -7.4765625, -7.046875, -6.6171875, -6.1875, -5.7578125, -5.328125, -4.8984375, -4.46875, -4.0390625, -3.609375, -3.1796875, -2.75, -2.3203125, -1.890625, -1.4609375, -1.03125, -0.6015625, -0.171875, 0.2578125, 0.6875, 1.1171875, 1.546875, 1.9765625, 2.40625, 2.8359375, 3.265625, 3.6953125, 4.125, 4.5546875, 4.984375, 5.4140625, 5.84375, 6.2734375, 6.703125, 7.1328125, 7.5625, 7.9921875, 8.421875, 8.8515625, 9.28125, 9.7109375, 10.140625, 10.5703125, 11.0, 11.4296875, 11.859375, 12.2890625, 12.71875, 13.1484375, 13.578125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 8.0, 9.0, 19.0, 24.0, 140.0, 602.0, 117.0, 25.0, 17.0, 11.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.66796875, -6.4622802734375, -6.256591796875, -6.0509033203125, -5.84521484375, -5.6395263671875, -5.433837890625, -5.2281494140625, -5.0224609375, -4.8167724609375, -4.611083984375, -4.4053955078125, -4.19970703125, -3.9940185546875, -3.788330078125, -3.5826416015625, -3.376953125, -3.1712646484375, -2.965576171875, -2.7598876953125, -2.55419921875, -2.3485107421875, -2.142822265625, -1.9371337890625, -1.7314453125, -1.5257568359375, -1.320068359375, -1.1143798828125, -0.90869140625, -0.7030029296875, -0.497314453125, -0.2916259765625, -0.0859375, 0.1197509765625, 0.325439453125, 0.5311279296875, 0.73681640625, 0.9425048828125, 1.148193359375, 1.3538818359375, 1.5595703125, 1.7652587890625, 1.970947265625, 2.1766357421875, 2.38232421875, 2.5880126953125, 2.793701171875, 2.9993896484375, 3.205078125, 3.4107666015625, 3.616455078125, 3.8221435546875, 4.02783203125, 4.2335205078125, 4.439208984375, 4.6448974609375, 4.8505859375, 5.0562744140625, 5.261962890625, 5.4676513671875, 5.67333984375, 5.8790283203125, 6.084716796875, 6.2904052734375, 6.49609375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 9.0, 7.0, 0.0, 3.0, 5.0, 1.0, 6.0, 9.0, 10.0, 2.0, 9.0, 27.0, 65.0, 161.0, 630.0, 2588.0, 10851.0, 1020715.0, 10157.0, 2408.0, 583.0, 156.0, 57.0, 22.0, 9.0, 2.0, 15.0, 10.0, 1.0, 1.0, 3.0, 5.0, 4.0, 7.0, 5.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0], "bins": [-84.9375, -82.400390625, -79.86328125, -77.326171875, -74.7890625, -72.251953125, -69.71484375, -67.177734375, -64.640625, -62.103515625, -59.56640625, -57.029296875, -54.4921875, -51.955078125, -49.41796875, -46.880859375, -44.34375, -41.806640625, -39.26953125, -36.732421875, -34.1953125, -31.658203125, -29.12109375, -26.583984375, -24.046875, -21.509765625, -18.97265625, -16.435546875, -13.8984375, -11.361328125, -8.82421875, -6.287109375, -3.75, -1.212890625, 1.32421875, 3.861328125, 6.3984375, 8.935546875, 11.47265625, 14.009765625, 16.546875, 19.083984375, 21.62109375, 24.158203125, 26.6953125, 29.232421875, 31.76953125, 34.306640625, 36.84375, 39.380859375, 41.91796875, 44.455078125, 46.9921875, 49.529296875, 52.06640625, 54.603515625, 57.140625, 59.677734375, 62.21484375, 64.751953125, 67.2890625, 69.826171875, 72.36328125, 74.900390625, 77.4375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 16.0, 61.0, 219.0, 518.0, 124.0, 55.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.187665939331055, -15.46308708190918, -14.738507270812988, -14.013927459716797, -13.289348602294922, -12.564769744873047, -11.840189933776855, -11.115610122680664, -10.391031265258789, -9.666452407836914, -8.941872596740723, -8.217292785644531, -7.492713928222656, -6.768134593963623, -6.04355525970459, -5.318975925445557, -4.594396591186523, -3.8698172569274902, -3.145237922668457, -2.420658588409424, -1.6960792541503906, -0.9714999198913574, -0.24692058563232422, 0.477658748626709, 1.2022380828857422, 1.9268174171447754, 2.6513967514038086, 3.375976085662842, 4.100555419921875, 4.825134754180908, 5.549714088439941, 6.274293422698975, 6.998872756958008, 7.723452091217041, 8.448031425476074, 9.172611236572266, 9.89719009399414, 10.621768951416016, 11.346348762512207, 12.070928573608398, 12.795507431030273, 13.520086288452148, 14.24466609954834, 14.969245910644531, 15.693824768066406, 16.41840362548828, 17.142982482910156, 17.867563247680664, 18.59214210510254, 19.316720962524414, 20.041301727294922, 20.765880584716797, 21.490459442138672, 22.215038299560547, 22.939617156982422, 23.66419792175293, 24.388776779174805, 25.11335563659668, 25.837936401367188, 26.562515258789062, 27.287094116210938, 28.011672973632812, 28.736251831054688, 29.460832595825195, 30.18541145324707]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 6.0, 10.0, 14.0, 8.0, 20.0, 19.0, 27.0, 28.0, 30.0, 37.0, 27.0, 36.0, 45.0, 53.0, 59.0, 45.0, 41.0, 51.0, 39.0, 63.0, 42.0, 43.0, 35.0, 42.0, 29.0, 27.0, 27.0, 14.0, 10.0, 21.0, 8.0, 9.0, 11.0, 10.0, 2.0, 7.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.625494956970215, -4.48131799697876, -4.337141036987305, -4.19296407699585, -4.0487871170043945, -3.9046099185943604, -3.760432720184326, -3.616255760192871, -3.472078800201416, -3.327901840209961, -3.183724880218506, -3.0395476818084717, -2.8953707218170166, -2.7511937618255615, -2.6070165634155273, -2.4628396034240723, -2.318662643432617, -2.174485683441162, -2.030308723449707, -1.8861315250396729, -1.7419545650482178, -1.5977776050567627, -1.453600525856018, -1.3094234466552734, -1.1652464866638184, -1.0210695266723633, -0.8768924474716187, -0.7327154278755188, -0.588538408279419, -0.4443613886833191, -0.30018436908721924, -0.1560072898864746, -0.011830329895019531, 0.13234668970108032, 0.2765237092971802, 0.42070072889328003, 0.5648777484893799, 0.7090547680854797, 0.8532317876815796, 0.9974088668823242, 1.1415858268737793, 1.2857627868652344, 1.429939866065979, 1.5741169452667236, 1.7182939052581787, 1.8624708652496338, 2.006648063659668, 2.150825023651123, 2.295001983642578, 2.439178943634033, 2.5833559036254883, 2.7275331020355225, 2.8717100620269775, 3.0158870220184326, 3.160064220428467, 3.304241180419922, 3.448418140411377, 3.592595100402832, 3.736772060394287, 3.8809492588043213, 4.0251264572143555, 4.1693034172058105, 4.313480377197266, 4.457657337188721, 4.601834297180176]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 10.0, 10.0, 21.0, 15.0, 23.0, 28.0, 20.0, 30.0, 33.0, 34.0, 32.0, 40.0, 38.0, 37.0, 46.0, 41.0, 45.0, 43.0, 37.0, 44.0, 56.0, 49.0, 37.0, 29.0, 39.0, 30.0, 26.0, 11.0, 15.0, 11.0, 11.0, 7.0, 8.0, 5.0, 3.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83984375, -2.738037109375, -2.63623046875, -2.534423828125, -2.4326171875, -2.330810546875, -2.22900390625, -2.127197265625, -2.025390625, -1.923583984375, -1.82177734375, -1.719970703125, -1.6181640625, -1.516357421875, -1.41455078125, -1.312744140625, -1.2109375, -1.109130859375, -1.00732421875, -0.905517578125, -0.8037109375, -0.701904296875, -0.60009765625, -0.498291015625, -0.396484375, -0.294677734375, -0.19287109375, -0.091064453125, 0.0107421875, 0.112548828125, 0.21435546875, 0.316162109375, 0.41796875, 0.519775390625, 0.62158203125, 0.723388671875, 0.8251953125, 0.927001953125, 1.02880859375, 1.130615234375, 1.232421875, 1.334228515625, 1.43603515625, 1.537841796875, 1.6396484375, 1.741455078125, 1.84326171875, 1.945068359375, 2.046875, 2.148681640625, 2.25048828125, 2.352294921875, 2.4541015625, 2.555908203125, 2.65771484375, 2.759521484375, 2.861328125, 2.963134765625, 3.06494140625, 3.166748046875, 3.2685546875, 3.370361328125, 3.47216796875, 3.573974609375, 3.67578125]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 6.0, 4.0, 5.0, 2.0, 11.0, 14.0, 20.0, 39.0, 41.0, 95.0, 170.0, 295.0, 506.0, 1132.0, 2491.0, 6409.0, 20095.0, 84010.0, 354483.0, 424190.0, 115132.0, 26131.0, 7655.0, 2896.0, 1302.0, 658.0, 315.0, 182.0, 100.0, 65.0, 30.0, 27.0, 16.0, 12.0, 6.0, 4.0, 7.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.41015625, -7.171875, -6.93359375, -6.6953125, -6.45703125, -6.21875, -5.98046875, -5.7421875, -5.50390625, -5.265625, -5.02734375, -4.7890625, -4.55078125, -4.3125, -4.07421875, -3.8359375, -3.59765625, -3.359375, -3.12109375, -2.8828125, -2.64453125, -2.40625, -2.16796875, -1.9296875, -1.69140625, -1.453125, -1.21484375, -0.9765625, -0.73828125, -0.5, -0.26171875, -0.0234375, 0.21484375, 0.453125, 0.69140625, 0.9296875, 1.16796875, 1.40625, 1.64453125, 1.8828125, 2.12109375, 2.359375, 2.59765625, 2.8359375, 3.07421875, 3.3125, 3.55078125, 3.7890625, 4.02734375, 4.265625, 4.50390625, 4.7421875, 4.98046875, 5.21875, 5.45703125, 5.6953125, 5.93359375, 6.171875, 6.41015625, 6.6484375, 6.88671875, 7.125, 7.36328125, 7.6015625, 7.83984375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 14.0, 16.0, 7.0, 9.0, 11.0, 20.0, 20.0, 17.0, 21.0, 22.0, 30.0, 34.0, 31.0, 47.0, 52.0, 72.0, 101.0, 170.0, 293.0, 1360.0, 164.0, 95.0, 81.0, 48.0, 46.0, 33.0, 37.0, 34.0, 24.0, 21.0, 19.0, 17.0, 21.0, 13.0, 5.0, 13.0, 7.0, 7.0, 6.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1640625, -11.7855224609375, -11.406982421875, -11.0284423828125, -10.64990234375, -10.2713623046875, -9.892822265625, -9.5142822265625, -9.1357421875, -8.7572021484375, -8.378662109375, -8.0001220703125, -7.62158203125, -7.2430419921875, -6.864501953125, -6.4859619140625, -6.107421875, -5.7288818359375, -5.350341796875, -4.9718017578125, -4.59326171875, -4.2147216796875, -3.836181640625, -3.4576416015625, -3.0791015625, -2.7005615234375, -2.322021484375, -1.9434814453125, -1.56494140625, -1.1864013671875, -0.807861328125, -0.4293212890625, -0.05078125, 0.3277587890625, 0.706298828125, 1.0848388671875, 1.46337890625, 1.8419189453125, 2.220458984375, 2.5989990234375, 2.9775390625, 3.3560791015625, 3.734619140625, 4.1131591796875, 4.49169921875, 4.8702392578125, 5.248779296875, 5.6273193359375, 6.005859375, 6.3843994140625, 6.762939453125, 7.1414794921875, 7.52001953125, 7.8985595703125, 8.277099609375, 8.6556396484375, 9.0341796875, 9.4127197265625, 9.791259765625, 10.1697998046875, 10.54833984375, 10.9268798828125, 11.305419921875, 11.6839599609375, 12.0625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 13.0, 9.0, 14.0, 13.0, 9.0, 17.0, 19.0, 32.0, 30.0, 46.0, 88.0, 157.0, 387.0, 921.0, 3300.0, 18265.0, 231684.0, 2528237.0, 332917.0, 23644.0, 3932.0, 1054.0, 393.0, 178.0, 98.0, 51.0, 34.0, 18.0, 26.0, 21.0, 22.0, 5.0, 12.0, 16.0, 12.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.484375, -18.866943359375, -18.24951171875, -17.632080078125, -17.0146484375, -16.397216796875, -15.77978515625, -15.162353515625, -14.544921875, -13.927490234375, -13.31005859375, -12.692626953125, -12.0751953125, -11.457763671875, -10.84033203125, -10.222900390625, -9.60546875, -8.988037109375, -8.37060546875, -7.753173828125, -7.1357421875, -6.518310546875, -5.90087890625, -5.283447265625, -4.666015625, -4.048583984375, -3.43115234375, -2.813720703125, -2.1962890625, -1.578857421875, -0.96142578125, -0.343994140625, 0.2734375, 0.890869140625, 1.50830078125, 2.125732421875, 2.7431640625, 3.360595703125, 3.97802734375, 4.595458984375, 5.212890625, 5.830322265625, 6.44775390625, 7.065185546875, 7.6826171875, 8.300048828125, 8.91748046875, 9.534912109375, 10.15234375, 10.769775390625, 11.38720703125, 12.004638671875, 12.6220703125, 13.239501953125, 13.85693359375, 14.474365234375, 15.091796875, 15.709228515625, 16.32666015625, 16.944091796875, 17.5615234375, 18.178955078125, 18.79638671875, 19.413818359375, 20.03125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 19.0, 64.0, 168.0, 285.0, 295.0, 133.0, 39.0, 13.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-106.72075653076172, -104.62381744384766, -102.52688598632812, -100.42994689941406, -98.3330078125, -96.23607635498047, -94.1391372680664, -92.04220581054688, -89.94526672363281, -87.84832763671875, -85.75139617919922, -83.65445709228516, -81.55752563476562, -79.46058654785156, -77.3636474609375, -75.26671600341797, -73.1697769165039, -71.07283782958984, -68.97590637207031, -66.87896728515625, -64.78202819824219, -62.685096740722656, -60.588157653808594, -58.4912223815918, -56.394287109375, -54.2973518371582, -52.200416564941406, -50.103477478027344, -48.00654220581055, -45.90960693359375, -43.81266784667969, -41.71573257446289, -39.61878967285156, -37.521854400634766, -35.42491912841797, -33.327980041503906, -31.23104476928711, -29.134109497070312, -27.037172317504883, -24.940235137939453, -22.84330177307129, -20.74636459350586, -18.649429321289062, -16.552494049072266, -14.455556869506836, -12.358620643615723, -10.26168441772461, -8.164748191833496, -6.067811965942383, -3.9708757400512695, -1.8739395141601562, 0.22299671173095703, 2.3199329376220703, 4.416869163513184, 6.513805389404297, 8.61074161529541, 10.707677841186523, 12.804614067077637, 14.90155029296875, 16.998485565185547, 19.095422744750977, 21.192359924316406, 23.289295196533203, 25.38623046875, 27.48316764831543]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 12.0, 3.0, 8.0, 16.0, 18.0, 22.0, 20.0, 16.0, 31.0, 26.0, 25.0, 26.0, 26.0, 32.0, 32.0, 39.0, 42.0, 34.0, 44.0, 48.0, 34.0, 40.0, 36.0, 42.0, 41.0, 30.0, 37.0, 31.0, 28.0, 27.0, 20.0, 14.0, 17.0, 16.0, 14.0, 9.0, 11.0, 6.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-38.66307830810547, -37.49760437011719, -36.33212661743164, -35.16665267944336, -34.00117874145508, -32.83570098876953, -31.67022705078125, -30.50475311279297, -29.339277267456055, -28.17380142211914, -27.00832748413086, -25.842851638793945, -24.67737579345703, -23.51190185546875, -22.346426010131836, -21.180950164794922, -20.01547622680664, -18.850000381469727, -17.684526443481445, -16.51905059814453, -15.353575706481934, -14.188100814819336, -13.022624969482422, -11.857150077819824, -10.691675186157227, -9.526200294494629, -8.360725402832031, -7.195249557495117, -6.0297746658325195, -4.864299774169922, -3.698824405670166, -2.53334903717041, -1.3678703308105469, -0.20239520072937012, 0.9630799293518066, 2.1285550594329834, 3.29403018951416, 4.459505081176758, 5.624980449676514, 6.7904558181762695, 7.955930709838867, 9.121405601501465, 10.286880493164062, 11.452356338500977, 12.617831230163574, 13.783306121826172, 14.948781967163086, 16.1142578125, 17.27973175048828, 18.445207595825195, 19.610681533813477, 20.77615737915039, 21.941631317138672, 23.107107162475586, 24.2725830078125, 25.43805694580078, 26.603532791137695, 27.76900863647461, 28.93448257446289, 30.099958419799805, 31.26543426513672, 32.430908203125, 33.59638214111328, 34.76185989379883, 35.92733383178711]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 5.0, 4.0, 3.0, 14.0, 8.0, 13.0, 21.0, 20.0, 27.0, 30.0, 24.0, 36.0, 33.0, 31.0, 30.0, 43.0, 37.0, 43.0, 58.0, 40.0, 38.0, 35.0, 53.0, 31.0, 37.0, 46.0, 26.0, 33.0, 30.0, 17.0, 16.0, 24.0, 17.0, 6.0, 12.0, 6.0, 11.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.689453125, -2.591064453125, -2.49267578125, -2.394287109375, -2.2958984375, -2.197509765625, -2.09912109375, -2.000732421875, -1.90234375, -1.803955078125, -1.70556640625, -1.607177734375, -1.5087890625, -1.410400390625, -1.31201171875, -1.213623046875, -1.115234375, -1.016845703125, -0.91845703125, -0.820068359375, -0.7216796875, -0.623291015625, -0.52490234375, -0.426513671875, -0.328125, -0.229736328125, -0.13134765625, -0.032958984375, 0.0654296875, 0.163818359375, 0.26220703125, 0.360595703125, 0.458984375, 0.557373046875, 0.65576171875, 0.754150390625, 0.8525390625, 0.950927734375, 1.04931640625, 1.147705078125, 1.24609375, 1.344482421875, 1.44287109375, 1.541259765625, 1.6396484375, 1.738037109375, 1.83642578125, 1.934814453125, 2.033203125, 2.131591796875, 2.22998046875, 2.328369140625, 2.4267578125, 2.525146484375, 2.62353515625, 2.721923828125, 2.8203125, 2.918701171875, 3.01708984375, 3.115478515625, 3.2138671875, 3.312255859375, 3.41064453125, 3.509033203125, 3.607421875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 10.0, 9.0, 4.0, 9.0, 16.0, 20.0, 26.0, 31.0, 41.0, 50.0, 81.0, 107.0, 194.0, 322.0, 649.0, 1406.0, 3205.0, 8254.0, 26159.0, 122304.0, 1373852.0, 2410021.0, 193721.0, 36169.0, 10458.0, 3909.0, 1612.0, 691.0, 323.0, 205.0, 130.0, 72.0, 45.0, 44.0, 26.0, 26.0, 15.0, 18.0, 16.0, 11.0, 7.0, 8.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.359375, -11.903564453125, -11.44775390625, -10.991943359375, -10.5361328125, -10.080322265625, -9.62451171875, -9.168701171875, -8.712890625, -8.257080078125, -7.80126953125, -7.345458984375, -6.8896484375, -6.433837890625, -5.97802734375, -5.522216796875, -5.06640625, -4.610595703125, -4.15478515625, -3.698974609375, -3.2431640625, -2.787353515625, -2.33154296875, -1.875732421875, -1.419921875, -0.964111328125, -0.50830078125, -0.052490234375, 0.4033203125, 0.859130859375, 1.31494140625, 1.770751953125, 2.2265625, 2.682373046875, 3.13818359375, 3.593994140625, 4.0498046875, 4.505615234375, 4.96142578125, 5.417236328125, 5.873046875, 6.328857421875, 6.78466796875, 7.240478515625, 7.6962890625, 8.152099609375, 8.60791015625, 9.063720703125, 9.51953125, 9.975341796875, 10.43115234375, 10.886962890625, 11.3427734375, 11.798583984375, 12.25439453125, 12.710205078125, 13.166015625, 13.621826171875, 14.07763671875, 14.533447265625, 14.9892578125, 15.445068359375, 15.90087890625, 16.356689453125, 16.8125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 8.0, 17.0, 10.0, 38.0, 41.0, 84.0, 123.0, 227.0, 394.0, 624.0, 881.0, 695.0, 399.0, 231.0, 109.0, 79.0, 46.0, 32.0, 22.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.59375, -26.009765625, -25.42578125, -24.841796875, -24.2578125, -23.673828125, -23.08984375, -22.505859375, -21.921875, -21.337890625, -20.75390625, -20.169921875, -19.5859375, -19.001953125, -18.41796875, -17.833984375, -17.25, -16.666015625, -16.08203125, -15.498046875, -14.9140625, -14.330078125, -13.74609375, -13.162109375, -12.578125, -11.994140625, -11.41015625, -10.826171875, -10.2421875, -9.658203125, -9.07421875, -8.490234375, -7.90625, -7.322265625, -6.73828125, -6.154296875, -5.5703125, -4.986328125, -4.40234375, -3.818359375, -3.234375, -2.650390625, -2.06640625, -1.482421875, -0.8984375, -0.314453125, 0.26953125, 0.853515625, 1.4375, 2.021484375, 2.60546875, 3.189453125, 3.7734375, 4.357421875, 4.94140625, 5.525390625, 6.109375, 6.693359375, 7.27734375, 7.861328125, 8.4453125, 9.029296875, 9.61328125, 10.197265625, 10.78125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 8.0, 6.0, 3.0, 6.0, 14.0, 8.0, 11.0, 15.0, 24.0, 25.0, 23.0, 34.0, 51.0, 120.0, 184.0, 446.0, 990.0, 2635.0, 8752.0, 38528.0, 304998.0, 3057550.0, 694296.0, 66067.0, 13183.0, 3879.0, 1302.0, 524.0, 204.0, 115.0, 61.0, 44.0, 32.0, 30.0, 21.0, 17.0, 17.0, 11.0, 13.0, 13.0, 4.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-35.15625, -34.170166015625, -33.18408203125, -32.197998046875, -31.2119140625, -30.225830078125, -29.23974609375, -28.253662109375, -27.267578125, -26.281494140625, -25.29541015625, -24.309326171875, -23.3232421875, -22.337158203125, -21.35107421875, -20.364990234375, -19.37890625, -18.392822265625, -17.40673828125, -16.420654296875, -15.4345703125, -14.448486328125, -13.46240234375, -12.476318359375, -11.490234375, -10.504150390625, -9.51806640625, -8.531982421875, -7.5458984375, -6.559814453125, -5.57373046875, -4.587646484375, -3.6015625, -2.615478515625, -1.62939453125, -0.643310546875, 0.3427734375, 1.328857421875, 2.31494140625, 3.301025390625, 4.287109375, 5.273193359375, 6.25927734375, 7.245361328125, 8.2314453125, 9.217529296875, 10.20361328125, 11.189697265625, 12.17578125, 13.161865234375, 14.14794921875, 15.134033203125, 16.1201171875, 17.106201171875, 18.09228515625, 19.078369140625, 20.064453125, 21.050537109375, 22.03662109375, 23.022705078125, 24.0087890625, 24.994873046875, 25.98095703125, 26.967041015625, 27.953125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 15.0, 30.0, 58.0, 114.0, 157.0, 181.0, 169.0, 117.0, 71.0, 49.0, 21.0, 10.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.0972785949707, -54.63044357299805, -51.163612365722656, -47.69677734375, -44.229942321777344, -40.76310729980469, -37.29627227783203, -33.82944107055664, -30.362606048583984, -26.895771026611328, -23.428937911987305, -19.96210479736328, -16.495269775390625, -13.028434753417969, -9.561601638793945, -6.094768524169922, -2.6279335021972656, 0.8389005661010742, 4.305734634399414, 7.772568702697754, 11.239402770996094, 14.70623779296875, 18.173070907592773, 21.639904022216797, 25.106739044189453, 28.57357406616211, 32.0404052734375, 35.507240295410156, 38.97407531738281, 42.44091033935547, 45.907745361328125, 49.374576568603516, 52.84141540527344, 56.308250427246094, 59.77508544921875, 63.24191665649414, 66.70875549316406, 70.17558288574219, 73.64241790771484, 77.1092529296875, 80.57608795166016, 84.04292297363281, 87.50975799560547, 90.97659301757812, 94.44342041015625, 97.91026306152344, 101.37709045410156, 104.84392547607422, 108.31076049804688, 111.77759552001953, 115.24443054199219, 118.71126556396484, 122.1781005859375, 125.64492797851562, 129.1117706298828, 132.57859802246094, 136.04544067382812, 139.51226806640625, 142.97911071777344, 146.44593811035156, 149.91278076171875, 153.37960815429688, 156.84645080566406, 160.3132781982422, 163.7801055908203]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 3.0, 5.0, 6.0, 8.0, 11.0, 6.0, 12.0, 13.0, 18.0, 19.0, 19.0, 17.0, 22.0, 42.0, 29.0, 30.0, 38.0, 36.0, 45.0, 51.0, 46.0, 35.0, 42.0, 58.0, 46.0, 28.0, 38.0, 28.0, 31.0, 26.0, 28.0, 22.0, 23.0, 21.0, 17.0, 12.0, 16.0, 13.0, 10.0, 9.0, 4.0, 2.0, 5.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.533958435058594, -40.333946228027344, -39.133934020996094, -37.933921813964844, -36.733909606933594, -35.53390121459961, -34.33388900756836, -33.13387680053711, -31.93386459350586, -30.73385238647461, -29.53384017944336, -28.333829879760742, -27.133817672729492, -25.933805465698242, -24.733795166015625, -23.533782958984375, -22.333770751953125, -21.133758544921875, -19.933746337890625, -18.733736038208008, -17.533723831176758, -16.333711624145508, -15.133700370788574, -13.93368911743164, -12.73367691040039, -11.53366470336914, -10.333653450012207, -9.133642196655273, -7.933629989624023, -6.733618259429932, -5.53360652923584, -4.333595275878906, -3.1335830688476562, -1.9335713386535645, -0.7335596084594727, 0.46645212173461914, 1.666463851928711, 2.8664755821228027, 4.0664873123168945, 5.266498565673828, 6.466510772705078, 7.66652250289917, 8.866534233093262, 10.066545486450195, 11.266557693481445, 12.466569900512695, 13.666581153869629, 14.866592407226562, 16.066604614257812, 17.266616821289062, 18.466629028320312, 19.66663932800293, 20.86665153503418, 22.06666374206543, 23.266674041748047, 24.466686248779297, 25.666698455810547, 26.866710662841797, 28.066722869873047, 29.266733169555664, 30.466745376586914, 31.666757583618164, 32.86676788330078, 34.06678009033203, 35.26679229736328]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 5.0, 7.0, 6.0, 3.0, 5.0, 10.0, 8.0, 12.0, 18.0, 18.0, 30.0, 17.0, 25.0, 33.0, 25.0, 25.0, 33.0, 35.0, 43.0, 50.0, 38.0, 37.0, 51.0, 44.0, 36.0, 38.0, 39.0, 42.0, 41.0, 41.0, 27.0, 24.0, 29.0, 21.0, 19.0, 15.0, 13.0, 17.0, 7.0, 4.0, 7.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.107421875, -2.996734619140625, -2.88604736328125, -2.775360107421875, -2.6646728515625, -2.553985595703125, -2.44329833984375, -2.332611083984375, -2.221923828125, -2.111236572265625, -2.00054931640625, -1.889862060546875, -1.7791748046875, -1.668487548828125, -1.55780029296875, -1.447113037109375, -1.33642578125, -1.225738525390625, -1.11505126953125, -1.004364013671875, -0.8936767578125, -0.782989501953125, -0.67230224609375, -0.561614990234375, -0.450927734375, -0.340240478515625, -0.22955322265625, -0.118865966796875, -0.0081787109375, 0.102508544921875, 0.21319580078125, 0.323883056640625, 0.4345703125, 0.545257568359375, 0.65594482421875, 0.766632080078125, 0.8773193359375, 0.988006591796875, 1.09869384765625, 1.209381103515625, 1.320068359375, 1.430755615234375, 1.54144287109375, 1.652130126953125, 1.7628173828125, 1.873504638671875, 1.98419189453125, 2.094879150390625, 2.20556640625, 2.316253662109375, 2.42694091796875, 2.537628173828125, 2.6483154296875, 2.759002685546875, 2.86968994140625, 2.980377197265625, 3.091064453125, 3.201751708984375, 3.31243896484375, 3.423126220703125, 3.5338134765625, 3.644500732421875, 3.75518798828125, 3.865875244140625, 3.9765625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 10.0, 13.0, 23.0, 36.0, 63.0, 107.0, 164.0, 289.0, 463.0, 900.0, 1542.0, 2778.0, 4967.0, 8825.0, 15565.0, 27179.0, 45805.0, 75323.0, 117042.0, 168956.0, 188817.0, 146306.0, 97254.0, 60481.0, 36588.0, 21248.0, 12127.0, 6829.0, 3923.0, 2100.0, 1221.0, 653.0, 390.0, 216.0, 133.0, 69.0, 45.0, 27.0, 21.0, 17.0, 9.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.87109375, -7.62725830078125, -7.3834228515625, -7.13958740234375, -6.895751953125, -6.65191650390625, -6.4080810546875, -6.16424560546875, -5.92041015625, -5.67657470703125, -5.4327392578125, -5.18890380859375, -4.945068359375, -4.70123291015625, -4.4573974609375, -4.21356201171875, -3.9697265625, -3.72589111328125, -3.4820556640625, -3.23822021484375, -2.994384765625, -2.75054931640625, -2.5067138671875, -2.26287841796875, -2.01904296875, -1.77520751953125, -1.5313720703125, -1.28753662109375, -1.043701171875, -0.79986572265625, -0.5560302734375, -0.31219482421875, -0.068359375, 0.17547607421875, 0.4193115234375, 0.66314697265625, 0.906982421875, 1.15081787109375, 1.3946533203125, 1.63848876953125, 1.88232421875, 2.12615966796875, 2.3699951171875, 2.61383056640625, 2.857666015625, 3.10150146484375, 3.3453369140625, 3.58917236328125, 3.8330078125, 4.07684326171875, 4.3206787109375, 4.56451416015625, 4.808349609375, 5.05218505859375, 5.2960205078125, 5.53985595703125, 5.78369140625, 6.02752685546875, 6.2713623046875, 6.51519775390625, 6.759033203125, 7.00286865234375, 7.2467041015625, 7.49053955078125, 7.734375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 5.0, 6.0, 16.0, 15.0, 14.0, 21.0, 27.0, 22.0, 25.0, 18.0, 37.0, 38.0, 36.0, 44.0, 32.0, 32.0, 46.0, 1064.0, 35.0, 43.0, 56.0, 31.0, 42.0, 42.0, 32.0, 32.0, 28.0, 28.0, 28.0, 18.0, 19.0, 6.0, 8.0, 16.0, 13.0, 12.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.755859375, -2.6722412109375, -2.588623046875, -2.5050048828125, -2.42138671875, -2.3377685546875, -2.254150390625, -2.1705322265625, -2.0869140625, -2.0032958984375, -1.919677734375, -1.8360595703125, -1.75244140625, -1.6688232421875, -1.585205078125, -1.5015869140625, -1.41796875, -1.3343505859375, -1.250732421875, -1.1671142578125, -1.08349609375, -0.9998779296875, -0.916259765625, -0.8326416015625, -0.7490234375, -0.6654052734375, -0.581787109375, -0.4981689453125, -0.41455078125, -0.3309326171875, -0.247314453125, -0.1636962890625, -0.080078125, 0.0035400390625, 0.087158203125, 0.1707763671875, 0.25439453125, 0.3380126953125, 0.421630859375, 0.5052490234375, 0.5888671875, 0.6724853515625, 0.756103515625, 0.8397216796875, 0.92333984375, 1.0069580078125, 1.090576171875, 1.1741943359375, 1.2578125, 1.3414306640625, 1.425048828125, 1.5086669921875, 1.59228515625, 1.6759033203125, 1.759521484375, 1.8431396484375, 1.9267578125, 2.0103759765625, 2.093994140625, 2.1776123046875, 2.26123046875, 2.3448486328125, 2.428466796875, 2.5120849609375, 2.595703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 3.0, 9.0, 9.0, 12.0, 19.0, 30.0, 27.0, 37.0, 68.0, 98.0, 116.0, 173.0, 277.0, 398.0, 575.0, 972.0, 1557.0, 2823.0, 5375.0, 12736.0, 34394.0, 112143.0, 456292.0, 1061365.0, 286911.0, 76165.0, 24604.0, 9664.0, 4320.0, 2280.0, 1276.0, 771.0, 516.0, 355.0, 242.0, 180.0, 94.0, 56.0, 60.0, 33.0, 26.0, 22.0, 18.0, 11.0, 5.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.4935302734375, -8.213623046875, -7.9337158203125, -7.65380859375, -7.3739013671875, -7.093994140625, -6.8140869140625, -6.5341796875, -6.2542724609375, -5.974365234375, -5.6944580078125, -5.41455078125, -5.1346435546875, -4.854736328125, -4.5748291015625, -4.294921875, -4.0150146484375, -3.735107421875, -3.4552001953125, -3.17529296875, -2.8953857421875, -2.615478515625, -2.3355712890625, -2.0556640625, -1.7757568359375, -1.495849609375, -1.2159423828125, -0.93603515625, -0.6561279296875, -0.376220703125, -0.0963134765625, 0.18359375, 0.4635009765625, 0.743408203125, 1.0233154296875, 1.30322265625, 1.5831298828125, 1.863037109375, 2.1429443359375, 2.4228515625, 2.7027587890625, 2.982666015625, 3.2625732421875, 3.54248046875, 3.8223876953125, 4.102294921875, 4.3822021484375, 4.662109375, 4.9420166015625, 5.221923828125, 5.5018310546875, 5.78173828125, 6.0616455078125, 6.341552734375, 6.6214599609375, 6.9013671875, 7.1812744140625, 7.461181640625, 7.7410888671875, 8.02099609375, 8.3009033203125, 8.580810546875, 8.8607177734375, 9.140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 7.0, 6.0, 4.0, 11.0, 11.0, 20.0, 26.0, 28.0, 19.0, 31.0, 42.0, 55.0, 81.0, 83.0, 79.0, 87.0, 69.0, 70.0, 43.0, 52.0, 38.0, 19.0, 25.0, 19.0, 15.0, 10.0, 3.0, 4.0, 3.0, 4.0, 4.0, 4.0, 5.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.125, -3.023468017578125, -2.92193603515625, -2.820404052734375, -2.7188720703125, -2.617340087890625, -2.51580810546875, -2.414276123046875, -2.312744140625, -2.211212158203125, -2.10968017578125, -2.008148193359375, -1.9066162109375, -1.805084228515625, -1.70355224609375, -1.602020263671875, -1.50048828125, -1.398956298828125, -1.29742431640625, -1.195892333984375, -1.0943603515625, -0.992828369140625, -0.89129638671875, -0.789764404296875, -0.688232421875, -0.586700439453125, -0.48516845703125, -0.383636474609375, -0.2821044921875, -0.180572509765625, -0.07904052734375, 0.022491455078125, 0.1240234375, 0.225555419921875, 0.32708740234375, 0.428619384765625, 0.5301513671875, 0.631683349609375, 0.73321533203125, 0.834747314453125, 0.936279296875, 1.037811279296875, 1.13934326171875, 1.240875244140625, 1.3424072265625, 1.443939208984375, 1.54547119140625, 1.647003173828125, 1.74853515625, 1.850067138671875, 1.95159912109375, 2.053131103515625, 2.1546630859375, 2.256195068359375, 2.35772705078125, 2.459259033203125, 2.560791015625, 2.662322998046875, 2.76385498046875, 2.865386962890625, 2.9669189453125, 3.068450927734375, 3.16998291015625, 3.271514892578125, 3.373046875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 13.0, 8.0, 5.0, 9.0, 9.0, 14.0, 16.0, 20.0, 23.0, 32.0, 50.0, 57.0, 92.0, 117.0, 179.0, 343.0, 1086.0, 6905.0, 230956.0, 790372.0, 15329.0, 1771.0, 460.0, 201.0, 115.0, 78.0, 72.0, 46.0, 32.0, 27.0, 24.0, 21.0, 12.0, 15.0, 9.0, 8.0, 5.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.5, -46.99169921875, -45.4833984375, -43.97509765625, -42.466796875, -40.95849609375, -39.4501953125, -37.94189453125, -36.43359375, -34.92529296875, -33.4169921875, -31.90869140625, -30.400390625, -28.89208984375, -27.3837890625, -25.87548828125, -24.3671875, -22.85888671875, -21.3505859375, -19.84228515625, -18.333984375, -16.82568359375, -15.3173828125, -13.80908203125, -12.30078125, -10.79248046875, -9.2841796875, -7.77587890625, -6.267578125, -4.75927734375, -3.2509765625, -1.74267578125, -0.234375, 1.27392578125, 2.7822265625, 4.29052734375, 5.798828125, 7.30712890625, 8.8154296875, 10.32373046875, 11.83203125, 13.34033203125, 14.8486328125, 16.35693359375, 17.865234375, 19.37353515625, 20.8818359375, 22.39013671875, 23.8984375, 25.40673828125, 26.9150390625, 28.42333984375, 29.931640625, 31.43994140625, 32.9482421875, 34.45654296875, 35.96484375, 37.47314453125, 38.9814453125, 40.48974609375, 41.998046875, 43.50634765625, 45.0146484375, 46.52294921875, 48.03125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 41.0, 78.0, 154.0, 214.0, 240.0, 129.0, 78.0, 39.0, 13.0, 10.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.371774673461914, -18.920814514160156, -18.4698543548584, -18.018896102905273, -17.567935943603516, -17.116975784301758, -16.666015625, -16.215055465698242, -15.7640962600708, -15.313136100769043, -14.862176895141602, -14.411216735839844, -13.960256576538086, -13.509297370910645, -13.058337211608887, -12.607378005981445, -12.156417846679688, -11.70545768737793, -11.254498481750488, -10.80353832244873, -10.352579116821289, -9.901618957519531, -9.450658798217773, -8.999698638916016, -8.548739433288574, -8.097779273986816, -7.646820068359375, -7.195859909057617, -6.744900226593018, -6.293940544128418, -5.84298038482666, -5.3920207023620605, -4.9410600662231445, -4.490100383758545, -4.039140701293945, -3.5881805419921875, -3.137220859527588, -2.6862611770629883, -2.2353012561798096, -1.7843413352966309, -1.3333816528320312, -0.8824218511581421, -0.43146204948425293, 0.01949775218963623, 0.4704575538635254, 0.921417236328125, 1.3723771572113037, 1.8233370780944824, 2.274296760559082, 2.7252564430236816, 3.1762163639068604, 3.627176284790039, 4.078135967254639, 4.529095649719238, 4.980055809020996, 5.431015491485596, 5.881975173950195, 6.332934856414795, 6.7838945388793945, 7.234854698181152, 7.685814380645752, 8.136774063110352, 8.58773422241211, 9.038694381713867, 9.489653587341309]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 8.0, 9.0, 5.0, 4.0, 14.0, 15.0, 21.0, 21.0, 20.0, 30.0, 24.0, 35.0, 32.0, 24.0, 46.0, 29.0, 34.0, 35.0, 48.0, 48.0, 38.0, 37.0, 52.0, 37.0, 44.0, 40.0, 37.0, 32.0, 27.0, 23.0, 17.0, 26.0, 18.0, 21.0, 15.0, 5.0, 6.0, 4.0, 5.0, 4.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.6793127059936523, -3.5387067794799805, -3.3981008529663086, -3.2574949264526367, -3.116888999938965, -2.976283073425293, -2.835677146911621, -2.695071220397949, -2.5544652938842773, -2.4138593673706055, -2.2732534408569336, -2.1326475143432617, -1.9920415878295898, -1.851435661315918, -1.7108298540115356, -1.5702239274978638, -1.4296181201934814, -1.2890121936798096, -1.1484062671661377, -1.0078003406524658, -0.8671944737434387, -0.7265885472297668, -0.5859826803207397, -0.44537675380706787, -0.304770827293396, -0.16416491568088531, -0.023559004068374634, 0.11704689264297485, 0.25765281915664673, 0.3982587456703186, 0.5388646125793457, 0.6794705390930176, 0.8200764656066895, 0.9606823921203613, 1.1012883186340332, 1.241894245147705, 1.382500171661377, 1.5231060981750488, 1.6637119054794312, 1.804317831993103, 1.944923758506775, 2.0855295658111572, 2.226135492324829, 2.366741418838501, 2.507347345352173, 2.6479532718658447, 2.7885591983795166, 2.9291651248931885, 3.0697710514068604, 3.2103769779205322, 3.350982904434204, 3.491588830947876, 3.632194757461548, 3.7728006839752197, 3.9134063720703125, 4.054012298583984, 4.194618225097656, 4.335224151611328, 4.475830078125, 4.616436004638672, 4.757041931152344, 4.897647857666016, 5.0382537841796875, 5.178859710693359, 5.319465637207031]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 8.0, 15.0, 12.0, 16.0, 18.0, 23.0, 27.0, 23.0, 27.0, 34.0, 33.0, 32.0, 44.0, 37.0, 43.0, 35.0, 41.0, 48.0, 43.0, 35.0, 46.0, 57.0, 41.0, 36.0, 26.0, 22.0, 30.0, 40.0, 24.0, 19.0, 10.0, 5.0, 17.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.201171875, -3.086151123046875, -2.97113037109375, -2.856109619140625, -2.7410888671875, -2.626068115234375, -2.51104736328125, -2.396026611328125, -2.281005859375, -2.165985107421875, -2.05096435546875, -1.935943603515625, -1.8209228515625, -1.705902099609375, -1.59088134765625, -1.475860595703125, -1.36083984375, -1.245819091796875, -1.13079833984375, -1.015777587890625, -0.9007568359375, -0.785736083984375, -0.67071533203125, -0.555694580078125, -0.440673828125, -0.325653076171875, -0.21063232421875, -0.095611572265625, 0.0194091796875, 0.134429931640625, 0.24945068359375, 0.364471435546875, 0.4794921875, 0.594512939453125, 0.70953369140625, 0.824554443359375, 0.9395751953125, 1.054595947265625, 1.16961669921875, 1.284637451171875, 1.399658203125, 1.514678955078125, 1.62969970703125, 1.744720458984375, 1.8597412109375, 1.974761962890625, 2.08978271484375, 2.204803466796875, 2.31982421875, 2.434844970703125, 2.54986572265625, 2.664886474609375, 2.7799072265625, 2.894927978515625, 3.00994873046875, 3.124969482421875, 3.239990234375, 3.355010986328125, 3.47003173828125, 3.585052490234375, 3.7000732421875, 3.815093994140625, 3.93011474609375, 4.045135498046875, 4.16015625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 3.0, 6.0, 15.0, 17.0, 15.0, 27.0, 41.0, 54.0, 85.0, 117.0, 180.0, 292.0, 519.0, 810.0, 1424.0, 2641.0, 5028.0, 10022.0, 22297.0, 67555.0, 317734.0, 456599.0, 106483.0, 30480.0, 12467.0, 6076.0, 3182.0, 1766.0, 978.0, 554.0, 377.0, 218.0, 157.0, 102.0, 66.0, 37.0, 30.0, 26.0, 16.0, 8.0, 9.0, 9.0, 5.0, 6.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.5625, -8.30426025390625, -8.0460205078125, -7.78778076171875, -7.529541015625, -7.27130126953125, -7.0130615234375, -6.75482177734375, -6.49658203125, -6.23834228515625, -5.9801025390625, -5.72186279296875, -5.463623046875, -5.20538330078125, -4.9471435546875, -4.68890380859375, -4.4306640625, -4.17242431640625, -3.9141845703125, -3.65594482421875, -3.397705078125, -3.13946533203125, -2.8812255859375, -2.62298583984375, -2.36474609375, -2.10650634765625, -1.8482666015625, -1.59002685546875, -1.331787109375, -1.07354736328125, -0.8153076171875, -0.55706787109375, -0.298828125, -0.04058837890625, 0.2176513671875, 0.47589111328125, 0.734130859375, 0.99237060546875, 1.2506103515625, 1.50885009765625, 1.76708984375, 2.02532958984375, 2.2835693359375, 2.54180908203125, 2.800048828125, 3.05828857421875, 3.3165283203125, 3.57476806640625, 3.8330078125, 4.09124755859375, 4.3494873046875, 4.60772705078125, 4.865966796875, 5.12420654296875, 5.3824462890625, 5.64068603515625, 5.89892578125, 6.15716552734375, 6.4154052734375, 6.67364501953125, 6.931884765625, 7.19012451171875, 7.4483642578125, 7.70660400390625, 7.96484375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 7.0, 12.0, 8.0, 10.0, 10.0, 24.0, 24.0, 25.0, 35.0, 34.0, 40.0, 57.0, 61.0, 91.0, 154.0, 362.0, 1458.0, 143.0, 117.0, 73.0, 50.0, 50.0, 33.0, 39.0, 40.0, 27.0, 25.0, 12.0, 5.0, 7.0, 7.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-21.875, -21.3294677734375, -20.783935546875, -20.2384033203125, -19.69287109375, -19.1473388671875, -18.601806640625, -18.0562744140625, -17.5107421875, -16.9652099609375, -16.419677734375, -15.8741455078125, -15.32861328125, -14.7830810546875, -14.237548828125, -13.6920166015625, -13.146484375, -12.6009521484375, -12.055419921875, -11.5098876953125, -10.96435546875, -10.4188232421875, -9.873291015625, -9.3277587890625, -8.7822265625, -8.2366943359375, -7.691162109375, -7.1456298828125, -6.60009765625, -6.0545654296875, -5.509033203125, -4.9635009765625, -4.41796875, -3.8724365234375, -3.326904296875, -2.7813720703125, -2.23583984375, -1.6903076171875, -1.144775390625, -0.5992431640625, -0.0537109375, 0.4918212890625, 1.037353515625, 1.5828857421875, 2.12841796875, 2.6739501953125, 3.219482421875, 3.7650146484375, 4.310546875, 4.8560791015625, 5.401611328125, 5.9471435546875, 6.49267578125, 7.0382080078125, 7.583740234375, 8.1292724609375, 8.6748046875, 9.2203369140625, 9.765869140625, 10.3114013671875, 10.85693359375, 11.4024658203125, 11.947998046875, 12.4935302734375, 13.0390625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 10.0, 11.0, 21.0, 38.0, 48.0, 108.0, 209.0, 446.0, 1152.0, 3811.0, 32634.0, 2955339.0, 142175.0, 6988.0, 1555.0, 538.0, 258.0, 145.0, 100.0, 56.0, 32.0, 18.0, 8.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.8125, -49.15625, -47.5, -45.84375, -44.1875, -42.53125, -40.875, -39.21875, -37.5625, -35.90625, -34.25, -32.59375, -30.9375, -29.28125, -27.625, -25.96875, -24.3125, -22.65625, -21.0, -19.34375, -17.6875, -16.03125, -14.375, -12.71875, -11.0625, -9.40625, -7.75, -6.09375, -4.4375, -2.78125, -1.125, 0.53125, 2.1875, 3.84375, 5.5, 7.15625, 8.8125, 10.46875, 12.125, 13.78125, 15.4375, 17.09375, 18.75, 20.40625, 22.0625, 23.71875, 25.375, 27.03125, 28.6875, 30.34375, 32.0, 33.65625, 35.3125, 36.96875, 38.625, 40.28125, 41.9375, 43.59375, 45.25, 46.90625, 48.5625, 50.21875, 51.875, 53.53125, 55.1875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 9.0, 38.0, 114.0, 307.0, 312.0, 166.0, 47.0, 14.0, 3.0, 3.0], "bins": [-217.1337890625, -213.39869689941406, -209.66360473632812, -205.9285125732422, -202.19342041015625, -198.4583282470703, -194.72323608398438, -190.98814392089844, -187.2530517578125, -183.51795959472656, -179.78286743164062, -176.0477752685547, -172.31268310546875, -168.5775909423828, -164.84249877929688, -161.10740661621094, -157.372314453125, -153.63722229003906, -149.90213012695312, -146.1670379638672, -142.43194580078125, -138.6968536376953, -134.96176147460938, -131.22666931152344, -127.4915771484375, -123.75648498535156, -120.02139282226562, -116.28630065917969, -112.55120849609375, -108.81611633300781, -105.08102416992188, -101.34593200683594, -97.61083221435547, -93.87574005126953, -90.1406478881836, -86.40555572509766, -82.67046356201172, -78.93537139892578, -75.20027923583984, -71.4651870727539, -67.73009490966797, -63.99500274658203, -60.259910583496094, -56.524818420410156, -52.78972625732422, -49.05463409423828, -45.319541931152344, -41.584449768066406, -37.84935760498047, -34.11426544189453, -30.379173278808594, -26.644081115722656, -22.90898895263672, -19.17389678955078, -15.438804626464844, -11.703712463378906, -7.968622207641602, -4.233530044555664, -0.49843788146972656, 3.236654281616211, 6.971746444702148, 10.706838607788086, 14.441930770874023, 18.17702293395996, 21.9121150970459]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 8.0, 13.0, 11.0, 14.0, 20.0, 23.0, 31.0, 24.0, 18.0, 21.0, 28.0, 32.0, 33.0, 36.0, 21.0, 46.0, 39.0, 35.0, 37.0, 39.0, 33.0, 30.0, 45.0, 35.0, 24.0, 35.0, 28.0, 35.0, 23.0, 26.0, 20.0, 12.0, 13.0, 19.0, 9.0, 19.0, 17.0, 3.0, 6.0, 3.0, 4.0, 7.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-43.37954330444336, -42.0287971496582, -40.67805480957031, -39.327308654785156, -37.976566314697266, -36.62582015991211, -35.27507781982422, -33.92433166503906, -32.573585510253906, -31.222841262817383, -29.87209701538086, -28.521350860595703, -27.170608520507812, -25.819862365722656, -24.469118118286133, -23.11837387084961, -21.76763153076172, -20.416887283325195, -19.066143035888672, -17.715396881103516, -16.364654541015625, -15.013909339904785, -13.663164138793945, -12.312419891357422, -10.961675643920898, -9.610931396484375, -8.260187149047852, -6.909441947937012, -5.558697700500488, -4.207953453063965, -2.857208251953125, -1.5064640045166016, -0.1557159423828125, 1.19502854347229, 2.5457730293273926, 3.896517753601074, 5.247262001037598, 6.598006248474121, 7.948751449584961, 9.299495697021484, 10.650239944458008, 12.000984191894531, 13.351728439331055, 14.702473640441895, 16.053218841552734, 17.403961181640625, 18.75470733642578, 20.105451583862305, 21.456195831298828, 22.80694007873535, 24.157684326171875, 25.50843048095703, 26.859172821044922, 28.209918975830078, 29.5606632232666, 30.911407470703125, 32.26215362548828, 33.61289978027344, 34.96364212036133, 36.314388275146484, 37.665130615234375, 39.01587677001953, 40.36662292480469, 41.71736526489258, 43.06810760498047]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 12.0, 5.0, 5.0, 11.0, 10.0, 11.0, 20.0, 16.0, 22.0, 22.0, 18.0, 28.0, 33.0, 32.0, 44.0, 29.0, 32.0, 44.0, 52.0, 46.0, 32.0, 50.0, 52.0, 49.0, 33.0, 48.0, 41.0, 29.0, 31.0, 23.0, 24.0, 15.0, 16.0, 10.0, 14.0, 16.0, 6.0, 6.0, 7.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.294921875, -3.177032470703125, -3.05914306640625, -2.941253662109375, -2.8233642578125, -2.705474853515625, -2.58758544921875, -2.469696044921875, -2.351806640625, -2.233917236328125, -2.11602783203125, -1.998138427734375, -1.8802490234375, -1.762359619140625, -1.64447021484375, -1.526580810546875, -1.40869140625, -1.290802001953125, -1.17291259765625, -1.055023193359375, -0.9371337890625, -0.819244384765625, -0.70135498046875, -0.583465576171875, -0.465576171875, -0.347686767578125, -0.22979736328125, -0.111907958984375, 0.0059814453125, 0.123870849609375, 0.24176025390625, 0.359649658203125, 0.4775390625, 0.595428466796875, 0.71331787109375, 0.831207275390625, 0.9490966796875, 1.066986083984375, 1.18487548828125, 1.302764892578125, 1.420654296875, 1.538543701171875, 1.65643310546875, 1.774322509765625, 1.8922119140625, 2.010101318359375, 2.12799072265625, 2.245880126953125, 2.36376953125, 2.481658935546875, 2.59954833984375, 2.717437744140625, 2.8353271484375, 2.953216552734375, 3.07110595703125, 3.188995361328125, 3.306884765625, 3.424774169921875, 3.54266357421875, 3.660552978515625, 3.7784423828125, 3.896331787109375, 4.01422119140625, 4.132110595703125, 4.25]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 11.0, 8.0, 10.0, 10.0, 28.0, 33.0, 42.0, 79.0, 101.0, 146.0, 216.0, 359.0, 560.0, 923.0, 1709.0, 3209.0, 6368.0, 14870.0, 44907.0, 234092.0, 2435914.0, 1270119.0, 129377.0, 30430.0, 10702.0, 4746.0, 2357.0, 1209.0, 687.0, 409.0, 219.0, 139.0, 101.0, 53.0, 51.0, 33.0, 19.0, 12.0, 12.0, 8.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.5511474609375, -12.156982421875, -11.7628173828125, -11.36865234375, -10.9744873046875, -10.580322265625, -10.1861572265625, -9.7919921875, -9.3978271484375, -9.003662109375, -8.6094970703125, -8.21533203125, -7.8211669921875, -7.427001953125, -7.0328369140625, -6.638671875, -6.2445068359375, -5.850341796875, -5.4561767578125, -5.06201171875, -4.6678466796875, -4.273681640625, -3.8795166015625, -3.4853515625, -3.0911865234375, -2.697021484375, -2.3028564453125, -1.90869140625, -1.5145263671875, -1.120361328125, -0.7261962890625, -0.33203125, 0.0621337890625, 0.456298828125, 0.8504638671875, 1.24462890625, 1.6387939453125, 2.032958984375, 2.4271240234375, 2.8212890625, 3.2154541015625, 3.609619140625, 4.0037841796875, 4.39794921875, 4.7921142578125, 5.186279296875, 5.5804443359375, 5.974609375, 6.3687744140625, 6.762939453125, 7.1571044921875, 7.55126953125, 7.9454345703125, 8.339599609375, 8.7337646484375, 9.1279296875, 9.5220947265625, 9.916259765625, 10.3104248046875, 10.70458984375, 11.0987548828125, 11.492919921875, 11.8870849609375, 12.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 2.0, 4.0, 11.0, 12.0, 13.0, 27.0, 33.0, 57.0, 97.0, 175.0, 275.0, 501.0, 832.0, 814.0, 520.0, 308.0, 156.0, 91.0, 63.0, 33.0, 18.0, 20.0, 11.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.1978759765625, -8.622314453125, -8.0467529296875, -7.47119140625, -6.8956298828125, -6.320068359375, -5.7445068359375, -5.1689453125, -4.5933837890625, -4.017822265625, -3.4422607421875, -2.86669921875, -2.2911376953125, -1.715576171875, -1.1400146484375, -0.564453125, 0.0111083984375, 0.586669921875, 1.1622314453125, 1.73779296875, 2.3133544921875, 2.888916015625, 3.4644775390625, 4.0400390625, 4.6156005859375, 5.191162109375, 5.7667236328125, 6.34228515625, 6.9178466796875, 7.493408203125, 8.0689697265625, 8.64453125, 9.2200927734375, 9.795654296875, 10.3712158203125, 10.94677734375, 11.5223388671875, 12.097900390625, 12.6734619140625, 13.2490234375, 13.8245849609375, 14.400146484375, 14.9757080078125, 15.55126953125, 16.1268310546875, 16.702392578125, 17.2779541015625, 17.853515625, 18.4290771484375, 19.004638671875, 19.5802001953125, 20.15576171875, 20.7313232421875, 21.306884765625, 21.8824462890625, 22.4580078125, 23.0335693359375, 23.609130859375, 24.1846923828125, 24.76025390625, 25.3358154296875, 25.911376953125, 26.4869384765625, 27.0625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 3.0, 9.0, 10.0, 12.0, 21.0, 16.0, 21.0, 22.0, 17.0, 46.0, 43.0, 87.0, 168.0, 278.0, 692.0, 1810.0, 5438.0, 20353.0, 135590.0, 2753136.0, 1186891.0, 70016.0, 13247.0, 3842.0, 1359.0, 519.0, 243.0, 107.0, 50.0, 41.0, 36.0, 29.0, 19.0, 21.0, 20.0, 14.0, 11.0, 10.0, 6.0, 3.0, 3.0, 5.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-32.15625, -31.0791015625, -30.001953125, -28.9248046875, -27.84765625, -26.7705078125, -25.693359375, -24.6162109375, -23.5390625, -22.4619140625, -21.384765625, -20.3076171875, -19.23046875, -18.1533203125, -17.076171875, -15.9990234375, -14.921875, -13.8447265625, -12.767578125, -11.6904296875, -10.61328125, -9.5361328125, -8.458984375, -7.3818359375, -6.3046875, -5.2275390625, -4.150390625, -3.0732421875, -1.99609375, -0.9189453125, 0.158203125, 1.2353515625, 2.3125, 3.3896484375, 4.466796875, 5.5439453125, 6.62109375, 7.6982421875, 8.775390625, 9.8525390625, 10.9296875, 12.0068359375, 13.083984375, 14.1611328125, 15.23828125, 16.3154296875, 17.392578125, 18.4697265625, 19.546875, 20.6240234375, 21.701171875, 22.7783203125, 23.85546875, 24.9326171875, 26.009765625, 27.0869140625, 28.1640625, 29.2412109375, 30.318359375, 31.3955078125, 32.47265625, 33.5498046875, 34.626953125, 35.7041015625, 36.78125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 3.0, 4.0, 6.0, 15.0, 16.0, 23.0, 20.0, 40.0, 60.0, 65.0, 62.0, 74.0, 88.0, 90.0, 76.0, 72.0, 65.0, 57.0, 53.0, 33.0, 27.0, 13.0, 10.0, 10.0, 8.0, 5.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.96723556518555, -36.31988525390625, -34.67253112792969, -33.02518081665039, -31.377826690673828, -29.73047637939453, -28.0831241607666, -26.435771942138672, -24.788419723510742, -23.141067504882812, -21.493715286254883, -19.846363067626953, -18.199012756347656, -16.551658630371094, -14.904308319091797, -13.256956100463867, -11.609603881835938, -9.962251663208008, -8.314899444580078, -6.667548179626465, -5.020195960998535, -3.3728437423706055, -1.7254924774169922, -0.0781402587890625, 1.5692119598388672, 3.2165639400482178, 4.863915920257568, 6.51126766204834, 8.15861988067627, 9.8059720993042, 11.453323364257812, 13.100675582885742, 14.748031616210938, 16.395383834838867, 18.042736053466797, 19.690086364746094, 21.337440490722656, 22.984790802001953, 24.632143020629883, 26.279495239257812, 27.926847457885742, 29.574199676513672, 31.2215518951416, 32.86890411376953, 34.51625442504883, 36.16360855102539, 37.81095886230469, 39.45831298828125, 41.10566329956055, 42.753013610839844, 44.400367736816406, 46.0477180480957, 47.695072174072266, 49.34242248535156, 50.989776611328125, 52.63712692260742, 54.28447723388672, 55.931827545166016, 57.57918167114258, 59.226531982421875, 60.87388610839844, 62.521236419677734, 64.16858673095703, 65.8159408569336, 67.46329498291016]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 2.0, 2.0, 9.0, 7.0, 5.0, 8.0, 11.0, 6.0, 14.0, 19.0, 18.0, 20.0, 20.0, 20.0, 29.0, 44.0, 30.0, 45.0, 39.0, 39.0, 43.0, 39.0, 34.0, 35.0, 44.0, 24.0, 33.0, 39.0, 30.0, 27.0, 38.0, 19.0, 25.0, 24.0, 12.0, 24.0, 20.0, 9.0, 14.0, 21.0, 13.0, 10.0, 5.0, 10.0, 4.0, 8.0, 3.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-32.862281799316406, -31.812808990478516, -30.763338088989258, -29.7138671875, -28.66439437866211, -27.61492156982422, -26.56545066833496, -25.515979766845703, -24.466506958007812, -23.417034149169922, -22.367563247680664, -21.318092346191406, -20.268619537353516, -19.219146728515625, -18.169675827026367, -17.12020492553711, -16.07073211669922, -15.021260261535645, -13.97178840637207, -12.922316551208496, -11.872844696044922, -10.823372840881348, -9.773900985717773, -8.7244291305542, -7.674957275390625, -6.625485420227051, -5.576013565063477, -4.526541709899902, -3.477069854736328, -2.427597999572754, -1.3781261444091797, -0.32865428924560547, 0.7208175659179688, 1.770289421081543, 2.819761276245117, 3.8692331314086914, 4.918704986572266, 5.96817684173584, 7.017648696899414, 8.067120552062988, 9.116592407226562, 10.166064262390137, 11.215536117553711, 12.265007972717285, 13.31447982788086, 14.363951683044434, 15.413423538208008, 16.462894439697266, 17.512367248535156, 18.561840057373047, 19.611310958862305, 20.660781860351562, 21.710254669189453, 22.759727478027344, 23.8091983795166, 24.85866928100586, 25.90814208984375, 26.95761489868164, 28.0070858001709, 29.056556701660156, 30.106029510498047, 31.155502319335938, 32.20497131347656, 33.25444412231445, 34.303916931152344]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 4.0, 4.0, 6.0, 10.0, 5.0, 7.0, 18.0, 10.0, 18.0, 14.0, 16.0, 27.0, 37.0, 24.0, 30.0, 43.0, 36.0, 31.0, 38.0, 42.0, 42.0, 39.0, 48.0, 37.0, 44.0, 32.0, 48.0, 34.0, 32.0, 27.0, 25.0, 23.0, 31.0, 20.0, 17.0, 18.0, 13.0, 9.0, 6.0, 11.0, 10.0, 4.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.953125, -3.8370361328125, -3.720947265625, -3.6048583984375, -3.48876953125, -3.3726806640625, -3.256591796875, -3.1405029296875, -3.0244140625, -2.9083251953125, -2.792236328125, -2.6761474609375, -2.56005859375, -2.4439697265625, -2.327880859375, -2.2117919921875, -2.095703125, -1.9796142578125, -1.863525390625, -1.7474365234375, -1.63134765625, -1.5152587890625, -1.399169921875, -1.2830810546875, -1.1669921875, -1.0509033203125, -0.934814453125, -0.8187255859375, -0.70263671875, -0.5865478515625, -0.470458984375, -0.3543701171875, -0.23828125, -0.1221923828125, -0.006103515625, 0.1099853515625, 0.22607421875, 0.3421630859375, 0.458251953125, 0.5743408203125, 0.6904296875, 0.8065185546875, 0.922607421875, 1.0386962890625, 1.15478515625, 1.2708740234375, 1.386962890625, 1.5030517578125, 1.619140625, 1.7352294921875, 1.851318359375, 1.9674072265625, 2.08349609375, 2.1995849609375, 2.315673828125, 2.4317626953125, 2.5478515625, 2.6639404296875, 2.780029296875, 2.8961181640625, 3.01220703125, 3.1282958984375, 3.244384765625, 3.3604736328125, 3.4765625]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 6.0, 8.0, 15.0, 20.0, 21.0, 38.0, 41.0, 69.0, 111.0, 146.0, 208.0, 319.0, 526.0, 773.0, 1291.0, 2082.0, 3366.0, 5666.0, 9546.0, 15725.0, 25772.0, 41537.0, 65045.0, 104088.0, 169823.0, 219493.0, 145258.0, 89865.0, 56550.0, 35138.0, 21961.0, 13329.0, 8061.0, 4790.0, 2906.0, 1825.0, 1113.0, 693.0, 437.0, 286.0, 206.0, 122.0, 92.0, 61.0, 45.0, 23.0, 16.0, 12.0, 5.0, 5.0, 7.0, 6.0, 5.0, 1.0, 0.0, 3.0], "bins": [-9.3359375, -9.055908203125, -8.77587890625, -8.495849609375, -8.2158203125, -7.935791015625, -7.65576171875, -7.375732421875, -7.095703125, -6.815673828125, -6.53564453125, -6.255615234375, -5.9755859375, -5.695556640625, -5.41552734375, -5.135498046875, -4.85546875, -4.575439453125, -4.29541015625, -4.015380859375, -3.7353515625, -3.455322265625, -3.17529296875, -2.895263671875, -2.615234375, -2.335205078125, -2.05517578125, -1.775146484375, -1.4951171875, -1.215087890625, -0.93505859375, -0.655029296875, -0.375, -0.094970703125, 0.18505859375, 0.465087890625, 0.7451171875, 1.025146484375, 1.30517578125, 1.585205078125, 1.865234375, 2.145263671875, 2.42529296875, 2.705322265625, 2.9853515625, 3.265380859375, 3.54541015625, 3.825439453125, 4.10546875, 4.385498046875, 4.66552734375, 4.945556640625, 5.2255859375, 5.505615234375, 5.78564453125, 6.065673828125, 6.345703125, 6.625732421875, 6.90576171875, 7.185791015625, 7.4658203125, 7.745849609375, 8.02587890625, 8.305908203125, 8.5859375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 5.0, 8.0, 9.0, 13.0, 10.0, 8.0, 16.0, 9.0, 17.0, 24.0, 27.0, 24.0, 30.0, 38.0, 34.0, 38.0, 46.0, 40.0, 44.0, 43.0, 1075.0, 33.0, 41.0, 37.0, 47.0, 40.0, 39.0, 32.0, 28.0, 25.0, 24.0, 23.0, 13.0, 11.0, 16.0, 13.0, 10.0, 13.0, 8.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.623046875, -2.5245361328125, -2.426025390625, -2.3275146484375, -2.22900390625, -2.1304931640625, -2.031982421875, -1.9334716796875, -1.8349609375, -1.7364501953125, -1.637939453125, -1.5394287109375, -1.44091796875, -1.3424072265625, -1.243896484375, -1.1453857421875, -1.046875, -0.9483642578125, -0.849853515625, -0.7513427734375, -0.65283203125, -0.5543212890625, -0.455810546875, -0.3572998046875, -0.2587890625, -0.1602783203125, -0.061767578125, 0.0367431640625, 0.13525390625, 0.2337646484375, 0.332275390625, 0.4307861328125, 0.529296875, 0.6278076171875, 0.726318359375, 0.8248291015625, 0.92333984375, 1.0218505859375, 1.120361328125, 1.2188720703125, 1.3173828125, 1.4158935546875, 1.514404296875, 1.6129150390625, 1.71142578125, 1.8099365234375, 1.908447265625, 2.0069580078125, 2.10546875, 2.2039794921875, 2.302490234375, 2.4010009765625, 2.49951171875, 2.5980224609375, 2.696533203125, 2.7950439453125, 2.8935546875, 2.9920654296875, 3.090576171875, 3.1890869140625, 3.28759765625, 3.3861083984375, 3.484619140625, 3.5831298828125, 3.681640625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 9.0, 7.0, 13.0, 16.0, 26.0, 17.0, 37.0, 63.0, 69.0, 104.0, 144.0, 201.0, 251.0, 346.0, 547.0, 753.0, 1129.0, 1611.0, 2743.0, 4512.0, 7892.0, 15337.0, 32071.0, 77002.0, 215629.0, 938883.0, 533972.0, 151432.0, 57281.0, 25125.0, 12391.0, 6513.0, 3837.0, 2242.0, 1537.0, 971.0, 678.0, 477.0, 391.0, 248.0, 178.0, 142.0, 88.0, 65.0, 47.0, 27.0, 27.0, 18.0, 17.0, 11.0, 6.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5625, -9.25244140625, -8.9423828125, -8.63232421875, -8.322265625, -8.01220703125, -7.7021484375, -7.39208984375, -7.08203125, -6.77197265625, -6.4619140625, -6.15185546875, -5.841796875, -5.53173828125, -5.2216796875, -4.91162109375, -4.6015625, -4.29150390625, -3.9814453125, -3.67138671875, -3.361328125, -3.05126953125, -2.7412109375, -2.43115234375, -2.12109375, -1.81103515625, -1.5009765625, -1.19091796875, -0.880859375, -0.57080078125, -0.2607421875, 0.04931640625, 0.359375, 0.66943359375, 0.9794921875, 1.28955078125, 1.599609375, 1.90966796875, 2.2197265625, 2.52978515625, 2.83984375, 3.14990234375, 3.4599609375, 3.77001953125, 4.080078125, 4.39013671875, 4.7001953125, 5.01025390625, 5.3203125, 5.63037109375, 5.9404296875, 6.25048828125, 6.560546875, 6.87060546875, 7.1806640625, 7.49072265625, 7.80078125, 8.11083984375, 8.4208984375, 8.73095703125, 9.041015625, 9.35107421875, 9.6611328125, 9.97119140625, 10.28125]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 7.0, 6.0, 8.0, 6.0, 11.0, 16.0, 23.0, 20.0, 23.0, 46.0, 48.0, 61.0, 85.0, 221.0, 104.0, 69.0, 46.0, 25.0, 32.0, 15.0, 17.0, 15.0, 9.0, 11.0, 15.0, 18.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0], "bins": [-6.5390625, -6.378692626953125, -6.21832275390625, -6.057952880859375, -5.8975830078125, -5.737213134765625, -5.57684326171875, -5.416473388671875, -5.256103515625, -5.095733642578125, -4.93536376953125, -4.774993896484375, -4.6146240234375, -4.454254150390625, -4.29388427734375, -4.133514404296875, -3.97314453125, -3.812774658203125, -3.65240478515625, -3.492034912109375, -3.3316650390625, -3.171295166015625, -3.01092529296875, -2.850555419921875, -2.690185546875, -2.529815673828125, -2.36944580078125, -2.209075927734375, -2.0487060546875, -1.888336181640625, -1.72796630859375, -1.567596435546875, -1.4072265625, -1.246856689453125, -1.08648681640625, -0.926116943359375, -0.7657470703125, -0.605377197265625, -0.44500732421875, -0.284637451171875, -0.124267578125, 0.036102294921875, 0.19647216796875, 0.356842041015625, 0.5172119140625, 0.677581787109375, 0.83795166015625, 0.998321533203125, 1.15869140625, 1.319061279296875, 1.47943115234375, 1.639801025390625, 1.8001708984375, 1.960540771484375, 2.12091064453125, 2.281280517578125, 2.441650390625, 2.602020263671875, 2.76239013671875, 2.922760009765625, 3.0831298828125, 3.243499755859375, 3.40386962890625, 3.564239501953125, 3.724609375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 10.0, 10.0, 4.0, 12.0, 12.0, 21.0, 28.0, 43.0, 40.0, 76.0, 90.0, 156.0, 325.0, 982.0, 5901.0, 94035.0, 921894.0, 21198.0, 2509.0, 543.0, 244.0, 108.0, 88.0, 62.0, 42.0, 29.0, 16.0, 21.0, 12.0, 12.0, 11.0, 3.0, 4.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.3125, -62.91796875, -60.5234375, -58.12890625, -55.734375, -53.33984375, -50.9453125, -48.55078125, -46.15625, -43.76171875, -41.3671875, -38.97265625, -36.578125, -34.18359375, -31.7890625, -29.39453125, -27.0, -24.60546875, -22.2109375, -19.81640625, -17.421875, -15.02734375, -12.6328125, -10.23828125, -7.84375, -5.44921875, -3.0546875, -0.66015625, 1.734375, 4.12890625, 6.5234375, 8.91796875, 11.3125, 13.70703125, 16.1015625, 18.49609375, 20.890625, 23.28515625, 25.6796875, 28.07421875, 30.46875, 32.86328125, 35.2578125, 37.65234375, 40.046875, 42.44140625, 44.8359375, 47.23046875, 49.625, 52.01953125, 54.4140625, 56.80859375, 59.203125, 61.59765625, 63.9921875, 66.38671875, 68.78125, 71.17578125, 73.5703125, 75.96484375, 78.359375, 80.75390625, 83.1484375, 85.54296875, 87.9375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 9.0, 20.0, 21.0, 25.0, 37.0, 55.0, 70.0, 83.0, 125.0, 113.0, 121.0, 101.0, 54.0, 55.0, 27.0, 32.0, 19.0, 15.0, 6.0, 9.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.981024742126465, -10.652749061584473, -10.324474334716797, -9.996198654174805, -9.667922973632812, -9.33964729309082, -9.011372566223145, -8.683096885681152, -8.354822158813477, -8.026546478271484, -7.69827127456665, -7.369996070861816, -7.041720390319824, -6.71344518661499, -6.385169982910156, -6.056894302368164, -5.728618621826172, -5.400343418121338, -5.072067737579346, -4.743792533874512, -4.4155168533325195, -4.0872416496276855, -3.7589664459228516, -3.4306910037994385, -3.1024155616760254, -2.7741401195526123, -2.445864677429199, -2.1175894737243652, -1.7893140316009521, -1.461038589477539, -1.1327632665634155, -0.804487943649292, -0.4762115478515625, -0.1479361653327942, 0.18033921718597412, 0.5086145997047424, 0.8368899822235107, 1.1651654243469238, 1.4934407472610474, 1.821716070175171, 2.149991512298584, 2.478266954421997, 2.80654239654541, 3.134817600250244, 3.4630930423736572, 3.7913684844970703, 4.119643688201904, 4.447918891906738, 4.7761945724487305, 5.1044697761535645, 5.432745456695557, 5.761020660400391, 6.089296340942383, 6.417571544647217, 6.745846748352051, 7.074122428894043, 7.402397632598877, 7.730672836303711, 8.058948516845703, 8.387224197387695, 8.715498924255371, 9.043774604797363, 9.372050285339355, 9.700325012207031, 10.028600692749023]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 5.0, 4.0, 5.0, 8.0, 8.0, 5.0, 10.0, 14.0, 21.0, 26.0, 29.0, 24.0, 18.0, 22.0, 42.0, 35.0, 39.0, 40.0, 38.0, 31.0, 42.0, 49.0, 38.0, 34.0, 37.0, 37.0, 41.0, 34.0, 31.0, 33.0, 24.0, 23.0, 25.0, 20.0, 15.0, 22.0, 11.0, 18.0, 5.0, 5.0, 7.0, 3.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.468539714813232, -5.301634788513184, -5.134730339050293, -4.967825412750244, -4.800920486450195, -4.6340155601501465, -4.467110633850098, -4.300206184387207, -4.133301258087158, -3.9663963317871094, -3.7994916439056396, -3.63258695602417, -3.465682029724121, -3.2987771034240723, -3.1318724155426025, -2.964967727661133, -2.798062801361084, -2.631157875061035, -2.4642531871795654, -2.2973484992980957, -2.130443572998047, -1.9635387659072876, -1.7966339588165283, -1.629729151725769, -1.4628243446350098, -1.2959195375442505, -1.1290147304534912, -0.9621099233627319, -0.7952051162719727, -0.6283003091812134, -0.4613955020904541, -0.2944906949996948, -0.12758636474609375, 0.03931844234466553, 0.2062232494354248, 0.3731280565261841, 0.5400328636169434, 0.7069376707077026, 0.8738424777984619, 1.0407472848892212, 1.2076520919799805, 1.3745568990707397, 1.541461706161499, 1.7083665132522583, 1.8752713203430176, 2.0421762466430664, 2.209080934524536, 2.375985622406006, 2.5428905487060547, 2.7097954750061035, 2.8767001628875732, 3.043604850769043, 3.210509777069092, 3.3774147033691406, 3.5443193912506104, 3.71122407913208, 3.878129005432129, 4.045033931732178, 4.211938858032227, 4.378843307495117, 4.545748233795166, 4.712653160095215, 4.8795576095581055, 5.046462535858154, 5.213367462158203]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 6.0, 7.0, 8.0, 6.0, 7.0, 11.0, 10.0, 12.0, 19.0, 16.0, 17.0, 25.0, 24.0, 26.0, 30.0, 25.0, 26.0, 48.0, 42.0, 27.0, 31.0, 41.0, 50.0, 38.0, 44.0, 36.0, 40.0, 31.0, 34.0, 28.0, 32.0, 30.0, 32.0, 28.0, 17.0, 18.0, 20.0, 13.0, 6.0, 16.0, 8.0, 4.0, 4.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.943359375, -3.828948974609375, -3.71453857421875, -3.600128173828125, -3.4857177734375, -3.371307373046875, -3.25689697265625, -3.142486572265625, -3.028076171875, -2.913665771484375, -2.79925537109375, -2.684844970703125, -2.5704345703125, -2.456024169921875, -2.34161376953125, -2.227203369140625, -2.11279296875, -1.998382568359375, -1.88397216796875, -1.769561767578125, -1.6551513671875, -1.540740966796875, -1.42633056640625, -1.311920166015625, -1.197509765625, -1.083099365234375, -0.96868896484375, -0.854278564453125, -0.7398681640625, -0.625457763671875, -0.51104736328125, -0.396636962890625, -0.2822265625, -0.167816162109375, -0.05340576171875, 0.061004638671875, 0.1754150390625, 0.289825439453125, 0.40423583984375, 0.518646240234375, 0.633056640625, 0.747467041015625, 0.86187744140625, 0.976287841796875, 1.0906982421875, 1.205108642578125, 1.31951904296875, 1.433929443359375, 1.54833984375, 1.662750244140625, 1.77716064453125, 1.891571044921875, 2.0059814453125, 2.120391845703125, 2.23480224609375, 2.349212646484375, 2.463623046875, 2.578033447265625, 2.69244384765625, 2.806854248046875, 2.9212646484375, 3.035675048828125, 3.15008544921875, 3.264495849609375, 3.37890625]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 11.0, 9.0, 10.0, 14.0, 19.0, 22.0, 37.0, 45.0, 69.0, 84.0, 126.0, 186.0, 300.0, 416.0, 751.0, 1411.0, 2468.0, 4689.0, 9784.0, 22494.0, 55689.0, 142611.0, 307882.0, 285925.0, 125237.0, 49132.0, 20365.0, 8935.0, 4316.0, 2229.0, 1274.0, 700.0, 457.0, 267.0, 159.0, 123.0, 85.0, 56.0, 46.0, 31.0, 29.0, 11.0, 15.0, 9.0, 14.0, 6.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-4.69921875, -4.564697265625, -4.43017578125, -4.295654296875, -4.1611328125, -4.026611328125, -3.89208984375, -3.757568359375, -3.623046875, -3.488525390625, -3.35400390625, -3.219482421875, -3.0849609375, -2.950439453125, -2.81591796875, -2.681396484375, -2.546875, -2.412353515625, -2.27783203125, -2.143310546875, -2.0087890625, -1.874267578125, -1.73974609375, -1.605224609375, -1.470703125, -1.336181640625, -1.20166015625, -1.067138671875, -0.9326171875, -0.798095703125, -0.66357421875, -0.529052734375, -0.39453125, -0.260009765625, -0.12548828125, 0.009033203125, 0.1435546875, 0.278076171875, 0.41259765625, 0.547119140625, 0.681640625, 0.816162109375, 0.95068359375, 1.085205078125, 1.2197265625, 1.354248046875, 1.48876953125, 1.623291015625, 1.7578125, 1.892333984375, 2.02685546875, 2.161376953125, 2.2958984375, 2.430419921875, 2.56494140625, 2.699462890625, 2.833984375, 2.968505859375, 3.10302734375, 3.237548828125, 3.3720703125, 3.506591796875, 3.64111328125, 3.775634765625, 3.91015625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 8.0, 11.0, 4.0, 12.0, 10.0, 8.0, 19.0, 17.0, 25.0, 28.0, 31.0, 28.0, 34.0, 43.0, 44.0, 57.0, 73.0, 120.0, 307.0, 1483.0, 200.0, 87.0, 58.0, 41.0, 34.0, 38.0, 24.0, 21.0, 23.0, 24.0, 17.0, 20.0, 19.0, 12.0, 9.0, 12.0, 6.0, 10.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.71875, -13.2926025390625, -12.866455078125, -12.4403076171875, -12.01416015625, -11.5880126953125, -11.161865234375, -10.7357177734375, -10.3095703125, -9.8834228515625, -9.457275390625, -9.0311279296875, -8.60498046875, -8.1788330078125, -7.752685546875, -7.3265380859375, -6.900390625, -6.4742431640625, -6.048095703125, -5.6219482421875, -5.19580078125, -4.7696533203125, -4.343505859375, -3.9173583984375, -3.4912109375, -3.0650634765625, -2.638916015625, -2.2127685546875, -1.78662109375, -1.3604736328125, -0.934326171875, -0.5081787109375, -0.08203125, 0.3441162109375, 0.770263671875, 1.1964111328125, 1.62255859375, 2.0487060546875, 2.474853515625, 2.9010009765625, 3.3271484375, 3.7532958984375, 4.179443359375, 4.6055908203125, 5.03173828125, 5.4578857421875, 5.884033203125, 6.3101806640625, 6.736328125, 7.1624755859375, 7.588623046875, 8.0147705078125, 8.44091796875, 8.8670654296875, 9.293212890625, 9.7193603515625, 10.1455078125, 10.5716552734375, 10.997802734375, 11.4239501953125, 11.85009765625, 12.2762451171875, 12.702392578125, 13.1285400390625, 13.5546875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 6.0, 12.0, 7.0, 13.0, 9.0, 21.0, 24.0, 33.0, 40.0, 41.0, 77.0, 132.0, 201.0, 409.0, 950.0, 2473.0, 9891.0, 81855.0, 2032418.0, 963017.0, 43680.0, 6698.0, 1954.0, 798.0, 333.0, 182.0, 124.0, 82.0, 48.0, 27.0, 28.0, 28.0, 16.0, 14.0, 9.0, 6.0, 6.0, 3.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-15.15625, -14.6807861328125, -14.205322265625, -13.7298583984375, -13.25439453125, -12.7789306640625, -12.303466796875, -11.8280029296875, -11.3525390625, -10.8770751953125, -10.401611328125, -9.9261474609375, -9.45068359375, -8.9752197265625, -8.499755859375, -8.0242919921875, -7.548828125, -7.0733642578125, -6.597900390625, -6.1224365234375, -5.64697265625, -5.1715087890625, -4.696044921875, -4.2205810546875, -3.7451171875, -3.2696533203125, -2.794189453125, -2.3187255859375, -1.84326171875, -1.3677978515625, -0.892333984375, -0.4168701171875, 0.05859375, 0.5340576171875, 1.009521484375, 1.4849853515625, 1.96044921875, 2.4359130859375, 2.911376953125, 3.3868408203125, 3.8623046875, 4.3377685546875, 4.813232421875, 5.2886962890625, 5.76416015625, 6.2396240234375, 6.715087890625, 7.1905517578125, 7.666015625, 8.1414794921875, 8.616943359375, 9.0924072265625, 9.56787109375, 10.0433349609375, 10.518798828125, 10.9942626953125, 11.4697265625, 11.9451904296875, 12.420654296875, 12.8961181640625, 13.37158203125, 13.8470458984375, 14.322509765625, 14.7979736328125, 15.2734375]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 40.0, 92.0, 199.0, 270.0, 229.0, 116.0, 43.0, 14.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.08335494995117, -31.391977310180664, -29.700599670410156, -28.009220123291016, -26.317842483520508, -24.62646484375, -22.93508529663086, -21.24370765686035, -19.552330017089844, -17.860952377319336, -16.169574737548828, -14.478195190429688, -12.78681755065918, -11.095439910888672, -9.404061317443848, -7.712682723999023, -6.021305084228516, -4.32992696762085, -2.6385488510131836, -0.9471707344055176, 0.7442073822021484, 2.4355850219726562, 4.1269636154174805, 5.818342208862305, 7.5097198486328125, 9.20109748840332, 10.892476081848145, 12.583854675292969, 14.275232315063477, 15.966609954833984, 17.657989501953125, 19.349367141723633, 21.040748596191406, 22.732126235961914, 24.423503875732422, 26.114883422851562, 27.80626106262207, 29.497638702392578, 31.18901824951172, 32.880393981933594, 34.571773529052734, 36.263153076171875, 37.95452880859375, 39.64590835571289, 41.33728790283203, 43.028663635253906, 44.72004318237305, 46.41142272949219, 48.10279846191406, 49.7941780090332, 51.48555374145508, 53.17693328857422, 54.868309020996094, 56.559688568115234, 58.251068115234375, 59.94244384765625, 61.63382339477539, 63.32520294189453, 65.0165786743164, 66.70795440673828, 68.39933776855469, 70.09071350097656, 71.78208923339844, 73.47347259521484, 75.16484832763672]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 10.0, 10.0, 8.0, 9.0, 11.0, 13.0, 26.0, 25.0, 27.0, 32.0, 28.0, 49.0, 40.0, 47.0, 48.0, 68.0, 44.0, 39.0, 46.0, 45.0, 44.0, 43.0, 47.0, 39.0, 23.0, 32.0, 24.0, 21.0, 18.0, 16.0, 18.0, 16.0, 7.0, 6.0, 3.0, 8.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.467437744140625, -44.91783142089844, -43.36822509765625, -41.81861877441406, -40.269012451171875, -38.71940612792969, -37.1697998046875, -35.62019348144531, -34.070587158203125, -32.52098083496094, -30.97137451171875, -29.421768188476562, -27.872161865234375, -26.322555541992188, -24.77294921875, -23.223342895507812, -21.673738479614258, -20.12413215637207, -18.574525833129883, -17.024919509887695, -15.475313186645508, -13.92570686340332, -12.37610149383545, -10.826495170593262, -9.276888847351074, -7.727282524108887, -6.177676200866699, -4.62807035446167, -3.0784640312194824, -1.528857707977295, 0.020748138427734375, 1.5703544616699219, 3.1199607849121094, 4.669567108154297, 6.219173431396484, 7.768779277801514, 9.31838607788086, 10.867992401123047, 12.417597770690918, 13.967204093933105, 15.516810417175293, 17.066415786743164, 18.61602210998535, 20.16562843322754, 21.715234756469727, 23.264841079711914, 24.8144474029541, 26.36405372619629, 27.913660049438477, 29.463266372680664, 31.01287269592285, 32.562477111816406, 34.112083435058594, 35.66168975830078, 37.21129608154297, 38.760902404785156, 40.310508728027344, 41.86011505126953, 43.40972137451172, 44.959327697753906, 46.508934020996094, 48.05854034423828, 49.60814666748047, 51.157752990722656, 52.707359313964844]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 10.0, 13.0, 5.0, 9.0, 18.0, 22.0, 39.0, 15.0, 30.0, 27.0, 32.0, 26.0, 47.0, 44.0, 50.0, 33.0, 50.0, 42.0, 29.0, 53.0, 32.0, 45.0, 34.0, 30.0, 41.0, 35.0, 34.0, 27.0, 23.0, 17.0, 14.0, 10.0, 11.0, 10.0, 6.0, 10.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.359375, -4.232208251953125, -4.10504150390625, -3.977874755859375, -3.8507080078125, -3.723541259765625, -3.59637451171875, -3.469207763671875, -3.342041015625, -3.214874267578125, -3.08770751953125, -2.960540771484375, -2.8333740234375, -2.706207275390625, -2.57904052734375, -2.451873779296875, -2.32470703125, -2.197540283203125, -2.07037353515625, -1.943206787109375, -1.8160400390625, -1.688873291015625, -1.56170654296875, -1.434539794921875, -1.307373046875, -1.180206298828125, -1.05303955078125, -0.925872802734375, -0.7987060546875, -0.671539306640625, -0.54437255859375, -0.417205810546875, -0.2900390625, -0.162872314453125, -0.03570556640625, 0.091461181640625, 0.2186279296875, 0.345794677734375, 0.47296142578125, 0.600128173828125, 0.727294921875, 0.854461669921875, 0.98162841796875, 1.108795166015625, 1.2359619140625, 1.363128662109375, 1.49029541015625, 1.617462158203125, 1.74462890625, 1.871795654296875, 1.99896240234375, 2.126129150390625, 2.2532958984375, 2.380462646484375, 2.50762939453125, 2.634796142578125, 2.761962890625, 2.889129638671875, 3.01629638671875, 3.143463134765625, 3.2706298828125, 3.397796630859375, 3.52496337890625, 3.652130126953125, 3.779296875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 5.0, 22.0, 14.0, 26.0, 30.0, 37.0, 66.0, 76.0, 148.0, 188.0, 262.0, 427.0, 624.0, 1007.0, 1610.0, 2672.0, 4675.0, 9346.0, 22064.0, 63770.0, 288982.0, 2196375.0, 1339642.0, 178909.0, 47146.0, 18001.0, 7981.0, 4174.0, 2316.0, 1349.0, 822.0, 511.0, 344.0, 243.0, 121.0, 88.0, 69.0, 36.0, 35.0, 14.0, 18.0, 11.0, 8.0, 5.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.6640625, -11.3294677734375, -10.994873046875, -10.6602783203125, -10.32568359375, -9.9910888671875, -9.656494140625, -9.3218994140625, -8.9873046875, -8.6527099609375, -8.318115234375, -7.9835205078125, -7.64892578125, -7.3143310546875, -6.979736328125, -6.6451416015625, -6.310546875, -5.9759521484375, -5.641357421875, -5.3067626953125, -4.97216796875, -4.6375732421875, -4.302978515625, -3.9683837890625, -3.6337890625, -3.2991943359375, -2.964599609375, -2.6300048828125, -2.29541015625, -1.9608154296875, -1.626220703125, -1.2916259765625, -0.95703125, -0.6224365234375, -0.287841796875, 0.0467529296875, 0.38134765625, 0.7159423828125, 1.050537109375, 1.3851318359375, 1.7197265625, 2.0543212890625, 2.388916015625, 2.7235107421875, 3.05810546875, 3.3927001953125, 3.727294921875, 4.0618896484375, 4.396484375, 4.7310791015625, 5.065673828125, 5.4002685546875, 5.73486328125, 6.0694580078125, 6.404052734375, 6.7386474609375, 7.0732421875, 7.4078369140625, 7.742431640625, 8.0770263671875, 8.41162109375, 8.7462158203125, 9.080810546875, 9.4154052734375, 9.75]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 7.0, 10.0, 9.0, 11.0, 13.0, 21.0, 32.0, 46.0, 69.0, 88.0, 141.0, 203.0, 371.0, 521.0, 636.0, 572.0, 458.0, 290.0, 183.0, 105.0, 87.0, 68.0, 45.0, 26.0, 20.0, 6.0, 11.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.6875, -15.2608642578125, -14.834228515625, -14.4075927734375, -13.98095703125, -13.5543212890625, -13.127685546875, -12.7010498046875, -12.2744140625, -11.8477783203125, -11.421142578125, -10.9945068359375, -10.56787109375, -10.1412353515625, -9.714599609375, -9.2879638671875, -8.861328125, -8.4346923828125, -8.008056640625, -7.5814208984375, -7.15478515625, -6.7281494140625, -6.301513671875, -5.8748779296875, -5.4482421875, -5.0216064453125, -4.594970703125, -4.1683349609375, -3.74169921875, -3.3150634765625, -2.888427734375, -2.4617919921875, -2.03515625, -1.6085205078125, -1.181884765625, -0.7552490234375, -0.32861328125, 0.0980224609375, 0.524658203125, 0.9512939453125, 1.3779296875, 1.8045654296875, 2.231201171875, 2.6578369140625, 3.08447265625, 3.5111083984375, 3.937744140625, 4.3643798828125, 4.791015625, 5.2176513671875, 5.644287109375, 6.0709228515625, 6.49755859375, 6.9241943359375, 7.350830078125, 7.7774658203125, 8.2041015625, 8.6307373046875, 9.057373046875, 9.4840087890625, 9.91064453125, 10.3372802734375, 10.763916015625, 11.1905517578125, 11.6171875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 14.0, 19.0, 13.0, 18.0, 30.0, 52.0, 81.0, 120.0, 190.0, 285.0, 412.0, 727.0, 982.0, 1621.0, 2806.0, 4897.0, 9485.0, 19365.0, 46731.0, 149836.0, 738254.0, 2382267.0, 622679.0, 132222.0, 42711.0, 17913.0, 8879.0, 4640.0, 2646.0, 1651.0, 975.0, 588.0, 369.0, 249.0, 169.0, 97.0, 92.0, 54.0, 37.0, 22.0, 25.0, 22.0, 15.0, 5.0, 5.0, 1.0, 4.0, 4.0, 1.0], "bins": [-18.515625, -18.0076904296875, -17.499755859375, -16.9918212890625, -16.48388671875, -15.9759521484375, -15.468017578125, -14.9600830078125, -14.4521484375, -13.9442138671875, -13.436279296875, -12.9283447265625, -12.42041015625, -11.9124755859375, -11.404541015625, -10.8966064453125, -10.388671875, -9.8807373046875, -9.372802734375, -8.8648681640625, -8.35693359375, -7.8489990234375, -7.341064453125, -6.8331298828125, -6.3251953125, -5.8172607421875, -5.309326171875, -4.8013916015625, -4.29345703125, -3.7855224609375, -3.277587890625, -2.7696533203125, -2.26171875, -1.7537841796875, -1.245849609375, -0.7379150390625, -0.22998046875, 0.2779541015625, 0.785888671875, 1.2938232421875, 1.8017578125, 2.3096923828125, 2.817626953125, 3.3255615234375, 3.83349609375, 4.3414306640625, 4.849365234375, 5.3572998046875, 5.865234375, 6.3731689453125, 6.881103515625, 7.3890380859375, 7.89697265625, 8.4049072265625, 8.912841796875, 9.4207763671875, 9.9287109375, 10.4366455078125, 10.944580078125, 11.4525146484375, 11.96044921875, 12.4683837890625, 12.976318359375, 13.4842529296875, 13.9921875]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 9.0, 12.0, 38.0, 49.0, 81.0, 143.0, 180.0, 171.0, 126.0, 91.0, 57.0, 23.0, 18.0, 5.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.41480255126953, -58.01824951171875, -54.621700286865234, -51.22515106201172, -47.82859802246094, -44.432044982910156, -41.03549575805664, -37.638946533203125, -34.242393493652344, -30.845842361450195, -27.449291229248047, -24.0527400970459, -20.65618896484375, -17.2596378326416, -13.863086700439453, -10.466535568237305, -7.069984436035156, -3.673433303833008, -0.2768821716308594, 3.119668960571289, 6.5162200927734375, 9.912771224975586, 13.309322357177734, 16.705873489379883, 20.10242462158203, 23.49897575378418, 26.895526885986328, 30.292078018188477, 33.688629150390625, 37.085182189941406, 40.48173141479492, 43.87828063964844, 47.27482604980469, 50.67137908935547, 54.067928314208984, 57.4644775390625, 60.86103057861328, 64.25758361816406, 67.65412902832031, 71.0506820678711, 74.44723510742188, 77.84378814697266, 81.24034118652344, 84.63688659667969, 88.03343963623047, 91.42999267578125, 94.8265380859375, 98.22309112548828, 101.61964416503906, 105.01619720458984, 108.41275024414062, 111.80929565429688, 115.20584869384766, 118.60240173339844, 121.99894714355469, 125.39550018310547, 128.79205322265625, 132.1885986328125, 135.5851593017578, 138.98170471191406, 142.37826538085938, 145.77481079101562, 149.17135620117188, 152.5679168701172, 155.96446228027344]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 7.0, 9.0, 8.0, 7.0, 18.0, 14.0, 18.0, 17.0, 18.0, 19.0, 25.0, 34.0, 30.0, 28.0, 40.0, 43.0, 34.0, 39.0, 49.0, 49.0, 39.0, 35.0, 33.0, 40.0, 34.0, 40.0, 44.0, 34.0, 28.0, 25.0, 16.0, 15.0, 25.0, 10.0, 18.0, 11.0, 8.0, 7.0, 6.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.170333862304688, -27.089126586914062, -26.007919311523438, -24.926713943481445, -23.84550666809082, -22.764299392700195, -21.683094024658203, -20.601886749267578, -19.520679473876953, -18.439472198486328, -17.358264923095703, -16.27705955505371, -15.195852279663086, -14.114645004272461, -13.033438682556152, -11.952232360839844, -10.871025085449219, -9.789817810058594, -8.708611488342285, -7.627404689788818, -6.546197891235352, -5.464991092681885, -4.383784294128418, -3.302577495574951, -2.2213706970214844, -1.1401638984680176, -0.05895709991455078, 1.022249698638916, 2.103456497192383, 3.1846632957458496, 4.265870094299316, 5.347076892852783, 6.42828369140625, 7.509490489959717, 8.590697288513184, 9.671903610229492, 10.753110885620117, 11.834318161010742, 12.91552448272705, 13.99673080444336, 15.077938079833984, 16.15914535522461, 17.240352630615234, 18.321557998657227, 19.40276527404785, 20.483972549438477, 21.56517791748047, 22.646385192871094, 23.72759246826172, 24.808799743652344, 25.89000701904297, 26.97121238708496, 28.052419662475586, 29.13362693786621, 30.214832305908203, 31.296039581298828, 32.37724685668945, 33.45845413208008, 34.5396614074707, 35.62086868286133, 36.70207214355469, 37.78327941894531, 38.86448669433594, 39.94569396972656, 41.02690124511719]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 12.0, 10.0, 3.0, 10.0, 10.0, 8.0, 11.0, 18.0, 18.0, 26.0, 26.0, 27.0, 29.0, 24.0, 38.0, 37.0, 33.0, 40.0, 52.0, 42.0, 43.0, 40.0, 47.0, 40.0, 48.0, 47.0, 35.0, 35.0, 20.0, 34.0, 25.0, 18.0, 20.0, 17.0, 9.0, 14.0, 6.0, 5.0, 5.0, 2.0, 6.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.28125, -4.152557373046875, -4.02386474609375, -3.895172119140625, -3.7664794921875, -3.637786865234375, -3.50909423828125, -3.380401611328125, -3.251708984375, -3.123016357421875, -2.99432373046875, -2.865631103515625, -2.7369384765625, -2.608245849609375, -2.47955322265625, -2.350860595703125, -2.22216796875, -2.093475341796875, -1.96478271484375, -1.836090087890625, -1.7073974609375, -1.578704833984375, -1.45001220703125, -1.321319580078125, -1.192626953125, -1.063934326171875, -0.93524169921875, -0.806549072265625, -0.6778564453125, -0.549163818359375, -0.42047119140625, -0.291778564453125, -0.1630859375, -0.034393310546875, 0.09429931640625, 0.222991943359375, 0.3516845703125, 0.480377197265625, 0.60906982421875, 0.737762451171875, 0.866455078125, 0.995147705078125, 1.12384033203125, 1.252532958984375, 1.3812255859375, 1.509918212890625, 1.63861083984375, 1.767303466796875, 1.89599609375, 2.024688720703125, 2.15338134765625, 2.282073974609375, 2.4107666015625, 2.539459228515625, 2.66815185546875, 2.796844482421875, 2.925537109375, 3.054229736328125, 3.18292236328125, 3.311614990234375, 3.4403076171875, 3.569000244140625, 3.69769287109375, 3.826385498046875, 3.955078125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 10.0, 10.0, 9.0, 16.0, 31.0, 63.0, 72.0, 115.0, 184.0, 256.0, 401.0, 672.0, 943.0, 1511.0, 2351.0, 3862.0, 5807.0, 9109.0, 14055.0, 21909.0, 33480.0, 51621.0, 77160.0, 109613.0, 140198.0, 151736.0, 131284.0, 98027.0, 67431.0, 44816.0, 29024.0, 18782.0, 12158.0, 7891.0, 5001.0, 3218.0, 2043.0, 1274.0, 881.0, 586.0, 326.0, 231.0, 126.0, 96.0, 59.0, 38.0, 26.0, 18.0, 11.0, 11.0, 5.0, 5.0, 2.0], "bins": [-7.8671875, -7.650634765625, -7.43408203125, -7.217529296875, -7.0009765625, -6.784423828125, -6.56787109375, -6.351318359375, -6.134765625, -5.918212890625, -5.70166015625, -5.485107421875, -5.2685546875, -5.052001953125, -4.83544921875, -4.618896484375, -4.40234375, -4.185791015625, -3.96923828125, -3.752685546875, -3.5361328125, -3.319580078125, -3.10302734375, -2.886474609375, -2.669921875, -2.453369140625, -2.23681640625, -2.020263671875, -1.8037109375, -1.587158203125, -1.37060546875, -1.154052734375, -0.9375, -0.720947265625, -0.50439453125, -0.287841796875, -0.0712890625, 0.145263671875, 0.36181640625, 0.578369140625, 0.794921875, 1.011474609375, 1.22802734375, 1.444580078125, 1.6611328125, 1.877685546875, 2.09423828125, 2.310791015625, 2.52734375, 2.743896484375, 2.96044921875, 3.177001953125, 3.3935546875, 3.610107421875, 3.82666015625, 4.043212890625, 4.259765625, 4.476318359375, 4.69287109375, 4.909423828125, 5.1259765625, 5.342529296875, 5.55908203125, 5.775634765625, 5.9921875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 3.0, 3.0, 5.0, 2.0, 5.0, 3.0, 4.0, 9.0, 10.0, 10.0, 10.0, 16.0, 16.0, 24.0, 26.0, 26.0, 27.0, 35.0, 26.0, 35.0, 33.0, 42.0, 41.0, 41.0, 39.0, 1065.0, 41.0, 34.0, 39.0, 37.0, 36.0, 26.0, 25.0, 20.0, 30.0, 22.0, 20.0, 26.0, 20.0, 18.0, 9.0, 12.0, 12.0, 7.0, 6.0, 7.0, 8.0, 6.0, 2.0, 2.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.794921875, -2.6973876953125, -2.599853515625, -2.5023193359375, -2.40478515625, -2.3072509765625, -2.209716796875, -2.1121826171875, -2.0146484375, -1.9171142578125, -1.819580078125, -1.7220458984375, -1.62451171875, -1.5269775390625, -1.429443359375, -1.3319091796875, -1.234375, -1.1368408203125, -1.039306640625, -0.9417724609375, -0.84423828125, -0.7467041015625, -0.649169921875, -0.5516357421875, -0.4541015625, -0.3565673828125, -0.259033203125, -0.1614990234375, -0.06396484375, 0.0335693359375, 0.131103515625, 0.2286376953125, 0.326171875, 0.4237060546875, 0.521240234375, 0.6187744140625, 0.71630859375, 0.8138427734375, 0.911376953125, 1.0089111328125, 1.1064453125, 1.2039794921875, 1.301513671875, 1.3990478515625, 1.49658203125, 1.5941162109375, 1.691650390625, 1.7891845703125, 1.88671875, 1.9842529296875, 2.081787109375, 2.1793212890625, 2.27685546875, 2.3743896484375, 2.471923828125, 2.5694580078125, 2.6669921875, 2.7645263671875, 2.862060546875, 2.9595947265625, 3.05712890625, 3.1546630859375, 3.252197265625, 3.3497314453125, 3.447265625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 4.0, 5.0, 11.0, 11.0, 17.0, 9.0, 20.0, 31.0, 26.0, 41.0, 65.0, 69.0, 114.0, 169.0, 227.0, 341.0, 427.0, 722.0, 1124.0, 1714.0, 2845.0, 5077.0, 9517.0, 19229.0, 44107.0, 116187.0, 373260.0, 1003479.0, 332120.0, 106139.0, 40836.0, 17903.0, 8732.0, 4842.0, 2814.0, 1676.0, 1039.0, 639.0, 466.0, 307.0, 228.0, 152.0, 109.0, 65.0, 61.0, 40.0, 33.0, 23.0, 18.0, 9.0, 11.0, 5.0, 6.0, 7.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.0390625, -8.751708984375, -8.46435546875, -8.177001953125, -7.8896484375, -7.602294921875, -7.31494140625, -7.027587890625, -6.740234375, -6.452880859375, -6.16552734375, -5.878173828125, -5.5908203125, -5.303466796875, -5.01611328125, -4.728759765625, -4.44140625, -4.154052734375, -3.86669921875, -3.579345703125, -3.2919921875, -3.004638671875, -2.71728515625, -2.429931640625, -2.142578125, -1.855224609375, -1.56787109375, -1.280517578125, -0.9931640625, -0.705810546875, -0.41845703125, -0.131103515625, 0.15625, 0.443603515625, 0.73095703125, 1.018310546875, 1.3056640625, 1.593017578125, 1.88037109375, 2.167724609375, 2.455078125, 2.742431640625, 3.02978515625, 3.317138671875, 3.6044921875, 3.891845703125, 4.17919921875, 4.466552734375, 4.75390625, 5.041259765625, 5.32861328125, 5.615966796875, 5.9033203125, 6.190673828125, 6.47802734375, 6.765380859375, 7.052734375, 7.340087890625, 7.62744140625, 7.914794921875, 8.2021484375, 8.489501953125, 8.77685546875, 9.064208984375, 9.3515625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 3.0, 8.0, 11.0, 11.0, 15.0, 20.0, 27.0, 41.0, 49.0, 82.0, 152.0, 149.0, 134.0, 88.0, 48.0, 34.0, 26.0, 23.0, 13.0, 13.0, 8.0, 7.0, 7.0, 6.0, 3.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.26953125, -5.1077880859375, -4.946044921875, -4.7843017578125, -4.62255859375, -4.4608154296875, -4.299072265625, -4.1373291015625, -3.9755859375, -3.8138427734375, -3.652099609375, -3.4903564453125, -3.32861328125, -3.1668701171875, -3.005126953125, -2.8433837890625, -2.681640625, -2.5198974609375, -2.358154296875, -2.1964111328125, -2.03466796875, -1.8729248046875, -1.711181640625, -1.5494384765625, -1.3876953125, -1.2259521484375, -1.064208984375, -0.9024658203125, -0.74072265625, -0.5789794921875, -0.417236328125, -0.2554931640625, -0.09375, 0.0679931640625, 0.229736328125, 0.3914794921875, 0.55322265625, 0.7149658203125, 0.876708984375, 1.0384521484375, 1.2001953125, 1.3619384765625, 1.523681640625, 1.6854248046875, 1.84716796875, 2.0089111328125, 2.170654296875, 2.3323974609375, 2.494140625, 2.6558837890625, 2.817626953125, 2.9793701171875, 3.14111328125, 3.3028564453125, 3.464599609375, 3.6263427734375, 3.7880859375, 3.9498291015625, 4.111572265625, 4.2733154296875, 4.43505859375, 4.5968017578125, 4.758544921875, 4.9202880859375, 5.08203125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 7.0, 12.0, 8.0, 8.0, 14.0, 17.0, 19.0, 22.0, 33.0, 51.0, 111.0, 105.0, 173.0, 425.0, 2823.0, 65681.0, 951986.0, 24667.0, 1521.0, 318.0, 165.0, 102.0, 72.0, 46.0, 43.0, 37.0, 22.0, 18.0, 15.0, 6.0, 5.0, 2.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.625, -60.6904296875, -58.755859375, -56.8212890625, -54.88671875, -52.9521484375, -51.017578125, -49.0830078125, -47.1484375, -45.2138671875, -43.279296875, -41.3447265625, -39.41015625, -37.4755859375, -35.541015625, -33.6064453125, -31.671875, -29.7373046875, -27.802734375, -25.8681640625, -23.93359375, -21.9990234375, -20.064453125, -18.1298828125, -16.1953125, -14.2607421875, -12.326171875, -10.3916015625, -8.45703125, -6.5224609375, -4.587890625, -2.6533203125, -0.71875, 1.2158203125, 3.150390625, 5.0849609375, 7.01953125, 8.9541015625, 10.888671875, 12.8232421875, 14.7578125, 16.6923828125, 18.626953125, 20.5615234375, 22.49609375, 24.4306640625, 26.365234375, 28.2998046875, 30.234375, 32.1689453125, 34.103515625, 36.0380859375, 37.97265625, 39.9072265625, 41.841796875, 43.7763671875, 45.7109375, 47.6455078125, 49.580078125, 51.5146484375, 53.44921875, 55.3837890625, 57.318359375, 59.2529296875, 61.1875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 8.0, 16.0, 74.0, 157.0, 306.0, 254.0, 121.0, 48.0, 18.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.372220993041992, -23.672985076904297, -22.9737491607666, -22.274513244628906, -21.57527732849121, -20.876041412353516, -20.17680549621582, -19.477569580078125, -18.77833366394043, -18.079097747802734, -17.37986183166504, -16.680625915527344, -15.981389999389648, -15.282154083251953, -14.582918167114258, -13.883682250976562, -13.18444538116455, -12.485209465026855, -11.78597354888916, -11.086737632751465, -10.38750171661377, -9.688265800476074, -8.989028930664062, -8.289793014526367, -7.59055757522583, -6.891321659088135, -6.1920857429504395, -5.492849349975586, -4.793613433837891, -4.094377517700195, -3.3951416015625, -2.6959056854248047, -1.9966697692871094, -1.297433853149414, -0.5981978178024292, 0.10103821754455566, 0.800274133682251, 1.4995100498199463, 2.1987462043762207, 2.897982120513916, 3.5972180366516113, 4.296453952789307, 4.995689868927002, 5.6949262619018555, 6.394162178039551, 7.093398094177246, 7.792634010314941, 8.491869926452637, 9.191105842590332, 9.890341758728027, 10.589577674865723, 11.288813591003418, 11.988049507141113, 12.687285423278809, 13.38652229309082, 14.085758209228516, 14.784994125366211, 15.484230041503906, 16.1834659576416, 16.882701873779297, 17.581937789916992, 18.281173706054688, 18.980409622192383, 19.679645538330078, 20.378881454467773]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 11.0, 17.0, 12.0, 18.0, 14.0, 23.0, 30.0, 31.0, 43.0, 30.0, 40.0, 39.0, 47.0, 57.0, 55.0, 44.0, 53.0, 51.0, 59.0, 40.0, 45.0, 46.0, 29.0, 44.0, 25.0, 24.0, 16.0, 20.0, 10.0, 8.0, 8.0, 3.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.664618968963623, -7.39613151550293, -7.1276445388793945, -6.859157085418701, -6.590669631958008, -6.322182655334473, -6.053695201873779, -5.785207748413086, -5.516720771789551, -5.248233318328857, -4.979746341705322, -4.711258888244629, -4.442771911621094, -4.1742844581604, -3.905797004699707, -3.6373097896575928, -3.3688225746154785, -3.1003353595733643, -2.83184814453125, -2.5633606910705566, -2.2948734760284424, -2.026386260986328, -1.7578989267349243, -1.4894115924835205, -1.2209243774414062, -0.9524371027946472, -0.6839498281478882, -0.41546255350112915, -0.14697527885437012, 0.12151193618774414, 0.38999927043914795, 0.6584866046905518, 0.9269742965698242, 1.1954615116119385, 1.4639488458633423, 1.732436180114746, 2.0009233951568604, 2.2694106101989746, 2.537898063659668, 2.8063852787017822, 3.0748724937438965, 3.3433597087860107, 3.611846923828125, 3.8803343772888184, 4.148821830749512, 4.417308807373047, 4.68579626083374, 4.954283714294434, 5.222770690917969, 5.491258144378662, 5.759745121002197, 6.028232574462891, 6.296719551086426, 6.565207004547119, 6.8336944580078125, 7.102181434631348, 7.370668888092041, 7.639156341552734, 7.9076433181762695, 8.176130294799805, 8.444618225097656, 8.713105201721191, 8.981592178344727, 9.250080108642578, 9.518567085266113]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 9.0, 9.0, 7.0, 11.0, 10.0, 13.0, 16.0, 14.0, 28.0, 25.0, 25.0, 33.0, 45.0, 37.0, 45.0, 45.0, 38.0, 44.0, 37.0, 59.0, 45.0, 50.0, 37.0, 45.0, 37.0, 32.0, 33.0, 29.0, 24.0, 22.0, 18.0, 16.0, 11.0, 14.0, 5.0, 5.0, 6.0, 3.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.76953125, -4.6318359375, -4.494140625, -4.3564453125, -4.21875, -4.0810546875, -3.943359375, -3.8056640625, -3.66796875, -3.5302734375, -3.392578125, -3.2548828125, -3.1171875, -2.9794921875, -2.841796875, -2.7041015625, -2.56640625, -2.4287109375, -2.291015625, -2.1533203125, -2.015625, -1.8779296875, -1.740234375, -1.6025390625, -1.46484375, -1.3271484375, -1.189453125, -1.0517578125, -0.9140625, -0.7763671875, -0.638671875, -0.5009765625, -0.36328125, -0.2255859375, -0.087890625, 0.0498046875, 0.1875, 0.3251953125, 0.462890625, 0.6005859375, 0.73828125, 0.8759765625, 1.013671875, 1.1513671875, 1.2890625, 1.4267578125, 1.564453125, 1.7021484375, 1.83984375, 1.9775390625, 2.115234375, 2.2529296875, 2.390625, 2.5283203125, 2.666015625, 2.8037109375, 2.94140625, 3.0791015625, 3.216796875, 3.3544921875, 3.4921875, 3.6298828125, 3.767578125, 3.9052734375, 4.04296875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 1.0, 8.0, 10.0, 17.0, 23.0, 28.0, 48.0, 53.0, 90.0, 117.0, 179.0, 219.0, 325.0, 523.0, 686.0, 1007.0, 1539.0, 2573.0, 4282.0, 8191.0, 17594.0, 46342.0, 147199.0, 401085.0, 276558.0, 83623.0, 29064.0, 11799.0, 5862.0, 3314.0, 2084.0, 1286.0, 834.0, 589.0, 419.0, 275.0, 220.0, 142.0, 87.0, 79.0, 50.0, 36.0, 24.0, 19.0, 20.0, 10.0, 6.0, 4.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.9375, -5.75628662109375, -5.5750732421875, -5.39385986328125, -5.212646484375, -5.03143310546875, -4.8502197265625, -4.66900634765625, -4.48779296875, -4.30657958984375, -4.1253662109375, -3.94415283203125, -3.762939453125, -3.58172607421875, -3.4005126953125, -3.21929931640625, -3.0380859375, -2.85687255859375, -2.6756591796875, -2.49444580078125, -2.313232421875, -2.13201904296875, -1.9508056640625, -1.76959228515625, -1.58837890625, -1.40716552734375, -1.2259521484375, -1.04473876953125, -0.863525390625, -0.68231201171875, -0.5010986328125, -0.31988525390625, -0.138671875, 0.04254150390625, 0.2237548828125, 0.40496826171875, 0.586181640625, 0.76739501953125, 0.9486083984375, 1.12982177734375, 1.31103515625, 1.49224853515625, 1.6734619140625, 1.85467529296875, 2.035888671875, 2.21710205078125, 2.3983154296875, 2.57952880859375, 2.7607421875, 2.94195556640625, 3.1231689453125, 3.30438232421875, 3.485595703125, 3.66680908203125, 3.8480224609375, 4.02923583984375, 4.21044921875, 4.39166259765625, 4.5728759765625, 4.75408935546875, 4.935302734375, 5.11651611328125, 5.2977294921875, 5.47894287109375, 5.66015625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 8.0, 9.0, 6.0, 13.0, 6.0, 10.0, 13.0, 21.0, 20.0, 28.0, 33.0, 48.0, 51.0, 55.0, 71.0, 103.0, 247.0, 1587.0, 232.0, 103.0, 81.0, 61.0, 51.0, 34.0, 34.0, 25.0, 23.0, 22.0, 15.0, 19.0, 12.0, 5.0, 2.0, 5.0, 0.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.625, -19.94873046875, -19.2724609375, -18.59619140625, -17.919921875, -17.24365234375, -16.5673828125, -15.89111328125, -15.21484375, -14.53857421875, -13.8623046875, -13.18603515625, -12.509765625, -11.83349609375, -11.1572265625, -10.48095703125, -9.8046875, -9.12841796875, -8.4521484375, -7.77587890625, -7.099609375, -6.42333984375, -5.7470703125, -5.07080078125, -4.39453125, -3.71826171875, -3.0419921875, -2.36572265625, -1.689453125, -1.01318359375, -0.3369140625, 0.33935546875, 1.015625, 1.69189453125, 2.3681640625, 3.04443359375, 3.720703125, 4.39697265625, 5.0732421875, 5.74951171875, 6.42578125, 7.10205078125, 7.7783203125, 8.45458984375, 9.130859375, 9.80712890625, 10.4833984375, 11.15966796875, 11.8359375, 12.51220703125, 13.1884765625, 13.86474609375, 14.541015625, 15.21728515625, 15.8935546875, 16.56982421875, 17.24609375, 17.92236328125, 18.5986328125, 19.27490234375, 19.951171875, 20.62744140625, 21.3037109375, 21.97998046875, 22.65625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 10.0, 13.0, 13.0, 18.0, 34.0, 42.0, 59.0, 96.0, 190.0, 348.0, 741.0, 1920.0, 5902.0, 29064.0, 633383.0, 2398152.0, 61505.0, 9543.0, 2596.0, 1007.0, 446.0, 235.0, 156.0, 75.0, 59.0, 24.0, 20.0, 9.0, 8.0, 10.0, 7.0, 8.0, 2.0, 7.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.4375, -27.62890625, -26.8203125, -26.01171875, -25.203125, -24.39453125, -23.5859375, -22.77734375, -21.96875, -21.16015625, -20.3515625, -19.54296875, -18.734375, -17.92578125, -17.1171875, -16.30859375, -15.5, -14.69140625, -13.8828125, -13.07421875, -12.265625, -11.45703125, -10.6484375, -9.83984375, -9.03125, -8.22265625, -7.4140625, -6.60546875, -5.796875, -4.98828125, -4.1796875, -3.37109375, -2.5625, -1.75390625, -0.9453125, -0.13671875, 0.671875, 1.48046875, 2.2890625, 3.09765625, 3.90625, 4.71484375, 5.5234375, 6.33203125, 7.140625, 7.94921875, 8.7578125, 9.56640625, 10.375, 11.18359375, 11.9921875, 12.80078125, 13.609375, 14.41796875, 15.2265625, 16.03515625, 16.84375, 17.65234375, 18.4609375, 19.26953125, 20.078125, 20.88671875, 21.6953125, 22.50390625, 23.3125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 177.0, 765.0, 71.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.918807983398438, -13.378769874572754, -3.8387317657470703, 5.701305389404297, 15.241344451904297, 24.781383514404297, 34.32141876220703, 43.86145782470703, 53.40149688720703, 62.94153594970703, 72.48157501220703, 82.0216064453125, 91.5616455078125, 101.1016845703125, 110.6417236328125, 120.1817626953125, 129.7218017578125, 139.2618408203125, 148.8018798828125, 158.3419189453125, 167.8819580078125, 177.4219970703125, 186.9620361328125, 196.5020751953125, 206.0421142578125, 215.5821533203125, 225.1221923828125, 234.6622314453125, 244.2022705078125, 253.7423095703125, 263.2823486328125, 272.8223876953125, 282.3623962402344, 291.9024353027344, 301.4424743652344, 310.9825134277344, 320.5225524902344, 330.0625915527344, 339.6026306152344, 349.1426696777344, 358.6827087402344, 368.2227478027344, 377.7627868652344, 387.3028259277344, 396.8428649902344, 406.3829040527344, 415.9229431152344, 425.4629821777344, 435.00299072265625, 444.54302978515625, 454.08306884765625, 463.62310791015625, 473.16314697265625, 482.70318603515625, 492.24322509765625, 501.78326416015625, 511.32330322265625, 520.8633422851562, 530.4033813476562, 539.9434204101562, 549.4834594726562, 559.0234985351562, 568.5635375976562, 578.1035766601562, 587.6436157226562]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 2.0, 6.0, 8.0, 4.0, 9.0, 5.0, 6.0, 19.0, 12.0, 16.0, 17.0, 18.0, 18.0, 17.0, 17.0, 23.0, 25.0, 29.0, 24.0, 22.0, 27.0, 39.0, 33.0, 37.0, 33.0, 36.0, 34.0, 33.0, 42.0, 32.0, 36.0, 29.0, 27.0, 22.0, 28.0, 21.0, 22.0, 18.0, 19.0, 19.0, 21.0, 14.0, 17.0, 10.0, 20.0, 5.0, 8.0, 2.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-42.67377471923828, -41.35548400878906, -40.03718948364258, -38.71889877319336, -37.400604248046875, -36.082313537597656, -34.76402282714844, -33.44573211669922, -32.127437591552734, -30.809144973754883, -29.49085235595703, -28.172561645507812, -26.85426902770996, -25.53597640991211, -24.21768569946289, -22.89939308166504, -21.581100463867188, -20.262807846069336, -18.944515228271484, -17.626224517822266, -16.307931900024414, -14.989639282226562, -13.671347618103027, -12.353055953979492, -11.03476333618164, -9.716470718383789, -8.398179054260254, -7.0798869132995605, -5.761594772338867, -4.443302631378174, -3.1250104904174805, -1.8067188262939453, -0.48842620849609375, 0.8298659324645996, 2.148158073425293, 3.4664502143859863, 4.78474235534668, 6.103034496307373, 7.421326637268066, 8.739618301391602, 10.057910919189453, 11.376203536987305, 12.69449520111084, 14.012786865234375, 15.331079483032227, 16.649372100830078, 17.967662811279297, 19.28595542907715, 20.604248046875, 21.92254066467285, 23.240833282470703, 24.559123992919922, 25.877416610717773, 27.195709228515625, 28.513999938964844, 29.832292556762695, 31.150585174560547, 32.468875885009766, 33.78717041015625, 35.10546112060547, 36.42375183105469, 37.74204635620117, 39.06033706665039, 40.378631591796875, 41.696922302246094]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 14.0, 8.0, 6.0, 14.0, 14.0, 20.0, 13.0, 22.0, 16.0, 31.0, 25.0, 30.0, 34.0, 32.0, 30.0, 42.0, 35.0, 41.0, 44.0, 49.0, 53.0, 56.0, 38.0, 36.0, 40.0, 44.0, 31.0, 26.0, 24.0, 22.0, 18.0, 18.0, 16.0, 13.0, 10.0, 11.0, 5.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-5.03125, -4.891632080078125, -4.75201416015625, -4.612396240234375, -4.4727783203125, -4.333160400390625, -4.19354248046875, -4.053924560546875, -3.914306640625, -3.774688720703125, -3.63507080078125, -3.495452880859375, -3.3558349609375, -3.216217041015625, -3.07659912109375, -2.936981201171875, -2.79736328125, -2.657745361328125, -2.51812744140625, -2.378509521484375, -2.2388916015625, -2.099273681640625, -1.95965576171875, -1.820037841796875, -1.680419921875, -1.540802001953125, -1.40118408203125, -1.261566162109375, -1.1219482421875, -0.982330322265625, -0.84271240234375, -0.703094482421875, -0.5634765625, -0.423858642578125, -0.28424072265625, -0.144622802734375, -0.0050048828125, 0.134613037109375, 0.27423095703125, 0.413848876953125, 0.553466796875, 0.693084716796875, 0.83270263671875, 0.972320556640625, 1.1119384765625, 1.251556396484375, 1.39117431640625, 1.530792236328125, 1.67041015625, 1.810028076171875, 1.94964599609375, 2.089263916015625, 2.2288818359375, 2.368499755859375, 2.50811767578125, 2.647735595703125, 2.787353515625, 2.926971435546875, 3.06658935546875, 3.206207275390625, 3.3458251953125, 3.485443115234375, 3.62506103515625, 3.764678955078125, 3.904296875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 5.0, 7.0, 5.0, 7.0, 9.0, 17.0, 25.0, 40.0, 43.0, 59.0, 79.0, 107.0, 192.0, 266.0, 390.0, 612.0, 1056.0, 1836.0, 3142.0, 6391.0, 14750.0, 45660.0, 246710.0, 2516002.0, 1188056.0, 119240.0, 28407.0, 10577.0, 4624.0, 2504.0, 1366.0, 770.0, 428.0, 296.0, 195.0, 117.0, 77.0, 57.0, 49.0, 36.0, 15.0, 13.0, 10.0, 14.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.203125, -12.7880859375, -12.373046875, -11.9580078125, -11.54296875, -11.1279296875, -10.712890625, -10.2978515625, -9.8828125, -9.4677734375, -9.052734375, -8.6376953125, -8.22265625, -7.8076171875, -7.392578125, -6.9775390625, -6.5625, -6.1474609375, -5.732421875, -5.3173828125, -4.90234375, -4.4873046875, -4.072265625, -3.6572265625, -3.2421875, -2.8271484375, -2.412109375, -1.9970703125, -1.58203125, -1.1669921875, -0.751953125, -0.3369140625, 0.078125, 0.4931640625, 0.908203125, 1.3232421875, 1.73828125, 2.1533203125, 2.568359375, 2.9833984375, 3.3984375, 3.8134765625, 4.228515625, 4.6435546875, 5.05859375, 5.4736328125, 5.888671875, 6.3037109375, 6.71875, 7.1337890625, 7.548828125, 7.9638671875, 8.37890625, 8.7939453125, 9.208984375, 9.6240234375, 10.0390625, 10.4541015625, 10.869140625, 11.2841796875, 11.69921875, 12.1142578125, 12.529296875, 12.9443359375, 13.359375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 7.0, 10.0, 7.0, 12.0, 17.0, 20.0, 27.0, 30.0, 52.0, 58.0, 117.0, 152.0, 228.0, 297.0, 500.0, 599.0, 544.0, 397.0, 303.0, 211.0, 154.0, 97.0, 57.0, 43.0, 34.0, 26.0, 20.0, 18.0, 6.0, 7.0, 3.0, 4.0, 7.0, 9.0, 5.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1640625, -10.7899169921875, -10.415771484375, -10.0416259765625, -9.66748046875, -9.2933349609375, -8.919189453125, -8.5450439453125, -8.1708984375, -7.7967529296875, -7.422607421875, -7.0484619140625, -6.67431640625, -6.3001708984375, -5.926025390625, -5.5518798828125, -5.177734375, -4.8035888671875, -4.429443359375, -4.0552978515625, -3.68115234375, -3.3070068359375, -2.932861328125, -2.5587158203125, -2.1845703125, -1.8104248046875, -1.436279296875, -1.0621337890625, -0.68798828125, -0.3138427734375, 0.060302734375, 0.4344482421875, 0.80859375, 1.1827392578125, 1.556884765625, 1.9310302734375, 2.30517578125, 2.6793212890625, 3.053466796875, 3.4276123046875, 3.8017578125, 4.1759033203125, 4.550048828125, 4.9241943359375, 5.29833984375, 5.6724853515625, 6.046630859375, 6.4207763671875, 6.794921875, 7.1690673828125, 7.543212890625, 7.9173583984375, 8.29150390625, 8.6656494140625, 9.039794921875, 9.4139404296875, 9.7880859375, 10.1622314453125, 10.536376953125, 10.9105224609375, 11.28466796875, 11.6588134765625, 12.032958984375, 12.4071044921875, 12.78125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 7.0, 9.0, 9.0, 18.0, 23.0, 41.0, 72.0, 111.0, 199.0, 283.0, 448.0, 660.0, 1059.0, 1664.0, 2616.0, 4577.0, 8269.0, 16095.0, 37207.0, 106662.0, 423510.0, 2013054.0, 1211131.0, 241859.0, 69479.0, 26588.0, 12262.0, 6412.0, 3739.0, 2237.0, 1419.0, 851.0, 563.0, 373.0, 240.0, 178.0, 100.0, 81.0, 56.0, 29.0, 34.0, 20.0, 13.0, 8.0, 4.0, 11.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-13.3046875, -12.8583984375, -12.412109375, -11.9658203125, -11.51953125, -11.0732421875, -10.626953125, -10.1806640625, -9.734375, -9.2880859375, -8.841796875, -8.3955078125, -7.94921875, -7.5029296875, -7.056640625, -6.6103515625, -6.1640625, -5.7177734375, -5.271484375, -4.8251953125, -4.37890625, -3.9326171875, -3.486328125, -3.0400390625, -2.59375, -2.1474609375, -1.701171875, -1.2548828125, -0.80859375, -0.3623046875, 0.083984375, 0.5302734375, 0.9765625, 1.4228515625, 1.869140625, 2.3154296875, 2.76171875, 3.2080078125, 3.654296875, 4.1005859375, 4.546875, 4.9931640625, 5.439453125, 5.8857421875, 6.33203125, 6.7783203125, 7.224609375, 7.6708984375, 8.1171875, 8.5634765625, 9.009765625, 9.4560546875, 9.90234375, 10.3486328125, 10.794921875, 11.2412109375, 11.6875, 12.1337890625, 12.580078125, 13.0263671875, 13.47265625, 13.9189453125, 14.365234375, 14.8115234375, 15.2578125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 11.0, 13.0, 15.0, 17.0, 19.0, 27.0, 41.0, 51.0, 66.0, 71.0, 77.0, 92.0, 97.0, 78.0, 56.0, 63.0, 54.0, 47.0, 24.0, 22.0, 14.0, 7.0, 6.0, 5.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.53321075439453, -56.934349060058594, -55.335487365722656, -53.73662567138672, -52.137760162353516, -50.53889846801758, -48.94003677368164, -47.3411750793457, -45.7423095703125, -44.14344787597656, -42.544586181640625, -40.94572448730469, -39.346858978271484, -37.74799728393555, -36.14913558959961, -34.55027389526367, -32.951412200927734, -31.352550506591797, -29.753686904907227, -28.15482521057129, -26.55596160888672, -24.95709991455078, -23.358238220214844, -21.759376525878906, -20.160512924194336, -18.5616512298584, -16.962787628173828, -15.36392593383789, -13.765063285827637, -12.166200637817383, -10.567338943481445, -8.968476295471191, -7.369609832763672, -5.770747184753418, -4.171885013580322, -2.5730228424072266, -0.9741601943969727, 0.6247024536132812, 2.2235641479492188, 3.8224267959594727, 5.421289443969727, 7.0201520919799805, 8.619014739990234, 10.217876434326172, 11.816739082336426, 13.41560173034668, 15.014463424682617, 16.613327026367188, 18.212188720703125, 19.811050415039062, 21.409914016723633, 23.00877571105957, 24.60763931274414, 26.206501007080078, 27.805362701416016, 29.404224395751953, 31.003087997436523, 32.601951599121094, 34.20081329345703, 35.79967498779297, 37.398536682128906, 38.997398376464844, 40.59626007080078, 42.195125579833984, 43.79398727416992]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 6.0, 6.0, 15.0, 16.0, 13.0, 26.0, 20.0, 24.0, 33.0, 38.0, 34.0, 41.0, 43.0, 60.0, 42.0, 36.0, 50.0, 47.0, 45.0, 39.0, 40.0, 37.0, 46.0, 28.0, 35.0, 29.0, 23.0, 26.0, 21.0, 13.0, 19.0, 10.0, 5.0, 10.0, 6.0, 2.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.39248275756836, -33.15092086791992, -31.90936279296875, -30.667800903320312, -29.426240921020508, -28.184680938720703, -26.9431209564209, -25.701560974121094, -24.459999084472656, -23.21843910217285, -21.976879119873047, -20.73531723022461, -19.493757247924805, -18.252197265625, -17.010637283325195, -15.769076347351074, -14.527517318725586, -13.285957336425781, -12.04439640045166, -10.802836418151855, -9.561275482177734, -8.31971549987793, -7.078155517578125, -5.836594581604004, -4.595034599304199, -3.3534741401672363, -2.1119139194488525, -0.8703536987304688, 0.37120676040649414, 1.612767219543457, 2.8543272018432617, 4.095888137817383, 5.3374481201171875, 6.57900857925415, 7.820569038391113, 9.062129020690918, 10.303689956665039, 11.545249938964844, 12.786809921264648, 14.02837085723877, 15.269930839538574, 16.511491775512695, 17.7530517578125, 18.994611740112305, 20.23617172241211, 21.477733612060547, 22.71929168701172, 23.960853576660156, 25.20241355895996, 26.443973541259766, 27.68553352355957, 28.927093505859375, 30.168655395507812, 31.410215377807617, 32.65177536010742, 33.89333724975586, 35.13489532470703, 36.37645721435547, 37.61801528930664, 38.85957717895508, 40.10113525390625, 41.34269714355469, 42.584259033203125, 43.8258171081543, 45.067378997802734]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 1.0, 4.0, 4.0, 4.0, 6.0, 10.0, 12.0, 17.0, 10.0, 14.0, 18.0, 22.0, 24.0, 27.0, 28.0, 38.0, 31.0, 35.0, 36.0, 45.0, 36.0, 38.0, 57.0, 42.0, 41.0, 58.0, 45.0, 37.0, 41.0, 32.0, 29.0, 28.0, 16.0, 17.0, 21.0, 13.0, 12.0, 11.0, 10.0, 7.0, 9.0, 4.0, 3.0, 7.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.59765625, -4.45953369140625, -4.3214111328125, -4.18328857421875, -4.045166015625, -3.90704345703125, -3.7689208984375, -3.63079833984375, -3.49267578125, -3.35455322265625, -3.2164306640625, -3.07830810546875, -2.940185546875, -2.80206298828125, -2.6639404296875, -2.52581787109375, -2.3876953125, -2.24957275390625, -2.1114501953125, -1.97332763671875, -1.835205078125, -1.69708251953125, -1.5589599609375, -1.42083740234375, -1.28271484375, -1.14459228515625, -1.0064697265625, -0.86834716796875, -0.730224609375, -0.59210205078125, -0.4539794921875, -0.31585693359375, -0.177734375, -0.03961181640625, 0.0985107421875, 0.23663330078125, 0.374755859375, 0.51287841796875, 0.6510009765625, 0.78912353515625, 0.92724609375, 1.06536865234375, 1.2034912109375, 1.34161376953125, 1.479736328125, 1.61785888671875, 1.7559814453125, 1.89410400390625, 2.0322265625, 2.17034912109375, 2.3084716796875, 2.44659423828125, 2.584716796875, 2.72283935546875, 2.8609619140625, 2.99908447265625, 3.13720703125, 3.27532958984375, 3.4134521484375, 3.55157470703125, 3.689697265625, 3.82781982421875, 3.9659423828125, 4.10406494140625, 4.2421875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 4.0, 5.0, 10.0, 12.0, 36.0, 49.0, 54.0, 99.0, 141.0, 208.0, 364.0, 589.0, 953.0, 1437.0, 2194.0, 3392.0, 5272.0, 8293.0, 12816.0, 19503.0, 30102.0, 46411.0, 70798.0, 111121.0, 172282.0, 192908.0, 131558.0, 83349.0, 53894.0, 35535.0, 22967.0, 14803.0, 9583.0, 6229.0, 4152.0, 2653.0, 1761.0, 1103.0, 723.0, 411.0, 313.0, 188.0, 107.0, 67.0, 49.0, 24.0, 8.0, 12.0, 12.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.849853515625, -7.59814453125, -7.346435546875, -7.0947265625, -6.843017578125, -6.59130859375, -6.339599609375, -6.087890625, -5.836181640625, -5.58447265625, -5.332763671875, -5.0810546875, -4.829345703125, -4.57763671875, -4.325927734375, -4.07421875, -3.822509765625, -3.57080078125, -3.319091796875, -3.0673828125, -2.815673828125, -2.56396484375, -2.312255859375, -2.060546875, -1.808837890625, -1.55712890625, -1.305419921875, -1.0537109375, -0.802001953125, -0.55029296875, -0.298583984375, -0.046875, 0.204833984375, 0.45654296875, 0.708251953125, 0.9599609375, 1.211669921875, 1.46337890625, 1.715087890625, 1.966796875, 2.218505859375, 2.47021484375, 2.721923828125, 2.9736328125, 3.225341796875, 3.47705078125, 3.728759765625, 3.98046875, 4.232177734375, 4.48388671875, 4.735595703125, 4.9873046875, 5.239013671875, 5.49072265625, 5.742431640625, 5.994140625, 6.245849609375, 6.49755859375, 6.749267578125, 7.0009765625, 7.252685546875, 7.50439453125, 7.756103515625, 8.0078125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 6.0, 5.0, 5.0, 10.0, 10.0, 16.0, 16.0, 16.0, 19.0, 20.0, 20.0, 33.0, 29.0, 30.0, 24.0, 45.0, 49.0, 31.0, 52.0, 48.0, 1059.0, 33.0, 39.0, 32.0, 50.0, 41.0, 29.0, 30.0, 28.0, 35.0, 25.0, 34.0, 16.0, 13.0, 9.0, 15.0, 8.0, 8.0, 10.0, 3.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.623046875, -3.5184326171875, -3.413818359375, -3.3092041015625, -3.20458984375, -3.0999755859375, -2.995361328125, -2.8907470703125, -2.7861328125, -2.6815185546875, -2.576904296875, -2.4722900390625, -2.36767578125, -2.2630615234375, -2.158447265625, -2.0538330078125, -1.94921875, -1.8446044921875, -1.739990234375, -1.6353759765625, -1.53076171875, -1.4261474609375, -1.321533203125, -1.2169189453125, -1.1123046875, -1.0076904296875, -0.903076171875, -0.7984619140625, -0.69384765625, -0.5892333984375, -0.484619140625, -0.3800048828125, -0.275390625, -0.1707763671875, -0.066162109375, 0.0384521484375, 0.14306640625, 0.2476806640625, 0.352294921875, 0.4569091796875, 0.5615234375, 0.6661376953125, 0.770751953125, 0.8753662109375, 0.97998046875, 1.0845947265625, 1.189208984375, 1.2938232421875, 1.3984375, 1.5030517578125, 1.607666015625, 1.7122802734375, 1.81689453125, 1.9215087890625, 2.026123046875, 2.1307373046875, 2.2353515625, 2.3399658203125, 2.444580078125, 2.5491943359375, 2.65380859375, 2.7584228515625, 2.863037109375, 2.9676513671875, 3.072265625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 7.0, 8.0, 11.0, 16.0, 24.0, 31.0, 39.0, 61.0, 67.0, 91.0, 115.0, 124.0, 190.0, 265.0, 336.0, 430.0, 664.0, 942.0, 1429.0, 2237.0, 4058.0, 9003.0, 26257.0, 134860.0, 1414346.0, 420048.0, 52774.0, 14031.0, 5838.0, 2976.0, 1787.0, 1154.0, 795.0, 564.0, 405.0, 269.0, 206.0, 162.0, 127.0, 85.0, 66.0, 45.0, 43.0, 44.0, 20.0, 23.0, 15.0, 13.0, 10.0, 10.0, 6.0, 4.0, 0.0, 3.0, 1.0, 3.0], "bins": [-23.46875, -22.751953125, -22.03515625, -21.318359375, -20.6015625, -19.884765625, -19.16796875, -18.451171875, -17.734375, -17.017578125, -16.30078125, -15.583984375, -14.8671875, -14.150390625, -13.43359375, -12.716796875, -12.0, -11.283203125, -10.56640625, -9.849609375, -9.1328125, -8.416015625, -7.69921875, -6.982421875, -6.265625, -5.548828125, -4.83203125, -4.115234375, -3.3984375, -2.681640625, -1.96484375, -1.248046875, -0.53125, 0.185546875, 0.90234375, 1.619140625, 2.3359375, 3.052734375, 3.76953125, 4.486328125, 5.203125, 5.919921875, 6.63671875, 7.353515625, 8.0703125, 8.787109375, 9.50390625, 10.220703125, 10.9375, 11.654296875, 12.37109375, 13.087890625, 13.8046875, 14.521484375, 15.23828125, 15.955078125, 16.671875, 17.388671875, 18.10546875, 18.822265625, 19.5390625, 20.255859375, 20.97265625, 21.689453125, 22.40625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 6.0, 3.0, 6.0, 9.0, 14.0, 10.0, 15.0, 18.0, 22.0, 34.0, 40.0, 59.0, 65.0, 92.0, 134.0, 105.0, 101.0, 72.0, 43.0, 31.0, 18.0, 22.0, 15.0, 9.0, 9.0, 6.0, 8.0, 4.0, 7.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0], "bins": [-7.4140625, -7.21783447265625, -7.0216064453125, -6.82537841796875, -6.629150390625, -6.43292236328125, -6.2366943359375, -6.04046630859375, -5.84423828125, -5.64801025390625, -5.4517822265625, -5.25555419921875, -5.059326171875, -4.86309814453125, -4.6668701171875, -4.47064208984375, -4.2744140625, -4.07818603515625, -3.8819580078125, -3.68572998046875, -3.489501953125, -3.29327392578125, -3.0970458984375, -2.90081787109375, -2.70458984375, -2.50836181640625, -2.3121337890625, -2.11590576171875, -1.919677734375, -1.72344970703125, -1.5272216796875, -1.33099365234375, -1.134765625, -0.93853759765625, -0.7423095703125, -0.54608154296875, -0.349853515625, -0.15362548828125, 0.0426025390625, 0.23883056640625, 0.43505859375, 0.63128662109375, 0.8275146484375, 1.02374267578125, 1.219970703125, 1.41619873046875, 1.6124267578125, 1.80865478515625, 2.0048828125, 2.20111083984375, 2.3973388671875, 2.59356689453125, 2.789794921875, 2.98602294921875, 3.1822509765625, 3.37847900390625, 3.57470703125, 3.77093505859375, 3.9671630859375, 4.16339111328125, 4.359619140625, 4.55584716796875, 4.7520751953125, 4.94830322265625, 5.14453125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 5.0, 3.0, 3.0, 7.0, 6.0, 13.0, 20.0, 22.0, 30.0, 48.0, 61.0, 65.0, 152.0, 393.0, 1671.0, 12813.0, 837792.0, 186448.0, 7267.0, 1102.0, 252.0, 115.0, 65.0, 56.0, 43.0, 23.0, 22.0, 19.0, 10.0, 8.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.3125, -87.072265625, -83.83203125, -80.591796875, -77.3515625, -74.111328125, -70.87109375, -67.630859375, -64.390625, -61.150390625, -57.91015625, -54.669921875, -51.4296875, -48.189453125, -44.94921875, -41.708984375, -38.46875, -35.228515625, -31.98828125, -28.748046875, -25.5078125, -22.267578125, -19.02734375, -15.787109375, -12.546875, -9.306640625, -6.06640625, -2.826171875, 0.4140625, 3.654296875, 6.89453125, 10.134765625, 13.375, 16.615234375, 19.85546875, 23.095703125, 26.3359375, 29.576171875, 32.81640625, 36.056640625, 39.296875, 42.537109375, 45.77734375, 49.017578125, 52.2578125, 55.498046875, 58.73828125, 61.978515625, 65.21875, 68.458984375, 71.69921875, 74.939453125, 78.1796875, 81.419921875, 84.66015625, 87.900390625, 91.140625, 94.380859375, 97.62109375, 100.861328125, 104.1015625, 107.341796875, 110.58203125, 113.822265625, 117.0625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 5.0, 15.0, 17.0, 20.0, 42.0, 54.0, 91.0, 125.0, 164.0, 145.0, 114.0, 73.0, 40.0, 23.0, 22.0, 12.0, 10.0, 13.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.96257781982422, -22.426504135131836, -21.890432357788086, -21.354358673095703, -20.818286895751953, -20.28221321105957, -19.74614143371582, -19.210067749023438, -18.673995971679688, -18.137922286987305, -17.601850509643555, -17.065776824951172, -16.529705047607422, -15.993631362915039, -15.457558631896973, -14.921485900878906, -14.385412216186523, -13.849339485168457, -13.31326675415039, -12.777194023132324, -12.241121292114258, -11.705047607421875, -11.168974876403809, -10.632902145385742, -10.096829414367676, -9.56075668334961, -9.024683952331543, -8.488611221313477, -7.952538013458252, -7.4164652824401855, -6.880392074584961, -6.3443193435668945, -5.808245658874512, -5.272172927856445, -4.736100196838379, -4.200026988983154, -3.663954257965088, -3.1278815269470215, -2.591808557510376, -2.0557355880737305, -1.519662857055664, -0.9835900068283081, -0.44751715660095215, 0.08855569362640381, 0.6246285438537598, 1.1607012748718262, 1.6967742443084717, 2.232847213745117, 2.7689199447631836, 3.30499267578125, 3.8410656452178955, 4.377138614654541, 4.913211345672607, 5.449284076690674, 5.985357284545898, 6.521430015563965, 7.057502746582031, 7.593575477600098, 8.129648208618164, 8.66572093963623, 9.201793670654297, 9.73786735534668, 10.273940086364746, 10.810012817382812, 11.346085548400879]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 0.0, 7.0, 2.0, 6.0, 8.0, 16.0, 14.0, 13.0, 11.0, 17.0, 21.0, 26.0, 37.0, 48.0, 39.0, 45.0, 35.0, 32.0, 45.0, 42.0, 45.0, 36.0, 34.0, 43.0, 54.0, 50.0, 33.0, 29.0, 30.0, 45.0, 22.0, 15.0, 19.0, 14.0, 11.0, 12.0, 22.0, 3.0, 7.0, 2.0, 4.0, 4.0, 7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.96848201751709, -6.724130153656006, -6.479778289794922, -6.23542594909668, -5.991074085235596, -5.746722221374512, -5.502370357513428, -5.258018493652344, -5.01366662979126, -4.769314765930176, -4.524962902069092, -4.280611038208008, -4.036258697509766, -3.7919068336486816, -3.5475549697875977, -3.3032031059265137, -3.0588510036468506, -2.8144991397857666, -2.5701470375061035, -2.3257951736450195, -2.0814433097839355, -1.837091326713562, -1.5927393436431885, -1.3483874797821045, -1.104035496711731, -0.8596835732460022, -0.6153316497802734, -0.3709796667098999, -0.12662774324417114, 0.11772418022155762, 0.36207616329193115, 0.6064280271530151, 0.8507800102233887, 1.0951319932937622, 1.3394838571548462, 1.5838358402252197, 1.8281877040863037, 2.072539806365967, 2.316891670227051, 2.5612435340881348, 2.8055953979492188, 3.0499472618103027, 3.294299364089966, 3.53865122795105, 3.783003091812134, 4.027355194091797, 4.271707057952881, 4.516058921813965, 4.760411262512207, 5.004763126373291, 5.249114990234375, 5.493467330932617, 5.737819194793701, 5.982171058654785, 6.226522922515869, 6.470874786376953, 6.715226650238037, 6.959578514099121, 7.203930377960205, 7.448282241821289, 7.692634582519531, 7.936986446380615, 8.1813383102417, 8.425689697265625, 8.670042037963867]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 7.0, 6.0, 3.0, 5.0, 12.0, 10.0, 16.0, 12.0, 23.0, 27.0, 25.0, 26.0, 23.0, 38.0, 35.0, 39.0, 39.0, 48.0, 47.0, 44.0, 42.0, 39.0, 38.0, 28.0, 37.0, 55.0, 33.0, 30.0, 23.0, 28.0, 27.0, 26.0, 16.0, 16.0, 13.0, 14.0, 6.0, 8.0, 10.0, 2.0, 7.0, 5.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.515625, -4.3792724609375, -4.242919921875, -4.1065673828125, -3.97021484375, -3.8338623046875, -3.697509765625, -3.5611572265625, -3.4248046875, -3.2884521484375, -3.152099609375, -3.0157470703125, -2.87939453125, -2.7430419921875, -2.606689453125, -2.4703369140625, -2.333984375, -2.1976318359375, -2.061279296875, -1.9249267578125, -1.78857421875, -1.6522216796875, -1.515869140625, -1.3795166015625, -1.2431640625, -1.1068115234375, -0.970458984375, -0.8341064453125, -0.69775390625, -0.5614013671875, -0.425048828125, -0.2886962890625, -0.15234375, -0.0159912109375, 0.120361328125, 0.2567138671875, 0.39306640625, 0.5294189453125, 0.665771484375, 0.8021240234375, 0.9384765625, 1.0748291015625, 1.211181640625, 1.3475341796875, 1.48388671875, 1.6202392578125, 1.756591796875, 1.8929443359375, 2.029296875, 2.1656494140625, 2.302001953125, 2.4383544921875, 2.57470703125, 2.7110595703125, 2.847412109375, 2.9837646484375, 3.1201171875, 3.2564697265625, 3.392822265625, 3.5291748046875, 3.66552734375, 3.8018798828125, 3.938232421875, 4.0745849609375, 4.2109375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 0.0, 3.0, 5.0, 4.0, 11.0, 9.0, 13.0, 22.0, 22.0, 20.0, 38.0, 50.0, 88.0, 84.0, 144.0, 169.0, 273.0, 316.0, 461.0, 657.0, 918.0, 1318.0, 1945.0, 2837.0, 4252.0, 6824.0, 13093.0, 29300.0, 83678.0, 282411.0, 410463.0, 126522.0, 41909.0, 16606.0, 8563.0, 4890.0, 3190.0, 2285.0, 1482.0, 1054.0, 716.0, 524.0, 393.0, 272.0, 198.0, 114.0, 107.0, 81.0, 53.0, 45.0, 35.0, 28.0, 13.0, 11.0, 13.0, 10.0, 12.0, 3.0, 4.0, 3.0, 5.0], "bins": [-9.1484375, -8.8726806640625, -8.596923828125, -8.3211669921875, -8.04541015625, -7.7696533203125, -7.493896484375, -7.2181396484375, -6.9423828125, -6.6666259765625, -6.390869140625, -6.1151123046875, -5.83935546875, -5.5635986328125, -5.287841796875, -5.0120849609375, -4.736328125, -4.4605712890625, -4.184814453125, -3.9090576171875, -3.63330078125, -3.3575439453125, -3.081787109375, -2.8060302734375, -2.5302734375, -2.2545166015625, -1.978759765625, -1.7030029296875, -1.42724609375, -1.1514892578125, -0.875732421875, -0.5999755859375, -0.32421875, -0.0484619140625, 0.227294921875, 0.5030517578125, 0.77880859375, 1.0545654296875, 1.330322265625, 1.6060791015625, 1.8818359375, 2.1575927734375, 2.433349609375, 2.7091064453125, 2.98486328125, 3.2606201171875, 3.536376953125, 3.8121337890625, 4.087890625, 4.3636474609375, 4.639404296875, 4.9151611328125, 5.19091796875, 5.4666748046875, 5.742431640625, 6.0181884765625, 6.2939453125, 6.5697021484375, 6.845458984375, 7.1212158203125, 7.39697265625, 7.6727294921875, 7.948486328125, 8.2242431640625, 8.5]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 9.0, 5.0, 5.0, 5.0, 6.0, 8.0, 14.0, 25.0, 29.0, 26.0, 37.0, 50.0, 47.0, 46.0, 80.0, 104.0, 147.0, 367.0, 1398.0, 166.0, 118.0, 61.0, 55.0, 43.0, 46.0, 33.0, 24.0, 31.0, 16.0, 14.0, 16.0, 5.0, 3.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.15625, -22.51318359375, -21.8701171875, -21.22705078125, -20.583984375, -19.94091796875, -19.2978515625, -18.65478515625, -18.01171875, -17.36865234375, -16.7255859375, -16.08251953125, -15.439453125, -14.79638671875, -14.1533203125, -13.51025390625, -12.8671875, -12.22412109375, -11.5810546875, -10.93798828125, -10.294921875, -9.65185546875, -9.0087890625, -8.36572265625, -7.72265625, -7.07958984375, -6.4365234375, -5.79345703125, -5.150390625, -4.50732421875, -3.8642578125, -3.22119140625, -2.578125, -1.93505859375, -1.2919921875, -0.64892578125, -0.005859375, 0.63720703125, 1.2802734375, 1.92333984375, 2.56640625, 3.20947265625, 3.8525390625, 4.49560546875, 5.138671875, 5.78173828125, 6.4248046875, 7.06787109375, 7.7109375, 8.35400390625, 8.9970703125, 9.64013671875, 10.283203125, 10.92626953125, 11.5693359375, 12.21240234375, 12.85546875, 13.49853515625, 14.1416015625, 14.78466796875, 15.427734375, 16.07080078125, 16.7138671875, 17.35693359375, 18.0]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 5.0, 3.0, 19.0, 21.0, 28.0, 71.0, 142.0, 317.0, 1013.0, 6940.0, 117627.0, 2960242.0, 53652.0, 4390.0, 736.0, 245.0, 113.0, 62.0, 38.0, 19.0, 9.0, 12.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.0625, -48.29931640625, -46.5361328125, -44.77294921875, -43.009765625, -41.24658203125, -39.4833984375, -37.72021484375, -35.95703125, -34.19384765625, -32.4306640625, -30.66748046875, -28.904296875, -27.14111328125, -25.3779296875, -23.61474609375, -21.8515625, -20.08837890625, -18.3251953125, -16.56201171875, -14.798828125, -13.03564453125, -11.2724609375, -9.50927734375, -7.74609375, -5.98291015625, -4.2197265625, -2.45654296875, -0.693359375, 1.06982421875, 2.8330078125, 4.59619140625, 6.359375, 8.12255859375, 9.8857421875, 11.64892578125, 13.412109375, 15.17529296875, 16.9384765625, 18.70166015625, 20.46484375, 22.22802734375, 23.9912109375, 25.75439453125, 27.517578125, 29.28076171875, 31.0439453125, 32.80712890625, 34.5703125, 36.33349609375, 38.0966796875, 39.85986328125, 41.623046875, 43.38623046875, 45.1494140625, 46.91259765625, 48.67578125, 50.43896484375, 52.2021484375, 53.96533203125, 55.728515625, 57.49169921875, 59.2548828125, 61.01806640625, 62.78125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [11.0, 121.0, 554.0, 305.0, 27.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.742321014404297, -16.29425811767578, -6.846195220947266, 2.60186767578125, 12.049930572509766, 21.49799346923828, 30.946056365966797, 40.39412307739258, 49.84218215942383, 59.290245056152344, 68.73831176757812, 78.18637084960938, 87.63442993164062, 97.0824966430664, 106.53056335449219, 115.97862243652344, 125.42668151855469, 134.87474060058594, 144.32281494140625, 153.7708740234375, 163.21893310546875, 172.6669921875, 182.11505126953125, 191.56312561035156, 201.0111846923828, 210.45924377441406, 219.90731811523438, 229.35537719726562, 238.80343627929688, 248.25149536132812, 257.6995544433594, 267.14764404296875, 276.595703125, 286.04376220703125, 295.4918212890625, 304.93988037109375, 314.387939453125, 323.8360290527344, 333.2840881347656, 342.7321472167969, 352.1802062988281, 361.6282653808594, 371.0763244628906, 380.5243835449219, 389.97247314453125, 399.4205322265625, 408.86859130859375, 418.316650390625, 427.76470947265625, 437.2127685546875, 446.66082763671875, 456.10888671875, 465.55694580078125, 475.0050354003906, 484.4530944824219, 493.9011535644531, 503.3492126464844, 512.7973022460938, 522.245361328125, 531.6934204101562, 541.1414794921875, 550.5895385742188, 560.03759765625, 569.4856567382812, 578.9337158203125]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 4.0, 6.0, 6.0, 7.0, 6.0, 14.0, 12.0, 20.0, 11.0, 23.0, 27.0, 31.0, 23.0, 29.0, 26.0, 35.0, 36.0, 40.0, 35.0, 34.0, 48.0, 37.0, 40.0, 51.0, 31.0, 35.0, 29.0, 39.0, 33.0, 33.0, 25.0, 29.0, 20.0, 18.0, 17.0, 21.0, 11.0, 7.0, 11.0, 12.0, 6.0, 8.0, 8.0, 5.0, 5.0, 0.0, 3.0, 2.0, 3.0], "bins": [-53.79496765136719, -52.34046936035156, -50.8859748840332, -49.43147659301758, -47.97697830200195, -46.522483825683594, -45.06798553466797, -43.613487243652344, -42.15898895263672, -40.704490661621094, -39.249996185302734, -37.79549789428711, -36.340999603271484, -34.886505126953125, -33.4320068359375, -31.977508544921875, -30.523014068603516, -29.068517684936523, -27.6140193939209, -26.159523010253906, -24.70502471923828, -23.25052833557129, -21.796031951904297, -20.341533660888672, -18.88703727722168, -17.432540893554688, -15.978042602539062, -14.52354621887207, -13.069048881530762, -11.614551544189453, -10.160055160522461, -8.705557823181152, -7.251064300537109, -5.796566963195801, -4.34207010269165, -2.8875732421875, -1.4330759048461914, 0.021421432495117188, 1.4759178161621094, 2.930415153503418, 4.384912490844727, 5.839409828186035, 7.2939066886901855, 8.748403549194336, 10.202900886535645, 11.657398223876953, 13.111894607543945, 14.566391944885254, 16.020889282226562, 17.475385665893555, 18.92988395690918, 20.384380340576172, 21.838878631591797, 23.29337501525879, 24.74787139892578, 26.202369689941406, 27.6568660736084, 29.11136245727539, 30.565860748291016, 32.020355224609375, 33.474853515625, 34.929351806640625, 36.38385009765625, 37.83834457397461, 39.292842864990234]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 5.0, 3.0, 12.0, 14.0, 10.0, 12.0, 21.0, 13.0, 26.0, 23.0, 28.0, 34.0, 38.0, 34.0, 46.0, 37.0, 39.0, 37.0, 46.0, 43.0, 44.0, 43.0, 45.0, 34.0, 40.0, 33.0, 30.0, 29.0, 27.0, 30.0, 20.0, 18.0, 15.0, 18.0, 10.0, 11.0, 7.0, 6.0, 2.0, 5.0, 2.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.06781005859375, -3.9246826171875, -3.78155517578125, -3.638427734375, -3.49530029296875, -3.3521728515625, -3.20904541015625, -3.06591796875, -2.92279052734375, -2.7796630859375, -2.63653564453125, -2.493408203125, -2.35028076171875, -2.2071533203125, -2.06402587890625, -1.9208984375, -1.77777099609375, -1.6346435546875, -1.49151611328125, -1.348388671875, -1.20526123046875, -1.0621337890625, -0.91900634765625, -0.77587890625, -0.63275146484375, -0.4896240234375, -0.34649658203125, -0.203369140625, -0.06024169921875, 0.0828857421875, 0.22601318359375, 0.369140625, 0.51226806640625, 0.6553955078125, 0.79852294921875, 0.941650390625, 1.08477783203125, 1.2279052734375, 1.37103271484375, 1.51416015625, 1.65728759765625, 1.8004150390625, 1.94354248046875, 2.086669921875, 2.22979736328125, 2.3729248046875, 2.51605224609375, 2.6591796875, 2.80230712890625, 2.9454345703125, 3.08856201171875, 3.231689453125, 3.37481689453125, 3.5179443359375, 3.66107177734375, 3.80419921875, 3.94732666015625, 4.0904541015625, 4.23358154296875, 4.376708984375, 4.51983642578125, 4.6629638671875, 4.80609130859375, 4.94921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 5.0, 3.0, 9.0, 6.0, 11.0, 15.0, 23.0, 25.0, 45.0, 62.0, 79.0, 141.0, 178.0, 273.0, 371.0, 587.0, 965.0, 1589.0, 2702.0, 4812.0, 9713.0, 20942.0, 53623.0, 178141.0, 906545.0, 2197312.0, 605421.0, 130801.0, 43124.0, 17898.0, 8434.0, 4228.0, 2331.0, 1401.0, 831.0, 545.0, 336.0, 244.0, 159.0, 111.0, 79.0, 45.0, 28.0, 27.0, 17.0, 17.0, 13.0, 9.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.515625, -8.225830078125, -7.93603515625, -7.646240234375, -7.3564453125, -7.066650390625, -6.77685546875, -6.487060546875, -6.197265625, -5.907470703125, -5.61767578125, -5.327880859375, -5.0380859375, -4.748291015625, -4.45849609375, -4.168701171875, -3.87890625, -3.589111328125, -3.29931640625, -3.009521484375, -2.7197265625, -2.429931640625, -2.14013671875, -1.850341796875, -1.560546875, -1.270751953125, -0.98095703125, -0.691162109375, -0.4013671875, -0.111572265625, 0.17822265625, 0.468017578125, 0.7578125, 1.047607421875, 1.33740234375, 1.627197265625, 1.9169921875, 2.206787109375, 2.49658203125, 2.786376953125, 3.076171875, 3.365966796875, 3.65576171875, 3.945556640625, 4.2353515625, 4.525146484375, 4.81494140625, 5.104736328125, 5.39453125, 5.684326171875, 5.97412109375, 6.263916015625, 6.5537109375, 6.843505859375, 7.13330078125, 7.423095703125, 7.712890625, 8.002685546875, 8.29248046875, 8.582275390625, 8.8720703125, 9.161865234375, 9.45166015625, 9.741455078125, 10.03125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 8.0, 4.0, 9.0, 7.0, 15.0, 14.0, 19.0, 18.0, 38.0, 46.0, 52.0, 55.0, 84.0, 94.0, 157.0, 207.0, 225.0, 328.0, 379.0, 428.0, 405.0, 333.0, 251.0, 190.0, 169.0, 121.0, 95.0, 60.0, 58.0, 38.0, 36.0, 33.0, 24.0, 15.0, 13.0, 11.0, 9.0, 3.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.609375, -9.32421875, -9.0390625, -8.75390625, -8.46875, -8.18359375, -7.8984375, -7.61328125, -7.328125, -7.04296875, -6.7578125, -6.47265625, -6.1875, -5.90234375, -5.6171875, -5.33203125, -5.046875, -4.76171875, -4.4765625, -4.19140625, -3.90625, -3.62109375, -3.3359375, -3.05078125, -2.765625, -2.48046875, -2.1953125, -1.91015625, -1.625, -1.33984375, -1.0546875, -0.76953125, -0.484375, -0.19921875, 0.0859375, 0.37109375, 0.65625, 0.94140625, 1.2265625, 1.51171875, 1.796875, 2.08203125, 2.3671875, 2.65234375, 2.9375, 3.22265625, 3.5078125, 3.79296875, 4.078125, 4.36328125, 4.6484375, 4.93359375, 5.21875, 5.50390625, 5.7890625, 6.07421875, 6.359375, 6.64453125, 6.9296875, 7.21484375, 7.5, 7.78515625, 8.0703125, 8.35546875, 8.640625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 0.0, 4.0, 2.0, 8.0, 6.0, 14.0, 14.0, 16.0, 23.0, 41.0, 56.0, 79.0, 94.0, 139.0, 197.0, 298.0, 431.0, 640.0, 898.0, 1488.0, 2223.0, 3470.0, 5587.0, 9057.0, 15953.0, 29921.0, 60525.0, 138419.0, 370892.0, 1126825.0, 1513693.0, 550841.0, 193756.0, 80983.0, 38336.0, 19867.0, 11194.0, 6671.0, 3944.0, 2485.0, 1659.0, 1140.0, 728.0, 548.0, 334.0, 242.0, 176.0, 99.0, 67.0, 69.0, 45.0, 39.0, 17.0, 12.0, 7.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0], "bins": [-9.8828125, -9.5849609375, -9.287109375, -8.9892578125, -8.69140625, -8.3935546875, -8.095703125, -7.7978515625, -7.5, -7.2021484375, -6.904296875, -6.6064453125, -6.30859375, -6.0107421875, -5.712890625, -5.4150390625, -5.1171875, -4.8193359375, -4.521484375, -4.2236328125, -3.92578125, -3.6279296875, -3.330078125, -3.0322265625, -2.734375, -2.4365234375, -2.138671875, -1.8408203125, -1.54296875, -1.2451171875, -0.947265625, -0.6494140625, -0.3515625, -0.0537109375, 0.244140625, 0.5419921875, 0.83984375, 1.1376953125, 1.435546875, 1.7333984375, 2.03125, 2.3291015625, 2.626953125, 2.9248046875, 3.22265625, 3.5205078125, 3.818359375, 4.1162109375, 4.4140625, 4.7119140625, 5.009765625, 5.3076171875, 5.60546875, 5.9033203125, 6.201171875, 6.4990234375, 6.796875, 7.0947265625, 7.392578125, 7.6904296875, 7.98828125, 8.2861328125, 8.583984375, 8.8818359375, 9.1796875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 8.0, 4.0, 7.0, 17.0, 14.0, 22.0, 31.0, 38.0, 39.0, 62.0, 51.0, 70.0, 63.0, 67.0, 61.0, 59.0, 85.0, 53.0, 55.0, 55.0, 38.0, 21.0, 18.0, 21.0, 16.0, 8.0, 6.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-51.06288146972656, -49.68735885620117, -48.31183624267578, -46.936317443847656, -45.560794830322266, -44.185272216796875, -42.809749603271484, -41.434226989746094, -40.05870819091797, -38.68318557739258, -37.30766296386719, -35.93214416503906, -34.55662155151367, -33.18109893798828, -31.80557632446289, -30.4300537109375, -29.05453109741211, -27.67900848388672, -26.30348777770996, -24.92796516418457, -23.552444458007812, -22.176921844482422, -20.80139923095703, -19.42587661743164, -18.050355911254883, -16.674833297729492, -15.299312591552734, -13.923789978027344, -12.54826831817627, -11.172746658325195, -9.797224044799805, -8.42170238494873, -7.046176910400391, -5.670655250549316, -4.295133113861084, -2.9196109771728516, -1.5440893173217773, -0.16856765747070312, 1.2069549560546875, 2.5824766159057617, 3.957998275756836, 5.33351993560791, 6.709042072296143, 8.084564208984375, 9.46008586883545, 10.835607528686523, 12.211130142211914, 13.586651802062988, 14.962173461914062, 16.337696075439453, 17.71321678161621, 19.0887393951416, 20.46426010131836, 21.83978271484375, 23.21530532836914, 24.59082794189453, 25.96634864807129, 27.34187126159668, 28.717391967773438, 30.092914581298828, 31.46843719482422, 32.843955993652344, 34.219482421875, 35.595001220703125, 36.970523834228516]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 3.0, 4.0, 4.0, 6.0, 9.0, 11.0, 8.0, 15.0, 18.0, 21.0, 25.0, 23.0, 30.0, 29.0, 40.0, 41.0, 42.0, 47.0, 41.0, 49.0, 55.0, 49.0, 50.0, 32.0, 23.0, 35.0, 42.0, 38.0, 28.0, 28.0, 31.0, 15.0, 22.0, 18.0, 11.0, 12.0, 13.0, 8.0, 10.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.034820556640625, -37.83819580078125, -36.641571044921875, -35.444950103759766, -34.24832534790039, -33.051700592041016, -31.85507583618164, -30.6584529876709, -29.461830139160156, -28.26520538330078, -27.06858253479004, -25.871957778930664, -24.675334930419922, -23.478710174560547, -22.282085418701172, -21.08546257019043, -19.888837814331055, -18.69221305847168, -17.495590209960938, -16.298965454101562, -15.10234260559082, -13.905717849731445, -12.709094047546387, -11.512470245361328, -10.31584644317627, -9.119222640991211, -7.922598838806152, -6.7259745597839355, -5.529350757598877, -4.332726955413818, -3.1361026763916016, -1.939478874206543, -0.7428550720214844, 0.45376884937286377, 1.650392770767212, 2.8470168113708496, 4.043640613555908, 5.240264415740967, 6.436888694763184, 7.633512496948242, 8.8301362991333, 10.02676010131836, 11.223383903503418, 12.420007705688477, 13.616632461547852, 14.813255310058594, 16.00988006591797, 17.206504821777344, 18.403127670288086, 19.59975242614746, 20.796375274658203, 21.993000030517578, 23.18962287902832, 24.386247634887695, 25.582870483398438, 26.779495239257812, 27.976119995117188, 29.172744750976562, 30.369367599487305, 31.56599235534668, 32.76261520385742, 33.9592399597168, 35.15586471557617, 36.35248565673828, 37.549110412597656]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 8.0, 8.0, 2.0, 3.0, 11.0, 7.0, 9.0, 10.0, 5.0, 19.0, 12.0, 20.0, 20.0, 24.0, 25.0, 35.0, 33.0, 37.0, 32.0, 29.0, 35.0, 33.0, 38.0, 41.0, 29.0, 45.0, 42.0, 42.0, 34.0, 29.0, 31.0, 36.0, 18.0, 24.0, 27.0, 19.0, 21.0, 31.0, 10.0, 17.0, 10.0, 4.0, 8.0, 9.0, 5.0, 8.0, 5.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-4.34375, -4.21307373046875, -4.0823974609375, -3.95172119140625, -3.821044921875, -3.69036865234375, -3.5596923828125, -3.42901611328125, -3.29833984375, -3.16766357421875, -3.0369873046875, -2.90631103515625, -2.775634765625, -2.64495849609375, -2.5142822265625, -2.38360595703125, -2.2529296875, -2.12225341796875, -1.9915771484375, -1.86090087890625, -1.730224609375, -1.59954833984375, -1.4688720703125, -1.33819580078125, -1.20751953125, -1.07684326171875, -0.9461669921875, -0.81549072265625, -0.684814453125, -0.55413818359375, -0.4234619140625, -0.29278564453125, -0.162109375, -0.03143310546875, 0.0992431640625, 0.22991943359375, 0.360595703125, 0.49127197265625, 0.6219482421875, 0.75262451171875, 0.88330078125, 1.01397705078125, 1.1446533203125, 1.27532958984375, 1.406005859375, 1.53668212890625, 1.6673583984375, 1.79803466796875, 1.9287109375, 2.05938720703125, 2.1900634765625, 2.32073974609375, 2.451416015625, 2.58209228515625, 2.7127685546875, 2.84344482421875, 2.97412109375, 3.10479736328125, 3.2354736328125, 3.36614990234375, 3.496826171875, 3.62750244140625, 3.7581787109375, 3.88885498046875, 4.01953125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 14.0, 7.0, 20.0, 17.0, 55.0, 57.0, 100.0, 176.0, 206.0, 361.0, 565.0, 853.0, 1294.0, 2012.0, 3003.0, 4800.0, 7369.0, 11391.0, 17719.0, 27958.0, 45684.0, 80800.0, 162051.0, 276622.0, 182730.0, 89438.0, 49543.0, 30100.0, 18894.0, 12200.0, 7871.0, 5196.0, 3317.0, 2176.0, 1342.0, 888.0, 594.0, 392.0, 277.0, 135.0, 104.0, 74.0, 47.0, 35.0, 18.0, 17.0, 13.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.453125, -8.1673583984375, -7.881591796875, -7.5958251953125, -7.31005859375, -7.0242919921875, -6.738525390625, -6.4527587890625, -6.1669921875, -5.8812255859375, -5.595458984375, -5.3096923828125, -5.02392578125, -4.7381591796875, -4.452392578125, -4.1666259765625, -3.880859375, -3.5950927734375, -3.309326171875, -3.0235595703125, -2.73779296875, -2.4520263671875, -2.166259765625, -1.8804931640625, -1.5947265625, -1.3089599609375, -1.023193359375, -0.7374267578125, -0.45166015625, -0.1658935546875, 0.119873046875, 0.4056396484375, 0.69140625, 0.9771728515625, 1.262939453125, 1.5487060546875, 1.83447265625, 2.1202392578125, 2.406005859375, 2.6917724609375, 2.9775390625, 3.2633056640625, 3.549072265625, 3.8348388671875, 4.12060546875, 4.4063720703125, 4.692138671875, 4.9779052734375, 5.263671875, 5.5494384765625, 5.835205078125, 6.1209716796875, 6.40673828125, 6.6925048828125, 6.978271484375, 7.2640380859375, 7.5498046875, 7.8355712890625, 8.121337890625, 8.4071044921875, 8.69287109375, 8.9786376953125, 9.264404296875, 9.5501708984375, 9.8359375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 8.0, 3.0, 9.0, 17.0, 12.0, 21.0, 16.0, 14.0, 29.0, 19.0, 29.0, 25.0, 22.0, 31.0, 51.0, 42.0, 32.0, 45.0, 49.0, 1067.0, 38.0, 42.0, 38.0, 51.0, 38.0, 29.0, 30.0, 36.0, 28.0, 26.0, 18.0, 13.0, 14.0, 11.0, 12.0, 16.0, 10.0, 7.0, 9.0, 10.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-4.0703125, -3.954376220703125, -3.83843994140625, -3.722503662109375, -3.6065673828125, -3.490631103515625, -3.37469482421875, -3.258758544921875, -3.142822265625, -3.026885986328125, -2.91094970703125, -2.795013427734375, -2.6790771484375, -2.563140869140625, -2.44720458984375, -2.331268310546875, -2.21533203125, -2.099395751953125, -1.98345947265625, -1.867523193359375, -1.7515869140625, -1.635650634765625, -1.51971435546875, -1.403778076171875, -1.287841796875, -1.171905517578125, -1.05596923828125, -0.940032958984375, -0.8240966796875, -0.708160400390625, -0.59222412109375, -0.476287841796875, -0.3603515625, -0.244415283203125, -0.12847900390625, -0.012542724609375, 0.1033935546875, 0.219329833984375, 0.33526611328125, 0.451202392578125, 0.567138671875, 0.683074951171875, 0.79901123046875, 0.914947509765625, 1.0308837890625, 1.146820068359375, 1.26275634765625, 1.378692626953125, 1.49462890625, 1.610565185546875, 1.72650146484375, 1.842437744140625, 1.9583740234375, 2.074310302734375, 2.19024658203125, 2.306182861328125, 2.422119140625, 2.538055419921875, 2.65399169921875, 2.769927978515625, 2.8858642578125, 3.001800537109375, 3.11773681640625, 3.233673095703125, 3.349609375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 10.0, 8.0, 16.0, 19.0, 17.0, 32.0, 56.0, 73.0, 91.0, 150.0, 217.0, 304.0, 398.0, 626.0, 942.0, 1418.0, 2293.0, 3998.0, 7706.0, 16696.0, 42097.0, 131196.0, 756985.0, 911964.0, 140116.0, 43806.0, 17289.0, 7870.0, 4103.0, 2303.0, 1378.0, 934.0, 598.0, 401.0, 300.0, 191.0, 155.0, 111.0, 84.0, 47.0, 40.0, 34.0, 30.0, 10.0, 7.0, 7.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.1796875, -10.807373046875, -10.43505859375, -10.062744140625, -9.6904296875, -9.318115234375, -8.94580078125, -8.573486328125, -8.201171875, -7.828857421875, -7.45654296875, -7.084228515625, -6.7119140625, -6.339599609375, -5.96728515625, -5.594970703125, -5.22265625, -4.850341796875, -4.47802734375, -4.105712890625, -3.7333984375, -3.361083984375, -2.98876953125, -2.616455078125, -2.244140625, -1.871826171875, -1.49951171875, -1.127197265625, -0.7548828125, -0.382568359375, -0.01025390625, 0.362060546875, 0.734375, 1.106689453125, 1.47900390625, 1.851318359375, 2.2236328125, 2.595947265625, 2.96826171875, 3.340576171875, 3.712890625, 4.085205078125, 4.45751953125, 4.829833984375, 5.2021484375, 5.574462890625, 5.94677734375, 6.319091796875, 6.69140625, 7.063720703125, 7.43603515625, 7.808349609375, 8.1806640625, 8.552978515625, 8.92529296875, 9.297607421875, 9.669921875, 10.042236328125, 10.41455078125, 10.786865234375, 11.1591796875, 11.531494140625, 11.90380859375, 12.276123046875, 12.6484375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 7.0, 8.0, 7.0, 7.0, 12.0, 13.0, 25.0, 23.0, 35.0, 46.0, 62.0, 91.0, 112.0, 137.0, 94.0, 69.0, 63.0, 39.0, 20.0, 21.0, 20.0, 14.0, 10.0, 13.0, 5.0, 7.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.25390625, -4.12200927734375, -3.9901123046875, -3.85821533203125, -3.726318359375, -3.59442138671875, -3.4625244140625, -3.33062744140625, -3.19873046875, -3.06683349609375, -2.9349365234375, -2.80303955078125, -2.671142578125, -2.53924560546875, -2.4073486328125, -2.27545166015625, -2.1435546875, -2.01165771484375, -1.8797607421875, -1.74786376953125, -1.615966796875, -1.48406982421875, -1.3521728515625, -1.22027587890625, -1.08837890625, -0.95648193359375, -0.8245849609375, -0.69268798828125, -0.560791015625, -0.42889404296875, -0.2969970703125, -0.16510009765625, -0.033203125, 0.09869384765625, 0.2305908203125, 0.36248779296875, 0.494384765625, 0.62628173828125, 0.7581787109375, 0.89007568359375, 1.02197265625, 1.15386962890625, 1.2857666015625, 1.41766357421875, 1.549560546875, 1.68145751953125, 1.8133544921875, 1.94525146484375, 2.0771484375, 2.20904541015625, 2.3409423828125, 2.47283935546875, 2.604736328125, 2.73663330078125, 2.8685302734375, 3.00042724609375, 3.13232421875, 3.26422119140625, 3.3961181640625, 3.52801513671875, 3.659912109375, 3.79180908203125, 3.9237060546875, 4.05560302734375, 4.1875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 2.0, 7.0, 7.0, 7.0, 5.0, 16.0, 21.0, 26.0, 49.0, 55.0, 108.0, 185.0, 595.0, 3274.0, 42399.0, 965290.0, 32746.0, 2699.0, 579.0, 196.0, 96.0, 43.0, 36.0, 32.0, 17.0, 11.0, 10.0, 8.0, 9.0, 5.0, 2.0, 6.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.375, -64.1220703125, -61.869140625, -59.6162109375, -57.36328125, -55.1103515625, -52.857421875, -50.6044921875, -48.3515625, -46.0986328125, -43.845703125, -41.5927734375, -39.33984375, -37.0869140625, -34.833984375, -32.5810546875, -30.328125, -28.0751953125, -25.822265625, -23.5693359375, -21.31640625, -19.0634765625, -16.810546875, -14.5576171875, -12.3046875, -10.0517578125, -7.798828125, -5.5458984375, -3.29296875, -1.0400390625, 1.212890625, 3.4658203125, 5.71875, 7.9716796875, 10.224609375, 12.4775390625, 14.73046875, 16.9833984375, 19.236328125, 21.4892578125, 23.7421875, 25.9951171875, 28.248046875, 30.5009765625, 32.75390625, 35.0068359375, 37.259765625, 39.5126953125, 41.765625, 44.0185546875, 46.271484375, 48.5244140625, 50.77734375, 53.0302734375, 55.283203125, 57.5361328125, 59.7890625, 62.0419921875, 64.294921875, 66.5478515625, 68.80078125, 71.0537109375, 73.306640625, 75.5595703125, 77.8125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 7.0, 17.0, 15.0, 18.0, 33.0, 30.0, 44.0, 43.0, 87.0, 78.0, 106.0, 99.0, 94.0, 67.0, 64.0, 54.0, 29.0, 29.0, 18.0, 14.0, 16.0, 5.0, 11.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0], "bins": [-7.829045295715332, -7.630431175231934, -7.431817531585693, -7.233203887939453, -7.034589767456055, -6.835975646972656, -6.637362003326416, -6.438748359680176, -6.240134239196777, -6.041520118713379, -5.842906475067139, -5.644292831420898, -5.4456787109375, -5.247064590454102, -5.048450946807861, -4.849837303161621, -4.651223182678223, -4.452609062194824, -4.253995418548584, -4.055381774902344, -3.8567676544189453, -3.658153772354126, -3.4595398902893066, -3.2609260082244873, -3.062312126159668, -2.8636982440948486, -2.6650843620300293, -2.46647047996521, -2.2678565979003906, -2.0692427158355713, -1.870628833770752, -1.6720149517059326, -1.4734010696411133, -1.274787187576294, -1.0761733055114746, -0.8775594234466553, -0.6789455413818359, -0.4803316593170166, -0.28171777725219727, -0.08310389518737793, 0.1155099868774414, 0.31412386894226074, 0.5127377510070801, 0.7113516330718994, 0.9099655151367188, 1.108579397201538, 1.3071932792663574, 1.5058071613311768, 1.704421043395996, 1.9030349254608154, 2.1016488075256348, 2.300262689590454, 2.4988765716552734, 2.6974904537200928, 2.896104335784912, 3.0947182178497314, 3.293332099914551, 3.49194598197937, 3.6905598640441895, 3.889173746109009, 4.087787628173828, 4.286401748657227, 4.485015392303467, 4.683629035949707, 4.8822431564331055]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 7.0, 4.0, 7.0, 7.0, 13.0, 15.0, 17.0, 12.0, 15.0, 30.0, 38.0, 25.0, 24.0, 37.0, 35.0, 40.0, 30.0, 43.0, 49.0, 40.0, 53.0, 38.0, 51.0, 40.0, 30.0, 38.0, 31.0, 45.0, 30.0, 20.0, 28.0, 23.0, 24.0, 13.0, 8.0, 11.0, 13.0, 13.0, 5.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.798518180847168, -2.6885170936584473, -2.5785157680511475, -2.4685146808624268, -2.358513593673706, -2.2485122680664062, -2.1385111808776855, -2.028510093688965, -1.9185090065002441, -1.8085078001022339, -1.6985067129135132, -1.588505506515503, -1.4785044193267822, -1.368503212928772, -1.2585020065307617, -1.148500919342041, -1.0384997129440308, -0.9284985661506653, -0.8184974193572998, -0.7084962129592896, -0.5984951257705688, -0.4884939193725586, -0.3784927725791931, -0.26849162578582764, -0.15849047899246216, -0.04848932474851608, 0.06151182949542999, 0.17151299118995667, 0.28151413798332214, 0.39151531457901, 0.5015164613723755, 0.611517608165741, 0.7215187549591064, 0.8315199017524719, 0.9415210485458374, 1.0515222549438477, 1.1615233421325684, 1.2715245485305786, 1.3815257549285889, 1.4915268421173096, 1.6015279293060303, 1.7115291357040405, 1.8215302228927612, 1.9315314292907715, 2.041532516479492, 2.151533603668213, 2.2615349292755127, 2.3715360164642334, 2.481537342071533, 2.591538429260254, 2.7015397548675537, 2.8115408420562744, 2.921541929244995, 3.031543254852295, 3.1415443420410156, 3.2515454292297363, 3.361546516418457, 3.4715476036071777, 3.5815489292144775, 3.6915500164031982, 3.801551103591919, 3.9115524291992188, 4.0215535163879395, 4.13155460357666, 4.241555690765381]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 8.0, 5.0, 9.0, 5.0, 12.0, 14.0, 13.0, 14.0, 7.0, 16.0, 21.0, 21.0, 25.0, 28.0, 30.0, 42.0, 44.0, 38.0, 42.0, 39.0, 38.0, 36.0, 30.0, 49.0, 39.0, 36.0, 38.0, 28.0, 31.0, 33.0, 32.0, 25.0, 29.0, 21.0, 7.0, 17.0, 16.0, 6.0, 7.0, 11.0, 9.0, 10.0, 8.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.1875, -4.052001953125, -3.91650390625, -3.781005859375, -3.6455078125, -3.510009765625, -3.37451171875, -3.239013671875, -3.103515625, -2.968017578125, -2.83251953125, -2.697021484375, -2.5615234375, -2.426025390625, -2.29052734375, -2.155029296875, -2.01953125, -1.884033203125, -1.74853515625, -1.613037109375, -1.4775390625, -1.342041015625, -1.20654296875, -1.071044921875, -0.935546875, -0.800048828125, -0.66455078125, -0.529052734375, -0.3935546875, -0.258056640625, -0.12255859375, 0.012939453125, 0.1484375, 0.283935546875, 0.41943359375, 0.554931640625, 0.6904296875, 0.825927734375, 0.96142578125, 1.096923828125, 1.232421875, 1.367919921875, 1.50341796875, 1.638916015625, 1.7744140625, 1.909912109375, 2.04541015625, 2.180908203125, 2.31640625, 2.451904296875, 2.58740234375, 2.722900390625, 2.8583984375, 2.993896484375, 3.12939453125, 3.264892578125, 3.400390625, 3.535888671875, 3.67138671875, 3.806884765625, 3.9423828125, 4.077880859375, 4.21337890625, 4.348876953125, 4.484375]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 12.0, 8.0, 9.0, 16.0, 22.0, 25.0, 37.0, 63.0, 96.0, 154.0, 251.0, 488.0, 744.0, 1215.0, 2061.0, 3646.0, 6464.0, 12103.0, 23424.0, 50196.0, 125307.0, 336634.0, 291366.0, 105566.0, 43336.0, 20703.0, 10748.0, 5954.0, 3228.0, 1853.0, 1037.0, 677.0, 398.0, 262.0, 137.0, 117.0, 65.0, 52.0, 33.0, 22.0, 12.0, 6.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.4681396484375, -5.272216796875, -5.0762939453125, -4.88037109375, -4.6844482421875, -4.488525390625, -4.2926025390625, -4.0966796875, -3.9007568359375, -3.704833984375, -3.5089111328125, -3.31298828125, -3.1170654296875, -2.921142578125, -2.7252197265625, -2.529296875, -2.3333740234375, -2.137451171875, -1.9415283203125, -1.74560546875, -1.5496826171875, -1.353759765625, -1.1578369140625, -0.9619140625, -0.7659912109375, -0.570068359375, -0.3741455078125, -0.17822265625, 0.0177001953125, 0.213623046875, 0.4095458984375, 0.60546875, 0.8013916015625, 0.997314453125, 1.1932373046875, 1.38916015625, 1.5850830078125, 1.781005859375, 1.9769287109375, 2.1728515625, 2.3687744140625, 2.564697265625, 2.7606201171875, 2.95654296875, 3.1524658203125, 3.348388671875, 3.5443115234375, 3.740234375, 3.9361572265625, 4.132080078125, 4.3280029296875, 4.52392578125, 4.7198486328125, 4.915771484375, 5.1116943359375, 5.3076171875, 5.5035400390625, 5.699462890625, 5.8953857421875, 6.09130859375, 6.2872314453125, 6.483154296875, 6.6790771484375, 6.875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 2.0, 6.0, 4.0, 10.0, 13.0, 7.0, 14.0, 7.0, 16.0, 22.0, 18.0, 37.0, 26.0, 28.0, 36.0, 45.0, 39.0, 50.0, 70.0, 108.0, 202.0, 1326.0, 272.0, 174.0, 84.0, 67.0, 48.0, 37.0, 29.0, 35.0, 45.0, 22.0, 26.0, 22.0, 21.0, 16.0, 8.0, 16.0, 8.0, 12.0, 4.0, 7.0, 5.0, 6.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.5234375, -14.0367431640625, -13.550048828125, -13.0633544921875, -12.57666015625, -12.0899658203125, -11.603271484375, -11.1165771484375, -10.6298828125, -10.1431884765625, -9.656494140625, -9.1697998046875, -8.68310546875, -8.1964111328125, -7.709716796875, -7.2230224609375, -6.736328125, -6.2496337890625, -5.762939453125, -5.2762451171875, -4.78955078125, -4.3028564453125, -3.816162109375, -3.3294677734375, -2.8427734375, -2.3560791015625, -1.869384765625, -1.3826904296875, -0.89599609375, -0.4093017578125, 0.077392578125, 0.5640869140625, 1.05078125, 1.5374755859375, 2.024169921875, 2.5108642578125, 2.99755859375, 3.4842529296875, 3.970947265625, 4.4576416015625, 4.9443359375, 5.4310302734375, 5.917724609375, 6.4044189453125, 6.89111328125, 7.3778076171875, 7.864501953125, 8.3511962890625, 8.837890625, 9.3245849609375, 9.811279296875, 10.2979736328125, 10.78466796875, 11.2713623046875, 11.758056640625, 12.2447509765625, 12.7314453125, 13.2181396484375, 13.704833984375, 14.1915283203125, 14.67822265625, 15.1649169921875, 15.651611328125, 16.1383056640625, 16.625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 9.0, 9.0, 18.0, 17.0, 21.0, 25.0, 41.0, 60.0, 74.0, 105.0, 146.0, 275.0, 447.0, 1219.0, 4732.0, 48747.0, 2511391.0, 557254.0, 16567.0, 2613.0, 825.0, 407.0, 236.0, 124.0, 93.0, 58.0, 48.0, 32.0, 20.0, 24.0, 11.0, 12.0, 11.0, 6.0, 5.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.796875, -26.8642578125, -25.931640625, -24.9990234375, -24.06640625, -23.1337890625, -22.201171875, -21.2685546875, -20.3359375, -19.4033203125, -18.470703125, -17.5380859375, -16.60546875, -15.6728515625, -14.740234375, -13.8076171875, -12.875, -11.9423828125, -11.009765625, -10.0771484375, -9.14453125, -8.2119140625, -7.279296875, -6.3466796875, -5.4140625, -4.4814453125, -3.548828125, -2.6162109375, -1.68359375, -0.7509765625, 0.181640625, 1.1142578125, 2.046875, 2.9794921875, 3.912109375, 4.8447265625, 5.77734375, 6.7099609375, 7.642578125, 8.5751953125, 9.5078125, 10.4404296875, 11.373046875, 12.3056640625, 13.23828125, 14.1708984375, 15.103515625, 16.0361328125, 16.96875, 17.9013671875, 18.833984375, 19.7666015625, 20.69921875, 21.6318359375, 22.564453125, 23.4970703125, 24.4296875, 25.3623046875, 26.294921875, 27.2275390625, 28.16015625, 29.0927734375, 30.025390625, 30.9580078125, 31.890625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 164.0, 833.0, 19.0, 1.0], "bins": [-866.4425659179688, -852.288818359375, -838.135009765625, -823.9812622070312, -809.8275146484375, -795.6737060546875, -781.5199584960938, -767.3662109375, -753.21240234375, -739.0586547851562, -724.9048461914062, -710.7510986328125, -696.5973510742188, -682.4435424804688, -668.289794921875, -654.1360473632812, -639.9822998046875, -625.8285522460938, -611.6747436523438, -597.52099609375, -583.3672485351562, -569.2134399414062, -555.0596923828125, -540.9059448242188, -526.7521362304688, -512.598388671875, -498.4446105957031, -484.29083251953125, -470.1370544433594, -455.9832763671875, -441.82952880859375, -427.6757507324219, -413.52197265625, -399.3681945800781, -385.2144470214844, -371.0606689453125, -356.9068908691406, -342.75311279296875, -328.599365234375, -314.4455871582031, -300.29180908203125, -286.1380310058594, -271.9842834472656, -257.83050537109375, -243.67672729492188, -229.52296447753906, -215.36920166015625, -201.21542358398438, -187.06167602539062, -172.9079132080078, -158.75413513183594, -144.60037231445312, -130.44659423828125, -116.29283142089844, -102.13906860351562, -87.98529815673828, -73.83152770996094, -59.677757263183594, -45.523990631103516, -31.370223999023438, -17.216453552246094, -3.06268310546875, 11.091079711914062, 25.244850158691406, 39.398624420166016]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 3.0, 2.0, 8.0, 5.0, 7.0, 11.0, 14.0, 19.0, 15.0, 19.0, 21.0, 31.0, 36.0, 36.0, 34.0, 45.0, 43.0, 38.0, 41.0, 49.0, 29.0, 46.0, 53.0, 47.0, 43.0, 33.0, 31.0, 26.0, 33.0, 32.0, 19.0, 15.0, 21.0, 14.0, 15.0, 20.0, 17.0, 9.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-40.04397964477539, -38.60231399536133, -37.16065216064453, -35.71898651123047, -34.277320861816406, -32.835655212402344, -31.393991470336914, -29.952327728271484, -28.510662078857422, -27.06899642944336, -25.62733268737793, -24.1856689453125, -22.744003295898438, -21.302337646484375, -19.860673904418945, -18.419010162353516, -16.977344512939453, -15.535679817199707, -14.094015121459961, -12.652350425720215, -11.210685729980469, -9.769021034240723, -8.327356338500977, -6.8856916427612305, -5.444026947021484, -4.002362251281738, -2.560697555541992, -1.119032859802246, 0.3226318359375, 1.764296531677246, 3.205961227416992, 4.647625923156738, 6.089290618896484, 7.5309553146362305, 8.972620010375977, 10.414284706115723, 11.855949401855469, 13.297614097595215, 14.739278793334961, 16.18094253540039, 17.622608184814453, 19.064273834228516, 20.505937576293945, 21.947601318359375, 23.389266967773438, 24.8309326171875, 26.27259635925293, 27.71426010131836, 29.155925750732422, 30.597591400146484, 32.03925323486328, 33.480918884277344, 34.922584533691406, 36.36425018310547, 37.80591583251953, 39.24757766723633, 40.68924331665039, 42.13090896606445, 43.57257080078125, 45.01423645019531, 46.455902099609375, 47.89756774902344, 49.3392333984375, 50.7808952331543, 52.22256088256836]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 9.0, 9.0, 6.0, 15.0, 12.0, 14.0, 10.0, 23.0, 18.0, 34.0, 42.0, 25.0, 34.0, 45.0, 38.0, 42.0, 41.0, 45.0, 53.0, 40.0, 36.0, 44.0, 35.0, 48.0, 38.0, 24.0, 43.0, 23.0, 30.0, 17.0, 17.0, 15.0, 10.0, 12.0, 9.0, 10.0, 6.0, 9.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.76171875, -4.60601806640625, -4.4503173828125, -4.29461669921875, -4.138916015625, -3.98321533203125, -3.8275146484375, -3.67181396484375, -3.51611328125, -3.36041259765625, -3.2047119140625, -3.04901123046875, -2.893310546875, -2.73760986328125, -2.5819091796875, -2.42620849609375, -2.2705078125, -2.11480712890625, -1.9591064453125, -1.80340576171875, -1.647705078125, -1.49200439453125, -1.3363037109375, -1.18060302734375, -1.02490234375, -0.86920166015625, -0.7135009765625, -0.55780029296875, -0.402099609375, -0.24639892578125, -0.0906982421875, 0.06500244140625, 0.220703125, 0.37640380859375, 0.5321044921875, 0.68780517578125, 0.843505859375, 0.99920654296875, 1.1549072265625, 1.31060791015625, 1.46630859375, 1.62200927734375, 1.7777099609375, 1.93341064453125, 2.089111328125, 2.24481201171875, 2.4005126953125, 2.55621337890625, 2.7119140625, 2.86761474609375, 3.0233154296875, 3.17901611328125, 3.334716796875, 3.49041748046875, 3.6461181640625, 3.80181884765625, 3.95751953125, 4.11322021484375, 4.2689208984375, 4.42462158203125, 4.580322265625, 4.73602294921875, 4.8917236328125, 5.04742431640625, 5.203125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 9.0, 6.0, 17.0, 19.0, 12.0, 22.0, 37.0, 39.0, 62.0, 87.0, 122.0, 175.0, 290.0, 397.0, 615.0, 961.0, 1556.0, 2701.0, 4989.0, 9782.0, 22385.0, 60486.0, 225146.0, 1361117.0, 1997202.0, 363034.0, 84754.0, 29869.0, 13267.0, 6353.0, 3455.0, 1954.0, 1166.0, 793.0, 428.0, 312.0, 200.0, 128.0, 105.0, 83.0, 37.0, 36.0, 23.0, 19.0, 14.0, 9.0, 5.0, 5.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0], "bins": [-11.625, -11.2845458984375, -10.944091796875, -10.6036376953125, -10.26318359375, -9.9227294921875, -9.582275390625, -9.2418212890625, -8.9013671875, -8.5609130859375, -8.220458984375, -7.8800048828125, -7.53955078125, -7.1990966796875, -6.858642578125, -6.5181884765625, -6.177734375, -5.8372802734375, -5.496826171875, -5.1563720703125, -4.81591796875, -4.4754638671875, -4.135009765625, -3.7945556640625, -3.4541015625, -3.1136474609375, -2.773193359375, -2.4327392578125, -2.09228515625, -1.7518310546875, -1.411376953125, -1.0709228515625, -0.73046875, -0.3900146484375, -0.049560546875, 0.2908935546875, 0.63134765625, 0.9718017578125, 1.312255859375, 1.6527099609375, 1.9931640625, 2.3336181640625, 2.674072265625, 3.0145263671875, 3.35498046875, 3.6954345703125, 4.035888671875, 4.3763427734375, 4.716796875, 5.0572509765625, 5.397705078125, 5.7381591796875, 6.07861328125, 6.4190673828125, 6.759521484375, 7.0999755859375, 7.4404296875, 7.7808837890625, 8.121337890625, 8.4617919921875, 8.80224609375, 9.1427001953125, 9.483154296875, 9.8236083984375, 10.1640625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 9.0, 9.0, 9.0, 9.0, 19.0, 17.0, 15.0, 30.0, 50.0, 43.0, 60.0, 68.0, 99.0, 142.0, 183.0, 256.0, 298.0, 395.0, 444.0, 429.0, 362.0, 283.0, 213.0, 149.0, 107.0, 77.0, 59.0, 54.0, 31.0, 34.0, 16.0, 20.0, 22.0, 13.0, 9.0, 8.0, 5.0, 2.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.90625, -9.5838623046875, -9.261474609375, -8.9390869140625, -8.61669921875, -8.2943115234375, -7.971923828125, -7.6495361328125, -7.3271484375, -7.0047607421875, -6.682373046875, -6.3599853515625, -6.03759765625, -5.7152099609375, -5.392822265625, -5.0704345703125, -4.748046875, -4.4256591796875, -4.103271484375, -3.7808837890625, -3.45849609375, -3.1361083984375, -2.813720703125, -2.4913330078125, -2.1689453125, -1.8465576171875, -1.524169921875, -1.2017822265625, -0.87939453125, -0.5570068359375, -0.234619140625, 0.0877685546875, 0.41015625, 0.7325439453125, 1.054931640625, 1.3773193359375, 1.69970703125, 2.0220947265625, 2.344482421875, 2.6668701171875, 2.9892578125, 3.3116455078125, 3.634033203125, 3.9564208984375, 4.27880859375, 4.6011962890625, 4.923583984375, 5.2459716796875, 5.568359375, 5.8907470703125, 6.213134765625, 6.5355224609375, 6.85791015625, 7.1802978515625, 7.502685546875, 7.8250732421875, 8.1474609375, 8.4698486328125, 8.792236328125, 9.1146240234375, 9.43701171875, 9.7593994140625, 10.081787109375, 10.4041748046875, 10.7265625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 10.0, 24.0, 17.0, 32.0, 38.0, 63.0, 100.0, 203.0, 305.0, 612.0, 1049.0, 2032.0, 4391.0, 11083.0, 32821.0, 133647.0, 991762.0, 2568704.0, 348767.0, 65830.0, 19092.0, 7203.0, 3048.0, 1486.0, 809.0, 456.0, 266.0, 138.0, 98.0, 57.0, 31.0, 24.0, 21.0, 15.0, 9.0, 8.0, 5.0, 5.0, 1.0, 2.0, 8.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.6875, -18.0263671875, -17.365234375, -16.7041015625, -16.04296875, -15.3818359375, -14.720703125, -14.0595703125, -13.3984375, -12.7373046875, -12.076171875, -11.4150390625, -10.75390625, -10.0927734375, -9.431640625, -8.7705078125, -8.109375, -7.4482421875, -6.787109375, -6.1259765625, -5.46484375, -4.8037109375, -4.142578125, -3.4814453125, -2.8203125, -2.1591796875, -1.498046875, -0.8369140625, -0.17578125, 0.4853515625, 1.146484375, 1.8076171875, 2.46875, 3.1298828125, 3.791015625, 4.4521484375, 5.11328125, 5.7744140625, 6.435546875, 7.0966796875, 7.7578125, 8.4189453125, 9.080078125, 9.7412109375, 10.40234375, 11.0634765625, 11.724609375, 12.3857421875, 13.046875, 13.7080078125, 14.369140625, 15.0302734375, 15.69140625, 16.3525390625, 17.013671875, 17.6748046875, 18.3359375, 18.9970703125, 19.658203125, 20.3193359375, 20.98046875, 21.6416015625, 22.302734375, 22.9638671875, 23.625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 3.0, 10.0, 10.0, 29.0, 41.0, 65.0, 98.0, 103.0, 155.0, 122.0, 148.0, 85.0, 65.0, 42.0, 19.0, 13.0, 1.0, 3.0, 2.0, 1.0], "bins": [-169.6805419921875, -166.48260498046875, -163.28466796875, -160.0867462158203, -156.88880920410156, -153.6908721923828, -150.49293518066406, -147.29501342773438, -144.09707641601562, -140.89913940429688, -137.70120239257812, -134.50328063964844, -131.3053436279297, -128.10740661621094, -124.90946960449219, -121.71154022216797, -118.51360321044922, -115.31566619873047, -112.11773681640625, -108.9197998046875, -105.72187042236328, -102.52393341064453, -99.32600402832031, -96.12806701660156, -92.93013000488281, -89.73219299316406, -86.53426361083984, -83.3363265991211, -80.13839721679688, -76.94046020507812, -73.74252319335938, -70.54459381103516, -67.34666442871094, -64.14872741699219, -60.95079803466797, -57.75286102294922, -54.554931640625, -51.35699462890625, -48.159061431884766, -44.96112823486328, -41.76319885253906, -38.56526565551758, -35.367332458496094, -32.169395446777344, -28.971464157104492, -25.773530960083008, -22.57559585571289, -19.377662658691406, -16.179729461669922, -12.981796264648438, -9.783862113952637, -6.585927963256836, -3.3879947662353516, -0.1900615692138672, 3.00787353515625, 6.205806732177734, 9.403739929199219, 12.601673126220703, 15.799607276916504, 18.997541427612305, 22.19547462463379, 25.393407821655273, 28.59134292602539, 31.789276123046875, 34.98720932006836]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 6.0, 5.0, 6.0, 5.0, 9.0, 5.0, 16.0, 18.0, 15.0, 18.0, 18.0, 17.0, 19.0, 26.0, 19.0, 28.0, 42.0, 30.0, 49.0, 38.0, 30.0, 48.0, 42.0, 46.0, 51.0, 30.0, 36.0, 29.0, 30.0, 25.0, 46.0, 31.0, 29.0, 25.0, 15.0, 17.0, 18.0, 16.0, 11.0, 9.0, 10.0, 5.0, 10.0, 4.0, 4.0, 1.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.62541198730469, -32.482444763183594, -31.3394775390625, -30.196510314941406, -29.053543090820312, -27.91057586669922, -26.767610549926758, -25.624643325805664, -24.48167610168457, -23.338708877563477, -22.195741653442383, -21.05277442932129, -19.909809112548828, -18.766841888427734, -17.62387466430664, -16.480907440185547, -15.337940216064453, -14.19497299194336, -13.052005767822266, -11.909039497375488, -10.766072273254395, -9.6231050491333, -8.480138778686523, -7.33717155456543, -6.194204330444336, -5.051237106323242, -3.9082703590393066, -2.765303373336792, -1.6223363876342773, -0.4793691635131836, 0.663597583770752, 1.8065643310546875, 2.9495315551757812, 4.092498779296875, 5.2354655265808105, 6.378432273864746, 7.52139949798584, 8.664366722106934, 9.807332992553711, 10.950300216674805, 12.093267440795898, 13.236234664916992, 14.379201889038086, 15.522168159484863, 16.66513442993164, 17.808101654052734, 18.951068878173828, 20.094036102294922, 21.237003326416016, 22.37997055053711, 23.522937774658203, 24.665904998779297, 25.80887222290039, 26.951839447021484, 28.094804763793945, 29.23777198791504, 30.380739212036133, 31.523706436157227, 32.66667175292969, 33.80963897705078, 34.952606201171875, 36.09557342529297, 37.23854064941406, 38.381507873535156, 39.52447509765625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 7.0, 5.0, 10.0, 10.0, 12.0, 10.0, 14.0, 15.0, 17.0, 27.0, 21.0, 37.0, 35.0, 32.0, 42.0, 48.0, 35.0, 38.0, 36.0, 46.0, 40.0, 36.0, 43.0, 47.0, 43.0, 35.0, 33.0, 34.0, 29.0, 26.0, 28.0, 22.0, 17.0, 11.0, 16.0, 10.0, 7.0, 4.0, 4.0, 3.0, 6.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-4.98046875, -4.828125, -4.67578125, -4.5234375, -4.37109375, -4.21875, -4.06640625, -3.9140625, -3.76171875, -3.609375, -3.45703125, -3.3046875, -3.15234375, -3.0, -2.84765625, -2.6953125, -2.54296875, -2.390625, -2.23828125, -2.0859375, -1.93359375, -1.78125, -1.62890625, -1.4765625, -1.32421875, -1.171875, -1.01953125, -0.8671875, -0.71484375, -0.5625, -0.41015625, -0.2578125, -0.10546875, 0.046875, 0.19921875, 0.3515625, 0.50390625, 0.65625, 0.80859375, 0.9609375, 1.11328125, 1.265625, 1.41796875, 1.5703125, 1.72265625, 1.875, 2.02734375, 2.1796875, 2.33203125, 2.484375, 2.63671875, 2.7890625, 2.94140625, 3.09375, 3.24609375, 3.3984375, 3.55078125, 3.703125, 3.85546875, 4.0078125, 4.16015625, 4.3125, 4.46484375, 4.6171875, 4.76953125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 10.0, 12.0, 26.0, 38.0, 59.0, 128.0, 203.0, 368.0, 601.0, 1051.0, 1933.0, 3284.0, 5796.0, 10113.0, 17158.0, 28996.0, 51566.0, 110567.0, 477975.0, 185651.0, 66407.0, 36466.0, 21099.0, 12192.0, 7145.0, 4108.0, 2397.0, 1306.0, 810.0, 476.0, 259.0, 126.0, 82.0, 42.0, 27.0, 23.0, 16.0, 16.0, 8.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.5625, -11.12939453125, -10.6962890625, -10.26318359375, -9.830078125, -9.39697265625, -8.9638671875, -8.53076171875, -8.09765625, -7.66455078125, -7.2314453125, -6.79833984375, -6.365234375, -5.93212890625, -5.4990234375, -5.06591796875, -4.6328125, -4.19970703125, -3.7666015625, -3.33349609375, -2.900390625, -2.46728515625, -2.0341796875, -1.60107421875, -1.16796875, -0.73486328125, -0.3017578125, 0.13134765625, 0.564453125, 0.99755859375, 1.4306640625, 1.86376953125, 2.296875, 2.72998046875, 3.1630859375, 3.59619140625, 4.029296875, 4.46240234375, 4.8955078125, 5.32861328125, 5.76171875, 6.19482421875, 6.6279296875, 7.06103515625, 7.494140625, 7.92724609375, 8.3603515625, 8.79345703125, 9.2265625, 9.65966796875, 10.0927734375, 10.52587890625, 10.958984375, 11.39208984375, 11.8251953125, 12.25830078125, 12.69140625, 13.12451171875, 13.5576171875, 13.99072265625, 14.423828125, 14.85693359375, 15.2900390625, 15.72314453125, 16.15625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 4.0, 3.0, 5.0, 5.0, 11.0, 12.0, 10.0, 15.0, 22.0, 16.0, 17.0, 30.0, 30.0, 23.0, 32.0, 46.0, 33.0, 35.0, 48.0, 44.0, 37.0, 1064.0, 44.0, 29.0, 34.0, 34.0, 48.0, 28.0, 31.0, 32.0, 31.0, 26.0, 18.0, 18.0, 20.0, 18.0, 9.0, 14.0, 7.0, 12.0, 5.0, 3.0, 3.0, 6.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.5, -3.38812255859375, -3.2762451171875, -3.16436767578125, -3.052490234375, -2.94061279296875, -2.8287353515625, -2.71685791015625, -2.60498046875, -2.49310302734375, -2.3812255859375, -2.26934814453125, -2.157470703125, -2.04559326171875, -1.9337158203125, -1.82183837890625, -1.7099609375, -1.59808349609375, -1.4862060546875, -1.37432861328125, -1.262451171875, -1.15057373046875, -1.0386962890625, -0.92681884765625, -0.81494140625, -0.70306396484375, -0.5911865234375, -0.47930908203125, -0.367431640625, -0.25555419921875, -0.1436767578125, -0.03179931640625, 0.080078125, 0.19195556640625, 0.3038330078125, 0.41571044921875, 0.527587890625, 0.63946533203125, 0.7513427734375, 0.86322021484375, 0.97509765625, 1.08697509765625, 1.1988525390625, 1.31072998046875, 1.422607421875, 1.53448486328125, 1.6463623046875, 1.75823974609375, 1.8701171875, 1.98199462890625, 2.0938720703125, 2.20574951171875, 2.317626953125, 2.42950439453125, 2.5413818359375, 2.65325927734375, 2.76513671875, 2.87701416015625, 2.9888916015625, 3.10076904296875, 3.212646484375, 3.32452392578125, 3.4364013671875, 3.54827880859375, 3.66015625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 3.0, 14.0, 12.0, 22.0, 25.0, 36.0, 37.0, 68.0, 98.0, 147.0, 221.0, 294.0, 483.0, 681.0, 1065.0, 1640.0, 2545.0, 4020.0, 6876.0, 12345.0, 22429.0, 46106.0, 106253.0, 365239.0, 1196378.0, 186184.0, 70237.0, 32825.0, 16937.0, 9223.0, 5468.0, 3284.0, 1989.0, 1290.0, 868.0, 581.0, 362.0, 242.0, 198.0, 114.0, 80.0, 53.0, 52.0, 31.0, 19.0, 19.0, 10.0, 10.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.4375, -7.1917724609375, -6.946044921875, -6.7003173828125, -6.45458984375, -6.2088623046875, -5.963134765625, -5.7174072265625, -5.4716796875, -5.2259521484375, -4.980224609375, -4.7344970703125, -4.48876953125, -4.2430419921875, -3.997314453125, -3.7515869140625, -3.505859375, -3.2601318359375, -3.014404296875, -2.7686767578125, -2.52294921875, -2.2772216796875, -2.031494140625, -1.7857666015625, -1.5400390625, -1.2943115234375, -1.048583984375, -0.8028564453125, -0.55712890625, -0.3114013671875, -0.065673828125, 0.1800537109375, 0.42578125, 0.6715087890625, 0.917236328125, 1.1629638671875, 1.40869140625, 1.6544189453125, 1.900146484375, 2.1458740234375, 2.3916015625, 2.6373291015625, 2.883056640625, 3.1287841796875, 3.37451171875, 3.6202392578125, 3.865966796875, 4.1116943359375, 4.357421875, 4.6031494140625, 4.848876953125, 5.0946044921875, 5.34033203125, 5.5860595703125, 5.831787109375, 6.0775146484375, 6.3232421875, 6.5689697265625, 6.814697265625, 7.0604248046875, 7.30615234375, 7.5518798828125, 7.797607421875, 8.0433349609375, 8.2890625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 3.0, 6.0, 9.0, 9.0, 9.0, 14.0, 19.0, 33.0, 54.0, 60.0, 82.0, 214.0, 194.0, 87.0, 59.0, 41.0, 26.0, 13.0, 17.0, 7.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.74609375, -4.6273193359375, -4.508544921875, -4.3897705078125, -4.27099609375, -4.1522216796875, -4.033447265625, -3.9146728515625, -3.7958984375, -3.6771240234375, -3.558349609375, -3.4395751953125, -3.32080078125, -3.2020263671875, -3.083251953125, -2.9644775390625, -2.845703125, -2.7269287109375, -2.608154296875, -2.4893798828125, -2.37060546875, -2.2518310546875, -2.133056640625, -2.0142822265625, -1.8955078125, -1.7767333984375, -1.657958984375, -1.5391845703125, -1.42041015625, -1.3016357421875, -1.182861328125, -1.0640869140625, -0.9453125, -0.8265380859375, -0.707763671875, -0.5889892578125, -0.47021484375, -0.3514404296875, -0.232666015625, -0.1138916015625, 0.0048828125, 0.1236572265625, 0.242431640625, 0.3612060546875, 0.47998046875, 0.5987548828125, 0.717529296875, 0.8363037109375, 0.955078125, 1.0738525390625, 1.192626953125, 1.3114013671875, 1.43017578125, 1.5489501953125, 1.667724609375, 1.7864990234375, 1.9052734375, 2.0240478515625, 2.142822265625, 2.2615966796875, 2.38037109375, 2.4991455078125, 2.617919921875, 2.7366943359375, 2.85546875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 7.0, 11.0, 8.0, 22.0, 24.0, 30.0, 58.0, 123.0, 331.0, 2476.0, 120034.0, 919055.0, 5442.0, 546.0, 166.0, 73.0, 51.0, 27.0, 17.0, 15.0, 6.0, 5.0, 8.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.28125, -49.15771484375, -47.0341796875, -44.91064453125, -42.787109375, -40.66357421875, -38.5400390625, -36.41650390625, -34.29296875, -32.16943359375, -30.0458984375, -27.92236328125, -25.798828125, -23.67529296875, -21.5517578125, -19.42822265625, -17.3046875, -15.18115234375, -13.0576171875, -10.93408203125, -8.810546875, -6.68701171875, -4.5634765625, -2.43994140625, -0.31640625, 1.80712890625, 3.9306640625, 6.05419921875, 8.177734375, 10.30126953125, 12.4248046875, 14.54833984375, 16.671875, 18.79541015625, 20.9189453125, 23.04248046875, 25.166015625, 27.28955078125, 29.4130859375, 31.53662109375, 33.66015625, 35.78369140625, 37.9072265625, 40.03076171875, 42.154296875, 44.27783203125, 46.4013671875, 48.52490234375, 50.6484375, 52.77197265625, 54.8955078125, 57.01904296875, 59.142578125, 61.26611328125, 63.3896484375, 65.51318359375, 67.63671875, 69.76025390625, 71.8837890625, 74.00732421875, 76.130859375, 78.25439453125, 80.3779296875, 82.50146484375, 84.625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 11.0, 17.0, 37.0, 41.0, 77.0, 96.0, 131.0, 152.0, 135.0, 96.0, 67.0, 52.0, 25.0, 24.0, 17.0, 6.0, 9.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.79245662689209, -9.567646980285645, -9.3428373336792, -9.118026733398438, -8.893217086791992, -8.668407440185547, -8.443597793579102, -8.218788146972656, -7.993978023529053, -7.769168376922607, -7.544358253479004, -7.319548606872559, -7.094738960266113, -6.86992883682251, -6.6451191902160645, -6.420309066772461, -6.195499420166016, -5.97068977355957, -5.745879650115967, -5.5210700035095215, -5.296260356903076, -5.071450233459473, -4.846640586853027, -4.621830940246582, -4.397021293640137, -4.172211647033691, -3.947401762008667, -3.7225918769836426, -3.497781991958618, -3.2729721069335938, -3.0481624603271484, -2.823352575302124, -2.5985426902770996, -2.373732805252075, -2.14892315864563, -1.9241132736206055, -1.699303388595581, -1.4744936227798462, -1.2496838569641113, -1.024873971939087, -0.800064206123352, -0.5752543807029724, -0.35044458508491516, -0.1256347894668579, 0.09917503595352173, 0.32398486137390137, 0.5487946271896362, 0.7736045122146606, 0.9984142780303955, 1.2232240438461304, 1.4480339288711548, 1.6728436946868896, 1.897653579711914, 2.1224632263183594, 2.347273111343384, 2.572082996368408, 2.7968926429748535, 3.021702527999878, 3.2465121746063232, 3.4713220596313477, 3.696131944656372, 3.9209418296813965, 4.145751476287842, 4.370561599731445, 4.595371246337891]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 5.0, 13.0, 7.0, 14.0, 14.0, 21.0, 13.0, 20.0, 18.0, 18.0, 22.0, 26.0, 28.0, 37.0, 31.0, 32.0, 29.0, 33.0, 39.0, 38.0, 33.0, 49.0, 40.0, 33.0, 37.0, 31.0, 32.0, 24.0, 30.0, 28.0, 31.0, 23.0, 31.0, 16.0, 17.0, 14.0, 15.0, 8.0, 15.0, 11.0, 4.0, 5.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0], "bins": [-3.768362522125244, -3.6601686477661133, -3.5519750118255615, -3.4437811374664307, -3.3355872631073, -3.227393627166748, -3.119199752807617, -3.0110058784484863, -2.9028120040893555, -2.7946181297302246, -2.686424493789673, -2.578230619430542, -2.470036745071411, -2.3618431091308594, -2.2536492347717285, -2.1454553604125977, -2.037261724472046, -1.9290679693222046, -1.8208740949630737, -1.7126803398132324, -1.6044864654541016, -1.4962927103042603, -1.388098955154419, -1.279905080795288, -1.1717113256454468, -1.0635175704956055, -0.9553236961364746, -0.8471299409866333, -0.7389361262321472, -0.6307423114776611, -0.5225485563278198, -0.41435474157333374, -0.30616068840026855, -0.19796688854694366, -0.08977308869361877, 0.018420696258544922, 0.126614511013031, 0.2348083257675171, 0.3430020809173584, 0.4511958956718445, 0.5593897104263306, 0.6675835251808167, 0.7757773399353027, 0.883971095085144, 0.9921649098396301, 1.1003587245941162, 1.2085524797439575, 1.3167462348937988, 1.4249401092529297, 1.533133864402771, 1.6413277387619019, 1.7495214939117432, 1.857715368270874, 1.9659091234207153, 2.0741028785705566, 2.1822967529296875, 2.2904906272888184, 2.398684501647949, 2.506878137588501, 2.615072011947632, 2.7232658863067627, 2.8314595222473145, 2.9396533966064453, 3.047847270965576, 3.156040906906128]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 6.0, 11.0, 7.0, 11.0, 7.0, 17.0, 16.0, 20.0, 17.0, 28.0, 22.0, 20.0, 25.0, 23.0, 39.0, 45.0, 43.0, 52.0, 39.0, 40.0, 27.0, 41.0, 33.0, 48.0, 39.0, 26.0, 30.0, 28.0, 40.0, 30.0, 24.0, 19.0, 22.0, 18.0, 15.0, 13.0, 11.0, 4.0, 5.0, 3.0, 9.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-4.1328125, -3.99151611328125, -3.8502197265625, -3.70892333984375, -3.567626953125, -3.42633056640625, -3.2850341796875, -3.14373779296875, -3.00244140625, -2.86114501953125, -2.7198486328125, -2.57855224609375, -2.437255859375, -2.29595947265625, -2.1546630859375, -2.01336669921875, -1.8720703125, -1.73077392578125, -1.5894775390625, -1.44818115234375, -1.306884765625, -1.16558837890625, -1.0242919921875, -0.88299560546875, -0.74169921875, -0.60040283203125, -0.4591064453125, -0.31781005859375, -0.176513671875, -0.03521728515625, 0.1060791015625, 0.24737548828125, 0.388671875, 0.52996826171875, 0.6712646484375, 0.81256103515625, 0.953857421875, 1.09515380859375, 1.2364501953125, 1.37774658203125, 1.51904296875, 1.66033935546875, 1.8016357421875, 1.94293212890625, 2.084228515625, 2.22552490234375, 2.3668212890625, 2.50811767578125, 2.6494140625, 2.79071044921875, 2.9320068359375, 3.07330322265625, 3.214599609375, 3.35589599609375, 3.4971923828125, 3.63848876953125, 3.77978515625, 3.92108154296875, 4.0623779296875, 4.20367431640625, 4.344970703125, 4.48626708984375, 4.6275634765625, 4.76885986328125, 4.91015625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 3.0, 10.0, 18.0, 24.0, 22.0, 40.0, 53.0, 81.0, 124.0, 200.0, 276.0, 455.0, 758.0, 1242.0, 2035.0, 3762.0, 6719.0, 12798.0, 25423.0, 54841.0, 124417.0, 293547.0, 291362.0, 122525.0, 53786.0, 25420.0, 12720.0, 6763.0, 3736.0, 2040.0, 1262.0, 735.0, 486.0, 313.0, 182.0, 116.0, 74.0, 63.0, 34.0, 26.0, 23.0, 13.0, 8.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -4.98712158203125, -4.8023681640625, -4.61761474609375, -4.432861328125, -4.24810791015625, -4.0633544921875, -3.87860107421875, -3.69384765625, -3.50909423828125, -3.3243408203125, -3.13958740234375, -2.954833984375, -2.77008056640625, -2.5853271484375, -2.40057373046875, -2.2158203125, -2.03106689453125, -1.8463134765625, -1.66156005859375, -1.476806640625, -1.29205322265625, -1.1072998046875, -0.92254638671875, -0.73779296875, -0.55303955078125, -0.3682861328125, -0.18353271484375, 0.001220703125, 0.18597412109375, 0.3707275390625, 0.55548095703125, 0.740234375, 0.92498779296875, 1.1097412109375, 1.29449462890625, 1.479248046875, 1.66400146484375, 1.8487548828125, 2.03350830078125, 2.21826171875, 2.40301513671875, 2.5877685546875, 2.77252197265625, 2.957275390625, 3.14202880859375, 3.3267822265625, 3.51153564453125, 3.6962890625, 3.88104248046875, 4.0657958984375, 4.25054931640625, 4.435302734375, 4.62005615234375, 4.8048095703125, 4.98956298828125, 5.17431640625, 5.35906982421875, 5.5438232421875, 5.72857666015625, 5.913330078125, 6.09808349609375, 6.2828369140625, 6.46759033203125, 6.65234375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 10.0, 6.0, 11.0, 8.0, 10.0, 14.0, 19.0, 18.0, 26.0, 29.0, 35.0, 30.0, 48.0, 37.0, 55.0, 70.0, 115.0, 250.0, 1484.0, 238.0, 102.0, 67.0, 65.0, 41.0, 39.0, 36.0, 25.0, 25.0, 22.0, 22.0, 17.0, 10.0, 13.0, 15.0, 5.0, 5.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.859375, -15.323974609375, -14.78857421875, -14.253173828125, -13.7177734375, -13.182373046875, -12.64697265625, -12.111572265625, -11.576171875, -11.040771484375, -10.50537109375, -9.969970703125, -9.4345703125, -8.899169921875, -8.36376953125, -7.828369140625, -7.29296875, -6.757568359375, -6.22216796875, -5.686767578125, -5.1513671875, -4.615966796875, -4.08056640625, -3.545166015625, -3.009765625, -2.474365234375, -1.93896484375, -1.403564453125, -0.8681640625, -0.332763671875, 0.20263671875, 0.738037109375, 1.2734375, 1.808837890625, 2.34423828125, 2.879638671875, 3.4150390625, 3.950439453125, 4.48583984375, 5.021240234375, 5.556640625, 6.092041015625, 6.62744140625, 7.162841796875, 7.6982421875, 8.233642578125, 8.76904296875, 9.304443359375, 9.83984375, 10.375244140625, 10.91064453125, 11.446044921875, 11.9814453125, 12.516845703125, 13.05224609375, 13.587646484375, 14.123046875, 14.658447265625, 15.19384765625, 15.729248046875, 16.2646484375, 16.800048828125, 17.33544921875, 17.870849609375, 18.40625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 12.0, 16.0, 23.0, 29.0, 37.0, 63.0, 83.0, 152.0, 227.0, 373.0, 664.0, 1121.0, 2576.0, 9088.0, 90525.0, 2894179.0, 130185.0, 10323.0, 2967.0, 1255.0, 655.0, 431.0, 246.0, 148.0, 109.0, 65.0, 47.0, 33.0, 16.0, 13.0, 9.0, 6.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.560546875, -30.52734375, -29.494140625, -28.4609375, -27.427734375, -26.39453125, -25.361328125, -24.328125, -23.294921875, -22.26171875, -21.228515625, -20.1953125, -19.162109375, -18.12890625, -17.095703125, -16.0625, -15.029296875, -13.99609375, -12.962890625, -11.9296875, -10.896484375, -9.86328125, -8.830078125, -7.796875, -6.763671875, -5.73046875, -4.697265625, -3.6640625, -2.630859375, -1.59765625, -0.564453125, 0.46875, 1.501953125, 2.53515625, 3.568359375, 4.6015625, 5.634765625, 6.66796875, 7.701171875, 8.734375, 9.767578125, 10.80078125, 11.833984375, 12.8671875, 13.900390625, 14.93359375, 15.966796875, 17.0, 18.033203125, 19.06640625, 20.099609375, 21.1328125, 22.166015625, 23.19921875, 24.232421875, 25.265625, 26.298828125, 27.33203125, 28.365234375, 29.3984375, 30.431640625, 31.46484375, 32.498046875, 33.53125]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 236.0, 733.0, 43.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-598.5343017578125, -588.0835571289062, -577.6328125, -567.1820678710938, -556.7313232421875, -546.280517578125, -535.8297729492188, -525.3790283203125, -514.9282836914062, -504.4775390625, -494.02679443359375, -483.5760192871094, -473.1252746582031, -462.6745300292969, -452.2237854003906, -441.7730407714844, -431.3222961425781, -420.8715515136719, -410.4208068847656, -399.97003173828125, -389.519287109375, -379.06854248046875, -368.6177978515625, -358.16705322265625, -347.71630859375, -337.26556396484375, -326.8148193359375, -316.3640441894531, -305.9132995605469, -295.4625549316406, -285.0118103027344, -274.5610656738281, -264.11029052734375, -253.6595458984375, -243.2087860107422, -232.75804138183594, -222.30728149414062, -211.85653686523438, -201.40579223632812, -190.95504760742188, -180.50428771972656, -170.0535430908203, -159.602783203125, -149.15203857421875, -138.7012939453125, -128.2505340576172, -117.79978942871094, -107.34903717041016, -96.89828491210938, -86.4475326538086, -75.99678039550781, -65.54603576660156, -55.09528350830078, -44.64453125, -34.193782806396484, -23.74303436279297, -13.292282104492188, -2.841531753540039, 7.609218597412109, 18.059968948364258, 28.510719299316406, 38.96147155761719, 49.4122200012207, 59.86296844482422, 70.313720703125]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 6.0, 6.0, 4.0, 8.0, 4.0, 12.0, 7.0, 10.0, 17.0, 20.0, 27.0, 31.0, 16.0, 28.0, 24.0, 26.0, 24.0, 31.0, 24.0, 40.0, 37.0, 32.0, 42.0, 37.0, 35.0, 35.0, 32.0, 50.0, 37.0, 29.0, 20.0, 44.0, 25.0, 34.0, 20.0, 22.0, 27.0, 14.0, 11.0, 9.0, 11.0, 7.0, 8.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.96265411376953, -37.621543884277344, -36.280433654785156, -34.93932342529297, -33.59821319580078, -32.25709915161133, -30.91598892211914, -29.574878692626953, -28.233768463134766, -26.892658233642578, -25.55154800415039, -24.21043586730957, -22.869325637817383, -21.528215408325195, -20.187103271484375, -18.845993041992188, -17.5048828125, -16.163772583007812, -14.822661399841309, -13.481550216674805, -12.140439987182617, -10.79932975769043, -9.458218574523926, -8.117107391357422, -6.775997161865234, -5.434886455535889, -4.093775749206543, -2.7526650428771973, -1.4115543365478516, -0.07044363021850586, 1.2706670761108398, 2.6117782592773438, 3.9528884887695312, 5.293999195098877, 6.635109901428223, 7.976220607757568, 9.317331314086914, 10.658441543579102, 11.999552726745605, 13.34066390991211, 14.681774139404297, 16.022884368896484, 17.363994598388672, 18.705106735229492, 20.04621696472168, 21.387327194213867, 22.728439331054688, 24.069549560546875, 25.410659790039062, 26.75177001953125, 28.092880249023438, 29.433992385864258, 30.775102615356445, 32.116214752197266, 33.45732498168945, 34.79843521118164, 36.13954544067383, 37.480655670166016, 38.8217658996582, 40.16287612915039, 41.503990173339844, 42.84510040283203, 44.18621063232422, 45.527320861816406, 46.868431091308594]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 13.0, 8.0, 7.0, 10.0, 12.0, 10.0, 16.0, 26.0, 18.0, 27.0, 31.0, 33.0, 26.0, 38.0, 30.0, 35.0, 42.0, 34.0, 39.0, 38.0, 47.0, 37.0, 49.0, 42.0, 36.0, 34.0, 34.0, 29.0, 28.0, 35.0, 22.0, 14.0, 14.0, 14.0, 9.0, 10.0, 10.0, 6.0, 8.0, 10.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.79083251953125, -4.6363525390625, -4.48187255859375, -4.327392578125, -4.17291259765625, -4.0184326171875, -3.86395263671875, -3.70947265625, -3.55499267578125, -3.4005126953125, -3.24603271484375, -3.091552734375, -2.93707275390625, -2.7825927734375, -2.62811279296875, -2.4736328125, -2.31915283203125, -2.1646728515625, -2.01019287109375, -1.855712890625, -1.70123291015625, -1.5467529296875, -1.39227294921875, -1.23779296875, -1.08331298828125, -0.9288330078125, -0.77435302734375, -0.619873046875, -0.46539306640625, -0.3109130859375, -0.15643310546875, -0.001953125, 0.15252685546875, 0.3070068359375, 0.46148681640625, 0.615966796875, 0.77044677734375, 0.9249267578125, 1.07940673828125, 1.23388671875, 1.38836669921875, 1.5428466796875, 1.69732666015625, 1.851806640625, 2.00628662109375, 2.1607666015625, 2.31524658203125, 2.4697265625, 2.62420654296875, 2.7786865234375, 2.93316650390625, 3.087646484375, 3.24212646484375, 3.3966064453125, 3.55108642578125, 3.70556640625, 3.86004638671875, 4.0145263671875, 4.16900634765625, 4.323486328125, 4.47796630859375, 4.6324462890625, 4.78692626953125, 4.94140625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 10.0, 3.0, 10.0, 6.0, 19.0, 32.0, 39.0, 62.0, 81.0, 159.0, 243.0, 483.0, 846.0, 1851.0, 4065.0, 10875.0, 34840.0, 198983.0, 2367866.0, 1418316.0, 114708.0, 25276.0, 8729.0, 3456.0, 1531.0, 744.0, 409.0, 223.0, 119.0, 94.0, 52.0, 46.0, 28.0, 22.0, 18.0, 12.0, 7.0, 4.0, 6.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.875, -14.34130859375, -13.8076171875, -13.27392578125, -12.740234375, -12.20654296875, -11.6728515625, -11.13916015625, -10.60546875, -10.07177734375, -9.5380859375, -9.00439453125, -8.470703125, -7.93701171875, -7.4033203125, -6.86962890625, -6.3359375, -5.80224609375, -5.2685546875, -4.73486328125, -4.201171875, -3.66748046875, -3.1337890625, -2.60009765625, -2.06640625, -1.53271484375, -0.9990234375, -0.46533203125, 0.068359375, 0.60205078125, 1.1357421875, 1.66943359375, 2.203125, 2.73681640625, 3.2705078125, 3.80419921875, 4.337890625, 4.87158203125, 5.4052734375, 5.93896484375, 6.47265625, 7.00634765625, 7.5400390625, 8.07373046875, 8.607421875, 9.14111328125, 9.6748046875, 10.20849609375, 10.7421875, 11.27587890625, 11.8095703125, 12.34326171875, 12.876953125, 13.41064453125, 13.9443359375, 14.47802734375, 15.01171875, 15.54541015625, 16.0791015625, 16.61279296875, 17.146484375, 17.68017578125, 18.2138671875, 18.74755859375, 19.28125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 13.0, 6.0, 13.0, 10.0, 21.0, 18.0, 22.0, 33.0, 38.0, 50.0, 82.0, 88.0, 121.0, 169.0, 254.0, 292.0, 371.0, 515.0, 439.0, 366.0, 288.0, 229.0, 159.0, 121.0, 94.0, 75.0, 34.0, 42.0, 29.0, 17.0, 12.0, 12.0, 7.0, 2.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.28125, -9.94677734375, -9.6123046875, -9.27783203125, -8.943359375, -8.60888671875, -8.2744140625, -7.93994140625, -7.60546875, -7.27099609375, -6.9365234375, -6.60205078125, -6.267578125, -5.93310546875, -5.5986328125, -5.26416015625, -4.9296875, -4.59521484375, -4.2607421875, -3.92626953125, -3.591796875, -3.25732421875, -2.9228515625, -2.58837890625, -2.25390625, -1.91943359375, -1.5849609375, -1.25048828125, -0.916015625, -0.58154296875, -0.2470703125, 0.08740234375, 0.421875, 0.75634765625, 1.0908203125, 1.42529296875, 1.759765625, 2.09423828125, 2.4287109375, 2.76318359375, 3.09765625, 3.43212890625, 3.7666015625, 4.10107421875, 4.435546875, 4.77001953125, 5.1044921875, 5.43896484375, 5.7734375, 6.10791015625, 6.4423828125, 6.77685546875, 7.111328125, 7.44580078125, 7.7802734375, 8.11474609375, 8.44921875, 8.78369140625, 9.1181640625, 9.45263671875, 9.787109375, 10.12158203125, 10.4560546875, 10.79052734375, 11.125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 13.0, 17.0, 37.0, 44.0, 79.0, 156.0, 246.0, 446.0, 804.0, 1456.0, 2784.0, 6053.0, 14702.0, 40794.0, 151682.0, 888094.0, 2446055.0, 491534.0, 99381.0, 29222.0, 10891.0, 4726.0, 2381.0, 1163.0, 637.0, 341.0, 199.0, 137.0, 80.0, 49.0, 27.0, 17.0, 9.0, 6.0, 5.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-19.390625, -18.857177734375, -18.32373046875, -17.790283203125, -17.2568359375, -16.723388671875, -16.18994140625, -15.656494140625, -15.123046875, -14.589599609375, -14.05615234375, -13.522705078125, -12.9892578125, -12.455810546875, -11.92236328125, -11.388916015625, -10.85546875, -10.322021484375, -9.78857421875, -9.255126953125, -8.7216796875, -8.188232421875, -7.65478515625, -7.121337890625, -6.587890625, -6.054443359375, -5.52099609375, -4.987548828125, -4.4541015625, -3.920654296875, -3.38720703125, -2.853759765625, -2.3203125, -1.786865234375, -1.25341796875, -0.719970703125, -0.1865234375, 0.346923828125, 0.88037109375, 1.413818359375, 1.947265625, 2.480712890625, 3.01416015625, 3.547607421875, 4.0810546875, 4.614501953125, 5.14794921875, 5.681396484375, 6.21484375, 6.748291015625, 7.28173828125, 7.815185546875, 8.3486328125, 8.882080078125, 9.41552734375, 9.948974609375, 10.482421875, 11.015869140625, 11.54931640625, 12.082763671875, 12.6162109375, 13.149658203125, 13.68310546875, 14.216552734375, 14.75]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 7.0, 2.0, 6.0, 4.0, 9.0, 3.0, 8.0, 20.0, 20.0, 32.0, 30.0, 47.0, 54.0, 56.0, 70.0, 71.0, 82.0, 71.0, 58.0, 59.0, 46.0, 62.0, 45.0, 33.0, 27.0, 20.0, 19.0, 21.0, 8.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.480926513671875, -50.98601531982422, -49.49110412597656, -47.996192932128906, -46.501277923583984, -45.00636672973633, -43.51145553588867, -42.016544342041016, -40.521629333496094, -39.02671813964844, -37.53180694580078, -36.036895751953125, -34.5419807434082, -33.04706954956055, -31.55215835571289, -30.057247161865234, -28.562335968017578, -27.067424774169922, -25.572511672973633, -24.077600479125977, -22.582687377929688, -21.08777618408203, -19.592864990234375, -18.09795379638672, -16.60304069519043, -15.108128547668457, -13.613216400146484, -12.118305206298828, -10.623393058776855, -9.128480911254883, -7.633569717407227, -6.138657569885254, -4.643741607666016, -3.148829698562622, -1.6539177894592285, -0.15900611877441406, 1.3359060287475586, 2.8308181762695312, 4.3257293701171875, 5.82064151763916, 7.315553665161133, 8.810465812683105, 10.305377960205078, 11.800289154052734, 13.295201301574707, 14.79011344909668, 16.285024642944336, 17.779937744140625, 19.27484893798828, 20.769760131835938, 22.264673233032227, 23.759584426879883, 25.254497528076172, 26.749408721923828, 28.244319915771484, 29.73923110961914, 31.23414421081543, 32.72905731201172, 34.223968505859375, 35.71887969970703, 37.21379089355469, 38.708702087402344, 40.20361328125, 41.69852828979492, 43.19343948364258]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 6.0, 4.0, 10.0, 8.0, 17.0, 23.0, 16.0, 22.0, 26.0, 23.0, 31.0, 26.0, 39.0, 40.0, 34.0, 42.0, 53.0, 54.0, 36.0, 39.0, 38.0, 46.0, 50.0, 31.0, 43.0, 30.0, 35.0, 26.0, 18.0, 21.0, 18.0, 12.0, 16.0, 10.0, 8.0, 11.0, 3.0, 9.0, 2.0, 4.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-40.58366775512695, -39.310028076171875, -38.0363883972168, -36.76274490356445, -35.489105224609375, -34.2154655456543, -32.94182586669922, -31.668184280395508, -30.394542694091797, -29.12090301513672, -27.847261428833008, -26.57362174987793, -25.29998016357422, -24.02634048461914, -22.752700805664062, -21.47905921936035, -20.205419540405273, -18.931779861450195, -17.658138275146484, -16.384498596191406, -15.110857009887695, -13.837217330932617, -12.563576698303223, -11.289936065673828, -10.016295433044434, -8.742654800415039, -7.4690141677856445, -6.195374011993408, -4.921733379364014, -3.648092746734619, -2.374452590942383, -1.1008119583129883, 0.17282867431640625, 1.4464691877365112, 2.720109701156616, 3.9937500953674316, 5.267390727996826, 6.541031360626221, 7.814671516418457, 9.088312149047852, 10.361952781677246, 11.63559341430664, 12.909234046936035, 14.18287467956543, 15.456514358520508, 16.73015594482422, 18.003795623779297, 19.277435302734375, 20.551076889038086, 21.824716567993164, 23.098358154296875, 24.371997833251953, 25.645639419555664, 26.919279098510742, 28.192920684814453, 29.46656036376953, 30.74020004272461, 32.01383972167969, 33.287479400634766, 34.56112289428711, 35.83476257324219, 37.108402252197266, 38.382041931152344, 39.65568542480469, 40.929325103759766]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 7.0, 5.0, 4.0, 13.0, 10.0, 12.0, 5.0, 5.0, 14.0, 20.0, 20.0, 17.0, 25.0, 29.0, 22.0, 31.0, 36.0, 46.0, 31.0, 43.0, 42.0, 34.0, 40.0, 36.0, 55.0, 38.0, 38.0, 32.0, 34.0, 35.0, 28.0, 24.0, 18.0, 30.0, 21.0, 23.0, 18.0, 13.0, 4.0, 6.0, 7.0, 8.0, 10.0, 1.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.85546875, -4.70196533203125, -4.5484619140625, -4.39495849609375, -4.241455078125, -4.08795166015625, -3.9344482421875, -3.78094482421875, -3.62744140625, -3.47393798828125, -3.3204345703125, -3.16693115234375, -3.013427734375, -2.85992431640625, -2.7064208984375, -2.55291748046875, -2.3994140625, -2.24591064453125, -2.0924072265625, -1.93890380859375, -1.785400390625, -1.63189697265625, -1.4783935546875, -1.32489013671875, -1.17138671875, -1.01788330078125, -0.8643798828125, -0.71087646484375, -0.557373046875, -0.40386962890625, -0.2503662109375, -0.09686279296875, 0.056640625, 0.21014404296875, 0.3636474609375, 0.51715087890625, 0.670654296875, 0.82415771484375, 0.9776611328125, 1.13116455078125, 1.28466796875, 1.43817138671875, 1.5916748046875, 1.74517822265625, 1.898681640625, 2.05218505859375, 2.2056884765625, 2.35919189453125, 2.5126953125, 2.66619873046875, 2.8197021484375, 2.97320556640625, 3.126708984375, 3.28021240234375, 3.4337158203125, 3.58721923828125, 3.74072265625, 3.89422607421875, 4.0477294921875, 4.20123291015625, 4.354736328125, 4.50823974609375, 4.6617431640625, 4.81524658203125, 4.96875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 8.0, 3.0, 12.0, 22.0, 24.0, 52.0, 50.0, 69.0, 88.0, 123.0, 157.0, 218.0, 285.0, 395.0, 538.0, 738.0, 1109.0, 1784.0, 2918.0, 5726.0, 11958.0, 29188.0, 92808.0, 364616.0, 380723.0, 97507.0, 30706.0, 12204.0, 5805.0, 2951.0, 1750.0, 1196.0, 771.0, 539.0, 357.0, 314.0, 221.0, 155.0, 131.0, 81.0, 71.0, 66.0, 36.0, 23.0, 20.0, 10.0, 10.0, 9.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.7421875, -4.59857177734375, -4.4549560546875, -4.31134033203125, -4.167724609375, -4.02410888671875, -3.8804931640625, -3.73687744140625, -3.59326171875, -3.44964599609375, -3.3060302734375, -3.16241455078125, -3.018798828125, -2.87518310546875, -2.7315673828125, -2.58795166015625, -2.4443359375, -2.30072021484375, -2.1571044921875, -2.01348876953125, -1.869873046875, -1.72625732421875, -1.5826416015625, -1.43902587890625, -1.29541015625, -1.15179443359375, -1.0081787109375, -0.86456298828125, -0.720947265625, -0.57733154296875, -0.4337158203125, -0.29010009765625, -0.146484375, -0.00286865234375, 0.1407470703125, 0.28436279296875, 0.427978515625, 0.57159423828125, 0.7152099609375, 0.85882568359375, 1.00244140625, 1.14605712890625, 1.2896728515625, 1.43328857421875, 1.576904296875, 1.72052001953125, 1.8641357421875, 2.00775146484375, 2.1513671875, 2.29498291015625, 2.4385986328125, 2.58221435546875, 2.725830078125, 2.86944580078125, 3.0130615234375, 3.15667724609375, 3.30029296875, 3.44390869140625, 3.5875244140625, 3.73114013671875, 3.874755859375, 4.01837158203125, 4.1619873046875, 4.30560302734375, 4.44921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 8.0, 5.0, 5.0, 6.0, 8.0, 6.0, 6.0, 19.0, 5.0, 14.0, 25.0, 15.0, 30.0, 22.0, 35.0, 29.0, 37.0, 31.0, 29.0, 38.0, 39.0, 30.0, 38.0, 1059.0, 39.0, 48.0, 36.0, 38.0, 24.0, 27.0, 35.0, 34.0, 22.0, 24.0, 32.0, 21.0, 19.0, 20.0, 15.0, 7.0, 9.0, 8.0, 6.0, 8.0, 4.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 2.0], "bins": [-3.95703125, -3.844696044921875, -3.73236083984375, -3.620025634765625, -3.5076904296875, -3.395355224609375, -3.28302001953125, -3.170684814453125, -3.058349609375, -2.946014404296875, -2.83367919921875, -2.721343994140625, -2.6090087890625, -2.496673583984375, -2.38433837890625, -2.272003173828125, -2.15966796875, -2.047332763671875, -1.93499755859375, -1.822662353515625, -1.7103271484375, -1.597991943359375, -1.48565673828125, -1.373321533203125, -1.260986328125, -1.148651123046875, -1.03631591796875, -0.923980712890625, -0.8116455078125, -0.699310302734375, -0.58697509765625, -0.474639892578125, -0.3623046875, -0.249969482421875, -0.13763427734375, -0.025299072265625, 0.0870361328125, 0.199371337890625, 0.31170654296875, 0.424041748046875, 0.536376953125, 0.648712158203125, 0.76104736328125, 0.873382568359375, 0.9857177734375, 1.098052978515625, 1.21038818359375, 1.322723388671875, 1.43505859375, 1.547393798828125, 1.65972900390625, 1.772064208984375, 1.8843994140625, 1.996734619140625, 2.10906982421875, 2.221405029296875, 2.333740234375, 2.446075439453125, 2.55841064453125, 2.670745849609375, 2.7830810546875, 2.895416259765625, 3.00775146484375, 3.120086669921875, 3.232421875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 5.0, 12.0, 18.0, 23.0, 24.0, 51.0, 81.0, 92.0, 120.0, 191.0, 263.0, 463.0, 715.0, 1222.0, 2316.0, 4828.0, 10959.0, 31018.0, 127767.0, 1195991.0, 594371.0, 85618.0, 23415.0, 8732.0, 3945.0, 2035.0, 1056.0, 644.0, 379.0, 250.0, 149.0, 113.0, 73.0, 56.0, 39.0, 24.0, 21.0, 15.0, 15.0, 7.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.732421875, -2.637786865234375, -2.54315185546875, -2.448516845703125, -2.3538818359375, -2.259246826171875, -2.16461181640625, -2.069976806640625, -1.975341796875, -1.880706787109375, -1.78607177734375, -1.691436767578125, -1.5968017578125, -1.502166748046875, -1.40753173828125, -1.312896728515625, -1.21826171875, -1.123626708984375, -1.02899169921875, -0.934356689453125, -0.8397216796875, -0.745086669921875, -0.65045166015625, -0.555816650390625, -0.461181640625, -0.366546630859375, -0.27191162109375, -0.177276611328125, -0.0826416015625, 0.011993408203125, 0.10662841796875, 0.201263427734375, 0.2958984375, 0.390533447265625, 0.48516845703125, 0.579803466796875, 0.6744384765625, 0.769073486328125, 0.86370849609375, 0.958343505859375, 1.052978515625, 1.147613525390625, 1.24224853515625, 1.336883544921875, 1.4315185546875, 1.526153564453125, 1.62078857421875, 1.715423583984375, 1.81005859375, 1.904693603515625, 1.99932861328125, 2.093963623046875, 2.1885986328125, 2.283233642578125, 2.37786865234375, 2.472503662109375, 2.567138671875, 2.661773681640625, 2.75640869140625, 2.851043701171875, 2.9456787109375, 3.040313720703125, 3.13494873046875, 3.229583740234375, 3.32421875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 3.0, 5.0, 6.0, 7.0, 7.0, 9.0, 13.0, 9.0, 12.0, 16.0, 11.0, 35.0, 31.0, 53.0, 88.0, 100.0, 158.0, 108.0, 75.0, 71.0, 42.0, 32.0, 31.0, 6.0, 10.0, 11.0, 10.0, 5.0, 9.0, 3.0, 4.0, 5.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58740234375, -0.5667953491210938, -0.5461883544921875, -0.5255813598632812, -0.504974365234375, -0.48436737060546875, -0.4637603759765625, -0.44315338134765625, -0.42254638671875, -0.40193939208984375, -0.3813323974609375, -0.36072540283203125, -0.340118408203125, -0.31951141357421875, -0.2989044189453125, -0.27829742431640625, -0.2576904296875, -0.23708343505859375, -0.2164764404296875, -0.19586944580078125, -0.175262451171875, -0.15465545654296875, -0.1340484619140625, -0.11344146728515625, -0.09283447265625, -0.07222747802734375, -0.0516204833984375, -0.03101348876953125, -0.010406494140625, 0.01020050048828125, 0.0308074951171875, 0.05141448974609375, 0.072021484375, 0.09262847900390625, 0.1132354736328125, 0.13384246826171875, 0.154449462890625, 0.17505645751953125, 0.1956634521484375, 0.21627044677734375, 0.23687744140625, 0.25748443603515625, 0.2780914306640625, 0.29869842529296875, 0.319305419921875, 0.33991241455078125, 0.3605194091796875, 0.38112640380859375, 0.4017333984375, 0.42234039306640625, 0.4429473876953125, 0.46355438232421875, 0.484161376953125, 0.5047683715820312, 0.5253753662109375, 0.5459823608398438, 0.56658935546875, 0.5871963500976562, 0.6078033447265625, 0.6284103393554688, 0.649017333984375, 0.6696243286132812, 0.6902313232421875, 0.7108383178710938, 0.7314453125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 4.0, 7.0, 14.0, 22.0, 34.0, 77.0, 150.0, 625.0, 48211.0, 995931.0, 2968.0, 277.0, 84.0, 35.0, 27.0, 16.0, 11.0, 10.0, 9.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.0625, -20.464599609375, -19.86669921875, -19.268798828125, -18.6708984375, -18.072998046875, -17.47509765625, -16.877197265625, -16.279296875, -15.681396484375, -15.08349609375, -14.485595703125, -13.8876953125, -13.289794921875, -12.69189453125, -12.093994140625, -11.49609375, -10.898193359375, -10.30029296875, -9.702392578125, -9.1044921875, -8.506591796875, -7.90869140625, -7.310791015625, -6.712890625, -6.114990234375, -5.51708984375, -4.919189453125, -4.3212890625, -3.723388671875, -3.12548828125, -2.527587890625, -1.9296875, -1.331787109375, -0.73388671875, -0.135986328125, 0.4619140625, 1.059814453125, 1.65771484375, 2.255615234375, 2.853515625, 3.451416015625, 4.04931640625, 4.647216796875, 5.2451171875, 5.843017578125, 6.44091796875, 7.038818359375, 7.63671875, 8.234619140625, 8.83251953125, 9.430419921875, 10.0283203125, 10.626220703125, 11.22412109375, 11.822021484375, 12.419921875, 13.017822265625, 13.61572265625, 14.213623046875, 14.8115234375, 15.409423828125, 16.00732421875, 16.605224609375, 17.203125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 21.0, 129.0, 411.0, 358.0, 78.0, 16.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.036080002784729, -0.8857355117797852, -0.7353910803794861, -0.585046648979187, -0.43470215797424316, -0.2843576669692993, -0.13401323556900024, 0.016331195831298828, 0.16667568683624268, 0.31702014803886414, 0.4673646092414856, 0.6177090406417847, 0.7680535316467285, 0.9183980226516724, 1.0687425136566162, 1.2190868854522705, 1.3694313764572144, 1.5197758674621582, 1.6701202392578125, 1.8204647302627563, 1.9708092212677002, 2.1211538314819336, 2.271498203277588, 2.421842575073242, 2.5721869468688965, 2.722531318664551, 2.872875928878784, 3.0232203006744385, 3.173564910888672, 3.323909282684326, 3.4742536544799805, 3.6245980262756348, 3.774942398071289, 3.9252867698669434, 4.075631141662598, 4.22597599029541, 4.3763203620910645, 4.526664733886719, 4.677009105682373, 4.827353477478027, 4.97769832611084, 5.128042697906494, 5.278387069702148, 5.428731918334961, 5.579076290130615, 5.7294206619262695, 5.879765033721924, 6.030109405517578, 6.180453777313232, 6.330798149108887, 6.481142520904541, 6.6314873695373535, 6.781831741333008, 6.932176113128662, 7.082520484924316, 7.232864856719971, 7.383209228515625, 7.533553600311279, 7.683897972106934, 7.834242820739746, 7.9845871925354, 8.134931564331055, 8.285276412963867, 8.435620307922363, 8.585965156555176]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 3.0, 4.0, 9.0, 13.0, 8.0, 12.0, 16.0, 23.0, 25.0, 26.0, 29.0, 26.0, 24.0, 35.0, 34.0, 39.0, 40.0, 44.0, 40.0, 40.0, 35.0, 44.0, 42.0, 52.0, 41.0, 38.0, 41.0, 28.0, 27.0, 19.0, 18.0, 23.0, 20.0, 11.0, 11.0, 8.0, 8.0, 8.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.750479519367218, -0.7282056212425232, -0.7059316635131836, -0.6836577653884888, -0.6613838076591492, -0.6391099095344543, -0.6168359518051147, -0.5945620536804199, -0.5722881555557251, -0.5500142574310303, -0.5277402997016907, -0.5054664015769958, -0.48319244384765625, -0.4609185457229614, -0.4386446177959442, -0.416370689868927, -0.3940967321395874, -0.3718228042125702, -0.349548876285553, -0.32727497816085815, -0.30500102043151855, -0.28272712230682373, -0.2604531943798065, -0.2381792664527893, -0.2159053385257721, -0.19363141059875488, -0.17135748267173767, -0.14908356964588165, -0.12680964171886444, -0.10453571379184723, -0.08226180076599121, -0.059987872838974, -0.03771394491195679, -0.015440020710229874, 0.00683390349149704, 0.029107823967933655, 0.05138175189495087, 0.07365567982196808, 0.0959295928478241, 0.11820352077484131, 0.14047744870185852, 0.16275137662887573, 0.18502530455589294, 0.20729921758174896, 0.22957314550876617, 0.2518470883369446, 0.2741209864616394, 0.2963949143886566, 0.31866884231567383, 0.34094277024269104, 0.36321669816970825, 0.3854905962944031, 0.4077645540237427, 0.4300384521484375, 0.4523123800754547, 0.4745863080024719, 0.49686023592948914, 0.5191341638565063, 0.5414080619812012, 0.5636820197105408, 0.5859559178352356, 0.6082298755645752, 0.63050377368927, 0.6527776718139648, 0.6750516295433044]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 4.0, 2.0, 6.0, 8.0, 12.0, 13.0, 7.0, 11.0, 21.0, 14.0, 12.0, 19.0, 29.0, 40.0, 24.0, 35.0, 33.0, 32.0, 25.0, 45.0, 58.0, 47.0, 44.0, 35.0, 43.0, 55.0, 34.0, 31.0, 31.0, 28.0, 28.0, 29.0, 20.0, 21.0, 19.0, 14.0, 14.0, 8.0, 11.0, 6.0, 9.0, 2.0, 7.0, 3.0, 8.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.73675537109375, -4.5789794921875, -4.42120361328125, -4.263427734375, -4.10565185546875, -3.9478759765625, -3.79010009765625, -3.63232421875, -3.47454833984375, -3.3167724609375, -3.15899658203125, -3.001220703125, -2.84344482421875, -2.6856689453125, -2.52789306640625, -2.3701171875, -2.21234130859375, -2.0545654296875, -1.89678955078125, -1.739013671875, -1.58123779296875, -1.4234619140625, -1.26568603515625, -1.10791015625, -0.95013427734375, -0.7923583984375, -0.63458251953125, -0.476806640625, -0.31903076171875, -0.1612548828125, -0.00347900390625, 0.154296875, 0.31207275390625, 0.4698486328125, 0.62762451171875, 0.785400390625, 0.94317626953125, 1.1009521484375, 1.25872802734375, 1.41650390625, 1.57427978515625, 1.7320556640625, 1.88983154296875, 2.047607421875, 2.20538330078125, 2.3631591796875, 2.52093505859375, 2.6787109375, 2.83648681640625, 2.9942626953125, 3.15203857421875, 3.309814453125, 3.46759033203125, 3.6253662109375, 3.78314208984375, 3.94091796875, 4.09869384765625, 4.2564697265625, 4.41424560546875, 4.572021484375, 4.72979736328125, 4.8875732421875, 5.04534912109375, 5.203125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 10.0, 6.0, 18.0, 36.0, 40.0, 60.0, 93.0, 120.0, 177.0, 274.0, 408.0, 607.0, 1000.0, 1639.0, 2742.0, 4765.0, 8683.0, 16320.0, 33008.0, 70459.0, 163349.0, 326407.0, 228761.0, 97927.0, 44450.0, 21146.0, 11053.0, 6128.0, 3489.0, 2038.0, 1165.0, 714.0, 481.0, 275.0, 214.0, 157.0, 105.0, 79.0, 51.0, 33.0, 17.0, 20.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.80078125, -6.58624267578125, -6.3717041015625, -6.15716552734375, -5.942626953125, -5.72808837890625, -5.5135498046875, -5.29901123046875, -5.08447265625, -4.86993408203125, -4.6553955078125, -4.44085693359375, -4.226318359375, -4.01177978515625, -3.7972412109375, -3.58270263671875, -3.3681640625, -3.15362548828125, -2.9390869140625, -2.72454833984375, -2.510009765625, -2.29547119140625, -2.0809326171875, -1.86639404296875, -1.65185546875, -1.43731689453125, -1.2227783203125, -1.00823974609375, -0.793701171875, -0.57916259765625, -0.3646240234375, -0.15008544921875, 0.064453125, 0.27899169921875, 0.4935302734375, 0.70806884765625, 0.922607421875, 1.13714599609375, 1.3516845703125, 1.56622314453125, 1.78076171875, 1.99530029296875, 2.2098388671875, 2.42437744140625, 2.638916015625, 2.85345458984375, 3.0679931640625, 3.28253173828125, 3.4970703125, 3.71160888671875, 3.9261474609375, 4.14068603515625, 4.355224609375, 4.56976318359375, 4.7843017578125, 4.99884033203125, 5.21337890625, 5.42791748046875, 5.6424560546875, 5.85699462890625, 6.071533203125, 6.28607177734375, 6.5006103515625, 6.71514892578125, 6.9296875]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 8.0, 5.0, 8.0, 12.0, 10.0, 14.0, 15.0, 15.0, 16.0, 24.0, 24.0, 28.0, 29.0, 33.0, 48.0, 50.0, 80.0, 119.0, 232.0, 1356.0, 248.0, 168.0, 97.0, 60.0, 40.0, 44.0, 31.0, 45.0, 18.0, 23.0, 20.0, 30.0, 18.0, 18.0, 15.0, 17.0, 10.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-15.2890625, -14.7745361328125, -14.260009765625, -13.7454833984375, -13.23095703125, -12.7164306640625, -12.201904296875, -11.6873779296875, -11.1728515625, -10.6583251953125, -10.143798828125, -9.6292724609375, -9.11474609375, -8.6002197265625, -8.085693359375, -7.5711669921875, -7.056640625, -6.5421142578125, -6.027587890625, -5.5130615234375, -4.99853515625, -4.4840087890625, -3.969482421875, -3.4549560546875, -2.9404296875, -2.4259033203125, -1.911376953125, -1.3968505859375, -0.88232421875, -0.3677978515625, 0.146728515625, 0.6612548828125, 1.17578125, 1.6903076171875, 2.204833984375, 2.7193603515625, 3.23388671875, 3.7484130859375, 4.262939453125, 4.7774658203125, 5.2919921875, 5.8065185546875, 6.321044921875, 6.8355712890625, 7.35009765625, 7.8646240234375, 8.379150390625, 8.8936767578125, 9.408203125, 9.9227294921875, 10.437255859375, 10.9517822265625, 11.46630859375, 11.9808349609375, 12.495361328125, 13.0098876953125, 13.5244140625, 14.0389404296875, 14.553466796875, 15.0679931640625, 15.58251953125, 16.0970458984375, 16.611572265625, 17.1260986328125, 17.640625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 10.0, 10.0, 15.0, 22.0, 25.0, 25.0, 38.0, 52.0, 72.0, 88.0, 102.0, 170.0, 238.0, 362.0, 853.0, 3523.0, 31595.0, 1256966.0, 1804532.0, 40607.0, 4156.0, 961.0, 402.0, 240.0, 138.0, 130.0, 92.0, 62.0, 54.0, 38.0, 32.0, 11.0, 22.0, 22.0, 9.0, 11.0, 8.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-32.34375, -31.4208984375, -30.498046875, -29.5751953125, -28.65234375, -27.7294921875, -26.806640625, -25.8837890625, -24.9609375, -24.0380859375, -23.115234375, -22.1923828125, -21.26953125, -20.3466796875, -19.423828125, -18.5009765625, -17.578125, -16.6552734375, -15.732421875, -14.8095703125, -13.88671875, -12.9638671875, -12.041015625, -11.1181640625, -10.1953125, -9.2724609375, -8.349609375, -7.4267578125, -6.50390625, -5.5810546875, -4.658203125, -3.7353515625, -2.8125, -1.8896484375, -0.966796875, -0.0439453125, 0.87890625, 1.8017578125, 2.724609375, 3.6474609375, 4.5703125, 5.4931640625, 6.416015625, 7.3388671875, 8.26171875, 9.1845703125, 10.107421875, 11.0302734375, 11.953125, 12.8759765625, 13.798828125, 14.7216796875, 15.64453125, 16.5673828125, 17.490234375, 18.4130859375, 19.3359375, 20.2587890625, 21.181640625, 22.1044921875, 23.02734375, 23.9501953125, 24.873046875, 25.7958984375, 26.71875]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 263.0, 681.0, 69.0, 2.0, 1.0], "bins": [-575.591064453125, -566.0364990234375, -556.48193359375, -546.9273681640625, -537.372802734375, -527.8182373046875, -518.263671875, -508.7091064453125, -499.154541015625, -489.5999755859375, -480.04541015625, -470.4908447265625, -460.936279296875, -451.3817138671875, -441.8271484375, -432.2725830078125, -422.7179870605469, -413.1634216308594, -403.6088562011719, -394.0542907714844, -384.4997253417969, -374.9451599121094, -365.3905944824219, -355.83599853515625, -346.28143310546875, -336.72686767578125, -327.17230224609375, -317.61773681640625, -308.06317138671875, -298.50860595703125, -288.95404052734375, -279.39947509765625, -269.84490966796875, -260.29034423828125, -250.73577880859375, -241.18121337890625, -231.62664794921875, -222.07208251953125, -212.5175018310547, -202.9629364013672, -193.40838623046875, -183.85382080078125, -174.29925537109375, -164.74468994140625, -155.19012451171875, -145.63555908203125, -136.0809783935547, -126.52641296386719, -116.97184753417969, -107.41728210449219, -97.86271667480469, -88.30814361572266, -78.75357818603516, -69.19901275634766, -59.64444351196289, -50.089874267578125, -40.53530502319336, -30.980737686157227, -21.426170349121094, -11.871603012084961, -2.317035675048828, 7.237529754638672, 16.792098999023438, 26.346668243408203, 35.9012336730957]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 6.0, 6.0, 15.0, 18.0, 15.0, 14.0, 14.0, 25.0, 25.0, 30.0, 24.0, 35.0, 40.0, 48.0, 44.0, 30.0, 58.0, 46.0, 28.0, 34.0, 37.0, 39.0, 31.0, 37.0, 26.0, 27.0, 34.0, 25.0, 29.0, 22.0, 18.0, 17.0, 24.0, 17.0, 6.0, 13.0, 6.0, 6.0, 4.0, 5.0, 4.0, 1.0, 7.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-44.46296310424805, -43.11493682861328, -41.76691436767578, -40.418888092041016, -39.07086181640625, -37.722835540771484, -36.37480926513672, -35.02678680419922, -33.67876052856445, -32.33073425292969, -30.982709884643555, -29.634685516357422, -28.286659240722656, -26.93863296508789, -25.590608596801758, -24.242584228515625, -22.89455795288086, -21.546531677246094, -20.19850730895996, -18.850482940673828, -17.502456665039062, -16.154430389404297, -14.806406021118164, -13.458380699157715, -12.110355377197266, -10.762330055236816, -9.414304733276367, -8.066279411315918, -6.718254089355469, -5.3702287673950195, -4.02220344543457, -2.674178123474121, -1.3261489868164062, 0.02187633514404297, 1.3699016571044922, 2.7179269790649414, 4.065952301025391, 5.41397762298584, 6.762002944946289, 8.110028266906738, 9.458053588867188, 10.806078910827637, 12.154104232788086, 13.502129554748535, 14.850154876708984, 16.19818115234375, 17.546205520629883, 18.894229888916016, 20.24225616455078, 21.590282440185547, 22.93830680847168, 24.286331176757812, 25.634357452392578, 26.982383728027344, 28.330408096313477, 29.67843246459961, 31.026458740234375, 32.37448501586914, 33.722511291503906, 35.070533752441406, 36.41856002807617, 37.76658630371094, 39.11460876464844, 40.4626350402832, 41.81066131591797]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 2.0, 8.0, 8.0, 11.0, 13.0, 10.0, 11.0, 13.0, 11.0, 16.0, 19.0, 17.0, 24.0, 38.0, 32.0, 28.0, 31.0, 39.0, 28.0, 31.0, 34.0, 46.0, 25.0, 46.0, 42.0, 40.0, 43.0, 29.0, 33.0, 24.0, 25.0, 29.0, 22.0, 28.0, 19.0, 11.0, 18.0, 10.0, 19.0, 16.0, 8.0, 8.0, 8.0, 10.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.5390625, -4.39093017578125, -4.2427978515625, -4.09466552734375, -3.946533203125, -3.79840087890625, -3.6502685546875, -3.50213623046875, -3.35400390625, -3.20587158203125, -3.0577392578125, -2.90960693359375, -2.761474609375, -2.61334228515625, -2.4652099609375, -2.31707763671875, -2.1689453125, -2.02081298828125, -1.8726806640625, -1.72454833984375, -1.576416015625, -1.42828369140625, -1.2801513671875, -1.13201904296875, -0.98388671875, -0.83575439453125, -0.6876220703125, -0.53948974609375, -0.391357421875, -0.24322509765625, -0.0950927734375, 0.05303955078125, 0.201171875, 0.34930419921875, 0.4974365234375, 0.64556884765625, 0.793701171875, 0.94183349609375, 1.0899658203125, 1.23809814453125, 1.38623046875, 1.53436279296875, 1.6824951171875, 1.83062744140625, 1.978759765625, 2.12689208984375, 2.2750244140625, 2.42315673828125, 2.5712890625, 2.71942138671875, 2.8675537109375, 3.01568603515625, 3.163818359375, 3.31195068359375, 3.4600830078125, 3.60821533203125, 3.75634765625, 3.90447998046875, 4.0526123046875, 4.20074462890625, 4.348876953125, 4.49700927734375, 4.6451416015625, 4.79327392578125, 4.94140625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 6.0, 12.0, 9.0, 21.0, 33.0, 37.0, 58.0, 91.0, 120.0, 197.0, 313.0, 518.0, 949.0, 1668.0, 3830.0, 9224.0, 27535.0, 122148.0, 1257270.0, 2439299.0, 259640.0, 46348.0, 13956.0, 5480.0, 2540.0, 1162.0, 675.0, 376.0, 258.0, 147.0, 107.0, 70.0, 50.0, 35.0, 27.0, 18.0, 13.0, 6.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-16.296875, -15.79052734375, -15.2841796875, -14.77783203125, -14.271484375, -13.76513671875, -13.2587890625, -12.75244140625, -12.24609375, -11.73974609375, -11.2333984375, -10.72705078125, -10.220703125, -9.71435546875, -9.2080078125, -8.70166015625, -8.1953125, -7.68896484375, -7.1826171875, -6.67626953125, -6.169921875, -5.66357421875, -5.1572265625, -4.65087890625, -4.14453125, -3.63818359375, -3.1318359375, -2.62548828125, -2.119140625, -1.61279296875, -1.1064453125, -0.60009765625, -0.09375, 0.41259765625, 0.9189453125, 1.42529296875, 1.931640625, 2.43798828125, 2.9443359375, 3.45068359375, 3.95703125, 4.46337890625, 4.9697265625, 5.47607421875, 5.982421875, 6.48876953125, 6.9951171875, 7.50146484375, 8.0078125, 8.51416015625, 9.0205078125, 9.52685546875, 10.033203125, 10.53955078125, 11.0458984375, 11.55224609375, 12.05859375, 12.56494140625, 13.0712890625, 13.57763671875, 14.083984375, 14.59033203125, 15.0966796875, 15.60302734375, 16.109375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 3.0, 5.0, 8.0, 7.0, 10.0, 13.0, 16.0, 18.0, 20.0, 30.0, 58.0, 63.0, 53.0, 83.0, 123.0, 152.0, 200.0, 271.0, 340.0, 406.0, 488.0, 382.0, 350.0, 237.0, 181.0, 148.0, 100.0, 67.0, 36.0, 44.0, 49.0, 29.0, 19.0, 17.0, 11.0, 12.0, 7.0, 4.0, 9.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1171875, -9.7943115234375, -9.471435546875, -9.1485595703125, -8.82568359375, -8.5028076171875, -8.179931640625, -7.8570556640625, -7.5341796875, -7.2113037109375, -6.888427734375, -6.5655517578125, -6.24267578125, -5.9197998046875, -5.596923828125, -5.2740478515625, -4.951171875, -4.6282958984375, -4.305419921875, -3.9825439453125, -3.65966796875, -3.3367919921875, -3.013916015625, -2.6910400390625, -2.3681640625, -2.0452880859375, -1.722412109375, -1.3995361328125, -1.07666015625, -0.7537841796875, -0.430908203125, -0.1080322265625, 0.21484375, 0.5377197265625, 0.860595703125, 1.1834716796875, 1.50634765625, 1.8292236328125, 2.152099609375, 2.4749755859375, 2.7978515625, 3.1207275390625, 3.443603515625, 3.7664794921875, 4.08935546875, 4.4122314453125, 4.735107421875, 5.0579833984375, 5.380859375, 5.7037353515625, 6.026611328125, 6.3494873046875, 6.67236328125, 6.9952392578125, 7.318115234375, 7.6409912109375, 7.9638671875, 8.2867431640625, 8.609619140625, 8.9324951171875, 9.25537109375, 9.5782470703125, 9.901123046875, 10.2239990234375, 10.546875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 8.0, 7.0, 11.0, 12.0, 15.0, 20.0, 29.0, 59.0, 86.0, 152.0, 244.0, 480.0, 934.0, 1970.0, 4433.0, 10766.0, 30362.0, 102570.0, 512982.0, 2489111.0, 832111.0, 144395.0, 39430.0, 13650.0, 5465.0, 2468.0, 1135.0, 555.0, 307.0, 172.0, 104.0, 71.0, 43.0, 21.0, 30.0, 21.0, 15.0, 10.0, 10.0, 5.0, 5.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.946044921875, -15.40771484375, -14.869384765625, -14.3310546875, -13.792724609375, -13.25439453125, -12.716064453125, -12.177734375, -11.639404296875, -11.10107421875, -10.562744140625, -10.0244140625, -9.486083984375, -8.94775390625, -8.409423828125, -7.87109375, -7.332763671875, -6.79443359375, -6.256103515625, -5.7177734375, -5.179443359375, -4.64111328125, -4.102783203125, -3.564453125, -3.026123046875, -2.48779296875, -1.949462890625, -1.4111328125, -0.872802734375, -0.33447265625, 0.203857421875, 0.7421875, 1.280517578125, 1.81884765625, 2.357177734375, 2.8955078125, 3.433837890625, 3.97216796875, 4.510498046875, 5.048828125, 5.587158203125, 6.12548828125, 6.663818359375, 7.2021484375, 7.740478515625, 8.27880859375, 8.817138671875, 9.35546875, 9.893798828125, 10.43212890625, 10.970458984375, 11.5087890625, 12.047119140625, 12.58544921875, 13.123779296875, 13.662109375, 14.200439453125, 14.73876953125, 15.277099609375, 15.8154296875, 16.353759765625, 16.89208984375, 17.430419921875, 17.96875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 5.0, 12.0, 9.0, 18.0, 30.0, 45.0, 48.0, 57.0, 63.0, 79.0, 79.0, 86.0, 89.0, 78.0, 67.0, 56.0, 50.0, 40.0, 26.0, 18.0, 13.0, 11.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.365509033203125, -43.6811637878418, -41.99681854248047, -40.312477111816406, -38.62813186645508, -36.94378662109375, -35.25944137573242, -33.575096130371094, -31.890750885009766, -30.206405639648438, -28.522062301635742, -26.837717056274414, -25.153371810913086, -23.46902847290039, -21.784683227539062, -20.100337982177734, -18.41599464416504, -16.73164939880371, -15.0473051071167, -13.362960815429688, -11.67861557006836, -9.994271278381348, -8.309926986694336, -6.625581741333008, -4.941237449645996, -3.256892681121826, -1.5725481510162354, 0.11179637908935547, 1.7961411476135254, 3.4804859161376953, 5.164830207824707, 6.849175453186035, 8.533519744873047, 10.217864036560059, 11.902209281921387, 13.586553573608398, 15.270898818969727, 16.955242156982422, 18.63958740234375, 20.323932647705078, 22.008277893066406, 23.692623138427734, 25.37696647644043, 27.061311721801758, 28.745656967163086, 30.43000030517578, 32.11434555053711, 33.79869079589844, 35.4830322265625, 37.16737747192383, 38.851722717285156, 40.53606414794922, 42.22040939331055, 43.904754638671875, 45.5890998840332, 47.27344512939453, 48.95779037475586, 50.64213562011719, 52.326480865478516, 54.010826110839844, 55.695167541503906, 57.379512786865234, 59.06385803222656, 60.74820327758789, 62.43254852294922]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 14.0, 14.0, 23.0, 13.0, 24.0, 21.0, 25.0, 36.0, 22.0, 36.0, 31.0, 42.0, 36.0, 39.0, 34.0, 48.0, 53.0, 38.0, 54.0, 38.0, 30.0, 40.0, 25.0, 29.0, 41.0, 31.0, 27.0, 23.0, 16.0, 17.0, 15.0, 12.0, 8.0, 9.0, 4.0, 5.0, 8.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-43.499874114990234, -42.1949348449707, -40.88999557495117, -39.585052490234375, -38.280113220214844, -36.97517395019531, -35.67023468017578, -34.36529541015625, -33.06035614013672, -31.755416870117188, -30.450475692749023, -29.145536422729492, -27.840595245361328, -26.535655975341797, -25.230716705322266, -23.925777435302734, -22.620834350585938, -21.315895080566406, -20.010953903198242, -18.70601463317871, -17.401073455810547, -16.096134185791016, -14.791194915771484, -13.486254692077637, -12.181314468383789, -10.876374244689941, -9.571434020996094, -8.266494750976562, -6.961554527282715, -5.656614303588867, -4.351674556732178, -3.0467348098754883, -1.7417984008789062, -0.4368584156036377, 0.8680815696716309, 2.1730215549468994, 3.477961540222168, 4.782901763916016, 6.087841510772705, 7.3927812576293945, 8.697721481323242, 10.00266170501709, 11.307601928710938, 12.612541198730469, 13.917481422424316, 15.222421646118164, 16.527360916137695, 17.83230209350586, 19.13724136352539, 20.442180633544922, 21.747121810913086, 23.052061080932617, 24.35700225830078, 25.661941528320312, 26.966880798339844, 28.271820068359375, 29.57676124572754, 30.88170051574707, 32.186641693115234, 33.491580963134766, 34.7965202331543, 36.101463317871094, 37.406402587890625, 38.711341857910156, 40.01628112792969]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 4.0, 7.0, 11.0, 9.0, 3.0, 7.0, 13.0, 14.0, 15.0, 18.0, 17.0, 30.0, 27.0, 31.0, 21.0, 25.0, 44.0, 31.0, 40.0, 34.0, 35.0, 45.0, 37.0, 31.0, 38.0, 36.0, 41.0, 43.0, 27.0, 27.0, 32.0, 28.0, 24.0, 16.0, 26.0, 15.0, 16.0, 12.0, 11.0, 10.0, 6.0, 7.0, 7.0, 11.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.82421875, -4.67535400390625, -4.5264892578125, -4.37762451171875, -4.228759765625, -4.07989501953125, -3.9310302734375, -3.78216552734375, -3.63330078125, -3.48443603515625, -3.3355712890625, -3.18670654296875, -3.037841796875, -2.88897705078125, -2.7401123046875, -2.59124755859375, -2.4423828125, -2.29351806640625, -2.1446533203125, -1.99578857421875, -1.846923828125, -1.69805908203125, -1.5491943359375, -1.40032958984375, -1.25146484375, -1.10260009765625, -0.9537353515625, -0.80487060546875, -0.656005859375, -0.50714111328125, -0.3582763671875, -0.20941162109375, -0.060546875, 0.08831787109375, 0.2371826171875, 0.38604736328125, 0.534912109375, 0.68377685546875, 0.8326416015625, 0.98150634765625, 1.13037109375, 1.27923583984375, 1.4281005859375, 1.57696533203125, 1.725830078125, 1.87469482421875, 2.0235595703125, 2.17242431640625, 2.3212890625, 2.47015380859375, 2.6190185546875, 2.76788330078125, 2.916748046875, 3.06561279296875, 3.2144775390625, 3.36334228515625, 3.51220703125, 3.66107177734375, 3.8099365234375, 3.95880126953125, 4.107666015625, 4.25653076171875, 4.4053955078125, 4.55426025390625, 4.703125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 10.0, 18.0, 31.0, 48.0, 67.0, 138.0, 206.0, 377.0, 687.0, 1443.0, 3588.0, 10535.0, 39558.0, 245584.0, 632597.0, 84161.0, 19402.0, 5825.0, 2116.0, 978.0, 472.0, 306.0, 142.0, 101.0, 54.0, 44.0, 18.0, 14.0, 5.0, 9.0, 4.0, 1.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.515625, -10.20849609375, -9.9013671875, -9.59423828125, -9.287109375, -8.97998046875, -8.6728515625, -8.36572265625, -8.05859375, -7.75146484375, -7.4443359375, -7.13720703125, -6.830078125, -6.52294921875, -6.2158203125, -5.90869140625, -5.6015625, -5.29443359375, -4.9873046875, -4.68017578125, -4.373046875, -4.06591796875, -3.7587890625, -3.45166015625, -3.14453125, -2.83740234375, -2.5302734375, -2.22314453125, -1.916015625, -1.60888671875, -1.3017578125, -0.99462890625, -0.6875, -0.38037109375, -0.0732421875, 0.23388671875, 0.541015625, 0.84814453125, 1.1552734375, 1.46240234375, 1.76953125, 2.07666015625, 2.3837890625, 2.69091796875, 2.998046875, 3.30517578125, 3.6123046875, 3.91943359375, 4.2265625, 4.53369140625, 4.8408203125, 5.14794921875, 5.455078125, 5.76220703125, 6.0693359375, 6.37646484375, 6.68359375, 6.99072265625, 7.2978515625, 7.60498046875, 7.912109375, 8.21923828125, 8.5263671875, 8.83349609375, 9.140625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 4.0, 5.0, 5.0, 6.0, 6.0, 8.0, 9.0, 8.0, 16.0, 16.0, 19.0, 15.0, 19.0, 19.0, 22.0, 32.0, 18.0, 27.0, 38.0, 41.0, 39.0, 31.0, 31.0, 51.0, 1066.0, 44.0, 23.0, 27.0, 37.0, 29.0, 30.0, 32.0, 34.0, 27.0, 26.0, 21.0, 24.0, 15.0, 17.0, 21.0, 12.0, 12.0, 6.0, 8.0, 10.0, 10.0, 1.0, 4.0, 4.0, 2.0, 1.0, 6.0, 3.0], "bins": [-3.73828125, -3.633209228515625, -3.52813720703125, -3.423065185546875, -3.3179931640625, -3.212921142578125, -3.10784912109375, -3.002777099609375, -2.897705078125, -2.792633056640625, -2.68756103515625, -2.582489013671875, -2.4774169921875, -2.372344970703125, -2.26727294921875, -2.162200927734375, -2.05712890625, -1.952056884765625, -1.84698486328125, -1.741912841796875, -1.6368408203125, -1.531768798828125, -1.42669677734375, -1.321624755859375, -1.216552734375, -1.111480712890625, -1.00640869140625, -0.901336669921875, -0.7962646484375, -0.691192626953125, -0.58612060546875, -0.481048583984375, -0.3759765625, -0.270904541015625, -0.16583251953125, -0.060760498046875, 0.0443115234375, 0.149383544921875, 0.25445556640625, 0.359527587890625, 0.464599609375, 0.569671630859375, 0.67474365234375, 0.779815673828125, 0.8848876953125, 0.989959716796875, 1.09503173828125, 1.200103759765625, 1.30517578125, 1.410247802734375, 1.51531982421875, 1.620391845703125, 1.7254638671875, 1.830535888671875, 1.93560791015625, 2.040679931640625, 2.145751953125, 2.250823974609375, 2.35589599609375, 2.460968017578125, 2.5660400390625, 2.671112060546875, 2.77618408203125, 2.881256103515625, 2.986328125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 7.0, 5.0, 7.0, 13.0, 9.0, 28.0, 17.0, 36.0, 67.0, 75.0, 108.0, 171.0, 311.0, 478.0, 951.0, 1809.0, 3807.0, 9027.0, 25176.0, 93379.0, 942939.0, 885544.0, 91293.0, 25024.0, 9036.0, 3693.0, 1807.0, 951.0, 479.0, 312.0, 171.0, 118.0, 74.0, 74.0, 33.0, 33.0, 12.0, 19.0, 13.0, 6.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.2764892578125, -4.142822265625, -4.0091552734375, -3.87548828125, -3.7418212890625, -3.608154296875, -3.4744873046875, -3.3408203125, -3.2071533203125, -3.073486328125, -2.9398193359375, -2.80615234375, -2.6724853515625, -2.538818359375, -2.4051513671875, -2.271484375, -2.1378173828125, -2.004150390625, -1.8704833984375, -1.73681640625, -1.6031494140625, -1.469482421875, -1.3358154296875, -1.2021484375, -1.0684814453125, -0.934814453125, -0.8011474609375, -0.66748046875, -0.5338134765625, -0.400146484375, -0.2664794921875, -0.1328125, 0.0008544921875, 0.134521484375, 0.2681884765625, 0.40185546875, 0.5355224609375, 0.669189453125, 0.8028564453125, 0.9365234375, 1.0701904296875, 1.203857421875, 1.3375244140625, 1.47119140625, 1.6048583984375, 1.738525390625, 1.8721923828125, 2.005859375, 2.1395263671875, 2.273193359375, 2.4068603515625, 2.54052734375, 2.6741943359375, 2.807861328125, 2.9415283203125, 3.0751953125, 3.2088623046875, 3.342529296875, 3.4761962890625, 3.60986328125, 3.7435302734375, 3.877197265625, 4.0108642578125, 4.14453125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 6.0, 10.0, 8.0, 15.0, 10.0, 23.0, 32.0, 37.0, 44.0, 65.0, 142.0, 203.0, 137.0, 63.0, 39.0, 47.0, 24.0, 22.0, 15.0, 12.0, 8.0, 6.0, 5.0, 6.0, 8.0, 5.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.009765625, -0.9820785522460938, -0.9543914794921875, -0.9267044067382812, -0.899017333984375, -0.8713302612304688, -0.8436431884765625, -0.8159561157226562, -0.78826904296875, -0.7605819702148438, -0.7328948974609375, -0.7052078247070312, -0.677520751953125, -0.6498336791992188, -0.6221466064453125, -0.5944595336914062, -0.5667724609375, -0.5390853881835938, -0.5113983154296875, -0.48371124267578125, -0.456024169921875, -0.42833709716796875, -0.4006500244140625, -0.37296295166015625, -0.34527587890625, -0.31758880615234375, -0.2899017333984375, -0.26221466064453125, -0.234527587890625, -0.20684051513671875, -0.1791534423828125, -0.15146636962890625, -0.123779296875, -0.09609222412109375, -0.0684051513671875, -0.04071807861328125, -0.013031005859375, 0.01465606689453125, 0.0423431396484375, 0.07003021240234375, 0.09771728515625, 0.12540435791015625, 0.1530914306640625, 0.18077850341796875, 0.208465576171875, 0.23615264892578125, 0.2638397216796875, 0.29152679443359375, 0.3192138671875, 0.34690093994140625, 0.3745880126953125, 0.40227508544921875, 0.429962158203125, 0.45764923095703125, 0.4853363037109375, 0.5130233764648438, 0.54071044921875, 0.5683975219726562, 0.5960845947265625, 0.6237716674804688, 0.651458740234375, 0.6791458129882812, 0.7068328857421875, 0.7345199584960938, 0.76220703125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 3.0, 3.0, 7.0, 3.0, 7.0, 6.0, 15.0, 11.0, 25.0, 33.0, 58.0, 130.0, 407.0, 3669.0, 207783.0, 829858.0, 5669.0, 535.0, 159.0, 60.0, 41.0, 19.0, 12.0, 12.0, 11.0, 8.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2265625, -14.6842041015625, -14.141845703125, -13.5994873046875, -13.05712890625, -12.5147705078125, -11.972412109375, -11.4300537109375, -10.8876953125, -10.3453369140625, -9.802978515625, -9.2606201171875, -8.71826171875, -8.1759033203125, -7.633544921875, -7.0911865234375, -6.548828125, -6.0064697265625, -5.464111328125, -4.9217529296875, -4.37939453125, -3.8370361328125, -3.294677734375, -2.7523193359375, -2.2099609375, -1.6676025390625, -1.125244140625, -0.5828857421875, -0.04052734375, 0.5018310546875, 1.044189453125, 1.5865478515625, 2.12890625, 2.6712646484375, 3.213623046875, 3.7559814453125, 4.29833984375, 4.8406982421875, 5.383056640625, 5.9254150390625, 6.4677734375, 7.0101318359375, 7.552490234375, 8.0948486328125, 8.63720703125, 9.1795654296875, 9.721923828125, 10.2642822265625, 10.806640625, 11.3489990234375, 11.891357421875, 12.4337158203125, 12.97607421875, 13.5184326171875, 14.060791015625, 14.6031494140625, 15.1455078125, 15.6878662109375, 16.230224609375, 16.7725830078125, 17.31494140625, 17.8572998046875, 18.399658203125, 18.9420166015625, 19.484375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 4.0, 10.0, 21.0, 43.0, 75.0, 151.0, 198.0, 213.0, 137.0, 75.0, 40.0, 25.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9035966396331787, -0.813762366771698, -0.7239280939102173, -0.6340937614440918, -0.5442594885826111, -0.45442521572113037, -0.3645908832550049, -0.27475661039352417, -0.18492233753204346, -0.09508804976940155, -0.0052537620067596436, 0.08458054065704346, 0.17441481351852417, 0.2642490863800049, 0.35408341884613037, 0.4439176917076111, 0.5337519645690918, 0.6235862374305725, 0.7134205102920532, 0.8032548427581787, 0.8930891156196594, 0.9829233884811401, 1.0727577209472656, 1.1625919342041016, 1.252426266670227, 1.3422605991363525, 1.4320948123931885, 1.521929144859314, 1.6117634773254395, 1.7015976905822754, 1.7914320230484009, 1.8812663555145264, 1.9711003303527832, 2.060934543609619, 2.150768995285034, 2.24060320854187, 2.330437421798706, 2.420271873474121, 2.510106086730957, 2.599940299987793, 2.689774513244629, 2.779608726501465, 2.86944317817688, 2.959277391433716, 3.0491116046905518, 3.138946056365967, 3.2287802696228027, 3.3186144828796387, 3.4084489345550537, 3.4982831478118896, 3.5881175994873047, 3.6779518127441406, 3.7677860260009766, 3.8576202392578125, 3.9474546909332275, 4.037289142608643, 4.1271233558654785, 4.2169575691223145, 4.30679178237915, 4.3966264724731445, 4.4864606857299805, 4.576294898986816, 4.666129112243652, 4.755963325500488, 4.845797538757324]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 9.0, 11.0, 11.0, 15.0, 10.0, 21.0, 18.0, 16.0, 30.0, 35.0, 37.0, 44.0, 41.0, 42.0, 37.0, 45.0, 56.0, 35.0, 39.0, 48.0, 46.0, 31.0, 58.0, 37.0, 34.0, 30.0, 23.0, 26.0, 27.0, 17.0, 16.0, 12.0, 7.0, 7.0, 6.0, 8.0, 5.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6748338937759399, -0.6492640972137451, -0.6236943006515503, -0.5981245636940002, -0.5725547671318054, -0.5469849705696106, -0.5214152336120605, -0.4958454370498657, -0.4702756404876709, -0.4447058439254761, -0.41913607716560364, -0.3935663104057312, -0.3679965138435364, -0.34242671728134155, -0.3168569505214691, -0.2912871837615967, -0.26571738719940186, -0.24014760553836823, -0.2145778238773346, -0.18900804221630096, -0.16343826055526733, -0.1378684788942337, -0.11229869723320007, -0.08672891557216644, -0.06115913391113281, -0.03558935225009918, -0.010019570589065552, 0.015550211071968079, 0.04111999273300171, 0.06668977439403534, 0.09225955605506897, 0.1178293377161026, 0.14339911937713623, 0.16896890103816986, 0.1945386826992035, 0.22010846436023712, 0.24567824602127075, 0.2712480425834656, 0.296817809343338, 0.32238757610321045, 0.3479573726654053, 0.3735271692276001, 0.39909693598747253, 0.42466670274734497, 0.4502364993095398, 0.4758062958717346, 0.5013760328292847, 0.5269458293914795, 0.5525156259536743, 0.5780854225158691, 0.603655219078064, 0.629224956035614, 0.6547947525978088, 0.6803645491600037, 0.7059342861175537, 0.7315040826797485, 0.7570738792419434, 0.7826436758041382, 0.808213472366333, 0.8337832093238831, 0.8593530058860779, 0.8849228024482727, 0.9104925394058228, 0.9360623359680176, 0.9616321325302124]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 11.0, 6.0, 10.0, 13.0, 12.0, 13.0, 16.0, 20.0, 23.0, 29.0, 30.0, 23.0, 31.0, 26.0, 31.0, 35.0, 45.0, 33.0, 32.0, 42.0, 40.0, 28.0, 38.0, 33.0, 45.0, 34.0, 29.0, 38.0, 26.0, 24.0, 28.0, 22.0, 18.0, 11.0, 12.0, 14.0, 8.0, 9.0, 8.0, 10.0, 8.0, 6.0, 7.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.7265625, -4.58319091796875, -4.4398193359375, -4.29644775390625, -4.153076171875, -4.00970458984375, -3.8663330078125, -3.72296142578125, -3.57958984375, -3.43621826171875, -3.2928466796875, -3.14947509765625, -3.006103515625, -2.86273193359375, -2.7193603515625, -2.57598876953125, -2.4326171875, -2.28924560546875, -2.1458740234375, -2.00250244140625, -1.859130859375, -1.71575927734375, -1.5723876953125, -1.42901611328125, -1.28564453125, -1.14227294921875, -0.9989013671875, -0.85552978515625, -0.712158203125, -0.56878662109375, -0.4254150390625, -0.28204345703125, -0.138671875, 0.00469970703125, 0.1480712890625, 0.29144287109375, 0.434814453125, 0.57818603515625, 0.7215576171875, 0.86492919921875, 1.00830078125, 1.15167236328125, 1.2950439453125, 1.43841552734375, 1.581787109375, 1.72515869140625, 1.8685302734375, 2.01190185546875, 2.1552734375, 2.29864501953125, 2.4420166015625, 2.58538818359375, 2.728759765625, 2.87213134765625, 3.0155029296875, 3.15887451171875, 3.30224609375, 3.44561767578125, 3.5889892578125, 3.73236083984375, 3.875732421875, 4.01910400390625, 4.1624755859375, 4.30584716796875, 4.44921875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 11.0, 10.0, 15.0, 21.0, 36.0, 38.0, 53.0, 76.0, 108.0, 169.0, 213.0, 297.0, 437.0, 694.0, 901.0, 1376.0, 2026.0, 2948.0, 4539.0, 6970.0, 10829.0, 17815.0, 30081.0, 52979.0, 99920.0, 191042.0, 257095.0, 165625.0, 85163.0, 45997.0, 26362.0, 15625.0, 9959.0, 6244.0, 4202.0, 2687.0, 1841.0, 1266.0, 901.0, 590.0, 411.0, 301.0, 209.0, 132.0, 97.0, 65.0, 47.0, 44.0, 27.0, 24.0, 11.0, 13.0, 3.0, 5.0, 3.0, 4.0, 3.0, 2.0], "bins": [-5.2890625, -5.125732421875, -4.96240234375, -4.799072265625, -4.6357421875, -4.472412109375, -4.30908203125, -4.145751953125, -3.982421875, -3.819091796875, -3.65576171875, -3.492431640625, -3.3291015625, -3.165771484375, -3.00244140625, -2.839111328125, -2.67578125, -2.512451171875, -2.34912109375, -2.185791015625, -2.0224609375, -1.859130859375, -1.69580078125, -1.532470703125, -1.369140625, -1.205810546875, -1.04248046875, -0.879150390625, -0.7158203125, -0.552490234375, -0.38916015625, -0.225830078125, -0.0625, 0.100830078125, 0.26416015625, 0.427490234375, 0.5908203125, 0.754150390625, 0.91748046875, 1.080810546875, 1.244140625, 1.407470703125, 1.57080078125, 1.734130859375, 1.8974609375, 2.060791015625, 2.22412109375, 2.387451171875, 2.55078125, 2.714111328125, 2.87744140625, 3.040771484375, 3.2041015625, 3.367431640625, 3.53076171875, 3.694091796875, 3.857421875, 4.020751953125, 4.18408203125, 4.347412109375, 4.5107421875, 4.674072265625, 4.83740234375, 5.000732421875, 5.1640625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 8.0, 5.0, 6.0, 7.0, 13.0, 17.0, 20.0, 27.0, 30.0, 21.0, 31.0, 19.0, 30.0, 48.0, 40.0, 59.0, 87.0, 155.0, 319.0, 1335.0, 180.0, 111.0, 81.0, 64.0, 39.0, 38.0, 41.0, 35.0, 20.0, 30.0, 12.0, 23.0, 19.0, 20.0, 10.0, 8.0, 11.0, 10.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.0546875, -14.5716552734375, -14.088623046875, -13.6055908203125, -13.12255859375, -12.6395263671875, -12.156494140625, -11.6734619140625, -11.1904296875, -10.7073974609375, -10.224365234375, -9.7413330078125, -9.25830078125, -8.7752685546875, -8.292236328125, -7.8092041015625, -7.326171875, -6.8431396484375, -6.360107421875, -5.8770751953125, -5.39404296875, -4.9110107421875, -4.427978515625, -3.9449462890625, -3.4619140625, -2.9788818359375, -2.495849609375, -2.0128173828125, -1.52978515625, -1.0467529296875, -0.563720703125, -0.0806884765625, 0.40234375, 0.8853759765625, 1.368408203125, 1.8514404296875, 2.33447265625, 2.8175048828125, 3.300537109375, 3.7835693359375, 4.2666015625, 4.7496337890625, 5.232666015625, 5.7156982421875, 6.19873046875, 6.6817626953125, 7.164794921875, 7.6478271484375, 8.130859375, 8.6138916015625, 9.096923828125, 9.5799560546875, 10.06298828125, 10.5460205078125, 11.029052734375, 11.5120849609375, 11.9951171875, 12.4781494140625, 12.961181640625, 13.4442138671875, 13.92724609375, 14.4102783203125, 14.893310546875, 15.3763427734375, 15.859375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 3.0, 4.0, 11.0, 11.0, 14.0, 16.0, 25.0, 18.0, 33.0, 26.0, 47.0, 58.0, 80.0, 108.0, 116.0, 198.0, 292.0, 465.0, 1148.0, 5364.0, 53501.0, 1965922.0, 1077282.0, 34513.0, 4177.0, 966.0, 404.0, 220.0, 144.0, 110.0, 83.0, 68.0, 61.0, 55.0, 44.0, 23.0, 16.0, 19.0, 12.0, 16.0, 6.0, 3.0, 8.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.8125, -25.9453125, -25.078125, -24.2109375, -23.34375, -22.4765625, -21.609375, -20.7421875, -19.875, -19.0078125, -18.140625, -17.2734375, -16.40625, -15.5390625, -14.671875, -13.8046875, -12.9375, -12.0703125, -11.203125, -10.3359375, -9.46875, -8.6015625, -7.734375, -6.8671875, -6.0, -5.1328125, -4.265625, -3.3984375, -2.53125, -1.6640625, -0.796875, 0.0703125, 0.9375, 1.8046875, 2.671875, 3.5390625, 4.40625, 5.2734375, 6.140625, 7.0078125, 7.875, 8.7421875, 9.609375, 10.4765625, 11.34375, 12.2109375, 13.078125, 13.9453125, 14.8125, 15.6796875, 16.546875, 17.4140625, 18.28125, 19.1484375, 20.015625, 20.8828125, 21.75, 22.6171875, 23.484375, 24.3515625, 25.21875, 26.0859375, 26.953125, 27.8203125, 28.6875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 40.0, 632.0, 336.0, 10.0, 0.0, 1.0], "bins": [-542.2586059570312, -533.1889038085938, -524.1192016601562, -515.0494995117188, -505.9798278808594, -496.9101257324219, -487.8404235839844, -478.770751953125, -469.7010498046875, -460.63134765625, -451.5616455078125, -442.4919738769531, -433.4222717285156, -424.3525695800781, -415.2828674316406, -406.21319580078125, -397.14349365234375, -388.07379150390625, -379.00408935546875, -369.9344177246094, -360.8647155761719, -351.7950134277344, -342.7253112792969, -333.6556396484375, -324.5859069824219, -315.5162048339844, -306.4465026855469, -297.3768310546875, -288.30712890625, -279.2374267578125, -270.167724609375, -261.0980224609375, -252.0283660888672, -242.9586639404297, -233.88897705078125, -224.81927490234375, -215.7495880126953, -206.6798858642578, -197.61019897460938, -188.54049682617188, -179.47079467773438, -170.40109252929688, -161.33140563964844, -152.26170349121094, -143.1920166015625, -134.122314453125, -125.05261993408203, -115.98292541503906, -106.91323852539062, -97.84354400634766, -88.77384948730469, -79.70414733886719, -70.63446044921875, -61.564762115478516, -52.49506378173828, -43.42536926269531, -34.35567092895508, -25.28597640991211, -16.216279983520508, -7.146583557128906, 1.9231109619140625, 10.992805480957031, 20.062503814697266, 29.132198333740234, 38.2018928527832]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 4.0, 5.0, 7.0, 16.0, 6.0, 11.0, 7.0, 20.0, 16.0, 13.0, 11.0, 18.0, 20.0, 26.0, 27.0, 30.0, 29.0, 36.0, 24.0, 48.0, 26.0, 41.0, 44.0, 39.0, 28.0, 44.0, 35.0, 41.0, 35.0, 28.0, 28.0, 27.0, 29.0, 24.0, 22.0, 25.0, 14.0, 17.0, 7.0, 12.0, 14.0, 9.0, 12.0, 9.0, 4.0, 8.0, 3.0, 1.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.532100677490234, -37.267250061035156, -36.002403259277344, -34.737552642822266, -33.47270202636719, -32.20785140991211, -30.943004608154297, -29.67815399169922, -28.41330337524414, -27.148454666137695, -25.883604049682617, -24.618755340576172, -23.353904724121094, -22.08905601501465, -20.824207305908203, -19.559356689453125, -18.29450798034668, -17.029659271240234, -15.764808654785156, -14.499959945678711, -13.235109329223633, -11.970260620117188, -10.705410957336426, -9.440561294555664, -8.175711631774902, -6.910861968994141, -5.646012306213379, -4.381163120269775, -3.1163134574890137, -1.851463794708252, -0.5866146087646484, 0.6782350540161133, 1.943084716796875, 3.2079343795776367, 4.472784042358398, 5.737633228302002, 7.002482891082764, 8.267332077026367, 9.532181739807129, 10.79703140258789, 12.061881065368652, 13.326730728149414, 14.591580390930176, 15.856430053710938, 17.121278762817383, 18.38612937927246, 19.650978088378906, 20.915828704833984, 22.18067741394043, 23.445526123046875, 24.710376739501953, 25.9752254486084, 27.240076065063477, 28.504924774169922, 29.769775390625, 31.034624099731445, 32.29947280883789, 33.56432342529297, 34.82917022705078, 36.09402084350586, 37.35887145996094, 38.623722076416016, 39.88856887817383, 41.153419494628906, 42.418270111083984]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 5.0, 6.0, 7.0, 7.0, 16.0, 14.0, 22.0, 8.0, 28.0, 21.0, 27.0, 30.0, 35.0, 39.0, 34.0, 39.0, 47.0, 29.0, 30.0, 39.0, 33.0, 33.0, 47.0, 38.0, 40.0, 42.0, 37.0, 32.0, 33.0, 27.0, 16.0, 23.0, 14.0, 18.0, 12.0, 14.0, 13.0, 6.0, 10.0, 9.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.47265625, -5.30609130859375, -5.1395263671875, -4.97296142578125, -4.806396484375, -4.63983154296875, -4.4732666015625, -4.30670166015625, -4.14013671875, -3.97357177734375, -3.8070068359375, -3.64044189453125, -3.473876953125, -3.30731201171875, -3.1407470703125, -2.97418212890625, -2.8076171875, -2.64105224609375, -2.4744873046875, -2.30792236328125, -2.141357421875, -1.97479248046875, -1.8082275390625, -1.64166259765625, -1.47509765625, -1.30853271484375, -1.1419677734375, -0.97540283203125, -0.808837890625, -0.64227294921875, -0.4757080078125, -0.30914306640625, -0.142578125, 0.02398681640625, 0.1905517578125, 0.35711669921875, 0.523681640625, 0.69024658203125, 0.8568115234375, 1.02337646484375, 1.18994140625, 1.35650634765625, 1.5230712890625, 1.68963623046875, 1.856201171875, 2.02276611328125, 2.1893310546875, 2.35589599609375, 2.5224609375, 2.68902587890625, 2.8555908203125, 3.02215576171875, 3.188720703125, 3.35528564453125, 3.5218505859375, 3.68841552734375, 3.85498046875, 4.02154541015625, 4.1881103515625, 4.35467529296875, 4.521240234375, 4.68780517578125, 4.8543701171875, 5.02093505859375, 5.1875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 4.0, 5.0, 7.0, 10.0, 10.0, 23.0, 34.0, 26.0, 61.0, 91.0, 134.0, 220.0, 380.0, 579.0, 1004.0, 2083.0, 4532.0, 12105.0, 41655.0, 256795.0, 2413067.0, 1294230.0, 123036.0, 27364.0, 8960.0, 3824.0, 1785.0, 907.0, 503.0, 313.0, 188.0, 131.0, 76.0, 38.0, 43.0, 13.0, 18.0, 12.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.359375, -16.84619140625, -16.3330078125, -15.81982421875, -15.306640625, -14.79345703125, -14.2802734375, -13.76708984375, -13.25390625, -12.74072265625, -12.2275390625, -11.71435546875, -11.201171875, -10.68798828125, -10.1748046875, -9.66162109375, -9.1484375, -8.63525390625, -8.1220703125, -7.60888671875, -7.095703125, -6.58251953125, -6.0693359375, -5.55615234375, -5.04296875, -4.52978515625, -4.0166015625, -3.50341796875, -2.990234375, -2.47705078125, -1.9638671875, -1.45068359375, -0.9375, -0.42431640625, 0.0888671875, 0.60205078125, 1.115234375, 1.62841796875, 2.1416015625, 2.65478515625, 3.16796875, 3.68115234375, 4.1943359375, 4.70751953125, 5.220703125, 5.73388671875, 6.2470703125, 6.76025390625, 7.2734375, 7.78662109375, 8.2998046875, 8.81298828125, 9.326171875, 9.83935546875, 10.3525390625, 10.86572265625, 11.37890625, 11.89208984375, 12.4052734375, 12.91845703125, 13.431640625, 13.94482421875, 14.4580078125, 14.97119140625, 15.484375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 7.0, 4.0, 6.0, 13.0, 20.0, 20.0, 26.0, 32.0, 45.0, 64.0, 59.0, 84.0, 118.0, 215.0, 245.0, 292.0, 421.0, 447.0, 450.0, 362.0, 267.0, 205.0, 174.0, 117.0, 90.0, 64.0, 46.0, 42.0, 37.0, 26.0, 14.0, 9.0, 9.0, 6.0, 11.0, 6.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -11.0546875, -10.71875, -10.3828125, -10.046875, -9.7109375, -9.375, -9.0390625, -8.703125, -8.3671875, -8.03125, -7.6953125, -7.359375, -7.0234375, -6.6875, -6.3515625, -6.015625, -5.6796875, -5.34375, -5.0078125, -4.671875, -4.3359375, -4.0, -3.6640625, -3.328125, -2.9921875, -2.65625, -2.3203125, -1.984375, -1.6484375, -1.3125, -0.9765625, -0.640625, -0.3046875, 0.03125, 0.3671875, 0.703125, 1.0390625, 1.375, 1.7109375, 2.046875, 2.3828125, 2.71875, 3.0546875, 3.390625, 3.7265625, 4.0625, 4.3984375, 4.734375, 5.0703125, 5.40625, 5.7421875, 6.078125, 6.4140625, 6.75, 7.0859375, 7.421875, 7.7578125, 8.09375, 8.4296875, 8.765625, 9.1015625, 9.4375, 9.7734375, 10.109375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 11.0, 13.0, 8.0, 11.0, 13.0, 16.0, 28.0, 45.0, 45.0, 61.0, 83.0, 151.0, 291.0, 626.0, 1785.0, 6331.0, 29316.0, 222146.0, 2950476.0, 891851.0, 72602.0, 13050.0, 3236.0, 1035.0, 382.0, 227.0, 113.0, 69.0, 57.0, 53.0, 27.0, 23.0, 25.0, 23.0, 6.0, 10.0, 7.0, 5.0, 5.0, 4.0, 2.0, 5.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5625, -24.703125, -23.84375, -22.984375, -22.125, -21.265625, -20.40625, -19.546875, -18.6875, -17.828125, -16.96875, -16.109375, -15.25, -14.390625, -13.53125, -12.671875, -11.8125, -10.953125, -10.09375, -9.234375, -8.375, -7.515625, -6.65625, -5.796875, -4.9375, -4.078125, -3.21875, -2.359375, -1.5, -0.640625, 0.21875, 1.078125, 1.9375, 2.796875, 3.65625, 4.515625, 5.375, 6.234375, 7.09375, 7.953125, 8.8125, 9.671875, 10.53125, 11.390625, 12.25, 13.109375, 13.96875, 14.828125, 15.6875, 16.546875, 17.40625, 18.265625, 19.125, 19.984375, 20.84375, 21.703125, 22.5625, 23.421875, 24.28125, 25.140625, 26.0, 26.859375, 27.71875, 28.578125, 29.4375]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 7.0, 11.0, 16.0, 44.0, 76.0, 103.0, 113.0, 152.0, 113.0, 111.0, 97.0, 52.0, 50.0, 24.0, 12.0, 12.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.615234375, -56.06852722167969, -53.52181625366211, -50.9751091003418, -48.42839813232422, -45.881690979003906, -43.334983825683594, -40.788272857666016, -38.24156188964844, -35.694854736328125, -33.14814376831055, -30.601436614990234, -28.054725646972656, -25.508018493652344, -22.9613094329834, -20.414600372314453, -17.86789321899414, -15.321184158325195, -12.77447509765625, -10.227766990661621, -7.681057929992676, -5.1343488693237305, -2.5876407623291016, -0.04093170166015625, 2.505777359008789, 5.052486419677734, 7.5991950035095215, 10.145903587341309, 12.692612648010254, 15.2393217086792, 17.786029815673828, 20.332738876342773, 22.87944793701172, 25.426156997680664, 27.97286605834961, 30.519573211669922, 33.0662841796875, 35.61299133300781, 38.159698486328125, 40.7064094543457, 43.25312042236328, 45.799827575683594, 48.34653854370117, 50.893245697021484, 53.43995666503906, 55.986663818359375, 58.53337097167969, 61.080081939697266, 63.62678909301758, 66.17350006103516, 68.72020721435547, 71.26691436767578, 73.8136215209961, 76.36033630371094, 78.90704345703125, 81.45375061035156, 84.00045776367188, 86.54716491699219, 89.0938720703125, 91.64058685302734, 94.18729400634766, 96.73400115966797, 99.28070831298828, 101.82742309570312, 104.37413024902344]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 6.0, 7.0, 13.0, 5.0, 7.0, 16.0, 12.0, 20.0, 23.0, 26.0, 26.0, 44.0, 38.0, 47.0, 47.0, 41.0, 52.0, 50.0, 46.0, 40.0, 39.0, 35.0, 40.0, 35.0, 40.0, 42.0, 36.0, 27.0, 27.0, 28.0, 22.0, 10.0, 11.0, 11.0, 12.0, 4.0, 4.0, 2.0, 4.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-48.59585952758789, -47.260101318359375, -45.924339294433594, -44.58858108520508, -43.25282287597656, -41.91706085205078, -40.581302642822266, -39.24554443359375, -37.90978240966797, -36.57402420043945, -35.23826217651367, -33.902503967285156, -32.56674575805664, -31.230985641479492, -29.895225524902344, -28.559467315673828, -27.223709106445312, -25.887948989868164, -24.55219078063965, -23.2164306640625, -21.880672454833984, -20.544912338256836, -19.209152221679688, -17.873394012451172, -16.537633895874023, -15.201874732971191, -13.86611557006836, -12.530355453491211, -11.194596290588379, -9.858837127685547, -8.523077011108398, -7.187317848205566, -5.8515625, -4.515803337097168, -3.1800436973571777, -1.8442840576171875, -0.5085248947143555, 0.8272342681884766, 2.162994384765625, 3.498753547668457, 4.834512710571289, 6.170271873474121, 7.506031513214111, 8.841791152954102, 10.177550315856934, 11.513309478759766, 12.849069595336914, 14.184828758239746, 15.520587921142578, 16.856348037719727, 18.192106246948242, 19.52786636352539, 20.863624572753906, 22.199384689331055, 23.535144805908203, 24.87090301513672, 26.206663131713867, 27.542423248291016, 28.87818145751953, 30.21394157409668, 31.549701690673828, 32.885459899902344, 34.221221923828125, 35.55698013305664, 36.892738342285156]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 4.0, 9.0, 6.0, 10.0, 14.0, 17.0, 14.0, 11.0, 20.0, 18.0, 18.0, 28.0, 26.0, 21.0, 37.0, 32.0, 24.0, 37.0, 21.0, 39.0, 37.0, 33.0, 35.0, 45.0, 38.0, 53.0, 33.0, 41.0, 26.0, 24.0, 23.0, 28.0, 31.0, 24.0, 16.0, 21.0, 9.0, 14.0, 10.0, 10.0, 8.0, 7.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-5.3671875, -5.21295166015625, -5.0587158203125, -4.90447998046875, -4.750244140625, -4.59600830078125, -4.4417724609375, -4.28753662109375, -4.13330078125, -3.97906494140625, -3.8248291015625, -3.67059326171875, -3.516357421875, -3.36212158203125, -3.2078857421875, -3.05364990234375, -2.8994140625, -2.74517822265625, -2.5909423828125, -2.43670654296875, -2.282470703125, -2.12823486328125, -1.9739990234375, -1.81976318359375, -1.66552734375, -1.51129150390625, -1.3570556640625, -1.20281982421875, -1.048583984375, -0.89434814453125, -0.7401123046875, -0.58587646484375, -0.431640625, -0.27740478515625, -0.1231689453125, 0.03106689453125, 0.185302734375, 0.33953857421875, 0.4937744140625, 0.64801025390625, 0.80224609375, 0.95648193359375, 1.1107177734375, 1.26495361328125, 1.419189453125, 1.57342529296875, 1.7276611328125, 1.88189697265625, 2.0361328125, 2.19036865234375, 2.3446044921875, 2.49884033203125, 2.653076171875, 2.80731201171875, 2.9615478515625, 3.11578369140625, 3.27001953125, 3.42425537109375, 3.5784912109375, 3.73272705078125, 3.886962890625, 4.04119873046875, 4.1954345703125, 4.34967041015625, 4.50390625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 3.0, 14.0, 8.0, 14.0, 14.0, 14.0, 19.0, 45.0, 47.0, 65.0, 96.0, 127.0, 158.0, 251.0, 402.0, 612.0, 1057.0, 1966.0, 4173.0, 10638.0, 39219.0, 295826.0, 592620.0, 73249.0, 16036.0, 5588.0, 2582.0, 1348.0, 807.0, 467.0, 329.0, 185.0, 151.0, 117.0, 80.0, 56.0, 49.0, 26.0, 23.0, 18.0, 15.0, 7.0, 10.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.4921875, -7.26641845703125, -7.0406494140625, -6.81488037109375, -6.589111328125, -6.36334228515625, -6.1375732421875, -5.91180419921875, -5.68603515625, -5.46026611328125, -5.2344970703125, -5.00872802734375, -4.782958984375, -4.55718994140625, -4.3314208984375, -4.10565185546875, -3.8798828125, -3.65411376953125, -3.4283447265625, -3.20257568359375, -2.976806640625, -2.75103759765625, -2.5252685546875, -2.29949951171875, -2.07373046875, -1.84796142578125, -1.6221923828125, -1.39642333984375, -1.170654296875, -0.94488525390625, -0.7191162109375, -0.49334716796875, -0.267578125, -0.04180908203125, 0.1839599609375, 0.40972900390625, 0.635498046875, 0.86126708984375, 1.0870361328125, 1.31280517578125, 1.53857421875, 1.76434326171875, 1.9901123046875, 2.21588134765625, 2.441650390625, 2.66741943359375, 2.8931884765625, 3.11895751953125, 3.3447265625, 3.57049560546875, 3.7962646484375, 4.02203369140625, 4.247802734375, 4.47357177734375, 4.6993408203125, 4.92510986328125, 5.15087890625, 5.37664794921875, 5.6024169921875, 5.82818603515625, 6.053955078125, 6.27972412109375, 6.5054931640625, 6.73126220703125, 6.95703125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 8.0, 5.0, 11.0, 9.0, 11.0, 17.0, 27.0, 19.0, 22.0, 21.0, 25.0, 31.0, 24.0, 29.0, 35.0, 40.0, 45.0, 46.0, 47.0, 1069.0, 38.0, 42.0, 35.0, 36.0, 44.0, 34.0, 39.0, 33.0, 26.0, 23.0, 25.0, 26.0, 14.0, 12.0, 20.0, 6.0, 11.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0], "bins": [-4.97265625, -4.840362548828125, -4.70806884765625, -4.575775146484375, -4.4434814453125, -4.311187744140625, -4.17889404296875, -4.046600341796875, -3.914306640625, -3.782012939453125, -3.64971923828125, -3.517425537109375, -3.3851318359375, -3.252838134765625, -3.12054443359375, -2.988250732421875, -2.85595703125, -2.723663330078125, -2.59136962890625, -2.459075927734375, -2.3267822265625, -2.194488525390625, -2.06219482421875, -1.929901123046875, -1.797607421875, -1.665313720703125, -1.53302001953125, -1.400726318359375, -1.2684326171875, -1.136138916015625, -1.00384521484375, -0.871551513671875, -0.7392578125, -0.606964111328125, -0.47467041015625, -0.342376708984375, -0.2100830078125, -0.077789306640625, 0.05450439453125, 0.186798095703125, 0.319091796875, 0.451385498046875, 0.58367919921875, 0.715972900390625, 0.8482666015625, 0.980560302734375, 1.11285400390625, 1.245147705078125, 1.37744140625, 1.509735107421875, 1.64202880859375, 1.774322509765625, 1.9066162109375, 2.038909912109375, 2.17120361328125, 2.303497314453125, 2.435791015625, 2.568084716796875, 2.70037841796875, 2.832672119140625, 2.9649658203125, 3.097259521484375, 3.22955322265625, 3.361846923828125, 3.494140625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 11.0, 6.0, 7.0, 16.0, 15.0, 23.0, 36.0, 52.0, 78.0, 111.0, 156.0, 233.0, 424.0, 672.0, 1153.0, 1986.0, 3901.0, 8680.0, 24331.0, 120783.0, 1588585.0, 284126.0, 38615.0, 11953.0, 5030.0, 2629.0, 1333.0, 804.0, 459.0, 331.0, 189.0, 115.0, 76.0, 63.0, 37.0, 28.0, 13.0, 23.0, 9.0, 12.0, 8.0, 2.0, 1.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.734375, -3.626678466796875, -3.51898193359375, -3.411285400390625, -3.3035888671875, -3.195892333984375, -3.08819580078125, -2.980499267578125, -2.872802734375, -2.765106201171875, -2.65740966796875, -2.549713134765625, -2.4420166015625, -2.334320068359375, -2.22662353515625, -2.118927001953125, -2.01123046875, -1.903533935546875, -1.79583740234375, -1.688140869140625, -1.5804443359375, -1.472747802734375, -1.36505126953125, -1.257354736328125, -1.149658203125, -1.041961669921875, -0.93426513671875, -0.826568603515625, -0.7188720703125, -0.611175537109375, -0.50347900390625, -0.395782470703125, -0.2880859375, -0.180389404296875, -0.07269287109375, 0.035003662109375, 0.1427001953125, 0.250396728515625, 0.35809326171875, 0.465789794921875, 0.573486328125, 0.681182861328125, 0.78887939453125, 0.896575927734375, 1.0042724609375, 1.111968994140625, 1.21966552734375, 1.327362060546875, 1.43505859375, 1.542755126953125, 1.65045166015625, 1.758148193359375, 1.8658447265625, 1.973541259765625, 2.08123779296875, 2.188934326171875, 2.296630859375, 2.404327392578125, 2.51202392578125, 2.619720458984375, 2.7274169921875, 2.835113525390625, 2.94281005859375, 3.050506591796875, 3.158203125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 9.0, 9.0, 16.0, 18.0, 10.0, 22.0, 26.0, 47.0, 95.0, 174.0, 194.0, 147.0, 65.0, 32.0, 31.0, 19.0, 9.0, 15.0, 11.0, 9.0, 3.0, 3.0, 6.0, 3.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482421875, -0.4674491882324219, -0.45247650146484375, -0.4375038146972656, -0.4225311279296875, -0.4075584411621094, -0.39258575439453125, -0.3776130676269531, -0.362640380859375, -0.3476676940917969, -0.33269500732421875, -0.3177223205566406, -0.3027496337890625, -0.2877769470214844, -0.27280426025390625, -0.2578315734863281, -0.24285888671875, -0.22788619995117188, -0.21291351318359375, -0.19794082641601562, -0.1829681396484375, -0.16799545288085938, -0.15302276611328125, -0.13805007934570312, -0.123077392578125, -0.10810470581054688, -0.09313201904296875, -0.07815933227539062, -0.0631866455078125, -0.048213958740234375, -0.03324127197265625, -0.018268585205078125, -0.0032958984375, 0.011676788330078125, 0.02664947509765625, 0.041622161865234375, 0.0565948486328125, 0.07156753540039062, 0.08654022216796875, 0.10151290893554688, 0.116485595703125, 0.13145828247070312, 0.14643096923828125, 0.16140365600585938, 0.1763763427734375, 0.19134902954101562, 0.20632171630859375, 0.22129440307617188, 0.23626708984375, 0.2512397766113281, 0.26621246337890625, 0.2811851501464844, 0.2961578369140625, 0.3111305236816406, 0.32610321044921875, 0.3410758972167969, 0.356048583984375, 0.3710212707519531, 0.38599395751953125, 0.4009666442871094, 0.4159393310546875, 0.4309120178222656, 0.44588470458984375, 0.4608573913574219, 0.475830078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 6.0, 5.0, 7.0, 10.0, 17.0, 26.0, 44.0, 66.0, 92.0, 259.0, 1967.0, 32799.0, 992348.0, 19101.0, 1276.0, 246.0, 95.0, 56.0, 31.0, 22.0, 19.0, 13.0, 14.0, 8.0, 5.0, 0.0, 5.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.9375, -7.658203125, -7.37890625, -7.099609375, -6.8203125, -6.541015625, -6.26171875, -5.982421875, -5.703125, -5.423828125, -5.14453125, -4.865234375, -4.5859375, -4.306640625, -4.02734375, -3.748046875, -3.46875, -3.189453125, -2.91015625, -2.630859375, -2.3515625, -2.072265625, -1.79296875, -1.513671875, -1.234375, -0.955078125, -0.67578125, -0.396484375, -0.1171875, 0.162109375, 0.44140625, 0.720703125, 1.0, 1.279296875, 1.55859375, 1.837890625, 2.1171875, 2.396484375, 2.67578125, 2.955078125, 3.234375, 3.513671875, 3.79296875, 4.072265625, 4.3515625, 4.630859375, 4.91015625, 5.189453125, 5.46875, 5.748046875, 6.02734375, 6.306640625, 6.5859375, 6.865234375, 7.14453125, 7.423828125, 7.703125, 7.982421875, 8.26171875, 8.541015625, 8.8203125, 9.099609375, 9.37890625, 9.658203125, 9.9375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 13.0, 52.0, 157.0, 316.0, 283.0, 136.0, 43.0, 11.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3676256239414215, -0.3048458695411682, -0.2420661300420761, -0.179286390542984, -0.11650663614273071, -0.05372688174247742, 0.009052842855453491, 0.07183259725570679, 0.13461235165596008, 0.19739210605621338, 0.2601718306541443, 0.3229515850543976, 0.3857313394546509, 0.4485110938549042, 0.5112907886505127, 0.5740705728530884, 0.6368503570556641, 0.699630081653595, 0.7624098658561707, 0.8251895904541016, 0.8879693746566772, 0.9507490992546082, 1.013528823852539, 1.0763086080551147, 1.1390882730484009, 1.2018680572509766, 1.2646477222442627, 1.3274275064468384, 1.390207290649414, 1.4529869556427002, 1.5157667398452759, 1.5785465240478516, 1.6413261890411377, 1.7041059732437134, 1.7668856382369995, 1.8296654224395752, 1.8924452066421509, 1.9552249908447266, 2.0180046558380127, 2.080784320831299, 2.143564224243164, 2.20634388923645, 2.2691237926483154, 2.3319034576416016, 2.3946831226348877, 2.457463026046753, 2.520242691040039, 2.583022356033325, 2.6458020210266113, 2.7085816860198975, 2.7713615894317627, 2.834141254425049, 2.896920919418335, 2.9597008228302, 3.0224804878234863, 3.0852601528167725, 3.1480400562286377, 3.210819721221924, 3.273599624633789, 3.336379289627075, 3.3991589546203613, 3.4619388580322266, 3.5247185230255127, 3.587498188018799, 3.650278091430664]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 10.0, 14.0, 9.0, 19.0, 16.0, 18.0, 22.0, 25.0, 30.0, 42.0, 34.0, 33.0, 41.0, 37.0, 44.0, 53.0, 48.0, 50.0, 52.0, 31.0, 44.0, 45.0, 40.0, 37.0, 28.0, 21.0, 29.0, 18.0, 19.0, 15.0, 8.0, 13.0, 7.0, 11.0, 5.0, 6.0, 2.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4619895815849304, -0.448482483625412, -0.43497538566589355, -0.4214682877063751, -0.4079611897468567, -0.39445406198501587, -0.3809469938278198, -0.367439866065979, -0.35393276810646057, -0.34042567014694214, -0.3269185721874237, -0.3134114742279053, -0.29990437626838684, -0.2863972783088684, -0.2728901505470276, -0.25938305258750916, -0.24587596952915192, -0.23236887156963348, -0.21886177361011505, -0.20535466074943542, -0.191847562789917, -0.17834046483039856, -0.16483336687088013, -0.1513262689113617, -0.13781917095184326, -0.12431207299232483, -0.1108049675822258, -0.09729786962270737, -0.08379076421260834, -0.0702836662530899, -0.05677656829357147, -0.04326946288347244, -0.029762357473373413, -0.016255255788564682, -0.0027481559664011, 0.010758943855762482, 0.024266045540571213, 0.037773147225379944, 0.051280245184898376, 0.0647873505949974, 0.07829444855451584, 0.09180154651403427, 0.1053086519241333, 0.11881574988365173, 0.13232284784317017, 0.1458299458026886, 0.15933704376220703, 0.17284415662288666, 0.1863512545824051, 0.19985835254192352, 0.21336545050144196, 0.22687256336212158, 0.24037966132164001, 0.25388675928115845, 0.2673938572406769, 0.2809009552001953, 0.29440805315971375, 0.3079151511192322, 0.3214222490787506, 0.33492934703826904, 0.3484364449977875, 0.3619435429573059, 0.37545067071914673, 0.38895776867866516, 0.4024648666381836]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [5.0, 1.0, 2.0, 3.0, 3.0, 8.0, 3.0, 1.0, 7.0, 6.0, 4.0, 11.0, 16.0, 15.0, 15.0, 24.0, 21.0, 23.0, 25.0, 24.0, 30.0, 36.0, 33.0, 25.0, 28.0, 48.0, 38.0, 36.0, 38.0, 45.0, 41.0, 33.0, 34.0, 39.0, 31.0, 40.0, 37.0, 22.0, 27.0, 26.0, 14.0, 19.0, 14.0, 9.0, 10.0, 8.0, 10.0, 7.0, 4.0, 3.0, 3.0, 1.0, 9.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5234375, -4.36444091796875, -4.2054443359375, -4.04644775390625, -3.887451171875, -3.72845458984375, -3.5694580078125, -3.41046142578125, -3.25146484375, -3.09246826171875, -2.9334716796875, -2.77447509765625, -2.615478515625, -2.45648193359375, -2.2974853515625, -2.13848876953125, -1.9794921875, -1.82049560546875, -1.6614990234375, -1.50250244140625, -1.343505859375, -1.18450927734375, -1.0255126953125, -0.86651611328125, -0.70751953125, -0.54852294921875, -0.3895263671875, -0.23052978515625, -0.071533203125, 0.08746337890625, 0.2464599609375, 0.40545654296875, 0.564453125, 0.72344970703125, 0.8824462890625, 1.04144287109375, 1.200439453125, 1.35943603515625, 1.5184326171875, 1.67742919921875, 1.83642578125, 1.99542236328125, 2.1544189453125, 2.31341552734375, 2.472412109375, 2.63140869140625, 2.7904052734375, 2.94940185546875, 3.1083984375, 3.26739501953125, 3.4263916015625, 3.58538818359375, 3.744384765625, 3.90338134765625, 4.0623779296875, 4.22137451171875, 4.38037109375, 4.53936767578125, 4.6983642578125, 4.85736083984375, 5.016357421875, 5.17535400390625, 5.3343505859375, 5.49334716796875, 5.65234375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 12.0, 8.0, 14.0, 30.0, 22.0, 24.0, 49.0, 74.0, 110.0, 117.0, 209.0, 270.0, 451.0, 680.0, 1100.0, 1786.0, 2877.0, 5317.0, 10189.0, 22274.0, 68841.0, 280511.0, 454810.0, 131734.0, 35974.0, 14311.0, 6902.0, 3896.0, 2156.0, 1298.0, 824.0, 524.0, 337.0, 239.0, 166.0, 117.0, 92.0, 73.0, 37.0, 36.0, 20.0, 10.0, 11.0, 6.0, 10.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.328125, -10.0076904296875, -9.687255859375, -9.3668212890625, -9.04638671875, -8.7259521484375, -8.405517578125, -8.0850830078125, -7.7646484375, -7.4442138671875, -7.123779296875, -6.8033447265625, -6.48291015625, -6.1624755859375, -5.842041015625, -5.5216064453125, -5.201171875, -4.8807373046875, -4.560302734375, -4.2398681640625, -3.91943359375, -3.5989990234375, -3.278564453125, -2.9581298828125, -2.6376953125, -2.3172607421875, -1.996826171875, -1.6763916015625, -1.35595703125, -1.0355224609375, -0.715087890625, -0.3946533203125, -0.07421875, 0.2462158203125, 0.566650390625, 0.8870849609375, 1.20751953125, 1.5279541015625, 1.848388671875, 2.1688232421875, 2.4892578125, 2.8096923828125, 3.130126953125, 3.4505615234375, 3.77099609375, 4.0914306640625, 4.411865234375, 4.7322998046875, 5.052734375, 5.3731689453125, 5.693603515625, 6.0140380859375, 6.33447265625, 6.6549072265625, 6.975341796875, 7.2957763671875, 7.6162109375, 7.9366455078125, 8.257080078125, 8.5775146484375, 8.89794921875, 9.2183837890625, 9.538818359375, 9.8592529296875, 10.1796875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 6.0, 5.0, 7.0, 5.0, 8.0, 12.0, 11.0, 19.0, 21.0, 17.0, 30.0, 29.0, 30.0, 27.0, 26.0, 53.0, 56.0, 64.0, 116.0, 240.0, 1361.0, 289.0, 133.0, 87.0, 44.0, 55.0, 45.0, 34.0, 28.0, 35.0, 29.0, 24.0, 10.0, 17.0, 16.0, 11.0, 10.0, 7.0, 6.0, 9.0, 9.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.828125, -16.3284912109375, -15.828857421875, -15.3292236328125, -14.82958984375, -14.3299560546875, -13.830322265625, -13.3306884765625, -12.8310546875, -12.3314208984375, -11.831787109375, -11.3321533203125, -10.83251953125, -10.3328857421875, -9.833251953125, -9.3336181640625, -8.833984375, -8.3343505859375, -7.834716796875, -7.3350830078125, -6.83544921875, -6.3358154296875, -5.836181640625, -5.3365478515625, -4.8369140625, -4.3372802734375, -3.837646484375, -3.3380126953125, -2.83837890625, -2.3387451171875, -1.839111328125, -1.3394775390625, -0.83984375, -0.3402099609375, 0.159423828125, 0.6590576171875, 1.15869140625, 1.6583251953125, 2.157958984375, 2.6575927734375, 3.1572265625, 3.6568603515625, 4.156494140625, 4.6561279296875, 5.15576171875, 5.6553955078125, 6.155029296875, 6.6546630859375, 7.154296875, 7.6539306640625, 8.153564453125, 8.6531982421875, 9.15283203125, 9.6524658203125, 10.152099609375, 10.6517333984375, 11.1513671875, 11.6510009765625, 12.150634765625, 12.6502685546875, 13.14990234375, 13.6495361328125, 14.149169921875, 14.6488037109375, 15.1484375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 8.0, 6.0, 18.0, 20.0, 25.0, 41.0, 53.0, 77.0, 87.0, 143.0, 193.0, 292.0, 528.0, 1892.0, 13106.0, 1110914.0, 1997194.0, 17327.0, 2209.0, 582.0, 288.0, 195.0, 160.0, 98.0, 70.0, 59.0, 36.0, 20.0, 22.0, 13.0, 8.0, 7.0, 9.0, 0.0, 3.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.96875, -28.7724609375, -27.576171875, -26.3798828125, -25.18359375, -23.9873046875, -22.791015625, -21.5947265625, -20.3984375, -19.2021484375, -18.005859375, -16.8095703125, -15.61328125, -14.4169921875, -13.220703125, -12.0244140625, -10.828125, -9.6318359375, -8.435546875, -7.2392578125, -6.04296875, -4.8466796875, -3.650390625, -2.4541015625, -1.2578125, -0.0615234375, 1.134765625, 2.3310546875, 3.52734375, 4.7236328125, 5.919921875, 7.1162109375, 8.3125, 9.5087890625, 10.705078125, 11.9013671875, 13.09765625, 14.2939453125, 15.490234375, 16.6865234375, 17.8828125, 19.0791015625, 20.275390625, 21.4716796875, 22.66796875, 23.8642578125, 25.060546875, 26.2568359375, 27.453125, 28.6494140625, 29.845703125, 31.0419921875, 32.23828125, 33.4345703125, 34.630859375, 35.8271484375, 37.0234375, 38.2197265625, 39.416015625, 40.6123046875, 41.80859375, 43.0048828125, 44.201171875, 45.3974609375, 46.59375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 7.0, 42.0, 134.0, 312.0, 328.0, 139.0, 41.0, 6.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.227622985839844, -28.985599517822266, -25.743576049804688, -22.501550674438477, -19.2595272064209, -16.01750373840332, -12.77547836303711, -9.533454895019531, -6.291431427001953, -3.049407482147217, 0.19261646270751953, 3.434640884399414, 6.676664352416992, 9.91868782043457, 13.160713195800781, 16.40273666381836, 19.644760131835938, 22.886783599853516, 26.128807067871094, 29.370832443237305, 32.61285400390625, 35.854881286621094, 39.09690475463867, 42.33892822265625, 45.58095169067383, 48.822975158691406, 52.064998626708984, 55.30702209472656, 58.549049377441406, 61.79106903076172, 65.03309631347656, 68.27511596679688, 71.51713562011719, 74.75916290283203, 78.00118255615234, 81.24320983886719, 84.4852294921875, 87.72725677490234, 90.96928405761719, 94.2113037109375, 97.45332336425781, 100.69535064697266, 103.93737030029297, 107.17939758300781, 110.42141723632812, 113.66344451904297, 116.90547180175781, 120.14749145507812, 123.38951873779297, 126.63154602050781, 129.87356567382812, 133.11558532714844, 136.3576202392578, 139.59963989257812, 142.84165954589844, 146.08367919921875, 149.32571411132812, 152.56773376464844, 155.8097686767578, 159.05178833007812, 162.29380798339844, 165.53582763671875, 168.77786254882812, 172.01988220214844, 175.26190185546875]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 3.0, 7.0, 12.0, 3.0, 7.0, 8.0, 11.0, 12.0, 18.0, 21.0, 32.0, 21.0, 30.0, 40.0, 44.0, 38.0, 35.0, 36.0, 40.0, 51.0, 48.0, 43.0, 47.0, 45.0, 41.0, 31.0, 31.0, 29.0, 37.0, 29.0, 21.0, 14.0, 22.0, 24.0, 10.0, 10.0, 9.0, 9.0, 7.0, 4.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.6561279296875, -42.20943832397461, -40.76274490356445, -39.31605529785156, -37.86936569213867, -36.422672271728516, -34.975982666015625, -33.52928924560547, -32.08259963989258, -30.635908126831055, -29.189218521118164, -27.74252700805664, -26.295835494995117, -24.849143981933594, -23.402454376220703, -21.95576286315918, -20.50907325744629, -19.062381744384766, -17.615692138671875, -16.16900062561035, -14.722309112548828, -13.275618553161621, -11.828927993774414, -10.38223648071289, -8.935545921325684, -7.488854885101318, -6.042163848876953, -4.595473289489746, -3.148782253265381, -1.7020912170410156, -0.2554006576538086, 1.1912908554077148, 2.637981414794922, 4.084672451019287, 5.531363487243652, 6.978054046630859, 8.424745559692383, 9.87143611907959, 11.318126678466797, 12.76481819152832, 14.211508750915527, 15.658199310302734, 17.104890823364258, 18.55158233642578, 19.998271942138672, 21.444963455200195, 22.89165496826172, 24.33834457397461, 25.785036087036133, 27.231727600097656, 28.678417205810547, 30.12510871887207, 31.571800231933594, 33.018489837646484, 34.465179443359375, 35.91187286376953, 37.35856246948242, 38.80525207519531, 40.25194549560547, 41.69863510131836, 43.14532470703125, 44.592018127441406, 46.0387077331543, 47.48539733886719, 48.932090759277344]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 2.0, 6.0, 8.0, 6.0, 10.0, 7.0, 5.0, 22.0, 18.0, 24.0, 23.0, 31.0, 24.0, 24.0, 34.0, 36.0, 35.0, 36.0, 38.0, 34.0, 44.0, 38.0, 49.0, 39.0, 50.0, 43.0, 27.0, 31.0, 26.0, 32.0, 29.0, 26.0, 15.0, 24.0, 21.0, 12.0, 14.0, 10.0, 11.0, 11.0, 7.0, 3.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.91436767578125, -4.7427978515625, -4.57122802734375, -4.399658203125, -4.22808837890625, -4.0565185546875, -3.88494873046875, -3.71337890625, -3.54180908203125, -3.3702392578125, -3.19866943359375, -3.027099609375, -2.85552978515625, -2.6839599609375, -2.51239013671875, -2.3408203125, -2.16925048828125, -1.9976806640625, -1.82611083984375, -1.654541015625, -1.48297119140625, -1.3114013671875, -1.13983154296875, -0.96826171875, -0.79669189453125, -0.6251220703125, -0.45355224609375, -0.281982421875, -0.11041259765625, 0.0611572265625, 0.23272705078125, 0.404296875, 0.57586669921875, 0.7474365234375, 0.91900634765625, 1.090576171875, 1.26214599609375, 1.4337158203125, 1.60528564453125, 1.77685546875, 1.94842529296875, 2.1199951171875, 2.29156494140625, 2.463134765625, 2.63470458984375, 2.8062744140625, 2.97784423828125, 3.1494140625, 3.32098388671875, 3.4925537109375, 3.66412353515625, 3.835693359375, 4.00726318359375, 4.1788330078125, 4.35040283203125, 4.52197265625, 4.69354248046875, 4.8651123046875, 5.03668212890625, 5.208251953125, 5.37982177734375, 5.5513916015625, 5.72296142578125, 5.89453125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 11.0, 8.0, 17.0, 13.0, 28.0, 29.0, 35.0, 51.0, 80.0, 94.0, 143.0, 196.0, 331.0, 451.0, 688.0, 1009.0, 1698.0, 2704.0, 4942.0, 9663.0, 20497.0, 52774.0, 174358.0, 794744.0, 1997171.0, 848509.0, 182834.0, 55418.0, 21932.0, 10518.0, 5204.0, 2885.0, 1758.0, 1121.0, 750.0, 491.0, 339.0, 237.0, 171.0, 100.0, 89.0, 64.0, 43.0, 33.0, 17.0, 17.0, 9.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.8046875, -9.49365234375, -9.1826171875, -8.87158203125, -8.560546875, -8.24951171875, -7.9384765625, -7.62744140625, -7.31640625, -7.00537109375, -6.6943359375, -6.38330078125, -6.072265625, -5.76123046875, -5.4501953125, -5.13916015625, -4.828125, -4.51708984375, -4.2060546875, -3.89501953125, -3.583984375, -3.27294921875, -2.9619140625, -2.65087890625, -2.33984375, -2.02880859375, -1.7177734375, -1.40673828125, -1.095703125, -0.78466796875, -0.4736328125, -0.16259765625, 0.1484375, 0.45947265625, 0.7705078125, 1.08154296875, 1.392578125, 1.70361328125, 2.0146484375, 2.32568359375, 2.63671875, 2.94775390625, 3.2587890625, 3.56982421875, 3.880859375, 4.19189453125, 4.5029296875, 4.81396484375, 5.125, 5.43603515625, 5.7470703125, 6.05810546875, 6.369140625, 6.68017578125, 6.9912109375, 7.30224609375, 7.61328125, 7.92431640625, 8.2353515625, 8.54638671875, 8.857421875, 9.16845703125, 9.4794921875, 9.79052734375, 10.1015625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 0.0, 14.0, 14.0, 13.0, 18.0, 33.0, 45.0, 57.0, 69.0, 99.0, 154.0, 252.0, 331.0, 452.0, 554.0, 561.0, 431.0, 274.0, 226.0, 144.0, 83.0, 63.0, 64.0, 34.0, 20.0, 25.0, 18.0, 10.0, 2.0, 4.0, 4.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.21875, -12.8048095703125, -12.390869140625, -11.9769287109375, -11.56298828125, -11.1490478515625, -10.735107421875, -10.3211669921875, -9.9072265625, -9.4932861328125, -9.079345703125, -8.6654052734375, -8.25146484375, -7.8375244140625, -7.423583984375, -7.0096435546875, -6.595703125, -6.1817626953125, -5.767822265625, -5.3538818359375, -4.93994140625, -4.5260009765625, -4.112060546875, -3.6981201171875, -3.2841796875, -2.8702392578125, -2.456298828125, -2.0423583984375, -1.62841796875, -1.2144775390625, -0.800537109375, -0.3865966796875, 0.02734375, 0.4412841796875, 0.855224609375, 1.2691650390625, 1.68310546875, 2.0970458984375, 2.510986328125, 2.9249267578125, 3.3388671875, 3.7528076171875, 4.166748046875, 4.5806884765625, 4.99462890625, 5.4085693359375, 5.822509765625, 6.2364501953125, 6.650390625, 7.0643310546875, 7.478271484375, 7.8922119140625, 8.30615234375, 8.7200927734375, 9.134033203125, 9.5479736328125, 9.9619140625, 10.3758544921875, 10.789794921875, 11.2037353515625, 11.61767578125, 12.0316162109375, 12.445556640625, 12.8594970703125, 13.2734375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 3.0, 7.0, 10.0, 14.0, 26.0, 28.0, 50.0, 62.0, 102.0, 173.0, 408.0, 1632.0, 8562.0, 90484.0, 3012391.0, 1034035.0, 39621.0, 4892.0, 1026.0, 321.0, 158.0, 102.0, 60.0, 37.0, 16.0, 32.0, 11.0, 11.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.1875, -38.9638671875, -37.740234375, -36.5166015625, -35.29296875, -34.0693359375, -32.845703125, -31.6220703125, -30.3984375, -29.1748046875, -27.951171875, -26.7275390625, -25.50390625, -24.2802734375, -23.056640625, -21.8330078125, -20.609375, -19.3857421875, -18.162109375, -16.9384765625, -15.71484375, -14.4912109375, -13.267578125, -12.0439453125, -10.8203125, -9.5966796875, -8.373046875, -7.1494140625, -5.92578125, -4.7021484375, -3.478515625, -2.2548828125, -1.03125, 0.1923828125, 1.416015625, 2.6396484375, 3.86328125, 5.0869140625, 6.310546875, 7.5341796875, 8.7578125, 9.9814453125, 11.205078125, 12.4287109375, 13.65234375, 14.8759765625, 16.099609375, 17.3232421875, 18.546875, 19.7705078125, 20.994140625, 22.2177734375, 23.44140625, 24.6650390625, 25.888671875, 27.1123046875, 28.3359375, 29.5595703125, 30.783203125, 32.0068359375, 33.23046875, 34.4541015625, 35.677734375, 36.9013671875, 38.125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 9.0, 19.0, 30.0, 69.0, 119.0, 165.0, 196.0, 174.0, 108.0, 68.0, 32.0, 12.0, 9.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.75459289550781, -99.37123107910156, -95.98786926269531, -92.60450744628906, -89.22114562988281, -85.83778381347656, -82.45442199707031, -79.07106018066406, -75.68769836425781, -72.30433654785156, -68.92097473144531, -65.53761291503906, -62.15425109863281, -58.77088928222656, -55.38752365112305, -52.0041618347168, -48.62079620361328, -45.23743438720703, -41.85407257080078, -38.47071075439453, -35.08734893798828, -31.7039852142334, -28.320621490478516, -24.937259674072266, -21.553897857666016, -18.170536041259766, -14.7871732711792, -11.403810501098633, -8.020448684692383, -4.637086868286133, -1.25372314453125, 2.129638671875, 5.512992858886719, 8.896354675292969, 12.279717445373535, 15.663080215454102, 19.04644203186035, 22.4298038482666, 25.813167572021484, 29.196529388427734, 32.579891204833984, 35.963253021240234, 39.346614837646484, 42.72998046875, 46.11334228515625, 49.4967041015625, 52.88006591796875, 56.263427734375, 59.64678955078125, 63.0301513671875, 66.41351318359375, 69.796875, 73.18023681640625, 76.5635986328125, 79.94696044921875, 83.330322265625, 86.71368408203125, 90.0970458984375, 93.48040771484375, 96.86376953125, 100.24713134765625, 103.6304931640625, 107.01385498046875, 110.397216796875, 113.78058624267578]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 4.0, 9.0, 2.0, 5.0, 5.0, 11.0, 15.0, 13.0, 16.0, 22.0, 24.0, 21.0, 28.0, 28.0, 38.0, 40.0, 29.0, 45.0, 44.0, 53.0, 38.0, 38.0, 53.0, 42.0, 38.0, 40.0, 39.0, 36.0, 30.0, 25.0, 25.0, 16.0, 20.0, 18.0, 15.0, 17.0, 10.0, 9.0, 14.0, 11.0, 7.0, 4.0, 3.0, 2.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.102073669433594, -34.95222091674805, -33.8023681640625, -32.65251922607422, -31.502666473388672, -30.352813720703125, -29.202960968017578, -28.053110122680664, -26.90325927734375, -25.753406524658203, -24.60355567932129, -23.453702926635742, -22.303852081298828, -21.15399932861328, -20.004146575927734, -18.85429573059082, -17.704442977905273, -16.554590225219727, -15.404739379882812, -14.254886627197266, -13.105035781860352, -11.955183029174805, -10.805331230163574, -9.655479431152344, -8.505627632141113, -7.355775833129883, -6.205924034118652, -5.056071758270264, -3.906219959259033, -2.7563681602478027, -1.606515884399414, -0.4566640853881836, 0.6931877136230469, 1.843039631843567, 2.992891550064087, 4.1427435874938965, 5.292595386505127, 6.442447185516357, 7.592299461364746, 8.742151260375977, 9.892003059387207, 11.041854858398438, 12.191706657409668, 13.341558456420898, 14.491411209106445, 15.64126205444336, 16.791114807128906, 17.940967559814453, 19.090818405151367, 20.240671157836914, 21.390522003173828, 22.540374755859375, 23.69022560119629, 24.840078353881836, 25.98992919921875, 27.139781951904297, 28.289634704589844, 29.43948745727539, 30.589338302612305, 31.73919105529785, 32.889041900634766, 34.03889465332031, 35.18874740600586, 36.338600158691406, 37.48844909667969]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 7.0, 4.0, 12.0, 4.0, 18.0, 16.0, 26.0, 17.0, 32.0, 34.0, 38.0, 33.0, 37.0, 44.0, 42.0, 40.0, 40.0, 62.0, 44.0, 47.0, 63.0, 34.0, 41.0, 40.0, 48.0, 36.0, 18.0, 22.0, 23.0, 17.0, 10.0, 6.0, 14.0, 9.0, 8.0, 5.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.24609375, -6.04815673828125, -5.8502197265625, -5.65228271484375, -5.454345703125, -5.25640869140625, -5.0584716796875, -4.86053466796875, -4.66259765625, -4.46466064453125, -4.2667236328125, -4.06878662109375, -3.870849609375, -3.67291259765625, -3.4749755859375, -3.27703857421875, -3.0791015625, -2.88116455078125, -2.6832275390625, -2.48529052734375, -2.287353515625, -2.08941650390625, -1.8914794921875, -1.69354248046875, -1.49560546875, -1.29766845703125, -1.0997314453125, -0.90179443359375, -0.703857421875, -0.50592041015625, -0.3079833984375, -0.11004638671875, 0.087890625, 0.28582763671875, 0.4837646484375, 0.68170166015625, 0.879638671875, 1.07757568359375, 1.2755126953125, 1.47344970703125, 1.67138671875, 1.86932373046875, 2.0672607421875, 2.26519775390625, 2.463134765625, 2.66107177734375, 2.8590087890625, 3.05694580078125, 3.2548828125, 3.45281982421875, 3.6507568359375, 3.84869384765625, 4.046630859375, 4.24456787109375, 4.4425048828125, 4.64044189453125, 4.83837890625, 5.03631591796875, 5.2342529296875, 5.43218994140625, 5.630126953125, 5.82806396484375, 6.0260009765625, 6.22393798828125, 6.421875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 8.0, 8.0, 16.0, 17.0, 21.0, 29.0, 29.0, 45.0, 58.0, 87.0, 107.0, 142.0, 243.0, 279.0, 436.0, 592.0, 954.0, 1369.0, 2285.0, 3900.0, 8101.0, 20157.0, 68555.0, 397990.0, 428968.0, 73784.0, 21228.0, 8404.0, 4019.0, 2294.0, 1409.0, 926.0, 608.0, 409.0, 277.0, 213.0, 166.0, 110.0, 83.0, 63.0, 32.0, 35.0, 27.0, 17.0, 17.0, 12.0, 13.0, 10.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.23046875, -6.02294921875, -5.8154296875, -5.60791015625, -5.400390625, -5.19287109375, -4.9853515625, -4.77783203125, -4.5703125, -4.36279296875, -4.1552734375, -3.94775390625, -3.740234375, -3.53271484375, -3.3251953125, -3.11767578125, -2.91015625, -2.70263671875, -2.4951171875, -2.28759765625, -2.080078125, -1.87255859375, -1.6650390625, -1.45751953125, -1.25, -1.04248046875, -0.8349609375, -0.62744140625, -0.419921875, -0.21240234375, -0.0048828125, 0.20263671875, 0.41015625, 0.61767578125, 0.8251953125, 1.03271484375, 1.240234375, 1.44775390625, 1.6552734375, 1.86279296875, 2.0703125, 2.27783203125, 2.4853515625, 2.69287109375, 2.900390625, 3.10791015625, 3.3154296875, 3.52294921875, 3.73046875, 3.93798828125, 4.1455078125, 4.35302734375, 4.560546875, 4.76806640625, 4.9755859375, 5.18310546875, 5.390625, 5.59814453125, 5.8056640625, 6.01318359375, 6.220703125, 6.42822265625, 6.6357421875, 6.84326171875, 7.05078125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 2.0, 7.0, 10.0, 3.0, 11.0, 10.0, 14.0, 11.0, 16.0, 20.0, 17.0, 22.0, 32.0, 24.0, 30.0, 29.0, 40.0, 43.0, 44.0, 33.0, 38.0, 37.0, 1067.0, 36.0, 24.0, 46.0, 34.0, 31.0, 34.0, 19.0, 28.0, 25.0, 35.0, 26.0, 15.0, 17.0, 12.0, 12.0, 7.0, 9.0, 9.0, 10.0, 6.0, 8.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.779296875, -3.662750244140625, -3.54620361328125, -3.429656982421875, -3.3131103515625, -3.196563720703125, -3.08001708984375, -2.963470458984375, -2.846923828125, -2.730377197265625, -2.61383056640625, -2.497283935546875, -2.3807373046875, -2.264190673828125, -2.14764404296875, -2.031097412109375, -1.91455078125, -1.798004150390625, -1.68145751953125, -1.564910888671875, -1.4483642578125, -1.331817626953125, -1.21527099609375, -1.098724365234375, -0.982177734375, -0.865631103515625, -0.74908447265625, -0.632537841796875, -0.5159912109375, -0.399444580078125, -0.28289794921875, -0.166351318359375, -0.0498046875, 0.066741943359375, 0.18328857421875, 0.299835205078125, 0.4163818359375, 0.532928466796875, 0.64947509765625, 0.766021728515625, 0.882568359375, 0.999114990234375, 1.11566162109375, 1.232208251953125, 1.3487548828125, 1.465301513671875, 1.58184814453125, 1.698394775390625, 1.81494140625, 1.931488037109375, 2.04803466796875, 2.164581298828125, 2.2811279296875, 2.397674560546875, 2.51422119140625, 2.630767822265625, 2.747314453125, 2.863861083984375, 2.98040771484375, 3.096954345703125, 3.2135009765625, 3.330047607421875, 3.44659423828125, 3.563140869140625, 3.6796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 12.0, 8.0, 10.0, 16.0, 31.0, 46.0, 47.0, 79.0, 91.0, 138.0, 172.0, 257.0, 356.0, 451.0, 707.0, 1000.0, 1399.0, 2308.0, 3566.0, 6069.0, 11945.0, 27056.0, 84743.0, 506680.0, 1236515.0, 139832.0, 37928.0, 15410.0, 7670.0, 4271.0, 2645.0, 1759.0, 1084.0, 805.0, 567.0, 383.0, 293.0, 222.0, 141.0, 118.0, 83.0, 55.0, 49.0, 39.0, 18.0, 12.0, 9.0, 11.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-3.416015625, -3.313018798828125, -3.21002197265625, -3.107025146484375, -3.0040283203125, -2.901031494140625, -2.79803466796875, -2.695037841796875, -2.592041015625, -2.489044189453125, -2.38604736328125, -2.283050537109375, -2.1800537109375, -2.077056884765625, -1.97406005859375, -1.871063232421875, -1.76806640625, -1.665069580078125, -1.56207275390625, -1.459075927734375, -1.3560791015625, -1.253082275390625, -1.15008544921875, -1.047088623046875, -0.944091796875, -0.841094970703125, -0.73809814453125, -0.635101318359375, -0.5321044921875, -0.429107666015625, -0.32611083984375, -0.223114013671875, -0.1201171875, -0.017120361328125, 0.08587646484375, 0.188873291015625, 0.2918701171875, 0.394866943359375, 0.49786376953125, 0.600860595703125, 0.703857421875, 0.806854248046875, 0.90985107421875, 1.012847900390625, 1.1158447265625, 1.218841552734375, 1.32183837890625, 1.424835205078125, 1.52783203125, 1.630828857421875, 1.73382568359375, 1.836822509765625, 1.9398193359375, 2.042816162109375, 2.14581298828125, 2.248809814453125, 2.351806640625, 2.454803466796875, 2.55780029296875, 2.660797119140625, 2.7637939453125, 2.866790771484375, 2.96978759765625, 3.072784423828125, 3.17578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 2.0, 3.0, 5.0, 4.0, 1.0, 9.0, 7.0, 13.0, 9.0, 7.0, 8.0, 8.0, 11.0, 13.0, 9.0, 19.0, 21.0, 46.0, 70.0, 130.0, 175.0, 109.0, 77.0, 56.0, 38.0, 23.0, 24.0, 11.0, 9.0, 15.0, 8.0, 9.0, 8.0, 6.0, 7.0, 6.0, 5.0, 3.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.7744140625, -0.7537765502929688, -0.7331390380859375, -0.7125015258789062, -0.691864013671875, -0.6712265014648438, -0.6505889892578125, -0.6299514770507812, -0.60931396484375, -0.5886764526367188, -0.5680389404296875, -0.5474014282226562, -0.526763916015625, -0.5061264038085938, -0.4854888916015625, -0.46485137939453125, -0.4442138671875, -0.42357635498046875, -0.4029388427734375, -0.38230133056640625, -0.361663818359375, -0.34102630615234375, -0.3203887939453125, -0.29975128173828125, -0.27911376953125, -0.25847625732421875, -0.2378387451171875, -0.21720123291015625, -0.196563720703125, -0.17592620849609375, -0.1552886962890625, -0.13465118408203125, -0.114013671875, -0.09337615966796875, -0.0727386474609375, -0.05210113525390625, -0.031463623046875, -0.01082611083984375, 0.0098114013671875, 0.03044891357421875, 0.05108642578125, 0.07172393798828125, 0.0923614501953125, 0.11299896240234375, 0.133636474609375, 0.15427398681640625, 0.1749114990234375, 0.19554901123046875, 0.2161865234375, 0.23682403564453125, 0.2574615478515625, 0.27809906005859375, 0.298736572265625, 0.31937408447265625, 0.3400115966796875, 0.36064910888671875, 0.38128662109375, 0.40192413330078125, 0.4225616455078125, 0.44319915771484375, 0.463836669921875, 0.48447418212890625, 0.5051116943359375, 0.5257492065429688, 0.54638671875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 4.0, 5.0, 6.0, 11.0, 6.0, 15.0, 10.0, 14.0, 23.0, 20.0, 30.0, 48.0, 63.0, 128.0, 322.0, 1284.0, 8941.0, 242241.0, 780575.0, 12461.0, 1568.0, 358.0, 137.0, 78.0, 49.0, 30.0, 21.0, 21.0, 12.0, 18.0, 14.0, 8.0, 6.0, 3.0, 1.0, 4.0, 3.0, 7.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.765625, -10.367919921875, -9.97021484375, -9.572509765625, -9.1748046875, -8.777099609375, -8.37939453125, -7.981689453125, -7.583984375, -7.186279296875, -6.78857421875, -6.390869140625, -5.9931640625, -5.595458984375, -5.19775390625, -4.800048828125, -4.40234375, -4.004638671875, -3.60693359375, -3.209228515625, -2.8115234375, -2.413818359375, -2.01611328125, -1.618408203125, -1.220703125, -0.822998046875, -0.42529296875, -0.027587890625, 0.3701171875, 0.767822265625, 1.16552734375, 1.563232421875, 1.9609375, 2.358642578125, 2.75634765625, 3.154052734375, 3.5517578125, 3.949462890625, 4.34716796875, 4.744873046875, 5.142578125, 5.540283203125, 5.93798828125, 6.335693359375, 6.7333984375, 7.131103515625, 7.52880859375, 7.926513671875, 8.32421875, 8.721923828125, 9.11962890625, 9.517333984375, 9.9150390625, 10.312744140625, 10.71044921875, 11.108154296875, 11.505859375, 11.903564453125, 12.30126953125, 12.698974609375, 13.0966796875, 13.494384765625, 13.89208984375, 14.289794921875, 14.6875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 5.0, 4.0, 10.0, 14.0, 34.0, 53.0, 109.0, 128.0, 168.0, 143.0, 123.0, 91.0, 56.0, 26.0, 23.0, 11.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3336033821105957, -2.281318426132202, -2.2290334701538086, -2.176748752593994, -2.1244637966156006, -2.072178840637207, -2.0198941230773926, -1.967609167098999, -1.9153242111206055, -1.863039255142212, -1.810754418373108, -1.758469581604004, -1.7061846256256104, -1.6538996696472168, -1.6016148328781128, -1.5493299961090088, -1.4970450401306152, -1.4447600841522217, -1.3924752473831177, -1.3401904106140137, -1.2879054546356201, -1.2356204986572266, -1.1833356618881226, -1.1310508251190186, -1.078765869140625, -1.0264809131622314, -0.9741960763931274, -0.9219111800193787, -0.8696262836456299, -0.8173413872718811, -0.7650564908981323, -0.7127715945243835, -0.6604868173599243, -0.6082019209861755, -0.5559170246124268, -0.503632128238678, -0.4513472318649292, -0.3990623354911804, -0.34677743911743164, -0.29449254274368286, -0.24220764636993408, -0.1899227499961853, -0.13763785362243652, -0.08535295724868774, -0.033068060874938965, 0.019216835498809814, 0.0715017318725586, 0.12378662824630737, 0.17607152462005615, 0.22835642099380493, 0.2806413173675537, 0.3329262137413025, 0.38521111011505127, 0.43749600648880005, 0.48978090286254883, 0.5420657992362976, 0.5943506956100464, 0.6466355919837952, 0.698920488357544, 0.7512053847312927, 0.8034902811050415, 0.8557751774787903, 0.9080600738525391, 0.9603449702262878, 1.0126298666000366]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 4.0, 6.0, 6.0, 5.0, 16.0, 16.0, 8.0, 13.0, 14.0, 16.0, 24.0, 26.0, 33.0, 22.0, 27.0, 29.0, 32.0, 39.0, 49.0, 41.0, 45.0, 54.0, 42.0, 36.0, 38.0, 45.0, 42.0, 38.0, 25.0, 29.0, 21.0, 21.0, 28.0, 22.0, 18.0, 12.0, 11.0, 3.0, 5.0, 13.0, 3.0, 4.0, 6.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42885005474090576, -0.4134022295475006, -0.39795440435409546, -0.3825065791606903, -0.36705875396728516, -0.35161092877388, -0.33616310358047485, -0.3207152783870697, -0.30526745319366455, -0.2898196280002594, -0.27437180280685425, -0.2589239776134491, -0.24347615242004395, -0.2280283272266388, -0.21258050203323364, -0.1971326768398285, -0.18168485164642334, -0.1662370264530182, -0.15078920125961304, -0.13534137606620789, -0.11989355087280273, -0.10444572567939758, -0.08899790048599243, -0.07355007529258728, -0.05810225009918213, -0.04265442490577698, -0.027206599712371826, -0.011758774518966675, 0.0036890506744384766, 0.019136875867843628, 0.03458470106124878, 0.05003252625465393, 0.06548035144805908, 0.08092817664146423, 0.09637600183486938, 0.11182382702827454, 0.1272716522216797, 0.14271947741508484, 0.15816730260849, 0.17361512780189514, 0.1890629529953003, 0.20451077818870544, 0.2199586033821106, 0.23540642857551575, 0.2508542537689209, 0.26630207896232605, 0.2817499041557312, 0.29719772934913635, 0.3126455545425415, 0.32809337973594666, 0.3435412049293518, 0.35898903012275696, 0.3744368553161621, 0.38988468050956726, 0.4053325057029724, 0.42078033089637756, 0.4362281560897827, 0.45167598128318787, 0.467123806476593, 0.48257163166999817, 0.4980194568634033, 0.5134673118591309, 0.5289151072502136, 0.5443629026412964, 0.5598107576370239]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 6.0, 4.0, 5.0, 8.0, 6.0, 13.0, 16.0, 9.0, 13.0, 22.0, 20.0, 23.0, 26.0, 32.0, 29.0, 36.0, 31.0, 40.0, 31.0, 32.0, 41.0, 41.0, 42.0, 51.0, 39.0, 43.0, 50.0, 24.0, 31.0, 34.0, 32.0, 28.0, 26.0, 15.0, 20.0, 11.0, 14.0, 14.0, 12.0, 6.0, 4.0, 6.0, 4.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.828125, -5.65692138671875, -5.4857177734375, -5.31451416015625, -5.143310546875, -4.97210693359375, -4.8009033203125, -4.62969970703125, -4.45849609375, -4.28729248046875, -4.1160888671875, -3.94488525390625, -3.773681640625, -3.60247802734375, -3.4312744140625, -3.26007080078125, -3.0888671875, -2.91766357421875, -2.7464599609375, -2.57525634765625, -2.404052734375, -2.23284912109375, -2.0616455078125, -1.89044189453125, -1.71923828125, -1.54803466796875, -1.3768310546875, -1.20562744140625, -1.034423828125, -0.86322021484375, -0.6920166015625, -0.52081298828125, -0.349609375, -0.17840576171875, -0.0072021484375, 0.16400146484375, 0.335205078125, 0.50640869140625, 0.6776123046875, 0.84881591796875, 1.02001953125, 1.19122314453125, 1.3624267578125, 1.53363037109375, 1.704833984375, 1.87603759765625, 2.0472412109375, 2.21844482421875, 2.3896484375, 2.56085205078125, 2.7320556640625, 2.90325927734375, 3.074462890625, 3.24566650390625, 3.4168701171875, 3.58807373046875, 3.75927734375, 3.93048095703125, 4.1016845703125, 4.27288818359375, 4.444091796875, 4.61529541015625, 4.7864990234375, 4.95770263671875, 5.12890625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 2.0, 15.0, 17.0, 16.0, 17.0, 38.0, 45.0, 71.0, 116.0, 132.0, 186.0, 328.0, 420.0, 632.0, 975.0, 1677.0, 2820.0, 5292.0, 11934.0, 31929.0, 99938.0, 385844.0, 357755.0, 94406.0, 30368.0, 11306.0, 5064.0, 2711.0, 1549.0, 987.0, 667.0, 416.0, 261.0, 158.0, 154.0, 84.0, 63.0, 41.0, 32.0, 22.0, 26.0, 9.0, 14.0, 6.0, 10.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.140625, -9.813232421875, -9.48583984375, -9.158447265625, -8.8310546875, -8.503662109375, -8.17626953125, -7.848876953125, -7.521484375, -7.194091796875, -6.86669921875, -6.539306640625, -6.2119140625, -5.884521484375, -5.55712890625, -5.229736328125, -4.90234375, -4.574951171875, -4.24755859375, -3.920166015625, -3.5927734375, -3.265380859375, -2.93798828125, -2.610595703125, -2.283203125, -1.955810546875, -1.62841796875, -1.301025390625, -0.9736328125, -0.646240234375, -0.31884765625, 0.008544921875, 0.3359375, 0.663330078125, 0.99072265625, 1.318115234375, 1.6455078125, 1.972900390625, 2.30029296875, 2.627685546875, 2.955078125, 3.282470703125, 3.60986328125, 3.937255859375, 4.2646484375, 4.592041015625, 4.91943359375, 5.246826171875, 5.57421875, 5.901611328125, 6.22900390625, 6.556396484375, 6.8837890625, 7.211181640625, 7.53857421875, 7.865966796875, 8.193359375, 8.520751953125, 8.84814453125, 9.175537109375, 9.5029296875, 9.830322265625, 10.15771484375, 10.485107421875, 10.8125]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 3.0, 9.0, 17.0, 8.0, 15.0, 18.0, 18.0, 25.0, 24.0, 21.0, 28.0, 36.0, 33.0, 41.0, 54.0, 73.0, 114.0, 232.0, 1397.0, 249.0, 137.0, 90.0, 64.0, 58.0, 40.0, 36.0, 26.0, 19.0, 24.0, 25.0, 29.0, 17.0, 7.0, 18.0, 5.0, 9.0, 3.0, 5.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8984375, -15.3795166015625, -14.860595703125, -14.3416748046875, -13.82275390625, -13.3038330078125, -12.784912109375, -12.2659912109375, -11.7470703125, -11.2281494140625, -10.709228515625, -10.1903076171875, -9.67138671875, -9.1524658203125, -8.633544921875, -8.1146240234375, -7.595703125, -7.0767822265625, -6.557861328125, -6.0389404296875, -5.52001953125, -5.0010986328125, -4.482177734375, -3.9632568359375, -3.4443359375, -2.9254150390625, -2.406494140625, -1.8875732421875, -1.36865234375, -0.8497314453125, -0.330810546875, 0.1881103515625, 0.70703125, 1.2259521484375, 1.744873046875, 2.2637939453125, 2.78271484375, 3.3016357421875, 3.820556640625, 4.3394775390625, 4.8583984375, 5.3773193359375, 5.896240234375, 6.4151611328125, 6.93408203125, 7.4530029296875, 7.971923828125, 8.4908447265625, 9.009765625, 9.5286865234375, 10.047607421875, 10.5665283203125, 11.08544921875, 11.6043701171875, 12.123291015625, 12.6422119140625, 13.1611328125, 13.6800537109375, 14.198974609375, 14.7178955078125, 15.23681640625, 15.7557373046875, 16.274658203125, 16.7935791015625, 17.3125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 11.0, 15.0, 18.0, 25.0, 29.0, 37.0, 41.0, 70.0, 97.0, 126.0, 192.0, 313.0, 584.0, 1456.0, 5851.0, 73373.0, 2912303.0, 140129.0, 7582.0, 1737.0, 638.0, 330.0, 240.0, 120.0, 93.0, 62.0, 62.0, 29.0, 38.0, 25.0, 19.0, 13.0, 11.0, 6.0, 6.0, 5.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.84375, -35.638671875, -34.43359375, -33.228515625, -32.0234375, -30.818359375, -29.61328125, -28.408203125, -27.203125, -25.998046875, -24.79296875, -23.587890625, -22.3828125, -21.177734375, -19.97265625, -18.767578125, -17.5625, -16.357421875, -15.15234375, -13.947265625, -12.7421875, -11.537109375, -10.33203125, -9.126953125, -7.921875, -6.716796875, -5.51171875, -4.306640625, -3.1015625, -1.896484375, -0.69140625, 0.513671875, 1.71875, 2.923828125, 4.12890625, 5.333984375, 6.5390625, 7.744140625, 8.94921875, 10.154296875, 11.359375, 12.564453125, 13.76953125, 14.974609375, 16.1796875, 17.384765625, 18.58984375, 19.794921875, 21.0, 22.205078125, 23.41015625, 24.615234375, 25.8203125, 27.025390625, 28.23046875, 29.435546875, 30.640625, 31.845703125, 33.05078125, 34.255859375, 35.4609375, 36.666015625, 37.87109375, 39.076171875, 40.28125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 513.0, 491.0, 8.0, 1.0], "bins": [-578.274169921875, -568.7924194335938, -559.3106689453125, -549.8289184570312, -540.34716796875, -530.8654174804688, -521.3836669921875, -511.90191650390625, -502.420166015625, -492.93841552734375, -483.4566650390625, -473.97491455078125, -464.4931640625, -455.01141357421875, -445.5296630859375, -436.04791259765625, -426.5661926269531, -417.0844421386719, -407.6026916503906, -398.1209411621094, -388.6391906738281, -379.1574401855469, -369.6756896972656, -360.1939697265625, -350.71221923828125, -341.23046875, -331.74871826171875, -322.2669677734375, -312.78521728515625, -303.303466796875, -293.82171630859375, -284.3399658203125, -274.85821533203125, -265.37646484375, -255.89471435546875, -246.4129638671875, -236.93121337890625, -227.449462890625, -217.9677276611328, -208.48597717285156, -199.00421142578125, -189.5224609375, -180.04071044921875, -170.5589599609375, -161.07720947265625, -151.595458984375, -142.1137237548828, -132.63197326660156, -123.15022277832031, -113.66847229003906, -104.18672180175781, -94.7049789428711, -85.22322845458984, -75.7414779663086, -66.25973510742188, -56.777984619140625, -47.29623794555664, -37.814491271972656, -28.332740783691406, -18.85099220275879, -9.369243621826172, 0.11250686645507812, 9.594253540039062, 19.076000213623047, 28.557750701904297]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 0.0, 5.0, 8.0, 7.0, 11.0, 11.0, 16.0, 12.0, 10.0, 12.0, 20.0, 11.0, 29.0, 32.0, 25.0, 33.0, 40.0, 22.0, 37.0, 44.0, 24.0, 39.0, 43.0, 42.0, 38.0, 36.0, 46.0, 35.0, 43.0, 34.0, 31.0, 29.0, 14.0, 24.0, 14.0, 16.0, 21.0, 24.0, 8.0, 10.0, 6.0, 12.0, 7.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-43.606597900390625, -42.325836181640625, -41.045074462890625, -39.764312744140625, -38.483551025390625, -37.202789306640625, -35.922027587890625, -34.641265869140625, -33.360504150390625, -32.079742431640625, -30.798980712890625, -29.518218994140625, -28.237457275390625, -26.956695556640625, -25.675933837890625, -24.395172119140625, -23.114410400390625, -21.833648681640625, -20.552886962890625, -19.272125244140625, -17.991363525390625, -16.710601806640625, -15.429840087890625, -14.149078369140625, -12.868316650390625, -11.587554931640625, -10.306793212890625, -9.026031494140625, -7.745269775390625, -6.464508056640625, -5.183746337890625, -3.902984619140625, -2.622222900390625, -1.341461181640625, -0.060699462890625, 1.220062255859375, 2.500823974609375, 3.781585693359375, 5.062347412109375, 6.343109130859375, 7.623870849609375, 8.904632568359375, 10.185394287109375, 11.466156005859375, 12.746917724609375, 14.027679443359375, 15.308441162109375, 16.589202880859375, 17.869964599609375, 19.150726318359375, 20.431488037109375, 21.712249755859375, 22.993011474609375, 24.273773193359375, 25.554534912109375, 26.835296630859375, 28.116058349609375, 29.396820068359375, 30.677581787109375, 31.958343505859375, 33.239105224609375, 34.519866943359375, 35.800628662109375, 37.081390380859375, 38.362152099609375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 4.0, 8.0, 4.0, 15.0, 11.0, 19.0, 17.0, 13.0, 17.0, 25.0, 32.0, 25.0, 29.0, 24.0, 31.0, 31.0, 36.0, 40.0, 43.0, 41.0, 51.0, 43.0, 41.0, 33.0, 32.0, 30.0, 50.0, 36.0, 21.0, 31.0, 26.0, 21.0, 20.0, 16.0, 12.0, 13.0, 15.0, 6.0, 12.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.46484375, -5.28973388671875, -5.1146240234375, -4.93951416015625, -4.764404296875, -4.58929443359375, -4.4141845703125, -4.23907470703125, -4.06396484375, -3.88885498046875, -3.7137451171875, -3.53863525390625, -3.363525390625, -3.18841552734375, -3.0133056640625, -2.83819580078125, -2.6630859375, -2.48797607421875, -2.3128662109375, -2.13775634765625, -1.962646484375, -1.78753662109375, -1.6124267578125, -1.43731689453125, -1.26220703125, -1.08709716796875, -0.9119873046875, -0.73687744140625, -0.561767578125, -0.38665771484375, -0.2115478515625, -0.03643798828125, 0.138671875, 0.31378173828125, 0.4888916015625, 0.66400146484375, 0.839111328125, 1.01422119140625, 1.1893310546875, 1.36444091796875, 1.53955078125, 1.71466064453125, 1.8897705078125, 2.06488037109375, 2.239990234375, 2.41510009765625, 2.5902099609375, 2.76531982421875, 2.9404296875, 3.11553955078125, 3.2906494140625, 3.46575927734375, 3.640869140625, 3.81597900390625, 3.9910888671875, 4.16619873046875, 4.34130859375, 4.51641845703125, 4.6915283203125, 4.86663818359375, 5.041748046875, 5.21685791015625, 5.3919677734375, 5.56707763671875, 5.7421875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 8.0, 5.0, 8.0, 12.0, 12.0, 23.0, 33.0, 39.0, 66.0, 87.0, 130.0, 166.0, 259.0, 359.0, 611.0, 972.0, 1434.0, 2417.0, 4185.0, 7590.0, 15753.0, 35752.0, 101854.0, 381119.0, 1350538.0, 1576832.0, 498879.0, 129967.0, 44765.0, 18887.0, 9258.0, 4997.0, 2819.0, 1630.0, 976.0, 630.0, 397.0, 264.0, 167.0, 122.0, 101.0, 52.0, 31.0, 26.0, 15.0, 15.0, 7.0, 11.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.5703125, -9.2896728515625, -9.009033203125, -8.7283935546875, -8.44775390625, -8.1671142578125, -7.886474609375, -7.6058349609375, -7.3251953125, -7.0445556640625, -6.763916015625, -6.4832763671875, -6.20263671875, -5.9219970703125, -5.641357421875, -5.3607177734375, -5.080078125, -4.7994384765625, -4.518798828125, -4.2381591796875, -3.95751953125, -3.6768798828125, -3.396240234375, -3.1156005859375, -2.8349609375, -2.5543212890625, -2.273681640625, -1.9930419921875, -1.71240234375, -1.4317626953125, -1.151123046875, -0.8704833984375, -0.58984375, -0.3092041015625, -0.028564453125, 0.2520751953125, 0.53271484375, 0.8133544921875, 1.093994140625, 1.3746337890625, 1.6552734375, 1.9359130859375, 2.216552734375, 2.4971923828125, 2.77783203125, 3.0584716796875, 3.339111328125, 3.6197509765625, 3.900390625, 4.1810302734375, 4.461669921875, 4.7423095703125, 5.02294921875, 5.3035888671875, 5.584228515625, 5.8648681640625, 6.1455078125, 6.4261474609375, 6.706787109375, 6.9874267578125, 7.26806640625, 7.5487060546875, 7.829345703125, 8.1099853515625, 8.390625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 12.0, 5.0, 7.0, 16.0, 25.0, 29.0, 51.0, 72.0, 94.0, 158.0, 222.0, 355.0, 515.0, 659.0, 613.0, 429.0, 285.0, 184.0, 119.0, 75.0, 54.0, 35.0, 21.0, 14.0, 14.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.953125, -14.467041015625, -13.98095703125, -13.494873046875, -13.0087890625, -12.522705078125, -12.03662109375, -11.550537109375, -11.064453125, -10.578369140625, -10.09228515625, -9.606201171875, -9.1201171875, -8.634033203125, -8.14794921875, -7.661865234375, -7.17578125, -6.689697265625, -6.20361328125, -5.717529296875, -5.2314453125, -4.745361328125, -4.25927734375, -3.773193359375, -3.287109375, -2.801025390625, -2.31494140625, -1.828857421875, -1.3427734375, -0.856689453125, -0.37060546875, 0.115478515625, 0.6015625, 1.087646484375, 1.57373046875, 2.059814453125, 2.5458984375, 3.031982421875, 3.51806640625, 4.004150390625, 4.490234375, 4.976318359375, 5.46240234375, 5.948486328125, 6.4345703125, 6.920654296875, 7.40673828125, 7.892822265625, 8.37890625, 8.864990234375, 9.35107421875, 9.837158203125, 10.3232421875, 10.809326171875, 11.29541015625, 11.781494140625, 12.267578125, 12.753662109375, 13.23974609375, 13.725830078125, 14.2119140625, 14.697998046875, 15.18408203125, 15.670166015625, 16.15625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 8.0, 12.0, 14.0, 22.0, 27.0, 60.0, 94.0, 142.0, 299.0, 761.0, 7137.0, 665801.0, 3495636.0, 22068.0, 1294.0, 428.0, 169.0, 92.0, 77.0, 53.0, 36.0, 13.0, 16.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.875, -71.83203125, -69.7890625, -67.74609375, -65.703125, -63.66015625, -61.6171875, -59.57421875, -57.53125, -55.48828125, -53.4453125, -51.40234375, -49.359375, -47.31640625, -45.2734375, -43.23046875, -41.1875, -39.14453125, -37.1015625, -35.05859375, -33.015625, -30.97265625, -28.9296875, -26.88671875, -24.84375, -22.80078125, -20.7578125, -18.71484375, -16.671875, -14.62890625, -12.5859375, -10.54296875, -8.5, -6.45703125, -4.4140625, -2.37109375, -0.328125, 1.71484375, 3.7578125, 5.80078125, 7.84375, 9.88671875, 11.9296875, 13.97265625, 16.015625, 18.05859375, 20.1015625, 22.14453125, 24.1875, 26.23046875, 28.2734375, 30.31640625, 32.359375, 34.40234375, 36.4453125, 38.48828125, 40.53125, 42.57421875, 44.6171875, 46.66015625, 48.703125, 50.74609375, 52.7890625, 54.83203125, 56.875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 6.0, 18.0, 35.0, 57.0, 123.0, 183.0, 206.0, 180.0, 103.0, 59.0, 30.0, 8.0, 4.0, 3.0, 1.0], "bins": [-200.24513244628906, -196.63206481933594, -193.0189971923828, -189.40591430664062, -185.7928466796875, -182.17977905273438, -178.56671142578125, -174.95364379882812, -171.340576171875, -167.72750854492188, -164.11444091796875, -160.50137329101562, -156.88829040527344, -153.2752227783203, -149.6621551513672, -146.04908752441406, -142.43600463867188, -138.82293701171875, -135.20986938476562, -131.5968017578125, -127.98372650146484, -124.37065124511719, -120.75758361816406, -117.14451599121094, -113.53144836425781, -109.91838073730469, -106.30530548095703, -102.6922378540039, -99.07917022705078, -95.46609497070312, -91.85302734375, -88.23995971679688, -84.62688446044922, -81.0138168334961, -77.40074157714844, -73.78767395019531, -70.17460632324219, -66.56153106689453, -62.948463439941406, -59.335391998291016, -55.722320556640625, -52.109249114990234, -48.49618148803711, -44.88311004638672, -41.27003860473633, -37.65696716308594, -34.04389953613281, -30.430828094482422, -26.817760467529297, -23.20469093322754, -19.59161949157715, -15.97854995727539, -12.365479469299316, -8.752408981323242, -5.139339447021484, -1.5262680053710938, 2.086801528930664, 5.699872016906738, 9.312942504882812, 12.92601203918457, 16.539081573486328, 20.15215301513672, 23.765222549438477, 27.378293991088867, 30.991363525390625]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 7.0, 2.0, 6.0, 8.0, 11.0, 13.0, 20.0, 12.0, 15.0, 21.0, 23.0, 37.0, 31.0, 29.0, 19.0, 31.0, 34.0, 43.0, 49.0, 42.0, 32.0, 36.0, 32.0, 39.0, 43.0, 33.0, 35.0, 35.0, 32.0, 21.0, 24.0, 28.0, 15.0, 21.0, 16.0, 22.0, 15.0, 16.0, 7.0, 6.0, 9.0, 5.0, 7.0, 6.0, 4.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-38.01980209350586, -36.915428161621094, -35.811058044433594, -34.70668411254883, -33.60231018066406, -32.49794006347656, -31.393566131591797, -30.289194107055664, -29.18482208251953, -28.0804500579834, -26.976078033447266, -25.8717041015625, -24.767332077026367, -23.662960052490234, -22.55858612060547, -21.454214096069336, -20.349842071533203, -19.24547004699707, -18.141098022460938, -17.036724090576172, -15.932352066040039, -14.827980041503906, -13.723607063293457, -12.619234085083008, -11.514862060546875, -10.410490036010742, -9.306117057800293, -8.201744079589844, -7.097372055053711, -5.99299955368042, -4.888627052307129, -3.784254550933838, -2.6798782348632812, -1.5755057334899902, -0.4711332321166992, 0.6332392692565918, 1.7376117706298828, 2.841984272003174, 3.946356773376465, 5.050729274749756, 6.155101776123047, 7.259474277496338, 8.363846778869629, 9.468219757080078, 10.572591781616211, 11.676963806152344, 12.781336784362793, 13.885709762573242, 14.990081787109375, 16.094453811645508, 17.19882583618164, 18.303199768066406, 19.40757179260254, 20.511943817138672, 21.616317749023438, 22.72068977355957, 23.825061798095703, 24.929433822631836, 26.03380584716797, 27.138179779052734, 28.242551803588867, 29.346923828125, 30.451297760009766, 31.5556697845459, 32.66004180908203]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 11.0, 12.0, 11.0, 16.0, 18.0, 19.0, 27.0, 19.0, 36.0, 33.0, 42.0, 28.0, 33.0, 43.0, 45.0, 49.0, 49.0, 48.0, 38.0, 37.0, 33.0, 49.0, 51.0, 29.0, 30.0, 20.0, 19.0, 22.0, 22.0, 15.0, 14.0, 15.0, 9.0, 1.0, 7.0, 9.0, 5.0, 6.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.41796875, -6.232177734375, -6.04638671875, -5.860595703125, -5.6748046875, -5.489013671875, -5.30322265625, -5.117431640625, -4.931640625, -4.745849609375, -4.56005859375, -4.374267578125, -4.1884765625, -4.002685546875, -3.81689453125, -3.631103515625, -3.4453125, -3.259521484375, -3.07373046875, -2.887939453125, -2.7021484375, -2.516357421875, -2.33056640625, -2.144775390625, -1.958984375, -1.773193359375, -1.58740234375, -1.401611328125, -1.2158203125, -1.030029296875, -0.84423828125, -0.658447265625, -0.47265625, -0.286865234375, -0.10107421875, 0.084716796875, 0.2705078125, 0.456298828125, 0.64208984375, 0.827880859375, 1.013671875, 1.199462890625, 1.38525390625, 1.571044921875, 1.7568359375, 1.942626953125, 2.12841796875, 2.314208984375, 2.5, 2.685791015625, 2.87158203125, 3.057373046875, 3.2431640625, 3.428955078125, 3.61474609375, 3.800537109375, 3.986328125, 4.172119140625, 4.35791015625, 4.543701171875, 4.7294921875, 4.915283203125, 5.10107421875, 5.286865234375, 5.47265625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 9.0, 22.0, 26.0, 29.0, 36.0, 71.0, 104.0, 176.0, 300.0, 471.0, 738.0, 1213.0, 1999.0, 3244.0, 5794.0, 11592.0, 30421.0, 140933.0, 591391.0, 194036.0, 37073.0, 13260.0, 6356.0, 3561.0, 2121.0, 1354.0, 853.0, 510.0, 292.0, 218.0, 129.0, 75.0, 61.0, 38.0, 13.0, 16.0, 7.0, 4.0, 4.0, 2.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.66015625, -5.43890380859375, -5.2176513671875, -4.99639892578125, -4.775146484375, -4.55389404296875, -4.3326416015625, -4.11138916015625, -3.89013671875, -3.66888427734375, -3.4476318359375, -3.22637939453125, -3.005126953125, -2.78387451171875, -2.5626220703125, -2.34136962890625, -2.1201171875, -1.89886474609375, -1.6776123046875, -1.45635986328125, -1.235107421875, -1.01385498046875, -0.7926025390625, -0.57135009765625, -0.35009765625, -0.12884521484375, 0.0924072265625, 0.31365966796875, 0.534912109375, 0.75616455078125, 0.9774169921875, 1.19866943359375, 1.419921875, 1.64117431640625, 1.8624267578125, 2.08367919921875, 2.304931640625, 2.52618408203125, 2.7474365234375, 2.96868896484375, 3.18994140625, 3.41119384765625, 3.6324462890625, 3.85369873046875, 4.074951171875, 4.29620361328125, 4.5174560546875, 4.73870849609375, 4.9599609375, 5.18121337890625, 5.4024658203125, 5.62371826171875, 5.844970703125, 6.06622314453125, 6.2874755859375, 6.50872802734375, 6.72998046875, 6.95123291015625, 7.1724853515625, 7.39373779296875, 7.614990234375, 7.83624267578125, 8.0574951171875, 8.27874755859375, 8.5]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 9.0, 5.0, 18.0, 5.0, 10.0, 14.0, 18.0, 21.0, 17.0, 20.0, 33.0, 33.0, 30.0, 42.0, 37.0, 41.0, 45.0, 33.0, 33.0, 1059.0, 43.0, 40.0, 38.0, 38.0, 35.0, 34.0, 31.0, 31.0, 26.0, 23.0, 27.0, 22.0, 14.0, 20.0, 15.0, 12.0, 8.0, 4.0, 6.0, 8.0, 1.0, 5.0, 8.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 4.0], "bins": [-3.966796875, -3.847412109375, -3.72802734375, -3.608642578125, -3.4892578125, -3.369873046875, -3.25048828125, -3.131103515625, -3.01171875, -2.892333984375, -2.77294921875, -2.653564453125, -2.5341796875, -2.414794921875, -2.29541015625, -2.176025390625, -2.056640625, -1.937255859375, -1.81787109375, -1.698486328125, -1.5791015625, -1.459716796875, -1.34033203125, -1.220947265625, -1.1015625, -0.982177734375, -0.86279296875, -0.743408203125, -0.6240234375, -0.504638671875, -0.38525390625, -0.265869140625, -0.146484375, -0.027099609375, 0.09228515625, 0.211669921875, 0.3310546875, 0.450439453125, 0.56982421875, 0.689208984375, 0.80859375, 0.927978515625, 1.04736328125, 1.166748046875, 1.2861328125, 1.405517578125, 1.52490234375, 1.644287109375, 1.763671875, 1.883056640625, 2.00244140625, 2.121826171875, 2.2412109375, 2.360595703125, 2.47998046875, 2.599365234375, 2.71875, 2.838134765625, 2.95751953125, 3.076904296875, 3.1962890625, 3.315673828125, 3.43505859375, 3.554443359375, 3.673828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 13.0, 9.0, 10.0, 27.0, 37.0, 44.0, 60.0, 92.0, 117.0, 177.0, 270.0, 442.0, 666.0, 947.0, 1631.0, 2642.0, 4752.0, 8975.0, 19724.0, 57572.0, 314483.0, 1437067.0, 174214.0, 40187.0, 15439.0, 7323.0, 3916.0, 2342.0, 1328.0, 874.0, 617.0, 364.0, 242.0, 152.0, 123.0, 77.0, 55.0, 39.0, 27.0, 22.0, 10.0, 8.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.578125, -3.45623779296875, -3.3343505859375, -3.21246337890625, -3.090576171875, -2.96868896484375, -2.8468017578125, -2.72491455078125, -2.60302734375, -2.48114013671875, -2.3592529296875, -2.23736572265625, -2.115478515625, -1.99359130859375, -1.8717041015625, -1.74981689453125, -1.6279296875, -1.50604248046875, -1.3841552734375, -1.26226806640625, -1.140380859375, -1.01849365234375, -0.8966064453125, -0.77471923828125, -0.65283203125, -0.53094482421875, -0.4090576171875, -0.28717041015625, -0.165283203125, -0.04339599609375, 0.0784912109375, 0.20037841796875, 0.322265625, 0.44415283203125, 0.5660400390625, 0.68792724609375, 0.809814453125, 0.93170166015625, 1.0535888671875, 1.17547607421875, 1.29736328125, 1.41925048828125, 1.5411376953125, 1.66302490234375, 1.784912109375, 1.90679931640625, 2.0286865234375, 2.15057373046875, 2.2724609375, 2.39434814453125, 2.5162353515625, 2.63812255859375, 2.760009765625, 2.88189697265625, 3.0037841796875, 3.12567138671875, 3.24755859375, 3.36944580078125, 3.4913330078125, 3.61322021484375, 3.735107421875, 3.85699462890625, 3.9788818359375, 4.10076904296875, 4.22265625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 5.0, 8.0, 14.0, 29.0, 46.0, 76.0, 150.0, 212.0, 170.0, 121.0, 57.0, 39.0, 18.0, 5.0, 7.0, 7.0, 6.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1572265625, -1.116943359375, -1.07666015625, -1.036376953125, -0.99609375, -0.955810546875, -0.91552734375, -0.875244140625, -0.8349609375, -0.794677734375, -0.75439453125, -0.714111328125, -0.673828125, -0.633544921875, -0.59326171875, -0.552978515625, -0.5126953125, -0.472412109375, -0.43212890625, -0.391845703125, -0.3515625, -0.311279296875, -0.27099609375, -0.230712890625, -0.1904296875, -0.150146484375, -0.10986328125, -0.069580078125, -0.029296875, 0.010986328125, 0.05126953125, 0.091552734375, 0.1318359375, 0.172119140625, 0.21240234375, 0.252685546875, 0.29296875, 0.333251953125, 0.37353515625, 0.413818359375, 0.4541015625, 0.494384765625, 0.53466796875, 0.574951171875, 0.615234375, 0.655517578125, 0.69580078125, 0.736083984375, 0.7763671875, 0.816650390625, 0.85693359375, 0.897216796875, 0.9375, 0.977783203125, 1.01806640625, 1.058349609375, 1.0986328125, 1.138916015625, 1.17919921875, 1.219482421875, 1.259765625, 1.300048828125, 1.34033203125, 1.380615234375, 1.4208984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 6.0, 1.0, 5.0, 2.0, 9.0, 8.0, 11.0, 13.0, 47.0, 76.0, 113.0, 567.0, 11898.0, 1016460.0, 18279.0, 746.0, 149.0, 71.0, 46.0, 11.0, 14.0, 7.0, 5.0, 3.0, 4.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.5625, -26.787353515625, -26.01220703125, -25.237060546875, -24.4619140625, -23.686767578125, -22.91162109375, -22.136474609375, -21.361328125, -20.586181640625, -19.81103515625, -19.035888671875, -18.2607421875, -17.485595703125, -16.71044921875, -15.935302734375, -15.16015625, -14.385009765625, -13.60986328125, -12.834716796875, -12.0595703125, -11.284423828125, -10.50927734375, -9.734130859375, -8.958984375, -8.183837890625, -7.40869140625, -6.633544921875, -5.8583984375, -5.083251953125, -4.30810546875, -3.532958984375, -2.7578125, -1.982666015625, -1.20751953125, -0.432373046875, 0.3427734375, 1.117919921875, 1.89306640625, 2.668212890625, 3.443359375, 4.218505859375, 4.99365234375, 5.768798828125, 6.5439453125, 7.319091796875, 8.09423828125, 8.869384765625, 9.64453125, 10.419677734375, 11.19482421875, 11.969970703125, 12.7451171875, 13.520263671875, 14.29541015625, 15.070556640625, 15.845703125, 16.620849609375, 17.39599609375, 18.171142578125, 18.9462890625, 19.721435546875, 20.49658203125, 21.271728515625, 22.046875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 17.0, 17.0, 21.0, 48.0, 99.0, 102.0, 143.0, 168.0, 132.0, 98.0, 65.0, 39.0, 14.0, 23.0, 7.0, 7.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9073007106781006, -0.8467980027198792, -0.7862952351570129, -0.7257925271987915, -0.6652897596359253, -0.6047870516777039, -0.5442843437194824, -0.4837815761566162, -0.4232788383960724, -0.36277610063552856, -0.30227336287498474, -0.2417706400156021, -0.1812679022550583, -0.12076517939567566, -0.060262441635131836, 0.0002402961254119873, 0.06074303388595581, 0.12124577164649963, 0.18174850940704346, 0.2422512322664261, 0.3027539849281311, 0.36325669288635254, 0.42375943064689636, 0.4842621684074402, 0.5447648763656616, 0.6052675843238831, 0.6657703518867493, 0.7262730598449707, 0.7867758274078369, 0.8472785353660583, 0.9077812433242798, 0.968284010887146, 1.0287867784500122, 1.0892895460128784, 1.149792194366455, 1.2102949619293213, 1.2707977294921875, 1.3313004970550537, 1.3918031454086304, 1.4523059129714966, 1.5128086805343628, 1.573311448097229, 1.6338140964508057, 1.6943168640136719, 1.754819631576538, 1.8153223991394043, 1.875825047492981, 1.9363278150558472, 1.9968304634094238, 2.05733323097229, 2.1178359985351562, 2.1783387660980225, 2.2388412952423096, 2.299344062805176, 2.359846830368042, 2.420349597930908, 2.4808523654937744, 2.5413551330566406, 2.601857900619507, 2.662360668182373, 2.72286319732666, 2.7833659648895264, 2.8438687324523926, 2.904371500015259, 2.964874267578125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 3.0, 10.0, 2.0, 9.0, 8.0, 16.0, 8.0, 16.0, 15.0, 19.0, 20.0, 22.0, 25.0, 16.0, 29.0, 34.0, 28.0, 21.0, 30.0, 36.0, 43.0, 39.0, 39.0, 37.0, 31.0, 35.0, 33.0, 41.0, 25.0, 31.0, 27.0, 31.0, 23.0, 19.0, 23.0, 15.0, 23.0, 22.0, 14.0, 16.0, 8.0, 8.0, 12.0, 10.0, 6.0, 3.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0], "bins": [-0.6260077357292175, -0.6070824861526489, -0.5881571769714355, -0.5692319273948669, -0.5503066182136536, -0.531381368637085, -0.5124560594558716, -0.493530809879303, -0.474605530500412, -0.455680251121521, -0.43675497174263, -0.417829692363739, -0.3989044427871704, -0.37997913360595703, -0.3610538840293884, -0.34212860465049744, -0.32320332527160645, -0.30427804589271545, -0.28535276651382446, -0.26642748713493347, -0.24750222265720367, -0.22857694327831268, -0.20965167880058289, -0.1907263994216919, -0.1718011200428009, -0.1528758406639099, -0.13395056128501892, -0.11502529680728912, -0.09610001742839813, -0.07717473804950714, -0.05824946612119675, -0.03932419419288635, -0.020398855209350586, -0.0014735795557498932, 0.0174516960978508, 0.03637697175145149, 0.055302247405052185, 0.07422752678394318, 0.09315279871225357, 0.11207807064056396, 0.13100335001945496, 0.14992862939834595, 0.16885390877723694, 0.18777917325496674, 0.20670445263385773, 0.22562973201274872, 0.24455499649047852, 0.2634802758693695, 0.2824055552482605, 0.3013308346271515, 0.3202561140060425, 0.33918139338493347, 0.35810667276382446, 0.37703192234039307, 0.39595720171928406, 0.41488248109817505, 0.43380776047706604, 0.45273303985595703, 0.471658319234848, 0.490583598613739, 0.5095088481903076, 0.528434157371521, 0.5473594069480896, 0.5662846565246582, 0.5852099657058716]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 11.0, 11.0, 10.0, 8.0, 10.0, 15.0, 16.0, 16.0, 26.0, 28.0, 18.0, 32.0, 32.0, 31.0, 35.0, 32.0, 28.0, 31.0, 51.0, 43.0, 40.0, 55.0, 30.0, 31.0, 37.0, 28.0, 32.0, 34.0, 33.0, 32.0, 16.0, 17.0, 17.0, 20.0, 12.0, 15.0, 10.0, 6.0, 13.0, 6.0, 9.0, 4.0, 3.0, 6.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0], "bins": [-5.6015625, -5.4373779296875, -5.273193359375, -5.1090087890625, -4.94482421875, -4.7806396484375, -4.616455078125, -4.4522705078125, -4.2880859375, -4.1239013671875, -3.959716796875, -3.7955322265625, -3.63134765625, -3.4671630859375, -3.302978515625, -3.1387939453125, -2.974609375, -2.8104248046875, -2.646240234375, -2.4820556640625, -2.31787109375, -2.1536865234375, -1.989501953125, -1.8253173828125, -1.6611328125, -1.4969482421875, -1.332763671875, -1.1685791015625, -1.00439453125, -0.8402099609375, -0.676025390625, -0.5118408203125, -0.34765625, -0.1834716796875, -0.019287109375, 0.1448974609375, 0.30908203125, 0.4732666015625, 0.637451171875, 0.8016357421875, 0.9658203125, 1.1300048828125, 1.294189453125, 1.4583740234375, 1.62255859375, 1.7867431640625, 1.950927734375, 2.1151123046875, 2.279296875, 2.4434814453125, 2.607666015625, 2.7718505859375, 2.93603515625, 3.1002197265625, 3.264404296875, 3.4285888671875, 3.5927734375, 3.7569580078125, 3.921142578125, 4.0853271484375, 4.24951171875, 4.4136962890625, 4.577880859375, 4.7420654296875, 4.90625]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 3.0, 7.0, 14.0, 12.0, 17.0, 15.0, 29.0, 45.0, 52.0, 66.0, 113.0, 139.0, 190.0, 266.0, 420.0, 651.0, 1007.0, 1517.0, 2570.0, 4477.0, 8049.0, 14674.0, 28547.0, 57881.0, 129641.0, 277484.0, 275114.0, 126901.0, 56876.0, 27874.0, 14474.0, 7792.0, 4418.0, 2616.0, 1606.0, 1014.0, 588.0, 412.0, 306.0, 187.0, 120.0, 101.0, 68.0, 52.0, 43.0, 31.0, 24.0, 13.0, 13.0, 10.0, 3.0, 5.0, 1.0, 3.0, 3.0, 5.0, 2.0], "bins": [-6.71875, -6.51507568359375, -6.3114013671875, -6.10772705078125, -5.904052734375, -5.70037841796875, -5.4967041015625, -5.29302978515625, -5.08935546875, -4.88568115234375, -4.6820068359375, -4.47833251953125, -4.274658203125, -4.07098388671875, -3.8673095703125, -3.66363525390625, -3.4599609375, -3.25628662109375, -3.0526123046875, -2.84893798828125, -2.645263671875, -2.44158935546875, -2.2379150390625, -2.03424072265625, -1.83056640625, -1.62689208984375, -1.4232177734375, -1.21954345703125, -1.015869140625, -0.81219482421875, -0.6085205078125, -0.40484619140625, -0.201171875, 0.00250244140625, 0.2061767578125, 0.40985107421875, 0.613525390625, 0.81719970703125, 1.0208740234375, 1.22454833984375, 1.42822265625, 1.63189697265625, 1.8355712890625, 2.03924560546875, 2.242919921875, 2.44659423828125, 2.6502685546875, 2.85394287109375, 3.0576171875, 3.26129150390625, 3.4649658203125, 3.66864013671875, 3.872314453125, 4.07598876953125, 4.2796630859375, 4.48333740234375, 4.68701171875, 4.89068603515625, 5.0943603515625, 5.29803466796875, 5.501708984375, 5.70538330078125, 5.9090576171875, 6.11273193359375, 6.31640625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 11.0, 9.0, 7.0, 12.0, 6.0, 9.0, 12.0, 18.0, 17.0, 18.0, 28.0, 35.0, 39.0, 42.0, 40.0, 45.0, 43.0, 80.0, 107.0, 194.0, 1320.0, 293.0, 160.0, 94.0, 64.0, 49.0, 42.0, 27.0, 38.0, 23.0, 30.0, 16.0, 22.0, 21.0, 19.0, 10.0, 11.0, 11.0, 3.0, 8.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.90625, -16.376953125, -15.84765625, -15.318359375, -14.7890625, -14.259765625, -13.73046875, -13.201171875, -12.671875, -12.142578125, -11.61328125, -11.083984375, -10.5546875, -10.025390625, -9.49609375, -8.966796875, -8.4375, -7.908203125, -7.37890625, -6.849609375, -6.3203125, -5.791015625, -5.26171875, -4.732421875, -4.203125, -3.673828125, -3.14453125, -2.615234375, -2.0859375, -1.556640625, -1.02734375, -0.498046875, 0.03125, 0.560546875, 1.08984375, 1.619140625, 2.1484375, 2.677734375, 3.20703125, 3.736328125, 4.265625, 4.794921875, 5.32421875, 5.853515625, 6.3828125, 6.912109375, 7.44140625, 7.970703125, 8.5, 9.029296875, 9.55859375, 10.087890625, 10.6171875, 11.146484375, 11.67578125, 12.205078125, 12.734375, 13.263671875, 13.79296875, 14.322265625, 14.8515625, 15.380859375, 15.91015625, 16.439453125, 16.96875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 5.0, 5.0, 12.0, 9.0, 9.0, 16.0, 16.0, 18.0, 21.0, 40.0, 28.0, 43.0, 83.0, 82.0, 104.0, 149.0, 217.0, 446.0, 1219.0, 5759.0, 72352.0, 2650396.0, 395868.0, 14860.0, 2270.0, 577.0, 305.0, 179.0, 137.0, 105.0, 85.0, 66.0, 46.0, 38.0, 38.0, 17.0, 11.0, 17.0, 10.0, 10.0, 6.0, 7.0, 9.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.28125, -34.23486328125, -33.1884765625, -32.14208984375, -31.095703125, -30.04931640625, -29.0029296875, -27.95654296875, -26.91015625, -25.86376953125, -24.8173828125, -23.77099609375, -22.724609375, -21.67822265625, -20.6318359375, -19.58544921875, -18.5390625, -17.49267578125, -16.4462890625, -15.39990234375, -14.353515625, -13.30712890625, -12.2607421875, -11.21435546875, -10.16796875, -9.12158203125, -8.0751953125, -7.02880859375, -5.982421875, -4.93603515625, -3.8896484375, -2.84326171875, -1.796875, -0.75048828125, 0.2958984375, 1.34228515625, 2.388671875, 3.43505859375, 4.4814453125, 5.52783203125, 6.57421875, 7.62060546875, 8.6669921875, 9.71337890625, 10.759765625, 11.80615234375, 12.8525390625, 13.89892578125, 14.9453125, 15.99169921875, 17.0380859375, 18.08447265625, 19.130859375, 20.17724609375, 21.2236328125, 22.27001953125, 23.31640625, 24.36279296875, 25.4091796875, 26.45556640625, 27.501953125, 28.54833984375, 29.5947265625, 30.64111328125, 31.6875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 786.0, 224.0, 1.0], "bins": [-964.4215087890625, -948.8115844726562, -933.2017211914062, -917.591796875, -901.98193359375, -886.3720092773438, -870.7621459960938, -855.1522216796875, -839.5423583984375, -823.9324340820312, -808.3225708007812, -792.712646484375, -777.102783203125, -761.4928588867188, -745.8829956054688, -730.2730712890625, -714.6632080078125, -699.0532836914062, -683.4434204101562, -667.83349609375, -652.2236328125, -636.6137084960938, -621.0038452148438, -605.3939208984375, -589.7840576171875, -574.1741333007812, -558.5642700195312, -542.954345703125, -527.344482421875, -511.7345886230469, -496.12469482421875, -480.5148010253906, -464.9048767089844, -449.29498291015625, -433.6850891113281, -418.0751953125, -402.4653015136719, -386.85540771484375, -371.2455139160156, -355.6356201171875, -340.0257263183594, -324.41583251953125, -308.8059387207031, -293.196044921875, -277.5861511230469, -261.97625732421875, -246.36636352539062, -230.7564697265625, -215.14657592773438, -199.53668212890625, -183.92678833007812, -168.31689453125, -152.70700073242188, -137.09710693359375, -121.4872055053711, -105.87731170654297, -90.26741027832031, -74.65751647949219, -59.04762268066406, -43.43772506713867, -27.827831268310547, -12.217933654785156, 3.3919601440429688, 19.001853942871094, 34.61174774169922]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 8.0, 9.0, 7.0, 14.0, 9.0, 11.0, 17.0, 23.0, 23.0, 28.0, 33.0, 26.0, 27.0, 40.0, 36.0, 44.0, 34.0, 41.0, 37.0, 34.0, 37.0, 53.0, 34.0, 32.0, 37.0, 34.0, 33.0, 26.0, 25.0, 24.0, 19.0, 25.0, 22.0, 20.0, 18.0, 12.0, 12.0, 8.0, 7.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-48.105690002441406, -46.686134338378906, -45.26657485961914, -43.84701919555664, -42.42746353149414, -41.007904052734375, -39.588348388671875, -38.168792724609375, -36.749237060546875, -35.329681396484375, -33.91012191772461, -32.49056625366211, -31.07101058959961, -29.651453018188477, -28.231895446777344, -26.812339782714844, -25.392780303955078, -23.973222732543945, -22.553667068481445, -21.134109497070312, -19.714553833007812, -18.29499626159668, -16.875438690185547, -15.45588207244873, -14.036325454711914, -12.616768836975098, -11.197212219238281, -9.777654647827148, -8.358098030090332, -6.938541412353516, -5.518983840942383, -4.099427223205566, -2.67987060546875, -1.2603137493133545, 0.15924310684204102, 1.5788002014160156, 2.998356819152832, 4.417913436889648, 5.837471008300781, 7.257027626037598, 8.676584243774414, 10.09614086151123, 11.515697479248047, 12.93525505065918, 14.354811668395996, 15.774368286132812, 17.193925857543945, 18.613483428955078, 20.033039093017578, 21.45259666442871, 22.87215232849121, 24.291709899902344, 25.711265563964844, 27.130823135375977, 28.55038070678711, 29.96993637084961, 31.389493942260742, 32.809051513671875, 34.228607177734375, 35.648162841796875, 37.06772232055664, 38.48727798461914, 39.906837463378906, 41.326393127441406, 42.745948791503906]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 5.0, 4.0, 6.0, 7.0, 7.0, 9.0, 11.0, 14.0, 11.0, 18.0, 22.0, 11.0, 20.0, 21.0, 27.0, 32.0, 26.0, 29.0, 37.0, 48.0, 25.0, 43.0, 41.0, 42.0, 41.0, 34.0, 35.0, 37.0, 33.0, 48.0, 40.0, 31.0, 23.0, 24.0, 27.0, 16.0, 18.0, 10.0, 11.0, 9.0, 13.0, 8.0, 9.0, 6.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-6.1171875, -5.940185546875, -5.76318359375, -5.586181640625, -5.4091796875, -5.232177734375, -5.05517578125, -4.878173828125, -4.701171875, -4.524169921875, -4.34716796875, -4.170166015625, -3.9931640625, -3.816162109375, -3.63916015625, -3.462158203125, -3.28515625, -3.108154296875, -2.93115234375, -2.754150390625, -2.5771484375, -2.400146484375, -2.22314453125, -2.046142578125, -1.869140625, -1.692138671875, -1.51513671875, -1.338134765625, -1.1611328125, -0.984130859375, -0.80712890625, -0.630126953125, -0.453125, -0.276123046875, -0.09912109375, 0.077880859375, 0.2548828125, 0.431884765625, 0.60888671875, 0.785888671875, 0.962890625, 1.139892578125, 1.31689453125, 1.493896484375, 1.6708984375, 1.847900390625, 2.02490234375, 2.201904296875, 2.37890625, 2.555908203125, 2.73291015625, 2.909912109375, 3.0869140625, 3.263916015625, 3.44091796875, 3.617919921875, 3.794921875, 3.971923828125, 4.14892578125, 4.325927734375, 4.5029296875, 4.679931640625, 4.85693359375, 5.033935546875, 5.2109375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 1.0, 4.0, 4.0, 8.0, 5.0, 11.0, 13.0, 15.0, 19.0, 30.0, 38.0, 54.0, 77.0, 109.0, 114.0, 193.0, 315.0, 478.0, 725.0, 1306.0, 2372.0, 4877.0, 10850.0, 28626.0, 97487.0, 481829.0, 1987055.0, 1250766.0, 237091.0, 55224.0, 18361.0, 7793.0, 3684.0, 1912.0, 1041.0, 621.0, 349.0, 231.0, 165.0, 131.0, 74.0, 50.0, 48.0, 28.0, 31.0, 25.0, 9.0, 11.0, 8.0, 3.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0], "bins": [-12.5703125, -12.208984375, -11.84765625, -11.486328125, -11.125, -10.763671875, -10.40234375, -10.041015625, -9.6796875, -9.318359375, -8.95703125, -8.595703125, -8.234375, -7.873046875, -7.51171875, -7.150390625, -6.7890625, -6.427734375, -6.06640625, -5.705078125, -5.34375, -4.982421875, -4.62109375, -4.259765625, -3.8984375, -3.537109375, -3.17578125, -2.814453125, -2.453125, -2.091796875, -1.73046875, -1.369140625, -1.0078125, -0.646484375, -0.28515625, 0.076171875, 0.4375, 0.798828125, 1.16015625, 1.521484375, 1.8828125, 2.244140625, 2.60546875, 2.966796875, 3.328125, 3.689453125, 4.05078125, 4.412109375, 4.7734375, 5.134765625, 5.49609375, 5.857421875, 6.21875, 6.580078125, 6.94140625, 7.302734375, 7.6640625, 8.025390625, 8.38671875, 8.748046875, 9.109375, 9.470703125, 9.83203125, 10.193359375, 10.5546875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 13.0, 18.0, 21.0, 25.0, 50.0, 69.0, 104.0, 172.0, 287.0, 470.0, 651.0, 759.0, 548.0, 304.0, 229.0, 131.0, 81.0, 45.0, 41.0, 14.0, 10.0, 8.0, 6.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.375, -16.83447265625, -16.2939453125, -15.75341796875, -15.212890625, -14.67236328125, -14.1318359375, -13.59130859375, -13.05078125, -12.51025390625, -11.9697265625, -11.42919921875, -10.888671875, -10.34814453125, -9.8076171875, -9.26708984375, -8.7265625, -8.18603515625, -7.6455078125, -7.10498046875, -6.564453125, -6.02392578125, -5.4833984375, -4.94287109375, -4.40234375, -3.86181640625, -3.3212890625, -2.78076171875, -2.240234375, -1.69970703125, -1.1591796875, -0.61865234375, -0.078125, 0.46240234375, 1.0029296875, 1.54345703125, 2.083984375, 2.62451171875, 3.1650390625, 3.70556640625, 4.24609375, 4.78662109375, 5.3271484375, 5.86767578125, 6.408203125, 6.94873046875, 7.4892578125, 8.02978515625, 8.5703125, 9.11083984375, 9.6513671875, 10.19189453125, 10.732421875, 11.27294921875, 11.8134765625, 12.35400390625, 12.89453125, 13.43505859375, 13.9755859375, 14.51611328125, 15.056640625, 15.59716796875, 16.1376953125, 16.67822265625, 17.21875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 10.0, 6.0, 14.0, 18.0, 42.0, 70.0, 122.0, 254.0, 607.0, 4244.0, 336027.0, 3830344.0, 20634.0, 1145.0, 344.0, 158.0, 93.0, 46.0, 37.0, 28.0, 11.0, 16.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.5625, -71.20703125, -68.8515625, -66.49609375, -64.140625, -61.78515625, -59.4296875, -57.07421875, -54.71875, -52.36328125, -50.0078125, -47.65234375, -45.296875, -42.94140625, -40.5859375, -38.23046875, -35.875, -33.51953125, -31.1640625, -28.80859375, -26.453125, -24.09765625, -21.7421875, -19.38671875, -17.03125, -14.67578125, -12.3203125, -9.96484375, -7.609375, -5.25390625, -2.8984375, -0.54296875, 1.8125, 4.16796875, 6.5234375, 8.87890625, 11.234375, 13.58984375, 15.9453125, 18.30078125, 20.65625, 23.01171875, 25.3671875, 27.72265625, 30.078125, 32.43359375, 34.7890625, 37.14453125, 39.5, 41.85546875, 44.2109375, 46.56640625, 48.921875, 51.27734375, 53.6328125, 55.98828125, 58.34375, 60.69921875, 63.0546875, 65.41015625, 67.765625, 70.12109375, 72.4765625, 74.83203125, 77.1875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 9.0, 25.0, 40.0, 98.0, 177.0, 246.0, 211.0, 99.0, 69.0, 23.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-206.31053161621094, -202.23532104492188, -198.1601104736328, -194.08489990234375, -190.0096893310547, -185.93447875976562, -181.85928344726562, -177.78407287597656, -173.7088623046875, -169.63365173339844, -165.55844116210938, -161.4832305908203, -157.40802001953125, -153.33282470703125, -149.25759887695312, -145.18240356445312, -141.107177734375, -137.03196716308594, -132.95675659179688, -128.8815460205078, -124.80634307861328, -120.73113250732422, -116.65592193603516, -112.5807113647461, -108.50550842285156, -104.4302978515625, -100.35508728027344, -96.27987670898438, -92.20467376708984, -88.12946319580078, -84.05425262451172, -79.97904205322266, -75.90383911132812, -71.82862854003906, -67.75341796875, -63.6782112121582, -59.603004455566406, -55.527793884277344, -51.45258331298828, -47.37737274169922, -43.30216598510742, -39.22695541381836, -35.15174865722656, -31.0765380859375, -27.00132942199707, -22.92612075805664, -18.850910186767578, -14.775701522827148, -10.700492858886719, -6.625283718109131, -2.550074577331543, 1.5251350402832031, 5.600343704223633, 9.675552368164062, 13.750762939453125, 17.825971603393555, 21.901180267333984, 25.976388931274414, 30.051597595214844, 34.126808166503906, 38.20201873779297, 42.277225494384766, 46.35243606567383, 50.427642822265625, 54.50285339355469]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 8.0, 4.0, 7.0, 9.0, 16.0, 17.0, 12.0, 15.0, 20.0, 26.0, 22.0, 21.0, 33.0, 27.0, 42.0, 40.0, 34.0, 34.0, 30.0, 45.0, 30.0, 29.0, 34.0, 48.0, 27.0, 46.0, 35.0, 26.0, 28.0, 34.0, 16.0, 23.0, 20.0, 17.0, 18.0, 18.0, 13.0, 16.0, 10.0, 12.0, 4.0, 9.0, 3.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-39.10951232910156, -37.98291778564453, -36.8563232421875, -35.72972869873047, -34.60313415527344, -33.476539611816406, -32.349945068359375, -31.223350524902344, -30.096755981445312, -28.97016143798828, -27.84356689453125, -26.71697235107422, -25.590377807617188, -24.463783264160156, -23.337188720703125, -22.210594177246094, -21.084001541137695, -19.957406997680664, -18.830812454223633, -17.7042179107666, -16.57762336730957, -15.451028823852539, -14.324435234069824, -13.197840690612793, -12.071246147155762, -10.94465160369873, -9.8180570602417, -8.691463470458984, -7.564868450164795, -6.438273906707764, -5.311679840087891, -4.185085296630859, -3.058490753173828, -1.9318963289260864, -0.8053019046783447, 0.3212924003601074, 1.4478869438171387, 2.57448148727417, 3.701075553894043, 4.827670097351074, 5.9542646408081055, 7.080859184265137, 8.207453727722168, 9.334047317504883, 10.460641860961914, 11.587236404418945, 12.713830947875977, 13.840425491333008, 14.967020034790039, 16.09361457824707, 17.2202091217041, 18.346803665161133, 19.473398208618164, 20.599992752075195, 21.726585388183594, 22.853179931640625, 23.979774475097656, 25.106369018554688, 26.23296356201172, 27.35955810546875, 28.48615264892578, 29.612747192382812, 30.739341735839844, 31.865936279296875, 32.992530822753906]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 4.0, 2.0, 5.0, 11.0, 7.0, 13.0, 9.0, 15.0, 17.0, 12.0, 13.0, 25.0, 14.0, 26.0, 22.0, 34.0, 27.0, 33.0, 36.0, 35.0, 46.0, 39.0, 26.0, 26.0, 53.0, 35.0, 42.0, 38.0, 32.0, 33.0, 22.0, 26.0, 33.0, 30.0, 23.0, 21.0, 18.0, 10.0, 16.0, 14.0, 11.0, 6.0, 7.0, 4.0, 7.0, 3.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.57421875, -5.4122314453125, -5.250244140625, -5.0882568359375, -4.92626953125, -4.7642822265625, -4.602294921875, -4.4403076171875, -4.2783203125, -4.1163330078125, -3.954345703125, -3.7923583984375, -3.63037109375, -3.4683837890625, -3.306396484375, -3.1444091796875, -2.982421875, -2.8204345703125, -2.658447265625, -2.4964599609375, -2.33447265625, -2.1724853515625, -2.010498046875, -1.8485107421875, -1.6865234375, -1.5245361328125, -1.362548828125, -1.2005615234375, -1.03857421875, -0.8765869140625, -0.714599609375, -0.5526123046875, -0.390625, -0.2286376953125, -0.066650390625, 0.0953369140625, 0.25732421875, 0.4193115234375, 0.581298828125, 0.7432861328125, 0.9052734375, 1.0672607421875, 1.229248046875, 1.3912353515625, 1.55322265625, 1.7152099609375, 1.877197265625, 2.0391845703125, 2.201171875, 2.3631591796875, 2.525146484375, 2.6871337890625, 2.84912109375, 3.0111083984375, 3.173095703125, 3.3350830078125, 3.4970703125, 3.6590576171875, 3.821044921875, 3.9830322265625, 4.14501953125, 4.3070068359375, 4.468994140625, 4.6309814453125, 4.79296875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 7.0, 10.0, 11.0, 29.0, 67.0, 91.0, 251.0, 502.0, 1262.0, 3561.0, 12969.0, 74848.0, 608691.0, 301093.0, 33982.0, 7354.0, 2234.0, 897.0, 373.0, 159.0, 87.0, 41.0, 16.0, 12.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.28515625, -5.09503173828125, -4.9049072265625, -4.71478271484375, -4.524658203125, -4.33453369140625, -4.1444091796875, -3.95428466796875, -3.76416015625, -3.57403564453125, -3.3839111328125, -3.19378662109375, -3.003662109375, -2.81353759765625, -2.6234130859375, -2.43328857421875, -2.2431640625, -2.05303955078125, -1.8629150390625, -1.67279052734375, -1.482666015625, -1.29254150390625, -1.1024169921875, -0.91229248046875, -0.72216796875, -0.53204345703125, -0.3419189453125, -0.15179443359375, 0.038330078125, 0.22845458984375, 0.4185791015625, 0.60870361328125, 0.798828125, 0.98895263671875, 1.1790771484375, 1.36920166015625, 1.559326171875, 1.74945068359375, 1.9395751953125, 2.12969970703125, 2.31982421875, 2.50994873046875, 2.7000732421875, 2.89019775390625, 3.080322265625, 3.27044677734375, 3.4605712890625, 3.65069580078125, 3.8408203125, 4.03094482421875, 4.2210693359375, 4.41119384765625, 4.601318359375, 4.79144287109375, 4.9815673828125, 5.17169189453125, 5.36181640625, 5.55194091796875, 5.7420654296875, 5.93218994140625, 6.122314453125, 6.31243896484375, 6.5025634765625, 6.69268798828125, 6.8828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 9.0, 7.0, 4.0, 8.0, 11.0, 9.0, 7.0, 14.0, 17.0, 16.0, 22.0, 18.0, 17.0, 18.0, 24.0, 20.0, 31.0, 35.0, 27.0, 29.0, 29.0, 36.0, 48.0, 1058.0, 33.0, 35.0, 40.0, 33.0, 32.0, 35.0, 29.0, 33.0, 26.0, 26.0, 22.0, 15.0, 20.0, 18.0, 15.0, 14.0, 15.0, 9.0, 14.0, 6.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 5.0, 3.0, 1.0, 2.0, 3.0], "bins": [-3.42578125, -3.321441650390625, -3.21710205078125, -3.112762451171875, -3.0084228515625, -2.904083251953125, -2.79974365234375, -2.695404052734375, -2.591064453125, -2.486724853515625, -2.38238525390625, -2.278045654296875, -2.1737060546875, -2.069366455078125, -1.96502685546875, -1.860687255859375, -1.75634765625, -1.652008056640625, -1.54766845703125, -1.443328857421875, -1.3389892578125, -1.234649658203125, -1.13031005859375, -1.025970458984375, -0.921630859375, -0.817291259765625, -0.71295166015625, -0.608612060546875, -0.5042724609375, -0.399932861328125, -0.29559326171875, -0.191253662109375, -0.0869140625, 0.017425537109375, 0.12176513671875, 0.226104736328125, 0.3304443359375, 0.434783935546875, 0.53912353515625, 0.643463134765625, 0.747802734375, 0.852142333984375, 0.95648193359375, 1.060821533203125, 1.1651611328125, 1.269500732421875, 1.37384033203125, 1.478179931640625, 1.58251953125, 1.686859130859375, 1.79119873046875, 1.895538330078125, 1.9998779296875, 2.104217529296875, 2.20855712890625, 2.312896728515625, 2.417236328125, 2.521575927734375, 2.62591552734375, 2.730255126953125, 2.8345947265625, 2.938934326171875, 3.04327392578125, 3.147613525390625, 3.251953125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 11.0, 14.0, 19.0, 30.0, 45.0, 60.0, 83.0, 146.0, 198.0, 296.0, 444.0, 695.0, 1090.0, 1654.0, 2547.0, 4413.0, 8306.0, 17761.0, 49780.0, 181354.0, 1214765.0, 454722.0, 100116.0, 30460.0, 12555.0, 6148.0, 3383.0, 2165.0, 1340.0, 852.0, 556.0, 344.0, 237.0, 174.0, 123.0, 68.0, 70.0, 42.0, 21.0, 14.0, 11.0, 7.0, 8.0, 4.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.638671875, -1.583648681640625, -1.52862548828125, -1.473602294921875, -1.4185791015625, -1.363555908203125, -1.30853271484375, -1.253509521484375, -1.198486328125, -1.143463134765625, -1.08843994140625, -1.033416748046875, -0.9783935546875, -0.923370361328125, -0.86834716796875, -0.813323974609375, -0.75830078125, -0.703277587890625, -0.64825439453125, -0.593231201171875, -0.5382080078125, -0.483184814453125, -0.42816162109375, -0.373138427734375, -0.318115234375, -0.263092041015625, -0.20806884765625, -0.153045654296875, -0.0980224609375, -0.042999267578125, 0.01202392578125, 0.067047119140625, 0.1220703125, 0.177093505859375, 0.23211669921875, 0.287139892578125, 0.3421630859375, 0.397186279296875, 0.45220947265625, 0.507232666015625, 0.562255859375, 0.617279052734375, 0.67230224609375, 0.727325439453125, 0.7823486328125, 0.837371826171875, 0.89239501953125, 0.947418212890625, 1.00244140625, 1.057464599609375, 1.11248779296875, 1.167510986328125, 1.2225341796875, 1.277557373046875, 1.33258056640625, 1.387603759765625, 1.442626953125, 1.497650146484375, 1.55267333984375, 1.607696533203125, 1.6627197265625, 1.717742919921875, 1.77276611328125, 1.827789306640625, 1.8828125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 7.0, 8.0, 21.0, 11.0, 20.0, 20.0, 27.0, 35.0, 67.0, 82.0, 96.0, 133.0, 128.0, 88.0, 56.0, 35.0, 29.0, 21.0, 21.0, 10.0, 9.0, 11.0, 5.0, 5.0, 7.0, 6.0, 6.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31884765625, -0.3064002990722656, -0.29395294189453125, -0.2815055847167969, -0.2690582275390625, -0.2566108703613281, -0.24416351318359375, -0.23171615600585938, -0.219268798828125, -0.20682144165039062, -0.19437408447265625, -0.18192672729492188, -0.1694793701171875, -0.15703201293945312, -0.14458465576171875, -0.13213729858398438, -0.11968994140625, -0.10724258422851562, -0.09479522705078125, -0.08234786987304688, -0.0699005126953125, -0.057453155517578125, -0.04500579833984375, -0.032558441162109375, -0.020111083984375, -0.007663726806640625, 0.00478363037109375, 0.017230987548828125, 0.0296783447265625, 0.042125701904296875, 0.05457305908203125, 0.06702041625976562, 0.0794677734375, 0.09191513061523438, 0.10436248779296875, 0.11680984497070312, 0.1292572021484375, 0.14170455932617188, 0.15415191650390625, 0.16659927368164062, 0.179046630859375, 0.19149398803710938, 0.20394134521484375, 0.21638870239257812, 0.2288360595703125, 0.24128341674804688, 0.25373077392578125, 0.2661781311035156, 0.27862548828125, 0.2910728454589844, 0.30352020263671875, 0.3159675598144531, 0.3284149169921875, 0.3408622741699219, 0.35330963134765625, 0.3657569885253906, 0.378204345703125, 0.3906517028808594, 0.40309906005859375, 0.4155464172363281, 0.4279937744140625, 0.4404411315917969, 0.45288848876953125, 0.4653358459472656, 0.477783203125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 5.0, 9.0, 3.0, 10.0, 16.0, 25.0, 17.0, 17.0, 42.0, 57.0, 91.0, 173.0, 423.0, 3592.0, 253180.0, 784894.0, 4898.0, 562.0, 175.0, 108.0, 67.0, 43.0, 27.0, 22.0, 26.0, 16.0, 12.0, 4.0, 9.0, 2.0, 6.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0], "bins": [-9.2890625, -9.05120849609375, -8.8133544921875, -8.57550048828125, -8.337646484375, -8.09979248046875, -7.8619384765625, -7.62408447265625, -7.38623046875, -7.14837646484375, -6.9105224609375, -6.67266845703125, -6.434814453125, -6.19696044921875, -5.9591064453125, -5.72125244140625, -5.4833984375, -5.24554443359375, -5.0076904296875, -4.76983642578125, -4.531982421875, -4.29412841796875, -4.0562744140625, -3.81842041015625, -3.58056640625, -3.34271240234375, -3.1048583984375, -2.86700439453125, -2.629150390625, -2.39129638671875, -2.1534423828125, -1.91558837890625, -1.677734375, -1.43988037109375, -1.2020263671875, -0.96417236328125, -0.726318359375, -0.48846435546875, -0.2506103515625, -0.01275634765625, 0.22509765625, 0.46295166015625, 0.7008056640625, 0.93865966796875, 1.176513671875, 1.41436767578125, 1.6522216796875, 1.89007568359375, 2.1279296875, 2.36578369140625, 2.6036376953125, 2.84149169921875, 3.079345703125, 3.31719970703125, 3.5550537109375, 3.79290771484375, 4.03076171875, 4.26861572265625, 4.5064697265625, 4.74432373046875, 4.982177734375, 5.22003173828125, 5.4578857421875, 5.69573974609375, 5.93359375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [7.0, 7.0, 86.0, 347.0, 399.0, 137.0, 24.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31863605976104736, -0.24157589673995972, -0.16451574862003326, -0.08745560050010681, -0.010395437479019165, 0.06666472554206848, 0.14372485876083374, 0.2207850217819214, 0.29784518480300903, 0.3749053478240967, 0.4519655108451843, 0.529025673866272, 0.6060857772827148, 0.6831459999084473, 0.7602061033248901, 0.8372662663459778, 0.9143264293670654, 0.9913865923881531, 1.0684467554092407, 1.1455068588256836, 1.222567081451416, 1.2996271848678589, 1.3766872882843018, 1.4537475109100342, 1.5308077335357666, 1.6078678369522095, 1.684928059577942, 1.7619881629943848, 1.8390483856201172, 1.91610848903656, 1.993168592453003, 2.0702288150787354, 2.1472890377044678, 2.2243492603302, 2.3014092445373535, 2.378469467163086, 2.4555296897888184, 2.532589912414551, 2.609649896621704, 2.6867101192474365, 2.763770341873169, 2.8408305644989014, 2.9178905487060547, 2.994950771331787, 3.0720109939575195, 3.149071216583252, 3.2261312007904053, 3.3031914234161377, 3.380251407623291, 3.4573116302490234, 3.5343716144561768, 3.611431837081909, 3.6884920597076416, 3.765552282333374, 3.8426122665405273, 3.9196724891662598, 3.996732711791992, 4.073792934417725, 4.150853157043457, 4.2279133796691895, 4.304973125457764, 4.382033348083496, 4.4590935707092285, 4.536153793334961, 4.613214015960693]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 12.0, 5.0, 10.0, 10.0, 13.0, 18.0, 12.0, 23.0, 23.0, 29.0, 38.0, 33.0, 45.0, 38.0, 42.0, 34.0, 45.0, 50.0, 53.0, 53.0, 39.0, 53.0, 49.0, 42.0, 26.0, 39.0, 27.0, 33.0, 16.0, 21.0, 17.0, 8.0, 12.0, 3.0, 3.0, 9.0, 4.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.4490535855293274, -0.4354099929332733, -0.4217664301395416, -0.40812283754348755, -0.39447927474975586, -0.3808356821537018, -0.3671920895576477, -0.353548526763916, -0.3399049639701843, -0.32626137137413025, -0.31261780858039856, -0.2989742159843445, -0.2853306531906128, -0.2716870605945587, -0.25804346799850464, -0.24439990520477295, -0.23075631260871887, -0.217112734913826, -0.2034691572189331, -0.18982556462287903, -0.17618200182914734, -0.16253840923309326, -0.14889483153820038, -0.1352512538433075, -0.12160767614841461, -0.10796409845352173, -0.09432052075862885, -0.08067693561315536, -0.06703335791826248, -0.0533897802233696, -0.03974619507789612, -0.026102617383003235, -0.012459039688110352, 0.001184539869427681, 0.014828119426965714, 0.028471700847148895, 0.04211527854204178, 0.05575885623693466, 0.06940244138240814, 0.08304601907730103, 0.09668959677219391, 0.11033317446708679, 0.12397675216197968, 0.13762032985687256, 0.15126392245292664, 0.16490748524665833, 0.1785510778427124, 0.19219465553760529, 0.20583823323249817, 0.21948181092739105, 0.23312538862228394, 0.246768981218338, 0.2604125440120697, 0.2740561366081238, 0.28769969940185547, 0.30134329199790955, 0.3149868845939636, 0.3286304771900177, 0.3422740399837494, 0.35591763257980347, 0.36956119537353516, 0.38320478796958923, 0.3968483805656433, 0.410491943359375, 0.4241355061531067]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 6.0, 15.0, 2.0, 12.0, 19.0, 13.0, 23.0, 17.0, 25.0, 20.0, 18.0, 21.0, 31.0, 22.0, 31.0, 24.0, 36.0, 38.0, 39.0, 39.0, 37.0, 30.0, 50.0, 34.0, 37.0, 37.0, 23.0, 36.0, 28.0, 32.0, 25.0, 13.0, 15.0, 22.0, 22.0, 15.0, 13.0, 12.0, 8.0, 7.0, 10.0, 3.0, 5.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-5.3359375, -5.1806640625, -5.025390625, -4.8701171875, -4.71484375, -4.5595703125, -4.404296875, -4.2490234375, -4.09375, -3.9384765625, -3.783203125, -3.6279296875, -3.47265625, -3.3173828125, -3.162109375, -3.0068359375, -2.8515625, -2.6962890625, -2.541015625, -2.3857421875, -2.23046875, -2.0751953125, -1.919921875, -1.7646484375, -1.609375, -1.4541015625, -1.298828125, -1.1435546875, -0.98828125, -0.8330078125, -0.677734375, -0.5224609375, -0.3671875, -0.2119140625, -0.056640625, 0.0986328125, 0.25390625, 0.4091796875, 0.564453125, 0.7197265625, 0.875, 1.0302734375, 1.185546875, 1.3408203125, 1.49609375, 1.6513671875, 1.806640625, 1.9619140625, 2.1171875, 2.2724609375, 2.427734375, 2.5830078125, 2.73828125, 2.8935546875, 3.048828125, 3.2041015625, 3.359375, 3.5146484375, 3.669921875, 3.8251953125, 3.98046875, 4.1357421875, 4.291015625, 4.4462890625, 4.6015625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 9.0, 16.0, 15.0, 21.0, 35.0, 43.0, 73.0, 119.0, 182.0, 287.0, 504.0, 875.0, 1536.0, 2730.0, 5218.0, 9454.0, 18043.0, 35561.0, 73186.0, 154804.0, 350533.0, 206395.0, 94649.0, 45326.0, 22748.0, 11863.0, 6371.0, 3429.0, 1901.0, 1049.0, 627.0, 357.0, 209.0, 126.0, 70.0, 63.0, 43.0, 34.0, 17.0, 11.0, 12.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.6640625, -7.43646240234375, -7.2088623046875, -6.98126220703125, -6.753662109375, -6.52606201171875, -6.2984619140625, -6.07086181640625, -5.84326171875, -5.61566162109375, -5.3880615234375, -5.16046142578125, -4.932861328125, -4.70526123046875, -4.4776611328125, -4.25006103515625, -4.0224609375, -3.79486083984375, -3.5672607421875, -3.33966064453125, -3.112060546875, -2.88446044921875, -2.6568603515625, -2.42926025390625, -2.20166015625, -1.97406005859375, -1.7464599609375, -1.51885986328125, -1.291259765625, -1.06365966796875, -0.8360595703125, -0.60845947265625, -0.380859375, -0.15325927734375, 0.0743408203125, 0.30194091796875, 0.529541015625, 0.75714111328125, 0.9847412109375, 1.21234130859375, 1.43994140625, 1.66754150390625, 1.8951416015625, 2.12274169921875, 2.350341796875, 2.57794189453125, 2.8055419921875, 3.03314208984375, 3.2607421875, 3.48834228515625, 3.7159423828125, 3.94354248046875, 4.171142578125, 4.39874267578125, 4.6263427734375, 4.85394287109375, 5.08154296875, 5.30914306640625, 5.5367431640625, 5.76434326171875, 5.991943359375, 6.21954345703125, 6.4471435546875, 6.67474365234375, 6.90234375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 0.0, 6.0, 3.0, 5.0, 10.0, 12.0, 10.0, 15.0, 14.0, 31.0, 26.0, 32.0, 32.0, 24.0, 38.0, 43.0, 45.0, 85.0, 116.0, 182.0, 1425.0, 260.0, 140.0, 90.0, 66.0, 50.0, 26.0, 47.0, 40.0, 24.0, 26.0, 21.0, 20.0, 16.0, 16.0, 12.0, 11.0, 5.0, 7.0, 8.0, 10.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.2109375, -14.6822509765625, -14.153564453125, -13.6248779296875, -13.09619140625, -12.5675048828125, -12.038818359375, -11.5101318359375, -10.9814453125, -10.4527587890625, -9.924072265625, -9.3953857421875, -8.86669921875, -8.3380126953125, -7.809326171875, -7.2806396484375, -6.751953125, -6.2232666015625, -5.694580078125, -5.1658935546875, -4.63720703125, -4.1085205078125, -3.579833984375, -3.0511474609375, -2.5224609375, -1.9937744140625, -1.465087890625, -0.9364013671875, -0.40771484375, 0.1209716796875, 0.649658203125, 1.1783447265625, 1.70703125, 2.2357177734375, 2.764404296875, 3.2930908203125, 3.82177734375, 4.3504638671875, 4.879150390625, 5.4078369140625, 5.9365234375, 6.4652099609375, 6.993896484375, 7.5225830078125, 8.05126953125, 8.5799560546875, 9.108642578125, 9.6373291015625, 10.166015625, 10.6947021484375, 11.223388671875, 11.7520751953125, 12.28076171875, 12.8094482421875, 13.338134765625, 13.8668212890625, 14.3955078125, 14.9241943359375, 15.452880859375, 15.9815673828125, 16.51025390625, 17.0389404296875, 17.567626953125, 18.0963134765625, 18.625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 9.0, 8.0, 17.0, 19.0, 30.0, 26.0, 42.0, 54.0, 76.0, 97.0, 144.0, 184.0, 340.0, 610.0, 1402.0, 4713.0, 49703.0, 2586631.0, 481163.0, 15560.0, 2644.0, 904.0, 446.0, 250.0, 189.0, 123.0, 82.0, 63.0, 42.0, 38.0, 18.0, 20.0, 18.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-41.78125, -40.61376953125, -39.4462890625, -38.27880859375, -37.111328125, -35.94384765625, -34.7763671875, -33.60888671875, -32.44140625, -31.27392578125, -30.1064453125, -28.93896484375, -27.771484375, -26.60400390625, -25.4365234375, -24.26904296875, -23.1015625, -21.93408203125, -20.7666015625, -19.59912109375, -18.431640625, -17.26416015625, -16.0966796875, -14.92919921875, -13.76171875, -12.59423828125, -11.4267578125, -10.25927734375, -9.091796875, -7.92431640625, -6.7568359375, -5.58935546875, -4.421875, -3.25439453125, -2.0869140625, -0.91943359375, 0.248046875, 1.41552734375, 2.5830078125, 3.75048828125, 4.91796875, 6.08544921875, 7.2529296875, 8.42041015625, 9.587890625, 10.75537109375, 11.9228515625, 13.09033203125, 14.2578125, 15.42529296875, 16.5927734375, 17.76025390625, 18.927734375, 20.09521484375, 21.2626953125, 22.43017578125, 23.59765625, 24.76513671875, 25.9326171875, 27.10009765625, 28.267578125, 29.43505859375, 30.6025390625, 31.77001953125, 32.9375]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 23.0, 121.0, 277.0, 370.0, 168.0, 52.0, 5.0, 1.0, 0.0, 1.0], "bins": [-229.21580505371094, -225.20521545410156, -221.1946258544922, -217.1840362548828, -213.17343139648438, -209.162841796875, -205.15225219726562, -201.14166259765625, -197.13107299804688, -193.1204833984375, -189.10989379882812, -185.09930419921875, -181.08871459960938, -177.07810974121094, -173.06752014160156, -169.0569305419922, -165.0463409423828, -161.03575134277344, -157.02516174316406, -153.0145721435547, -149.00396728515625, -144.99337768554688, -140.9827880859375, -136.97219848632812, -132.96160888671875, -128.95101928710938, -124.9404296875, -120.9298324584961, -116.91924285888672, -112.90865325927734, -108.89805603027344, -104.88746643066406, -100.87686157226562, -96.86627197265625, -92.85568237304688, -88.84508514404297, -84.8344955444336, -80.82390594482422, -76.81330871582031, -72.80271911621094, -68.79212951660156, -64.78153991699219, -60.77094650268555, -56.760353088378906, -52.74976348876953, -48.739173889160156, -44.728580474853516, -40.717987060546875, -36.7073974609375, -32.696807861328125, -28.686214447021484, -24.675622940063477, -20.66503143310547, -16.65443992614746, -12.643848419189453, -8.633256912231445, -4.62266731262207, -0.6120758056640625, 3.3985157012939453, 7.409107208251953, 11.419698715209961, 15.430290222167969, 19.440881729125977, 23.451473236083984, 27.462064743041992]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 0.0, 3.0, 3.0, 1.0, 9.0, 6.0, 10.0, 8.0, 8.0, 17.0, 16.0, 33.0, 21.0, 34.0, 36.0, 37.0, 33.0, 46.0, 47.0, 50.0, 49.0, 45.0, 56.0, 46.0, 43.0, 40.0, 53.0, 34.0, 35.0, 29.0, 37.0, 29.0, 21.0, 22.0, 12.0, 11.0, 7.0, 3.0, 6.0, 3.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.44434356689453, -52.830101013183594, -51.215858459472656, -49.60161590576172, -47.98737335205078, -46.373130798339844, -44.75889205932617, -43.144649505615234, -41.5304069519043, -39.91616439819336, -38.30192184448242, -36.687679290771484, -35.07344055175781, -33.459197998046875, -31.844955444335938, -30.230712890625, -28.616470336914062, -27.002227783203125, -25.387985229492188, -23.773744583129883, -22.159502029418945, -20.545259475708008, -18.931018829345703, -17.316776275634766, -15.702533721923828, -14.08829116821289, -12.47404956817627, -10.859807968139648, -9.245565414428711, -7.631322860717773, -6.017081260681152, -4.402839660644531, -2.7885971069335938, -1.1743550300598145, 0.43988704681396484, 2.054129123687744, 3.6683712005615234, 5.282613754272461, 6.896855354309082, 8.511096954345703, 10.12533950805664, 11.739582061767578, 13.3538236618042, 14.96806526184082, 16.582307815551758, 18.196550369262695, 19.810791015625, 21.425033569335938, 23.039276123046875, 24.653518676757812, 26.26776123046875, 27.882001876831055, 29.496244430541992, 31.11048698425293, 32.724727630615234, 34.33897018432617, 35.95321273803711, 37.56745529174805, 39.181697845458984, 40.79594039916992, 42.410179138183594, 44.02442169189453, 45.63866424560547, 47.252906799316406, 48.867149353027344]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 2.0, 8.0, 6.0, 11.0, 5.0, 8.0, 14.0, 18.0, 22.0, 16.0, 18.0, 31.0, 24.0, 15.0, 25.0, 32.0, 32.0, 29.0, 40.0, 34.0, 34.0, 39.0, 36.0, 37.0, 51.0, 40.0, 35.0, 31.0, 32.0, 27.0, 27.0, 24.0, 33.0, 26.0, 18.0, 26.0, 19.0, 9.0, 12.0, 6.0, 6.0, 6.0, 5.0, 8.0, 5.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0], "bins": [-6.14453125, -5.97088623046875, -5.7972412109375, -5.62359619140625, -5.449951171875, -5.27630615234375, -5.1026611328125, -4.92901611328125, -4.75537109375, -4.58172607421875, -4.4080810546875, -4.23443603515625, -4.060791015625, -3.88714599609375, -3.7135009765625, -3.53985595703125, -3.3662109375, -3.19256591796875, -3.0189208984375, -2.84527587890625, -2.671630859375, -2.49798583984375, -2.3243408203125, -2.15069580078125, -1.97705078125, -1.80340576171875, -1.6297607421875, -1.45611572265625, -1.282470703125, -1.10882568359375, -0.9351806640625, -0.76153564453125, -0.587890625, -0.41424560546875, -0.2406005859375, -0.06695556640625, 0.106689453125, 0.28033447265625, 0.4539794921875, 0.62762451171875, 0.80126953125, 0.97491455078125, 1.1485595703125, 1.32220458984375, 1.495849609375, 1.66949462890625, 1.8431396484375, 2.01678466796875, 2.1904296875, 2.36407470703125, 2.5377197265625, 2.71136474609375, 2.885009765625, 3.05865478515625, 3.2322998046875, 3.40594482421875, 3.57958984375, 3.75323486328125, 3.9268798828125, 4.10052490234375, 4.274169921875, 4.44781494140625, 4.6214599609375, 4.79510498046875, 4.96875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 5.0, 3.0, 9.0, 3.0, 6.0, 14.0, 12.0, 12.0, 18.0, 47.0, 44.0, 77.0, 99.0, 132.0, 185.0, 263.0, 433.0, 710.0, 1025.0, 1566.0, 2549.0, 4536.0, 8642.0, 17655.0, 45170.0, 152090.0, 646220.0, 1867020.0, 1067654.0, 257521.0, 70194.0, 24722.0, 11371.0, 5713.0, 3258.0, 1922.0, 1166.0, 810.0, 462.0, 321.0, 204.0, 138.0, 98.0, 51.0, 53.0, 33.0, 19.0, 16.0, 5.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-9.90625, -9.6121826171875, -9.318115234375, -9.0240478515625, -8.72998046875, -8.4359130859375, -8.141845703125, -7.8477783203125, -7.5537109375, -7.2596435546875, -6.965576171875, -6.6715087890625, -6.37744140625, -6.0833740234375, -5.789306640625, -5.4952392578125, -5.201171875, -4.9071044921875, -4.613037109375, -4.3189697265625, -4.02490234375, -3.7308349609375, -3.436767578125, -3.1427001953125, -2.8486328125, -2.5545654296875, -2.260498046875, -1.9664306640625, -1.67236328125, -1.3782958984375, -1.084228515625, -0.7901611328125, -0.49609375, -0.2020263671875, 0.092041015625, 0.3861083984375, 0.68017578125, 0.9742431640625, 1.268310546875, 1.5623779296875, 1.8564453125, 2.1505126953125, 2.444580078125, 2.7386474609375, 3.03271484375, 3.3267822265625, 3.620849609375, 3.9149169921875, 4.208984375, 4.5030517578125, 4.797119140625, 5.0911865234375, 5.38525390625, 5.6793212890625, 5.973388671875, 6.2674560546875, 6.5615234375, 6.8555908203125, 7.149658203125, 7.4437255859375, 7.73779296875, 8.0318603515625, 8.325927734375, 8.6199951171875, 8.9140625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 6.0, 8.0, 17.0, 18.0, 23.0, 22.0, 36.0, 42.0, 49.0, 80.0, 119.0, 135.0, 181.0, 256.0, 354.0, 433.0, 464.0, 449.0, 370.0, 284.0, 191.0, 131.0, 91.0, 66.0, 57.0, 51.0, 36.0, 22.0, 13.0, 12.0, 12.0, 11.0, 10.0, 7.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-12.65625, -12.3367919921875, -12.017333984375, -11.6978759765625, -11.37841796875, -11.0589599609375, -10.739501953125, -10.4200439453125, -10.1005859375, -9.7811279296875, -9.461669921875, -9.1422119140625, -8.82275390625, -8.5032958984375, -8.183837890625, -7.8643798828125, -7.544921875, -7.2254638671875, -6.906005859375, -6.5865478515625, -6.26708984375, -5.9476318359375, -5.628173828125, -5.3087158203125, -4.9892578125, -4.6697998046875, -4.350341796875, -4.0308837890625, -3.71142578125, -3.3919677734375, -3.072509765625, -2.7530517578125, -2.43359375, -2.1141357421875, -1.794677734375, -1.4752197265625, -1.15576171875, -0.8363037109375, -0.516845703125, -0.1973876953125, 0.1220703125, 0.4415283203125, 0.760986328125, 1.0804443359375, 1.39990234375, 1.7193603515625, 2.038818359375, 2.3582763671875, 2.677734375, 2.9971923828125, 3.316650390625, 3.6361083984375, 3.95556640625, 4.2750244140625, 4.594482421875, 4.9139404296875, 5.2333984375, 5.5528564453125, 5.872314453125, 6.1917724609375, 6.51123046875, 6.8306884765625, 7.150146484375, 7.4696044921875, 7.7890625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 5.0, 7.0, 4.0, 11.0, 10.0, 11.0, 7.0, 16.0, 19.0, 31.0, 36.0, 46.0, 58.0, 75.0, 121.0, 188.0, 396.0, 1244.0, 8524.0, 234143.0, 3825269.0, 116510.0, 5614.0, 937.0, 329.0, 176.0, 122.0, 109.0, 67.0, 50.0, 28.0, 36.0, 26.0, 7.0, 22.0, 11.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.375, -35.84423828125, -34.3134765625, -32.78271484375, -31.251953125, -29.72119140625, -28.1904296875, -26.65966796875, -25.12890625, -23.59814453125, -22.0673828125, -20.53662109375, -19.005859375, -17.47509765625, -15.9443359375, -14.41357421875, -12.8828125, -11.35205078125, -9.8212890625, -8.29052734375, -6.759765625, -5.22900390625, -3.6982421875, -2.16748046875, -0.63671875, 0.89404296875, 2.4248046875, 3.95556640625, 5.486328125, 7.01708984375, 8.5478515625, 10.07861328125, 11.609375, 13.14013671875, 14.6708984375, 16.20166015625, 17.732421875, 19.26318359375, 20.7939453125, 22.32470703125, 23.85546875, 25.38623046875, 26.9169921875, 28.44775390625, 29.978515625, 31.50927734375, 33.0400390625, 34.57080078125, 36.1015625, 37.63232421875, 39.1630859375, 40.69384765625, 42.224609375, 43.75537109375, 45.2861328125, 46.81689453125, 48.34765625, 49.87841796875, 51.4091796875, 52.93994140625, 54.470703125, 56.00146484375, 57.5322265625, 59.06298828125, 60.59375]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 30.0, 57.0, 126.0, 203.0, 253.0, 176.0, 106.0, 36.0, 17.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.36237335205078, -81.38146209716797, -77.40055084228516, -73.41963195800781, -69.438720703125, -65.45780944824219, -61.476898193359375, -57.49598693847656, -53.515071868896484, -49.53416061401367, -45.553245544433594, -41.57233428955078, -37.59142303466797, -33.61050796508789, -29.629596710205078, -25.648683547973633, -21.667770385742188, -17.686857223510742, -13.705945014953613, -9.725032806396484, -5.744119644165039, -1.7632064819335938, 2.2177047729492188, 6.198617935180664, 10.17953109741211, 14.160444259643555, 18.141357421875, 22.122268676757812, 26.103181838989258, 30.084095001220703, 34.065006256103516, 38.045921325683594, 42.02684020996094, 46.00775146484375, 49.98866653442383, 53.96957778930664, 57.95049285888672, 61.93140411376953, 65.91231536865234, 69.89322662353516, 73.8741455078125, 77.85505676269531, 81.83596801757812, 85.81687927246094, 89.79779815673828, 93.7787094116211, 97.7596206665039, 101.74053192138672, 105.72144317626953, 109.70235443115234, 113.68326568603516, 117.6641845703125, 121.64509582519531, 125.62600708007812, 129.60691833496094, 133.58782958984375, 137.56874084472656, 141.54965209960938, 145.5305633544922, 149.511474609375, 153.4923858642578, 157.47329711914062, 161.4542236328125, 165.4351348876953, 169.41604614257812]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 10.0, 10.0, 4.0, 18.0, 16.0, 27.0, 21.0, 15.0, 37.0, 31.0, 29.0, 35.0, 31.0, 45.0, 41.0, 44.0, 37.0, 32.0, 40.0, 48.0, 50.0, 37.0, 44.0, 39.0, 32.0, 33.0, 18.0, 26.0, 25.0, 12.0, 18.0, 16.0, 15.0, 8.0, 11.0, 9.0, 7.0, 3.0, 5.0, 3.0, 5.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.826637268066406, -32.704254150390625, -31.58186912536621, -30.459484100341797, -29.337100982666016, -28.214717864990234, -27.09233283996582, -25.969947814941406, -24.847564697265625, -23.725181579589844, -22.60279655456543, -21.480411529541016, -20.358028411865234, -19.235645294189453, -18.11326026916504, -16.990875244140625, -15.868492126464844, -14.746108055114746, -13.623723983764648, -12.50133991241455, -11.378955841064453, -10.256571769714355, -9.134187698364258, -8.01180362701416, -6.8894195556640625, -5.767035484313965, -4.644651412963867, -3.5222673416137695, -2.399883270263672, -1.2774991989135742, -0.15511512756347656, 0.9672689437866211, 2.0896568298339844, 3.212040901184082, 4.33442497253418, 5.456809043884277, 6.579193115234375, 7.701577186584473, 8.82396125793457, 9.946345329284668, 11.068729400634766, 12.191113471984863, 13.313497543334961, 14.435881614685059, 15.558265686035156, 16.680648803710938, 17.80303382873535, 18.925418853759766, 20.047801971435547, 21.170185089111328, 22.292570114135742, 23.414955139160156, 24.537338256835938, 25.65972137451172, 26.782106399536133, 27.904491424560547, 29.026874542236328, 30.14925765991211, 31.271642684936523, 32.39402770996094, 33.51641082763672, 34.6387939453125, 35.76117706298828, 36.88356399536133, 38.00594711303711]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 5.0, 10.0, 5.0, 19.0, 12.0, 21.0, 16.0, 15.0, 30.0, 29.0, 28.0, 25.0, 32.0, 25.0, 49.0, 40.0, 42.0, 37.0, 41.0, 41.0, 46.0, 46.0, 33.0, 48.0, 26.0, 37.0, 26.0, 30.0, 38.0, 24.0, 18.0, 16.0, 11.0, 14.0, 13.0, 10.0, 13.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.49609375, -6.3046875, -6.11328125, -5.921875, -5.73046875, -5.5390625, -5.34765625, -5.15625, -4.96484375, -4.7734375, -4.58203125, -4.390625, -4.19921875, -4.0078125, -3.81640625, -3.625, -3.43359375, -3.2421875, -3.05078125, -2.859375, -2.66796875, -2.4765625, -2.28515625, -2.09375, -1.90234375, -1.7109375, -1.51953125, -1.328125, -1.13671875, -0.9453125, -0.75390625, -0.5625, -0.37109375, -0.1796875, 0.01171875, 0.203125, 0.39453125, 0.5859375, 0.77734375, 0.96875, 1.16015625, 1.3515625, 1.54296875, 1.734375, 1.92578125, 2.1171875, 2.30859375, 2.5, 2.69140625, 2.8828125, 3.07421875, 3.265625, 3.45703125, 3.6484375, 3.83984375, 4.03125, 4.22265625, 4.4140625, 4.60546875, 4.796875, 4.98828125, 5.1796875, 5.37109375, 5.5625, 5.75390625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 7.0, 8.0, 16.0, 27.0, 21.0, 29.0, 29.0, 45.0, 73.0, 81.0, 120.0, 184.0, 199.0, 310.0, 427.0, 529.0, 821.0, 1146.0, 1659.0, 2558.0, 4046.0, 7591.0, 18686.0, 74731.0, 540695.0, 319602.0, 44396.0, 13493.0, 6135.0, 3455.0, 2245.0, 1485.0, 1020.0, 713.0, 528.0, 365.0, 279.0, 203.0, 163.0, 111.0, 86.0, 55.0, 56.0, 43.0, 28.0, 17.0, 8.0, 10.0, 6.0, 4.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.8984375, -4.7396240234375, -4.580810546875, -4.4219970703125, -4.26318359375, -4.1043701171875, -3.945556640625, -3.7867431640625, -3.6279296875, -3.4691162109375, -3.310302734375, -3.1514892578125, -2.99267578125, -2.8338623046875, -2.675048828125, -2.5162353515625, -2.357421875, -2.1986083984375, -2.039794921875, -1.8809814453125, -1.72216796875, -1.5633544921875, -1.404541015625, -1.2457275390625, -1.0869140625, -0.9281005859375, -0.769287109375, -0.6104736328125, -0.45166015625, -0.2928466796875, -0.134033203125, 0.0247802734375, 0.18359375, 0.3424072265625, 0.501220703125, 0.6600341796875, 0.81884765625, 0.9776611328125, 1.136474609375, 1.2952880859375, 1.4541015625, 1.6129150390625, 1.771728515625, 1.9305419921875, 2.08935546875, 2.2481689453125, 2.406982421875, 2.5657958984375, 2.724609375, 2.8834228515625, 3.042236328125, 3.2010498046875, 3.35986328125, 3.5186767578125, 3.677490234375, 3.8363037109375, 3.9951171875, 4.1539306640625, 4.312744140625, 4.4715576171875, 4.63037109375, 4.7891845703125, 4.947998046875, 5.1068115234375, 5.265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 7.0, 6.0, 4.0, 12.0, 13.0, 11.0, 10.0, 13.0, 20.0, 14.0, 30.0, 27.0, 32.0, 26.0, 32.0, 53.0, 39.0, 38.0, 40.0, 44.0, 1071.0, 45.0, 43.0, 42.0, 38.0, 42.0, 29.0, 35.0, 30.0, 35.0, 24.0, 26.0, 17.0, 19.0, 11.0, 11.0, 7.0, 5.0, 10.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9921875, -3.85760498046875, -3.7230224609375, -3.58843994140625, -3.453857421875, -3.31927490234375, -3.1846923828125, -3.05010986328125, -2.91552734375, -2.78094482421875, -2.6463623046875, -2.51177978515625, -2.377197265625, -2.24261474609375, -2.1080322265625, -1.97344970703125, -1.8388671875, -1.70428466796875, -1.5697021484375, -1.43511962890625, -1.300537109375, -1.16595458984375, -1.0313720703125, -0.89678955078125, -0.76220703125, -0.62762451171875, -0.4930419921875, -0.35845947265625, -0.223876953125, -0.08929443359375, 0.0452880859375, 0.17987060546875, 0.314453125, 0.44903564453125, 0.5836181640625, 0.71820068359375, 0.852783203125, 0.98736572265625, 1.1219482421875, 1.25653076171875, 1.39111328125, 1.52569580078125, 1.6602783203125, 1.79486083984375, 1.929443359375, 2.06402587890625, 2.1986083984375, 2.33319091796875, 2.4677734375, 2.60235595703125, 2.7369384765625, 2.87152099609375, 3.006103515625, 3.14068603515625, 3.2752685546875, 3.40985107421875, 3.54443359375, 3.67901611328125, 3.8135986328125, 3.94818115234375, 4.082763671875, 4.21734619140625, 4.3519287109375, 4.48651123046875, 4.62109375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 4.0, 10.0, 19.0, 27.0, 31.0, 57.0, 104.0, 155.0, 243.0, 481.0, 907.0, 1747.0, 3780.0, 9731.0, 40252.0, 920138.0, 1060202.0, 41469.0, 9928.0, 3907.0, 1736.0, 955.0, 498.0, 280.0, 162.0, 97.0, 66.0, 44.0, 44.0, 15.0, 8.0, 7.0, 6.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.740234375, -3.611297607421875, -3.48236083984375, -3.353424072265625, -3.2244873046875, -3.095550537109375, -2.96661376953125, -2.837677001953125, -2.708740234375, -2.579803466796875, -2.45086669921875, -2.321929931640625, -2.1929931640625, -2.064056396484375, -1.93511962890625, -1.806182861328125, -1.67724609375, -1.548309326171875, -1.41937255859375, -1.290435791015625, -1.1614990234375, -1.032562255859375, -0.90362548828125, -0.774688720703125, -0.645751953125, -0.516815185546875, -0.38787841796875, -0.258941650390625, -0.1300048828125, -0.001068115234375, 0.12786865234375, 0.256805419921875, 0.3857421875, 0.514678955078125, 0.64361572265625, 0.772552490234375, 0.9014892578125, 1.030426025390625, 1.15936279296875, 1.288299560546875, 1.417236328125, 1.546173095703125, 1.67510986328125, 1.804046630859375, 1.9329833984375, 2.061920166015625, 2.19085693359375, 2.319793701171875, 2.44873046875, 2.577667236328125, 2.70660400390625, 2.835540771484375, 2.9644775390625, 3.093414306640625, 3.22235107421875, 3.351287841796875, 3.480224609375, 3.609161376953125, 3.73809814453125, 3.867034912109375, 3.9959716796875, 4.124908447265625, 4.25384521484375, 4.382781982421875, 4.51171875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 4.0, 11.0, 10.0, 19.0, 23.0, 37.0, 83.0, 326.0, 251.0, 94.0, 45.0, 16.0, 14.0, 7.0, 3.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75927734375, -0.7354965209960938, -0.7117156982421875, -0.6879348754882812, -0.664154052734375, -0.6403732299804688, -0.6165924072265625, -0.5928115844726562, -0.56903076171875, -0.5452499389648438, -0.5214691162109375, -0.49768829345703125, -0.473907470703125, -0.45012664794921875, -0.4263458251953125, -0.40256500244140625, -0.3787841796875, -0.35500335693359375, -0.3312225341796875, -0.30744171142578125, -0.283660888671875, -0.25988006591796875, -0.2360992431640625, -0.21231842041015625, -0.18853759765625, -0.16475677490234375, -0.1409759521484375, -0.11719512939453125, -0.093414306640625, -0.06963348388671875, -0.0458526611328125, -0.02207183837890625, 0.001708984375, 0.02548980712890625, 0.0492706298828125, 0.07305145263671875, 0.096832275390625, 0.12061309814453125, 0.1443939208984375, 0.16817474365234375, 0.19195556640625, 0.21573638916015625, 0.2395172119140625, 0.26329803466796875, 0.287078857421875, 0.31085968017578125, 0.3346405029296875, 0.35842132568359375, 0.3822021484375, 0.40598297119140625, 0.4297637939453125, 0.45354461669921875, 0.477325439453125, 0.5011062622070312, 0.5248870849609375, 0.5486679077148438, 0.57244873046875, 0.5962295532226562, 0.6200103759765625, 0.6437911987304688, 0.667572021484375, 0.6913528442382812, 0.7151336669921875, 0.7389144897460938, 0.7626953125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 7.0, 10.0, 8.0, 20.0, 17.0, 30.0, 48.0, 115.0, 290.0, 6027.0, 1033036.0, 8333.0, 316.0, 116.0, 54.0, 32.0, 19.0, 14.0, 16.0, 9.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.125, -14.6600341796875, -14.195068359375, -13.7301025390625, -13.26513671875, -12.8001708984375, -12.335205078125, -11.8702392578125, -11.4052734375, -10.9403076171875, -10.475341796875, -10.0103759765625, -9.54541015625, -9.0804443359375, -8.615478515625, -8.1505126953125, -7.685546875, -7.2205810546875, -6.755615234375, -6.2906494140625, -5.82568359375, -5.3607177734375, -4.895751953125, -4.4307861328125, -3.9658203125, -3.5008544921875, -3.035888671875, -2.5709228515625, -2.10595703125, -1.6409912109375, -1.176025390625, -0.7110595703125, -0.24609375, 0.2188720703125, 0.683837890625, 1.1488037109375, 1.61376953125, 2.0787353515625, 2.543701171875, 3.0086669921875, 3.4736328125, 3.9385986328125, 4.403564453125, 4.8685302734375, 5.33349609375, 5.7984619140625, 6.263427734375, 6.7283935546875, 7.193359375, 7.6583251953125, 8.123291015625, 8.5882568359375, 9.05322265625, 9.5181884765625, 9.983154296875, 10.4481201171875, 10.9130859375, 11.3780517578125, 11.843017578125, 12.3079833984375, 12.77294921875, 13.2379150390625, 13.702880859375, 14.1678466796875, 14.6328125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 12.0, 83.0, 356.0, 458.0, 85.0, 17.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.847208023071289, -3.723372459411621, -3.599536895751953, -3.475701332092285, -3.351865530014038, -3.22802996635437, -3.104194402694702, -2.980358839035034, -2.856523036956787, -2.732687473297119, -2.608851909637451, -2.485016345977783, -2.361180543899536, -2.237344980239868, -2.1135094165802, -1.9896738529205322, -1.8658382892608643, -1.7420027256011963, -1.6181670427322388, -1.4943314790725708, -1.3704957962036133, -1.2466602325439453, -1.1228246688842773, -0.9989890456199646, -0.8751534223556519, -0.7513177990913391, -0.6274821758270264, -0.5036466121673584, -0.37981098890304565, -0.2559753656387329, -0.13213980197906494, -0.008304178714752197, 0.11553144454956055, 0.2393670529127121, 0.36320266127586365, 0.487038254737854, 0.6108738780021667, 0.7347095012664795, 0.8585450649261475, 0.9823806881904602, 1.106216311454773, 1.230051875114441, 1.3538875579833984, 1.4777231216430664, 1.6015586853027344, 1.725394368171692, 1.8492299318313599, 1.9730656147003174, 2.0969011783599854, 2.2207367420196533, 2.3445723056793213, 2.4684081077575684, 2.5922436714172363, 2.7160792350769043, 2.8399147987365723, 2.9637503623962402, 3.087585926055908, 3.211421489715576, 3.335257053375244, 3.459092617034912, 3.582928419113159, 3.706763982772827, 3.830599546432495, 3.954435110092163, 4.07827091217041]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 3.0, 2.0, 8.0, 4.0, 7.0, 6.0, 10.0, 12.0, 10.0, 10.0, 13.0, 17.0, 18.0, 11.0, 25.0, 31.0, 29.0, 32.0, 25.0, 35.0, 48.0, 34.0, 34.0, 43.0, 38.0, 45.0, 50.0, 42.0, 45.0, 30.0, 30.0, 31.0, 29.0, 30.0, 28.0, 19.0, 20.0, 17.0, 13.0, 16.0, 14.0, 6.0, 14.0, 4.0, 2.0, 3.0, 2.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7016700506210327, -0.679858386516571, -0.6580467224121094, -0.6362350583076477, -0.614423394203186, -0.5926117300987244, -0.5708000659942627, -0.548988401889801, -0.5271767377853394, -0.5053650736808777, -0.483553409576416, -0.46174174547195435, -0.4399300813674927, -0.418118417263031, -0.39630675315856934, -0.37449508905410767, -0.352683424949646, -0.3308717608451843, -0.30906009674072266, -0.287248432636261, -0.2654367685317993, -0.24362510442733765, -0.22181344032287598, -0.2000017762184143, -0.17819011211395264, -0.15637844800949097, -0.1345667839050293, -0.11275511980056763, -0.09094345569610596, -0.06913179159164429, -0.04732012748718262, -0.025508463382720947, -0.003696739673614502, 0.018114924430847168, 0.03992658853530884, 0.06173825263977051, 0.08354991674423218, 0.10536158084869385, 0.12717324495315552, 0.1489849090576172, 0.17079657316207886, 0.19260823726654053, 0.2144199013710022, 0.23623156547546387, 0.25804322957992554, 0.2798548936843872, 0.3016665577888489, 0.32347822189331055, 0.3452898859977722, 0.3671015501022339, 0.38891321420669556, 0.4107248783111572, 0.4325365424156189, 0.45434820652008057, 0.47615987062454224, 0.4979715347290039, 0.5197831988334656, 0.5415948629379272, 0.5634065270423889, 0.5852181911468506, 0.6070298552513123, 0.6288415193557739, 0.6506531834602356, 0.6724648475646973, 0.6942765116691589]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 10.0, 11.0, 10.0, 15.0, 23.0, 13.0, 19.0, 19.0, 32.0, 35.0, 39.0, 24.0, 34.0, 27.0, 39.0, 34.0, 40.0, 46.0, 44.0, 44.0, 40.0, 43.0, 39.0, 38.0, 34.0, 34.0, 34.0, 18.0, 29.0, 18.0, 22.0, 20.0, 14.0, 13.0, 7.0, 7.0, 1.0, 6.0, 8.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.59765625, -6.404296875, -6.2109375, -6.017578125, -5.82421875, -5.630859375, -5.4375, -5.244140625, -5.05078125, -4.857421875, -4.6640625, -4.470703125, -4.27734375, -4.083984375, -3.890625, -3.697265625, -3.50390625, -3.310546875, -3.1171875, -2.923828125, -2.73046875, -2.537109375, -2.34375, -2.150390625, -1.95703125, -1.763671875, -1.5703125, -1.376953125, -1.18359375, -0.990234375, -0.796875, -0.603515625, -0.41015625, -0.216796875, -0.0234375, 0.169921875, 0.36328125, 0.556640625, 0.75, 0.943359375, 1.13671875, 1.330078125, 1.5234375, 1.716796875, 1.91015625, 2.103515625, 2.296875, 2.490234375, 2.68359375, 2.876953125, 3.0703125, 3.263671875, 3.45703125, 3.650390625, 3.84375, 4.037109375, 4.23046875, 4.423828125, 4.6171875, 4.810546875, 5.00390625, 5.197265625, 5.390625, 5.583984375, 5.77734375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 17.0, 12.0, 17.0, 27.0, 35.0, 57.0, 86.0, 165.0, 241.0, 380.0, 725.0, 1159.0, 2117.0, 3901.0, 7478.0, 14131.0, 29171.0, 64845.0, 164561.0, 395674.0, 212379.0, 80313.0, 34790.0, 16968.0, 8865.0, 4663.0, 2505.0, 1371.0, 743.0, 418.0, 255.0, 188.0, 91.0, 60.0, 39.0, 21.0, 20.0, 15.0, 14.0, 6.0, 4.0, 4.0, 3.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.375, -8.12591552734375, -7.8768310546875, -7.62774658203125, -7.378662109375, -7.12957763671875, -6.8804931640625, -6.63140869140625, -6.38232421875, -6.13323974609375, -5.8841552734375, -5.63507080078125, -5.385986328125, -5.13690185546875, -4.8878173828125, -4.63873291015625, -4.3896484375, -4.14056396484375, -3.8914794921875, -3.64239501953125, -3.393310546875, -3.14422607421875, -2.8951416015625, -2.64605712890625, -2.39697265625, -2.14788818359375, -1.8988037109375, -1.64971923828125, -1.400634765625, -1.15155029296875, -0.9024658203125, -0.65338134765625, -0.404296875, -0.15521240234375, 0.0938720703125, 0.34295654296875, 0.592041015625, 0.84112548828125, 1.0902099609375, 1.33929443359375, 1.58837890625, 1.83746337890625, 2.0865478515625, 2.33563232421875, 2.584716796875, 2.83380126953125, 3.0828857421875, 3.33197021484375, 3.5810546875, 3.83013916015625, 4.0792236328125, 4.32830810546875, 4.577392578125, 4.82647705078125, 5.0755615234375, 5.32464599609375, 5.57373046875, 5.82281494140625, 6.0718994140625, 6.32098388671875, 6.570068359375, 6.81915283203125, 7.0682373046875, 7.31732177734375, 7.56640625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 3.0, 9.0, 7.0, 9.0, 11.0, 15.0, 22.0, 16.0, 11.0, 26.0, 23.0, 23.0, 33.0, 33.0, 53.0, 55.0, 67.0, 112.0, 219.0, 1403.0, 279.0, 129.0, 66.0, 53.0, 46.0, 46.0, 33.0, 36.0, 23.0, 30.0, 32.0, 19.0, 25.0, 15.0, 18.0, 9.0, 7.0, 4.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.75, -17.205078125, -16.66015625, -16.115234375, -15.5703125, -15.025390625, -14.48046875, -13.935546875, -13.390625, -12.845703125, -12.30078125, -11.755859375, -11.2109375, -10.666015625, -10.12109375, -9.576171875, -9.03125, -8.486328125, -7.94140625, -7.396484375, -6.8515625, -6.306640625, -5.76171875, -5.216796875, -4.671875, -4.126953125, -3.58203125, -3.037109375, -2.4921875, -1.947265625, -1.40234375, -0.857421875, -0.3125, 0.232421875, 0.77734375, 1.322265625, 1.8671875, 2.412109375, 2.95703125, 3.501953125, 4.046875, 4.591796875, 5.13671875, 5.681640625, 6.2265625, 6.771484375, 7.31640625, 7.861328125, 8.40625, 8.951171875, 9.49609375, 10.041015625, 10.5859375, 11.130859375, 11.67578125, 12.220703125, 12.765625, 13.310546875, 13.85546875, 14.400390625, 14.9453125, 15.490234375, 16.03515625, 16.580078125, 17.125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 7.0, 4.0, 10.0, 5.0, 17.0, 14.0, 30.0, 28.0, 34.0, 51.0, 72.0, 87.0, 102.0, 134.0, 246.0, 472.0, 1164.0, 6151.0, 119778.0, 2868042.0, 140159.0, 6576.0, 1235.0, 487.0, 216.0, 152.0, 105.0, 84.0, 42.0, 43.0, 28.0, 22.0, 32.0, 18.0, 15.0, 8.0, 6.0, 9.0, 4.0, 8.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.125, -33.97412109375, -32.8232421875, -31.67236328125, -30.521484375, -29.37060546875, -28.2197265625, -27.06884765625, -25.91796875, -24.76708984375, -23.6162109375, -22.46533203125, -21.314453125, -20.16357421875, -19.0126953125, -17.86181640625, -16.7109375, -15.56005859375, -14.4091796875, -13.25830078125, -12.107421875, -10.95654296875, -9.8056640625, -8.65478515625, -7.50390625, -6.35302734375, -5.2021484375, -4.05126953125, -2.900390625, -1.74951171875, -0.5986328125, 0.55224609375, 1.703125, 2.85400390625, 4.0048828125, 5.15576171875, 6.306640625, 7.45751953125, 8.6083984375, 9.75927734375, 10.91015625, 12.06103515625, 13.2119140625, 14.36279296875, 15.513671875, 16.66455078125, 17.8154296875, 18.96630859375, 20.1171875, 21.26806640625, 22.4189453125, 23.56982421875, 24.720703125, 25.87158203125, 27.0224609375, 28.17333984375, 29.32421875, 30.47509765625, 31.6259765625, 32.77685546875, 33.927734375, 35.07861328125, 36.2294921875, 37.38037109375, 38.53125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 27.0, 89.0, 181.0, 264.0, 239.0, 154.0, 42.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.67396545410156, -108.35453796386719, -106.03511047363281, -103.71568298339844, -101.39625549316406, -99.07682800292969, -96.75740051269531, -94.43797302246094, -92.11854553222656, -89.79911804199219, -87.47969055175781, -85.16026306152344, -82.84083557128906, -80.52140808105469, -78.20198059082031, -75.88255310058594, -73.5631332397461, -71.24370574951172, -68.92427825927734, -66.60485076904297, -64.2854232788086, -61.96599578857422, -59.64657211303711, -57.327144622802734, -55.00771713256836, -52.688289642333984, -50.36886215209961, -48.049434661865234, -45.730010986328125, -43.41058349609375, -41.091156005859375, -38.771728515625, -36.45230484008789, -34.132877349853516, -31.81344985961914, -29.4940242767334, -27.174596786499023, -24.85516929626465, -22.535743713378906, -20.21631622314453, -17.896888732910156, -15.577461242675781, -13.258034706115723, -10.938608169555664, -8.619180679321289, -6.299753189086914, -3.9803266525268555, -1.6609001159667969, 0.6585273742675781, 2.977954387664795, 5.297381401062012, 7.6168084144592285, 9.936235427856445, 12.25566291809082, 14.575089454650879, 16.894515991210938, 19.213943481445312, 21.533370971679688, 23.852798461914062, 26.172224044799805, 28.49165153503418, 30.811079025268555, 33.1305046081543, 35.44993209838867, 37.76935958862305]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 7.0, 6.0, 6.0, 10.0, 10.0, 17.0, 13.0, 16.0, 25.0, 14.0, 15.0, 27.0, 27.0, 29.0, 20.0, 33.0, 25.0, 36.0, 28.0, 41.0, 42.0, 40.0, 35.0, 35.0, 39.0, 38.0, 30.0, 35.0, 29.0, 34.0, 23.0, 25.0, 30.0, 21.0, 21.0, 22.0, 16.0, 17.0, 10.0, 15.0, 6.0, 4.0, 8.0, 4.0, 4.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-42.180118560791016, -40.8409309387207, -39.501747131347656, -38.162559509277344, -36.8233757019043, -35.484188079833984, -34.14500427246094, -32.805816650390625, -31.466630935668945, -30.127445220947266, -28.788259506225586, -27.449073791503906, -26.109886169433594, -24.770702362060547, -23.431514739990234, -22.092329025268555, -20.753143310546875, -19.413957595825195, -18.074771881103516, -16.735584259033203, -15.39639949798584, -14.05721378326416, -12.718027114868164, -11.378841400146484, -10.039655685424805, -8.700469970703125, -7.361283779144287, -6.022097587585449, -4.6829118728637695, -3.34372615814209, -2.0045394897460938, -0.6653537750244141, 0.6738357543945312, 2.01302170753479, 3.352207660675049, 4.691393852233887, 6.030579566955566, 7.369765281677246, 8.708951950073242, 10.048137664794922, 11.387323379516602, 12.726509094238281, 14.065694808959961, 15.404881477355957, 16.744068145751953, 18.083251953125, 19.422439575195312, 20.761625289916992, 22.100811004638672, 23.43999671936035, 24.77918243408203, 26.118370056152344, 27.45755386352539, 28.796741485595703, 30.135927200317383, 31.475112915039062, 32.814300537109375, 34.15348815917969, 35.492671966552734, 36.83185958862305, 38.171043395996094, 39.510231018066406, 40.84941864013672, 42.188602447509766, 43.52778625488281]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 6.0, 1.0, 5.0, 4.0, 6.0, 10.0, 11.0, 10.0, 9.0, 15.0, 7.0, 14.0, 16.0, 20.0, 20.0, 29.0, 33.0, 30.0, 40.0, 38.0, 37.0, 36.0, 43.0, 39.0, 40.0, 38.0, 32.0, 43.0, 43.0, 38.0, 27.0, 36.0, 30.0, 28.0, 25.0, 25.0, 21.0, 18.0, 17.0, 16.0, 16.0, 9.0, 7.0, 7.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-6.8828125, -6.68328857421875, -6.4837646484375, -6.28424072265625, -6.084716796875, -5.88519287109375, -5.6856689453125, -5.48614501953125, -5.28662109375, -5.08709716796875, -4.8875732421875, -4.68804931640625, -4.488525390625, -4.28900146484375, -4.0894775390625, -3.88995361328125, -3.6904296875, -3.49090576171875, -3.2913818359375, -3.09185791015625, -2.892333984375, -2.69281005859375, -2.4932861328125, -2.29376220703125, -2.09423828125, -1.89471435546875, -1.6951904296875, -1.49566650390625, -1.296142578125, -1.09661865234375, -0.8970947265625, -0.69757080078125, -0.498046875, -0.29852294921875, -0.0989990234375, 0.10052490234375, 0.300048828125, 0.49957275390625, 0.6990966796875, 0.89862060546875, 1.09814453125, 1.29766845703125, 1.4971923828125, 1.69671630859375, 1.896240234375, 2.09576416015625, 2.2952880859375, 2.49481201171875, 2.6943359375, 2.89385986328125, 3.0933837890625, 3.29290771484375, 3.492431640625, 3.69195556640625, 3.8914794921875, 4.09100341796875, 4.29052734375, 4.49005126953125, 4.6895751953125, 4.88909912109375, 5.088623046875, 5.28814697265625, 5.4876708984375, 5.68719482421875, 5.88671875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 11.0, 11.0, 14.0, 21.0, 20.0, 33.0, 49.0, 67.0, 102.0, 136.0, 231.0, 363.0, 534.0, 853.0, 1426.0, 2494.0, 4848.0, 9672.0, 21576.0, 56215.0, 213320.0, 1038171.0, 1996164.0, 638232.0, 135446.0, 40905.0, 16561.0, 7631.0, 3873.0, 2084.0, 1217.0, 714.0, 475.0, 274.0, 195.0, 117.0, 75.0, 52.0, 31.0, 19.0, 15.0, 14.0, 7.0, 5.0, 2.0, 4.0, 0.0, 1.0], "bins": [-14.6171875, -14.2359619140625, -13.854736328125, -13.4735107421875, -13.09228515625, -12.7110595703125, -12.329833984375, -11.9486083984375, -11.5673828125, -11.1861572265625, -10.804931640625, -10.4237060546875, -10.04248046875, -9.6612548828125, -9.280029296875, -8.8988037109375, -8.517578125, -8.1363525390625, -7.755126953125, -7.3739013671875, -6.99267578125, -6.6114501953125, -6.230224609375, -5.8489990234375, -5.4677734375, -5.0865478515625, -4.705322265625, -4.3240966796875, -3.94287109375, -3.5616455078125, -3.180419921875, -2.7991943359375, -2.41796875, -2.0367431640625, -1.655517578125, -1.2742919921875, -0.89306640625, -0.5118408203125, -0.130615234375, 0.2506103515625, 0.6318359375, 1.0130615234375, 1.394287109375, 1.7755126953125, 2.15673828125, 2.5379638671875, 2.919189453125, 3.3004150390625, 3.681640625, 4.0628662109375, 4.444091796875, 4.8253173828125, 5.20654296875, 5.5877685546875, 5.968994140625, 6.3502197265625, 6.7314453125, 7.1126708984375, 7.493896484375, 7.8751220703125, 8.25634765625, 8.6375732421875, 9.018798828125, 9.4000244140625, 9.78125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 5.0, 4.0, 10.0, 6.0, 20.0, 24.0, 33.0, 40.0, 57.0, 101.0, 127.0, 193.0, 286.0, 449.0, 572.0, 581.0, 503.0, 319.0, 215.0, 159.0, 110.0, 90.0, 48.0, 38.0, 22.0, 15.0, 16.0, 12.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-19.109375, -18.622314453125, -18.13525390625, -17.648193359375, -17.1611328125, -16.674072265625, -16.18701171875, -15.699951171875, -15.212890625, -14.725830078125, -14.23876953125, -13.751708984375, -13.2646484375, -12.777587890625, -12.29052734375, -11.803466796875, -11.31640625, -10.829345703125, -10.34228515625, -9.855224609375, -9.3681640625, -8.881103515625, -8.39404296875, -7.906982421875, -7.419921875, -6.932861328125, -6.44580078125, -5.958740234375, -5.4716796875, -4.984619140625, -4.49755859375, -4.010498046875, -3.5234375, -3.036376953125, -2.54931640625, -2.062255859375, -1.5751953125, -1.088134765625, -0.60107421875, -0.114013671875, 0.373046875, 0.860107421875, 1.34716796875, 1.834228515625, 2.3212890625, 2.808349609375, 3.29541015625, 3.782470703125, 4.26953125, 4.756591796875, 5.24365234375, 5.730712890625, 6.2177734375, 6.704833984375, 7.19189453125, 7.678955078125, 8.166015625, 8.653076171875, 9.14013671875, 9.627197265625, 10.1142578125, 10.601318359375, 11.08837890625, 11.575439453125, 12.0625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 13.0, 27.0, 28.0, 34.0, 51.0, 93.0, 176.0, 319.0, 720.0, 2210.0, 20557.0, 1184640.0, 2942876.0, 37621.0, 3279.0, 818.0, 356.0, 156.0, 93.0, 62.0, 39.0, 35.0, 23.0, 13.0, 10.0, 5.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.8125, -38.0888671875, -36.365234375, -34.6416015625, -32.91796875, -31.1943359375, -29.470703125, -27.7470703125, -26.0234375, -24.2998046875, -22.576171875, -20.8525390625, -19.12890625, -17.4052734375, -15.681640625, -13.9580078125, -12.234375, -10.5107421875, -8.787109375, -7.0634765625, -5.33984375, -3.6162109375, -1.892578125, -0.1689453125, 1.5546875, 3.2783203125, 5.001953125, 6.7255859375, 8.44921875, 10.1728515625, 11.896484375, 13.6201171875, 15.34375, 17.0673828125, 18.791015625, 20.5146484375, 22.23828125, 23.9619140625, 25.685546875, 27.4091796875, 29.1328125, 30.8564453125, 32.580078125, 34.3037109375, 36.02734375, 37.7509765625, 39.474609375, 41.1982421875, 42.921875, 44.6455078125, 46.369140625, 48.0927734375, 49.81640625, 51.5400390625, 53.263671875, 54.9873046875, 56.7109375, 58.4345703125, 60.158203125, 61.8818359375, 63.60546875, 65.3291015625, 67.052734375, 68.7763671875, 70.5]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 18.0, 202.0, 583.0, 194.0, 18.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-503.06396484375, -491.7706604003906, -480.4773864746094, -469.18408203125, -457.8907775878906, -446.59747314453125, -435.30419921875, -424.0108947753906, -412.71759033203125, -401.4242858886719, -390.1310119628906, -378.83770751953125, -367.5444030761719, -356.2510986328125, -344.95782470703125, -333.6645202636719, -322.3712463378906, -311.07794189453125, -299.78466796875, -288.4913635253906, -277.19805908203125, -265.90478515625, -254.61148071289062, -243.31817626953125, -232.02488708496094, -220.73159790039062, -209.43829345703125, -198.14500427246094, -186.85171508789062, -175.55841064453125, -164.26512145996094, -152.97183227539062, -141.67855834960938, -130.38526916503906, -119.09196472167969, -107.79867553710938, -96.50537872314453, -85.21208190917969, -73.91879272460938, -62.62549591064453, -51.33219909667969, -40.038902282714844, -28.745609283447266, -17.452316284179688, -6.159019470214844, 5.13427734375, 16.427566528320312, 27.720863342285156, 39.01416015625, 50.307456970214844, 61.60074996948242, 72.89404296875, 84.18733978271484, 95.48063659667969, 106.77392578125, 118.06722259521484, 129.3605194091797, 140.65380859375, 151.94711303710938, 163.2404022216797, 174.53369140625, 185.82699584960938, 197.1202850341797, 208.41357421875, 219.70687866210938]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 7.0, 9.0, 13.0, 7.0, 13.0, 18.0, 15.0, 26.0, 38.0, 44.0, 46.0, 47.0, 39.0, 50.0, 63.0, 53.0, 68.0, 63.0, 40.0, 51.0, 43.0, 47.0, 33.0, 42.0, 27.0, 20.0, 21.0, 19.0, 10.0, 9.0, 8.0, 7.0, 5.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.62851333618164, -52.81309127807617, -50.9976692199707, -49.182247161865234, -47.36682891845703, -45.55140686035156, -43.735984802246094, -41.920562744140625, -40.105140686035156, -38.28971862792969, -36.47429656982422, -34.65887451171875, -32.84345245361328, -31.028032302856445, -29.21261215209961, -27.39719009399414, -25.581768035888672, -23.766345977783203, -21.950923919677734, -20.1355037689209, -18.32008171081543, -16.50465965270996, -14.689238548278809, -12.873817443847656, -11.058395385742188, -9.242973327636719, -7.427552223205566, -5.612130641937256, -3.7967090606689453, -1.9812870025634766, -0.16586589813232422, 1.6495552062988281, 3.4649734497070312, 5.280395030975342, 7.095816612243652, 8.911237716674805, 10.726659774780273, 12.542081832885742, 14.357502937316895, 16.172924041748047, 17.988346099853516, 19.803768157958984, 21.619190216064453, 23.43461036682129, 25.250032424926758, 27.065454483032227, 28.880874633789062, 30.69629669189453, 32.51171875, 34.32714080810547, 36.14256286621094, 37.957984924316406, 39.773406982421875, 41.588829040527344, 43.40424728393555, 45.219669342041016, 47.035091400146484, 48.85051345825195, 50.66593551635742, 52.48135757446289, 54.296775817871094, 56.11219787597656, 57.92761993408203, 59.7430419921875, 61.55846405029297]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 2.0, 5.0, 4.0, 10.0, 7.0, 13.0, 14.0, 12.0, 16.0, 19.0, 17.0, 30.0, 34.0, 24.0, 42.0, 37.0, 41.0, 36.0, 36.0, 33.0, 51.0, 54.0, 54.0, 43.0, 48.0, 49.0, 35.0, 35.0, 32.0, 19.0, 27.0, 18.0, 29.0, 21.0, 8.0, 13.0, 10.0, 13.0, 8.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.80078125, -7.583984375, -7.3671875, -7.150390625, -6.93359375, -6.716796875, -6.5, -6.283203125, -6.06640625, -5.849609375, -5.6328125, -5.416015625, -5.19921875, -4.982421875, -4.765625, -4.548828125, -4.33203125, -4.115234375, -3.8984375, -3.681640625, -3.46484375, -3.248046875, -3.03125, -2.814453125, -2.59765625, -2.380859375, -2.1640625, -1.947265625, -1.73046875, -1.513671875, -1.296875, -1.080078125, -0.86328125, -0.646484375, -0.4296875, -0.212890625, 0.00390625, 0.220703125, 0.4375, 0.654296875, 0.87109375, 1.087890625, 1.3046875, 1.521484375, 1.73828125, 1.955078125, 2.171875, 2.388671875, 2.60546875, 2.822265625, 3.0390625, 3.255859375, 3.47265625, 3.689453125, 3.90625, 4.123046875, 4.33984375, 4.556640625, 4.7734375, 4.990234375, 5.20703125, 5.423828125, 5.640625, 5.857421875, 6.07421875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 10.0, 16.0, 13.0, 26.0, 38.0, 45.0, 71.0, 104.0, 163.0, 244.0, 353.0, 553.0, 852.0, 1310.0, 2044.0, 3316.0, 5421.0, 9084.0, 15408.0, 26087.0, 44885.0, 76397.0, 124390.0, 177881.0, 189487.0, 144980.0, 92054.0, 54506.0, 31971.0, 18686.0, 10725.0, 6618.0, 3877.0, 2448.0, 1552.0, 960.0, 637.0, 431.0, 308.0, 204.0, 122.0, 81.0, 67.0, 44.0, 25.0, 24.0, 12.0, 8.0, 9.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1533203125, -1.1163330078125, -1.079345703125, -1.0423583984375, -1.00537109375, -0.9683837890625, -0.931396484375, -0.8944091796875, -0.857421875, -0.8204345703125, -0.783447265625, -0.7464599609375, -0.70947265625, -0.6724853515625, -0.635498046875, -0.5985107421875, -0.5615234375, -0.5245361328125, -0.487548828125, -0.4505615234375, -0.41357421875, -0.3765869140625, -0.339599609375, -0.3026123046875, -0.265625, -0.2286376953125, -0.191650390625, -0.1546630859375, -0.11767578125, -0.0806884765625, -0.043701171875, -0.0067138671875, 0.0302734375, 0.0672607421875, 0.104248046875, 0.1412353515625, 0.17822265625, 0.2152099609375, 0.252197265625, 0.2891845703125, 0.326171875, 0.3631591796875, 0.400146484375, 0.4371337890625, 0.47412109375, 0.5111083984375, 0.548095703125, 0.5850830078125, 0.6220703125, 0.6590576171875, 0.696044921875, 0.7330322265625, 0.77001953125, 0.8070068359375, 0.843994140625, 0.8809814453125, 0.91796875, 0.9549560546875, 0.991943359375, 1.0289306640625, 1.06591796875, 1.1029052734375, 1.139892578125, 1.1768798828125, 1.2138671875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 8.0, 5.0, 8.0, 15.0, 10.0, 12.0, 9.0, 13.0, 21.0, 27.0, 19.0, 35.0, 24.0, 20.0, 31.0, 36.0, 38.0, 37.0, 48.0, 37.0, 1078.0, 47.0, 30.0, 40.0, 42.0, 29.0, 41.0, 31.0, 31.0, 25.0, 31.0, 28.0, 22.0, 20.0, 10.0, 17.0, 4.0, 11.0, 6.0, 8.0, 7.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-4.38671875, -4.2550048828125, -4.123291015625, -3.9915771484375, -3.85986328125, -3.7281494140625, -3.596435546875, -3.4647216796875, -3.3330078125, -3.2012939453125, -3.069580078125, -2.9378662109375, -2.80615234375, -2.6744384765625, -2.542724609375, -2.4110107421875, -2.279296875, -2.1475830078125, -2.015869140625, -1.8841552734375, -1.75244140625, -1.6207275390625, -1.489013671875, -1.3572998046875, -1.2255859375, -1.0938720703125, -0.962158203125, -0.8304443359375, -0.69873046875, -0.5670166015625, -0.435302734375, -0.3035888671875, -0.171875, -0.0401611328125, 0.091552734375, 0.2232666015625, 0.35498046875, 0.4866943359375, 0.618408203125, 0.7501220703125, 0.8818359375, 1.0135498046875, 1.145263671875, 1.2769775390625, 1.40869140625, 1.5404052734375, 1.672119140625, 1.8038330078125, 1.935546875, 2.0672607421875, 2.198974609375, 2.3306884765625, 2.46240234375, 2.5941162109375, 2.725830078125, 2.8575439453125, 2.9892578125, 3.1209716796875, 3.252685546875, 3.3843994140625, 3.51611328125, 3.6478271484375, 3.779541015625, 3.9112548828125, 4.04296875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 8.0, 3.0, 6.0, 8.0, 16.0, 20.0, 30.0, 44.0, 64.0, 79.0, 123.0, 179.0, 255.0, 426.0, 546.0, 894.0, 1347.0, 2039.0, 3441.0, 5387.0, 8799.0, 14805.0, 25890.0, 46115.0, 81466.0, 151980.0, 389320.0, 861008.0, 236003.0, 114906.0, 64132.0, 36255.0, 20444.0, 11889.0, 6981.0, 4241.0, 2784.0, 1750.0, 1157.0, 708.0, 490.0, 351.0, 236.0, 160.0, 98.0, 80.0, 44.0, 50.0, 21.0, 25.0, 14.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.71484375, -0.6927032470703125, -0.670562744140625, -0.6484222412109375, -0.62628173828125, -0.6041412353515625, -0.582000732421875, -0.5598602294921875, -0.5377197265625, -0.5155792236328125, -0.493438720703125, -0.4712982177734375, -0.44915771484375, -0.4270172119140625, -0.404876708984375, -0.3827362060546875, -0.360595703125, -0.3384552001953125, -0.316314697265625, -0.2941741943359375, -0.27203369140625, -0.2498931884765625, -0.227752685546875, -0.2056121826171875, -0.1834716796875, -0.1613311767578125, -0.139190673828125, -0.1170501708984375, -0.09490966796875, -0.0727691650390625, -0.050628662109375, -0.0284881591796875, -0.00634765625, 0.0157928466796875, 0.037933349609375, 0.0600738525390625, 0.08221435546875, 0.1043548583984375, 0.126495361328125, 0.1486358642578125, 0.1707763671875, 0.1929168701171875, 0.215057373046875, 0.2371978759765625, 0.25933837890625, 0.2814788818359375, 0.303619384765625, 0.3257598876953125, 0.347900390625, 0.3700408935546875, 0.392181396484375, 0.4143218994140625, 0.43646240234375, 0.4586029052734375, 0.480743408203125, 0.5028839111328125, 0.5250244140625, 0.5471649169921875, 0.569305419921875, 0.5914459228515625, 0.61358642578125, 0.6357269287109375, 0.657867431640625, 0.6800079345703125, 0.7021484375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 3.0, 9.0, 6.0, 12.0, 7.0, 8.0, 19.0, 21.0, 29.0, 42.0, 43.0, 49.0, 65.0, 64.0, 76.0, 90.0, 66.0, 55.0, 56.0, 36.0, 45.0, 33.0, 21.0, 23.0, 15.0, 19.0, 21.0, 15.0, 10.0, 7.0, 5.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1981201171875, -0.19153594970703125, -0.1849517822265625, -0.17836761474609375, -0.171783447265625, -0.16519927978515625, -0.1586151123046875, -0.15203094482421875, -0.14544677734375, -0.13886260986328125, -0.1322784423828125, -0.12569427490234375, -0.119110107421875, -0.11252593994140625, -0.1059417724609375, -0.09935760498046875, -0.0927734375, -0.08618927001953125, -0.0796051025390625, -0.07302093505859375, -0.066436767578125, -0.05985260009765625, -0.0532684326171875, -0.04668426513671875, -0.04010009765625, -0.03351593017578125, -0.0269317626953125, -0.02034759521484375, -0.013763427734375, -0.00717926025390625, -0.0005950927734375, 0.00598907470703125, 0.0125732421875, 0.01915740966796875, 0.0257415771484375, 0.03232574462890625, 0.038909912109375, 0.04549407958984375, 0.0520782470703125, 0.05866241455078125, 0.06524658203125, 0.07183074951171875, 0.0784149169921875, 0.08499908447265625, 0.091583251953125, 0.09816741943359375, 0.1047515869140625, 0.11133575439453125, 0.117919921875, 0.12450408935546875, 0.1310882568359375, 0.13767242431640625, 0.144256591796875, 0.15084075927734375, 0.1574249267578125, 0.16400909423828125, 0.17059326171875, 0.17717742919921875, 0.1837615966796875, 0.19034576416015625, 0.196929931640625, 0.20351409912109375, 0.2100982666015625, 0.21668243408203125, 0.2232666015625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 2.0, 6.0, 14.0, 11.0, 13.0, 16.0, 24.0, 25.0, 34.0, 40.0, 46.0, 61.0, 109.0, 193.0, 551.0, 13663.0, 1024664.0, 8167.0, 423.0, 138.0, 104.0, 67.0, 49.0, 35.0, 21.0, 14.0, 12.0, 14.0, 7.0, 5.0, 7.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.171875, -5.01251220703125, -4.8531494140625, -4.69378662109375, -4.534423828125, -4.37506103515625, -4.2156982421875, -4.05633544921875, -3.89697265625, -3.73760986328125, -3.5782470703125, -3.41888427734375, -3.259521484375, -3.10015869140625, -2.9407958984375, -2.78143310546875, -2.6220703125, -2.46270751953125, -2.3033447265625, -2.14398193359375, -1.984619140625, -1.82525634765625, -1.6658935546875, -1.50653076171875, -1.34716796875, -1.18780517578125, -1.0284423828125, -0.86907958984375, -0.709716796875, -0.55035400390625, -0.3909912109375, -0.23162841796875, -0.072265625, 0.08709716796875, 0.2464599609375, 0.40582275390625, 0.565185546875, 0.72454833984375, 0.8839111328125, 1.04327392578125, 1.20263671875, 1.36199951171875, 1.5213623046875, 1.68072509765625, 1.840087890625, 1.99945068359375, 2.1588134765625, 2.31817626953125, 2.4775390625, 2.63690185546875, 2.7962646484375, 2.95562744140625, 3.114990234375, 3.27435302734375, 3.4337158203125, 3.59307861328125, 3.75244140625, 3.91180419921875, 4.0711669921875, 4.23052978515625, 4.389892578125, 4.54925537109375, 4.7086181640625, 4.86798095703125, 5.02734375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 7.0, 38.0, 128.0, 288.0, 308.0, 164.0, 58.0, 19.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2116115540266037, -0.1819620430469513, -0.1523125171661377, -0.12266300618648529, -0.09301348775625229, -0.06336396932601929, -0.03371445834636688, -0.004064932465553284, 0.02558457851409912, 0.05523409694433212, 0.08488361537456512, 0.11453312635421753, 0.14418265223503113, 0.17383216321468353, 0.20348167419433594, 0.23313120007514954, 0.26278072595596313, 0.29243025183677673, 0.32207974791526794, 0.35172927379608154, 0.38137879967689514, 0.41102832555770874, 0.44067782163619995, 0.47032734751701355, 0.49997684359550476, 0.5296263694763184, 0.5592758655548096, 0.5889253616333008, 0.6185749173164368, 0.648224413394928, 0.677873969078064, 0.7075234651565552, 0.7371730208396912, 0.7668225169181824, 0.7964720726013184, 0.8261215686798096, 0.8557710647583008, 0.8854206204414368, 0.915070116519928, 0.944719672203064, 0.9743691682815552, 1.0040186643600464, 1.0336681604385376, 1.0633177757263184, 1.0929672718048096, 1.1226167678833008, 1.152266263961792, 1.1819157600402832, 1.2115652561187744, 1.2412147521972656, 1.2708642482757568, 1.300513744354248, 1.3301633596420288, 1.35981285572052, 1.3894623517990112, 1.4191118478775024, 1.4487614631652832, 1.4784109592437744, 1.5080604553222656, 1.5377099514007568, 1.5673595666885376, 1.5970090627670288, 1.62665855884552, 1.6563080549240112, 1.6859575510025024]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 5.0, 2.0, 5.0, 5.0, 6.0, 5.0, 14.0, 14.0, 15.0, 23.0, 21.0, 28.0, 17.0, 24.0, 26.0, 25.0, 41.0, 45.0, 49.0, 50.0, 40.0, 35.0, 39.0, 49.0, 32.0, 38.0, 34.0, 38.0, 37.0, 28.0, 33.0, 37.0, 21.0, 16.0, 17.0, 11.0, 15.0, 12.0, 9.0, 10.0, 4.0, 9.0, 6.0, 6.0, 3.0, 0.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2594142556190491, -0.25147873163223267, -0.24354323744773865, -0.23560771346092224, -0.22767220437526703, -0.21973669528961182, -0.2118011713027954, -0.2038656622171402, -0.19593015313148499, -0.18799464404582977, -0.18005913496017456, -0.17212361097335815, -0.16418810188770294, -0.15625259280204773, -0.14831706881523132, -0.1403815597295761, -0.1324460506439209, -0.12451054155826569, -0.11657502502202988, -0.10863950848579407, -0.10070399940013885, -0.09276849031448364, -0.08483297377824783, -0.07689745724201202, -0.06896194815635681, -0.0610264353454113, -0.05309092253446579, -0.04515540972352028, -0.03721989691257477, -0.029284384101629257, -0.021348871290683746, -0.013413358479738235, -0.005477845668792725, 0.0024576671421527863, 0.010393179953098297, 0.018328692764043808, 0.02626420557498932, 0.03419971838593483, 0.04213523119688034, 0.05007074400782585, 0.05800625681877136, 0.06594176590442657, 0.07387728244066238, 0.0818127989768982, 0.0897483080625534, 0.09768381714820862, 0.10561933368444443, 0.11355485022068024, 0.12149035930633545, 0.12942586839199066, 0.13736137747764587, 0.14529690146446228, 0.1532324105501175, 0.1611679196357727, 0.1691034436225891, 0.17703895270824432, 0.18497446179389954, 0.19290997087955475, 0.20084547996520996, 0.20878100395202637, 0.21671651303768158, 0.2246520221233368, 0.2325875461101532, 0.2405230551958084, 0.24845856428146362]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 5.0, 2.0, 3.0, 14.0, 14.0, 17.0, 8.0, 20.0, 24.0, 23.0, 18.0, 26.0, 33.0, 32.0, 41.0, 35.0, 33.0, 48.0, 47.0, 56.0, 37.0, 51.0, 41.0, 41.0, 38.0, 39.0, 41.0, 28.0, 39.0, 13.0, 21.0, 15.0, 17.0, 22.0, 14.0, 14.0, 8.0, 7.0, 7.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-7.7890625, -7.5770263671875, -7.364990234375, -7.1529541015625, -6.94091796875, -6.7288818359375, -6.516845703125, -6.3048095703125, -6.0927734375, -5.8807373046875, -5.668701171875, -5.4566650390625, -5.24462890625, -5.0325927734375, -4.820556640625, -4.6085205078125, -4.396484375, -4.1844482421875, -3.972412109375, -3.7603759765625, -3.54833984375, -3.3363037109375, -3.124267578125, -2.9122314453125, -2.7001953125, -2.4881591796875, -2.276123046875, -2.0640869140625, -1.85205078125, -1.6400146484375, -1.427978515625, -1.2159423828125, -1.00390625, -0.7918701171875, -0.579833984375, -0.3677978515625, -0.15576171875, 0.0562744140625, 0.268310546875, 0.4803466796875, 0.6923828125, 0.9044189453125, 1.116455078125, 1.3284912109375, 1.54052734375, 1.7525634765625, 1.964599609375, 2.1766357421875, 2.388671875, 2.6007080078125, 2.812744140625, 3.0247802734375, 3.23681640625, 3.4488525390625, 3.660888671875, 3.8729248046875, 4.0849609375, 4.2969970703125, 4.509033203125, 4.7210693359375, 4.93310546875, 5.1451416015625, 5.357177734375, 5.5692138671875, 5.78125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 11.0, 9.0, 13.0, 19.0, 28.0, 45.0, 86.0, 110.0, 143.0, 240.0, 300.0, 408.0, 608.0, 864.0, 1274.0, 1902.0, 2816.0, 4461.0, 6917.0, 11868.0, 21206.0, 43084.0, 105251.0, 252957.0, 310980.0, 155030.0, 60997.0, 27863.0, 14798.0, 8596.0, 5273.0, 3368.0, 2218.0, 1407.0, 1048.0, 726.0, 480.0, 359.0, 221.0, 180.0, 134.0, 73.0, 57.0, 34.0, 27.0, 19.0, 12.0, 20.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.5078125, -7.250732421875, -6.99365234375, -6.736572265625, -6.4794921875, -6.222412109375, -5.96533203125, -5.708251953125, -5.451171875, -5.194091796875, -4.93701171875, -4.679931640625, -4.4228515625, -4.165771484375, -3.90869140625, -3.651611328125, -3.39453125, -3.137451171875, -2.88037109375, -2.623291015625, -2.3662109375, -2.109130859375, -1.85205078125, -1.594970703125, -1.337890625, -1.080810546875, -0.82373046875, -0.566650390625, -0.3095703125, -0.052490234375, 0.20458984375, 0.461669921875, 0.71875, 0.975830078125, 1.23291015625, 1.489990234375, 1.7470703125, 2.004150390625, 2.26123046875, 2.518310546875, 2.775390625, 3.032470703125, 3.28955078125, 3.546630859375, 3.8037109375, 4.060791015625, 4.31787109375, 4.574951171875, 4.83203125, 5.089111328125, 5.34619140625, 5.603271484375, 5.8603515625, 6.117431640625, 6.37451171875, 6.631591796875, 6.888671875, 7.145751953125, 7.40283203125, 7.659912109375, 7.9169921875, 8.174072265625, 8.43115234375, 8.688232421875, 8.9453125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 3.0, 3.0, 5.0, 8.0, 5.0, 6.0, 7.0, 9.0, 12.0, 9.0, 14.0, 13.0, 14.0, 22.0, 16.0, 21.0, 24.0, 34.0, 38.0, 34.0, 44.0, 54.0, 80.0, 129.0, 215.0, 1313.0, 251.0, 168.0, 79.0, 65.0, 52.0, 38.0, 32.0, 21.0, 23.0, 34.0, 16.0, 21.0, 20.0, 20.0, 14.0, 10.0, 9.0, 9.0, 7.0, 6.0, 3.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-17.34375, -16.81298828125, -16.2822265625, -15.75146484375, -15.220703125, -14.68994140625, -14.1591796875, -13.62841796875, -13.09765625, -12.56689453125, -12.0361328125, -11.50537109375, -10.974609375, -10.44384765625, -9.9130859375, -9.38232421875, -8.8515625, -8.32080078125, -7.7900390625, -7.25927734375, -6.728515625, -6.19775390625, -5.6669921875, -5.13623046875, -4.60546875, -4.07470703125, -3.5439453125, -3.01318359375, -2.482421875, -1.95166015625, -1.4208984375, -0.89013671875, -0.359375, 0.17138671875, 0.7021484375, 1.23291015625, 1.763671875, 2.29443359375, 2.8251953125, 3.35595703125, 3.88671875, 4.41748046875, 4.9482421875, 5.47900390625, 6.009765625, 6.54052734375, 7.0712890625, 7.60205078125, 8.1328125, 8.66357421875, 9.1943359375, 9.72509765625, 10.255859375, 10.78662109375, 11.3173828125, 11.84814453125, 12.37890625, 12.90966796875, 13.4404296875, 13.97119140625, 14.501953125, 15.03271484375, 15.5634765625, 16.09423828125, 16.625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 8.0, 12.0, 11.0, 13.0, 22.0, 24.0, 30.0, 34.0, 33.0, 69.0, 90.0, 137.0, 243.0, 520.0, 1166.0, 3216.0, 11424.0, 72749.0, 1974252.0, 1023341.0, 45042.0, 8466.0, 2631.0, 1037.0, 418.0, 203.0, 128.0, 83.0, 68.0, 46.0, 30.0, 26.0, 24.0, 19.0, 14.0, 15.0, 5.0, 14.0, 5.0, 6.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.40625, -22.623291015625, -21.84033203125, -21.057373046875, -20.2744140625, -19.491455078125, -18.70849609375, -17.925537109375, -17.142578125, -16.359619140625, -15.57666015625, -14.793701171875, -14.0107421875, -13.227783203125, -12.44482421875, -11.661865234375, -10.87890625, -10.095947265625, -9.31298828125, -8.530029296875, -7.7470703125, -6.964111328125, -6.18115234375, -5.398193359375, -4.615234375, -3.832275390625, -3.04931640625, -2.266357421875, -1.4833984375, -0.700439453125, 0.08251953125, 0.865478515625, 1.6484375, 2.431396484375, 3.21435546875, 3.997314453125, 4.7802734375, 5.563232421875, 6.34619140625, 7.129150390625, 7.912109375, 8.695068359375, 9.47802734375, 10.260986328125, 11.0439453125, 11.826904296875, 12.60986328125, 13.392822265625, 14.17578125, 14.958740234375, 15.74169921875, 16.524658203125, 17.3076171875, 18.090576171875, 18.87353515625, 19.656494140625, 20.439453125, 21.222412109375, 22.00537109375, 22.788330078125, 23.5712890625, 24.354248046875, 25.13720703125, 25.920166015625, 26.703125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 11.0, 12.0, 24.0, 30.0, 57.0, 87.0, 118.0, 112.0, 146.0, 102.0, 98.0, 82.0, 56.0, 26.0, 19.0, 13.0, 5.0, 4.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.635294914245605, -14.387138366699219, -13.138980865478516, -11.890824317932129, -10.642667770385742, -9.394511222839355, -8.146354675292969, -6.898197174072266, -5.650040626525879, -4.401884078979492, -3.1537270545959473, -1.9055702686309814, -0.6574134826660156, 0.5907430648803711, 1.838900089263916, 3.087057113647461, 4.335213661193848, 5.583370208740234, 6.831527233123779, 8.079684257507324, 9.327840805053711, 10.575997352600098, 11.824153900146484, 13.072311401367188, 14.320467948913574, 15.568624496459961, 16.816781997680664, 18.064937591552734, 19.313095092773438, 20.56125259399414, 21.80940818786621, 23.057565689086914, 24.30572509765625, 25.553882598876953, 26.802038192749023, 28.050195693969727, 29.298351287841797, 30.5465087890625, 31.794666290283203, 33.042823791503906, 34.290977478027344, 35.53913497924805, 36.78729248046875, 38.03544616699219, 39.28360366821289, 40.531761169433594, 41.7799186706543, 43.028076171875, 44.2762336730957, 45.524391174316406, 46.77254867553711, 48.02070236206055, 49.26885986328125, 50.51701736450195, 51.765174865722656, 53.01333236694336, 54.26148986816406, 55.509647369384766, 56.75780487060547, 58.005958557128906, 59.25411605834961, 60.50227355957031, 61.750431060791016, 62.99858856201172, 64.24674224853516]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 4.0, 10.0, 8.0, 12.0, 12.0, 14.0, 11.0, 17.0, 15.0, 18.0, 23.0, 19.0, 20.0, 37.0, 26.0, 23.0, 43.0, 40.0, 36.0, 46.0, 40.0, 32.0, 42.0, 31.0, 33.0, 37.0, 40.0, 28.0, 26.0, 21.0, 32.0, 29.0, 19.0, 20.0, 26.0, 19.0, 15.0, 13.0, 8.0, 15.0, 5.0, 7.0, 3.0, 8.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-43.75348663330078, -42.29636001586914, -40.839229583740234, -39.382102966308594, -37.92497634887695, -36.46784591674805, -35.010719299316406, -33.5535888671875, -32.09646224975586, -30.639333724975586, -29.182207107543945, -27.725078582763672, -26.2679500579834, -24.810821533203125, -23.353694915771484, -21.89656639099121, -20.43943977355957, -18.982311248779297, -17.525184631347656, -16.068056106567383, -14.61092758178711, -13.153800010681152, -11.696672439575195, -10.239543914794922, -8.782416343688965, -7.32528829574585, -5.868160247802734, -4.411032676696777, -2.953904628753662, -1.4967765808105469, -0.039649009704589844, 1.4174795150756836, 2.8746070861816406, 4.331735134124756, 5.788863182067871, 7.245990753173828, 8.703119277954102, 10.160246849060059, 11.617374420166016, 13.074502944946289, 14.531630516052246, 15.988758087158203, 17.445886611938477, 18.90301513671875, 20.36014175415039, 21.817270278930664, 23.274398803710938, 24.731525421142578, 26.18865394592285, 27.645782470703125, 29.102909088134766, 30.56003761291504, 32.01716613769531, 33.47429275512695, 34.931419372558594, 36.3885498046875, 37.84567642211914, 39.30280303955078, 40.75993347167969, 42.21706008911133, 43.67418670654297, 45.131317138671875, 46.588443756103516, 48.045570373535156, 49.50270080566406]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 3.0, 8.0, 4.0, 4.0, 6.0, 21.0, 12.0, 8.0, 16.0, 19.0, 30.0, 16.0, 24.0, 33.0, 31.0, 27.0, 37.0, 36.0, 32.0, 37.0, 34.0, 33.0, 49.0, 44.0, 49.0, 46.0, 50.0, 28.0, 34.0, 39.0, 28.0, 26.0, 25.0, 19.0, 19.0, 14.0, 13.0, 7.0, 6.0, 8.0, 10.0, 7.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.91796875, -6.71356201171875, -6.5091552734375, -6.30474853515625, -6.100341796875, -5.89593505859375, -5.6915283203125, -5.48712158203125, -5.28271484375, -5.07830810546875, -4.8739013671875, -4.66949462890625, -4.465087890625, -4.26068115234375, -4.0562744140625, -3.85186767578125, -3.6474609375, -3.44305419921875, -3.2386474609375, -3.03424072265625, -2.829833984375, -2.62542724609375, -2.4210205078125, -2.21661376953125, -2.01220703125, -1.80780029296875, -1.6033935546875, -1.39898681640625, -1.194580078125, -0.99017333984375, -0.7857666015625, -0.58135986328125, -0.376953125, -0.17254638671875, 0.0318603515625, 0.23626708984375, 0.440673828125, 0.64508056640625, 0.8494873046875, 1.05389404296875, 1.25830078125, 1.46270751953125, 1.6671142578125, 1.87152099609375, 2.075927734375, 2.28033447265625, 2.4847412109375, 2.68914794921875, 2.8935546875, 3.09796142578125, 3.3023681640625, 3.50677490234375, 3.711181640625, 3.91558837890625, 4.1199951171875, 4.32440185546875, 4.52880859375, 4.73321533203125, 4.9376220703125, 5.14202880859375, 5.346435546875, 5.55084228515625, 5.7552490234375, 5.95965576171875, 6.1640625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 8.0, 5.0, 9.0, 15.0, 11.0, 15.0, 21.0, 40.0, 29.0, 52.0, 54.0, 81.0, 103.0, 134.0, 212.0, 293.0, 451.0, 795.0, 1513.0, 2886.0, 6571.0, 16374.0, 55151.0, 289364.0, 1968241.0, 1560787.0, 221247.0, 44754.0, 13735.0, 5408.0, 2520.0, 1284.0, 738.0, 417.0, 284.0, 154.0, 121.0, 99.0, 60.0, 40.0, 37.0, 41.0, 26.0, 26.0, 17.0, 10.0, 13.0, 14.0, 4.0, 4.0, 4.0, 2.0, 4.0, 3.0], "bins": [-15.3515625, -14.9119873046875, -14.472412109375, -14.0328369140625, -13.59326171875, -13.1536865234375, -12.714111328125, -12.2745361328125, -11.8349609375, -11.3953857421875, -10.955810546875, -10.5162353515625, -10.07666015625, -9.6370849609375, -9.197509765625, -8.7579345703125, -8.318359375, -7.8787841796875, -7.439208984375, -6.9996337890625, -6.56005859375, -6.1204833984375, -5.680908203125, -5.2413330078125, -4.8017578125, -4.3621826171875, -3.922607421875, -3.4830322265625, -3.04345703125, -2.6038818359375, -2.164306640625, -1.7247314453125, -1.28515625, -0.8455810546875, -0.406005859375, 0.0335693359375, 0.47314453125, 0.9127197265625, 1.352294921875, 1.7918701171875, 2.2314453125, 2.6710205078125, 3.110595703125, 3.5501708984375, 3.98974609375, 4.4293212890625, 4.868896484375, 5.3084716796875, 5.748046875, 6.1876220703125, 6.627197265625, 7.0667724609375, 7.50634765625, 7.9459228515625, 8.385498046875, 8.8250732421875, 9.2646484375, 9.7042236328125, 10.143798828125, 10.5833740234375, 11.02294921875, 11.4625244140625, 11.902099609375, 12.3416748046875, 12.78125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 14.0, 12.0, 19.0, 19.0, 38.0, 41.0, 59.0, 62.0, 114.0, 123.0, 203.0, 247.0, 380.0, 433.0, 468.0, 445.0, 330.0, 284.0, 167.0, 146.0, 125.0, 81.0, 69.0, 38.0, 32.0, 26.0, 16.0, 17.0, 11.0, 14.0, 12.0, 8.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.9140625, -9.578125, -9.2421875, -8.90625, -8.5703125, -8.234375, -7.8984375, -7.5625, -7.2265625, -6.890625, -6.5546875, -6.21875, -5.8828125, -5.546875, -5.2109375, -4.875, -4.5390625, -4.203125, -3.8671875, -3.53125, -3.1953125, -2.859375, -2.5234375, -2.1875, -1.8515625, -1.515625, -1.1796875, -0.84375, -0.5078125, -0.171875, 0.1640625, 0.5, 0.8359375, 1.171875, 1.5078125, 1.84375, 2.1796875, 2.515625, 2.8515625, 3.1875, 3.5234375, 3.859375, 4.1953125, 4.53125, 4.8671875, 5.203125, 5.5390625, 5.875, 6.2109375, 6.546875, 6.8828125, 7.21875, 7.5546875, 7.890625, 8.2265625, 8.5625, 8.8984375, 9.234375, 9.5703125, 9.90625, 10.2421875, 10.578125, 10.9140625, 11.25, 11.5859375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 9.0, 8.0, 12.0, 15.0, 18.0, 25.0, 30.0, 38.0, 51.0, 100.0, 143.0, 228.0, 487.0, 1142.0, 5468.0, 48636.0, 1415668.0, 2631838.0, 79858.0, 7786.0, 1540.0, 526.0, 221.0, 137.0, 97.0, 61.0, 33.0, 36.0, 18.0, 20.0, 9.0, 10.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.53125, -40.34765625, -39.1640625, -37.98046875, -36.796875, -35.61328125, -34.4296875, -33.24609375, -32.0625, -30.87890625, -29.6953125, -28.51171875, -27.328125, -26.14453125, -24.9609375, -23.77734375, -22.59375, -21.41015625, -20.2265625, -19.04296875, -17.859375, -16.67578125, -15.4921875, -14.30859375, -13.125, -11.94140625, -10.7578125, -9.57421875, -8.390625, -7.20703125, -6.0234375, -4.83984375, -3.65625, -2.47265625, -1.2890625, -0.10546875, 1.078125, 2.26171875, 3.4453125, 4.62890625, 5.8125, 6.99609375, 8.1796875, 9.36328125, 10.546875, 11.73046875, 12.9140625, 14.09765625, 15.28125, 16.46484375, 17.6484375, 18.83203125, 20.015625, 21.19921875, 22.3828125, 23.56640625, 24.75, 25.93359375, 27.1171875, 28.30078125, 29.484375, 30.66796875, 31.8515625, 33.03515625, 34.21875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 17.0, 19.0, 15.0, 40.0, 43.0, 67.0, 75.0, 76.0, 91.0, 82.0, 82.0, 91.0, 73.0, 56.0, 41.0, 35.0, 29.0, 17.0, 16.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.31757164001465, -21.973878860473633, -20.630186080932617, -19.2864933013916, -17.942800521850586, -16.59910774230957, -15.255415916442871, -13.911723136901855, -12.56803035736084, -11.224337577819824, -9.880644798278809, -8.53695297241211, -7.1932597160339355, -5.84956693649292, -4.5058746337890625, -3.162181854248047, -1.8184890747070312, -0.4747964143753052, 0.8688962459564209, 2.2125887870788574, 3.556281566619873, 4.899974346160889, 6.243666648864746, 7.587359428405762, 8.931052207946777, 10.274744987487793, 11.618437767028809, 12.962129592895508, 14.305822372436523, 15.649515151977539, 16.993207931518555, 18.33690071105957, 19.68059539794922, 21.024288177490234, 22.36798095703125, 23.711673736572266, 25.05536651611328, 26.399059295654297, 27.742752075195312, 29.086444854736328, 30.430137634277344, 31.77383041381836, 33.117523193359375, 34.46121597290039, 35.804908752441406, 37.14860153198242, 38.49229431152344, 39.83598709106445, 41.17967987060547, 42.523372650146484, 43.8670654296875, 45.210758209228516, 46.55445098876953, 47.89814376831055, 49.24183654785156, 50.58552932739258, 51.92921829223633, 53.272911071777344, 54.61660385131836, 55.960296630859375, 57.30398941040039, 58.647682189941406, 59.99137496948242, 61.33506774902344, 62.67876052856445]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 7.0, 3.0, 7.0, 8.0, 9.0, 9.0, 9.0, 13.0, 22.0, 24.0, 22.0, 20.0, 30.0, 30.0, 27.0, 27.0, 40.0, 28.0, 27.0, 40.0, 38.0, 40.0, 47.0, 47.0, 39.0, 41.0, 30.0, 40.0, 26.0, 31.0, 30.0, 24.0, 23.0, 22.0, 18.0, 14.0, 13.0, 11.0, 7.0, 17.0, 11.0, 6.0, 10.0, 7.0, 1.0, 3.0, 2.0, 4.0, 1.0, 7.0], "bins": [-42.02437973022461, -40.8835334777832, -39.74268341064453, -38.601837158203125, -37.46099090576172, -36.32014465332031, -35.179298400878906, -34.038448333740234, -32.89760208129883, -31.756755828857422, -30.615907669067383, -29.475059509277344, -28.334213256835938, -27.19336700439453, -26.052518844604492, -24.911670684814453, -23.770824432373047, -22.62997817993164, -21.4891300201416, -20.348281860351562, -19.207435607910156, -18.06658935546875, -16.92574119567871, -15.784893989562988, -14.644046783447266, -13.503199577331543, -12.36235237121582, -11.221505165100098, -10.080657958984375, -8.939810752868652, -7.79896354675293, -6.658116340637207, -5.517271041870117, -4.3764238357543945, -3.235576629638672, -2.094729423522949, -0.9538822174072266, 0.1869649887084961, 1.3278121948242188, 2.4686594009399414, 3.609506607055664, 4.750353813171387, 5.891201019287109, 7.032048225402832, 8.172895431518555, 9.313742637634277, 10.45458984375, 11.595437049865723, 12.736284255981445, 13.877131462097168, 15.01797866821289, 16.158824920654297, 17.299673080444336, 18.440521240234375, 19.58136749267578, 20.722213745117188, 21.863061904907227, 23.003910064697266, 24.144756317138672, 25.285602569580078, 26.426450729370117, 27.567298889160156, 28.708145141601562, 29.84899139404297, 30.989839553833008]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 3.0, 10.0, 16.0, 8.0, 19.0, 18.0, 10.0, 18.0, 21.0, 31.0, 25.0, 32.0, 35.0, 44.0, 28.0, 39.0, 29.0, 52.0, 50.0, 42.0, 47.0, 36.0, 55.0, 38.0, 38.0, 26.0, 32.0, 27.0, 25.0, 19.0, 22.0, 17.0, 14.0, 12.0, 13.0, 9.0, 11.0, 11.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.82421875, -6.6168212890625, -6.409423828125, -6.2020263671875, -5.99462890625, -5.7872314453125, -5.579833984375, -5.3724365234375, -5.1650390625, -4.9576416015625, -4.750244140625, -4.5428466796875, -4.33544921875, -4.1280517578125, -3.920654296875, -3.7132568359375, -3.505859375, -3.2984619140625, -3.091064453125, -2.8836669921875, -2.67626953125, -2.4688720703125, -2.261474609375, -2.0540771484375, -1.8466796875, -1.6392822265625, -1.431884765625, -1.2244873046875, -1.01708984375, -0.8096923828125, -0.602294921875, -0.3948974609375, -0.1875, 0.0198974609375, 0.227294921875, 0.4346923828125, 0.64208984375, 0.8494873046875, 1.056884765625, 1.2642822265625, 1.4716796875, 1.6790771484375, 1.886474609375, 2.0938720703125, 2.30126953125, 2.5086669921875, 2.716064453125, 2.9234619140625, 3.130859375, 3.3382568359375, 3.545654296875, 3.7530517578125, 3.96044921875, 4.1678466796875, 4.375244140625, 4.5826416015625, 4.7900390625, 4.9974365234375, 5.204833984375, 5.4122314453125, 5.61962890625, 5.8270263671875, 6.034423828125, 6.2418212890625, 6.44921875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 14.0, 19.0, 34.0, 30.0, 41.0, 79.0, 145.0, 157.0, 274.0, 385.0, 599.0, 876.0, 1439.0, 2218.0, 3399.0, 5787.0, 9416.0, 15792.0, 26334.0, 44881.0, 75248.0, 120644.0, 169444.0, 184108.0, 145898.0, 96253.0, 58475.0, 34227.0, 20561.0, 12079.0, 7299.0, 4471.0, 2808.0, 1747.0, 1159.0, 761.0, 528.0, 288.0, 205.0, 160.0, 98.0, 75.0, 42.0, 17.0, 12.0, 15.0, 11.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.87451171875, -0.8473968505859375, -0.820281982421875, -0.7931671142578125, -0.76605224609375, -0.7389373779296875, -0.711822509765625, -0.6847076416015625, -0.6575927734375, -0.6304779052734375, -0.603363037109375, -0.5762481689453125, -0.54913330078125, -0.5220184326171875, -0.494903564453125, -0.4677886962890625, -0.440673828125, -0.4135589599609375, -0.386444091796875, -0.3593292236328125, -0.33221435546875, -0.3050994873046875, -0.277984619140625, -0.2508697509765625, -0.2237548828125, -0.1966400146484375, -0.169525146484375, -0.1424102783203125, -0.11529541015625, -0.0881805419921875, -0.061065673828125, -0.0339508056640625, -0.0068359375, 0.0202789306640625, 0.047393798828125, 0.0745086669921875, 0.10162353515625, 0.1287384033203125, 0.155853271484375, 0.1829681396484375, 0.2100830078125, 0.2371978759765625, 0.264312744140625, 0.2914276123046875, 0.31854248046875, 0.3456573486328125, 0.372772216796875, 0.3998870849609375, 0.427001953125, 0.4541168212890625, 0.481231689453125, 0.5083465576171875, 0.53546142578125, 0.5625762939453125, 0.589691162109375, 0.6168060302734375, 0.6439208984375, 0.6710357666015625, 0.698150634765625, 0.7252655029296875, 0.75238037109375, 0.7794952392578125, 0.806610107421875, 0.8337249755859375, 0.86083984375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 8.0, 3.0, 2.0, 7.0, 10.0, 11.0, 13.0, 18.0, 14.0, 24.0, 22.0, 28.0, 27.0, 36.0, 33.0, 37.0, 33.0, 36.0, 37.0, 55.0, 1062.0, 45.0, 42.0, 40.0, 30.0, 45.0, 37.0, 38.0, 39.0, 22.0, 31.0, 27.0, 22.0, 14.0, 13.0, 12.0, 21.0, 9.0, 6.0, 4.0, 2.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.41015625, -4.26788330078125, -4.1256103515625, -3.98333740234375, -3.841064453125, -3.69879150390625, -3.5565185546875, -3.41424560546875, -3.27197265625, -3.12969970703125, -2.9874267578125, -2.84515380859375, -2.702880859375, -2.56060791015625, -2.4183349609375, -2.27606201171875, -2.1337890625, -1.99151611328125, -1.8492431640625, -1.70697021484375, -1.564697265625, -1.42242431640625, -1.2801513671875, -1.13787841796875, -0.99560546875, -0.85333251953125, -0.7110595703125, -0.56878662109375, -0.426513671875, -0.28424072265625, -0.1419677734375, 0.00030517578125, 0.142578125, 0.28485107421875, 0.4271240234375, 0.56939697265625, 0.711669921875, 0.85394287109375, 0.9962158203125, 1.13848876953125, 1.28076171875, 1.42303466796875, 1.5653076171875, 1.70758056640625, 1.849853515625, 1.99212646484375, 2.1343994140625, 2.27667236328125, 2.4189453125, 2.56121826171875, 2.7034912109375, 2.84576416015625, 2.988037109375, 3.13031005859375, 3.2725830078125, 3.41485595703125, 3.55712890625, 3.69940185546875, 3.8416748046875, 3.98394775390625, 4.126220703125, 4.26849365234375, 4.4107666015625, 4.55303955078125, 4.6953125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 10.0, 8.0, 15.0, 21.0, 27.0, 61.0, 89.0, 106.0, 190.0, 300.0, 454.0, 647.0, 1047.0, 1600.0, 2571.0, 4022.0, 6383.0, 10532.0, 17440.0, 28092.0, 45975.0, 74636.0, 120532.0, 237457.0, 938755.0, 273744.0, 127471.0, 78825.0, 48896.0, 29490.0, 18231.0, 11017.0, 6753.0, 4257.0, 2658.0, 1690.0, 1067.0, 666.0, 468.0, 313.0, 203.0, 146.0, 87.0, 69.0, 35.0, 25.0, 15.0, 11.0, 10.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.47021484375, -0.45482635498046875, -0.4394378662109375, -0.42404937744140625, -0.408660888671875, -0.39327239990234375, -0.3778839111328125, -0.36249542236328125, -0.34710693359375, -0.33171844482421875, -0.3163299560546875, -0.30094146728515625, -0.285552978515625, -0.27016448974609375, -0.2547760009765625, -0.23938751220703125, -0.2239990234375, -0.20861053466796875, -0.1932220458984375, -0.17783355712890625, -0.162445068359375, -0.14705657958984375, -0.1316680908203125, -0.11627960205078125, -0.10089111328125, -0.08550262451171875, -0.0701141357421875, -0.05472564697265625, -0.039337158203125, -0.02394866943359375, -0.0085601806640625, 0.00682830810546875, 0.022216796875, 0.03760528564453125, 0.0529937744140625, 0.06838226318359375, 0.083770751953125, 0.09915924072265625, 0.1145477294921875, 0.12993621826171875, 0.14532470703125, 0.16071319580078125, 0.1761016845703125, 0.19149017333984375, 0.206878662109375, 0.22226715087890625, 0.2376556396484375, 0.25304412841796875, 0.2684326171875, 0.28382110595703125, 0.2992095947265625, 0.31459808349609375, 0.329986572265625, 0.34537506103515625, 0.3607635498046875, 0.37615203857421875, 0.39154052734375, 0.40692901611328125, 0.4223175048828125, 0.43770599365234375, 0.453094482421875, 0.46848297119140625, 0.4838714599609375, 0.49925994873046875, 0.5146484375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 6.0, 8.0, 7.0, 16.0, 14.0, 28.0, 32.0, 56.0, 77.0, 79.0, 103.0, 93.0, 117.0, 99.0, 60.0, 64.0, 36.0, 24.0, 19.0, 6.0, 9.0, 5.0, 9.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127685546875, -0.12337875366210938, -0.11907196044921875, -0.11476516723632812, -0.1104583740234375, -0.10615158081054688, -0.10184478759765625, -0.09753799438476562, -0.093231201171875, -0.08892440795898438, -0.08461761474609375, -0.08031082153320312, -0.0760040283203125, -0.07169723510742188, -0.06739044189453125, -0.06308364868164062, -0.05877685546875, -0.054470062255859375, -0.05016326904296875, -0.045856475830078125, -0.0415496826171875, -0.037242889404296875, -0.03293609619140625, -0.028629302978515625, -0.024322509765625, -0.020015716552734375, -0.01570892333984375, -0.011402130126953125, -0.0070953369140625, -0.002788543701171875, 0.00151824951171875, 0.005825042724609375, 0.0101318359375, 0.014438629150390625, 0.01874542236328125, 0.023052215576171875, 0.0273590087890625, 0.031665802001953125, 0.03597259521484375, 0.040279388427734375, 0.044586181640625, 0.048892974853515625, 0.05319976806640625, 0.057506561279296875, 0.0618133544921875, 0.06612014770507812, 0.07042694091796875, 0.07473373413085938, 0.07904052734375, 0.08334732055664062, 0.08765411376953125, 0.09196090698242188, 0.0962677001953125, 0.10057449340820312, 0.10488128662109375, 0.10918807983398438, 0.113494873046875, 0.11780166625976562, 0.12210845947265625, 0.12641525268554688, 0.1307220458984375, 0.13502883911132812, 0.13933563232421875, 0.14364242553710938, 0.14794921875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 7.0, 7.0, 7.0, 14.0, 18.0, 40.0, 52.0, 94.0, 170.0, 612.0, 346236.0, 700105.0, 690.0, 203.0, 102.0, 63.0, 36.0, 25.0, 14.0, 11.0, 9.0, 8.0, 8.0, 4.0, 4.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.765625, -3.658111572265625, -3.55059814453125, -3.443084716796875, -3.3355712890625, -3.228057861328125, -3.12054443359375, -3.013031005859375, -2.905517578125, -2.798004150390625, -2.69049072265625, -2.582977294921875, -2.4754638671875, -2.367950439453125, -2.26043701171875, -2.152923583984375, -2.04541015625, -1.937896728515625, -1.83038330078125, -1.722869873046875, -1.6153564453125, -1.507843017578125, -1.40032958984375, -1.292816162109375, -1.185302734375, -1.077789306640625, -0.97027587890625, -0.862762451171875, -0.7552490234375, -0.647735595703125, -0.54022216796875, -0.432708740234375, -0.3251953125, -0.217681884765625, -0.11016845703125, -0.002655029296875, 0.1048583984375, 0.212371826171875, 0.31988525390625, 0.427398681640625, 0.534912109375, 0.642425537109375, 0.74993896484375, 0.857452392578125, 0.9649658203125, 1.072479248046875, 1.17999267578125, 1.287506103515625, 1.39501953125, 1.502532958984375, 1.61004638671875, 1.717559814453125, 1.8250732421875, 1.932586669921875, 2.04010009765625, 2.147613525390625, 2.255126953125, 2.362640380859375, 2.47015380859375, 2.577667236328125, 2.6851806640625, 2.792694091796875, 2.90020751953125, 3.007720947265625, 3.115234375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 8.0, 279.0, 638.0, 80.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1365938037633896, -0.10405667126178741, -0.07151953876018524, -0.03898240625858307, -0.006445273756980896, 0.026091858744621277, 0.05862899124622345, 0.09116612374782562, 0.1237032562494278, 0.15624038875102997, 0.18877752125263214, 0.22131465375423431, 0.2538517713546753, 0.28638893365859985, 0.31892603635787964, 0.3514631986618042, 0.384000301361084, 0.41653743386268616, 0.44907456636428833, 0.4816116988658905, 0.5141488313674927, 0.5466859340667725, 0.579223096370697, 0.6117602586746216, 0.6442973613739014, 0.6768344640731812, 0.7093716263771057, 0.7419087886810303, 0.7744458913803101, 0.8069829940795898, 0.8395201563835144, 0.872057318687439, 0.9045945405960083, 0.9371316432952881, 0.9696688055992126, 1.0022059679031372, 1.034743070602417, 1.0672801733016968, 1.0998172760009766, 1.132354497909546, 1.1648916006088257, 1.1974287033081055, 1.2299659252166748, 1.2625030279159546, 1.2950401306152344, 1.3275772333145142, 1.360114336013794, 1.3926515579223633, 1.425188660621643, 1.4577257633209229, 1.4902629852294922, 1.522800087928772, 1.5553371906280518, 1.5878742933273315, 1.6204113960266113, 1.6529486179351807, 1.6854857206344604, 1.7180228233337402, 1.7505600452423096, 1.7830971479415894, 1.8156342506408691, 1.848171353340149, 1.8807084560394287, 1.913245677947998, 1.9457827806472778]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 6.0, 9.0, 12.0, 8.0, 18.0, 19.0, 22.0, 19.0, 27.0, 36.0, 36.0, 37.0, 34.0, 59.0, 44.0, 55.0, 58.0, 49.0, 43.0, 44.0, 58.0, 40.0, 33.0, 38.0, 33.0, 26.0, 19.0, 27.0, 19.0, 24.0, 15.0, 10.0, 8.0, 11.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1974562406539917, -0.19122140109539032, -0.18498654663562775, -0.17875170707702637, -0.1725168526172638, -0.16628201305866241, -0.16004717350006104, -0.15381231904029846, -0.14757747948169708, -0.1413426399230957, -0.13510778546333313, -0.12887294590473175, -0.12263809889554977, -0.1164032518863678, -0.11016841232776642, -0.10393356531858444, -0.09769871830940247, -0.09146387130022049, -0.08522902429103851, -0.07899418473243713, -0.07275933772325516, -0.06652449071407318, -0.0602896474301815, -0.054054804146289825, -0.04781995713710785, -0.04158511012792587, -0.035350266844034195, -0.029115421697497368, -0.02288057655096054, -0.016645731404423714, -0.010410886257886887, -0.004176042973995209, 0.0020588040351867676, 0.008293649181723595, 0.014528494328260422, 0.02076333947479725, 0.026998184621334076, 0.03323303163051605, 0.03946787491440773, 0.04570271819829941, 0.051937565207481384, 0.05817241221666336, 0.06440725922584534, 0.07064209878444672, 0.07687694579362869, 0.08311179280281067, 0.08934663236141205, 0.09558147937059402, 0.101816326379776, 0.10805117338895798, 0.11428602039813995, 0.12052085995674133, 0.1267557144165039, 0.13299055397510529, 0.13922539353370667, 0.14546024799346924, 0.15169508755207062, 0.157929927110672, 0.16416478157043457, 0.17039962112903595, 0.17663446068763733, 0.1828693151473999, 0.18910415470600128, 0.19533899426460266, 0.20157384872436523]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 6.0, 11.0, 14.0, 16.0, 17.0, 24.0, 18.0, 28.0, 39.0, 28.0, 31.0, 42.0, 38.0, 35.0, 44.0, 46.0, 57.0, 56.0, 44.0, 38.0, 52.0, 43.0, 49.0, 30.0, 28.0, 24.0, 23.0, 14.0, 12.0, 19.0, 21.0, 17.0, 10.0, 8.0, 7.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3046875, -7.0760498046875, -6.847412109375, -6.6187744140625, -6.39013671875, -6.1614990234375, -5.932861328125, -5.7042236328125, -5.4755859375, -5.2469482421875, -5.018310546875, -4.7896728515625, -4.56103515625, -4.3323974609375, -4.103759765625, -3.8751220703125, -3.646484375, -3.4178466796875, -3.189208984375, -2.9605712890625, -2.73193359375, -2.5032958984375, -2.274658203125, -2.0460205078125, -1.8173828125, -1.5887451171875, -1.360107421875, -1.1314697265625, -0.90283203125, -0.6741943359375, -0.445556640625, -0.2169189453125, 0.01171875, 0.2403564453125, 0.468994140625, 0.6976318359375, 0.92626953125, 1.1549072265625, 1.383544921875, 1.6121826171875, 1.8408203125, 2.0694580078125, 2.298095703125, 2.5267333984375, 2.75537109375, 2.9840087890625, 3.212646484375, 3.4412841796875, 3.669921875, 3.8985595703125, 4.127197265625, 4.3558349609375, 4.58447265625, 4.8131103515625, 5.041748046875, 5.2703857421875, 5.4990234375, 5.7276611328125, 5.956298828125, 6.1849365234375, 6.41357421875, 6.6422119140625, 6.870849609375, 7.0994873046875, 7.328125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 18.0, 17.0, 22.0, 27.0, 41.0, 52.0, 84.0, 138.0, 187.0, 288.0, 427.0, 687.0, 983.0, 1577.0, 2836.0, 5713.0, 12710.0, 37599.0, 187383.0, 595557.0, 146904.0, 31978.0, 11240.0, 5101.0, 2553.0, 1566.0, 901.0, 635.0, 429.0, 283.0, 193.0, 126.0, 86.0, 70.0, 35.0, 28.0, 18.0, 6.0, 6.0, 10.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0], "bins": [-13.7421875, -13.3311767578125, -12.920166015625, -12.5091552734375, -12.09814453125, -11.6871337890625, -11.276123046875, -10.8651123046875, -10.4541015625, -10.0430908203125, -9.632080078125, -9.2210693359375, -8.81005859375, -8.3990478515625, -7.988037109375, -7.5770263671875, -7.166015625, -6.7550048828125, -6.343994140625, -5.9329833984375, -5.52197265625, -5.1109619140625, -4.699951171875, -4.2889404296875, -3.8779296875, -3.4669189453125, -3.055908203125, -2.6448974609375, -2.23388671875, -1.8228759765625, -1.411865234375, -1.0008544921875, -0.58984375, -0.1788330078125, 0.232177734375, 0.6431884765625, 1.05419921875, 1.4652099609375, 1.876220703125, 2.2872314453125, 2.6982421875, 3.1092529296875, 3.520263671875, 3.9312744140625, 4.34228515625, 4.7532958984375, 5.164306640625, 5.5753173828125, 5.986328125, 6.3973388671875, 6.808349609375, 7.2193603515625, 7.63037109375, 8.0413818359375, 8.452392578125, 8.8634033203125, 9.2744140625, 9.6854248046875, 10.096435546875, 10.5074462890625, 10.91845703125, 11.3294677734375, 11.740478515625, 12.1514892578125, 12.5625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 6.0, 5.0, 5.0, 7.0, 12.0, 11.0, 11.0, 16.0, 23.0, 14.0, 17.0, 25.0, 19.0, 31.0, 38.0, 36.0, 39.0, 33.0, 63.0, 102.0, 246.0, 1487.0, 259.0, 102.0, 51.0, 41.0, 44.0, 42.0, 28.0, 33.0, 35.0, 19.0, 22.0, 14.0, 19.0, 28.0, 12.0, 9.0, 9.0, 9.0, 8.0, 11.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-20.1875, -19.6025390625, -19.017578125, -18.4326171875, -17.84765625, -17.2626953125, -16.677734375, -16.0927734375, -15.5078125, -14.9228515625, -14.337890625, -13.7529296875, -13.16796875, -12.5830078125, -11.998046875, -11.4130859375, -10.828125, -10.2431640625, -9.658203125, -9.0732421875, -8.48828125, -7.9033203125, -7.318359375, -6.7333984375, -6.1484375, -5.5634765625, -4.978515625, -4.3935546875, -3.80859375, -3.2236328125, -2.638671875, -2.0537109375, -1.46875, -0.8837890625, -0.298828125, 0.2861328125, 0.87109375, 1.4560546875, 2.041015625, 2.6259765625, 3.2109375, 3.7958984375, 4.380859375, 4.9658203125, 5.55078125, 6.1357421875, 6.720703125, 7.3056640625, 7.890625, 8.4755859375, 9.060546875, 9.6455078125, 10.23046875, 10.8154296875, 11.400390625, 11.9853515625, 12.5703125, 13.1552734375, 13.740234375, 14.3251953125, 14.91015625, 15.4951171875, 16.080078125, 16.6650390625, 17.25]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 10.0, 12.0, 8.0, 13.0, 14.0, 13.0, 18.0, 24.0, 28.0, 40.0, 41.0, 49.0, 62.0, 83.0, 123.0, 224.0, 374.0, 1005.0, 2600.0, 7780.0, 37873.0, 1500098.0, 1544286.0, 38319.0, 7905.0, 2567.0, 967.0, 409.0, 219.0, 129.0, 94.0, 60.0, 43.0, 46.0, 31.0, 19.0, 25.0, 14.0, 17.0, 12.0, 11.0, 8.0, 3.0, 4.0, 5.0, 6.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-25.515625, -24.692626953125, -23.86962890625, -23.046630859375, -22.2236328125, -21.400634765625, -20.57763671875, -19.754638671875, -18.931640625, -18.108642578125, -17.28564453125, -16.462646484375, -15.6396484375, -14.816650390625, -13.99365234375, -13.170654296875, -12.34765625, -11.524658203125, -10.70166015625, -9.878662109375, -9.0556640625, -8.232666015625, -7.40966796875, -6.586669921875, -5.763671875, -4.940673828125, -4.11767578125, -3.294677734375, -2.4716796875, -1.648681640625, -0.82568359375, -0.002685546875, 0.8203125, 1.643310546875, 2.46630859375, 3.289306640625, 4.1123046875, 4.935302734375, 5.75830078125, 6.581298828125, 7.404296875, 8.227294921875, 9.05029296875, 9.873291015625, 10.6962890625, 11.519287109375, 12.34228515625, 13.165283203125, 13.98828125, 14.811279296875, 15.63427734375, 16.457275390625, 17.2802734375, 18.103271484375, 18.92626953125, 19.749267578125, 20.572265625, 21.395263671875, 22.21826171875, 23.041259765625, 23.8642578125, 24.687255859375, 25.51025390625, 26.333251953125, 27.15625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 15.0, 171.0, 494.0, 298.0, 40.0], "bins": [-268.88287353515625, -264.5195007324219, -260.1560974121094, -255.792724609375, -251.42935180664062, -247.0659637451172, -242.70257568359375, -238.33920288085938, -233.97581481933594, -229.6124267578125, -225.24905395507812, -220.8856658935547, -216.52227783203125, -212.15890502929688, -207.79551696777344, -203.43214416503906, -199.06875610351562, -194.7053680419922, -190.3419952392578, -185.97860717773438, -181.615234375, -177.25184631347656, -172.88845825195312, -168.52508544921875, -164.1616973876953, -159.79830932617188, -155.4349365234375, -151.07154846191406, -146.70816040039062, -142.34478759765625, -137.9813995361328, -133.61802673339844, -129.254638671875, -124.8912582397461, -120.52787780761719, -116.16448974609375, -111.80110931396484, -107.43772888183594, -103.0743408203125, -98.7109603881836, -94.34758758544922, -89.98420715332031, -85.62081909179688, -81.25743865966797, -76.89405822753906, -72.53067779541016, -68.16729736328125, -63.80390930175781, -59.440528869628906, -55.0771484375, -50.71376419067383, -46.350379943847656, -41.98699951171875, -37.623619079589844, -33.26023483276367, -28.896852493286133, -24.533470153808594, -20.170087814331055, -15.806705474853516, -11.443323135375977, -7.0799407958984375, -2.7165584564208984, 1.6468238830566406, 6.01020622253418, 10.373589515686035]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 10.0, 13.0, 8.0, 9.0, 15.0, 20.0, 13.0, 22.0, 21.0, 25.0, 27.0, 34.0, 46.0, 41.0, 34.0, 43.0, 38.0, 45.0, 47.0, 44.0, 45.0, 41.0, 35.0, 37.0, 30.0, 36.0, 27.0, 24.0, 24.0, 23.0, 18.0, 20.0, 16.0, 8.0, 9.0, 10.0, 15.0, 6.0, 7.0, 6.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.25464630126953, -39.76279067993164, -38.27093505859375, -36.77907943725586, -35.28722381591797, -33.795372009277344, -32.30351638793945, -30.811660766601562, -29.319805145263672, -27.82794952392578, -26.33609390258789, -24.844240188598633, -23.352384567260742, -21.86052894592285, -20.368675231933594, -18.876819610595703, -17.384963989257812, -15.893108367919922, -14.401253700256348, -12.909399032592773, -11.417543411254883, -9.925687789916992, -8.433833122253418, -6.941978454589844, -5.450122833251953, -3.9582676887512207, -2.4664125442504883, -0.9745573997497559, 0.5172977447509766, 2.009152889251709, 3.5010080337524414, 4.992862701416016, 6.484722137451172, 7.976577281951904, 9.468432426452637, 10.960287094116211, 12.452142715454102, 13.943998336791992, 15.435853004455566, 16.92770767211914, 18.41956329345703, 19.911418914794922, 21.403274536132812, 22.89512825012207, 24.38698387145996, 25.87883949279785, 27.37069320678711, 28.862548828125, 30.35440444946289, 31.84626007080078, 33.33811569213867, 34.82997131347656, 36.32182312011719, 37.81367874145508, 39.30553436279297, 40.79738998413086, 42.28924560546875, 43.78110122680664, 45.27295684814453, 46.76481246948242, 48.25666809082031, 49.74851989746094, 51.24037551879883, 52.73223114013672, 54.22408676147461]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 7.0, 5.0, 6.0, 14.0, 13.0, 16.0, 18.0, 26.0, 19.0, 34.0, 38.0, 28.0, 38.0, 32.0, 35.0, 45.0, 47.0, 52.0, 49.0, 49.0, 35.0, 48.0, 43.0, 40.0, 43.0, 40.0, 40.0, 27.0, 20.0, 20.0, 15.0, 9.0, 19.0, 5.0, 6.0, 3.0, 5.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.94921875, -7.71759033203125, -7.4859619140625, -7.25433349609375, -7.022705078125, -6.79107666015625, -6.5594482421875, -6.32781982421875, -6.09619140625, -5.86456298828125, -5.6329345703125, -5.40130615234375, -5.169677734375, -4.93804931640625, -4.7064208984375, -4.47479248046875, -4.2431640625, -4.01153564453125, -3.7799072265625, -3.54827880859375, -3.316650390625, -3.08502197265625, -2.8533935546875, -2.62176513671875, -2.39013671875, -2.15850830078125, -1.9268798828125, -1.69525146484375, -1.463623046875, -1.23199462890625, -1.0003662109375, -0.76873779296875, -0.537109375, -0.30548095703125, -0.0738525390625, 0.15777587890625, 0.389404296875, 0.62103271484375, 0.8526611328125, 1.08428955078125, 1.31591796875, 1.54754638671875, 1.7791748046875, 2.01080322265625, 2.242431640625, 2.47406005859375, 2.7056884765625, 2.93731689453125, 3.1689453125, 3.40057373046875, 3.6322021484375, 3.86383056640625, 4.095458984375, 4.32708740234375, 4.5587158203125, 4.79034423828125, 5.02197265625, 5.25360107421875, 5.4852294921875, 5.71685791015625, 5.948486328125, 6.18011474609375, 6.4117431640625, 6.64337158203125, 6.875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 4.0, 9.0, 11.0, 9.0, 21.0, 31.0, 45.0, 55.0, 63.0, 74.0, 104.0, 166.0, 199.0, 320.0, 440.0, 631.0, 980.0, 1412.0, 2369.0, 4006.0, 7311.0, 13884.0, 29389.0, 72893.0, 223384.0, 769673.0, 1696095.0, 938443.0, 275981.0, 87783.0, 33563.0, 15598.0, 7834.0, 4330.0, 2522.0, 1510.0, 936.0, 651.0, 438.0, 315.0, 228.0, 160.0, 112.0, 74.0, 64.0, 43.0, 40.0, 20.0, 13.0, 15.0, 8.0, 8.0, 9.0, 6.0, 2.0, 0.0, 2.0], "bins": [-9.0390625, -8.7698974609375, -8.500732421875, -8.2315673828125, -7.96240234375, -7.6932373046875, -7.424072265625, -7.1549072265625, -6.8857421875, -6.6165771484375, -6.347412109375, -6.0782470703125, -5.80908203125, -5.5399169921875, -5.270751953125, -5.0015869140625, -4.732421875, -4.4632568359375, -4.194091796875, -3.9249267578125, -3.65576171875, -3.3865966796875, -3.117431640625, -2.8482666015625, -2.5791015625, -2.3099365234375, -2.040771484375, -1.7716064453125, -1.50244140625, -1.2332763671875, -0.964111328125, -0.6949462890625, -0.42578125, -0.1566162109375, 0.112548828125, 0.3817138671875, 0.65087890625, 0.9200439453125, 1.189208984375, 1.4583740234375, 1.7275390625, 1.9967041015625, 2.265869140625, 2.5350341796875, 2.80419921875, 3.0733642578125, 3.342529296875, 3.6116943359375, 3.880859375, 4.1500244140625, 4.419189453125, 4.6883544921875, 4.95751953125, 5.2266845703125, 5.495849609375, 5.7650146484375, 6.0341796875, 6.3033447265625, 6.572509765625, 6.8416748046875, 7.11083984375, 7.3800048828125, 7.649169921875, 7.9183349609375, 8.1875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 12.0, 14.0, 7.0, 12.0, 14.0, 18.0, 22.0, 25.0, 46.0, 41.0, 68.0, 102.0, 129.0, 152.0, 247.0, 313.0, 384.0, 437.0, 445.0, 379.0, 279.0, 258.0, 151.0, 115.0, 105.0, 69.0, 47.0, 38.0, 35.0, 29.0, 22.0, 8.0, 7.0, 6.0, 11.0, 8.0, 1.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.6171875, -8.3099365234375, -8.002685546875, -7.6954345703125, -7.38818359375, -7.0809326171875, -6.773681640625, -6.4664306640625, -6.1591796875, -5.8519287109375, -5.544677734375, -5.2374267578125, -4.93017578125, -4.6229248046875, -4.315673828125, -4.0084228515625, -3.701171875, -3.3939208984375, -3.086669921875, -2.7794189453125, -2.47216796875, -2.1649169921875, -1.857666015625, -1.5504150390625, -1.2431640625, -0.9359130859375, -0.628662109375, -0.3214111328125, -0.01416015625, 0.2930908203125, 0.600341796875, 0.9075927734375, 1.21484375, 1.5220947265625, 1.829345703125, 2.1365966796875, 2.44384765625, 2.7510986328125, 3.058349609375, 3.3656005859375, 3.6728515625, 3.9801025390625, 4.287353515625, 4.5946044921875, 4.90185546875, 5.2091064453125, 5.516357421875, 5.8236083984375, 6.130859375, 6.4381103515625, 6.745361328125, 7.0526123046875, 7.35986328125, 7.6671142578125, 7.974365234375, 8.2816162109375, 8.5888671875, 8.8961181640625, 9.203369140625, 9.5106201171875, 9.81787109375, 10.1251220703125, 10.432373046875, 10.7396240234375, 11.046875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 7.0, 13.0, 16.0, 13.0, 17.0, 26.0, 51.0, 49.0, 71.0, 88.0, 148.0, 226.0, 411.0, 780.0, 2254.0, 7723.0, 34154.0, 239527.0, 2670720.0, 1112257.0, 100634.0, 17542.0, 4628.0, 1389.0, 580.0, 338.0, 175.0, 128.0, 74.0, 59.0, 35.0, 28.0, 26.0, 20.0, 12.0, 15.0, 15.0, 6.0, 5.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-26.375, -25.63818359375, -24.9013671875, -24.16455078125, -23.427734375, -22.69091796875, -21.9541015625, -21.21728515625, -20.48046875, -19.74365234375, -19.0068359375, -18.27001953125, -17.533203125, -16.79638671875, -16.0595703125, -15.32275390625, -14.5859375, -13.84912109375, -13.1123046875, -12.37548828125, -11.638671875, -10.90185546875, -10.1650390625, -9.42822265625, -8.69140625, -7.95458984375, -7.2177734375, -6.48095703125, -5.744140625, -5.00732421875, -4.2705078125, -3.53369140625, -2.796875, -2.06005859375, -1.3232421875, -0.58642578125, 0.150390625, 0.88720703125, 1.6240234375, 2.36083984375, 3.09765625, 3.83447265625, 4.5712890625, 5.30810546875, 6.044921875, 6.78173828125, 7.5185546875, 8.25537109375, 8.9921875, 9.72900390625, 10.4658203125, 11.20263671875, 11.939453125, 12.67626953125, 13.4130859375, 14.14990234375, 14.88671875, 15.62353515625, 16.3603515625, 17.09716796875, 17.833984375, 18.57080078125, 19.3076171875, 20.04443359375, 20.78125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 17.0, 29.0, 41.0, 58.0, 87.0, 110.0, 132.0, 131.0, 114.0, 87.0, 72.0, 53.0, 27.0, 20.0, 12.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.549772262573242, -24.68872833251953, -22.827682495117188, -20.966638565063477, -19.105592727661133, -17.244548797607422, -15.383503913879395, -13.522459030151367, -11.66141414642334, -9.800369262695312, -7.939324378967285, -6.078279972076416, -4.217235088348389, -2.3561906814575195, -0.4951457977294922, 1.3658990859985352, 3.2269439697265625, 5.08798885345459, 6.949033737182617, 8.810077667236328, 10.671123504638672, 12.532167434692383, 14.39321231842041, 16.254257202148438, 18.11530303955078, 19.976346969604492, 21.837392807006836, 23.698436737060547, 25.55948257446289, 27.4205265045166, 29.281570434570312, 31.142616271972656, 33.003658294677734, 34.86470413208008, 36.725746154785156, 38.5867919921875, 40.447837829589844, 42.30888366699219, 44.169925689697266, 46.03097152709961, 47.89201736450195, 49.7530632019043, 51.614105224609375, 53.47515106201172, 55.33619689941406, 57.197242736816406, 59.058284759521484, 60.91933059692383, 62.780372619628906, 64.64141845703125, 66.5024642944336, 68.36351013183594, 70.22454833984375, 72.0855941772461, 73.94664001464844, 75.80768585205078, 77.66873168945312, 79.52977752685547, 81.39082336425781, 83.25186920166016, 85.11290740966797, 86.97395324707031, 88.83499908447266, 90.696044921875, 92.55709075927734]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 9.0, 11.0, 14.0, 13.0, 22.0, 18.0, 13.0, 33.0, 32.0, 33.0, 41.0, 51.0, 46.0, 61.0, 48.0, 46.0, 50.0, 38.0, 41.0, 33.0, 48.0, 49.0, 43.0, 34.0, 34.0, 29.0, 16.0, 18.0, 21.0, 11.0, 10.0, 4.0, 9.0, 10.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.291927337646484, -36.987159729003906, -35.682395935058594, -34.37763214111328, -33.0728645324707, -31.768098831176758, -30.463333129882812, -29.158567428588867, -27.853801727294922, -26.549036026000977, -25.24427032470703, -23.939504623413086, -22.63473892211914, -21.329973220825195, -20.02520751953125, -18.720441818237305, -17.41567611694336, -16.110910415649414, -14.806144714355469, -13.501379013061523, -12.196613311767578, -10.891847610473633, -9.587081909179688, -8.282316207885742, -6.977550506591797, -5.672784805297852, -4.368019104003906, -3.063253402709961, -1.7584877014160156, -0.4537220001220703, 0.851043701171875, 2.1558094024658203, 3.4605712890625, 4.765336990356445, 6.070102691650391, 7.374868392944336, 8.679634094238281, 9.984399795532227, 11.289165496826172, 12.593931198120117, 13.898696899414062, 15.203462600708008, 16.508228302001953, 17.8129940032959, 19.117759704589844, 20.42252540588379, 21.727291107177734, 23.03205680847168, 24.336822509765625, 25.64158821105957, 26.946353912353516, 28.25111961364746, 29.555885314941406, 30.86065101623535, 32.1654167175293, 33.470184326171875, 34.77494812011719, 36.0797119140625, 37.38447952270508, 38.689247131347656, 39.99401092529297, 41.29877471923828, 42.60354232788086, 43.90830993652344, 45.21307373046875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 4.0, 2.0, 7.0, 9.0, 5.0, 12.0, 12.0, 13.0, 18.0, 18.0, 22.0, 24.0, 21.0, 32.0, 38.0, 40.0, 34.0, 38.0, 28.0, 48.0, 42.0, 35.0, 39.0, 48.0, 40.0, 33.0, 38.0, 38.0, 33.0, 36.0, 31.0, 29.0, 18.0, 13.0, 14.0, 12.0, 9.0, 14.0, 9.0, 8.0, 4.0, 5.0, 9.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.453125, -6.24755859375, -6.0419921875, -5.83642578125, -5.630859375, -5.42529296875, -5.2197265625, -5.01416015625, -4.80859375, -4.60302734375, -4.3974609375, -4.19189453125, -3.986328125, -3.78076171875, -3.5751953125, -3.36962890625, -3.1640625, -2.95849609375, -2.7529296875, -2.54736328125, -2.341796875, -2.13623046875, -1.9306640625, -1.72509765625, -1.51953125, -1.31396484375, -1.1083984375, -0.90283203125, -0.697265625, -0.49169921875, -0.2861328125, -0.08056640625, 0.125, 0.33056640625, 0.5361328125, 0.74169921875, 0.947265625, 1.15283203125, 1.3583984375, 1.56396484375, 1.76953125, 1.97509765625, 2.1806640625, 2.38623046875, 2.591796875, 2.79736328125, 3.0029296875, 3.20849609375, 3.4140625, 3.61962890625, 3.8251953125, 4.03076171875, 4.236328125, 4.44189453125, 4.6474609375, 4.85302734375, 5.05859375, 5.26416015625, 5.4697265625, 5.67529296875, 5.880859375, 6.08642578125, 6.2919921875, 6.49755859375, 6.703125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 0.0, 2.0, 4.0, 2.0, 8.0, 15.0, 8.0, 23.0, 25.0, 49.0, 54.0, 62.0, 103.0, 120.0, 172.0, 262.0, 458.0, 717.0, 1205.0, 2361.0, 4381.0, 8714.0, 17371.0, 36093.0, 74393.0, 142790.0, 223481.0, 228002.0, 151237.0, 78998.0, 38984.0, 18514.0, 9211.0, 4822.0, 2412.0, 1353.0, 763.0, 474.0, 254.0, 211.0, 130.0, 85.0, 74.0, 49.0, 27.0, 26.0, 14.0, 13.0, 10.0, 13.0, 8.0, 5.0, 3.0, 2.0], "bins": [-1.4052734375, -1.367340087890625, -1.32940673828125, -1.291473388671875, -1.2535400390625, -1.215606689453125, -1.17767333984375, -1.139739990234375, -1.101806640625, -1.063873291015625, -1.02593994140625, -0.988006591796875, -0.9500732421875, -0.912139892578125, -0.87420654296875, -0.836273193359375, -0.79833984375, -0.760406494140625, -0.72247314453125, -0.684539794921875, -0.6466064453125, -0.608673095703125, -0.57073974609375, -0.532806396484375, -0.494873046875, -0.456939697265625, -0.41900634765625, -0.381072998046875, -0.3431396484375, -0.305206298828125, -0.26727294921875, -0.229339599609375, -0.19140625, -0.153472900390625, -0.11553955078125, -0.077606201171875, -0.0396728515625, -0.001739501953125, 0.03619384765625, 0.074127197265625, 0.112060546875, 0.149993896484375, 0.18792724609375, 0.225860595703125, 0.2637939453125, 0.301727294921875, 0.33966064453125, 0.377593994140625, 0.41552734375, 0.453460693359375, 0.49139404296875, 0.529327392578125, 0.5672607421875, 0.605194091796875, 0.64312744140625, 0.681060791015625, 0.718994140625, 0.756927490234375, 0.79486083984375, 0.832794189453125, 0.8707275390625, 0.908660888671875, 0.94659423828125, 0.984527587890625, 1.0224609375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 7.0, 4.0, 13.0, 13.0, 16.0, 24.0, 12.0, 23.0, 27.0, 31.0, 24.0, 34.0, 39.0, 42.0, 46.0, 34.0, 41.0, 52.0, 1067.0, 42.0, 38.0, 40.0, 41.0, 40.0, 42.0, 34.0, 46.0, 23.0, 24.0, 19.0, 15.0, 13.0, 9.0, 13.0, 9.0, 4.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-5.140625, -4.994140625, -4.84765625, -4.701171875, -4.5546875, -4.408203125, -4.26171875, -4.115234375, -3.96875, -3.822265625, -3.67578125, -3.529296875, -3.3828125, -3.236328125, -3.08984375, -2.943359375, -2.796875, -2.650390625, -2.50390625, -2.357421875, -2.2109375, -2.064453125, -1.91796875, -1.771484375, -1.625, -1.478515625, -1.33203125, -1.185546875, -1.0390625, -0.892578125, -0.74609375, -0.599609375, -0.453125, -0.306640625, -0.16015625, -0.013671875, 0.1328125, 0.279296875, 0.42578125, 0.572265625, 0.71875, 0.865234375, 1.01171875, 1.158203125, 1.3046875, 1.451171875, 1.59765625, 1.744140625, 1.890625, 2.037109375, 2.18359375, 2.330078125, 2.4765625, 2.623046875, 2.76953125, 2.916015625, 3.0625, 3.208984375, 3.35546875, 3.501953125, 3.6484375, 3.794921875, 3.94140625, 4.087890625, 4.234375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 7.0, 20.0, 21.0, 26.0, 39.0, 76.0, 112.0, 167.0, 306.0, 664.0, 1237.0, 2802.0, 6301.0, 15969.0, 41612.0, 109237.0, 283665.0, 1243714.0, 238677.0, 93321.0, 35350.0, 13426.0, 5527.0, 2362.0, 1130.0, 598.0, 301.0, 170.0, 88.0, 61.0, 42.0, 23.0, 16.0, 13.0, 10.0, 9.0, 2.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8769302368164062, -0.8471221923828125, -0.8173141479492188, -0.787506103515625, -0.7576980590820312, -0.7278900146484375, -0.6980819702148438, -0.66827392578125, -0.6384658813476562, -0.6086578369140625, -0.5788497924804688, -0.549041748046875, -0.5192337036132812, -0.4894256591796875, -0.45961761474609375, -0.4298095703125, -0.40000152587890625, -0.3701934814453125, -0.34038543701171875, -0.310577392578125, -0.28076934814453125, -0.2509613037109375, -0.22115325927734375, -0.19134521484375, -0.16153717041015625, -0.1317291259765625, -0.10192108154296875, -0.072113037109375, -0.04230499267578125, -0.0124969482421875, 0.01731109619140625, 0.047119140625, 0.07692718505859375, 0.1067352294921875, 0.13654327392578125, 0.166351318359375, 0.19615936279296875, 0.2259674072265625, 0.25577545166015625, 0.28558349609375, 0.31539154052734375, 0.3451995849609375, 0.37500762939453125, 0.404815673828125, 0.43462371826171875, 0.4644317626953125, 0.49423980712890625, 0.5240478515625, 0.5538558959960938, 0.5836639404296875, 0.6134719848632812, 0.643280029296875, 0.6730880737304688, 0.7028961181640625, 0.7327041625976562, 0.76251220703125, 0.7923202514648438, 0.8221282958984375, 0.8519363403320312, 0.881744384765625, 0.9115524291992188, 0.9413604736328125, 0.9711685180664062, 1.0009765625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 7.0, 10.0, 11.0, 21.0, 20.0, 32.0, 29.0, 58.0, 84.0, 102.0, 161.0, 138.0, 95.0, 67.0, 36.0, 31.0, 19.0, 21.0, 16.0, 8.0, 5.0, 10.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1795654296875, -0.17407989501953125, -0.1685943603515625, -0.16310882568359375, -0.157623291015625, -0.15213775634765625, -0.1466522216796875, -0.14116668701171875, -0.13568115234375, -0.13019561767578125, -0.1247100830078125, -0.11922454833984375, -0.113739013671875, -0.10825347900390625, -0.1027679443359375, -0.09728240966796875, -0.091796875, -0.08631134033203125, -0.0808258056640625, -0.07534027099609375, -0.069854736328125, -0.06436920166015625, -0.0588836669921875, -0.05339813232421875, -0.04791259765625, -0.04242706298828125, -0.0369415283203125, -0.03145599365234375, -0.025970458984375, -0.02048492431640625, -0.0149993896484375, -0.00951385498046875, -0.0040283203125, 0.00145721435546875, 0.0069427490234375, 0.01242828369140625, 0.017913818359375, 0.02339935302734375, 0.0288848876953125, 0.03437042236328125, 0.03985595703125, 0.04534149169921875, 0.0508270263671875, 0.05631256103515625, 0.061798095703125, 0.06728363037109375, 0.0727691650390625, 0.07825469970703125, 0.083740234375, 0.08922576904296875, 0.0947113037109375, 0.10019683837890625, 0.105682373046875, 0.11116790771484375, 0.1166534423828125, 0.12213897705078125, 0.12762451171875, 0.13311004638671875, 0.1385955810546875, 0.14408111572265625, 0.149566650390625, 0.15505218505859375, 0.1605377197265625, 0.16602325439453125, 0.1715087890625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 4.0, 14.0, 16.0, 19.0, 23.0, 49.0, 75.0, 112.0, 292.0, 2130.0, 1041439.0, 3690.0, 284.0, 153.0, 68.0, 51.0, 30.0, 19.0, 21.0, 14.0, 12.0, 7.0, 3.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83984375, -3.7181396484375, -3.596435546875, -3.4747314453125, -3.35302734375, -3.2313232421875, -3.109619140625, -2.9879150390625, -2.8662109375, -2.7445068359375, -2.622802734375, -2.5010986328125, -2.37939453125, -2.2576904296875, -2.135986328125, -2.0142822265625, -1.892578125, -1.7708740234375, -1.649169921875, -1.5274658203125, -1.40576171875, -1.2840576171875, -1.162353515625, -1.0406494140625, -0.9189453125, -0.7972412109375, -0.675537109375, -0.5538330078125, -0.43212890625, -0.3104248046875, -0.188720703125, -0.0670166015625, 0.0546875, 0.1763916015625, 0.298095703125, 0.4197998046875, 0.54150390625, 0.6632080078125, 0.784912109375, 0.9066162109375, 1.0283203125, 1.1500244140625, 1.271728515625, 1.3934326171875, 1.51513671875, 1.6368408203125, 1.758544921875, 1.8802490234375, 2.001953125, 2.1236572265625, 2.245361328125, 2.3670654296875, 2.48876953125, 2.6104736328125, 2.732177734375, 2.8538818359375, 2.9755859375, 3.0972900390625, 3.218994140625, 3.3406982421875, 3.46240234375, 3.5841064453125, 3.705810546875, 3.8275146484375, 3.94921875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 12.0, 102.0, 545.0, 310.0, 41.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.076398566365242, -0.05583025887608528, -0.03526195138692856, -0.014693643897771835, 0.005874663591384888, 0.02644297480583191, 0.047011278569698334, 0.06757958233356476, 0.08814789354801178, 0.1087162047624588, 0.12928450107574463, 0.14985281229019165, 0.17042112350463867, 0.1909894347190857, 0.21155774593353271, 0.23212604224681854, 0.25269436836242676, 0.2732626795768738, 0.2938309907913208, 0.3143993020057678, 0.33496761322021484, 0.35553592443466187, 0.3761042058467865, 0.3966725170612335, 0.41724079847335815, 0.4378091096878052, 0.4583774209022522, 0.4789457321166992, 0.49951404333114624, 0.5200823545455933, 0.5406506657600403, 0.5612189769744873, 0.5817872285842896, 0.6023555397987366, 0.6229238510131836, 0.6434921622276306, 0.6640604734420776, 0.6846287846565247, 0.7051970958709717, 0.7257653474807739, 0.7463337182998657, 0.7669020295143127, 0.7874703407287598, 0.8080386519432068, 0.8286069631576538, 0.8491752743721008, 0.8697435855865479, 0.8903118371963501, 0.9108801484107971, 0.9314484596252441, 0.9520167708396912, 0.9725850820541382, 0.9931533932685852, 1.0137217044830322, 1.0342899560928345, 1.0548583269119263, 1.0754265785217285, 1.0959948301315308, 1.1165632009506226, 1.1371314525604248, 1.1576998233795166, 1.1782680749893188, 1.1988364458084106, 1.219404697418213, 1.2399730682373047]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 7.0, 6.0, 7.0, 8.0, 17.0, 18.0, 14.0, 19.0, 12.0, 20.0, 16.0, 31.0, 32.0, 22.0, 27.0, 41.0, 41.0, 38.0, 34.0, 41.0, 45.0, 38.0, 51.0, 33.0, 36.0, 35.0, 37.0, 21.0, 50.0, 29.0, 21.0, 24.0, 21.0, 21.0, 23.0, 12.0, 12.0, 8.0, 5.0, 10.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0], "bins": [-0.14001882076263428, -0.1358327567577362, -0.13164669275283813, -0.12746064364910126, -0.12327457964420319, -0.11908851563930511, -0.11490245908498764, -0.11071640253067017, -0.1065303385257721, -0.10234427452087402, -0.09815821796655655, -0.09397216141223907, -0.089786097407341, -0.08560003340244293, -0.08141397684812546, -0.07722792029380798, -0.07304185628890991, -0.06885579228401184, -0.06466973572969437, -0.060483675450086594, -0.05629761517047882, -0.05211155489087105, -0.047925494611263275, -0.0437394343316555, -0.03955337405204773, -0.03536731377243996, -0.031181253492832184, -0.02699519321322441, -0.022809132933616638, -0.018623072654008865, -0.014437012374401093, -0.01025095209479332, -0.006064891815185547, -0.001878831535577774, 0.0023072287440299988, 0.006493289023637772, 0.010679349303245544, 0.014865409582853317, 0.01905146986246109, 0.023237530142068863, 0.027423590421676636, 0.03160965070128441, 0.03579571098089218, 0.039981771260499954, 0.04416783154010773, 0.0483538918197155, 0.05253995209932327, 0.056726012378931046, 0.06091207265853882, 0.06509813666343689, 0.06928419321775436, 0.07347024977207184, 0.07765631377696991, 0.08184237778186798, 0.08602843433618546, 0.09021449089050293, 0.094400554895401, 0.09858661890029907, 0.10277267545461655, 0.10695873200893402, 0.11114479601383209, 0.11533086001873016, 0.11951691657304764, 0.12370297312736511, 0.12788903713226318]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 5.0, 7.0, 5.0, 12.0, 4.0, 12.0, 18.0, 16.0, 23.0, 22.0, 19.0, 27.0, 22.0, 38.0, 42.0, 46.0, 30.0, 48.0, 43.0, 37.0, 50.0, 45.0, 51.0, 48.0, 46.0, 44.0, 41.0, 39.0, 21.0, 29.0, 22.0, 17.0, 10.0, 9.0, 11.0, 17.0, 4.0, 5.0, 5.0, 5.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3671875, -7.1363525390625, -6.905517578125, -6.6746826171875, -6.44384765625, -6.2130126953125, -5.982177734375, -5.7513427734375, -5.5205078125, -5.2896728515625, -5.058837890625, -4.8280029296875, -4.59716796875, -4.3663330078125, -4.135498046875, -3.9046630859375, -3.673828125, -3.4429931640625, -3.212158203125, -2.9813232421875, -2.75048828125, -2.5196533203125, -2.288818359375, -2.0579833984375, -1.8271484375, -1.5963134765625, -1.365478515625, -1.1346435546875, -0.90380859375, -0.6729736328125, -0.442138671875, -0.2113037109375, 0.01953125, 0.2503662109375, 0.481201171875, 0.7120361328125, 0.94287109375, 1.1737060546875, 1.404541015625, 1.6353759765625, 1.8662109375, 2.0970458984375, 2.327880859375, 2.5587158203125, 2.78955078125, 3.0203857421875, 3.251220703125, 3.4820556640625, 3.712890625, 3.9437255859375, 4.174560546875, 4.4053955078125, 4.63623046875, 4.8670654296875, 5.097900390625, 5.3287353515625, 5.5595703125, 5.7904052734375, 6.021240234375, 6.2520751953125, 6.48291015625, 6.7137451171875, 6.944580078125, 7.1754150390625, 7.40625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 5.0, 12.0, 10.0, 14.0, 16.0, 27.0, 29.0, 36.0, 57.0, 92.0, 117.0, 184.0, 262.0, 472.0, 844.0, 1441.0, 2337.0, 4266.0, 7472.0, 13588.0, 25142.0, 53522.0, 161296.0, 473121.0, 185668.0, 58428.0, 26863.0, 14319.0, 8014.0, 4517.0, 2621.0, 1439.0, 888.0, 494.0, 323.0, 204.0, 133.0, 83.0, 54.0, 47.0, 26.0, 18.0, 21.0, 13.0, 9.0, 5.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.1015625, -10.760498046875, -10.41943359375, -10.078369140625, -9.7373046875, -9.396240234375, -9.05517578125, -8.714111328125, -8.373046875, -8.031982421875, -7.69091796875, -7.349853515625, -7.0087890625, -6.667724609375, -6.32666015625, -5.985595703125, -5.64453125, -5.303466796875, -4.96240234375, -4.621337890625, -4.2802734375, -3.939208984375, -3.59814453125, -3.257080078125, -2.916015625, -2.574951171875, -2.23388671875, -1.892822265625, -1.5517578125, -1.210693359375, -0.86962890625, -0.528564453125, -0.1875, 0.153564453125, 0.49462890625, 0.835693359375, 1.1767578125, 1.517822265625, 1.85888671875, 2.199951171875, 2.541015625, 2.882080078125, 3.22314453125, 3.564208984375, 3.9052734375, 4.246337890625, 4.58740234375, 4.928466796875, 5.26953125, 5.610595703125, 5.95166015625, 6.292724609375, 6.6337890625, 6.974853515625, 7.31591796875, 7.656982421875, 7.998046875, 8.339111328125, 8.68017578125, 9.021240234375, 9.3623046875, 9.703369140625, 10.04443359375, 10.385498046875, 10.7265625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 11.0, 8.0, 16.0, 11.0, 17.0, 21.0, 30.0, 24.0, 19.0, 36.0, 31.0, 40.0, 44.0, 55.0, 72.0, 120.0, 215.0, 1425.0, 234.0, 111.0, 93.0, 68.0, 39.0, 34.0, 30.0, 32.0, 35.0, 17.0, 34.0, 18.0, 15.0, 22.0, 13.0, 14.0, 4.0, 10.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-17.265625, -16.70068359375, -16.1357421875, -15.57080078125, -15.005859375, -14.44091796875, -13.8759765625, -13.31103515625, -12.74609375, -12.18115234375, -11.6162109375, -11.05126953125, -10.486328125, -9.92138671875, -9.3564453125, -8.79150390625, -8.2265625, -7.66162109375, -7.0966796875, -6.53173828125, -5.966796875, -5.40185546875, -4.8369140625, -4.27197265625, -3.70703125, -3.14208984375, -2.5771484375, -2.01220703125, -1.447265625, -0.88232421875, -0.3173828125, 0.24755859375, 0.8125, 1.37744140625, 1.9423828125, 2.50732421875, 3.072265625, 3.63720703125, 4.2021484375, 4.76708984375, 5.33203125, 5.89697265625, 6.4619140625, 7.02685546875, 7.591796875, 8.15673828125, 8.7216796875, 9.28662109375, 9.8515625, 10.41650390625, 10.9814453125, 11.54638671875, 12.111328125, 12.67626953125, 13.2412109375, 13.80615234375, 14.37109375, 14.93603515625, 15.5009765625, 16.06591796875, 16.630859375, 17.19580078125, 17.7607421875, 18.32568359375, 18.890625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 8.0, 5.0, 12.0, 20.0, 18.0, 22.0, 20.0, 49.0, 66.0, 76.0, 119.0, 187.0, 334.0, 600.0, 1870.0, 9394.0, 84930.0, 2724202.0, 298888.0, 19576.0, 3293.0, 883.0, 381.0, 270.0, 144.0, 94.0, 57.0, 53.0, 27.0, 34.0, 19.0, 12.0, 7.0, 8.0, 8.0, 6.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.765625, -27.687744140625, -26.60986328125, -25.531982421875, -24.4541015625, -23.376220703125, -22.29833984375, -21.220458984375, -20.142578125, -19.064697265625, -17.98681640625, -16.908935546875, -15.8310546875, -14.753173828125, -13.67529296875, -12.597412109375, -11.51953125, -10.441650390625, -9.36376953125, -8.285888671875, -7.2080078125, -6.130126953125, -5.05224609375, -3.974365234375, -2.896484375, -1.818603515625, -0.74072265625, 0.337158203125, 1.4150390625, 2.492919921875, 3.57080078125, 4.648681640625, 5.7265625, 6.804443359375, 7.88232421875, 8.960205078125, 10.0380859375, 11.115966796875, 12.19384765625, 13.271728515625, 14.349609375, 15.427490234375, 16.50537109375, 17.583251953125, 18.6611328125, 19.739013671875, 20.81689453125, 21.894775390625, 22.97265625, 24.050537109375, 25.12841796875, 26.206298828125, 27.2841796875, 28.362060546875, 29.43994140625, 30.517822265625, 31.595703125, 32.673583984375, 33.75146484375, 34.829345703125, 35.9072265625, 36.985107421875, 38.06298828125, 39.140869140625, 40.21875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 22.0, 67.0, 180.0, 245.0, 260.0, 145.0, 61.0, 21.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.071720123291016, -14.571301460266113, -12.070882797241211, -9.570463180541992, -7.07004451751709, -4.5696258544921875, -2.0692062377929688, 0.4312114715576172, 2.931631088256836, 5.432049751281738, 7.932468891143799, 10.43288803100586, 12.933306694030762, 15.433725357055664, 17.934144973754883, 20.43456268310547, 22.934982299804688, 25.435401916503906, 27.935819625854492, 30.43623924255371, 32.9366569519043, 35.437076568603516, 37.937496185302734, 40.43791198730469, 42.938331604003906, 45.438751220703125, 47.939170837402344, 50.43959045410156, 52.940006256103516, 55.440425872802734, 57.94084548950195, 60.441261291503906, 62.941688537597656, 65.44210815429688, 67.9425277709961, 70.44294738769531, 72.94336700439453, 75.44378662109375, 77.94419860839844, 80.44461822509766, 82.94503784179688, 85.4454574584961, 87.94587707519531, 90.44629669189453, 92.94671630859375, 95.44712829589844, 97.94755554199219, 100.44796752929688, 102.94839477539062, 105.44881439208984, 107.94923400878906, 110.44965362548828, 112.9500732421875, 115.45048522949219, 117.95091247558594, 120.45132446289062, 122.95174407958984, 125.45216369628906, 127.95258331298828, 130.4530029296875, 132.9534149169922, 135.45384216308594, 137.95425415039062, 140.45468139648438, 142.95509338378906]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 11.0, 2.0, 6.0, 10.0, 10.0, 13.0, 22.0, 22.0, 17.0, 29.0, 26.0, 26.0, 41.0, 31.0, 43.0, 53.0, 44.0, 48.0, 44.0, 38.0, 49.0, 34.0, 34.0, 39.0, 47.0, 25.0, 23.0, 29.0, 34.0, 25.0, 18.0, 20.0, 18.0, 11.0, 18.0, 9.0, 5.0, 8.0, 13.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.56861877441406, -42.98087692260742, -41.39313888549805, -39.805397033691406, -38.21765899658203, -36.62991714477539, -35.04217529296875, -33.454437255859375, -31.866697311401367, -30.27895736694336, -28.69121742248535, -27.103477478027344, -25.515735626220703, -23.927997589111328, -22.340255737304688, -20.75251579284668, -19.164775848388672, -17.577035903930664, -15.989295959472656, -14.401555061340332, -12.813815116882324, -11.226075172424316, -9.638334274291992, -8.050594329833984, -6.462854385375977, -4.875114440917969, -3.2873740196228027, -1.6996335983276367, -0.1118936538696289, 1.475846290588379, 3.063587188720703, 4.651327133178711, 6.239070892333984, 7.826810836791992, 9.41455078125, 11.002291679382324, 12.590031623840332, 14.17777156829834, 15.765512466430664, 17.353252410888672, 18.94099235534668, 20.528732299804688, 22.116472244262695, 23.704212188720703, 25.291954040527344, 26.87969207763672, 28.46743392944336, 30.055173873901367, 31.642913818359375, 33.230655670166016, 34.81839370727539, 36.40613555908203, 37.993873596191406, 39.58161544799805, 41.16935729980469, 42.75709533691406, 44.34483337402344, 45.93257522583008, 47.52031326293945, 49.108055114746094, 50.69579315185547, 52.28353500366211, 53.87127685546875, 55.459014892578125, 57.046756744384766]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 8.0, 6.0, 12.0, 9.0, 15.0, 15.0, 7.0, 21.0, 29.0, 22.0, 33.0, 25.0, 35.0, 28.0, 42.0, 40.0, 38.0, 39.0, 33.0, 44.0, 38.0, 42.0, 48.0, 33.0, 40.0, 38.0, 36.0, 34.0, 30.0, 26.0, 27.0, 21.0, 15.0, 16.0, 8.0, 12.0, 6.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.01953125, -6.7979736328125, -6.576416015625, -6.3548583984375, -6.13330078125, -5.9117431640625, -5.690185546875, -5.4686279296875, -5.2470703125, -5.0255126953125, -4.803955078125, -4.5823974609375, -4.36083984375, -4.1392822265625, -3.917724609375, -3.6961669921875, -3.474609375, -3.2530517578125, -3.031494140625, -2.8099365234375, -2.58837890625, -2.3668212890625, -2.145263671875, -1.9237060546875, -1.7021484375, -1.4805908203125, -1.259033203125, -1.0374755859375, -0.81591796875, -0.5943603515625, -0.372802734375, -0.1512451171875, 0.0703125, 0.2918701171875, 0.513427734375, 0.7349853515625, 0.95654296875, 1.1781005859375, 1.399658203125, 1.6212158203125, 1.8427734375, 2.0643310546875, 2.285888671875, 2.5074462890625, 2.72900390625, 2.9505615234375, 3.172119140625, 3.3936767578125, 3.615234375, 3.8367919921875, 4.058349609375, 4.2799072265625, 4.50146484375, 4.7230224609375, 4.944580078125, 5.1661376953125, 5.3876953125, 5.6092529296875, 5.830810546875, 6.0523681640625, 6.27392578125, 6.4954833984375, 6.717041015625, 6.9385986328125, 7.16015625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 9.0, 2.0, 20.0, 20.0, 21.0, 37.0, 29.0, 71.0, 102.0, 125.0, 180.0, 255.0, 368.0, 633.0, 1032.0, 1795.0, 3217.0, 6060.0, 13004.0, 30722.0, 91372.0, 342958.0, 1295408.0, 1676513.0, 522871.0, 133376.0, 41698.0, 16159.0, 7556.0, 3722.0, 1953.0, 1120.0, 669.0, 384.0, 254.0, 172.0, 111.0, 72.0, 62.0, 35.0, 31.0, 25.0, 18.0, 12.0, 10.0, 4.0, 7.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.40625, -10.09228515625, -9.7783203125, -9.46435546875, -9.150390625, -8.83642578125, -8.5224609375, -8.20849609375, -7.89453125, -7.58056640625, -7.2666015625, -6.95263671875, -6.638671875, -6.32470703125, -6.0107421875, -5.69677734375, -5.3828125, -5.06884765625, -4.7548828125, -4.44091796875, -4.126953125, -3.81298828125, -3.4990234375, -3.18505859375, -2.87109375, -2.55712890625, -2.2431640625, -1.92919921875, -1.615234375, -1.30126953125, -0.9873046875, -0.67333984375, -0.359375, -0.04541015625, 0.2685546875, 0.58251953125, 0.896484375, 1.21044921875, 1.5244140625, 1.83837890625, 2.15234375, 2.46630859375, 2.7802734375, 3.09423828125, 3.408203125, 3.72216796875, 4.0361328125, 4.35009765625, 4.6640625, 4.97802734375, 5.2919921875, 5.60595703125, 5.919921875, 6.23388671875, 6.5478515625, 6.86181640625, 7.17578125, 7.48974609375, 7.8037109375, 8.11767578125, 8.431640625, 8.74560546875, 9.0595703125, 9.37353515625, 9.6875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 6.0, 11.0, 18.0, 11.0, 30.0, 42.0, 68.0, 77.0, 104.0, 163.0, 266.0, 416.0, 580.0, 655.0, 513.0, 370.0, 242.0, 161.0, 107.0, 81.0, 50.0, 28.0, 25.0, 13.0, 13.0, 7.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.09375, -11.6533203125, -11.212890625, -10.7724609375, -10.33203125, -9.8916015625, -9.451171875, -9.0107421875, -8.5703125, -8.1298828125, -7.689453125, -7.2490234375, -6.80859375, -6.3681640625, -5.927734375, -5.4873046875, -5.046875, -4.6064453125, -4.166015625, -3.7255859375, -3.28515625, -2.8447265625, -2.404296875, -1.9638671875, -1.5234375, -1.0830078125, -0.642578125, -0.2021484375, 0.23828125, 0.6787109375, 1.119140625, 1.5595703125, 2.0, 2.4404296875, 2.880859375, 3.3212890625, 3.76171875, 4.2021484375, 4.642578125, 5.0830078125, 5.5234375, 5.9638671875, 6.404296875, 6.8447265625, 7.28515625, 7.7255859375, 8.166015625, 8.6064453125, 9.046875, 9.4873046875, 9.927734375, 10.3681640625, 10.80859375, 11.2490234375, 11.689453125, 12.1298828125, 12.5703125, 13.0107421875, 13.451171875, 13.8916015625, 14.33203125, 14.7724609375, 15.212890625, 15.6533203125, 16.09375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 13.0, 15.0, 16.0, 24.0, 60.0, 60.0, 133.0, 253.0, 487.0, 1336.0, 5192.0, 40707.0, 1106551.0, 2941080.0, 86518.0, 8666.0, 1849.0, 669.0, 237.0, 151.0, 97.0, 56.0, 33.0, 24.0, 16.0, 12.0, 5.0, 5.0, 6.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-43.5625, -42.3896484375, -41.216796875, -40.0439453125, -38.87109375, -37.6982421875, -36.525390625, -35.3525390625, -34.1796875, -33.0068359375, -31.833984375, -30.6611328125, -29.48828125, -28.3154296875, -27.142578125, -25.9697265625, -24.796875, -23.6240234375, -22.451171875, -21.2783203125, -20.10546875, -18.9326171875, -17.759765625, -16.5869140625, -15.4140625, -14.2412109375, -13.068359375, -11.8955078125, -10.72265625, -9.5498046875, -8.376953125, -7.2041015625, -6.03125, -4.8583984375, -3.685546875, -2.5126953125, -1.33984375, -0.1669921875, 1.005859375, 2.1787109375, 3.3515625, 4.5244140625, 5.697265625, 6.8701171875, 8.04296875, 9.2158203125, 10.388671875, 11.5615234375, 12.734375, 13.9072265625, 15.080078125, 16.2529296875, 17.42578125, 18.5986328125, 19.771484375, 20.9443359375, 22.1171875, 23.2900390625, 24.462890625, 25.6357421875, 26.80859375, 27.9814453125, 29.154296875, 30.3271484375, 31.5]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 11.0, 25.0, 198.0, 444.0, 265.0, 59.0, 14.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-149.0503387451172, -142.17860412597656, -135.30686950683594, -128.4351348876953, -121.56340026855469, -114.69166564941406, -107.81993103027344, -100.94819641113281, -94.07646179199219, -87.20472717285156, -80.33299255371094, -73.46125793457031, -66.58952331542969, -59.71778869628906, -52.84605407714844, -45.97431945800781, -39.10258483886719, -32.23085021972656, -25.359115600585938, -18.487380981445312, -11.615646362304688, -4.7439117431640625, 2.1278228759765625, 8.999557495117188, 15.871292114257812, 22.743026733398438, 29.614761352539062, 36.48649597167969, 43.35823059082031, 50.22996520996094, 57.10169982910156, 63.97343444824219, 70.84515380859375, 77.71688842773438, 84.588623046875, 91.46035766601562, 98.33209228515625, 105.20382690429688, 112.0755615234375, 118.94729614257812, 125.81903076171875, 132.69076538085938, 139.5625, 146.43423461914062, 153.30596923828125, 160.17770385742188, 167.0494384765625, 173.92117309570312, 180.79290771484375, 187.66464233398438, 194.536376953125, 201.40811157226562, 208.27984619140625, 215.15158081054688, 222.0233154296875, 228.89505004882812, 235.76678466796875, 242.63851928710938, 249.51025390625, 256.3819885253906, 263.25372314453125, 270.1254577636719, 276.9971923828125, 283.8689270019531, 290.74066162109375]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 6.0, 8.0, 9.0, 3.0, 15.0, 11.0, 12.0, 14.0, 19.0, 19.0, 26.0, 21.0, 31.0, 36.0, 21.0, 29.0, 36.0, 44.0, 39.0, 37.0, 38.0, 50.0, 39.0, 43.0, 38.0, 45.0, 39.0, 32.0, 30.0, 21.0, 23.0, 28.0, 30.0, 23.0, 17.0, 14.0, 11.0, 11.0, 11.0, 10.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.35907745361328, -33.19776153564453, -32.03644943237305, -30.875133514404297, -29.71381950378418, -28.552505493164062, -27.391191482543945, -26.229877471923828, -25.068561553955078, -23.90724754333496, -22.745933532714844, -21.584617614746094, -20.423303604125977, -19.26198959350586, -18.100675582885742, -16.939361572265625, -15.778047561645508, -14.61673355102539, -13.455418586730957, -12.29410457611084, -11.132789611816406, -9.971475601196289, -8.810161590576172, -7.648846626281738, -6.487532615661621, -5.326218128204346, -4.16490364074707, -3.003589630126953, -1.8422751426696777, -0.6809606552124023, 0.48035335540771484, 1.6416683197021484, 2.8029823303222656, 3.964296817779541, 5.125611305236816, 6.286925315856934, 7.448239803314209, 8.609554290771484, 9.770868301391602, 10.932183265686035, 12.093497276306152, 13.25481128692627, 14.416126251220703, 15.57744026184082, 16.738754272460938, 17.900070190429688, 19.061382293701172, 20.222698211669922, 21.38401222229004, 22.545326232910156, 23.706640243530273, 24.86795425415039, 26.02927017211914, 27.190584182739258, 28.351898193359375, 29.513214111328125, 30.67452621459961, 31.835840225219727, 32.997154235839844, 34.158470153808594, 35.31978225708008, 36.48109817504883, 37.64241027832031, 38.80372619628906, 39.96504211425781]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 9.0, 11.0, 12.0, 11.0, 12.0, 12.0, 17.0, 9.0, 29.0, 25.0, 29.0, 19.0, 31.0, 34.0, 44.0, 46.0, 39.0, 30.0, 51.0, 47.0, 50.0, 35.0, 37.0, 34.0, 41.0, 44.0, 32.0, 33.0, 29.0, 24.0, 27.0, 18.0, 19.0, 10.0, 9.0, 10.0, 10.0, 2.0, 8.0, 5.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0390625, -7.81219482421875, -7.5853271484375, -7.35845947265625, -7.131591796875, -6.90472412109375, -6.6778564453125, -6.45098876953125, -6.22412109375, -5.99725341796875, -5.7703857421875, -5.54351806640625, -5.316650390625, -5.08978271484375, -4.8629150390625, -4.63604736328125, -4.4091796875, -4.18231201171875, -3.9554443359375, -3.72857666015625, -3.501708984375, -3.27484130859375, -3.0479736328125, -2.82110595703125, -2.59423828125, -2.36737060546875, -2.1405029296875, -1.91363525390625, -1.686767578125, -1.45989990234375, -1.2330322265625, -1.00616455078125, -0.779296875, -0.55242919921875, -0.3255615234375, -0.09869384765625, 0.128173828125, 0.35504150390625, 0.5819091796875, 0.80877685546875, 1.03564453125, 1.26251220703125, 1.4893798828125, 1.71624755859375, 1.943115234375, 2.16998291015625, 2.3968505859375, 2.62371826171875, 2.8505859375, 3.07745361328125, 3.3043212890625, 3.53118896484375, 3.758056640625, 3.98492431640625, 4.2117919921875, 4.43865966796875, 4.66552734375, 4.89239501953125, 5.1192626953125, 5.34613037109375, 5.572998046875, 5.79986572265625, 6.0267333984375, 6.25360107421875, 6.48046875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 13.0, 9.0, 18.0, 39.0, 56.0, 72.0, 93.0, 164.0, 251.0, 387.0, 535.0, 826.0, 1282.0, 2010.0, 3453.0, 5019.0, 8057.0, 12956.0, 20871.0, 32910.0, 51759.0, 78621.0, 114226.0, 148558.0, 158432.0, 133409.0, 96422.0, 64748.0, 41998.0, 26556.0, 16627.0, 10333.0, 6554.0, 4062.0, 2550.0, 1638.0, 1028.0, 720.0, 441.0, 291.0, 194.0, 128.0, 91.0, 48.0, 33.0, 23.0, 18.0, 6.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7138671875, -0.690277099609375, -0.66668701171875, -0.643096923828125, -0.6195068359375, -0.595916748046875, -0.57232666015625, -0.548736572265625, -0.525146484375, -0.501556396484375, -0.47796630859375, -0.454376220703125, -0.4307861328125, -0.407196044921875, -0.38360595703125, -0.360015869140625, -0.33642578125, -0.312835693359375, -0.28924560546875, -0.265655517578125, -0.2420654296875, -0.218475341796875, -0.19488525390625, -0.171295166015625, -0.147705078125, -0.124114990234375, -0.10052490234375, -0.076934814453125, -0.0533447265625, -0.029754638671875, -0.00616455078125, 0.017425537109375, 0.041015625, 0.064605712890625, 0.08819580078125, 0.111785888671875, 0.1353759765625, 0.158966064453125, 0.18255615234375, 0.206146240234375, 0.229736328125, 0.253326416015625, 0.27691650390625, 0.300506591796875, 0.3240966796875, 0.347686767578125, 0.37127685546875, 0.394866943359375, 0.41845703125, 0.442047119140625, 0.46563720703125, 0.489227294921875, 0.5128173828125, 0.536407470703125, 0.55999755859375, 0.583587646484375, 0.607177734375, 0.630767822265625, 0.65435791015625, 0.677947998046875, 0.7015380859375, 0.725128173828125, 0.74871826171875, 0.772308349609375, 0.7958984375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 6.0, 10.0, 9.0, 13.0, 11.0, 9.0, 15.0, 15.0, 18.0, 22.0, 29.0, 29.0, 33.0, 27.0, 31.0, 38.0, 40.0, 43.0, 42.0, 38.0, 1063.0, 45.0, 35.0, 31.0, 39.0, 30.0, 27.0, 38.0, 33.0, 34.0, 28.0, 27.0, 20.0, 18.0, 12.0, 12.0, 13.0, 5.0, 10.0, 5.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.21484375, -4.0728759765625, -3.930908203125, -3.7889404296875, -3.64697265625, -3.5050048828125, -3.363037109375, -3.2210693359375, -3.0791015625, -2.9371337890625, -2.795166015625, -2.6531982421875, -2.51123046875, -2.3692626953125, -2.227294921875, -2.0853271484375, -1.943359375, -1.8013916015625, -1.659423828125, -1.5174560546875, -1.37548828125, -1.2335205078125, -1.091552734375, -0.9495849609375, -0.8076171875, -0.6656494140625, -0.523681640625, -0.3817138671875, -0.23974609375, -0.0977783203125, 0.044189453125, 0.1861572265625, 0.328125, 0.4700927734375, 0.612060546875, 0.7540283203125, 0.89599609375, 1.0379638671875, 1.179931640625, 1.3218994140625, 1.4638671875, 1.6058349609375, 1.747802734375, 1.8897705078125, 2.03173828125, 2.1737060546875, 2.315673828125, 2.4576416015625, 2.599609375, 2.7415771484375, 2.883544921875, 3.0255126953125, 3.16748046875, 3.3094482421875, 3.451416015625, 3.5933837890625, 3.7353515625, 3.8773193359375, 4.019287109375, 4.1612548828125, 4.30322265625, 4.4451904296875, 4.587158203125, 4.7291259765625, 4.87109375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 8.0, 10.0, 17.0, 29.0, 24.0, 42.0, 69.0, 100.0, 175.0, 284.0, 437.0, 727.0, 1207.0, 2035.0, 3619.0, 6169.0, 10791.0, 19222.0, 33775.0, 58960.0, 102372.0, 182785.0, 913507.0, 415904.0, 146349.0, 84954.0, 48695.0, 27862.0, 15661.0, 8798.0, 5069.0, 3034.0, 1741.0, 1033.0, 637.0, 375.0, 234.0, 158.0, 86.0, 57.0, 49.0, 21.0, 11.0, 22.0, 4.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56982421875, -0.5513381958007812, -0.5328521728515625, -0.5143661499023438, -0.495880126953125, -0.47739410400390625, -0.4589080810546875, -0.44042205810546875, -0.42193603515625, -0.40345001220703125, -0.3849639892578125, -0.36647796630859375, -0.347991943359375, -0.32950592041015625, -0.3110198974609375, -0.29253387451171875, -0.2740478515625, -0.25556182861328125, -0.2370758056640625, -0.21858978271484375, -0.200103759765625, -0.18161773681640625, -0.1631317138671875, -0.14464569091796875, -0.12615966796875, -0.10767364501953125, -0.0891876220703125, -0.07070159912109375, -0.052215576171875, -0.03372955322265625, -0.0152435302734375, 0.00324249267578125, 0.021728515625, 0.04021453857421875, 0.0587005615234375, 0.07718658447265625, 0.095672607421875, 0.11415863037109375, 0.1326446533203125, 0.15113067626953125, 0.16961669921875, 0.18810272216796875, 0.2065887451171875, 0.22507476806640625, 0.243560791015625, 0.26204681396484375, 0.2805328369140625, 0.29901885986328125, 0.3175048828125, 0.33599090576171875, 0.3544769287109375, 0.37296295166015625, 0.391448974609375, 0.40993499755859375, 0.4284210205078125, 0.44690704345703125, 0.46539306640625, 0.48387908935546875, 0.5023651123046875, 0.5208511352539062, 0.539337158203125, 0.5578231811523438, 0.5763092041015625, 0.5947952270507812, 0.61328125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 13.0, 11.0, 17.0, 28.0, 32.0, 39.0, 55.0, 53.0, 71.0, 94.0, 89.0, 95.0, 76.0, 72.0, 61.0, 43.0, 29.0, 29.0, 15.0, 14.0, 8.0, 8.0, 9.0, 3.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12115478515625, -0.11742305755615234, -0.11369132995605469, -0.10995960235595703, -0.10622787475585938, -0.10249614715576172, -0.09876441955566406, -0.0950326919555664, -0.09130096435546875, -0.0875692367553711, -0.08383750915527344, -0.08010578155517578, -0.07637405395507812, -0.07264232635498047, -0.06891059875488281, -0.06517887115478516, -0.0614471435546875, -0.057715415954589844, -0.05398368835449219, -0.05025196075439453, -0.046520233154296875, -0.04278850555419922, -0.03905677795410156, -0.035325050354003906, -0.03159332275390625, -0.027861595153808594, -0.024129867553710938, -0.02039813995361328, -0.016666412353515625, -0.012934684753417969, -0.009202957153320312, -0.005471229553222656, -0.001739501953125, 0.0019922256469726562, 0.0057239532470703125, 0.009455680847167969, 0.013187408447265625, 0.01691913604736328, 0.020650863647460938, 0.024382591247558594, 0.02811431884765625, 0.031846046447753906, 0.03557777404785156, 0.03930950164794922, 0.043041229248046875, 0.04677295684814453, 0.05050468444824219, 0.054236412048339844, 0.0579681396484375, 0.061699867248535156, 0.06543159484863281, 0.06916332244873047, 0.07289505004882812, 0.07662677764892578, 0.08035850524902344, 0.0840902328491211, 0.08782196044921875, 0.0915536880493164, 0.09528541564941406, 0.09901714324951172, 0.10274887084960938, 0.10648059844970703, 0.11021232604980469, 0.11394405364990234, 0.11767578125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 3.0, 7.0, 4.0, 12.0, 14.0, 17.0, 21.0, 36.0, 48.0, 64.0, 129.0, 195.0, 398.0, 2388.0, 1002709.0, 41161.0, 686.0, 246.0, 131.0, 74.0, 53.0, 36.0, 26.0, 23.0, 13.0, 11.0, 7.0, 11.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.52734375, -2.44775390625, -2.3681640625, -2.28857421875, -2.208984375, -2.12939453125, -2.0498046875, -1.97021484375, -1.890625, -1.81103515625, -1.7314453125, -1.65185546875, -1.572265625, -1.49267578125, -1.4130859375, -1.33349609375, -1.25390625, -1.17431640625, -1.0947265625, -1.01513671875, -0.935546875, -0.85595703125, -0.7763671875, -0.69677734375, -0.6171875, -0.53759765625, -0.4580078125, -0.37841796875, -0.298828125, -0.21923828125, -0.1396484375, -0.06005859375, 0.01953125, 0.09912109375, 0.1787109375, 0.25830078125, 0.337890625, 0.41748046875, 0.4970703125, 0.57666015625, 0.65625, 0.73583984375, 0.8154296875, 0.89501953125, 0.974609375, 1.05419921875, 1.1337890625, 1.21337890625, 1.29296875, 1.37255859375, 1.4521484375, 1.53173828125, 1.611328125, 1.69091796875, 1.7705078125, 1.85009765625, 1.9296875, 2.00927734375, 2.0888671875, 2.16845703125, 2.248046875, 2.32763671875, 2.4072265625, 2.48681640625, 2.56640625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [9.0, 59.0, 380.0, 472.0, 81.0, 10.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06752588599920273, -0.045472241938114166, -0.023418594151735306, -0.0013649463653564453, 0.020688697695732117, 0.04274234175682068, 0.06479599326848984, 0.0868496373295784, 0.10890328139066696, 0.13095693290233612, 0.15301057696342468, 0.17506422102451324, 0.1971178650856018, 0.21917150914669037, 0.24122515320777893, 0.2632788121700287, 0.28533244132995605, 0.3073861002922058, 0.3294397294521332, 0.35149338841438293, 0.3735470175743103, 0.39560067653656006, 0.4176543354988098, 0.4397079646587372, 0.46176162362098694, 0.4838152825832367, 0.5058689117431641, 0.5279225707054138, 0.5499762296676636, 0.5720298290252686, 0.5940834879875183, 0.6161371469497681, 0.6381908059120178, 0.6602444648742676, 0.6822981238365173, 0.7043517231941223, 0.7264053821563721, 0.7484590411186218, 0.7705127000808716, 0.7925662994384766, 0.8146199584007263, 0.8366736173629761, 0.8587272763252258, 0.8807808756828308, 0.9028345346450806, 0.9248881936073303, 0.9469418525695801, 0.9689954519271851, 0.9910491704940796, 1.0131027698516846, 1.035156488418579, 1.057210087776184, 1.0792638063430786, 1.1013174057006836, 1.1233710050582886, 1.145424723625183, 1.167478322982788, 1.189531922340393, 1.2115856409072876, 1.2336392402648926, 1.255692958831787, 1.277746558189392, 1.299800157546997, 1.3218538761138916, 1.3439074754714966]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 11.0, 7.0, 11.0, 14.0, 11.0, 16.0, 14.0, 18.0, 15.0, 29.0, 30.0, 22.0, 36.0, 29.0, 29.0, 37.0, 37.0, 38.0, 34.0, 41.0, 41.0, 35.0, 39.0, 34.0, 48.0, 46.0, 27.0, 30.0, 37.0, 29.0, 36.0, 25.0, 17.0, 10.0, 17.0, 10.0, 4.0, 3.0, 5.0, 7.0, 11.0, 2.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11770528554916382, -0.11405579000711441, -0.1104062870144844, -0.106756791472435, -0.10310728847980499, -0.09945779293775558, -0.09580829739570618, -0.09215879440307617, -0.08850929886102676, -0.08485980331897736, -0.08121030032634735, -0.07756080478429794, -0.07391130924224854, -0.07026180624961853, -0.06661231070756912, -0.06296281516551971, -0.05931331217288971, -0.05566381290555, -0.0520143136382103, -0.04836481809616089, -0.04471531882882118, -0.041065819561481476, -0.03741632401943207, -0.03376682475209236, -0.030117325484752655, -0.02646782621741295, -0.02281832881271839, -0.019168831408023834, -0.015519332140684128, -0.011869832873344421, -0.008220335468649864, -0.004570838063955307, -0.0009213387966156006, 0.0027281595394015312, 0.006377657875418663, 0.010027156211435795, 0.013676654547452927, 0.017326153814792633, 0.02097565121948719, 0.024625148624181747, 0.028274647891521454, 0.03192414715886116, 0.03557364642620087, 0.039223141968250275, 0.04287264123558998, 0.04652214050292969, 0.050171636044979095, 0.0538211353123188, 0.05747063457965851, 0.061120133846998215, 0.06476963311433792, 0.06841912865638733, 0.07206863164901733, 0.07571812719106674, 0.07936762273311615, 0.08301712572574615, 0.08666662126779556, 0.09031611680984497, 0.09396561980247498, 0.09761511534452438, 0.10126461088657379, 0.1049141138792038, 0.1085636094212532, 0.11221310496330261, 0.11586260795593262]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 7.0, 15.0, 10.0, 8.0, 16.0, 14.0, 15.0, 14.0, 22.0, 22.0, 24.0, 26.0, 31.0, 35.0, 35.0, 53.0, 34.0, 52.0, 39.0, 41.0, 41.0, 40.0, 31.0, 35.0, 33.0, 39.0, 35.0, 34.0, 32.0, 25.0, 22.0, 18.0, 17.0, 16.0, 11.0, 9.0, 11.0, 6.0, 3.0, 7.0, 2.0, 1.0, 5.0, 3.0, 0.0, 6.0], "bins": [-7.9375, -7.72552490234375, -7.5135498046875, -7.30157470703125, -7.089599609375, -6.87762451171875, -6.6656494140625, -6.45367431640625, -6.24169921875, -6.02972412109375, -5.8177490234375, -5.60577392578125, -5.393798828125, -5.18182373046875, -4.9698486328125, -4.75787353515625, -4.5458984375, -4.33392333984375, -4.1219482421875, -3.90997314453125, -3.697998046875, -3.48602294921875, -3.2740478515625, -3.06207275390625, -2.85009765625, -2.63812255859375, -2.4261474609375, -2.21417236328125, -2.002197265625, -1.79022216796875, -1.5782470703125, -1.36627197265625, -1.154296875, -0.94232177734375, -0.7303466796875, -0.51837158203125, -0.306396484375, -0.09442138671875, 0.1175537109375, 0.32952880859375, 0.54150390625, 0.75347900390625, 0.9654541015625, 1.17742919921875, 1.389404296875, 1.60137939453125, 1.8133544921875, 2.02532958984375, 2.2373046875, 2.44927978515625, 2.6612548828125, 2.87322998046875, 3.085205078125, 3.29718017578125, 3.5091552734375, 3.72113037109375, 3.93310546875, 4.14508056640625, 4.3570556640625, 4.56903076171875, 4.781005859375, 4.99298095703125, 5.2049560546875, 5.41693115234375, 5.62890625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 7.0, 5.0, 8.0, 16.0, 19.0, 23.0, 46.0, 53.0, 104.0, 154.0, 189.0, 358.0, 571.0, 1016.0, 1698.0, 2703.0, 4849.0, 9020.0, 17606.0, 37440.0, 95278.0, 286831.0, 364503.0, 131027.0, 48376.0, 21685.0, 11068.0, 5964.0, 3223.0, 1881.0, 1107.0, 653.0, 394.0, 243.0, 145.0, 99.0, 66.0, 40.0, 26.0, 20.0, 12.0, 6.0, 9.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.1171875, -10.7713623046875, -10.425537109375, -10.0797119140625, -9.73388671875, -9.3880615234375, -9.042236328125, -8.6964111328125, -8.3505859375, -8.0047607421875, -7.658935546875, -7.3131103515625, -6.96728515625, -6.6214599609375, -6.275634765625, -5.9298095703125, -5.583984375, -5.2381591796875, -4.892333984375, -4.5465087890625, -4.20068359375, -3.8548583984375, -3.509033203125, -3.1632080078125, -2.8173828125, -2.4715576171875, -2.125732421875, -1.7799072265625, -1.43408203125, -1.0882568359375, -0.742431640625, -0.3966064453125, -0.05078125, 0.2950439453125, 0.640869140625, 0.9866943359375, 1.33251953125, 1.6783447265625, 2.024169921875, 2.3699951171875, 2.7158203125, 3.0616455078125, 3.407470703125, 3.7532958984375, 4.09912109375, 4.4449462890625, 4.790771484375, 5.1365966796875, 5.482421875, 5.8282470703125, 6.174072265625, 6.5198974609375, 6.86572265625, 7.2115478515625, 7.557373046875, 7.9031982421875, 8.2490234375, 8.5948486328125, 8.940673828125, 9.2864990234375, 9.63232421875, 9.9781494140625, 10.323974609375, 10.6697998046875, 11.015625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 5.0, 4.0, 0.0, 8.0, 6.0, 4.0, 8.0, 9.0, 8.0, 10.0, 20.0, 13.0, 25.0, 19.0, 23.0, 28.0, 31.0, 32.0, 32.0, 52.0, 59.0, 105.0, 139.0, 277.0, 1351.0, 199.0, 102.0, 67.0, 55.0, 51.0, 40.0, 33.0, 34.0, 24.0, 21.0, 20.0, 24.0, 12.0, 21.0, 16.0, 14.0, 9.0, 8.0, 5.0, 8.0, 8.0, 5.0, 2.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-17.59375, -17.04833984375, -16.5029296875, -15.95751953125, -15.412109375, -14.86669921875, -14.3212890625, -13.77587890625, -13.23046875, -12.68505859375, -12.1396484375, -11.59423828125, -11.048828125, -10.50341796875, -9.9580078125, -9.41259765625, -8.8671875, -8.32177734375, -7.7763671875, -7.23095703125, -6.685546875, -6.14013671875, -5.5947265625, -5.04931640625, -4.50390625, -3.95849609375, -3.4130859375, -2.86767578125, -2.322265625, -1.77685546875, -1.2314453125, -0.68603515625, -0.140625, 0.40478515625, 0.9501953125, 1.49560546875, 2.041015625, 2.58642578125, 3.1318359375, 3.67724609375, 4.22265625, 4.76806640625, 5.3134765625, 5.85888671875, 6.404296875, 6.94970703125, 7.4951171875, 8.04052734375, 8.5859375, 9.13134765625, 9.6767578125, 10.22216796875, 10.767578125, 11.31298828125, 11.8583984375, 12.40380859375, 12.94921875, 13.49462890625, 14.0400390625, 14.58544921875, 15.130859375, 15.67626953125, 16.2216796875, 16.76708984375, 17.3125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 1.0, 5.0, 7.0, 7.0, 8.0, 17.0, 14.0, 26.0, 23.0, 37.0, 61.0, 77.0, 134.0, 217.0, 407.0, 746.0, 1848.0, 5533.0, 22915.0, 177352.0, 2456921.0, 427463.0, 39097.0, 8160.0, 2541.0, 961.0, 452.0, 234.0, 124.0, 87.0, 68.0, 48.0, 25.0, 23.0, 20.0, 16.0, 10.0, 6.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -19.935302734375, -19.21435546875, -18.493408203125, -17.7724609375, -17.051513671875, -16.33056640625, -15.609619140625, -14.888671875, -14.167724609375, -13.44677734375, -12.725830078125, -12.0048828125, -11.283935546875, -10.56298828125, -9.842041015625, -9.12109375, -8.400146484375, -7.67919921875, -6.958251953125, -6.2373046875, -5.516357421875, -4.79541015625, -4.074462890625, -3.353515625, -2.632568359375, -1.91162109375, -1.190673828125, -0.4697265625, 0.251220703125, 0.97216796875, 1.693115234375, 2.4140625, 3.135009765625, 3.85595703125, 4.576904296875, 5.2978515625, 6.018798828125, 6.73974609375, 7.460693359375, 8.181640625, 8.902587890625, 9.62353515625, 10.344482421875, 11.0654296875, 11.786376953125, 12.50732421875, 13.228271484375, 13.94921875, 14.670166015625, 15.39111328125, 16.112060546875, 16.8330078125, 17.553955078125, 18.27490234375, 18.995849609375, 19.716796875, 20.437744140625, 21.15869140625, 21.879638671875, 22.6005859375, 23.321533203125, 24.04248046875, 24.763427734375, 25.484375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 147.0, 651.0, 210.0, 5.0, 1.0, 0.0, 1.0], "bins": [-437.4383239746094, -429.96990966796875, -422.5014953613281, -415.0330810546875, -407.5646667480469, -400.09625244140625, -392.6278381347656, -385.159423828125, -377.6910400390625, -370.2226257324219, -362.75421142578125, -355.2857971191406, -347.8173828125, -340.3489685058594, -332.88055419921875, -325.41217041015625, -317.9437255859375, -310.4753112792969, -303.00689697265625, -295.5384826660156, -288.070068359375, -280.6016540527344, -273.13323974609375, -265.66485595703125, -258.1964111328125, -250.72799682617188, -243.25958251953125, -235.79116821289062, -228.32275390625, -220.85433959960938, -213.3859405517578, -205.9175262451172, -198.44912719726562, -190.980712890625, -183.51229858398438, -176.04388427734375, -168.57546997070312, -161.1070556640625, -153.63865661621094, -146.1702423095703, -138.70184326171875, -131.23342895507812, -123.7650146484375, -116.2966079711914, -108.82819366455078, -101.35977935791016, -93.89137268066406, -86.42295837402344, -78.95453643798828, -71.48612213134766, -64.01771545410156, -56.54930114746094, -49.08088684082031, -41.61247253417969, -34.14406204223633, -26.67565155029297, -19.207237243652344, -11.738824844360352, -4.270412445068359, 3.197999954223633, 10.666412353515625, 18.13482666015625, 25.60323715209961, 33.07164764404297, 40.540061950683594]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 7.0, 7.0, 11.0, 16.0, 12.0, 19.0, 15.0, 17.0, 24.0, 28.0, 30.0, 27.0, 37.0, 40.0, 47.0, 41.0, 39.0, 38.0, 45.0, 39.0, 37.0, 41.0, 42.0, 43.0, 28.0, 36.0, 27.0, 34.0, 30.0, 34.0, 18.0, 19.0, 19.0, 14.0, 9.0, 9.0, 6.0, 7.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.208702087402344, -42.77646255493164, -41.34422302246094, -39.911983489990234, -38.47974395751953, -37.04750442504883, -35.615264892578125, -34.18302536010742, -32.75078582763672, -31.318546295166016, -29.886306762695312, -28.45406723022461, -27.021827697753906, -25.589588165283203, -24.1573486328125, -22.725109100341797, -21.292871475219727, -19.860631942749023, -18.42839241027832, -16.996152877807617, -15.563913345336914, -14.131673812866211, -12.699435234069824, -11.267195701599121, -9.834956169128418, -8.402716636657715, -6.970477104187012, -5.538238048553467, -4.105998516082764, -2.6737589836120605, -1.2415199279785156, 0.1907196044921875, 1.6229591369628906, 3.0551986694335938, 4.487438201904297, 5.919677257537842, 7.351916790008545, 8.784156799316406, 10.216395378112793, 11.648634910583496, 13.0808744430542, 14.513113975524902, 15.945353507995605, 17.377592086791992, 18.809831619262695, 20.2420711517334, 21.6743106842041, 23.106550216674805, 24.538789749145508, 25.97102928161621, 27.403268814086914, 28.835508346557617, 30.26774787902832, 31.699987411499023, 33.132225036621094, 34.5644645690918, 35.9967041015625, 37.4289436340332, 38.861183166503906, 40.29342269897461, 41.72566223144531, 43.157901763916016, 44.59014129638672, 46.02238082885742, 47.454620361328125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 8.0, 5.0, 6.0, 11.0, 11.0, 12.0, 15.0, 19.0, 17.0, 26.0, 22.0, 19.0, 31.0, 33.0, 32.0, 38.0, 37.0, 33.0, 31.0, 38.0, 34.0, 33.0, 34.0, 40.0, 33.0, 44.0, 36.0, 29.0, 31.0, 20.0, 29.0, 19.0, 25.0, 25.0, 15.0, 15.0, 11.0, 17.0, 15.0, 11.0, 5.0, 7.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.52734375, -6.33038330078125, -6.1334228515625, -5.93646240234375, -5.739501953125, -5.54254150390625, -5.3455810546875, -5.14862060546875, -4.95166015625, -4.75469970703125, -4.5577392578125, -4.36077880859375, -4.163818359375, -3.96685791015625, -3.7698974609375, -3.57293701171875, -3.3759765625, -3.17901611328125, -2.9820556640625, -2.78509521484375, -2.588134765625, -2.39117431640625, -2.1942138671875, -1.99725341796875, -1.80029296875, -1.60333251953125, -1.4063720703125, -1.20941162109375, -1.012451171875, -0.81549072265625, -0.6185302734375, -0.42156982421875, -0.224609375, -0.02764892578125, 0.1693115234375, 0.36627197265625, 0.563232421875, 0.76019287109375, 0.9571533203125, 1.15411376953125, 1.35107421875, 1.54803466796875, 1.7449951171875, 1.94195556640625, 2.138916015625, 2.33587646484375, 2.5328369140625, 2.72979736328125, 2.9267578125, 3.12371826171875, 3.3206787109375, 3.51763916015625, 3.714599609375, 3.91156005859375, 4.1085205078125, 4.30548095703125, 4.50244140625, 4.69940185546875, 4.8963623046875, 5.09332275390625, 5.290283203125, 5.48724365234375, 5.6842041015625, 5.88116455078125, 6.078125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 11.0, 15.0, 22.0, 37.0, 43.0, 56.0, 97.0, 128.0, 179.0, 265.0, 393.0, 575.0, 836.0, 1253.0, 2108.0, 3263.0, 5573.0, 10145.0, 20053.0, 45245.0, 122538.0, 403371.0, 1286671.0, 1518133.0, 515793.0, 152776.0, 54003.0, 23015.0, 11345.0, 6206.0, 3580.0, 2342.0, 1408.0, 929.0, 607.0, 411.0, 276.0, 173.0, 125.0, 90.0, 53.0, 38.0, 33.0, 24.0, 14.0, 8.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.71875, -8.455322265625, -8.19189453125, -7.928466796875, -7.6650390625, -7.401611328125, -7.13818359375, -6.874755859375, -6.611328125, -6.347900390625, -6.08447265625, -5.821044921875, -5.5576171875, -5.294189453125, -5.03076171875, -4.767333984375, -4.50390625, -4.240478515625, -3.97705078125, -3.713623046875, -3.4501953125, -3.186767578125, -2.92333984375, -2.659912109375, -2.396484375, -2.133056640625, -1.86962890625, -1.606201171875, -1.3427734375, -1.079345703125, -0.81591796875, -0.552490234375, -0.2890625, -0.025634765625, 0.23779296875, 0.501220703125, 0.7646484375, 1.028076171875, 1.29150390625, 1.554931640625, 1.818359375, 2.081787109375, 2.34521484375, 2.608642578125, 2.8720703125, 3.135498046875, 3.39892578125, 3.662353515625, 3.92578125, 4.189208984375, 4.45263671875, 4.716064453125, 4.9794921875, 5.242919921875, 5.50634765625, 5.769775390625, 6.033203125, 6.296630859375, 6.56005859375, 6.823486328125, 7.0869140625, 7.350341796875, 7.61376953125, 7.877197265625, 8.140625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 8.0, 7.0, 14.0, 11.0, 14.0, 18.0, 25.0, 49.0, 39.0, 53.0, 68.0, 111.0, 122.0, 194.0, 238.0, 306.0, 401.0, 462.0, 430.0, 357.0, 287.0, 190.0, 175.0, 123.0, 78.0, 58.0, 43.0, 43.0, 33.0, 21.0, 16.0, 12.0, 14.0, 8.0, 10.0, 6.0, 6.0, 5.0, 2.0, 1.0, 0.0, 5.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.390625, -8.108642578125, -7.82666015625, -7.544677734375, -7.2626953125, -6.980712890625, -6.69873046875, -6.416748046875, -6.134765625, -5.852783203125, -5.57080078125, -5.288818359375, -5.0068359375, -4.724853515625, -4.44287109375, -4.160888671875, -3.87890625, -3.596923828125, -3.31494140625, -3.032958984375, -2.7509765625, -2.468994140625, -2.18701171875, -1.905029296875, -1.623046875, -1.341064453125, -1.05908203125, -0.777099609375, -0.4951171875, -0.213134765625, 0.06884765625, 0.350830078125, 0.6328125, 0.914794921875, 1.19677734375, 1.478759765625, 1.7607421875, 2.042724609375, 2.32470703125, 2.606689453125, 2.888671875, 3.170654296875, 3.45263671875, 3.734619140625, 4.0166015625, 4.298583984375, 4.58056640625, 4.862548828125, 5.14453125, 5.426513671875, 5.70849609375, 5.990478515625, 6.2724609375, 6.554443359375, 6.83642578125, 7.118408203125, 7.400390625, 7.682373046875, 7.96435546875, 8.246337890625, 8.5283203125, 8.810302734375, 9.09228515625, 9.374267578125, 9.65625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 6.0, 22.0, 13.0, 14.0, 24.0, 29.0, 35.0, 57.0, 73.0, 107.0, 173.0, 322.0, 561.0, 1150.0, 2406.0, 5606.0, 13737.0, 39723.0, 141088.0, 741279.0, 2470377.0, 599957.0, 120881.0, 34873.0, 12352.0, 4811.0, 2198.0, 1053.0, 522.0, 281.0, 178.0, 99.0, 74.0, 47.0, 34.0, 31.0, 20.0, 9.0, 17.0, 12.0, 4.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-14.5859375, -14.1363525390625, -13.686767578125, -13.2371826171875, -12.78759765625, -12.3380126953125, -11.888427734375, -11.4388427734375, -10.9892578125, -10.5396728515625, -10.090087890625, -9.6405029296875, -9.19091796875, -8.7413330078125, -8.291748046875, -7.8421630859375, -7.392578125, -6.9429931640625, -6.493408203125, -6.0438232421875, -5.59423828125, -5.1446533203125, -4.695068359375, -4.2454833984375, -3.7958984375, -3.3463134765625, -2.896728515625, -2.4471435546875, -1.99755859375, -1.5479736328125, -1.098388671875, -0.6488037109375, -0.19921875, 0.2503662109375, 0.699951171875, 1.1495361328125, 1.59912109375, 2.0487060546875, 2.498291015625, 2.9478759765625, 3.3974609375, 3.8470458984375, 4.296630859375, 4.7462158203125, 5.19580078125, 5.6453857421875, 6.094970703125, 6.5445556640625, 6.994140625, 7.4437255859375, 7.893310546875, 8.3428955078125, 8.79248046875, 9.2420654296875, 9.691650390625, 10.1412353515625, 10.5908203125, 11.0404052734375, 11.489990234375, 11.9395751953125, 12.38916015625, 12.8387451171875, 13.288330078125, 13.7379150390625, 14.1875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 97.0, 390.0, 389.0, 115.0, 12.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-281.0858459472656, -274.97674560546875, -268.86761474609375, -262.7585144042969, -256.6493835449219, -250.54026794433594, -244.43115234375, -238.32205200195312, -232.21292114257812, -226.1038055419922, -219.99468994140625, -213.8855743408203, -207.77645874023438, -201.66734313964844, -195.5582275390625, -189.44912719726562, -183.3400115966797, -177.23089599609375, -171.1217803955078, -165.01266479492188, -158.90354919433594, -152.79443359375, -146.68533325195312, -140.57620239257812, -134.46710205078125, -128.3579864501953, -122.24887084960938, -116.13975524902344, -110.0306396484375, -103.92152404785156, -97.81241607666016, -91.70330047607422, -85.59418487548828, -79.48506927490234, -73.3759536743164, -67.266845703125, -61.1577262878418, -55.04861068725586, -48.93949890136719, -42.83038330078125, -36.72126770019531, -30.612152099609375, -24.50303840637207, -18.393924713134766, -12.284809112548828, -6.175693511962891, -0.06658172607421875, 6.042533874511719, 12.151649475097656, 18.260765075683594, 24.3698787689209, 30.478992462158203, 36.58810806274414, 42.69722366333008, 48.80633544921875, 54.91545104980469, 61.024566650390625, 67.13368225097656, 73.2427978515625, 79.35191345214844, 85.46102905273438, 91.57014465332031, 97.67925262451172, 103.78836822509766, 109.8974838256836]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 3.0, 9.0, 9.0, 7.0, 9.0, 12.0, 21.0, 17.0, 19.0, 19.0, 16.0, 26.0, 33.0, 34.0, 27.0, 30.0, 37.0, 38.0, 32.0, 31.0, 41.0, 48.0, 35.0, 37.0, 36.0, 34.0, 32.0, 26.0, 21.0, 29.0, 29.0, 35.0, 22.0, 26.0, 27.0, 16.0, 18.0, 9.0, 11.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.415390014648438, -28.467071533203125, -27.518753051757812, -26.5704345703125, -25.622114181518555, -24.673795700073242, -23.72547721862793, -22.777158737182617, -21.828838348388672, -20.88051986694336, -19.932201385498047, -18.983882904052734, -18.03556251525879, -17.087244033813477, -16.138925552368164, -15.190607070922852, -14.242288589477539, -13.293970108032227, -12.345650672912598, -11.397332191467285, -10.449012756347656, -9.500694274902344, -8.552375793457031, -7.6040568351745605, -6.65573787689209, -5.707418918609619, -4.759099960327148, -3.810781478881836, -2.8624625205993652, -1.9141435623168945, -0.965825080871582, -0.017506122589111328, 0.9308109283447266, 1.8791297674179077, 2.827448606491089, 3.7757673263549805, 4.724086284637451, 5.672405242919922, 6.620723724365234, 7.569042682647705, 8.517361640930176, 9.465680122375488, 10.413999557495117, 11.36231803894043, 12.310636520385742, 13.258955955505371, 14.207274436950684, 15.155593872070312, 16.103912353515625, 17.052230834960938, 18.00054931640625, 18.948867797851562, 19.897188186645508, 20.84550666809082, 21.793825149536133, 22.742143630981445, 23.69046401977539, 24.638782501220703, 25.587100982666016, 26.535419464111328, 27.483739852905273, 28.432058334350586, 29.3803768157959, 30.32869529724121, 31.277013778686523]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 5.0, 4.0, 13.0, 7.0, 9.0, 22.0, 19.0, 17.0, 26.0, 26.0, 20.0, 32.0, 26.0, 31.0, 39.0, 36.0, 41.0, 40.0, 41.0, 46.0, 47.0, 47.0, 42.0, 43.0, 27.0, 34.0, 31.0, 30.0, 30.0, 30.0, 25.0, 17.0, 14.0, 14.0, 10.0, 15.0, 14.0, 8.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.234375, -7.00677490234375, -6.7791748046875, -6.55157470703125, -6.323974609375, -6.09637451171875, -5.8687744140625, -5.64117431640625, -5.41357421875, -5.18597412109375, -4.9583740234375, -4.73077392578125, -4.503173828125, -4.27557373046875, -4.0479736328125, -3.82037353515625, -3.5927734375, -3.36517333984375, -3.1375732421875, -2.90997314453125, -2.682373046875, -2.45477294921875, -2.2271728515625, -1.99957275390625, -1.77197265625, -1.54437255859375, -1.3167724609375, -1.08917236328125, -0.861572265625, -0.63397216796875, -0.4063720703125, -0.17877197265625, 0.048828125, 0.27642822265625, 0.5040283203125, 0.73162841796875, 0.959228515625, 1.18682861328125, 1.4144287109375, 1.64202880859375, 1.86962890625, 2.09722900390625, 2.3248291015625, 2.55242919921875, 2.780029296875, 3.00762939453125, 3.2352294921875, 3.46282958984375, 3.6904296875, 3.91802978515625, 4.1456298828125, 4.37322998046875, 4.600830078125, 4.82843017578125, 5.0560302734375, 5.28363037109375, 5.51123046875, 5.73883056640625, 5.9664306640625, 6.19403076171875, 6.421630859375, 6.64923095703125, 6.8768310546875, 7.10443115234375, 7.33203125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 7.0, 4.0, 20.0, 18.0, 43.0, 46.0, 70.0, 119.0, 169.0, 249.0, 430.0, 648.0, 993.0, 1562.0, 2518.0, 3854.0, 6001.0, 9825.0, 15358.0, 24273.0, 37460.0, 57436.0, 83894.0, 114500.0, 140918.0, 145318.0, 124405.0, 93596.0, 65162.0, 43185.0, 27801.0, 18125.0, 11031.0, 7199.0, 4442.0, 2922.0, 1802.0, 1132.0, 725.0, 443.0, 296.0, 201.0, 140.0, 86.0, 52.0, 33.0, 19.0, 10.0, 5.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6904296875, -0.6689605712890625, -0.647491455078125, -0.6260223388671875, -0.60455322265625, -0.5830841064453125, -0.561614990234375, -0.5401458740234375, -0.5186767578125, -0.4972076416015625, -0.475738525390625, -0.4542694091796875, -0.43280029296875, -0.4113311767578125, -0.389862060546875, -0.3683929443359375, -0.346923828125, -0.3254547119140625, -0.303985595703125, -0.2825164794921875, -0.26104736328125, -0.2395782470703125, -0.218109130859375, -0.1966400146484375, -0.1751708984375, -0.1537017822265625, -0.132232666015625, -0.1107635498046875, -0.08929443359375, -0.0678253173828125, -0.046356201171875, -0.0248870849609375, -0.00341796875, 0.0180511474609375, 0.039520263671875, 0.0609893798828125, 0.08245849609375, 0.1039276123046875, 0.125396728515625, 0.1468658447265625, 0.1683349609375, 0.1898040771484375, 0.211273193359375, 0.2327423095703125, 0.25421142578125, 0.2756805419921875, 0.297149658203125, 0.3186187744140625, 0.340087890625, 0.3615570068359375, 0.383026123046875, 0.4044952392578125, 0.42596435546875, 0.4474334716796875, 0.468902587890625, 0.4903717041015625, 0.5118408203125, 0.5333099365234375, 0.554779052734375, 0.5762481689453125, 0.59771728515625, 0.6191864013671875, 0.640655517578125, 0.6621246337890625, 0.68359375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 7.0, 4.0, 7.0, 3.0, 11.0, 7.0, 7.0, 17.0, 8.0, 19.0, 18.0, 14.0, 12.0, 15.0, 22.0, 21.0, 28.0, 25.0, 27.0, 28.0, 39.0, 36.0, 33.0, 32.0, 37.0, 1052.0, 29.0, 37.0, 35.0, 27.0, 26.0, 28.0, 36.0, 44.0, 30.0, 21.0, 24.0, 18.0, 20.0, 18.0, 15.0, 15.0, 13.0, 9.0, 18.0, 4.0, 8.0, 7.0, 8.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-3.966796875, -3.842742919921875, -3.71868896484375, -3.594635009765625, -3.4705810546875, -3.346527099609375, -3.22247314453125, -3.098419189453125, -2.974365234375, -2.850311279296875, -2.72625732421875, -2.602203369140625, -2.4781494140625, -2.354095458984375, -2.23004150390625, -2.105987548828125, -1.98193359375, -1.857879638671875, -1.73382568359375, -1.609771728515625, -1.4857177734375, -1.361663818359375, -1.23760986328125, -1.113555908203125, -0.989501953125, -0.865447998046875, -0.74139404296875, -0.617340087890625, -0.4932861328125, -0.369232177734375, -0.24517822265625, -0.121124267578125, 0.0029296875, 0.126983642578125, 0.25103759765625, 0.375091552734375, 0.4991455078125, 0.623199462890625, 0.74725341796875, 0.871307373046875, 0.995361328125, 1.119415283203125, 1.24346923828125, 1.367523193359375, 1.4915771484375, 1.615631103515625, 1.73968505859375, 1.863739013671875, 1.98779296875, 2.111846923828125, 2.23590087890625, 2.359954833984375, 2.4840087890625, 2.608062744140625, 2.73211669921875, 2.856170654296875, 2.980224609375, 3.104278564453125, 3.22833251953125, 3.352386474609375, 3.4764404296875, 3.600494384765625, 3.72454833984375, 3.848602294921875, 3.97265625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 12.0, 15.0, 26.0, 45.0, 47.0, 88.0, 135.0, 239.0, 374.0, 596.0, 946.0, 1501.0, 2594.0, 4205.0, 7045.0, 11917.0, 20217.0, 33707.0, 55591.0, 89316.0, 146529.0, 569659.0, 755545.0, 155663.0, 94357.0, 58645.0, 35411.0, 21354.0, 12437.0, 7499.0, 4433.0, 2629.0, 1657.0, 1007.0, 648.0, 389.0, 248.0, 167.0, 81.0, 57.0, 37.0, 25.0, 18.0, 12.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.54931640625, -0.5336456298828125, -0.517974853515625, -0.5023040771484375, -0.48663330078125, -0.4709625244140625, -0.455291748046875, -0.4396209716796875, -0.4239501953125, -0.4082794189453125, -0.392608642578125, -0.3769378662109375, -0.36126708984375, -0.3455963134765625, -0.329925537109375, -0.3142547607421875, -0.298583984375, -0.2829132080078125, -0.267242431640625, -0.2515716552734375, -0.23590087890625, -0.2202301025390625, -0.204559326171875, -0.1888885498046875, -0.1732177734375, -0.1575469970703125, -0.141876220703125, -0.1262054443359375, -0.11053466796875, -0.0948638916015625, -0.079193115234375, -0.0635223388671875, -0.0478515625, -0.0321807861328125, -0.016510009765625, -0.0008392333984375, 0.01483154296875, 0.0305023193359375, 0.046173095703125, 0.0618438720703125, 0.0775146484375, 0.0931854248046875, 0.108856201171875, 0.1245269775390625, 0.14019775390625, 0.1558685302734375, 0.171539306640625, 0.1872100830078125, 0.202880859375, 0.2185516357421875, 0.234222412109375, 0.2498931884765625, 0.26556396484375, 0.2812347412109375, 0.296905517578125, 0.3125762939453125, 0.3282470703125, 0.3439178466796875, 0.359588623046875, 0.3752593994140625, 0.39093017578125, 0.4066009521484375, 0.422271728515625, 0.4379425048828125, 0.45361328125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 0.0, 6.0, 7.0, 8.0, 9.0, 9.0, 16.0, 22.0, 27.0, 26.0, 24.0, 26.0, 46.0, 40.0, 62.0, 60.0, 73.0, 71.0, 68.0, 54.0, 66.0, 41.0, 44.0, 43.0, 24.0, 27.0, 23.0, 17.0, 17.0, 11.0, 9.0, 6.0, 7.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.063720703125, -0.061690330505371094, -0.05965995788574219, -0.05762958526611328, -0.055599212646484375, -0.05356884002685547, -0.05153846740722656, -0.049508094787597656, -0.04747772216796875, -0.045447349548339844, -0.04341697692871094, -0.04138660430908203, -0.039356231689453125, -0.03732585906982422, -0.03529548645019531, -0.033265113830566406, -0.0312347412109375, -0.029204368591308594, -0.027173995971679688, -0.02514362335205078, -0.023113250732421875, -0.02108287811279297, -0.019052505493164062, -0.017022132873535156, -0.01499176025390625, -0.012961387634277344, -0.010931015014648438, -0.008900642395019531, -0.006870269775390625, -0.004839897155761719, -0.0028095245361328125, -0.0007791519165039062, 0.001251220703125, 0.0032815933227539062, 0.0053119659423828125, 0.007342338562011719, 0.009372711181640625, 0.011403083801269531, 0.013433456420898438, 0.015463829040527344, 0.01749420166015625, 0.019524574279785156, 0.021554946899414062, 0.02358531951904297, 0.025615692138671875, 0.02764606475830078, 0.029676437377929688, 0.031706809997558594, 0.0337371826171875, 0.035767555236816406, 0.03779792785644531, 0.03982830047607422, 0.041858673095703125, 0.04388904571533203, 0.04591941833496094, 0.047949790954589844, 0.04998016357421875, 0.052010536193847656, 0.05404090881347656, 0.05607128143310547, 0.058101654052734375, 0.06013202667236328, 0.06216239929199219, 0.0641927719116211, 0.06622314453125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 7.0, 13.0, 17.0, 26.0, 27.0, 39.0, 49.0, 66.0, 83.0, 148.0, 248.0, 582.0, 8406.0, 1033196.0, 4394.0, 544.0, 235.0, 124.0, 86.0, 53.0, 42.0, 31.0, 28.0, 25.0, 13.0, 13.0, 8.0, 11.0, 6.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.498046875, -1.451873779296875, -1.40570068359375, -1.359527587890625, -1.3133544921875, -1.267181396484375, -1.22100830078125, -1.174835205078125, -1.128662109375, -1.082489013671875, -1.03631591796875, -0.990142822265625, -0.9439697265625, -0.897796630859375, -0.85162353515625, -0.805450439453125, -0.75927734375, -0.713104248046875, -0.66693115234375, -0.620758056640625, -0.5745849609375, -0.528411865234375, -0.48223876953125, -0.436065673828125, -0.389892578125, -0.343719482421875, -0.29754638671875, -0.251373291015625, -0.2052001953125, -0.159027099609375, -0.11285400390625, -0.066680908203125, -0.0205078125, 0.025665283203125, 0.07183837890625, 0.118011474609375, 0.1641845703125, 0.210357666015625, 0.25653076171875, 0.302703857421875, 0.348876953125, 0.395050048828125, 0.44122314453125, 0.487396240234375, 0.5335693359375, 0.579742431640625, 0.62591552734375, 0.672088623046875, 0.71826171875, 0.764434814453125, 0.81060791015625, 0.856781005859375, 0.9029541015625, 0.949127197265625, 0.99530029296875, 1.041473388671875, 1.087646484375, 1.133819580078125, 1.17999267578125, 1.226165771484375, 1.2723388671875, 1.318511962890625, 1.36468505859375, 1.410858154296875, 1.45703125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 8.0, 44.0, 274.0, 446.0, 183.0, 47.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28768807649612427, -0.27716535329818726, -0.26664260029792786, -0.25611987709999084, -0.24559713900089264, -0.23507440090179443, -0.22455167770385742, -0.21402893960475922, -0.203506201505661, -0.1929834634065628, -0.1824607253074646, -0.1719380021095276, -0.16141526401042938, -0.15089252591133118, -0.14036980271339417, -0.12984706461429596, -0.11932432651519775, -0.10880158841609955, -0.09827885776758194, -0.08775612711906433, -0.07723338901996613, -0.06671065092086792, -0.05618792027235031, -0.0456651896238327, -0.0351424515247345, -0.02461971715092659, -0.014096982777118683, -0.0035742484033107758, 0.006948485970497131, 0.01747122034430504, 0.027993954718112946, 0.038516685366630554, 0.04903945326805115, 0.059562187641859055, 0.07008492201566696, 0.08060765266418457, 0.09113039076328278, 0.10165312886238098, 0.11217585951089859, 0.1226985901594162, 0.1332213282585144, 0.1437440663576126, 0.15426680445671082, 0.16478952765464783, 0.17531226575374603, 0.18583500385284424, 0.19635772705078125, 0.20688046514987946, 0.21740320324897766, 0.22792594134807587, 0.23844867944717407, 0.24897140264511108, 0.2594941258430481, 0.2700168788433075, 0.2805396020412445, 0.2910623550415039, 0.3015850782394409, 0.31210780143737793, 0.32263055443763733, 0.33315327763557434, 0.34367603063583374, 0.35419875383377075, 0.36472147703170776, 0.3752442002296448, 0.3857669532299042]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 1.0, 2.0, 2.0, 6.0, 12.0, 13.0, 20.0, 11.0, 27.0, 20.0, 24.0, 23.0, 26.0, 26.0, 25.0, 32.0, 35.0, 38.0, 34.0, 42.0, 41.0, 37.0, 30.0, 46.0, 34.0, 28.0, 43.0, 29.0, 33.0, 30.0, 24.0, 20.0, 21.0, 18.0, 23.0, 18.0, 13.0, 16.0, 15.0, 7.0, 7.0, 11.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0], "bins": [-0.0647420883178711, -0.0627637431025505, -0.06078539788722992, -0.05880705267190933, -0.056828707456588745, -0.05485036224126816, -0.05287201702594757, -0.050893671810626984, -0.048915326595306396, -0.04693698137998581, -0.04495863616466522, -0.042980290949344635, -0.04100194573402405, -0.03902360051870346, -0.037045255303382874, -0.035066910088062286, -0.0330885648727417, -0.031110219657421112, -0.029131874442100525, -0.027153529226779938, -0.02517518401145935, -0.023196838796138763, -0.021218493580818176, -0.01924014836549759, -0.017261803150177002, -0.015283457934856415, -0.013305112719535828, -0.01132676750421524, -0.009348422288894653, -0.007370077073574066, -0.005391731858253479, -0.003413386642932892, -0.0014350414276123047, 0.0005433037877082825, 0.0025216490030288696, 0.004499994218349457, 0.006478339433670044, 0.008456684648990631, 0.010435029864311218, 0.012413375079631805, 0.014391720294952393, 0.01637006551027298, 0.018348410725593567, 0.020326755940914154, 0.02230510115623474, 0.02428344637155533, 0.026261791586875916, 0.028240136802196503, 0.03021848201751709, 0.03219682723283768, 0.034175172448158264, 0.03615351766347885, 0.03813186287879944, 0.040110208094120026, 0.04208855330944061, 0.0440668985247612, 0.04604524374008179, 0.048023588955402374, 0.05000193417072296, 0.05198027938604355, 0.053958624601364136, 0.05593696981668472, 0.05791531503200531, 0.0598936602473259, 0.061872005462646484]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 7.0, 7.0, 6.0, 7.0, 12.0, 15.0, 18.0, 12.0, 22.0, 21.0, 29.0, 32.0, 26.0, 37.0, 38.0, 37.0, 39.0, 43.0, 46.0, 48.0, 46.0, 43.0, 30.0, 37.0, 32.0, 34.0, 36.0, 27.0, 39.0, 23.0, 31.0, 17.0, 21.0, 17.0, 12.0, 10.0, 8.0, 8.0, 7.0, 6.0, 8.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30078125, -6.07513427734375, -5.8494873046875, -5.62384033203125, -5.398193359375, -5.17254638671875, -4.9468994140625, -4.72125244140625, -4.49560546875, -4.26995849609375, -4.0443115234375, -3.81866455078125, -3.593017578125, -3.36737060546875, -3.1417236328125, -2.91607666015625, -2.6904296875, -2.46478271484375, -2.2391357421875, -2.01348876953125, -1.787841796875, -1.56219482421875, -1.3365478515625, -1.11090087890625, -0.88525390625, -0.65960693359375, -0.4339599609375, -0.20831298828125, 0.017333984375, 0.24298095703125, 0.4686279296875, 0.69427490234375, 0.919921875, 1.14556884765625, 1.3712158203125, 1.59686279296875, 1.822509765625, 2.04815673828125, 2.2738037109375, 2.49945068359375, 2.72509765625, 2.95074462890625, 3.1763916015625, 3.40203857421875, 3.627685546875, 3.85333251953125, 4.0789794921875, 4.30462646484375, 4.5302734375, 4.75592041015625, 4.9815673828125, 5.20721435546875, 5.432861328125, 5.65850830078125, 5.8841552734375, 6.10980224609375, 6.33544921875, 6.56109619140625, 6.7867431640625, 7.01239013671875, 7.238037109375, 7.46368408203125, 7.6893310546875, 7.91497802734375, 8.140625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 6.0, 5.0, 10.0, 16.0, 21.0, 28.0, 26.0, 45.0, 80.0, 106.0, 169.0, 272.0, 518.0, 902.0, 1633.0, 3176.0, 6295.0, 12485.0, 26370.0, 59370.0, 139627.0, 342751.0, 263260.0, 104778.0, 45266.0, 20536.0, 9874.0, 5011.0, 2628.0, 1367.0, 750.0, 443.0, 254.0, 153.0, 96.0, 59.0, 40.0, 38.0, 21.0, 22.0, 13.0, 7.0, 7.0, 4.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-10.78125, -10.431640625, -10.08203125, -9.732421875, -9.3828125, -9.033203125, -8.68359375, -8.333984375, -7.984375, -7.634765625, -7.28515625, -6.935546875, -6.5859375, -6.236328125, -5.88671875, -5.537109375, -5.1875, -4.837890625, -4.48828125, -4.138671875, -3.7890625, -3.439453125, -3.08984375, -2.740234375, -2.390625, -2.041015625, -1.69140625, -1.341796875, -0.9921875, -0.642578125, -0.29296875, 0.056640625, 0.40625, 0.755859375, 1.10546875, 1.455078125, 1.8046875, 2.154296875, 2.50390625, 2.853515625, 3.203125, 3.552734375, 3.90234375, 4.251953125, 4.6015625, 4.951171875, 5.30078125, 5.650390625, 6.0, 6.349609375, 6.69921875, 7.048828125, 7.3984375, 7.748046875, 8.09765625, 8.447265625, 8.796875, 9.146484375, 9.49609375, 9.845703125, 10.1953125, 10.544921875, 10.89453125, 11.244140625, 11.59375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 2.0, 5.0, 7.0, 5.0, 5.0, 8.0, 9.0, 12.0, 19.0, 19.0, 17.0, 17.0, 34.0, 26.0, 42.0, 42.0, 56.0, 63.0, 83.0, 128.0, 219.0, 1333.0, 267.0, 160.0, 100.0, 52.0, 52.0, 40.0, 34.0, 29.0, 27.0, 20.0, 23.0, 23.0, 17.0, 17.0, 12.0, 9.0, 7.0, 0.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.0, -18.399658203125, -17.79931640625, -17.198974609375, -16.5986328125, -15.998291015625, -15.39794921875, -14.797607421875, -14.197265625, -13.596923828125, -12.99658203125, -12.396240234375, -11.7958984375, -11.195556640625, -10.59521484375, -9.994873046875, -9.39453125, -8.794189453125, -8.19384765625, -7.593505859375, -6.9931640625, -6.392822265625, -5.79248046875, -5.192138671875, -4.591796875, -3.991455078125, -3.39111328125, -2.790771484375, -2.1904296875, -1.590087890625, -0.98974609375, -0.389404296875, 0.2109375, 0.811279296875, 1.41162109375, 2.011962890625, 2.6123046875, 3.212646484375, 3.81298828125, 4.413330078125, 5.013671875, 5.614013671875, 6.21435546875, 6.814697265625, 7.4150390625, 8.015380859375, 8.61572265625, 9.216064453125, 9.81640625, 10.416748046875, 11.01708984375, 11.617431640625, 12.2177734375, 12.818115234375, 13.41845703125, 14.018798828125, 14.619140625, 15.219482421875, 15.81982421875, 16.420166015625, 17.0205078125, 17.620849609375, 18.22119140625, 18.821533203125, 19.421875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 10.0, 9.0, 7.0, 15.0, 18.0, 28.0, 32.0, 50.0, 80.0, 89.0, 146.0, 195.0, 331.0, 598.0, 1491.0, 5860.0, 32032.0, 439301.0, 2497357.0, 145638.0, 16472.0, 3533.0, 1054.0, 463.0, 250.0, 200.0, 126.0, 86.0, 68.0, 50.0, 29.0, 26.0, 21.0, 11.0, 10.0, 5.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.03125, -21.25341796875, -20.4755859375, -19.69775390625, -18.919921875, -18.14208984375, -17.3642578125, -16.58642578125, -15.80859375, -15.03076171875, -14.2529296875, -13.47509765625, -12.697265625, -11.91943359375, -11.1416015625, -10.36376953125, -9.5859375, -8.80810546875, -8.0302734375, -7.25244140625, -6.474609375, -5.69677734375, -4.9189453125, -4.14111328125, -3.36328125, -2.58544921875, -1.8076171875, -1.02978515625, -0.251953125, 0.52587890625, 1.3037109375, 2.08154296875, 2.859375, 3.63720703125, 4.4150390625, 5.19287109375, 5.970703125, 6.74853515625, 7.5263671875, 8.30419921875, 9.08203125, 9.85986328125, 10.6376953125, 11.41552734375, 12.193359375, 12.97119140625, 13.7490234375, 14.52685546875, 15.3046875, 16.08251953125, 16.8603515625, 17.63818359375, 18.416015625, 19.19384765625, 19.9716796875, 20.74951171875, 21.52734375, 22.30517578125, 23.0830078125, 23.86083984375, 24.638671875, 25.41650390625, 26.1943359375, 26.97216796875, 27.75]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 131.0, 573.0, 279.0, 26.0, 1.0, 0.0, 2.0], "bins": [-437.6876220703125, -430.22930908203125, -422.7709655761719, -415.3126525878906, -407.85430908203125, -400.39599609375, -392.9376525878906, -385.4793395996094, -378.02099609375, -370.56268310546875, -363.1043395996094, -355.6460266113281, -348.18768310546875, -340.7293701171875, -333.2710266113281, -325.8127136230469, -318.3543701171875, -310.89605712890625, -303.4377136230469, -295.9794006347656, -288.52105712890625, -281.062744140625, -273.6044006347656, -266.1460876464844, -258.6877746582031, -251.2294464111328, -243.7711181640625, -236.3127899169922, -228.85446166992188, -221.39613342285156, -213.93780517578125, -206.4794921875, -199.02114868164062, -191.5628204345703, -184.1044921875, -176.6461639404297, -169.18783569335938, -161.72950744628906, -154.27117919921875, -146.8128662109375, -139.35452270507812, -131.8961944580078, -124.4378662109375, -116.97953796386719, -109.52120971679688, -102.06288146972656, -94.60456085205078, -87.14623260498047, -79.68790435791016, -72.22957611083984, -64.77124786376953, -57.312923431396484, -49.85459518432617, -42.39626693725586, -34.93794250488281, -27.4796142578125, -20.021286010742188, -12.562958717346191, -5.104631423950195, 2.3536949157714844, 9.812023162841797, 17.27035140991211, 24.728675842285156, 32.18700408935547, 39.64533233642578]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 4.0, 4.0, 4.0, 4.0, 7.0, 13.0, 14.0, 20.0, 18.0, 17.0, 25.0, 13.0, 29.0, 23.0, 40.0, 34.0, 26.0, 35.0, 30.0, 30.0, 38.0, 46.0, 41.0, 34.0, 46.0, 45.0, 48.0, 29.0, 25.0, 21.0, 32.0, 27.0, 25.0, 18.0, 25.0, 22.0, 10.0, 15.0, 10.0, 9.0, 9.0, 10.0, 4.0, 0.0, 5.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-41.61112594604492, -40.288978576660156, -38.96683120727539, -37.64468765258789, -36.322540283203125, -35.00039291381836, -33.678245544433594, -32.35609817504883, -31.033952713012695, -29.71180534362793, -28.389659881591797, -27.06751251220703, -25.745365142822266, -24.423219680786133, -23.101072311401367, -21.778926849365234, -20.45677947998047, -19.134632110595703, -17.81248664855957, -16.490339279174805, -15.168192863464355, -13.846046447753906, -12.52389907836914, -11.201752662658691, -9.879606246948242, -8.557459831237793, -7.2353129386901855, -5.913166046142578, -4.591019630432129, -3.2688732147216797, -1.9467263221740723, -0.6245794296264648, 0.6975631713867188, 2.019709825515747, 3.3418564796447754, 4.664003372192383, 5.986149787902832, 7.308296203613281, 8.630443572998047, 9.952589988708496, 11.274736404418945, 12.596882820129395, 13.919029235839844, 15.24117660522461, 16.563323974609375, 17.885469436645508, 19.207616806030273, 20.529762268066406, 21.851909637451172, 23.174057006835938, 24.49620246887207, 25.818349838256836, 27.14049530029297, 28.462642669677734, 29.7847900390625, 31.106937408447266, 32.42908477783203, 33.7512321472168, 35.07337951660156, 36.39552307128906, 37.71767044067383, 39.039817810058594, 40.36196517944336, 41.684112548828125, 43.006256103515625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 1.0, 5.0, 7.0, 5.0, 7.0, 8.0, 11.0, 13.0, 15.0, 22.0, 21.0, 29.0, 20.0, 31.0, 43.0, 42.0, 35.0, 42.0, 60.0, 50.0, 47.0, 53.0, 40.0, 52.0, 36.0, 44.0, 33.0, 27.0, 29.0, 31.0, 24.0, 25.0, 18.0, 24.0, 18.0, 8.0, 8.0, 9.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.596923828125, -8.34228515625, -8.087646484375, -7.8330078125, -7.578369140625, -7.32373046875, -7.069091796875, -6.814453125, -6.559814453125, -6.30517578125, -6.050537109375, -5.7958984375, -5.541259765625, -5.28662109375, -5.031982421875, -4.77734375, -4.522705078125, -4.26806640625, -4.013427734375, -3.7587890625, -3.504150390625, -3.24951171875, -2.994873046875, -2.740234375, -2.485595703125, -2.23095703125, -1.976318359375, -1.7216796875, -1.467041015625, -1.21240234375, -0.957763671875, -0.703125, -0.448486328125, -0.19384765625, 0.060791015625, 0.3154296875, 0.570068359375, 0.82470703125, 1.079345703125, 1.333984375, 1.588623046875, 1.84326171875, 2.097900390625, 2.3525390625, 2.607177734375, 2.86181640625, 3.116455078125, 3.37109375, 3.625732421875, 3.88037109375, 4.135009765625, 4.3896484375, 4.644287109375, 4.89892578125, 5.153564453125, 5.408203125, 5.662841796875, 5.91748046875, 6.172119140625, 6.4267578125, 6.681396484375, 6.93603515625, 7.190673828125, 7.4453125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0, 4.0, 8.0, 7.0, 7.0, 12.0, 6.0, 14.0, 17.0, 19.0, 24.0, 28.0, 38.0, 51.0, 73.0, 78.0, 98.0, 167.0, 221.0, 360.0, 965.0, 6865.0, 1197857.0, 2974295.0, 10602.0, 1128.0, 414.0, 241.0, 168.0, 115.0, 83.0, 63.0, 50.0, 37.0, 33.0, 28.0, 19.0, 14.0, 11.0, 14.0, 7.0, 9.0, 11.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-65.9375, -63.943359375, -61.94921875, -59.955078125, -57.9609375, -55.966796875, -53.97265625, -51.978515625, -49.984375, -47.990234375, -45.99609375, -44.001953125, -42.0078125, -40.013671875, -38.01953125, -36.025390625, -34.03125, -32.037109375, -30.04296875, -28.048828125, -26.0546875, -24.060546875, -22.06640625, -20.072265625, -18.078125, -16.083984375, -14.08984375, -12.095703125, -10.1015625, -8.107421875, -6.11328125, -4.119140625, -2.125, -0.130859375, 1.86328125, 3.857421875, 5.8515625, 7.845703125, 9.83984375, 11.833984375, 13.828125, 15.822265625, 17.81640625, 19.810546875, 21.8046875, 23.798828125, 25.79296875, 27.787109375, 29.78125, 31.775390625, 33.76953125, 35.763671875, 37.7578125, 39.751953125, 41.74609375, 43.740234375, 45.734375, 47.728515625, 49.72265625, 51.716796875, 53.7109375, 55.705078125, 57.69921875, 59.693359375, 61.6875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 2.0, 6.0, 3.0, 5.0, 4.0, 6.0, 8.0, 17.0, 16.0, 20.0, 22.0, 35.0, 47.0, 41.0, 59.0, 81.0, 109.0, 149.0, 210.0, 292.0, 399.0, 461.0, 531.0, 414.0, 284.0, 203.0, 148.0, 112.0, 76.0, 81.0, 44.0, 41.0, 26.0, 22.0, 25.0, 16.0, 12.0, 10.0, 7.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-10.0703125, -9.77490234375, -9.4794921875, -9.18408203125, -8.888671875, -8.59326171875, -8.2978515625, -8.00244140625, -7.70703125, -7.41162109375, -7.1162109375, -6.82080078125, -6.525390625, -6.22998046875, -5.9345703125, -5.63916015625, -5.34375, -5.04833984375, -4.7529296875, -4.45751953125, -4.162109375, -3.86669921875, -3.5712890625, -3.27587890625, -2.98046875, -2.68505859375, -2.3896484375, -2.09423828125, -1.798828125, -1.50341796875, -1.2080078125, -0.91259765625, -0.6171875, -0.32177734375, -0.0263671875, 0.26904296875, 0.564453125, 0.85986328125, 1.1552734375, 1.45068359375, 1.74609375, 2.04150390625, 2.3369140625, 2.63232421875, 2.927734375, 3.22314453125, 3.5185546875, 3.81396484375, 4.109375, 4.40478515625, 4.7001953125, 4.99560546875, 5.291015625, 5.58642578125, 5.8818359375, 6.17724609375, 6.47265625, 6.76806640625, 7.0634765625, 7.35888671875, 7.654296875, 7.94970703125, 8.2451171875, 8.54052734375, 8.8359375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 8.0, 7.0, 6.0, 8.0, 18.0, 20.0, 15.0, 28.0, 46.0, 51.0, 77.0, 109.0, 162.0, 361.0, 742.0, 2262.0, 7688.0, 34808.0, 246261.0, 3199405.0, 620905.0, 63486.0, 12349.0, 3238.0, 1096.0, 450.0, 229.0, 128.0, 74.0, 49.0, 55.0, 29.0, 29.0, 14.0, 10.0, 11.0, 13.0, 12.0, 4.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.171875, -26.38818359375, -25.6044921875, -24.82080078125, -24.037109375, -23.25341796875, -22.4697265625, -21.68603515625, -20.90234375, -20.11865234375, -19.3349609375, -18.55126953125, -17.767578125, -16.98388671875, -16.2001953125, -15.41650390625, -14.6328125, -13.84912109375, -13.0654296875, -12.28173828125, -11.498046875, -10.71435546875, -9.9306640625, -9.14697265625, -8.36328125, -7.57958984375, -6.7958984375, -6.01220703125, -5.228515625, -4.44482421875, -3.6611328125, -2.87744140625, -2.09375, -1.31005859375, -0.5263671875, 0.25732421875, 1.041015625, 1.82470703125, 2.6083984375, 3.39208984375, 4.17578125, 4.95947265625, 5.7431640625, 6.52685546875, 7.310546875, 8.09423828125, 8.8779296875, 9.66162109375, 10.4453125, 11.22900390625, 12.0126953125, 12.79638671875, 13.580078125, 14.36376953125, 15.1474609375, 15.93115234375, 16.71484375, 17.49853515625, 18.2822265625, 19.06591796875, 19.849609375, 20.63330078125, 21.4169921875, 22.20068359375, 22.984375]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 4.0, 16.0, 82.0, 256.0, 341.0, 212.0, 80.0, 22.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.23756217956543, -22.323129653930664, -17.4086971282959, -12.494264602661133, -7.579832077026367, -2.6653995513916016, 2.249032974243164, 7.16346549987793, 12.077898025512695, 16.99233055114746, 21.906763076782227, 26.821195602416992, 31.735628128051758, 36.650062561035156, 41.564491271972656, 46.47892761230469, 51.39335632324219, 56.30778884887695, 61.22222137451172, 66.13665771484375, 71.05108642578125, 75.96551513671875, 80.87995147705078, 85.79438781738281, 90.70881652832031, 95.62324523925781, 100.53768157958984, 105.45211791992188, 110.36654663085938, 115.28097534179688, 120.1954116821289, 125.10984802246094, 130.0242919921875, 134.938720703125, 139.8531494140625, 144.76759338378906, 149.68202209472656, 154.59645080566406, 159.51089477539062, 164.42532348632812, 169.33975219726562, 174.25418090820312, 179.16860961914062, 184.0830535888672, 188.9974822998047, 193.9119110107422, 198.82635498046875, 203.74078369140625, 208.65521240234375, 213.56964111328125, 218.48406982421875, 223.3985137939453, 228.3129425048828, 233.2273712158203, 238.14181518554688, 243.05624389648438, 247.97067260742188, 252.88510131835938, 257.7995300292969, 262.7139587402344, 267.62841796875, 272.5428466796875, 277.457275390625, 282.3717041015625, 287.2861328125]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 11.0, 8.0, 11.0, 7.0, 13.0, 11.0, 11.0, 11.0, 26.0, 25.0, 19.0, 30.0, 31.0, 31.0, 27.0, 24.0, 35.0, 38.0, 43.0, 31.0, 36.0, 41.0, 38.0, 39.0, 30.0, 34.0, 47.0, 38.0, 34.0, 29.0, 25.0, 15.0, 21.0, 18.0, 24.0, 14.0, 14.0, 9.0, 5.0, 6.0, 8.0, 6.0, 6.0, 5.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.598541259765625, -33.48764419555664, -32.37674331665039, -31.265846252441406, -30.154949188232422, -29.044050216674805, -27.933151245117188, -26.822254180908203, -25.711355209350586, -24.60045623779297, -23.489559173583984, -22.378660202026367, -21.26776123046875, -20.156864166259766, -19.04596519470215, -17.93506622314453, -16.824169158935547, -15.713271141052246, -14.602373123168945, -13.491474151611328, -12.380576133728027, -11.269678115844727, -10.15877914428711, -9.047881126403809, -7.936983108520508, -6.826085090637207, -5.715186595916748, -4.604288101196289, -3.4933900833129883, -2.3824920654296875, -1.2715935707092285, -0.16069507598876953, 0.9502067565917969, 2.0611050128936768, 3.1720032691955566, 4.282901763916016, 5.393799781799316, 6.504697799682617, 7.615596294403076, 8.726494789123535, 9.837392807006836, 10.948290824890137, 12.059188842773438, 13.170087814331055, 14.280985832214355, 15.391883850097656, 16.502782821655273, 17.61368179321289, 18.724578857421875, 19.835477828979492, 20.946374893188477, 22.057273864746094, 23.168170928955078, 24.279069900512695, 25.389968872070312, 26.500865936279297, 27.611764907836914, 28.72266387939453, 29.833560943603516, 30.944459915161133, 32.05535888671875, 33.166255950927734, 34.27715301513672, 35.38805389404297, 36.49895095825195]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 10.0, 10.0, 7.0, 11.0, 12.0, 19.0, 19.0, 18.0, 17.0, 20.0, 26.0, 21.0, 21.0, 33.0, 35.0, 32.0, 37.0, 54.0, 51.0, 33.0, 38.0, 36.0, 37.0, 43.0, 42.0, 35.0, 25.0, 30.0, 31.0, 28.0, 30.0, 20.0, 18.0, 12.0, 13.0, 18.0, 9.0, 13.0, 5.0, 9.0, 7.0, 4.0, 1.0, 3.0, 1.0, 5.0], "bins": [-8.40625, -8.18487548828125, -7.9635009765625, -7.74212646484375, -7.520751953125, -7.29937744140625, -7.0780029296875, -6.85662841796875, -6.63525390625, -6.41387939453125, -6.1925048828125, -5.97113037109375, -5.749755859375, -5.52838134765625, -5.3070068359375, -5.08563232421875, -4.8642578125, -4.64288330078125, -4.4215087890625, -4.20013427734375, -3.978759765625, -3.75738525390625, -3.5360107421875, -3.31463623046875, -3.09326171875, -2.87188720703125, -2.6505126953125, -2.42913818359375, -2.207763671875, -1.98638916015625, -1.7650146484375, -1.54364013671875, -1.322265625, -1.10089111328125, -0.8795166015625, -0.65814208984375, -0.436767578125, -0.21539306640625, 0.0059814453125, 0.22735595703125, 0.44873046875, 0.67010498046875, 0.8914794921875, 1.11285400390625, 1.334228515625, 1.55560302734375, 1.7769775390625, 1.99835205078125, 2.2197265625, 2.44110107421875, 2.6624755859375, 2.88385009765625, 3.105224609375, 3.32659912109375, 3.5479736328125, 3.76934814453125, 3.99072265625, 4.21209716796875, 4.4334716796875, 4.65484619140625, 4.876220703125, 5.09759521484375, 5.3189697265625, 5.54034423828125, 5.76171875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 7.0, 3.0, 9.0, 9.0, 22.0, 28.0, 35.0, 48.0, 62.0, 85.0, 113.0, 162.0, 215.0, 291.0, 417.0, 585.0, 803.0, 1122.0, 1637.0, 2427.0, 3748.0, 5752.0, 9868.0, 18124.0, 36664.0, 77440.0, 163592.0, 261498.0, 225809.0, 119516.0, 55734.0, 26518.0, 13699.0, 7852.0, 4679.0, 2988.0, 2034.0, 1389.0, 966.0, 720.0, 543.0, 369.0, 277.0, 183.0, 144.0, 99.0, 81.0, 51.0, 39.0, 37.0, 18.0, 14.0, 17.0, 10.0, 3.0, 2.0, 3.0, 2.0, 2.0], "bins": [-1.8642578125, -1.8073883056640625, -1.750518798828125, -1.6936492919921875, -1.63677978515625, -1.5799102783203125, -1.523040771484375, -1.4661712646484375, -1.4093017578125, -1.3524322509765625, -1.295562744140625, -1.2386932373046875, -1.18182373046875, -1.1249542236328125, -1.068084716796875, -1.0112152099609375, -0.954345703125, -0.8974761962890625, -0.840606689453125, -0.7837371826171875, -0.72686767578125, -0.6699981689453125, -0.613128662109375, -0.5562591552734375, -0.4993896484375, -0.4425201416015625, -0.385650634765625, -0.3287811279296875, -0.27191162109375, -0.2150421142578125, -0.158172607421875, -0.1013031005859375, -0.04443359375, 0.0124359130859375, 0.069305419921875, 0.1261749267578125, 0.18304443359375, 0.2399139404296875, 0.296783447265625, 0.3536529541015625, 0.4105224609375, 0.4673919677734375, 0.524261474609375, 0.5811309814453125, 0.63800048828125, 0.6948699951171875, 0.751739501953125, 0.8086090087890625, 0.865478515625, 0.9223480224609375, 0.979217529296875, 1.0360870361328125, 1.09295654296875, 1.1498260498046875, 1.206695556640625, 1.2635650634765625, 1.3204345703125, 1.3773040771484375, 1.434173583984375, 1.4910430908203125, 1.54791259765625, 1.6047821044921875, 1.661651611328125, 1.7185211181640625, 1.775390625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 6.0, 5.0, 9.0, 3.0, 7.0, 13.0, 11.0, 10.0, 17.0, 20.0, 23.0, 24.0, 24.0, 17.0, 34.0, 20.0, 30.0, 23.0, 30.0, 34.0, 43.0, 47.0, 30.0, 1059.0, 46.0, 33.0, 36.0, 49.0, 29.0, 35.0, 28.0, 22.0, 20.0, 24.0, 20.0, 19.0, 28.0, 15.0, 16.0, 12.0, 13.0, 12.0, 8.0, 4.0, 7.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.83984375, -4.68548583984375, -4.5311279296875, -4.37677001953125, -4.222412109375, -4.06805419921875, -3.9136962890625, -3.75933837890625, -3.60498046875, -3.45062255859375, -3.2962646484375, -3.14190673828125, -2.987548828125, -2.83319091796875, -2.6788330078125, -2.52447509765625, -2.3701171875, -2.21575927734375, -2.0614013671875, -1.90704345703125, -1.752685546875, -1.59832763671875, -1.4439697265625, -1.28961181640625, -1.13525390625, -0.98089599609375, -0.8265380859375, -0.67218017578125, -0.517822265625, -0.36346435546875, -0.2091064453125, -0.05474853515625, 0.099609375, 0.25396728515625, 0.4083251953125, 0.56268310546875, 0.717041015625, 0.87139892578125, 1.0257568359375, 1.18011474609375, 1.33447265625, 1.48883056640625, 1.6431884765625, 1.79754638671875, 1.951904296875, 2.10626220703125, 2.2606201171875, 2.41497802734375, 2.5693359375, 2.72369384765625, 2.8780517578125, 3.03240966796875, 3.186767578125, 3.34112548828125, 3.4954833984375, 3.64984130859375, 3.80419921875, 3.95855712890625, 4.1129150390625, 4.26727294921875, 4.421630859375, 4.57598876953125, 4.7303466796875, 4.88470458984375, 5.0390625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 5.0, 4.0, 9.0, 13.0, 12.0, 26.0, 34.0, 57.0, 63.0, 98.0, 137.0, 192.0, 336.0, 508.0, 788.0, 1332.0, 2236.0, 4128.0, 7818.0, 17474.0, 45287.0, 131899.0, 524486.0, 1083668.0, 175064.0, 58671.0, 21975.0, 9559.0, 4615.0, 2573.0, 1471.0, 905.0, 570.0, 397.0, 234.0, 161.0, 102.0, 86.0, 46.0, 23.0, 22.0, 12.0, 18.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.5009765625, -1.454254150390625, -1.40753173828125, -1.360809326171875, -1.3140869140625, -1.267364501953125, -1.22064208984375, -1.173919677734375, -1.127197265625, -1.080474853515625, -1.03375244140625, -0.987030029296875, -0.9403076171875, -0.893585205078125, -0.84686279296875, -0.800140380859375, -0.75341796875, -0.706695556640625, -0.65997314453125, -0.613250732421875, -0.5665283203125, -0.519805908203125, -0.47308349609375, -0.426361083984375, -0.379638671875, -0.332916259765625, -0.28619384765625, -0.239471435546875, -0.1927490234375, -0.146026611328125, -0.09930419921875, -0.052581787109375, -0.005859375, 0.040863037109375, 0.08758544921875, 0.134307861328125, 0.1810302734375, 0.227752685546875, 0.27447509765625, 0.321197509765625, 0.367919921875, 0.414642333984375, 0.46136474609375, 0.508087158203125, 0.5548095703125, 0.601531982421875, 0.64825439453125, 0.694976806640625, 0.74169921875, 0.788421630859375, 0.83514404296875, 0.881866455078125, 0.9285888671875, 0.975311279296875, 1.02203369140625, 1.068756103515625, 1.115478515625, 1.162200927734375, 1.20892333984375, 1.255645751953125, 1.3023681640625, 1.349090576171875, 1.39581298828125, 1.442535400390625, 1.4892578125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 8.0, 18.0, 20.0, 42.0, 83.0, 171.0, 227.0, 170.0, 96.0, 45.0, 22.0, 21.0, 11.0, 9.0, 8.0, 5.0, 4.0, 5.0, 0.0, 5.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.419677734375, -0.4054985046386719, -0.39131927490234375, -0.3771400451660156, -0.3629608154296875, -0.3487815856933594, -0.33460235595703125, -0.3204231262207031, -0.306243896484375, -0.2920646667480469, -0.27788543701171875, -0.2637062072753906, -0.2495269775390625, -0.23534774780273438, -0.22116851806640625, -0.20698928833007812, -0.19281005859375, -0.17863082885742188, -0.16445159912109375, -0.15027236938476562, -0.1360931396484375, -0.12191390991210938, -0.10773468017578125, -0.09355545043945312, -0.079376220703125, -0.06519699096679688, -0.05101776123046875, -0.036838531494140625, -0.0226593017578125, -0.008480072021484375, 0.00569915771484375, 0.019878387451171875, 0.0340576171875, 0.048236846923828125, 0.06241607666015625, 0.07659530639648438, 0.0907745361328125, 0.10495376586914062, 0.11913299560546875, 0.13331222534179688, 0.147491455078125, 0.16167068481445312, 0.17584991455078125, 0.19002914428710938, 0.2042083740234375, 0.21838760375976562, 0.23256683349609375, 0.24674606323242188, 0.26092529296875, 0.2751045227050781, 0.28928375244140625, 0.3034629821777344, 0.3176422119140625, 0.3318214416503906, 0.34600067138671875, 0.3601799011230469, 0.374359130859375, 0.3885383605957031, 0.40271759033203125, 0.4168968200683594, 0.4310760498046875, 0.4452552795410156, 0.45943450927734375, 0.4736137390136719, 0.48779296875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 2.0, 0.0, 7.0, 1.0, 6.0, 8.0, 10.0, 11.0, 14.0, 31.0, 42.0, 83.0, 120.0, 282.0, 1418.0, 1041163.0, 4629.0, 358.0, 134.0, 103.0, 44.0, 24.0, 21.0, 11.0, 7.0, 10.0, 6.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.6640625, -10.3560791015625, -10.048095703125, -9.7401123046875, -9.43212890625, -9.1241455078125, -8.816162109375, -8.5081787109375, -8.2001953125, -7.8922119140625, -7.584228515625, -7.2762451171875, -6.96826171875, -6.6602783203125, -6.352294921875, -6.0443115234375, -5.736328125, -5.4283447265625, -5.120361328125, -4.8123779296875, -4.50439453125, -4.1964111328125, -3.888427734375, -3.5804443359375, -3.2724609375, -2.9644775390625, -2.656494140625, -2.3485107421875, -2.04052734375, -1.7325439453125, -1.424560546875, -1.1165771484375, -0.80859375, -0.5006103515625, -0.192626953125, 0.1153564453125, 0.42333984375, 0.7313232421875, 1.039306640625, 1.3472900390625, 1.6552734375, 1.9632568359375, 2.271240234375, 2.5792236328125, 2.88720703125, 3.1951904296875, 3.503173828125, 3.8111572265625, 4.119140625, 4.4271240234375, 4.735107421875, 5.0430908203125, 5.35107421875, 5.6590576171875, 5.967041015625, 6.2750244140625, 6.5830078125, 6.8909912109375, 7.198974609375, 7.5069580078125, 7.81494140625, 8.1229248046875, 8.430908203125, 8.7388916015625, 9.046875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 8.0, 13.0, 59.0, 251.0, 402.0, 212.0, 56.0, 11.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6390513181686401, -0.6128795146942139, -0.5867077708244324, -0.5605359673500061, -0.5343642234802246, -0.5081924200057983, -0.48202061653137207, -0.4558488428592682, -0.4296770691871643, -0.4035052955150604, -0.37733352184295654, -0.3511617183685303, -0.3249899446964264, -0.2988181710243225, -0.27264636754989624, -0.24647459387779236, -0.22030282020568848, -0.1941310465335846, -0.16795925796031952, -0.14178746938705444, -0.11561569571495056, -0.08944392204284668, -0.0632721334695816, -0.03710034489631653, -0.010928571224212646, 0.015243209898471832, 0.04141499102115631, 0.06758677214384079, 0.09375855326652527, 0.11993032693862915, 0.14610211551189423, 0.1722739040851593, 0.19844567775726318, 0.22461745142936707, 0.25078922510147095, 0.2769610285758972, 0.3031328022480011, 0.329304575920105, 0.35547637939453125, 0.38164815306663513, 0.407819926738739, 0.4339917004108429, 0.4601634740829468, 0.48633527755737305, 0.5125070810317993, 0.5386788249015808, 0.5648506283760071, 0.5910223722457886, 0.6171941757202148, 0.6433659791946411, 0.6695377230644226, 0.6957095265388489, 0.7218812704086304, 0.7480530738830566, 0.7742248773574829, 0.8003966808319092, 0.8265684247016907, 0.8527402281761169, 0.8789119720458984, 0.9050837755203247, 0.931255578994751, 0.9574273228645325, 0.9835991263389587, 1.0097708702087402, 1.0359426736831665]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 0.0, 5.0, 9.0, 5.0, 4.0, 9.0, 13.0, 11.0, 19.0, 11.0, 14.0, 14.0, 32.0, 19.0, 22.0, 33.0, 33.0, 36.0, 33.0, 31.0, 39.0, 35.0, 39.0, 32.0, 31.0, 32.0, 30.0, 30.0, 39.0, 44.0, 31.0, 32.0, 36.0, 26.0, 20.0, 25.0, 22.0, 11.0, 13.0, 13.0, 14.0, 16.0, 12.0, 7.0, 4.0, 3.0, 1.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2659212350845337, -0.2571878433227539, -0.2484544813632965, -0.23972110450267792, -0.23098772764205933, -0.22225433588027954, -0.21352095901966095, -0.20478758215904236, -0.19605420529842377, -0.18732082843780518, -0.17858745157718658, -0.169854074716568, -0.1611206829547882, -0.1523873209953308, -0.14365392923355103, -0.13492055237293243, -0.12618717551231384, -0.11745379865169525, -0.10872042179107666, -0.09998703747987747, -0.09125366061925888, -0.08252028375864029, -0.0737868994474411, -0.06505352258682251, -0.05632014572620392, -0.04758676886558533, -0.03885338827967644, -0.030120009556412697, -0.021386630833148956, -0.012653253972530365, -0.003919873386621475, 0.0048135071992874146, 0.013546884059906006, 0.022280262783169746, 0.031013641506433487, 0.03974702209234238, 0.04848039895296097, 0.05721377581357956, 0.06594716012477875, 0.07468053698539734, 0.08341391384601593, 0.09214729070663452, 0.10088066756725311, 0.1096140518784523, 0.11834742873907089, 0.1270807981491089, 0.13581418991088867, 0.14454756677150726, 0.15328094363212585, 0.16201432049274445, 0.17074769735336304, 0.17948107421398163, 0.18821445107460022, 0.19694784283638, 0.2056812196969986, 0.2144145965576172, 0.22314797341823578, 0.23188135027885437, 0.24061472713947296, 0.24934810400009155, 0.25808149576187134, 0.26681485772132874, 0.2755482494831085, 0.2842816114425659, 0.2930150032043457]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 1.0, 7.0, 6.0, 8.0, 13.0, 13.0, 25.0, 15.0, 21.0, 18.0, 26.0, 29.0, 22.0, 30.0, 32.0, 46.0, 36.0, 54.0, 48.0, 59.0, 53.0, 52.0, 54.0, 43.0, 33.0, 35.0, 33.0, 20.0, 23.0, 22.0, 21.0, 29.0, 21.0, 11.0, 8.0, 8.0, 11.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.3515625, -9.09783935546875, -8.8441162109375, -8.59039306640625, -8.336669921875, -8.08294677734375, -7.8292236328125, -7.57550048828125, -7.32177734375, -7.06805419921875, -6.8143310546875, -6.56060791015625, -6.306884765625, -6.05316162109375, -5.7994384765625, -5.54571533203125, -5.2919921875, -5.03826904296875, -4.7845458984375, -4.53082275390625, -4.277099609375, -4.02337646484375, -3.7696533203125, -3.51593017578125, -3.26220703125, -3.00848388671875, -2.7547607421875, -2.50103759765625, -2.247314453125, -1.99359130859375, -1.7398681640625, -1.48614501953125, -1.232421875, -0.97869873046875, -0.7249755859375, -0.47125244140625, -0.217529296875, 0.03619384765625, 0.2899169921875, 0.54364013671875, 0.79736328125, 1.05108642578125, 1.3048095703125, 1.55853271484375, 1.812255859375, 2.06597900390625, 2.3197021484375, 2.57342529296875, 2.8271484375, 3.08087158203125, 3.3345947265625, 3.58831787109375, 3.842041015625, 4.09576416015625, 4.3494873046875, 4.60321044921875, 4.85693359375, 5.11065673828125, 5.3643798828125, 5.61810302734375, 5.871826171875, 6.12554931640625, 6.3792724609375, 6.63299560546875, 6.88671875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 7.0, 9.0, 18.0, 30.0, 32.0, 47.0, 85.0, 130.0, 173.0, 331.0, 511.0, 873.0, 1537.0, 2693.0, 5075.0, 9376.0, 17734.0, 35179.0, 71032.0, 155169.0, 297704.0, 236230.0, 108080.0, 51454.0, 25536.0, 13427.0, 7119.0, 3820.0, 2142.0, 1203.0, 619.0, 409.0, 278.0, 169.0, 91.0, 67.0, 45.0, 38.0, 30.0, 14.0, 12.0, 5.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2578125, -7.98046875, -7.703125, -7.42578125, -7.1484375, -6.87109375, -6.59375, -6.31640625, -6.0390625, -5.76171875, -5.484375, -5.20703125, -4.9296875, -4.65234375, -4.375, -4.09765625, -3.8203125, -3.54296875, -3.265625, -2.98828125, -2.7109375, -2.43359375, -2.15625, -1.87890625, -1.6015625, -1.32421875, -1.046875, -0.76953125, -0.4921875, -0.21484375, 0.0625, 0.33984375, 0.6171875, 0.89453125, 1.171875, 1.44921875, 1.7265625, 2.00390625, 2.28125, 2.55859375, 2.8359375, 3.11328125, 3.390625, 3.66796875, 3.9453125, 4.22265625, 4.5, 4.77734375, 5.0546875, 5.33203125, 5.609375, 5.88671875, 6.1640625, 6.44140625, 6.71875, 6.99609375, 7.2734375, 7.55078125, 7.828125, 8.10546875, 8.3828125, 8.66015625, 8.9375, 9.21484375, 9.4921875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 4.0, 8.0, 5.0, 5.0, 7.0, 5.0, 8.0, 17.0, 15.0, 21.0, 23.0, 39.0, 32.0, 25.0, 23.0, 33.0, 58.0, 72.0, 84.0, 197.0, 245.0, 1302.0, 228.0, 118.0, 79.0, 46.0, 55.0, 38.0, 38.0, 29.0, 26.0, 27.0, 16.0, 26.0, 22.0, 18.0, 5.0, 6.0, 7.0, 7.0, 9.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-17.890625, -17.3822021484375, -16.873779296875, -16.3653564453125, -15.85693359375, -15.3485107421875, -14.840087890625, -14.3316650390625, -13.8232421875, -13.3148193359375, -12.806396484375, -12.2979736328125, -11.78955078125, -11.2811279296875, -10.772705078125, -10.2642822265625, -9.755859375, -9.2474365234375, -8.739013671875, -8.2305908203125, -7.72216796875, -7.2137451171875, -6.705322265625, -6.1968994140625, -5.6884765625, -5.1800537109375, -4.671630859375, -4.1632080078125, -3.65478515625, -3.1463623046875, -2.637939453125, -2.1295166015625, -1.62109375, -1.1126708984375, -0.604248046875, -0.0958251953125, 0.41259765625, 0.9210205078125, 1.429443359375, 1.9378662109375, 2.4462890625, 2.9547119140625, 3.463134765625, 3.9715576171875, 4.47998046875, 4.9884033203125, 5.496826171875, 6.0052490234375, 6.513671875, 7.0220947265625, 7.530517578125, 8.0389404296875, 8.54736328125, 9.0557861328125, 9.564208984375, 10.0726318359375, 10.5810546875, 11.0894775390625, 11.597900390625, 12.1063232421875, 12.61474609375, 13.1231689453125, 13.631591796875, 14.1400146484375, 14.6484375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 4.0, 5.0, 6.0, 13.0, 8.0, 17.0, 34.0, 30.0, 38.0, 52.0, 86.0, 94.0, 152.0, 226.0, 343.0, 536.0, 1032.0, 4089.0, 590850.0, 2538024.0, 7128.0, 1182.0, 577.0, 339.0, 240.0, 154.0, 114.0, 101.0, 53.0, 40.0, 29.0, 26.0, 16.0, 14.0, 10.0, 14.0, 5.0, 0.0, 6.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-50.53125, -48.90625, -47.28125, -45.65625, -44.03125, -42.40625, -40.78125, -39.15625, -37.53125, -35.90625, -34.28125, -32.65625, -31.03125, -29.40625, -27.78125, -26.15625, -24.53125, -22.90625, -21.28125, -19.65625, -18.03125, -16.40625, -14.78125, -13.15625, -11.53125, -9.90625, -8.28125, -6.65625, -5.03125, -3.40625, -1.78125, -0.15625, 1.46875, 3.09375, 4.71875, 6.34375, 7.96875, 9.59375, 11.21875, 12.84375, 14.46875, 16.09375, 17.71875, 19.34375, 20.96875, 22.59375, 24.21875, 25.84375, 27.46875, 29.09375, 30.71875, 32.34375, 33.96875, 35.59375, 37.21875, 38.84375, 40.46875, 42.09375, 43.71875, 45.34375, 46.96875, 48.59375, 50.21875, 51.84375, 53.46875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 18.0, 91.0, 281.0, 429.0, 147.0, 40.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-278.3912353515625, -273.26239013671875, -268.1335144042969, -263.0046691894531, -257.8758239746094, -252.74696350097656, -247.61810302734375, -242.4892578125, -237.3603973388672, -232.23153686523438, -227.10269165039062, -221.9738311767578, -216.844970703125, -211.71612548828125, -206.58726501464844, -201.45840454101562, -196.32955932617188, -191.20069885253906, -186.0718536376953, -180.9429931640625, -175.8141326904297, -170.68528747558594, -165.55642700195312, -160.42758178710938, -155.2987060546875, -150.1698455810547, -145.04100036621094, -139.91213989257812, -134.7832794189453, -129.65443420410156, -124.52557373046875, -119.39672088623047, -114.26786804199219, -109.1390151977539, -104.0101547241211, -98.88130187988281, -93.75244903564453, -88.62359619140625, -83.49473571777344, -78.36588287353516, -73.23702239990234, -68.10816955566406, -62.979312896728516, -57.85045623779297, -52.72160339355469, -47.59274673461914, -42.463890075683594, -37.33503723144531, -32.206180572509766, -27.07732582092285, -21.948471069335938, -16.81961441040039, -11.690759658813477, -6.5619049072265625, -1.4330482482910156, 3.6958045959472656, 8.824661254882812, 13.953516006469727, 19.08237075805664, 24.211227416992188, 29.3400821685791, 34.468936920166016, 39.59779357910156, 44.726646423339844, 49.85550308227539]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 5.0, 11.0, 12.0, 11.0, 14.0, 22.0, 18.0, 32.0, 31.0, 36.0, 46.0, 32.0, 32.0, 43.0, 54.0, 51.0, 43.0, 52.0, 49.0, 43.0, 33.0, 41.0, 41.0, 40.0, 27.0, 29.0, 28.0, 23.0, 23.0, 17.0, 11.0, 3.0, 8.0, 14.0, 7.0, 4.0, 2.0, 6.0, 3.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.120872497558594, -47.44120407104492, -45.76153564453125, -44.08186721801758, -42.402198791503906, -40.7225341796875, -39.04286193847656, -37.363197326660156, -35.683528900146484, -34.00386047363281, -32.32419204711914, -30.64452362060547, -28.96485710144043, -27.285188674926758, -25.605520248413086, -23.925853729248047, -22.246183395385742, -20.56651496887207, -18.8868465423584, -17.20718002319336, -15.527511596679688, -13.847843170166016, -12.168174743652344, -10.488507270812988, -8.808838844299316, -7.129170894622803, -5.449502944946289, -3.769834518432617, -2.0901665687561035, -0.41049861907958984, 1.269169807434082, 2.9488372802734375, 4.628505706787109, 6.308173656463623, 7.987841606140137, 9.667510032653809, 11.347177505493164, 13.026845932006836, 14.706514358520508, 16.386180877685547, 18.06584930419922, 19.74551773071289, 21.425186157226562, 23.104854583740234, 24.784521102905273, 26.464189529418945, 28.143857955932617, 29.823524475097656, 31.50319480895996, 33.182861328125, 34.86252975463867, 36.542198181152344, 38.221866607666016, 39.90153503417969, 41.58120346069336, 43.26087188720703, 44.9405403137207, 46.620208740234375, 48.29987716674805, 49.97954559326172, 51.65921401977539, 53.33888244628906, 55.01854705810547, 56.69821548461914, 58.37788391113281]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 2.0, 6.0, 4.0, 14.0, 10.0, 9.0, 16.0, 12.0, 21.0, 19.0, 22.0, 21.0, 29.0, 31.0, 27.0, 33.0, 39.0, 23.0, 31.0, 40.0, 40.0, 52.0, 35.0, 46.0, 45.0, 40.0, 35.0, 33.0, 26.0, 39.0, 25.0, 27.0, 20.0, 19.0, 17.0, 18.0, 20.0, 14.0, 6.0, 7.0, 4.0, 6.0, 7.0, 5.0, 6.0, 1.0, 3.0], "bins": [-8.7421875, -8.51544189453125, -8.2886962890625, -8.06195068359375, -7.835205078125, -7.60845947265625, -7.3817138671875, -7.15496826171875, -6.92822265625, -6.70147705078125, -6.4747314453125, -6.24798583984375, -6.021240234375, -5.79449462890625, -5.5677490234375, -5.34100341796875, -5.1142578125, -4.88751220703125, -4.6607666015625, -4.43402099609375, -4.207275390625, -3.98052978515625, -3.7537841796875, -3.52703857421875, -3.30029296875, -3.07354736328125, -2.8468017578125, -2.62005615234375, -2.393310546875, -2.16656494140625, -1.9398193359375, -1.71307373046875, -1.486328125, -1.25958251953125, -1.0328369140625, -0.80609130859375, -0.579345703125, -0.35260009765625, -0.1258544921875, 0.10089111328125, 0.32763671875, 0.55438232421875, 0.7811279296875, 1.00787353515625, 1.234619140625, 1.46136474609375, 1.6881103515625, 1.91485595703125, 2.1416015625, 2.36834716796875, 2.5950927734375, 2.82183837890625, 3.048583984375, 3.27532958984375, 3.5020751953125, 3.72882080078125, 3.95556640625, 4.18231201171875, 4.4090576171875, 4.63580322265625, 4.862548828125, 5.08929443359375, 5.3160400390625, 5.54278564453125, 5.76953125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 6.0, 9.0, 8.0, 18.0, 20.0, 30.0, 35.0, 55.0, 75.0, 94.0, 116.0, 163.0, 229.0, 376.0, 561.0, 905.0, 1520.0, 2833.0, 6179.0, 16757.0, 70481.0, 590799.0, 2661463.0, 725323.0, 83115.0, 18721.0, 6671.0, 3186.0, 1653.0, 987.0, 580.0, 387.0, 263.0, 178.0, 137.0, 99.0, 71.0, 43.0, 40.0, 22.0, 21.0, 16.0, 3.0, 15.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-17.25, -16.685302734375, -16.12060546875, -15.555908203125, -14.9912109375, -14.426513671875, -13.86181640625, -13.297119140625, -12.732421875, -12.167724609375, -11.60302734375, -11.038330078125, -10.4736328125, -9.908935546875, -9.34423828125, -8.779541015625, -8.21484375, -7.650146484375, -7.08544921875, -6.520751953125, -5.9560546875, -5.391357421875, -4.82666015625, -4.261962890625, -3.697265625, -3.132568359375, -2.56787109375, -2.003173828125, -1.4384765625, -0.873779296875, -0.30908203125, 0.255615234375, 0.8203125, 1.385009765625, 1.94970703125, 2.514404296875, 3.0791015625, 3.643798828125, 4.20849609375, 4.773193359375, 5.337890625, 5.902587890625, 6.46728515625, 7.031982421875, 7.5966796875, 8.161376953125, 8.72607421875, 9.290771484375, 9.85546875, 10.420166015625, 10.98486328125, 11.549560546875, 12.1142578125, 12.678955078125, 13.24365234375, 13.808349609375, 14.373046875, 14.937744140625, 15.50244140625, 16.067138671875, 16.6318359375, 17.196533203125, 17.76123046875, 18.325927734375, 18.890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 9.0, 2.0, 2.0, 1.0, 8.0, 6.0, 11.0, 17.0, 26.0, 31.0, 39.0, 54.0, 65.0, 104.0, 115.0, 166.0, 207.0, 272.0, 383.0, 494.0, 488.0, 389.0, 312.0, 182.0, 162.0, 120.0, 110.0, 86.0, 52.0, 42.0, 35.0, 20.0, 17.0, 21.0, 12.0, 5.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.109375, -11.71875, -11.328125, -10.9375, -10.546875, -10.15625, -9.765625, -9.375, -8.984375, -8.59375, -8.203125, -7.8125, -7.421875, -7.03125, -6.640625, -6.25, -5.859375, -5.46875, -5.078125, -4.6875, -4.296875, -3.90625, -3.515625, -3.125, -2.734375, -2.34375, -1.953125, -1.5625, -1.171875, -0.78125, -0.390625, 0.0, 0.390625, 0.78125, 1.171875, 1.5625, 1.953125, 2.34375, 2.734375, 3.125, 3.515625, 3.90625, 4.296875, 4.6875, 5.078125, 5.46875, 5.859375, 6.25, 6.640625, 7.03125, 7.421875, 7.8125, 8.203125, 8.59375, 8.984375, 9.375, 9.765625, 10.15625, 10.546875, 10.9375, 11.328125, 11.71875, 12.109375, 12.5, 12.890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 6.0, 4.0, 6.0, 9.0, 15.0, 13.0, 41.0, 37.0, 49.0, 70.0, 111.0, 172.0, 270.0, 533.0, 1126.0, 2586.0, 7828.0, 33286.0, 221470.0, 2277625.0, 1464189.0, 149726.0, 24588.0, 6200.0, 2168.0, 900.0, 431.0, 252.0, 181.0, 109.0, 78.0, 50.0, 36.0, 29.0, 24.0, 17.0, 8.0, 8.0, 8.0, 9.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.1875, -20.5234375, -19.859375, -19.1953125, -18.53125, -17.8671875, -17.203125, -16.5390625, -15.875, -15.2109375, -14.546875, -13.8828125, -13.21875, -12.5546875, -11.890625, -11.2265625, -10.5625, -9.8984375, -9.234375, -8.5703125, -7.90625, -7.2421875, -6.578125, -5.9140625, -5.25, -4.5859375, -3.921875, -3.2578125, -2.59375, -1.9296875, -1.265625, -0.6015625, 0.0625, 0.7265625, 1.390625, 2.0546875, 2.71875, 3.3828125, 4.046875, 4.7109375, 5.375, 6.0390625, 6.703125, 7.3671875, 8.03125, 8.6953125, 9.359375, 10.0234375, 10.6875, 11.3515625, 12.015625, 12.6796875, 13.34375, 14.0078125, 14.671875, 15.3359375, 16.0, 16.6640625, 17.328125, 17.9921875, 18.65625, 19.3203125, 19.984375, 20.6484375, 21.3125]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 13.0, 132.0, 525.0, 288.0, 51.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-280.7438659667969, -272.155517578125, -263.56719970703125, -254.97885131835938, -246.39051818847656, -237.80218505859375, -229.21383666992188, -220.62550354003906, -212.03717041015625, -203.44883728027344, -194.86050415039062, -186.27215576171875, -177.68382263183594, -169.09548950195312, -160.50714111328125, -151.91880798339844, -143.33047485351562, -134.7421417236328, -126.15380096435547, -117.56546020507812, -108.97712707519531, -100.3887939453125, -91.80045318603516, -83.21211242675781, -74.623779296875, -66.03544616699219, -57.447105407714844, -48.858768463134766, -40.27043151855469, -31.68209457397461, -23.09375762939453, -14.505420684814453, -5.9171142578125, 2.671222686767578, 11.259559631347656, 19.847896575927734, 28.436233520507812, 37.02457046508789, 45.61290740966797, 54.20124435424805, 62.789581298828125, 71.37791442871094, 79.96625518798828, 88.55459594726562, 97.14292907714844, 105.73126220703125, 114.3196029663086, 122.90794372558594, 131.49627685546875, 140.08460998535156, 148.67294311523438, 157.26129150390625, 165.84962463378906, 174.43795776367188, 183.02630615234375, 191.61463928222656, 200.20297241210938, 208.7913055419922, 217.379638671875, 225.96798706054688, 234.5563201904297, 243.1446533203125, 251.73300170898438, 260.3213195800781, 268.90966796875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 6.0, 7.0, 8.0, 9.0, 13.0, 17.0, 14.0, 15.0, 17.0, 30.0, 24.0, 28.0, 37.0, 46.0, 26.0, 45.0, 45.0, 41.0, 34.0, 42.0, 52.0, 42.0, 46.0, 40.0, 29.0, 28.0, 36.0, 34.0, 20.0, 25.0, 19.0, 30.0, 19.0, 22.0, 11.0, 11.0, 6.0, 9.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.71988296508789, -42.24472427368164, -40.769569396972656, -39.294410705566406, -37.819252014160156, -36.344093322753906, -34.86893844604492, -33.39377975463867, -31.918622970581055, -30.443466186523438, -28.968307495117188, -27.49315071105957, -26.017993927001953, -24.542835235595703, -23.067678451538086, -21.59252166748047, -20.11736297607422, -18.6422061920166, -17.16704750061035, -15.691890716552734, -14.2167329788208, -12.741575241088867, -11.26641845703125, -9.791260719299316, -8.316102981567383, -6.840945243835449, -5.365787982940674, -3.8906307220458984, -2.415472984313965, -0.9403152465820312, 0.5348415374755859, 2.0099992752075195, 3.485157012939453, 4.960314750671387, 6.435472011566162, 7.9106292724609375, 9.385787010192871, 10.860944747924805, 12.336101531982422, 13.811259269714355, 15.286417007446289, 16.761573791503906, 18.236732482910156, 19.711889266967773, 21.18704605102539, 22.66220474243164, 24.137361526489258, 25.612518310546875, 27.087677001953125, 28.562833786010742, 30.037992477416992, 31.51314926147461, 32.98830795288086, 34.463462829589844, 35.938621520996094, 37.413780212402344, 38.888938903808594, 40.364097595214844, 41.83925247192383, 43.31441116333008, 44.78956985473633, 46.26472473144531, 47.73988342285156, 49.21504211425781, 50.6901969909668]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 2.0, 7.0, 9.0, 15.0, 14.0, 13.0, 21.0, 12.0, 26.0, 23.0, 37.0, 35.0, 27.0, 24.0, 29.0, 43.0, 50.0, 42.0, 40.0, 52.0, 44.0, 51.0, 31.0, 47.0, 46.0, 49.0, 27.0, 27.0, 25.0, 20.0, 17.0, 22.0, 13.0, 11.0, 17.0, 6.0, 2.0, 7.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.0390625, -7.81646728515625, -7.5938720703125, -7.37127685546875, -7.148681640625, -6.92608642578125, -6.7034912109375, -6.48089599609375, -6.25830078125, -6.03570556640625, -5.8131103515625, -5.59051513671875, -5.367919921875, -5.14532470703125, -4.9227294921875, -4.70013427734375, -4.4775390625, -4.25494384765625, -4.0323486328125, -3.80975341796875, -3.587158203125, -3.36456298828125, -3.1419677734375, -2.91937255859375, -2.69677734375, -2.47418212890625, -2.2515869140625, -2.02899169921875, -1.806396484375, -1.58380126953125, -1.3612060546875, -1.13861083984375, -0.916015625, -0.69342041015625, -0.4708251953125, -0.24822998046875, -0.025634765625, 0.19696044921875, 0.4195556640625, 0.64215087890625, 0.86474609375, 1.08734130859375, 1.3099365234375, 1.53253173828125, 1.755126953125, 1.97772216796875, 2.2003173828125, 2.42291259765625, 2.6455078125, 2.86810302734375, 3.0906982421875, 3.31329345703125, 3.535888671875, 3.75848388671875, 3.9810791015625, 4.20367431640625, 4.42626953125, 4.64886474609375, 4.8714599609375, 5.09405517578125, 5.316650390625, 5.53924560546875, 5.7618408203125, 5.98443603515625, 6.20703125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 10.0, 5.0, 5.0, 17.0, 47.0, 52.0, 64.0, 118.0, 173.0, 305.0, 503.0, 725.0, 1142.0, 1981.0, 3359.0, 5765.0, 10219.0, 18402.0, 33664.0, 60390.0, 104827.0, 161263.0, 198702.0, 173783.0, 116676.0, 68533.0, 38688.0, 21425.0, 11727.0, 6573.0, 3637.0, 2181.0, 1305.0, 834.0, 518.0, 326.0, 224.0, 137.0, 92.0, 57.0, 44.0, 27.0, 12.0, 6.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9453125, -0.9163284301757812, -0.8873443603515625, -0.8583602905273438, -0.829376220703125, -0.8003921508789062, -0.7714080810546875, -0.7424240112304688, -0.71343994140625, -0.6844558715820312, -0.6554718017578125, -0.6264877319335938, -0.597503662109375, -0.5685195922851562, -0.5395355224609375, -0.5105514526367188, -0.4815673828125, -0.45258331298828125, -0.4235992431640625, -0.39461517333984375, -0.365631103515625, -0.33664703369140625, -0.3076629638671875, -0.27867889404296875, -0.24969482421875, -0.22071075439453125, -0.1917266845703125, -0.16274261474609375, -0.133758544921875, -0.10477447509765625, -0.0757904052734375, -0.04680633544921875, -0.017822265625, 0.01116180419921875, 0.0401458740234375, 0.06912994384765625, 0.098114013671875, 0.12709808349609375, 0.1560821533203125, 0.18506622314453125, 0.21405029296875, 0.24303436279296875, 0.2720184326171875, 0.30100250244140625, 0.329986572265625, 0.35897064208984375, 0.3879547119140625, 0.41693878173828125, 0.4459228515625, 0.47490692138671875, 0.5038909912109375, 0.5328750610351562, 0.561859130859375, 0.5908432006835938, 0.6198272705078125, 0.6488113403320312, 0.67779541015625, 0.7067794799804688, 0.7357635498046875, 0.7647476196289062, 0.793731689453125, 0.8227157592773438, 0.8516998291015625, 0.8806838989257812, 0.90966796875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 4.0, 3.0, 8.0, 8.0, 7.0, 13.0, 16.0, 20.0, 17.0, 22.0, 31.0, 19.0, 24.0, 41.0, 36.0, 23.0, 49.0, 34.0, 44.0, 35.0, 39.0, 1066.0, 36.0, 34.0, 35.0, 43.0, 32.0, 28.0, 28.0, 33.0, 31.0, 22.0, 27.0, 14.0, 18.0, 15.0, 17.0, 12.0, 7.0, 5.0, 8.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.8203125, -5.65704345703125, -5.4937744140625, -5.33050537109375, -5.167236328125, -5.00396728515625, -4.8406982421875, -4.67742919921875, -4.51416015625, -4.35089111328125, -4.1876220703125, -4.02435302734375, -3.861083984375, -3.69781494140625, -3.5345458984375, -3.37127685546875, -3.2080078125, -3.04473876953125, -2.8814697265625, -2.71820068359375, -2.554931640625, -2.39166259765625, -2.2283935546875, -2.06512451171875, -1.90185546875, -1.73858642578125, -1.5753173828125, -1.41204833984375, -1.248779296875, -1.08551025390625, -0.9222412109375, -0.75897216796875, -0.595703125, -0.43243408203125, -0.2691650390625, -0.10589599609375, 0.057373046875, 0.22064208984375, 0.3839111328125, 0.54718017578125, 0.71044921875, 0.87371826171875, 1.0369873046875, 1.20025634765625, 1.363525390625, 1.52679443359375, 1.6900634765625, 1.85333251953125, 2.0166015625, 2.17987060546875, 2.3431396484375, 2.50640869140625, 2.669677734375, 2.83294677734375, 2.9962158203125, 3.15948486328125, 3.32275390625, 3.48602294921875, 3.6492919921875, 3.81256103515625, 3.975830078125, 4.13909912109375, 4.3023681640625, 4.46563720703125, 4.62890625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 11.0, 8.0, 9.0, 23.0, 39.0, 46.0, 91.0, 138.0, 218.0, 387.0, 632.0, 1052.0, 1936.0, 3564.0, 6917.0, 13954.0, 29258.0, 61769.0, 128762.0, 294097.0, 1108960.0, 233980.0, 108982.0, 52409.0, 24492.0, 12256.0, 5937.0, 3161.0, 1700.0, 911.0, 546.0, 331.0, 197.0, 125.0, 72.0, 52.0, 38.0, 38.0, 18.0, 9.0, 3.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75341796875, -0.7294158935546875, -0.705413818359375, -0.6814117431640625, -0.65740966796875, -0.6334075927734375, -0.609405517578125, -0.5854034423828125, -0.5614013671875, -0.5373992919921875, -0.513397216796875, -0.4893951416015625, -0.46539306640625, -0.4413909912109375, -0.417388916015625, -0.3933868408203125, -0.369384765625, -0.3453826904296875, -0.321380615234375, -0.2973785400390625, -0.27337646484375, -0.2493743896484375, -0.225372314453125, -0.2013702392578125, -0.1773681640625, -0.1533660888671875, -0.129364013671875, -0.1053619384765625, -0.08135986328125, -0.0573577880859375, -0.033355712890625, -0.0093536376953125, 0.0146484375, 0.0386505126953125, 0.062652587890625, 0.0866546630859375, 0.11065673828125, 0.1346588134765625, 0.158660888671875, 0.1826629638671875, 0.2066650390625, 0.2306671142578125, 0.254669189453125, 0.2786712646484375, 0.30267333984375, 0.3266754150390625, 0.350677490234375, 0.3746795654296875, 0.398681640625, 0.4226837158203125, 0.446685791015625, 0.4706878662109375, 0.49468994140625, 0.5186920166015625, 0.542694091796875, 0.5666961669921875, 0.5906982421875, 0.6147003173828125, 0.638702392578125, 0.6627044677734375, 0.68670654296875, 0.7107086181640625, 0.734710693359375, 0.7587127685546875, 0.78271484375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 6.0, 3.0, 7.0, 8.0, 9.0, 11.0, 20.0, 26.0, 45.0, 78.0, 111.0, 205.0, 183.0, 101.0, 55.0, 46.0, 21.0, 11.0, 11.0, 6.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.174072265625, -0.16802978515625, -0.1619873046875, -0.15594482421875, -0.14990234375, -0.14385986328125, -0.1378173828125, -0.13177490234375, -0.125732421875, -0.11968994140625, -0.1136474609375, -0.10760498046875, -0.1015625, -0.09552001953125, -0.0894775390625, -0.08343505859375, -0.077392578125, -0.07135009765625, -0.0653076171875, -0.05926513671875, -0.05322265625, -0.04718017578125, -0.0411376953125, -0.03509521484375, -0.029052734375, -0.02301025390625, -0.0169677734375, -0.01092529296875, -0.0048828125, 0.00115966796875, 0.0072021484375, 0.01324462890625, 0.019287109375, 0.02532958984375, 0.0313720703125, 0.03741455078125, 0.04345703125, 0.04949951171875, 0.0555419921875, 0.06158447265625, 0.067626953125, 0.07366943359375, 0.0797119140625, 0.08575439453125, 0.091796875, 0.09783935546875, 0.1038818359375, 0.10992431640625, 0.115966796875, 0.12200927734375, 0.1280517578125, 0.13409423828125, 0.14013671875, 0.14617919921875, 0.1522216796875, 0.15826416015625, 0.164306640625, 0.17034912109375, 0.1763916015625, 0.18243408203125, 0.1884765625, 0.19451904296875, 0.2005615234375, 0.20660400390625, 0.212646484375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 8.0, 11.0, 7.0, 11.0, 16.0, 18.0, 14.0, 30.0, 51.0, 63.0, 103.0, 232.0, 501.0, 3142.0, 1018819.0, 23663.0, 1062.0, 337.0, 150.0, 84.0, 64.0, 39.0, 27.0, 22.0, 13.0, 16.0, 12.0, 6.0, 6.0, 5.0, 7.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.603515625, -3.49981689453125, -3.3961181640625, -3.29241943359375, -3.188720703125, -3.08502197265625, -2.9813232421875, -2.87762451171875, -2.77392578125, -2.67022705078125, -2.5665283203125, -2.46282958984375, -2.359130859375, -2.25543212890625, -2.1517333984375, -2.04803466796875, -1.9443359375, -1.84063720703125, -1.7369384765625, -1.63323974609375, -1.529541015625, -1.42584228515625, -1.3221435546875, -1.21844482421875, -1.11474609375, -1.01104736328125, -0.9073486328125, -0.80364990234375, -0.699951171875, -0.59625244140625, -0.4925537109375, -0.38885498046875, -0.28515625, -0.18145751953125, -0.0777587890625, 0.02593994140625, 0.129638671875, 0.23333740234375, 0.3370361328125, 0.44073486328125, 0.54443359375, 0.64813232421875, 0.7518310546875, 0.85552978515625, 0.959228515625, 1.06292724609375, 1.1666259765625, 1.27032470703125, 1.3740234375, 1.47772216796875, 1.5814208984375, 1.68511962890625, 1.788818359375, 1.89251708984375, 1.9962158203125, 2.09991455078125, 2.20361328125, 2.30731201171875, 2.4110107421875, 2.51470947265625, 2.618408203125, 2.72210693359375, 2.8258056640625, 2.92950439453125, 3.033203125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 24.0, 228.0, 567.0, 160.0, 26.0, 4.0, 2.0], "bins": [-1.2729188203811646, -1.2514715194702148, -1.2300242185592651, -1.2085769176483154, -1.1871296167373657, -1.165682315826416, -1.1442350149154663, -1.1227877140045166, -1.1013405323028564, -1.0798932313919067, -1.058445930480957, -1.0369986295700073, -1.0155513286590576, -0.9941040873527527, -0.972656786441803, -0.9512094855308533, -0.9297621250152588, -0.9083148241043091, -0.8868675231933594, -0.8654202222824097, -0.84397292137146, -0.822525680065155, -0.8010783791542053, -0.7796310782432556, -0.7581837773323059, -0.7367364764213562, -0.7152891755104065, -0.6938418745994568, -0.6723946332931519, -0.6509473323822021, -0.6295000314712524, -0.6080527305603027, -0.5866054892539978, -0.5651581883430481, -0.5437108874320984, -0.5222635865211487, -0.5008163452148438, -0.47936901450157166, -0.45792174339294434, -0.43647444248199463, -0.4150271415710449, -0.3935798406600952, -0.3721325397491455, -0.3506852686405182, -0.3292379677295685, -0.3077906668186188, -0.28634339570999146, -0.26489609479904175, -0.24344877898693085, -0.22200149297714233, -0.20055419206619263, -0.17910689115524292, -0.1576596051454544, -0.1362123191356659, -0.11476501822471619, -0.09331773221492767, -0.07187043130397797, -0.050423137843608856, -0.028975844383239746, -0.007528550922870636, 0.013918742537498474, 0.035366035997867584, 0.056813329458236694, 0.07826061546802521, 0.09970791637897491]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 6.0, 7.0, 8.0, 9.0, 12.0, 13.0, 13.0, 12.0, 20.0, 14.0, 24.0, 34.0, 19.0, 37.0, 31.0, 28.0, 30.0, 46.0, 38.0, 52.0, 43.0, 38.0, 36.0, 35.0, 52.0, 51.0, 35.0, 30.0, 25.0, 37.0, 20.0, 23.0, 23.0, 10.0, 18.0, 8.0, 17.0, 9.0, 5.0, 10.0, 11.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12928873300552368, -0.1251937597990036, -0.12109877169132233, -0.11700379103422165, -0.11290881037712097, -0.10881383717060089, -0.10471885651350021, -0.10062387585639954, -0.09652889519929886, -0.09243391454219818, -0.0883389338850975, -0.08424395322799683, -0.08014898002147675, -0.07605399191379547, -0.07195901870727539, -0.06786403805017471, -0.06376905739307404, -0.05967407673597336, -0.05557909607887268, -0.0514841191470623, -0.047389138489961624, -0.04329415783286095, -0.03919918090105057, -0.03510420024394989, -0.031009219586849213, -0.026914238929748535, -0.022819260135293007, -0.01872428134083748, -0.014629300683736801, -0.010534320026636124, -0.006439341232180595, -0.002344362437725067, 0.0017506182193756104, 0.005845597945153713, 0.009940577670931816, 0.014035557396709919, 0.018130537122488022, 0.0222255177795887, 0.026320496574044228, 0.030415475368499756, 0.03451045602560043, 0.03860543668270111, 0.04270041733980179, 0.04679539427161217, 0.050890374928712845, 0.05498535558581352, 0.0590803325176239, 0.06317531317472458, 0.06727029383182526, 0.07136527448892593, 0.07546025514602661, 0.07955523580312729, 0.08365021646022797, 0.08774518966674805, 0.09184017032384872, 0.0959351509809494, 0.10003013163805008, 0.10412511229515076, 0.10822009295225143, 0.11231507360935211, 0.11641004681587219, 0.12050503492355347, 0.12460000813007355, 0.12869498133659363, 0.1327899694442749]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 11.0, 5.0, 10.0, 6.0, 9.0, 10.0, 19.0, 14.0, 23.0, 18.0, 22.0, 29.0, 20.0, 28.0, 27.0, 31.0, 39.0, 28.0, 42.0, 58.0, 38.0, 38.0, 31.0, 44.0, 39.0, 48.0, 40.0, 30.0, 27.0, 34.0, 28.0, 24.0, 19.0, 17.0, 12.0, 8.0, 12.0, 10.0, 12.0, 7.0, 7.0, 6.0, 5.0, 6.0, 1.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.66796875, -6.471923828125, -6.27587890625, -6.079833984375, -5.8837890625, -5.687744140625, -5.49169921875, -5.295654296875, -5.099609375, -4.903564453125, -4.70751953125, -4.511474609375, -4.3154296875, -4.119384765625, -3.92333984375, -3.727294921875, -3.53125, -3.335205078125, -3.13916015625, -2.943115234375, -2.7470703125, -2.551025390625, -2.35498046875, -2.158935546875, -1.962890625, -1.766845703125, -1.57080078125, -1.374755859375, -1.1787109375, -0.982666015625, -0.78662109375, -0.590576171875, -0.39453125, -0.198486328125, -0.00244140625, 0.193603515625, 0.3896484375, 0.585693359375, 0.78173828125, 0.977783203125, 1.173828125, 1.369873046875, 1.56591796875, 1.761962890625, 1.9580078125, 2.154052734375, 2.35009765625, 2.546142578125, 2.7421875, 2.938232421875, 3.13427734375, 3.330322265625, 3.5263671875, 3.722412109375, 3.91845703125, 4.114501953125, 4.310546875, 4.506591796875, 4.70263671875, 4.898681640625, 5.0947265625, 5.290771484375, 5.48681640625, 5.682861328125, 5.87890625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 10.0, 9.0, 15.0, 15.0, 27.0, 31.0, 44.0, 72.0, 81.0, 102.0, 162.0, 202.0, 280.0, 383.0, 607.0, 949.0, 1560.0, 2320.0, 4057.0, 6969.0, 12600.0, 24353.0, 51139.0, 121030.0, 339015.0, 287378.0, 102029.0, 44223.0, 21643.0, 11104.0, 6120.0, 3713.0, 2147.0, 1327.0, 875.0, 567.0, 398.0, 253.0, 199.0, 151.0, 109.0, 69.0, 56.0, 42.0, 30.0, 34.0, 21.0, 20.0, 5.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.78515625, -7.53326416015625, -7.2813720703125, -7.02947998046875, -6.777587890625, -6.52569580078125, -6.2738037109375, -6.02191162109375, -5.77001953125, -5.51812744140625, -5.2662353515625, -5.01434326171875, -4.762451171875, -4.51055908203125, -4.2586669921875, -4.00677490234375, -3.7548828125, -3.50299072265625, -3.2510986328125, -2.99920654296875, -2.747314453125, -2.49542236328125, -2.2435302734375, -1.99163818359375, -1.73974609375, -1.48785400390625, -1.2359619140625, -0.98406982421875, -0.732177734375, -0.48028564453125, -0.2283935546875, 0.02349853515625, 0.275390625, 0.52728271484375, 0.7791748046875, 1.03106689453125, 1.282958984375, 1.53485107421875, 1.7867431640625, 2.03863525390625, 2.29052734375, 2.54241943359375, 2.7943115234375, 3.04620361328125, 3.298095703125, 3.54998779296875, 3.8018798828125, 4.05377197265625, 4.3056640625, 4.55755615234375, 4.8094482421875, 5.06134033203125, 5.313232421875, 5.56512451171875, 5.8170166015625, 6.06890869140625, 6.32080078125, 6.57269287109375, 6.8245849609375, 7.07647705078125, 7.328369140625, 7.58026123046875, 7.8321533203125, 8.08404541015625, 8.3359375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 6.0, 6.0, 11.0, 4.0, 11.0, 16.0, 20.0, 34.0, 25.0, 25.0, 35.0, 40.0, 47.0, 59.0, 92.0, 133.0, 197.0, 1344.0, 243.0, 149.0, 110.0, 66.0, 62.0, 47.0, 52.0, 33.0, 31.0, 22.0, 17.0, 11.0, 13.0, 12.0, 11.0, 12.0, 8.0, 9.0, 8.0, 6.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8359375, -14.3363037109375, -13.836669921875, -13.3370361328125, -12.83740234375, -12.3377685546875, -11.838134765625, -11.3385009765625, -10.8388671875, -10.3392333984375, -9.839599609375, -9.3399658203125, -8.84033203125, -8.3406982421875, -7.841064453125, -7.3414306640625, -6.841796875, -6.3421630859375, -5.842529296875, -5.3428955078125, -4.84326171875, -4.3436279296875, -3.843994140625, -3.3443603515625, -2.8447265625, -2.3450927734375, -1.845458984375, -1.3458251953125, -0.84619140625, -0.3465576171875, 0.153076171875, 0.6527099609375, 1.15234375, 1.6519775390625, 2.151611328125, 2.6512451171875, 3.15087890625, 3.6505126953125, 4.150146484375, 4.6497802734375, 5.1494140625, 5.6490478515625, 6.148681640625, 6.6483154296875, 7.14794921875, 7.6475830078125, 8.147216796875, 8.6468505859375, 9.146484375, 9.6461181640625, 10.145751953125, 10.6453857421875, 11.14501953125, 11.6446533203125, 12.144287109375, 12.6439208984375, 13.1435546875, 13.6431884765625, 14.142822265625, 14.6424560546875, 15.14208984375, 15.6417236328125, 16.141357421875, 16.6409912109375, 17.140625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 5.0, 10.0, 13.0, 20.0, 20.0, 32.0, 35.0, 26.0, 86.0, 96.0, 119.0, 172.0, 249.0, 377.0, 703.0, 1640.0, 15537.0, 3070729.0, 51364.0, 2179.0, 767.0, 473.0, 315.0, 208.0, 147.0, 94.0, 76.0, 56.0, 42.0, 35.0, 9.0, 15.0, 12.0, 10.0, 9.0, 4.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-53.84375, -52.28857421875, -50.7333984375, -49.17822265625, -47.623046875, -46.06787109375, -44.5126953125, -42.95751953125, -41.40234375, -39.84716796875, -38.2919921875, -36.73681640625, -35.181640625, -33.62646484375, -32.0712890625, -30.51611328125, -28.9609375, -27.40576171875, -25.8505859375, -24.29541015625, -22.740234375, -21.18505859375, -19.6298828125, -18.07470703125, -16.51953125, -14.96435546875, -13.4091796875, -11.85400390625, -10.298828125, -8.74365234375, -7.1884765625, -5.63330078125, -4.078125, -2.52294921875, -0.9677734375, 0.58740234375, 2.142578125, 3.69775390625, 5.2529296875, 6.80810546875, 8.36328125, 9.91845703125, 11.4736328125, 13.02880859375, 14.583984375, 16.13916015625, 17.6943359375, 19.24951171875, 20.8046875, 22.35986328125, 23.9150390625, 25.47021484375, 27.025390625, 28.58056640625, 30.1357421875, 31.69091796875, 33.24609375, 34.80126953125, 36.3564453125, 37.91162109375, 39.466796875, 41.02197265625, 42.5771484375, 44.13232421875, 45.6875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 8.0, 12.0, 53.0, 131.0, 247.0, 243.0, 196.0, 83.0, 27.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.53330993652344, -184.6287384033203, -180.7241668701172, -176.81961059570312, -172.9150390625, -169.01046752929688, -165.10589599609375, -161.20132446289062, -157.2967529296875, -153.39218139648438, -149.48760986328125, -145.58303833007812, -141.67848205566406, -137.77391052246094, -133.8693389892578, -129.9647674560547, -126.0602035522461, -122.15563201904297, -118.25106811523438, -114.34649658203125, -110.44192504882812, -106.537353515625, -102.6327896118164, -98.72821807861328, -94.82365417480469, -90.91908264160156, -87.01451873779297, -83.10994720458984, -79.20537567138672, -75.30081176757812, -71.396240234375, -67.49166870117188, -63.587100982666016, -59.682533264160156, -55.77796173095703, -51.87339401245117, -47.96882629394531, -44.06425476074219, -40.15968704223633, -36.25511932373047, -32.350547790527344, -28.44597816467285, -24.54140853881836, -20.6368408203125, -16.732271194458008, -12.827701568603516, -8.923133850097656, -5.018564224243164, -1.1139945983886719, 2.790574550628662, 6.695143699645996, 10.599712371826172, 14.504281997680664, 18.408851623535156, 22.313419342041016, 26.217988967895508, 30.12255859375, 34.02712631225586, 37.931697845458984, 41.836265563964844, 45.74083709716797, 49.64540481567383, 53.54997253417969, 57.45454406738281, 61.35911178588867]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 2.0, 3.0, 6.0, 9.0, 4.0, 6.0, 15.0, 6.0, 17.0, 13.0, 28.0, 20.0, 24.0, 31.0, 23.0, 41.0, 26.0, 37.0, 45.0, 43.0, 42.0, 47.0, 50.0, 47.0, 40.0, 39.0, 32.0, 35.0, 38.0, 33.0, 30.0, 27.0, 19.0, 21.0, 14.0, 19.0, 10.0, 14.0, 7.0, 12.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.64940643310547, -48.09418869018555, -46.538970947265625, -44.9837532043457, -43.42853546142578, -41.87331771850586, -40.31809997558594, -38.762882232666016, -37.207664489746094, -35.65244674682617, -34.09722900390625, -32.54201126098633, -30.986793518066406, -29.431575775146484, -27.876358032226562, -26.32114028930664, -24.76592445373535, -23.21070671081543, -21.655488967895508, -20.100271224975586, -18.545053482055664, -16.989835739135742, -15.434618949890137, -13.879401206970215, -12.324183464050293, -10.768965721130371, -9.21374797821045, -7.6585307121276855, -6.103312969207764, -4.548095226287842, -2.992877960205078, -1.4376602172851562, 0.11755752563476562, 1.672775149345398, 3.2279927730560303, 4.783210277557373, 6.338428020477295, 7.893645763397217, 9.44886302947998, 11.004080772399902, 12.559298515319824, 14.114516258239746, 15.669734001159668, 17.224950790405273, 18.780168533325195, 20.335386276245117, 21.89060401916504, 23.44582176208496, 25.001039505004883, 26.556257247924805, 28.111474990844727, 29.66669273376465, 31.22191047668457, 32.77712631225586, 34.33234405517578, 35.8875617980957, 37.442779541015625, 38.99799728393555, 40.55321502685547, 42.10843276977539, 43.66365051269531, 45.218868255615234, 46.774085998535156, 48.32930374145508, 49.884521484375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 7.0, 8.0, 11.0, 13.0, 18.0, 12.0, 18.0, 26.0, 24.0, 29.0, 25.0, 31.0, 35.0, 34.0, 33.0, 39.0, 42.0, 44.0, 35.0, 44.0, 45.0, 46.0, 38.0, 32.0, 32.0, 35.0, 27.0, 27.0, 22.0, 19.0, 28.0, 12.0, 16.0, 17.0, 17.0, 7.0, 13.0, 9.0, 4.0, 5.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.11328125, -6.89801025390625, -6.6827392578125, -6.46746826171875, -6.252197265625, -6.03692626953125, -5.8216552734375, -5.60638427734375, -5.39111328125, -5.17584228515625, -4.9605712890625, -4.74530029296875, -4.530029296875, -4.31475830078125, -4.0994873046875, -3.88421630859375, -3.6689453125, -3.45367431640625, -3.2384033203125, -3.02313232421875, -2.807861328125, -2.59259033203125, -2.3773193359375, -2.16204833984375, -1.94677734375, -1.73150634765625, -1.5162353515625, -1.30096435546875, -1.085693359375, -0.87042236328125, -0.6551513671875, -0.43988037109375, -0.224609375, -0.00933837890625, 0.2059326171875, 0.42120361328125, 0.636474609375, 0.85174560546875, 1.0670166015625, 1.28228759765625, 1.49755859375, 1.71282958984375, 1.9281005859375, 2.14337158203125, 2.358642578125, 2.57391357421875, 2.7891845703125, 3.00445556640625, 3.2197265625, 3.43499755859375, 3.6502685546875, 3.86553955078125, 4.080810546875, 4.29608154296875, 4.5113525390625, 4.72662353515625, 4.94189453125, 5.15716552734375, 5.3724365234375, 5.58770751953125, 5.802978515625, 6.01824951171875, 6.2335205078125, 6.44879150390625, 6.6640625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 8.0, 5.0, 12.0, 18.0, 19.0, 32.0, 34.0, 53.0, 93.0, 147.0, 184.0, 290.0, 430.0, 691.0, 1142.0, 1863.0, 3246.0, 6740.0, 16228.0, 59462.0, 469919.0, 2377109.0, 1086532.0, 125069.0, 25302.0, 9304.0, 4333.0, 2339.0, 1331.0, 796.0, 524.0, 326.0, 231.0, 149.0, 86.0, 75.0, 56.0, 29.0, 23.0, 14.0, 16.0, 10.0, 7.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.671875, -13.195556640625, -12.71923828125, -12.242919921875, -11.7666015625, -11.290283203125, -10.81396484375, -10.337646484375, -9.861328125, -9.385009765625, -8.90869140625, -8.432373046875, -7.9560546875, -7.479736328125, -7.00341796875, -6.527099609375, -6.05078125, -5.574462890625, -5.09814453125, -4.621826171875, -4.1455078125, -3.669189453125, -3.19287109375, -2.716552734375, -2.240234375, -1.763916015625, -1.28759765625, -0.811279296875, -0.3349609375, 0.141357421875, 0.61767578125, 1.093994140625, 1.5703125, 2.046630859375, 2.52294921875, 2.999267578125, 3.4755859375, 3.951904296875, 4.42822265625, 4.904541015625, 5.380859375, 5.857177734375, 6.33349609375, 6.809814453125, 7.2861328125, 7.762451171875, 8.23876953125, 8.715087890625, 9.19140625, 9.667724609375, 10.14404296875, 10.620361328125, 11.0966796875, 11.572998046875, 12.04931640625, 12.525634765625, 13.001953125, 13.478271484375, 13.95458984375, 14.430908203125, 14.9072265625, 15.383544921875, 15.85986328125, 16.336181640625, 16.8125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 5.0, 5.0, 4.0, 16.0, 13.0, 23.0, 32.0, 57.0, 70.0, 118.0, 186.0, 226.0, 331.0, 509.0, 609.0, 524.0, 414.0, 305.0, 202.0, 125.0, 98.0, 58.0, 51.0, 34.0, 22.0, 12.0, 6.0, 11.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0], "bins": [-20.609375, -20.1470947265625, -19.684814453125, -19.2225341796875, -18.76025390625, -18.2979736328125, -17.835693359375, -17.3734130859375, -16.9111328125, -16.4488525390625, -15.986572265625, -15.5242919921875, -15.06201171875, -14.5997314453125, -14.137451171875, -13.6751708984375, -13.212890625, -12.7506103515625, -12.288330078125, -11.8260498046875, -11.36376953125, -10.9014892578125, -10.439208984375, -9.9769287109375, -9.5146484375, -9.0523681640625, -8.590087890625, -8.1278076171875, -7.66552734375, -7.2032470703125, -6.740966796875, -6.2786865234375, -5.81640625, -5.3541259765625, -4.891845703125, -4.4295654296875, -3.96728515625, -3.5050048828125, -3.042724609375, -2.5804443359375, -2.1181640625, -1.6558837890625, -1.193603515625, -0.7313232421875, -0.26904296875, 0.1932373046875, 0.655517578125, 1.1177978515625, 1.580078125, 2.0423583984375, 2.504638671875, 2.9669189453125, 3.42919921875, 3.8914794921875, 4.353759765625, 4.8160400390625, 5.2783203125, 5.7406005859375, 6.202880859375, 6.6651611328125, 7.12744140625, 7.5897216796875, 8.052001953125, 8.5142822265625, 8.9765625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 10.0, 9.0, 24.0, 31.0, 55.0, 83.0, 168.0, 319.0, 687.0, 1815.0, 7866.0, 100618.0, 3501216.0, 557357.0, 18946.0, 3187.0, 985.0, 430.0, 190.0, 115.0, 61.0, 39.0, 29.0, 16.0, 11.0, 6.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.46875, -22.47900390625, -21.4892578125, -20.49951171875, -19.509765625, -18.52001953125, -17.5302734375, -16.54052734375, -15.55078125, -14.56103515625, -13.5712890625, -12.58154296875, -11.591796875, -10.60205078125, -9.6123046875, -8.62255859375, -7.6328125, -6.64306640625, -5.6533203125, -4.66357421875, -3.673828125, -2.68408203125, -1.6943359375, -0.70458984375, 0.28515625, 1.27490234375, 2.2646484375, 3.25439453125, 4.244140625, 5.23388671875, 6.2236328125, 7.21337890625, 8.203125, 9.19287109375, 10.1826171875, 11.17236328125, 12.162109375, 13.15185546875, 14.1416015625, 15.13134765625, 16.12109375, 17.11083984375, 18.1005859375, 19.09033203125, 20.080078125, 21.06982421875, 22.0595703125, 23.04931640625, 24.0390625, 25.02880859375, 26.0185546875, 27.00830078125, 27.998046875, 28.98779296875, 29.9775390625, 30.96728515625, 31.95703125, 32.94677734375, 33.9365234375, 34.92626953125, 35.916015625, 36.90576171875, 37.8955078125, 38.88525390625, 39.875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 80.0, 359.0, 420.0, 127.0, 14.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-401.24871826171875, -393.54583740234375, -385.84295654296875, -378.14007568359375, -370.43719482421875, -362.73431396484375, -355.03143310546875, -347.3285827636719, -339.6257019042969, -331.9228210449219, -324.2199401855469, -316.5170593261719, -308.8141784667969, -301.111328125, -293.408447265625, -285.70556640625, -278.002685546875, -270.2998046875, -262.596923828125, -254.89404296875, -247.19117736816406, -239.48829650878906, -231.78541564941406, -224.08253479003906, -216.379638671875, -208.6767578125, -200.973876953125, -193.27099609375, -185.56813049316406, -177.86524963378906, -170.16236877441406, -162.45948791503906, -154.75662231445312, -147.05374145507812, -139.35086059570312, -131.64797973632812, -123.94511413574219, -116.24223327636719, -108.53935241699219, -100.83647155761719, -93.13360595703125, -85.43072509765625, -77.72785186767578, -70.02497100830078, -62.32209396362305, -54.61921691894531, -46.91633605957031, -39.21345901489258, -31.510581970214844, -23.80770492553711, -16.104825973510742, -8.401947021484375, -0.6990699768066406, 7.003807067871094, 14.706687927246094, 22.409564971923828, 30.112442016601562, 37.8153190612793, 45.51819610595703, 53.22107696533203, 60.923954010009766, 68.6268310546875, 76.3297119140625, 84.0325927734375, 91.73546600341797]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 13.0, 9.0, 21.0, 29.0, 35.0, 25.0, 45.0, 59.0, 45.0, 52.0, 73.0, 77.0, 58.0, 67.0, 61.0, 52.0, 51.0, 64.0, 37.0, 32.0, 19.0, 22.0, 16.0, 12.0, 15.0, 3.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.89328002929688, -64.6712417602539, -62.449195861816406, -60.22715759277344, -58.0051155090332, -55.78307342529297, -53.561031341552734, -51.3389892578125, -49.11695098876953, -46.8949089050293, -44.67286682128906, -42.450828552246094, -40.22878646850586, -38.006744384765625, -35.78470230102539, -33.562660217285156, -31.340618133544922, -29.118576049804688, -26.896535873413086, -24.67449378967285, -22.45245361328125, -20.230411529541016, -18.00836944580078, -15.786328315734863, -13.564287185668945, -11.342246055603027, -9.12020492553711, -6.898162841796875, -4.676121711730957, -2.454080581665039, -0.2320384979248047, 1.9900026321411133, 4.212043762207031, 6.434084892272949, 8.656126022338867, 10.878168106079102, 13.10020923614502, 15.322250366210938, 17.544292449951172, 19.766334533691406, 21.988374710083008, 24.210416793823242, 26.432456970214844, 28.654499053955078, 30.876541137695312, 33.09857940673828, 35.32062530517578, 37.54266357421875, 39.764705657958984, 41.98674774169922, 44.20878982543945, 46.43083190917969, 48.652870178222656, 50.87491226196289, 53.096954345703125, 55.31899642944336, 57.541038513183594, 59.76308059692383, 61.98512268066406, 64.20716094970703, 66.42920684814453, 68.6512451171875, 70.873291015625, 73.09532928466797, 75.31736755371094]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 7.0, 9.0, 14.0, 9.0, 12.0, 17.0, 25.0, 22.0, 27.0, 31.0, 25.0, 40.0, 29.0, 40.0, 49.0, 36.0, 36.0, 46.0, 55.0, 38.0, 42.0, 37.0, 40.0, 34.0, 33.0, 34.0, 33.0, 25.0, 35.0, 22.0, 21.0, 8.0, 17.0, 8.0, 10.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.5859375, -6.3868408203125, -6.187744140625, -5.9886474609375, -5.78955078125, -5.5904541015625, -5.391357421875, -5.1922607421875, -4.9931640625, -4.7940673828125, -4.594970703125, -4.3958740234375, -4.19677734375, -3.9976806640625, -3.798583984375, -3.5994873046875, -3.400390625, -3.2012939453125, -3.002197265625, -2.8031005859375, -2.60400390625, -2.4049072265625, -2.205810546875, -2.0067138671875, -1.8076171875, -1.6085205078125, -1.409423828125, -1.2103271484375, -1.01123046875, -0.8121337890625, -0.613037109375, -0.4139404296875, -0.21484375, -0.0157470703125, 0.183349609375, 0.3824462890625, 0.58154296875, 0.7806396484375, 0.979736328125, 1.1788330078125, 1.3779296875, 1.5770263671875, 1.776123046875, 1.9752197265625, 2.17431640625, 2.3734130859375, 2.572509765625, 2.7716064453125, 2.970703125, 3.1697998046875, 3.368896484375, 3.5679931640625, 3.76708984375, 3.9661865234375, 4.165283203125, 4.3643798828125, 4.5634765625, 4.7625732421875, 4.961669921875, 5.1607666015625, 5.35986328125, 5.5589599609375, 5.758056640625, 5.9571533203125, 6.15625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 6.0, 3.0, 2.0, 7.0, 11.0, 17.0, 20.0, 21.0, 41.0, 58.0, 87.0, 111.0, 181.0, 275.0, 508.0, 998.0, 1927.0, 4110.0, 9266.0, 23270.0, 58565.0, 141246.0, 267866.0, 277974.0, 153327.0, 64135.0, 25278.0, 10320.0, 4474.0, 2019.0, 1017.0, 528.0, 321.0, 156.0, 123.0, 86.0, 59.0, 49.0, 19.0, 22.0, 17.0, 8.0, 12.0, 8.0, 5.0, 0.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.271484375, -1.2318115234375, -1.192138671875, -1.1524658203125, -1.11279296875, -1.0731201171875, -1.033447265625, -0.9937744140625, -0.9541015625, -0.9144287109375, -0.874755859375, -0.8350830078125, -0.79541015625, -0.7557373046875, -0.716064453125, -0.6763916015625, -0.63671875, -0.5970458984375, -0.557373046875, -0.5177001953125, -0.47802734375, -0.4383544921875, -0.398681640625, -0.3590087890625, -0.3193359375, -0.2796630859375, -0.239990234375, -0.2003173828125, -0.16064453125, -0.1209716796875, -0.081298828125, -0.0416259765625, -0.001953125, 0.0377197265625, 0.077392578125, 0.1170654296875, 0.15673828125, 0.1964111328125, 0.236083984375, 0.2757568359375, 0.3154296875, 0.3551025390625, 0.394775390625, 0.4344482421875, 0.47412109375, 0.5137939453125, 0.553466796875, 0.5931396484375, 0.6328125, 0.6724853515625, 0.712158203125, 0.7518310546875, 0.79150390625, 0.8311767578125, 0.870849609375, 0.9105224609375, 0.9501953125, 0.9898681640625, 1.029541015625, 1.0692138671875, 1.10888671875, 1.1485595703125, 1.188232421875, 1.2279052734375, 1.267578125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 5.0, 3.0, 7.0, 13.0, 5.0, 7.0, 25.0, 24.0, 21.0, 18.0, 21.0, 30.0, 28.0, 34.0, 34.0, 44.0, 36.0, 48.0, 51.0, 37.0, 1072.0, 52.0, 45.0, 40.0, 34.0, 34.0, 40.0, 34.0, 39.0, 29.0, 20.0, 17.0, 12.0, 19.0, 18.0, 5.0, 4.0, 6.0, 1.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0625, -4.9146728515625, -4.766845703125, -4.6190185546875, -4.47119140625, -4.3233642578125, -4.175537109375, -4.0277099609375, -3.8798828125, -3.7320556640625, -3.584228515625, -3.4364013671875, -3.28857421875, -3.1407470703125, -2.992919921875, -2.8450927734375, -2.697265625, -2.5494384765625, -2.401611328125, -2.2537841796875, -2.10595703125, -1.9581298828125, -1.810302734375, -1.6624755859375, -1.5146484375, -1.3668212890625, -1.218994140625, -1.0711669921875, -0.92333984375, -0.7755126953125, -0.627685546875, -0.4798583984375, -0.33203125, -0.1842041015625, -0.036376953125, 0.1114501953125, 0.25927734375, 0.4071044921875, 0.554931640625, 0.7027587890625, 0.8505859375, 0.9984130859375, 1.146240234375, 1.2940673828125, 1.44189453125, 1.5897216796875, 1.737548828125, 1.8853759765625, 2.033203125, 2.1810302734375, 2.328857421875, 2.4766845703125, 2.62451171875, 2.7723388671875, 2.920166015625, 3.0679931640625, 3.2158203125, 3.3636474609375, 3.511474609375, 3.6593017578125, 3.80712890625, 3.9549560546875, 4.102783203125, 4.2506103515625, 4.3984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 7.0, 10.0, 15.0, 8.0, 25.0, 30.0, 51.0, 97.0, 137.0, 235.0, 345.0, 554.0, 1039.0, 1886.0, 3668.0, 7148.0, 14496.0, 29545.0, 61535.0, 123566.0, 252989.0, 1102921.0, 252580.0, 123442.0, 61009.0, 29921.0, 14438.0, 7148.0, 3684.0, 1938.0, 1079.0, 615.0, 350.0, 209.0, 146.0, 90.0, 54.0, 37.0, 27.0, 20.0, 12.0, 8.0, 6.0, 5.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6484375, -0.6278533935546875, -0.607269287109375, -0.5866851806640625, -0.56610107421875, -0.5455169677734375, -0.524932861328125, -0.5043487548828125, -0.4837646484375, -0.4631805419921875, -0.442596435546875, -0.4220123291015625, -0.40142822265625, -0.3808441162109375, -0.360260009765625, -0.3396759033203125, -0.319091796875, -0.2985076904296875, -0.277923583984375, -0.2573394775390625, -0.23675537109375, -0.2161712646484375, -0.195587158203125, -0.1750030517578125, -0.1544189453125, -0.1338348388671875, -0.113250732421875, -0.0926666259765625, -0.07208251953125, -0.0514984130859375, -0.030914306640625, -0.0103302001953125, 0.01025390625, 0.0308380126953125, 0.051422119140625, 0.0720062255859375, 0.09259033203125, 0.1131744384765625, 0.133758544921875, 0.1543426513671875, 0.1749267578125, 0.1955108642578125, 0.216094970703125, 0.2366790771484375, 0.25726318359375, 0.2778472900390625, 0.298431396484375, 0.3190155029296875, 0.339599609375, 0.3601837158203125, 0.380767822265625, 0.4013519287109375, 0.42193603515625, 0.4425201416015625, 0.463104248046875, 0.4836883544921875, 0.5042724609375, 0.5248565673828125, 0.545440673828125, 0.5660247802734375, 0.58660888671875, 0.6071929931640625, 0.627777099609375, 0.6483612060546875, 0.6689453125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 5.0, 3.0, 3.0, 6.0, 19.0, 17.0, 30.0, 137.0, 524.0, 132.0, 39.0, 14.0, 17.0, 7.0, 9.0, 5.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51025390625, -0.49454498291015625, -0.4788360595703125, -0.46312713623046875, -0.447418212890625, -0.43170928955078125, -0.4160003662109375, -0.40029144287109375, -0.38458251953125, -0.36887359619140625, -0.3531646728515625, -0.33745574951171875, -0.321746826171875, -0.30603790283203125, -0.2903289794921875, -0.27462005615234375, -0.2589111328125, -0.24320220947265625, -0.2274932861328125, -0.21178436279296875, -0.196075439453125, -0.18036651611328125, -0.1646575927734375, -0.14894866943359375, -0.13323974609375, -0.11753082275390625, -0.1018218994140625, -0.08611297607421875, -0.070404052734375, -0.05469512939453125, -0.0389862060546875, -0.02327728271484375, -0.007568359375, 0.00814056396484375, 0.0238494873046875, 0.03955841064453125, 0.055267333984375, 0.07097625732421875, 0.0866851806640625, 0.10239410400390625, 0.11810302734375, 0.13381195068359375, 0.1495208740234375, 0.16522979736328125, 0.180938720703125, 0.19664764404296875, 0.2123565673828125, 0.22806549072265625, 0.2437744140625, 0.25948333740234375, 0.2751922607421875, 0.29090118408203125, 0.306610107421875, 0.32231903076171875, 0.3380279541015625, 0.35373687744140625, 0.36944580078125, 0.38515472412109375, 0.4008636474609375, 0.41657257080078125, 0.432281494140625, 0.44799041748046875, 0.4636993408203125, 0.47940826416015625, 0.4951171875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 3.0, 6.0, 8.0, 13.0, 31.0, 30.0, 29.0, 41.0, 64.0, 177.0, 950.0, 9357.0, 1029628.0, 7042.0, 757.0, 139.0, 71.0, 35.0, 33.0, 29.0, 23.0, 17.0, 9.0, 9.0, 3.0, 5.0, 1.0, 5.0, 1.0, 3.0, 2.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.3046875, -8.0487060546875, -7.792724609375, -7.5367431640625, -7.28076171875, -7.0247802734375, -6.768798828125, -6.5128173828125, -6.2568359375, -6.0008544921875, -5.744873046875, -5.4888916015625, -5.23291015625, -4.9769287109375, -4.720947265625, -4.4649658203125, -4.208984375, -3.9530029296875, -3.697021484375, -3.4410400390625, -3.18505859375, -2.9290771484375, -2.673095703125, -2.4171142578125, -2.1611328125, -1.9051513671875, -1.649169921875, -1.3931884765625, -1.13720703125, -0.8812255859375, -0.625244140625, -0.3692626953125, -0.11328125, 0.1427001953125, 0.398681640625, 0.6546630859375, 0.91064453125, 1.1666259765625, 1.422607421875, 1.6785888671875, 1.9345703125, 2.1905517578125, 2.446533203125, 2.7025146484375, 2.95849609375, 3.2144775390625, 3.470458984375, 3.7264404296875, 3.982421875, 4.2384033203125, 4.494384765625, 4.7503662109375, 5.00634765625, 5.2623291015625, 5.518310546875, 5.7742919921875, 6.0302734375, 6.2862548828125, 6.542236328125, 6.7982177734375, 7.05419921875, 7.3101806640625, 7.566162109375, 7.8221435546875, 8.078125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 15.0, 44.0, 201.0, 488.0, 163.0, 53.0, 22.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.724366545677185, -1.6827110052108765, -1.6410554647445679, -1.5994000434875488, -1.5577445030212402, -1.5160889625549316, -1.474433422088623, -1.4327778816223145, -1.3911224603652954, -1.3494669198989868, -1.3078113794326782, -1.2661559581756592, -1.2245004177093506, -1.182844877243042, -1.1411893367767334, -1.0995337963104248, -1.0578782558441162, -1.0162227153778076, -0.9745672345161438, -0.9329116940498352, -0.8912562131881714, -0.8496006727218628, -0.8079451322555542, -0.7662896513938904, -0.7246341705322266, -0.682978630065918, -0.6413231492042542, -0.5996676087379456, -0.5580121278762817, -0.5163565874099731, -0.47470107674598694, -0.43304556608200073, -0.39139002561569214, -0.34973451495170593, -0.3080790042877197, -0.26642346382141113, -0.22476796805858612, -0.18311245739459991, -0.14145693182945251, -0.09980142116546631, -0.0581459105014801, -0.016490396112203598, 0.025165118277072906, 0.06682063639163971, 0.10847614705562592, 0.15013165771961212, 0.19178718328475952, 0.23344269394874573, 0.27509820461273193, 0.31675371527671814, 0.35840922594070435, 0.40006476640701294, 0.44172024726867676, 0.48337578773498535, 0.525031328201294, 0.5666868090629578, 0.6083422899246216, 0.6499978303909302, 0.691653311252594, 0.7333088517189026, 0.7749643325805664, 0.816619873046875, 0.8582754135131836, 0.8999308943748474, 0.941586434841156]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 3.0, 6.0, 2.0, 5.0, 3.0, 10.0, 8.0, 6.0, 10.0, 13.0, 14.0, 13.0, 10.0, 16.0, 19.0, 23.0, 25.0, 26.0, 28.0, 40.0, 32.0, 37.0, 39.0, 43.0, 41.0, 36.0, 31.0, 42.0, 31.0, 56.0, 29.0, 31.0, 23.0, 30.0, 33.0, 25.0, 25.0, 24.0, 25.0, 19.0, 12.0, 13.0, 11.0, 8.0, 10.0, 4.0, 3.0, 4.0, 7.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.3022770285606384, -0.29198208451271057, -0.2816871702671051, -0.27139222621917725, -0.2610972821712494, -0.2508023679256439, -0.24050742387771606, -0.2302124947309494, -0.21991756558418274, -0.20962263643741608, -0.19932769238948822, -0.18903276324272156, -0.1787378340959549, -0.16844290494918823, -0.15814796090126038, -0.1478530317544937, -0.13755808770656586, -0.1272631585597992, -0.11696822196245193, -0.10667328536510468, -0.09637835621833801, -0.08608341962099075, -0.0757884830236435, -0.06549355387687683, -0.05519861727952957, -0.04490368440747261, -0.03460875153541565, -0.02431381493806839, -0.014018882066011429, -0.0037239491939544678, 0.006570987403392792, 0.016865916550159454, 0.027160853147506714, 0.037455786019563675, 0.047750718891620636, 0.058045655488967896, 0.06834058463573456, 0.07863552123308182, 0.08893045783042908, 0.09922538697719574, 0.109520323574543, 0.11981526017189026, 0.13011018931865692, 0.14040511846542358, 0.15070006251335144, 0.1609949916601181, 0.17128992080688477, 0.18158486485481262, 0.19187979400157928, 0.20217472314834595, 0.2124696671962738, 0.22276459634304047, 0.23305952548980713, 0.24335446953773499, 0.25364941358566284, 0.2639443278312683, 0.27423927187919617, 0.284534215927124, 0.2948291301727295, 0.30512407422065735, 0.3154190182685852, 0.3257139325141907, 0.33600887656211853, 0.3463038206100464, 0.35659873485565186]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 12.0, 8.0, 8.0, 10.0, 14.0, 15.0, 17.0, 21.0, 28.0, 23.0, 25.0, 30.0, 40.0, 37.0, 36.0, 25.0, 39.0, 37.0, 41.0, 54.0, 36.0, 39.0, 50.0, 34.0, 42.0, 26.0, 26.0, 30.0, 28.0, 26.0, 25.0, 22.0, 16.0, 17.0, 12.0, 11.0, 11.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-6.34765625, -6.1614990234375, -5.975341796875, -5.7891845703125, -5.60302734375, -5.4168701171875, -5.230712890625, -5.0445556640625, -4.8583984375, -4.6722412109375, -4.486083984375, -4.2999267578125, -4.11376953125, -3.9276123046875, -3.741455078125, -3.5552978515625, -3.369140625, -3.1829833984375, -2.996826171875, -2.8106689453125, -2.62451171875, -2.4383544921875, -2.252197265625, -2.0660400390625, -1.8798828125, -1.6937255859375, -1.507568359375, -1.3214111328125, -1.13525390625, -0.9490966796875, -0.762939453125, -0.5767822265625, -0.390625, -0.2044677734375, -0.018310546875, 0.1678466796875, 0.35400390625, 0.5401611328125, 0.726318359375, 0.9124755859375, 1.0986328125, 1.2847900390625, 1.470947265625, 1.6571044921875, 1.84326171875, 2.0294189453125, 2.215576171875, 2.4017333984375, 2.587890625, 2.7740478515625, 2.960205078125, 3.1463623046875, 3.33251953125, 3.5186767578125, 3.704833984375, 3.8909912109375, 4.0771484375, 4.2633056640625, 4.449462890625, 4.6356201171875, 4.82177734375, 5.0079345703125, 5.194091796875, 5.3802490234375, 5.56640625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 6.0, 11.0, 4.0, 11.0, 21.0, 35.0, 48.0, 51.0, 55.0, 80.0, 121.0, 161.0, 254.0, 370.0, 613.0, 1158.0, 2060.0, 4215.0, 9576.0, 26588.0, 91104.0, 327324.0, 401780.0, 125121.0, 34917.0, 12011.0, 5075.0, 2441.0, 1244.0, 689.0, 453.0, 303.0, 179.0, 127.0, 86.0, 60.0, 51.0, 36.0, 28.0, 22.0, 21.0, 14.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.4375, -7.2059326171875, -6.974365234375, -6.7427978515625, -6.51123046875, -6.2796630859375, -6.048095703125, -5.8165283203125, -5.5849609375, -5.3533935546875, -5.121826171875, -4.8902587890625, -4.65869140625, -4.4271240234375, -4.195556640625, -3.9639892578125, -3.732421875, -3.5008544921875, -3.269287109375, -3.0377197265625, -2.80615234375, -2.5745849609375, -2.343017578125, -2.1114501953125, -1.8798828125, -1.6483154296875, -1.416748046875, -1.1851806640625, -0.95361328125, -0.7220458984375, -0.490478515625, -0.2589111328125, -0.02734375, 0.2042236328125, 0.435791015625, 0.6673583984375, 0.89892578125, 1.1304931640625, 1.362060546875, 1.5936279296875, 1.8251953125, 2.0567626953125, 2.288330078125, 2.5198974609375, 2.75146484375, 2.9830322265625, 3.214599609375, 3.4461669921875, 3.677734375, 3.9093017578125, 4.140869140625, 4.3724365234375, 4.60400390625, 4.8355712890625, 5.067138671875, 5.2987060546875, 5.5302734375, 5.7618408203125, 5.993408203125, 6.2249755859375, 6.45654296875, 6.6881103515625, 6.919677734375, 7.1512451171875, 7.3828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 8.0, 12.0, 11.0, 10.0, 16.0, 30.0, 33.0, 29.0, 38.0, 50.0, 50.0, 81.0, 109.0, 286.0, 1561.0, 247.0, 120.0, 64.0, 52.0, 47.0, 35.0, 25.0, 37.0, 39.0, 17.0, 11.0, 9.0, 2.0, 5.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.421875, -19.79248046875, -19.1630859375, -18.53369140625, -17.904296875, -17.27490234375, -16.6455078125, -16.01611328125, -15.38671875, -14.75732421875, -14.1279296875, -13.49853515625, -12.869140625, -12.23974609375, -11.6103515625, -10.98095703125, -10.3515625, -9.72216796875, -9.0927734375, -8.46337890625, -7.833984375, -7.20458984375, -6.5751953125, -5.94580078125, -5.31640625, -4.68701171875, -4.0576171875, -3.42822265625, -2.798828125, -2.16943359375, -1.5400390625, -0.91064453125, -0.28125, 0.34814453125, 0.9775390625, 1.60693359375, 2.236328125, 2.86572265625, 3.4951171875, 4.12451171875, 4.75390625, 5.38330078125, 6.0126953125, 6.64208984375, 7.271484375, 7.90087890625, 8.5302734375, 9.15966796875, 9.7890625, 10.41845703125, 11.0478515625, 11.67724609375, 12.306640625, 12.93603515625, 13.5654296875, 14.19482421875, 14.82421875, 15.45361328125, 16.0830078125, 16.71240234375, 17.341796875, 17.97119140625, 18.6005859375, 19.22998046875, 19.859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 7.0, 14.0, 14.0, 18.0, 24.0, 34.0, 38.0, 58.0, 60.0, 82.0, 116.0, 206.0, 294.0, 527.0, 1200.0, 7686.0, 2068959.0, 1057835.0, 5851.0, 1151.0, 490.0, 286.0, 180.0, 156.0, 83.0, 81.0, 54.0, 36.0, 30.0, 24.0, 17.0, 18.0, 16.0, 10.0, 2.0, 6.0, 6.0, 6.0, 3.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-24.8125, -24.010986328125, -23.20947265625, -22.407958984375, -21.6064453125, -20.804931640625, -20.00341796875, -19.201904296875, -18.400390625, -17.598876953125, -16.79736328125, -15.995849609375, -15.1943359375, -14.392822265625, -13.59130859375, -12.789794921875, -11.98828125, -11.186767578125, -10.38525390625, -9.583740234375, -8.7822265625, -7.980712890625, -7.17919921875, -6.377685546875, -5.576171875, -4.774658203125, -3.97314453125, -3.171630859375, -2.3701171875, -1.568603515625, -0.76708984375, 0.034423828125, 0.8359375, 1.637451171875, 2.43896484375, 3.240478515625, 4.0419921875, 4.843505859375, 5.64501953125, 6.446533203125, 7.248046875, 8.049560546875, 8.85107421875, 9.652587890625, 10.4541015625, 11.255615234375, 12.05712890625, 12.858642578125, 13.66015625, 14.461669921875, 15.26318359375, 16.064697265625, 16.8662109375, 17.667724609375, 18.46923828125, 19.270751953125, 20.072265625, 20.873779296875, 21.67529296875, 22.476806640625, 23.2783203125, 24.079833984375, 24.88134765625, 25.682861328125, 26.484375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 21.0, 110.0, 321.0, 409.0, 127.0, 22.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-156.1680145263672, -152.91795349121094, -149.66787719726562, -146.41781616210938, -143.16775512695312, -139.9176788330078, -136.66761779785156, -133.41754150390625, -130.16748046875, -126.91741180419922, -123.66734313964844, -120.41728210449219, -117.1672134399414, -113.91714477539062, -110.66708374023438, -107.4170150756836, -104.16694641113281, -100.91687774658203, -97.66680908203125, -94.416748046875, -91.16667938232422, -87.91661071777344, -84.66654968261719, -81.4164810180664, -78.16641235351562, -74.91634368896484, -71.66627502441406, -68.41621398925781, -65.16614532470703, -61.91607666015625, -58.666011810302734, -55.41594696044922, -52.16587448120117, -48.915809631347656, -45.665740966796875, -42.415672302246094, -39.16560745239258, -35.91554260253906, -32.66547393798828, -29.415407180786133, -26.165340423583984, -22.915273666381836, -19.665206909179688, -16.41514015197754, -13.16507339477539, -9.915006637573242, -6.664939880371094, -3.4148731231689453, -0.16480636596679688, 3.0852603912353516, 6.3353271484375, 9.585393905639648, 12.835460662841797, 16.085527420043945, 19.335594177246094, 22.585660934448242, 25.83572769165039, 29.08579444885254, 32.33586120605469, 35.58592987060547, 38.835994720458984, 42.0860595703125, 45.33612823486328, 48.58619689941406, 51.83626174926758]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 10.0, 10.0, 7.0, 16.0, 16.0, 14.0, 16.0, 25.0, 12.0, 27.0, 21.0, 25.0, 31.0, 31.0, 26.0, 25.0, 35.0, 43.0, 52.0, 37.0, 29.0, 31.0, 34.0, 39.0, 31.0, 44.0, 32.0, 52.0, 26.0, 26.0, 20.0, 25.0, 10.0, 23.0, 17.0, 10.0, 10.0, 10.0, 14.0, 7.0, 8.0, 6.0, 3.0, 9.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.69558334350586, -33.70706558227539, -32.718544006347656, -31.730026245117188, -30.74150848388672, -29.752988815307617, -28.764469146728516, -27.775951385498047, -26.787431716918945, -25.798912048339844, -24.810394287109375, -23.821874618530273, -22.833354949951172, -21.844837188720703, -20.8563175201416, -19.8677978515625, -18.87928009033203, -17.89076042175293, -16.90224266052246, -15.91372299194336, -14.925204277038574, -13.936685562133789, -12.948165893554688, -11.959647178649902, -10.971128463745117, -9.982609748840332, -8.994091033935547, -8.005571365356445, -7.01705265045166, -6.028533935546875, -5.040014743804932, -4.051495552062988, -3.062976837158203, -2.074457883834839, -1.0859389305114746, -0.09741997718811035, 0.8910989761352539, 1.879617691040039, 2.8681368827819824, 3.856656074523926, 4.845174789428711, 5.833693504333496, 6.8222126960754395, 7.810731887817383, 8.799250602722168, 9.787769317626953, 10.776288986206055, 11.76480770111084, 12.753326416015625, 13.74184513092041, 14.730363845825195, 15.718883514404297, 16.707401275634766, 17.695920944213867, 18.68444061279297, 19.672958374023438, 20.66147804260254, 21.64999771118164, 22.63851547241211, 23.62703514099121, 24.615554809570312, 25.60407257080078, 26.592592239379883, 27.581111907958984, 28.569629669189453]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 8.0, 7.0, 8.0, 9.0, 9.0, 19.0, 16.0, 19.0, 24.0, 25.0, 35.0, 39.0, 27.0, 36.0, 44.0, 28.0, 35.0, 42.0, 47.0, 43.0, 55.0, 31.0, 45.0, 32.0, 39.0, 41.0, 32.0, 22.0, 31.0, 29.0, 23.0, 24.0, 21.0, 11.0, 9.0, 14.0, 7.0, 3.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.58984375, -7.36126708984375, -7.1326904296875, -6.90411376953125, -6.675537109375, -6.44696044921875, -6.2183837890625, -5.98980712890625, -5.76123046875, -5.53265380859375, -5.3040771484375, -5.07550048828125, -4.846923828125, -4.61834716796875, -4.3897705078125, -4.16119384765625, -3.9326171875, -3.70404052734375, -3.4754638671875, -3.24688720703125, -3.018310546875, -2.78973388671875, -2.5611572265625, -2.33258056640625, -2.10400390625, -1.87542724609375, -1.6468505859375, -1.41827392578125, -1.189697265625, -0.96112060546875, -0.7325439453125, -0.50396728515625, -0.275390625, -0.04681396484375, 0.1817626953125, 0.41033935546875, 0.638916015625, 0.86749267578125, 1.0960693359375, 1.32464599609375, 1.55322265625, 1.78179931640625, 2.0103759765625, 2.23895263671875, 2.467529296875, 2.69610595703125, 2.9246826171875, 3.15325927734375, 3.3818359375, 3.61041259765625, 3.8389892578125, 4.06756591796875, 4.296142578125, 4.52471923828125, 4.7532958984375, 4.98187255859375, 5.21044921875, 5.43902587890625, 5.6676025390625, 5.89617919921875, 6.124755859375, 6.35333251953125, 6.5819091796875, 6.81048583984375, 7.0390625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 12.0, 17.0, 30.0, 31.0, 40.0, 75.0, 93.0, 122.0, 186.0, 267.0, 385.0, 629.0, 1080.0, 2178.0, 5934.0, 28926.0, 505629.0, 3296177.0, 319673.0, 22594.0, 5219.0, 2039.0, 1055.0, 567.0, 402.0, 291.0, 183.0, 145.0, 87.0, 50.0, 34.0, 32.0, 24.0, 27.0, 9.0, 3.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.0625, -29.106201171875, -28.14990234375, -27.193603515625, -26.2373046875, -25.281005859375, -24.32470703125, -23.368408203125, -22.412109375, -21.455810546875, -20.49951171875, -19.543212890625, -18.5869140625, -17.630615234375, -16.67431640625, -15.718017578125, -14.76171875, -13.805419921875, -12.84912109375, -11.892822265625, -10.9365234375, -9.980224609375, -9.02392578125, -8.067626953125, -7.111328125, -6.155029296875, -5.19873046875, -4.242431640625, -3.2861328125, -2.329833984375, -1.37353515625, -0.417236328125, 0.5390625, 1.495361328125, 2.45166015625, 3.407958984375, 4.3642578125, 5.320556640625, 6.27685546875, 7.233154296875, 8.189453125, 9.145751953125, 10.10205078125, 11.058349609375, 12.0146484375, 12.970947265625, 13.92724609375, 14.883544921875, 15.83984375, 16.796142578125, 17.75244140625, 18.708740234375, 19.6650390625, 20.621337890625, 21.57763671875, 22.533935546875, 23.490234375, 24.446533203125, 25.40283203125, 26.359130859375, 27.3154296875, 28.271728515625, 29.22802734375, 30.184326171875, 31.140625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 11.0, 8.0, 10.0, 31.0, 32.0, 45.0, 62.0, 87.0, 141.0, 196.0, 269.0, 373.0, 451.0, 484.0, 458.0, 362.0, 291.0, 229.0, 147.0, 121.0, 70.0, 71.0, 42.0, 22.0, 16.0, 5.0, 9.0, 9.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.265625, -15.845703125, -15.42578125, -15.005859375, -14.5859375, -14.166015625, -13.74609375, -13.326171875, -12.90625, -12.486328125, -12.06640625, -11.646484375, -11.2265625, -10.806640625, -10.38671875, -9.966796875, -9.546875, -9.126953125, -8.70703125, -8.287109375, -7.8671875, -7.447265625, -7.02734375, -6.607421875, -6.1875, -5.767578125, -5.34765625, -4.927734375, -4.5078125, -4.087890625, -3.66796875, -3.248046875, -2.828125, -2.408203125, -1.98828125, -1.568359375, -1.1484375, -0.728515625, -0.30859375, 0.111328125, 0.53125, 0.951171875, 1.37109375, 1.791015625, 2.2109375, 2.630859375, 3.05078125, 3.470703125, 3.890625, 4.310546875, 4.73046875, 5.150390625, 5.5703125, 5.990234375, 6.41015625, 6.830078125, 7.25, 7.669921875, 8.08984375, 8.509765625, 8.9296875, 9.349609375, 9.76953125, 10.189453125, 10.609375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 7.0, 15.0, 30.0, 67.0, 171.0, 445.0, 1230.0, 3949.0, 15338.0, 86057.0, 738779.0, 2719830.0, 543105.0, 67437.0, 12704.0, 3435.0, 1032.0, 359.0, 172.0, 52.0, 35.0, 15.0, 7.0, 4.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.85205078125, -15.3134765625, -14.77490234375, -14.236328125, -13.69775390625, -13.1591796875, -12.62060546875, -12.08203125, -11.54345703125, -11.0048828125, -10.46630859375, -9.927734375, -9.38916015625, -8.8505859375, -8.31201171875, -7.7734375, -7.23486328125, -6.6962890625, -6.15771484375, -5.619140625, -5.08056640625, -4.5419921875, -4.00341796875, -3.46484375, -2.92626953125, -2.3876953125, -1.84912109375, -1.310546875, -0.77197265625, -0.2333984375, 0.30517578125, 0.84375, 1.38232421875, 1.9208984375, 2.45947265625, 2.998046875, 3.53662109375, 4.0751953125, 4.61376953125, 5.15234375, 5.69091796875, 6.2294921875, 6.76806640625, 7.306640625, 7.84521484375, 8.3837890625, 8.92236328125, 9.4609375, 9.99951171875, 10.5380859375, 11.07666015625, 11.615234375, 12.15380859375, 12.6923828125, 13.23095703125, 13.76953125, 14.30810546875, 14.8466796875, 15.38525390625, 15.923828125, 16.46240234375, 17.0009765625, 17.53955078125, 18.078125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 7.0, 15.0, 22.0, 27.0, 40.0, 54.0, 67.0, 79.0, 82.0, 105.0, 102.0, 95.0, 67.0, 62.0, 57.0, 33.0, 22.0, 23.0, 9.0, 11.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.50143432617188, -125.43001556396484, -122.35859680175781, -119.28717803955078, -116.21575927734375, -113.14434051513672, -110.07292175292969, -107.00150299072266, -103.93008422851562, -100.8586654663086, -97.78724670410156, -94.71582794189453, -91.6444091796875, -88.57299041748047, -85.50157165527344, -82.4301528930664, -79.35873413085938, -76.28731536865234, -73.21589660644531, -70.14447784423828, -67.07305908203125, -64.00164031982422, -60.93022155761719, -57.858802795410156, -54.787384033203125, -51.715965270996094, -48.64454650878906, -45.57312774658203, -42.501708984375, -39.43029022216797, -36.35887145996094, -33.287452697753906, -30.216041564941406, -27.144622802734375, -24.073204040527344, -21.001785278320312, -17.93036651611328, -14.85894775390625, -11.787528991699219, -8.716110229492188, -5.644691467285156, -2.573272705078125, 0.49814605712890625, 3.5695648193359375, 6.640983581542969, 9.71240234375, 12.783821105957031, 15.855239868164062, 18.926658630371094, 21.998077392578125, 25.069496154785156, 28.140914916992188, 31.21233367919922, 34.28375244140625, 37.35517120361328, 40.42658996582031, 43.498008728027344, 46.569427490234375, 49.640846252441406, 52.71226501464844, 55.78368377685547, 58.8551025390625, 61.92652130126953, 64.99794006347656, 68.0693588256836]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 11.0, 7.0, 7.0, 8.0, 7.0, 7.0, 8.0, 23.0, 24.0, 24.0, 29.0, 34.0, 28.0, 23.0, 28.0, 26.0, 30.0, 29.0, 44.0, 55.0, 52.0, 33.0, 50.0, 45.0, 34.0, 37.0, 37.0, 34.0, 28.0, 32.0, 15.0, 26.0, 18.0, 19.0, 15.0, 13.0, 11.0, 11.0, 12.0, 8.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-46.92509078979492, -45.40594482421875, -43.88679504394531, -42.367645263671875, -40.8484992980957, -39.32935333251953, -37.810203552246094, -36.291053771972656, -34.771907806396484, -33.25276184082031, -31.733612060546875, -30.21446418762207, -28.695316314697266, -27.17616844177246, -25.657020568847656, -24.13787269592285, -22.618724822998047, -21.099576950073242, -19.580429077148438, -18.061281204223633, -16.542133331298828, -15.022985458374023, -13.503837585449219, -11.984689712524414, -10.46554183959961, -8.946393966674805, -7.42724609375, -5.908098220825195, -4.388950347900391, -2.869802474975586, -1.3506546020507812, 0.16849327087402344, 1.6876411437988281, 3.206789016723633, 4.7259368896484375, 6.245084762573242, 7.764232635498047, 9.283380508422852, 10.802528381347656, 12.321676254272461, 13.840824127197266, 15.35997200012207, 16.879119873046875, 18.39826774597168, 19.917415618896484, 21.43656349182129, 22.955711364746094, 24.4748592376709, 25.994007110595703, 27.513154983520508, 29.032302856445312, 30.551450729370117, 32.07059860229492, 33.589744567871094, 35.10889434814453, 36.62804412841797, 38.14719009399414, 39.66633605957031, 41.18548583984375, 42.70463562011719, 44.22378158569336, 45.74292755126953, 47.26207733154297, 48.781227111816406, 50.30037307739258]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 6.0, 8.0, 9.0, 7.0, 9.0, 15.0, 13.0, 23.0, 29.0, 28.0, 32.0, 33.0, 33.0, 32.0, 50.0, 28.0, 37.0, 39.0, 46.0, 50.0, 48.0, 52.0, 45.0, 35.0, 24.0, 31.0, 44.0, 28.0, 27.0, 19.0, 19.0, 17.0, 5.0, 19.0, 13.0, 12.0, 5.0, 9.0, 2.0, 4.0, 1.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-98.9375, -95.7451171875, -92.552734375, -89.3603515625, -86.16796875, -82.9755859375, -79.783203125, -76.5908203125, -73.3984375, -70.2060546875, -67.013671875, -63.8212890625, -60.62890625, -57.4365234375, -54.244140625, -51.0517578125, -47.859375, -44.6669921875, -41.474609375, -38.2822265625, -35.08984375, -31.8974609375, -28.705078125, -25.5126953125, -22.3203125, -19.1279296875, -15.935546875, -12.7431640625, -9.55078125, -6.3583984375, -3.166015625, 0.0263671875, 3.21875, 6.4111328125, 9.603515625, 12.7958984375, 15.98828125, 19.1806640625, 22.373046875, 25.5654296875, 28.7578125, 31.9501953125, 35.142578125, 38.3349609375, 41.52734375, 44.7197265625, 47.912109375, 51.1044921875, 54.296875, 57.4892578125, 60.681640625, 63.8740234375, 67.06640625, 70.2587890625, 73.451171875, 76.6435546875, 79.8359375, 83.0283203125, 86.220703125, 89.4130859375, 92.60546875, 95.7978515625, 98.990234375, 102.1826171875, 105.375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 18.0, 15.0, 21.0, 41.0, 71.0, 106.0, 187.0, 292.0, 452.0, 761.0, 1122.0, 1795.0, 3059.0, 4816.0, 7640.0, 12136.0, 19594.0, 30676.0, 47738.0, 73418.0, 106000.0, 140953.0, 156999.0, 138737.0, 103534.0, 71395.0, 46613.0, 29836.0, 18849.0, 11675.0, 7408.0, 4696.0, 2950.0, 1868.0, 1153.0, 713.0, 484.0, 268.0, 167.0, 112.0, 61.0, 36.0, 32.0, 21.0, 12.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.28515625, -5.12237548828125, -4.9595947265625, -4.79681396484375, -4.634033203125, -4.47125244140625, -4.3084716796875, -4.14569091796875, -3.98291015625, -3.82012939453125, -3.6573486328125, -3.49456787109375, -3.331787109375, -3.16900634765625, -3.0062255859375, -2.84344482421875, -2.6806640625, -2.51788330078125, -2.3551025390625, -2.19232177734375, -2.029541015625, -1.86676025390625, -1.7039794921875, -1.54119873046875, -1.37841796875, -1.21563720703125, -1.0528564453125, -0.89007568359375, -0.727294921875, -0.56451416015625, -0.4017333984375, -0.23895263671875, -0.076171875, 0.08660888671875, 0.2493896484375, 0.41217041015625, 0.574951171875, 0.73773193359375, 0.9005126953125, 1.06329345703125, 1.22607421875, 1.38885498046875, 1.5516357421875, 1.71441650390625, 1.877197265625, 2.03997802734375, 2.2027587890625, 2.36553955078125, 2.5283203125, 2.69110107421875, 2.8538818359375, 3.01666259765625, 3.179443359375, 3.34222412109375, 3.5050048828125, 3.66778564453125, 3.83056640625, 3.99334716796875, 4.1561279296875, 4.31890869140625, 4.481689453125, 4.64447021484375, 4.8072509765625, 4.97003173828125, 5.1328125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 7.0, 14.0, 9.0, 11.0, 21.0, 18.0, 16.0, 32.0, 23.0, 32.0, 31.0, 46.0, 39.0, 34.0, 41.0, 61.0, 44.0, 1061.0, 47.0, 41.0, 39.0, 36.0, 36.0, 28.0, 31.0, 34.0, 22.0, 18.0, 22.0, 17.0, 27.0, 12.0, 17.0, 10.0, 7.0, 7.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-67.6875, -65.78271484375, -63.8779296875, -61.97314453125, -60.068359375, -58.16357421875, -56.2587890625, -54.35400390625, -52.44921875, -50.54443359375, -48.6396484375, -46.73486328125, -44.830078125, -42.92529296875, -41.0205078125, -39.11572265625, -37.2109375, -35.30615234375, -33.4013671875, -31.49658203125, -29.591796875, -27.68701171875, -25.7822265625, -23.87744140625, -21.97265625, -20.06787109375, -18.1630859375, -16.25830078125, -14.353515625, -12.44873046875, -10.5439453125, -8.63916015625, -6.734375, -4.82958984375, -2.9248046875, -1.02001953125, 0.884765625, 2.78955078125, 4.6943359375, 6.59912109375, 8.50390625, 10.40869140625, 12.3134765625, 14.21826171875, 16.123046875, 18.02783203125, 19.9326171875, 21.83740234375, 23.7421875, 25.64697265625, 27.5517578125, 29.45654296875, 31.361328125, 33.26611328125, 35.1708984375, 37.07568359375, 38.98046875, 40.88525390625, 42.7900390625, 44.69482421875, 46.599609375, 48.50439453125, 50.4091796875, 52.31396484375, 54.21875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 15.0, 21.0, 18.0, 37.0, 71.0, 104.0, 158.0, 215.0, 354.0, 517.0, 773.0, 1270.0, 1845.0, 2849.0, 4704.0, 7120.0, 11219.0, 16851.0, 26225.0, 38980.0, 57934.0, 82399.0, 111638.0, 267595.0, 1044587.0, 126274.0, 93242.0, 66786.0, 45648.0, 30547.0, 20278.0, 12886.0, 8405.0, 5418.0, 3659.0, 2285.0, 1523.0, 918.0, 595.0, 400.0, 253.0, 175.0, 119.0, 75.0, 45.0, 31.0, 25.0, 16.0, 11.0, 4.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.984375, -3.8524169921875, -3.720458984375, -3.5885009765625, -3.45654296875, -3.3245849609375, -3.192626953125, -3.0606689453125, -2.9287109375, -2.7967529296875, -2.664794921875, -2.5328369140625, -2.40087890625, -2.2689208984375, -2.136962890625, -2.0050048828125, -1.873046875, -1.7410888671875, -1.609130859375, -1.4771728515625, -1.34521484375, -1.2132568359375, -1.081298828125, -0.9493408203125, -0.8173828125, -0.6854248046875, -0.553466796875, -0.4215087890625, -0.28955078125, -0.1575927734375, -0.025634765625, 0.1063232421875, 0.23828125, 0.3702392578125, 0.502197265625, 0.6341552734375, 0.76611328125, 0.8980712890625, 1.030029296875, 1.1619873046875, 1.2939453125, 1.4259033203125, 1.557861328125, 1.6898193359375, 1.82177734375, 1.9537353515625, 2.085693359375, 2.2176513671875, 2.349609375, 2.4815673828125, 2.613525390625, 2.7454833984375, 2.87744140625, 3.0093994140625, 3.141357421875, 3.2733154296875, 3.4052734375, 3.5372314453125, 3.669189453125, 3.8011474609375, 3.93310546875, 4.0650634765625, 4.197021484375, 4.3289794921875, 4.4609375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 1.0, 8.0, 7.0, 9.0, 5.0, 13.0, 13.0, 12.0, 21.0, 19.0, 17.0, 23.0, 35.0, 37.0, 57.0, 56.0, 79.0, 79.0, 86.0, 68.0, 51.0, 53.0, 41.0, 42.0, 30.0, 29.0, 19.0, 19.0, 11.0, 13.0, 7.0, 10.0, 6.0, 2.0, 2.0, 4.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21044921875, -0.20388221740722656, -0.19731521606445312, -0.1907482147216797, -0.18418121337890625, -0.1776142120361328, -0.17104721069335938, -0.16448020935058594, -0.1579132080078125, -0.15134620666503906, -0.14477920532226562, -0.1382122039794922, -0.13164520263671875, -0.1250782012939453, -0.11851119995117188, -0.11194419860839844, -0.105377197265625, -0.09881019592285156, -0.09224319458007812, -0.08567619323730469, -0.07910919189453125, -0.07254219055175781, -0.06597518920898438, -0.05940818786621094, -0.0528411865234375, -0.04627418518066406, -0.039707183837890625, -0.03314018249511719, -0.02657318115234375, -0.020006179809570312, -0.013439178466796875, -0.0068721771240234375, -0.00030517578125, 0.0062618255615234375, 0.012828826904296875, 0.019395828247070312, 0.02596282958984375, 0.03252983093261719, 0.039096832275390625, 0.04566383361816406, 0.0522308349609375, 0.05879783630371094, 0.06536483764648438, 0.07193183898925781, 0.07849884033203125, 0.08506584167480469, 0.09163284301757812, 0.09819984436035156, 0.104766845703125, 0.11133384704589844, 0.11790084838867188, 0.12446784973144531, 0.13103485107421875, 0.1376018524169922, 0.14416885375976562, 0.15073585510253906, 0.1573028564453125, 0.16386985778808594, 0.17043685913085938, 0.1770038604736328, 0.18357086181640625, 0.1901378631591797, 0.19670486450195312, 0.20327186584472656, 0.2098388671875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 2.0, 11.0, 14.0, 9.0, 28.0, 31.0, 36.0, 53.0, 61.0, 87.0, 134.0, 202.0, 294.0, 500.0, 780.0, 1414.0, 2583.0, 4834.0, 9584.0, 19884.0, 49708.0, 148872.0, 392764.0, 270155.0, 85869.0, 31621.0, 13731.0, 7008.0, 3482.0, 1909.0, 1103.0, 598.0, 401.0, 232.0, 149.0, 121.0, 64.0, 57.0, 51.0, 32.0, 25.0, 18.0, 11.0, 11.0, 6.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8759765625, -0.8483963012695312, -0.8208160400390625, -0.7932357788085938, -0.765655517578125, -0.7380752563476562, -0.7104949951171875, -0.6829147338867188, -0.65533447265625, -0.6277542114257812, -0.6001739501953125, -0.5725936889648438, -0.545013427734375, -0.5174331665039062, -0.4898529052734375, -0.46227264404296875, -0.4346923828125, -0.40711212158203125, -0.3795318603515625, -0.35195159912109375, -0.324371337890625, -0.29679107666015625, -0.2692108154296875, -0.24163055419921875, -0.21405029296875, -0.18647003173828125, -0.1588897705078125, -0.13130950927734375, -0.103729248046875, -0.07614898681640625, -0.0485687255859375, -0.02098846435546875, 0.006591796875, 0.03417205810546875, 0.0617523193359375, 0.08933258056640625, 0.116912841796875, 0.14449310302734375, 0.1720733642578125, 0.19965362548828125, 0.22723388671875, 0.25481414794921875, 0.2823944091796875, 0.30997467041015625, 0.337554931640625, 0.36513519287109375, 0.3927154541015625, 0.42029571533203125, 0.4478759765625, 0.47545623779296875, 0.5030364990234375, 0.5306167602539062, 0.558197021484375, 0.5857772827148438, 0.6133575439453125, 0.6409378051757812, 0.66851806640625, 0.6960983276367188, 0.7236785888671875, 0.7512588500976562, 0.778839111328125, 0.8064193725585938, 0.8339996337890625, 0.8615798950195312, 0.88916015625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 5.0, 6.0, 6.0, 14.0, 24.0, 28.0, 45.0, 62.0, 96.0, 94.0, 118.0, 110.0, 83.0, 83.0, 58.0, 48.0, 39.0, 37.0, 15.0, 15.0, 8.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21029828488826752, -0.19517464935779572, -0.18005099892616272, -0.16492736339569092, -0.14980372786521912, -0.13468009233474731, -0.11955644190311432, -0.10443280637264252, -0.08930916339159012, -0.07418552041053772, -0.05906188488006592, -0.04393824189901352, -0.02881460264325142, -0.013690963387489319, 0.0014326795935630798, 0.01655631512403488, 0.03167995810508728, 0.04680359736084938, 0.06192723661661148, 0.07705087959766388, 0.09217451512813568, 0.10729815810918808, 0.12242180109024048, 0.13754543662071228, 0.15266907215118408, 0.16779270768165588, 0.18291635811328888, 0.19803999364376068, 0.21316362917423248, 0.22828727960586548, 0.24341091513633728, 0.2585345506668091, 0.2736581861972809, 0.2887818217277527, 0.3039054572582245, 0.3190290927886963, 0.3341527581214905, 0.3492763936519623, 0.3644000291824341, 0.3795236647129059, 0.3946473002433777, 0.4097709357738495, 0.4248945713043213, 0.4400182366371155, 0.4551418721675873, 0.4702655076980591, 0.4853891432285309, 0.5005127787590027, 0.5156364440917969, 0.5307601094245911, 0.5458837151527405, 0.5610073804855347, 0.5761309862136841, 0.5912546515464783, 0.6063783168792725, 0.6215019226074219, 0.6366255283355713, 0.6517491936683655, 0.6668727993965149, 0.6819964647293091, 0.6971200704574585, 0.7122437357902527, 0.7273674011230469, 0.7424910068511963, 0.7576146721839905]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 6.0, 12.0, 5.0, 7.0, 12.0, 17.0, 14.0, 15.0, 16.0, 26.0, 38.0, 20.0, 35.0, 30.0, 35.0, 27.0, 26.0, 33.0, 51.0, 46.0, 34.0, 30.0, 42.0, 37.0, 46.0, 35.0, 27.0, 30.0, 33.0, 27.0, 23.0, 27.0, 17.0, 20.0, 17.0, 11.0, 15.0, 18.0, 14.0, 3.0, 7.0, 3.0, 8.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2592123746871948, -0.2510314881801605, -0.24285058677196503, -0.23466970026493073, -0.22648881375789642, -0.21830791234970093, -0.21012702584266663, -0.20194613933563232, -0.19376525282859802, -0.18558436632156372, -0.17740346491336823, -0.16922257840633392, -0.16104169189929962, -0.15286079049110413, -0.14467990398406982, -0.13649901747703552, -0.12831811606884003, -0.12013722211122513, -0.11195633560419083, -0.10377544164657593, -0.09559455513954163, -0.08741366118192673, -0.07923276722431183, -0.07105188071727753, -0.06287098675966263, -0.05469009652733803, -0.04650920629501343, -0.03832831233739853, -0.03014742210507393, -0.02196653187274933, -0.01378563791513443, -0.00560474768280983, 0.0025761425495147705, 0.010757033713161945, 0.01893792487680912, 0.02711881697177887, 0.03529970720410347, 0.04348059743642807, 0.05166149139404297, 0.05984238162636757, 0.06802327185869217, 0.07620416581630707, 0.08438505232334137, 0.09256594628095627, 0.10074684023857117, 0.10892772674560547, 0.11710862070322037, 0.12528951466083527, 0.13347040116786957, 0.14165128767490387, 0.14983218908309937, 0.15801307559013367, 0.16619396209716797, 0.17437484860420227, 0.18255575001239777, 0.19073663651943207, 0.19891753792762756, 0.20709842443466187, 0.21527932584285736, 0.22346021234989166, 0.23164109885692596, 0.23982200026512146, 0.24800288677215576, 0.25618377327919006, 0.26436465978622437]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 2.0, 12.0, 12.0, 9.0, 9.0, 18.0, 18.0, 16.0, 28.0, 37.0, 38.0, 36.0, 36.0, 38.0, 39.0, 34.0, 42.0, 46.0, 55.0, 44.0, 44.0, 41.0, 48.0, 32.0, 38.0, 32.0, 23.0, 29.0, 17.0, 17.0, 22.0, 16.0, 16.0, 11.0, 5.0, 12.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-100.5625, -97.32421875, -94.0859375, -90.84765625, -87.609375, -84.37109375, -81.1328125, -77.89453125, -74.65625, -71.41796875, -68.1796875, -64.94140625, -61.703125, -58.46484375, -55.2265625, -51.98828125, -48.75, -45.51171875, -42.2734375, -39.03515625, -35.796875, -32.55859375, -29.3203125, -26.08203125, -22.84375, -19.60546875, -16.3671875, -13.12890625, -9.890625, -6.65234375, -3.4140625, -0.17578125, 3.0625, 6.30078125, 9.5390625, 12.77734375, 16.015625, 19.25390625, 22.4921875, 25.73046875, 28.96875, 32.20703125, 35.4453125, 38.68359375, 41.921875, 45.16015625, 48.3984375, 51.63671875, 54.875, 58.11328125, 61.3515625, 64.58984375, 67.828125, 71.06640625, 74.3046875, 77.54296875, 80.78125, 84.01953125, 87.2578125, 90.49609375, 93.734375, 96.97265625, 100.2109375, 103.44921875, 106.6875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 6.0, 7.0, 8.0, 8.0, 16.0, 15.0, 19.0, 30.0, 48.0, 51.0, 63.0, 117.0, 176.0, 296.0, 756.0, 2924.0, 21971.0, 268481.0, 647702.0, 94480.0, 8604.0, 1542.0, 497.0, 230.0, 127.0, 96.0, 52.0, 45.0, 38.0, 23.0, 23.0, 17.0, 19.0, 12.0, 7.0, 13.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.359375, -20.6767578125, -19.994140625, -19.3115234375, -18.62890625, -17.9462890625, -17.263671875, -16.5810546875, -15.8984375, -15.2158203125, -14.533203125, -13.8505859375, -13.16796875, -12.4853515625, -11.802734375, -11.1201171875, -10.4375, -9.7548828125, -9.072265625, -8.3896484375, -7.70703125, -7.0244140625, -6.341796875, -5.6591796875, -4.9765625, -4.2939453125, -3.611328125, -2.9287109375, -2.24609375, -1.5634765625, -0.880859375, -0.1982421875, 0.484375, 1.1669921875, 1.849609375, 2.5322265625, 3.21484375, 3.8974609375, 4.580078125, 5.2626953125, 5.9453125, 6.6279296875, 7.310546875, 7.9931640625, 8.67578125, 9.3583984375, 10.041015625, 10.7236328125, 11.40625, 12.0888671875, 12.771484375, 13.4541015625, 14.13671875, 14.8193359375, 15.501953125, 16.1845703125, 16.8671875, 17.5498046875, 18.232421875, 18.9150390625, 19.59765625, 20.2802734375, 20.962890625, 21.6455078125, 22.328125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 8.0, 7.0, 11.0, 11.0, 19.0, 21.0, 45.0, 37.0, 52.0, 67.0, 82.0, 72.0, 115.0, 2095.0, 63.0, 61.0, 56.0, 49.0, 48.0, 39.0, 25.0, 22.0, 20.0, 10.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-292.25, -285.150390625, -278.05078125, -270.951171875, -263.8515625, -256.751953125, -249.65234375, -242.552734375, -235.453125, -228.353515625, -221.25390625, -214.154296875, -207.0546875, -199.955078125, -192.85546875, -185.755859375, -178.65625, -171.556640625, -164.45703125, -157.357421875, -150.2578125, -143.158203125, -136.05859375, -128.958984375, -121.859375, -114.759765625, -107.66015625, -100.560546875, -93.4609375, -86.361328125, -79.26171875, -72.162109375, -65.0625, -57.962890625, -50.86328125, -43.763671875, -36.6640625, -29.564453125, -22.46484375, -15.365234375, -8.265625, -1.166015625, 5.93359375, 13.033203125, 20.1328125, 27.232421875, 34.33203125, 41.431640625, 48.53125, 55.630859375, 62.73046875, 69.830078125, 76.9296875, 84.029296875, 91.12890625, 98.228515625, 105.328125, 112.427734375, 119.52734375, 126.626953125, 133.7265625, 140.826171875, 147.92578125, 155.025390625, 162.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 2.0, 10.0, 7.0, 10.0, 11.0, 30.0, 44.0, 101.0, 174.0, 399.0, 983.0, 3147.0, 22207.0, 1340303.0, 1750858.0, 22407.0, 3253.0, 1002.0, 393.0, 154.0, 75.0, 55.0, 36.0, 15.0, 11.0, 7.0, 6.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.453125, -24.681884765625, -23.91064453125, -23.139404296875, -22.3681640625, -21.596923828125, -20.82568359375, -20.054443359375, -19.283203125, -18.511962890625, -17.74072265625, -16.969482421875, -16.1982421875, -15.427001953125, -14.65576171875, -13.884521484375, -13.11328125, -12.342041015625, -11.57080078125, -10.799560546875, -10.0283203125, -9.257080078125, -8.48583984375, -7.714599609375, -6.943359375, -6.172119140625, -5.40087890625, -4.629638671875, -3.8583984375, -3.087158203125, -2.31591796875, -1.544677734375, -0.7734375, -0.002197265625, 0.76904296875, 1.540283203125, 2.3115234375, 3.082763671875, 3.85400390625, 4.625244140625, 5.396484375, 6.167724609375, 6.93896484375, 7.710205078125, 8.4814453125, 9.252685546875, 10.02392578125, 10.795166015625, 11.56640625, 12.337646484375, 13.10888671875, 13.880126953125, 14.6513671875, 15.422607421875, 16.19384765625, 16.965087890625, 17.736328125, 18.507568359375, 19.27880859375, 20.050048828125, 20.8212890625, 21.592529296875, 22.36376953125, 23.135009765625, 23.90625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 8.0, 5.0, 17.0, 36.0, 106.0, 236.0, 297.0, 192.0, 55.0, 13.0, 16.0, 8.0, 4.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-322.5245056152344, -308.7859802246094, -295.0474853515625, -281.3089599609375, -267.5704345703125, -253.8319091796875, -240.09339904785156, -226.35488891601562, -212.61636352539062, -198.87783813476562, -185.1393280029297, -171.40081787109375, -157.66229248046875, -143.92376708984375, -130.1852569580078, -116.44673919677734, -102.70822143554688, -88.9697036743164, -75.23118591308594, -61.49266815185547, -47.754150390625, -34.01563262939453, -20.277114868164062, -6.538597106933594, 7.199920654296875, 20.938438415527344, 34.67695617675781, 48.41547393798828, 62.15399169921875, 75.89250946044922, 89.63102722167969, 103.36954498291016, 117.1080322265625, 130.8465576171875, 144.58506774902344, 158.32357788085938, 172.06210327148438, 185.80062866210938, 199.5391387939453, 213.27764892578125, 227.01617431640625, 240.75469970703125, 254.4932098388672, 268.2317199707031, 281.9702453613281, 295.7087707519531, 309.447265625, 323.185791015625, 336.92431640625, 350.662841796875, 364.4013671875, 378.1398620605469, 391.8783874511719, 405.6169128417969, 419.35540771484375, 433.09393310546875, 446.83245849609375, 460.57098388671875, 474.30950927734375, 488.0480041503906, 501.7865295410156, 515.5250244140625, 529.2635498046875, 543.0020751953125, 556.7406005859375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 8.0, 4.0, 6.0, 6.0, 4.0, 15.0, 8.0, 16.0, 14.0, 25.0, 21.0, 26.0, 35.0, 22.0, 37.0, 38.0, 45.0, 48.0, 37.0, 35.0, 47.0, 49.0, 42.0, 39.0, 38.0, 28.0, 39.0, 36.0, 26.0, 29.0, 30.0, 24.0, 22.0, 17.0, 16.0, 8.0, 15.0, 14.0, 11.0, 12.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-226.7307891845703, -220.21975708007812, -213.70872497558594, -207.19769287109375, -200.68666076660156, -194.17562866210938, -187.66458129882812, -181.153564453125, -174.64251708984375, -168.13148498535156, -161.62045288085938, -155.1094207763672, -148.598388671875, -142.0873565673828, -135.57632446289062, -129.06527709960938, -122.55426025390625, -116.04322814941406, -109.53219604492188, -103.02116394042969, -96.5101318359375, -89.99909973144531, -83.4880599975586, -76.9770278930664, -70.46599578857422, -63.95496368408203, -57.443931579589844, -50.93289566040039, -44.4218635559082, -37.910831451416016, -31.399795532226562, -24.888763427734375, -18.377731323242188, -11.866698265075684, -5.35566520690918, 1.1553688049316406, 7.666400909423828, 14.177433013916016, 20.68846893310547, 27.199501037597656, 33.710533142089844, 40.22156524658203, 46.73259735107422, 53.24363327026367, 59.75466537475586, 66.26570129394531, 72.7767333984375, 79.28776550292969, 85.79879760742188, 92.30982971191406, 98.82086181640625, 105.33189392089844, 111.84292602539062, 118.35395812988281, 124.86499786376953, 131.37603759765625, 137.88705444335938, 144.39808654785156, 150.90911865234375, 157.42015075683594, 163.93118286132812, 170.4422149658203, 176.9532470703125, 183.46429443359375, 189.97532653808594]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 5.0, 11.0, 9.0, 13.0, 20.0, 21.0, 31.0, 32.0, 53.0, 62.0, 86.0, 114.0, 151.0, 212.0, 274.0, 419.0, 655.0, 1070.0, 2195.0, 4086.0, 8578.0, 1012342.0, 8549.0, 4169.0, 2123.0, 1079.0, 676.0, 386.0, 313.0, 215.0, 168.0, 113.0, 83.0, 44.0, 50.0, 34.0, 30.0, 19.0, 21.0, 16.0, 11.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.34611892700195, -40.86087417602539, -39.37562561035156, -37.890380859375, -36.40513610839844, -34.91988754272461, -33.43464279174805, -31.94939613342285, -30.464149475097656, -28.97890281677246, -27.493656158447266, -26.008411407470703, -24.523164749145508, -23.037918090820312, -21.55267333984375, -20.067426681518555, -18.58218002319336, -17.096933364868164, -15.611687660217285, -14.126441955566406, -12.641195297241211, -11.155948638916016, -9.670702934265137, -8.185457229614258, -6.7002105712890625, -5.214964389801025, -3.7297182083129883, -2.244472026824951, -0.7592258453369141, 0.726020336151123, 2.21126651763916, 3.696512222290039, 5.1817626953125, 6.667008876800537, 8.152255058288574, 9.637500762939453, 11.122747421264648, 12.607994079589844, 14.093239784240723, 15.578485488891602, 17.063732147216797, 18.548978805541992, 20.034225463867188, 21.51947021484375, 23.004716873168945, 24.48996353149414, 25.975208282470703, 27.4604549407959, 28.945701599121094, 30.43094825744629, 31.916194915771484, 33.40143966674805, 34.886688232421875, 36.37193298339844, 37.857177734375, 39.34242248535156, 40.82767105102539, 42.31291580200195, 43.79816436767578, 45.283409118652344, 46.768653869628906, 48.253902435302734, 49.7391471862793, 51.224395751953125, 52.70964050292969]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 8.0, 16.0, 14.0, 34.0, 52.0, 209.0, 51324128.0, 138493.0, 203.0, 47.0, 21.0, 14.0, 11.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1835.108642578125, -1764.511474609375, -1693.914306640625, -1623.317138671875, -1552.7198486328125, -1482.1226806640625, -1411.5255126953125, -1340.9283447265625, -1270.3310546875, -1199.73388671875, -1129.13671875, -1058.53955078125, -987.9422607421875, -917.3450927734375, -846.7479248046875, -776.1507568359375, -705.5535888671875, -634.9564208984375, -564.3591918945312, -493.76202392578125, -423.1648254394531, -352.567626953125, -281.970458984375, -211.37326049804688, -140.77606201171875, -70.17887115478516, 0.4183197021484375, 71.0155029296875, 141.61270141601562, 212.20989990234375, 282.80706787109375, 353.4042663574219, 424.00146484375, 494.5986633300781, 565.1958618164062, 635.7930297851562, 706.3902587890625, 776.9874267578125, 847.5845947265625, 918.1817626953125, 988.7789916992188, 1059.376220703125, 1129.973388671875, 1200.570556640625, 1271.167724609375, 1341.764892578125, 1412.362060546875, 1482.9593505859375, 1553.5565185546875, 1624.1536865234375, 1694.7508544921875, 1765.34814453125, 1835.9453125, 1906.54248046875, 1977.1396484375, 2047.73681640625, 2118.333984375, 2188.93115234375, 2259.5283203125, 2330.12548828125, 2400.72265625, 2471.31982421875, 2541.9169921875, 2612.514404296875, 2683.111572265625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 6.0, 10.0, 15.0, 17.0, 28.0, 57.0, 70.0, 133.0, 173.0, 275.0, 474.0, 843.0, 1415.0, 2461.0, 4628.0, 8347.0, 16162.0, 32036.0, 65901.0, 141713.0, 320511.0, 808669.0, 2635030.0, 1385751.0, 478262.0, 204811.0, 92418.0, 44246.0, 21822.0, 11406.0, 5949.0, 3231.0, 1923.0, 1027.0, 615.0, 358.0, 216.0, 132.0, 110.0, 42.0, 54.0, 36.0, 24.0, 15.0, 11.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.296875, -22.606201171875, -21.91552734375, -21.224853515625, -20.5341796875, -19.843505859375, -19.15283203125, -18.462158203125, -17.771484375, -17.080810546875, -16.39013671875, -15.699462890625, -15.0087890625, -14.318115234375, -13.62744140625, -12.936767578125, -12.24609375, -11.555419921875, -10.86474609375, -10.174072265625, -9.4833984375, -8.792724609375, -8.10205078125, -7.411376953125, -6.720703125, -6.030029296875, -5.33935546875, -4.648681640625, -3.9580078125, -3.267333984375, -2.57666015625, -1.885986328125, -1.1953125, -0.504638671875, 0.18603515625, 0.876708984375, 1.5673828125, 2.258056640625, 2.94873046875, 3.639404296875, 4.330078125, 5.020751953125, 5.71142578125, 6.402099609375, 7.0927734375, 7.783447265625, 8.47412109375, 9.164794921875, 9.85546875, 10.546142578125, 11.23681640625, 11.927490234375, 12.6181640625, 13.308837890625, 13.99951171875, 14.690185546875, 15.380859375, 16.071533203125, 16.76220703125, 17.452880859375, 18.1435546875, 18.834228515625, 19.52490234375, 20.215576171875, 20.90625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 5.0, 4.0, 11.0, 9.0, 6.0, 8.0, 18.0, 19.0, 21.0, 18.0, 23.0, 18.0, 30.0, 36.0, 37.0, 43.0, 62.0, 50.0, 97.0, 118.0, 212.0, 270.0, 229.0, 134.0, 93.0, 70.0, 41.0, 44.0, 36.0, 27.0, 28.0, 19.0, 25.0, 20.0, 24.0, 25.0, 14.0, 6.0, 22.0, 9.0, 7.0, 3.0, 7.0, 4.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0], "bins": [-25.875, -25.107666015625, -24.34033203125, -23.572998046875, -22.8056640625, -22.038330078125, -21.27099609375, -20.503662109375, -19.736328125, -18.968994140625, -18.20166015625, -17.434326171875, -16.6669921875, -15.899658203125, -15.13232421875, -14.364990234375, -13.59765625, -12.830322265625, -12.06298828125, -11.295654296875, -10.5283203125, -9.760986328125, -8.99365234375, -8.226318359375, -7.458984375, -6.691650390625, -5.92431640625, -5.156982421875, -4.3896484375, -3.622314453125, -2.85498046875, -2.087646484375, -1.3203125, -0.552978515625, 0.21435546875, 0.981689453125, 1.7490234375, 2.516357421875, 3.28369140625, 4.051025390625, 4.818359375, 5.585693359375, 6.35302734375, 7.120361328125, 7.8876953125, 8.655029296875, 9.42236328125, 10.189697265625, 10.95703125, 11.724365234375, 12.49169921875, 13.259033203125, 14.0263671875, 14.793701171875, 15.56103515625, 16.328369140625, 17.095703125, 17.863037109375, 18.63037109375, 19.397705078125, 20.1650390625, 20.932373046875, 21.69970703125, 22.467041015625, 23.234375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 8.0, 15.0, 17.0, 31.0, 42.0, 61.0, 101.0, 170.0, 293.0, 505.0, 828.0, 1428.0, 2375.0, 4316.0, 7452.0, 12983.0, 22225.0, 39202.0, 67577.0, 112724.0, 183634.0, 292834.0, 497492.0, 1626686.0, 2027903.0, 575800.0, 316556.0, 199623.0, 123558.0, 73654.0, 43209.0, 24675.0, 14079.0, 8104.0, 4830.0, 2675.0, 1595.0, 907.0, 492.0, 339.0, 180.0, 100.0, 70.0, 39.0, 18.0, 14.0, 8.0, 2.0, 9.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.125, -7.8636474609375, -7.602294921875, -7.3409423828125, -7.07958984375, -6.8182373046875, -6.556884765625, -6.2955322265625, -6.0341796875, -5.7728271484375, -5.511474609375, -5.2501220703125, -4.98876953125, -4.7274169921875, -4.466064453125, -4.2047119140625, -3.943359375, -3.6820068359375, -3.420654296875, -3.1593017578125, -2.89794921875, -2.6365966796875, -2.375244140625, -2.1138916015625, -1.8525390625, -1.5911865234375, -1.329833984375, -1.0684814453125, -0.80712890625, -0.5457763671875, -0.284423828125, -0.0230712890625, 0.23828125, 0.4996337890625, 0.760986328125, 1.0223388671875, 1.28369140625, 1.5450439453125, 1.806396484375, 2.0677490234375, 2.3291015625, 2.5904541015625, 2.851806640625, 3.1131591796875, 3.37451171875, 3.6358642578125, 3.897216796875, 4.1585693359375, 4.419921875, 4.6812744140625, 4.942626953125, 5.2039794921875, 5.46533203125, 5.7266845703125, 5.988037109375, 6.2493896484375, 6.5107421875, 6.7720947265625, 7.033447265625, 7.2947998046875, 7.55615234375, 7.8175048828125, 8.078857421875, 8.3402099609375, 8.6015625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 12.0, 10.0, 9.0, 18.0, 17.0, 17.0, 25.0, 32.0, 31.0, 37.0, 27.0, 40.0, 34.0, 60.0, 89.0, 241.0, 438.0, 315.0, 118.0, 52.0, 48.0, 48.0, 40.0, 34.0, 38.0, 21.0, 24.0, 24.0, 16.0, 17.0, 13.0, 12.0, 9.0, 7.0, 8.0, 6.0, 1.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-41.15625, -39.9716796875, -38.787109375, -37.6025390625, -36.41796875, -35.2333984375, -34.048828125, -32.8642578125, -31.6796875, -30.4951171875, -29.310546875, -28.1259765625, -26.94140625, -25.7568359375, -24.572265625, -23.3876953125, -22.203125, -21.0185546875, -19.833984375, -18.6494140625, -17.46484375, -16.2802734375, -15.095703125, -13.9111328125, -12.7265625, -11.5419921875, -10.357421875, -9.1728515625, -7.98828125, -6.8037109375, -5.619140625, -4.4345703125, -3.25, -2.0654296875, -0.880859375, 0.3037109375, 1.48828125, 2.6728515625, 3.857421875, 5.0419921875, 6.2265625, 7.4111328125, 8.595703125, 9.7802734375, 10.96484375, 12.1494140625, 13.333984375, 14.5185546875, 15.703125, 16.8876953125, 18.072265625, 19.2568359375, 20.44140625, 21.6259765625, 22.810546875, 23.9951171875, 25.1796875, 26.3642578125, 27.548828125, 28.7333984375, 29.91796875, 31.1025390625, 32.287109375, 33.4716796875, 34.65625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 11.0, 12.0, 18.0, 14.0, 36.0, 35.0, 41.0, 74.0, 95.0, 126.0, 171.0, 242.0, 315.0, 378.0, 556.0, 906.0, 1315.0, 2028.0, 3434.0, 6415.0, 13792.0, 30621.0, 73103.0, 214329.0, 5705690.0, 136508.0, 54022.0, 23249.0, 10568.0, 5038.0, 2796.0, 1649.0, 1122.0, 771.0, 528.0, 399.0, 312.0, 199.0, 141.0, 103.0, 76.0, 47.0, 41.0, 27.0, 28.0, 16.0, 12.0, 5.0, 6.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-46.59375, -45.15234375, -43.7109375, -42.26953125, -40.828125, -39.38671875, -37.9453125, -36.50390625, -35.0625, -33.62109375, -32.1796875, -30.73828125, -29.296875, -27.85546875, -26.4140625, -24.97265625, -23.53125, -22.08984375, -20.6484375, -19.20703125, -17.765625, -16.32421875, -14.8828125, -13.44140625, -12.0, -10.55859375, -9.1171875, -7.67578125, -6.234375, -4.79296875, -3.3515625, -1.91015625, -0.46875, 0.97265625, 2.4140625, 3.85546875, 5.296875, 6.73828125, 8.1796875, 9.62109375, 11.0625, 12.50390625, 13.9453125, 15.38671875, 16.828125, 18.26953125, 19.7109375, 21.15234375, 22.59375, 24.03515625, 25.4765625, 26.91796875, 28.359375, 29.80078125, 31.2421875, 32.68359375, 34.125, 35.56640625, 37.0078125, 38.44921875, 39.890625, 41.33203125, 42.7734375, 44.21484375, 45.65625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 7.0, 6.0, 9.0, 7.0, 8.0, 13.0, 12.0, 21.0, 17.0, 22.0, 27.0, 19.0, 32.0, 41.0, 25.0, 30.0, 33.0, 29.0, 40.0, 66.0, 305.0, 614.0, 205.0, 56.0, 39.0, 36.0, 31.0, 24.0, 29.0, 32.0, 29.0, 21.0, 18.0, 14.0, 18.0, 15.0, 16.0, 10.0, 6.0, 7.0, 8.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-64.5625, -62.4384765625, -60.314453125, -58.1904296875, -56.06640625, -53.9423828125, -51.818359375, -49.6943359375, -47.5703125, -45.4462890625, -43.322265625, -41.1982421875, -39.07421875, -36.9501953125, -34.826171875, -32.7021484375, -30.578125, -28.4541015625, -26.330078125, -24.2060546875, -22.08203125, -19.9580078125, -17.833984375, -15.7099609375, -13.5859375, -11.4619140625, -9.337890625, -7.2138671875, -5.08984375, -2.9658203125, -0.841796875, 1.2822265625, 3.40625, 5.5302734375, 7.654296875, 9.7783203125, 11.90234375, 14.0263671875, 16.150390625, 18.2744140625, 20.3984375, 22.5224609375, 24.646484375, 26.7705078125, 28.89453125, 31.0185546875, 33.142578125, 35.2666015625, 37.390625, 39.5146484375, 41.638671875, 43.7626953125, 45.88671875, 48.0107421875, 50.134765625, 52.2587890625, 54.3828125, 56.5068359375, 58.630859375, 60.7548828125, 62.87890625, 65.0029296875, 67.126953125, 69.2509765625, 71.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 6.0, 9.0, 30.0, 48.0, 250.0, 499.0, 92.0, 20.0, 12.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-643.6936645507812, -624.3649291992188, -605.0362548828125, -585.70751953125, -566.3788452148438, -547.0501098632812, -527.721435546875, -508.3927001953125, -489.06402587890625, -469.7353210449219, -450.4066162109375, -431.0779113769531, -411.74920654296875, -392.4205017089844, -373.091796875, -353.7630615234375, -334.4343566894531, -315.10565185546875, -295.7769470214844, -276.4482421875, -257.1195373535156, -237.79083251953125, -218.4621124267578, -199.13340759277344, -179.80470275878906, -160.4759979248047, -141.1472930908203, -121.8185806274414, -102.48987579345703, -83.16117095947266, -63.83245849609375, -44.503753662109375, -25.175048828125, -5.846342086791992, 13.482364654541016, 32.811073303222656, 52.13977813720703, 71.4684829711914, 90.79719543457031, 110.12590026855469, 129.45460510253906, 148.78330993652344, 168.1120147705078, 187.44073486328125, 206.76943969726562, 226.09814453125, 245.42684936523438, 264.75555419921875, 284.0842590332031, 303.4129638671875, 322.7416687011719, 342.07037353515625, 361.3990783691406, 380.727783203125, 400.0565185546875, 419.38519287109375, 438.71392822265625, 458.0426330566406, 477.371337890625, 496.7000427246094, 516.0287475585938, 535.3574829101562, 554.6861572265625, 574.014892578125, 593.3435668945312]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 4.0, 8.0, 7.0, 9.0, 5.0, 14.0, 20.0, 16.0, 39.0, 142.0, 322.0, 221.0, 57.0, 21.0, 18.0, 17.0, 20.0, 11.0, 8.0, 9.0, 6.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-411.84600830078125, -396.4272155761719, -381.0084228515625, -365.5896301269531, -350.17083740234375, -334.75201416015625, -319.333251953125, -303.9144287109375, -288.4956359863281, -273.07684326171875, -257.6580505371094, -242.2392578125, -226.82044982910156, -211.4016571044922, -195.9828643798828, -180.56405639648438, -165.14527893066406, -149.7264862060547, -134.3076934814453, -118.8888931274414, -103.4700927734375, -88.05130004882812, -72.63250732421875, -57.213706970214844, -41.79491424560547, -26.376117706298828, -10.95732307434082, 4.4614715576171875, 19.880268096923828, 35.29906463623047, 50.717857360839844, 66.13665771484375, 81.55545043945312, 96.9742431640625, 112.3930435180664, 127.81183624267578, 143.2306365966797, 158.64942932128906, 174.06822204589844, 189.48703002929688, 204.90582275390625, 220.32461547851562, 235.743408203125, 251.16220092773438, 266.58099365234375, 281.99981689453125, 297.4185791015625, 312.83740234375, 328.25616455078125, 343.6749572753906, 359.09375, 374.5125427246094, 389.93133544921875, 405.35015869140625, 420.7689208984375, 436.187744140625, 451.6065368652344, 467.02532958984375, 482.4441223144531, 497.8629150390625, 513.28173828125, 528.7005004882812, 544.1193237304688, 559.5380859375, 574.9569091796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 9.0, 3.0, 9.0, 19.0, 17.0, 21.0, 27.0, 41.0, 55.0, 60.0, 80.0, 139.0, 190.0, 262.0, 362.0, 539.0, 871.0, 1373.0, 2262.0, 4197.0, 8915.0, 23846.0, 188413.0, 3889863.0, 44642.0, 13907.0, 6130.0, 3063.0, 1815.0, 1110.0, 606.0, 446.0, 273.0, 183.0, 142.0, 122.0, 78.0, 53.0, 40.0, 29.0, 19.0, 19.0, 9.0, 6.0, 7.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.02734375, -2.930328369140625, -2.83331298828125, -2.736297607421875, -2.6392822265625, -2.542266845703125, -2.44525146484375, -2.348236083984375, -2.251220703125, -2.154205322265625, -2.05718994140625, -1.960174560546875, -1.8631591796875, -1.766143798828125, -1.66912841796875, -1.572113037109375, -1.47509765625, -1.378082275390625, -1.28106689453125, -1.184051513671875, -1.0870361328125, -0.990020751953125, -0.89300537109375, -0.795989990234375, -0.698974609375, -0.601959228515625, -0.50494384765625, -0.407928466796875, -0.3109130859375, -0.213897705078125, -0.11688232421875, -0.019866943359375, 0.0771484375, 0.174163818359375, 0.27117919921875, 0.368194580078125, 0.4652099609375, 0.562225341796875, 0.65924072265625, 0.756256103515625, 0.853271484375, 0.950286865234375, 1.04730224609375, 1.144317626953125, 1.2413330078125, 1.338348388671875, 1.43536376953125, 1.532379150390625, 1.62939453125, 1.726409912109375, 1.82342529296875, 1.920440673828125, 2.0174560546875, 2.114471435546875, 2.21148681640625, 2.308502197265625, 2.405517578125, 2.502532958984375, 2.59954833984375, 2.696563720703125, 2.7935791015625, 2.890594482421875, 2.98760986328125, 3.084625244140625, 3.181640625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 3.0, 7.0, 3.0, 4.0, 9.0, 5.0, 12.0, 14.0, 13.0, 17.0, 485.0, 300.0, 16.0, 11.0, 21.0, 14.0, 8.0, 8.0, 7.0, 7.0, 5.0, 1.0, 7.0, 3.0, 7.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1923828125, -1.1550140380859375, -1.117645263671875, -1.0802764892578125, -1.04290771484375, -1.0055389404296875, -0.968170166015625, -0.9308013916015625, -0.8934326171875, -0.8560638427734375, -0.818695068359375, -0.7813262939453125, -0.74395751953125, -0.7065887451171875, -0.669219970703125, -0.6318511962890625, -0.594482421875, -0.5571136474609375, -0.519744873046875, -0.4823760986328125, -0.44500732421875, -0.4076385498046875, -0.370269775390625, -0.3329010009765625, -0.2955322265625, -0.2581634521484375, -0.220794677734375, -0.1834259033203125, -0.14605712890625, -0.1086883544921875, -0.071319580078125, -0.0339508056640625, 0.00341796875, 0.0407867431640625, 0.078155517578125, 0.1155242919921875, 0.15289306640625, 0.1902618408203125, 0.227630615234375, 0.2649993896484375, 0.3023681640625, 0.3397369384765625, 0.377105712890625, 0.4144744873046875, 0.45184326171875, 0.4892120361328125, 0.526580810546875, 0.5639495849609375, 0.601318359375, 0.6386871337890625, 0.676055908203125, 0.7134246826171875, 0.75079345703125, 0.7881622314453125, 0.825531005859375, 0.8628997802734375, 0.9002685546875, 0.9376373291015625, 0.975006103515625, 1.0123748779296875, 1.04974365234375, 1.0871124267578125, 1.124481201171875, 1.1618499755859375, 1.19921875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 5.0, 8.0, 6.0, 21.0, 28.0, 44.0, 42.0, 77.0, 117.0, 193.0, 329.0, 538.0, 1051.0, 2117.0, 4696.0, 11346.0, 31616.0, 119227.0, 2968516.0, 925796.0, 87327.0, 24459.0, 8994.0, 3866.0, 1798.0, 884.0, 456.0, 292.0, 141.0, 100.0, 55.0, 29.0, 21.0, 23.0, 13.0, 8.0, 4.0, 7.0, 4.0, 4.0, 3.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.8359375, -4.68896484375, -4.5419921875, -4.39501953125, -4.248046875, -4.10107421875, -3.9541015625, -3.80712890625, -3.66015625, -3.51318359375, -3.3662109375, -3.21923828125, -3.072265625, -2.92529296875, -2.7783203125, -2.63134765625, -2.484375, -2.33740234375, -2.1904296875, -2.04345703125, -1.896484375, -1.74951171875, -1.6025390625, -1.45556640625, -1.30859375, -1.16162109375, -1.0146484375, -0.86767578125, -0.720703125, -0.57373046875, -0.4267578125, -0.27978515625, -0.1328125, 0.01416015625, 0.1611328125, 0.30810546875, 0.455078125, 0.60205078125, 0.7490234375, 0.89599609375, 1.04296875, 1.18994140625, 1.3369140625, 1.48388671875, 1.630859375, 1.77783203125, 1.9248046875, 2.07177734375, 2.21875, 2.36572265625, 2.5126953125, 2.65966796875, 2.806640625, 2.95361328125, 3.1005859375, 3.24755859375, 3.39453125, 3.54150390625, 3.6884765625, 3.83544921875, 3.982421875, 4.12939453125, 4.2763671875, 4.42333984375, 4.5703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 3.0, 6.0, 12.0, 15.0, 17.0, 23.0, 25.0, 27.0, 44.0, 65.0, 71.0, 130.0, 243.0, 586.0, 1698.0, 497.0, 207.0, 125.0, 85.0, 39.0, 37.0, 33.0, 16.0, 14.0, 11.0, 7.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3798828125, -1.334503173828125, -1.28912353515625, -1.243743896484375, -1.1983642578125, -1.152984619140625, -1.10760498046875, -1.062225341796875, -1.016845703125, -0.971466064453125, -0.92608642578125, -0.880706787109375, -0.8353271484375, -0.789947509765625, -0.74456787109375, -0.699188232421875, -0.65380859375, -0.608428955078125, -0.56304931640625, -0.517669677734375, -0.4722900390625, -0.426910400390625, -0.38153076171875, -0.336151123046875, -0.290771484375, -0.245391845703125, -0.20001220703125, -0.154632568359375, -0.1092529296875, -0.063873291015625, -0.01849365234375, 0.026885986328125, 0.072265625, 0.117645263671875, 0.16302490234375, 0.208404541015625, 0.2537841796875, 0.299163818359375, 0.34454345703125, 0.389923095703125, 0.435302734375, 0.480682373046875, 0.52606201171875, 0.571441650390625, 0.6168212890625, 0.662200927734375, 0.70758056640625, 0.752960205078125, 0.79833984375, 0.843719482421875, 0.88909912109375, 0.934478759765625, 0.9798583984375, 1.025238037109375, 1.07061767578125, 1.115997314453125, 1.161376953125, 1.206756591796875, 1.25213623046875, 1.297515869140625, 1.3428955078125, 1.388275146484375, 1.43365478515625, 1.479034423828125, 1.5244140625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 8.0, 10.0, 31.0, 81.0, 257.0, 406.0, 152.0, 44.0, 11.0, 8.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-45.8751106262207, -45.02976989746094, -44.18443298339844, -43.33909225463867, -42.493751525878906, -41.64841079711914, -40.80307388305664, -39.957733154296875, -39.11239242553711, -38.267051696777344, -37.421714782714844, -36.57637405395508, -35.73103332519531, -34.88569259643555, -34.04035568237305, -33.19501495361328, -32.349674224853516, -31.504335403442383, -30.658994674682617, -29.813655853271484, -28.96831512451172, -28.122976303100586, -27.27763557434082, -26.432296752929688, -25.586957931518555, -24.741619110107422, -23.896278381347656, -23.050939559936523, -22.205598831176758, -21.360260009765625, -20.51491928100586, -19.669580459594727, -18.82423973083496, -17.978900909423828, -17.133560180664062, -16.28822135925293, -15.442880630493164, -14.597541809082031, -13.752201080322266, -12.906862258911133, -12.061521530151367, -11.216181755065918, -10.370841979980469, -9.52550220489502, -8.68016242980957, -7.834823131561279, -6.98948335647583, -6.144143581390381, -5.29880428314209, -4.453464508056641, -3.6081247329711914, -2.7627851963043213, -1.917445421218872, -1.072105884552002, -0.22676610946655273, 0.6185736656188965, 1.4639134407043457, 2.309253215789795, 3.154592990875244, 3.9999325275421143, 4.845272064208984, 5.690611839294434, 6.535951614379883, 7.381291389465332, 8.226631164550781]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 6.0, 14.0, 9.0, 11.0, 20.0, 26.0, 32.0, 30.0, 65.0, 57.0, 58.0, 76.0, 80.0, 76.0, 88.0, 62.0, 64.0, 58.0, 49.0, 33.0, 24.0, 24.0, 16.0, 12.0, 4.0, 7.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.994332313537598, -9.76247787475586, -9.530624389648438, -9.2987699508667, -9.066915512084961, -8.835062026977539, -8.6032075881958, -8.371353149414062, -8.13949966430664, -7.9076457023620605, -7.675791263580322, -7.443937301635742, -7.212082862854004, -6.980228900909424, -6.748374938964844, -6.5165205001831055, -6.284666061401367, -6.052812099456787, -5.820957660675049, -5.589103698730469, -5.3572492599487305, -5.12539529800415, -4.89354133605957, -4.661686897277832, -4.429832935333252, -4.197978973388672, -3.9661245346069336, -3.7342705726623535, -3.5024163722991943, -3.270562171936035, -3.038708209991455, -2.806854009628296, -2.5749998092651367, -2.3431456089019775, -2.1112914085388184, -1.8794374465942383, -1.647583246231079, -1.41572904586792, -1.1838749647140503, -0.9520208835601807, -0.7201666831970215, -0.4883125424385071, -0.2564584016799927, -0.02460426092147827, 0.20724987983703613, 0.4391040802001953, 0.6709581613540649, 0.9028122425079346, 1.1346664428710938, 1.366520643234253, 1.5983747243881226, 1.8302288055419922, 2.0620830059051514, 2.2939372062683105, 2.5257911682128906, 2.75764536857605, 2.989499568939209, 3.221353769302368, 3.4532079696655273, 3.6850619316101074, 3.9169161319732666, 4.148770332336426, 4.380624294281006, 4.612478256225586, 4.844332695007324]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 11.0, 15.0, 37.0, 34.0, 49.0, 95.0, 124.0, 169.0, 306.0, 453.0, 734.0, 1227.0, 2001.0, 3342.0, 5788.0, 10401.0, 19630.0, 41715.0, 842582.0, 65840.0, 24479.0, 12463.0, 6897.0, 3926.0, 2402.0, 1440.0, 867.0, 534.0, 345.0, 230.0, 148.0, 88.0, 54.0, 45.0, 23.0, 18.0, 14.0, 14.0, 3.0, 6.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.783203125, -2.695281982421875, -2.60736083984375, -2.519439697265625, -2.4315185546875, -2.343597412109375, -2.25567626953125, -2.167755126953125, -2.079833984375, -1.991912841796875, -1.90399169921875, -1.816070556640625, -1.7281494140625, -1.640228271484375, -1.55230712890625, -1.464385986328125, -1.37646484375, -1.288543701171875, -1.20062255859375, -1.112701416015625, -1.0247802734375, -0.936859130859375, -0.84893798828125, -0.761016845703125, -0.673095703125, -0.585174560546875, -0.49725341796875, -0.409332275390625, -0.3214111328125, -0.233489990234375, -0.14556884765625, -0.057647705078125, 0.0302734375, 0.118194580078125, 0.20611572265625, 0.294036865234375, 0.3819580078125, 0.469879150390625, 0.55780029296875, 0.645721435546875, 0.733642578125, 0.821563720703125, 0.90948486328125, 0.997406005859375, 1.0853271484375, 1.173248291015625, 1.26116943359375, 1.349090576171875, 1.43701171875, 1.524932861328125, 1.61285400390625, 1.700775146484375, 1.7886962890625, 1.876617431640625, 1.96453857421875, 2.052459716796875, 2.140380859375, 2.228302001953125, 2.31622314453125, 2.404144287109375, 2.4920654296875, 2.579986572265625, 2.66790771484375, 2.755828857421875, 2.84375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 5.0, 2.0, 6.0, 6.0, 5.0, 6.0, 9.0, 13.0, 9.0, 39.0, 267.0, 432.0, 79.0, 16.0, 17.0, 15.0, 9.0, 6.0, 5.0, 5.0, 8.0, 4.0, 6.0, 2.0, 7.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.1845703125, -1.1499176025390625, -1.115264892578125, -1.0806121826171875, -1.04595947265625, -1.0113067626953125, -0.976654052734375, -0.9420013427734375, -0.9073486328125, -0.8726959228515625, -0.838043212890625, -0.8033905029296875, -0.76873779296875, -0.7340850830078125, -0.699432373046875, -0.6647796630859375, -0.630126953125, -0.5954742431640625, -0.560821533203125, -0.5261688232421875, -0.49151611328125, -0.4568634033203125, -0.422210693359375, -0.3875579833984375, -0.3529052734375, -0.3182525634765625, -0.283599853515625, -0.2489471435546875, -0.21429443359375, -0.1796417236328125, -0.144989013671875, -0.1103363037109375, -0.07568359375, -0.0410308837890625, -0.006378173828125, 0.0282745361328125, 0.06292724609375, 0.0975799560546875, 0.132232666015625, 0.1668853759765625, 0.2015380859375, 0.2361907958984375, 0.270843505859375, 0.3054962158203125, 0.34014892578125, 0.3748016357421875, 0.409454345703125, 0.4441070556640625, 0.478759765625, 0.5134124755859375, 0.548065185546875, 0.5827178955078125, 0.61737060546875, 0.6520233154296875, 0.686676025390625, 0.7213287353515625, 0.7559814453125, 0.7906341552734375, 0.825286865234375, 0.8599395751953125, 0.89459228515625, 0.9292449951171875, 0.963897705078125, 0.9985504150390625, 1.033203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 6.0, 3.0, 10.0, 8.0, 21.0, 22.0, 26.0, 25.0, 36.0, 51.0, 57.0, 92.0, 153.0, 240.0, 353.0, 598.0, 1090.0, 2185.0, 5202.0, 13627.0, 42560.0, 151411.0, 443777.0, 274168.0, 75378.0, 22725.0, 7850.0, 3242.0, 1493.0, 746.0, 477.0, 286.0, 185.0, 123.0, 68.0, 66.0, 45.0, 21.0, 22.0, 29.0, 18.0, 15.0, 14.0, 6.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.658203125, -2.574432373046875, -2.49066162109375, -2.406890869140625, -2.3231201171875, -2.239349365234375, -2.15557861328125, -2.071807861328125, -1.988037109375, -1.904266357421875, -1.82049560546875, -1.736724853515625, -1.6529541015625, -1.569183349609375, -1.48541259765625, -1.401641845703125, -1.31787109375, -1.234100341796875, -1.15032958984375, -1.066558837890625, -0.9827880859375, -0.899017333984375, -0.81524658203125, -0.731475830078125, -0.647705078125, -0.563934326171875, -0.48016357421875, -0.396392822265625, -0.3126220703125, -0.228851318359375, -0.14508056640625, -0.061309814453125, 0.0224609375, 0.106231689453125, 0.19000244140625, 0.273773193359375, 0.3575439453125, 0.441314697265625, 0.52508544921875, 0.608856201171875, 0.692626953125, 0.776397705078125, 0.86016845703125, 0.943939208984375, 1.0277099609375, 1.111480712890625, 1.19525146484375, 1.279022216796875, 1.36279296875, 1.446563720703125, 1.53033447265625, 1.614105224609375, 1.6978759765625, 1.781646728515625, 1.86541748046875, 1.949188232421875, 2.032958984375, 2.116729736328125, 2.20050048828125, 2.284271240234375, 2.3680419921875, 2.451812744140625, 2.53558349609375, 2.619354248046875, 2.703125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 2.0, 6.0, 5.0, 5.0, 11.0, 12.0, 10.0, 21.0, 18.0, 11.0, 26.0, 26.0, 24.0, 39.0, 42.0, 34.0, 32.0, 38.0, 47.0, 49.0, 44.0, 52.0, 47.0, 44.0, 31.0, 33.0, 31.0, 42.0, 31.0, 28.0, 20.0, 26.0, 21.0, 12.0, 18.0, 9.0, 11.0, 7.0, 11.0, 8.0, 2.0, 9.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.42578125, -4.290771484375, -4.15576171875, -4.020751953125, -3.8857421875, -3.750732421875, -3.61572265625, -3.480712890625, -3.345703125, -3.210693359375, -3.07568359375, -2.940673828125, -2.8056640625, -2.670654296875, -2.53564453125, -2.400634765625, -2.265625, -2.130615234375, -1.99560546875, -1.860595703125, -1.7255859375, -1.590576171875, -1.45556640625, -1.320556640625, -1.185546875, -1.050537109375, -0.91552734375, -0.780517578125, -0.6455078125, -0.510498046875, -0.37548828125, -0.240478515625, -0.10546875, 0.029541015625, 0.16455078125, 0.299560546875, 0.4345703125, 0.569580078125, 0.70458984375, 0.839599609375, 0.974609375, 1.109619140625, 1.24462890625, 1.379638671875, 1.5146484375, 1.649658203125, 1.78466796875, 1.919677734375, 2.0546875, 2.189697265625, 2.32470703125, 2.459716796875, 2.5947265625, 2.729736328125, 2.86474609375, 2.999755859375, 3.134765625, 3.269775390625, 3.40478515625, 3.539794921875, 3.6748046875, 3.809814453125, 3.94482421875, 4.079833984375, 4.21484375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 7.0, 3.0, 8.0, 12.0, 13.0, 12.0, 20.0, 38.0, 66.0, 79.0, 126.0, 197.0, 371.0, 621.0, 1067.0, 2076.0, 4416.0, 11275.0, 37633.0, 197228.0, 603119.0, 142674.0, 29934.0, 9459.0, 3836.0, 1895.0, 983.0, 518.0, 320.0, 179.0, 113.0, 74.0, 52.0, 36.0, 28.0, 19.0, 18.0, 10.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.919921875, -3.809234619140625, -3.69854736328125, -3.587860107421875, -3.4771728515625, -3.366485595703125, -3.25579833984375, -3.145111083984375, -3.034423828125, -2.923736572265625, -2.81304931640625, -2.702362060546875, -2.5916748046875, -2.480987548828125, -2.37030029296875, -2.259613037109375, -2.14892578125, -2.038238525390625, -1.92755126953125, -1.816864013671875, -1.7061767578125, -1.595489501953125, -1.48480224609375, -1.374114990234375, -1.263427734375, -1.152740478515625, -1.04205322265625, -0.931365966796875, -0.8206787109375, -0.709991455078125, -0.59930419921875, -0.488616943359375, -0.3779296875, -0.267242431640625, -0.15655517578125, -0.045867919921875, 0.0648193359375, 0.175506591796875, 0.28619384765625, 0.396881103515625, 0.507568359375, 0.618255615234375, 0.72894287109375, 0.839630126953125, 0.9503173828125, 1.061004638671875, 1.17169189453125, 1.282379150390625, 1.39306640625, 1.503753662109375, 1.61444091796875, 1.725128173828125, 1.8358154296875, 1.946502685546875, 2.05718994140625, 2.167877197265625, 2.278564453125, 2.389251708984375, 2.49993896484375, 2.610626220703125, 2.7213134765625, 2.832000732421875, 2.94268798828125, 3.053375244140625, 3.1640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 6.0, 11.0, 17.0, 13.0, 17.0, 21.0, 24.0, 34.0, 43.0, 56.0, 68.0, 81.0, 81.0, 73.0, 74.0, 72.0, 79.0, 42.0, 34.0, 34.0, 32.0, 23.0, 9.0, 12.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0001895427703857422, -0.0001845918595790863, -0.00017964094877243042, -0.00017469003796577454, -0.00016973912715911865, -0.00016478821635246277, -0.00015983730554580688, -0.000154886394739151, -0.00014993548393249512, -0.00014498457312583923, -0.00014003366231918335, -0.00013508275151252747, -0.00013013184070587158, -0.0001251809298992157, -0.00012023001909255981, -0.00011527910828590393, -0.00011032819747924805, -0.00010537728667259216, -0.00010042637586593628, -9.54754650592804e-05, -9.052455425262451e-05, -8.557364344596863e-05, -8.062273263931274e-05, -7.567182183265686e-05, -7.072091102600098e-05, -6.577000021934509e-05, -6.081908941268921e-05, -5.5868178606033325e-05, -5.091726779937744e-05, -4.596635699272156e-05, -4.1015446186065674e-05, -3.606453537940979e-05, -3.1113624572753906e-05, -2.6162713766098022e-05, -2.121180295944214e-05, -1.6260892152786255e-05, -1.1309981346130371e-05, -6.359070539474487e-06, -1.4081597328186035e-06, 3.5427510738372803e-06, 8.493661880493164e-06, 1.3444572687149048e-05, 1.839548349380493e-05, 2.3346394300460815e-05, 2.82973051071167e-05, 3.324821591377258e-05, 3.819912672042847e-05, 4.315003752708435e-05, 4.8100948333740234e-05, 5.305185914039612e-05, 5.8002769947052e-05, 6.295368075370789e-05, 6.790459156036377e-05, 7.285550236701965e-05, 7.780641317367554e-05, 8.275732398033142e-05, 8.77082347869873e-05, 9.265914559364319e-05, 9.761005640029907e-05, 0.00010256096720695496, 0.00010751187801361084, 0.00011246278882026672, 0.00011741369962692261, 0.0001223646104335785, 0.00012731552124023438]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 14.0, 16.0, 21.0, 25.0, 31.0, 70.0, 114.0, 169.0, 277.0, 562.0, 1099.0, 2330.0, 6177.0, 20211.0, 114589.0, 680716.0, 181395.0, 27453.0, 7601.0, 2918.0, 1266.0, 594.0, 338.0, 213.0, 114.0, 74.0, 46.0, 38.0, 23.0, 10.0, 14.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.8984375, -4.73297119140625, -4.5675048828125, -4.40203857421875, -4.236572265625, -4.07110595703125, -3.9056396484375, -3.74017333984375, -3.57470703125, -3.40924072265625, -3.2437744140625, -3.07830810546875, -2.912841796875, -2.74737548828125, -2.5819091796875, -2.41644287109375, -2.2509765625, -2.08551025390625, -1.9200439453125, -1.75457763671875, -1.589111328125, -1.42364501953125, -1.2581787109375, -1.09271240234375, -0.92724609375, -0.76177978515625, -0.5963134765625, -0.43084716796875, -0.265380859375, -0.09991455078125, 0.0655517578125, 0.23101806640625, 0.396484375, 0.56195068359375, 0.7274169921875, 0.89288330078125, 1.058349609375, 1.22381591796875, 1.3892822265625, 1.55474853515625, 1.72021484375, 1.88568115234375, 2.0511474609375, 2.21661376953125, 2.382080078125, 2.54754638671875, 2.7130126953125, 2.87847900390625, 3.0439453125, 3.20941162109375, 3.3748779296875, 3.54034423828125, 3.705810546875, 3.87127685546875, 4.0367431640625, 4.20220947265625, 4.36767578125, 4.53314208984375, 4.6986083984375, 4.86407470703125, 5.029541015625, 5.19500732421875, 5.3604736328125, 5.52593994140625, 5.69140625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 2.0, 9.0, 9.0, 12.0, 18.0, 32.0, 32.0, 44.0, 56.0, 60.0, 73.0, 94.0, 92.0, 83.0, 85.0, 71.0, 53.0, 47.0, 38.0, 14.0, 18.0, 14.0, 10.0, 5.0, 9.0, 5.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9453125, -2.8546142578125, -2.763916015625, -2.6732177734375, -2.58251953125, -2.4918212890625, -2.401123046875, -2.3104248046875, -2.2197265625, -2.1290283203125, -2.038330078125, -1.9476318359375, -1.85693359375, -1.7662353515625, -1.675537109375, -1.5848388671875, -1.494140625, -1.4034423828125, -1.312744140625, -1.2220458984375, -1.13134765625, -1.0406494140625, -0.949951171875, -0.8592529296875, -0.7685546875, -0.6778564453125, -0.587158203125, -0.4964599609375, -0.40576171875, -0.3150634765625, -0.224365234375, -0.1336669921875, -0.04296875, 0.0477294921875, 0.138427734375, 0.2291259765625, 0.31982421875, 0.4105224609375, 0.501220703125, 0.5919189453125, 0.6826171875, 0.7733154296875, 0.864013671875, 0.9547119140625, 1.04541015625, 1.1361083984375, 1.226806640625, 1.3175048828125, 1.408203125, 1.4989013671875, 1.589599609375, 1.6802978515625, 1.77099609375, 1.8616943359375, 1.952392578125, 2.0430908203125, 2.1337890625, 2.2244873046875, 2.315185546875, 2.4058837890625, 2.49658203125, 2.5872802734375, 2.677978515625, 2.7686767578125, 2.859375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 7.0, 9.0, 19.0, 119.0, 387.0, 351.0, 69.0, 23.0, 13.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.05615234375, -124.77410125732422, -121.49205017089844, -118.20999908447266, -114.92794799804688, -111.6458969116211, -108.36384582519531, -105.08180236816406, -101.79974365234375, -98.51769256591797, -95.23564147949219, -91.9535903930664, -88.67153930664062, -85.38948822021484, -82.10743713378906, -78.82539367675781, -75.54334259033203, -72.26129150390625, -68.97924041748047, -65.69718933105469, -62.415138244628906, -59.133087158203125, -55.85103988647461, -52.56898880004883, -49.28693771362305, -46.004886627197266, -42.722835540771484, -39.44078826904297, -36.15873718261719, -32.876686096191406, -29.594635009765625, -26.312583923339844, -23.03052520751953, -19.74847412109375, -16.46642303466797, -13.18437385559082, -9.902322769165039, -6.620271682739258, -3.3382225036621094, -0.056171417236328125, 3.225879669189453, 6.507930278778076, 9.7899808883667, 13.072031021118164, 16.354082107543945, 19.636133193969727, 22.918182373046875, 26.200233459472656, 29.482284545898438, 32.76433563232422, 36.04638671875, 39.32843780517578, 42.61048889160156, 45.892539978027344, 49.17458724975586, 52.45663833618164, 55.73868942260742, 59.0207405090332, 62.302791595458984, 65.5848388671875, 68.86688995361328, 72.14894104003906, 75.43099212646484, 78.71304321289062, 81.9950942993164]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 4.0, 3.0, 3.0, 10.0, 8.0, 21.0, 17.0, 20.0, 40.0, 77.0, 136.0, 166.0, 165.0, 106.0, 75.0, 46.0, 21.0, 14.0, 10.0, 9.0, 6.0, 4.0, 6.0, 6.0, 3.0, 4.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.16860961914062, -82.4225082397461, -79.6764144897461, -76.93031311035156, -74.18421173095703, -71.4381103515625, -68.6920166015625, -65.94591522216797, -63.1998176574707, -60.45372009277344, -57.707618713378906, -54.96152114868164, -52.215423583984375, -49.469322204589844, -46.72322463989258, -43.97712707519531, -41.23102569580078, -38.484928131103516, -35.738826751708984, -32.99272918701172, -30.24662971496582, -27.500530242919922, -24.754432678222656, -22.008333206176758, -19.26223373413086, -16.51613426208496, -13.770035743713379, -11.023937225341797, -8.277837753295898, -5.53173828125, -2.7856407165527344, -0.03954124450683594, 2.7065582275390625, 5.452657222747803, 8.198756217956543, 10.944854736328125, 13.690954208374023, 16.437053680419922, 19.183151245117188, 21.929250717163086, 24.675350189208984, 27.421449661254883, 30.16754913330078, 32.91364669799805, 35.65974426269531, 38.405845642089844, 41.15194320678711, 43.898040771484375, 46.644142150878906, 49.39023971557617, 52.1363410949707, 54.88243865966797, 57.6285400390625, 60.374637603759766, 63.12073516845703, 65.86683654785156, 68.61293029785156, 71.3590316772461, 74.1051254272461, 76.85122680664062, 79.59732818603516, 82.34342956542969, 85.08952331542969, 87.83562469482422, 90.58172607421875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 2.0, 3.0, 8.0, 5.0, 15.0, 7.0, 14.0, 25.0, 22.0, 34.0, 45.0, 66.0, 108.0, 158.0, 270.0, 397.0, 576.0, 1021.0, 1697.0, 2898.0, 5414.0, 11188.0, 30755.0, 253543.0, 3799917.0, 51803.0, 16715.0, 7711.0, 3936.0, 2158.0, 1326.0, 790.0, 538.0, 374.0, 239.0, 149.0, 104.0, 65.0, 44.0, 38.0, 34.0, 21.0, 12.0, 13.0, 9.0, 8.0, 5.0, 1.0, 1.0, 0.0, 4.0, 0.0, 5.0, 1.0, 0.0, 1.0], "bins": [-8.8671875, -8.5916748046875, -8.316162109375, -8.0406494140625, -7.76513671875, -7.4896240234375, -7.214111328125, -6.9385986328125, -6.6630859375, -6.3875732421875, -6.112060546875, -5.8365478515625, -5.56103515625, -5.2855224609375, -5.010009765625, -4.7344970703125, -4.458984375, -4.1834716796875, -3.907958984375, -3.6324462890625, -3.35693359375, -3.0814208984375, -2.805908203125, -2.5303955078125, -2.2548828125, -1.9793701171875, -1.703857421875, -1.4283447265625, -1.15283203125, -0.8773193359375, -0.601806640625, -0.3262939453125, -0.05078125, 0.2247314453125, 0.500244140625, 0.7757568359375, 1.05126953125, 1.3267822265625, 1.602294921875, 1.8778076171875, 2.1533203125, 2.4288330078125, 2.704345703125, 2.9798583984375, 3.25537109375, 3.5308837890625, 3.806396484375, 4.0819091796875, 4.357421875, 4.6329345703125, 4.908447265625, 5.1839599609375, 5.45947265625, 5.7349853515625, 6.010498046875, 6.2860107421875, 6.5615234375, 6.8370361328125, 7.112548828125, 7.3880615234375, 7.66357421875, 7.9390869140625, 8.214599609375, 8.4901123046875, 8.765625]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 4.0, 8.0, 10.0, 13.0, 13.0, 16.0, 33.0, 166.0, 355.0, 233.0, 40.0, 17.0, 16.0, 19.0, 11.0, 9.0, 10.0, 5.0, 6.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0234375, -0.9878082275390625, -0.952178955078125, -0.9165496826171875, -0.88092041015625, -0.8452911376953125, -0.809661865234375, -0.7740325927734375, -0.7384033203125, -0.7027740478515625, -0.667144775390625, -0.6315155029296875, -0.59588623046875, -0.5602569580078125, -0.524627685546875, -0.4889984130859375, -0.453369140625, -0.4177398681640625, -0.382110595703125, -0.3464813232421875, -0.31085205078125, -0.2752227783203125, -0.239593505859375, -0.2039642333984375, -0.1683349609375, -0.1327056884765625, -0.097076416015625, -0.0614471435546875, -0.02581787109375, 0.0098114013671875, 0.045440673828125, 0.0810699462890625, 0.11669921875, 0.1523284912109375, 0.187957763671875, 0.2235870361328125, 0.25921630859375, 0.2948455810546875, 0.330474853515625, 0.3661041259765625, 0.4017333984375, 0.4373626708984375, 0.472991943359375, 0.5086212158203125, 0.54425048828125, 0.5798797607421875, 0.615509033203125, 0.6511383056640625, 0.686767578125, 0.7223968505859375, 0.758026123046875, 0.7936553955078125, 0.82928466796875, 0.8649139404296875, 0.900543212890625, 0.9361724853515625, 0.9718017578125, 1.0074310302734375, 1.043060302734375, 1.0786895751953125, 1.11431884765625, 1.1499481201171875, 1.185577392578125, 1.2212066650390625, 1.2568359375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 11.0, 8.0, 11.0, 13.0, 25.0, 29.0, 57.0, 83.0, 130.0, 252.0, 543.0, 1048.0, 2187.0, 5142.0, 12458.0, 37983.0, 171197.0, 3484788.0, 387658.0, 59620.0, 18455.0, 6892.0, 2871.0, 1259.0, 652.0, 373.0, 171.0, 108.0, 78.0, 49.0, 42.0, 23.0, 14.0, 18.0, 9.0, 5.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6640625, -8.4141845703125, -8.164306640625, -7.9144287109375, -7.66455078125, -7.4146728515625, -7.164794921875, -6.9149169921875, -6.6650390625, -6.4151611328125, -6.165283203125, -5.9154052734375, -5.66552734375, -5.4156494140625, -5.165771484375, -4.9158935546875, -4.666015625, -4.4161376953125, -4.166259765625, -3.9163818359375, -3.66650390625, -3.4166259765625, -3.166748046875, -2.9168701171875, -2.6669921875, -2.4171142578125, -2.167236328125, -1.9173583984375, -1.66748046875, -1.4176025390625, -1.167724609375, -0.9178466796875, -0.66796875, -0.4180908203125, -0.168212890625, 0.0816650390625, 0.33154296875, 0.5814208984375, 0.831298828125, 1.0811767578125, 1.3310546875, 1.5809326171875, 1.830810546875, 2.0806884765625, 2.33056640625, 2.5804443359375, 2.830322265625, 3.0802001953125, 3.330078125, 3.5799560546875, 3.829833984375, 4.0797119140625, 4.32958984375, 4.5794677734375, 4.829345703125, 5.0792236328125, 5.3291015625, 5.5789794921875, 5.828857421875, 6.0787353515625, 6.32861328125, 6.5784912109375, 6.828369140625, 7.0782470703125, 7.328125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 6.0, 11.0, 7.0, 12.0, 12.0, 23.0, 29.0, 36.0, 47.0, 51.0, 59.0, 101.0, 163.0, 246.0, 536.0, 1459.0, 415.0, 233.0, 151.0, 104.0, 67.0, 67.0, 43.0, 33.0, 22.0, 22.0, 20.0, 13.0, 6.0, 11.0, 9.0, 8.0, 9.0, 3.0, 3.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.87158203125, -0.845458984375, -0.8193359375, -0.793212890625, -0.76708984375, -0.740966796875, -0.71484375, -0.688720703125, -0.66259765625, -0.636474609375, -0.6103515625, -0.584228515625, -0.55810546875, -0.531982421875, -0.505859375, -0.479736328125, -0.45361328125, -0.427490234375, -0.4013671875, -0.375244140625, -0.34912109375, -0.322998046875, -0.296875, -0.270751953125, -0.24462890625, -0.218505859375, -0.1923828125, -0.166259765625, -0.14013671875, -0.114013671875, -0.087890625, -0.061767578125, -0.03564453125, -0.009521484375, 0.0166015625, 0.042724609375, 0.06884765625, 0.094970703125, 0.12109375, 0.147216796875, 0.17333984375, 0.199462890625, 0.2255859375, 0.251708984375, 0.27783203125, 0.303955078125, 0.330078125, 0.356201171875, 0.38232421875, 0.408447265625, 0.4345703125, 0.460693359375, 0.48681640625, 0.512939453125, 0.5390625, 0.565185546875, 0.59130859375, 0.617431640625, 0.6435546875, 0.669677734375, 0.69580078125, 0.721923828125, 0.748046875, 0.774169921875, 0.80029296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 6.0, 11.0, 84.0, 482.0, 324.0, 69.0, 16.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.853595733642578, -13.966403007507324, -13.079211235046387, -12.192018508911133, -11.304826736450195, -10.417634010314941, -9.530441284179688, -8.64324951171875, -7.756056785583496, -6.8688645362854, -5.981672286987305, -5.094479560852051, -4.207287311553955, -3.3200950622558594, -2.4329023361206055, -1.5457100868225098, -0.6585178375244141, 0.2286745309829712, 1.1158668994903564, 2.0030593872070312, 2.890251636505127, 3.7774438858032227, 4.664636611938477, 5.551828861236572, 6.439021110534668, 7.326213359832764, 8.21340560913086, 9.100598335266113, 9.987791061401367, 10.874982833862305, 11.762175559997559, 12.649368286132812, 13.53656005859375, 14.423752784729004, 15.310944557189941, 16.198137283325195, 17.085329055786133, 17.972522735595703, 18.85971450805664, 19.746906280517578, 20.634098052978516, 21.521289825439453, 22.408483505249023, 23.29567527770996, 24.1828670501709, 25.07006072998047, 25.957252502441406, 26.844444274902344, 27.731637954711914, 28.61882972717285, 29.506023406982422, 30.39321517944336, 31.280406951904297, 32.167598724365234, 33.05479431152344, 33.941986083984375, 34.82917785644531, 35.71636962890625, 36.60356140136719, 37.490753173828125, 38.37794876098633, 39.265140533447266, 40.1523323059082, 41.03952407836914, 41.92671585083008]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 13.0, 11.0, 9.0, 17.0, 27.0, 22.0, 30.0, 38.0, 54.0, 45.0, 61.0, 57.0, 49.0, 73.0, 68.0, 64.0, 66.0, 51.0, 42.0, 33.0, 26.0, 27.0, 27.0, 21.0, 11.0, 12.0, 9.0, 8.0, 11.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.310943603515625, -5.1390461921691895, -4.967148780822754, -4.795251846313477, -4.623354434967041, -4.4514570236206055, -4.27955961227417, -4.107662200927734, -3.935765266418457, -3.7638678550720215, -3.591970682144165, -3.4200732707977295, -3.248176097869873, -3.0762786865234375, -2.904381275177002, -2.7324841022491455, -2.56058669090271, -2.3886892795562744, -2.216792106628418, -2.0448946952819824, -1.872997522354126, -1.7011001110076904, -1.5292028188705444, -1.3573055267333984, -1.1854082345962524, -1.0135109424591064, -0.8416136503219604, -0.6697162985801697, -0.4978190064430237, -0.3259217143058777, -0.15402436256408691, 0.017872929573059082, 0.18977022171020508, 0.3616675138473511, 0.5335648059844971, 0.7054621577262878, 0.8773594498634338, 1.0492568016052246, 1.2211540937423706, 1.3930513858795166, 1.5649486780166626, 1.7368459701538086, 1.9087432622909546, 2.0806405544281006, 2.252537965774536, 2.4244351387023926, 2.596332550048828, 2.7682299613952637, 2.94012713432312, 3.1120245456695557, 3.283921718597412, 3.4558191299438477, 3.627716302871704, 3.7996137142181396, 3.971510887145996, 4.143408298492432, 4.315305709838867, 4.487203121185303, 4.659100532531738, 4.830997467041016, 5.002894878387451, 5.174792289733887, 5.346689701080322, 5.518587112426758, 5.690484046936035]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 9.0, 14.0, 6.0, 11.0, 17.0, 19.0, 29.0, 51.0, 70.0, 93.0, 181.0, 219.0, 313.0, 555.0, 934.0, 1545.0, 3187.0, 7014.0, 19173.0, 71997.0, 805148.0, 99823.0, 22106.0, 8216.0, 3447.0, 1752.0, 970.0, 538.0, 346.0, 257.0, 160.0, 92.0, 63.0, 53.0, 33.0, 20.0, 23.0, 12.0, 13.0, 8.0, 5.0, 7.0, 6.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.0078125, -5.811279296875, -5.61474609375, -5.418212890625, -5.2216796875, -5.025146484375, -4.82861328125, -4.632080078125, -4.435546875, -4.239013671875, -4.04248046875, -3.845947265625, -3.6494140625, -3.452880859375, -3.25634765625, -3.059814453125, -2.86328125, -2.666748046875, -2.47021484375, -2.273681640625, -2.0771484375, -1.880615234375, -1.68408203125, -1.487548828125, -1.291015625, -1.094482421875, -0.89794921875, -0.701416015625, -0.5048828125, -0.308349609375, -0.11181640625, 0.084716796875, 0.28125, 0.477783203125, 0.67431640625, 0.870849609375, 1.0673828125, 1.263916015625, 1.46044921875, 1.656982421875, 1.853515625, 2.050048828125, 2.24658203125, 2.443115234375, 2.6396484375, 2.836181640625, 3.03271484375, 3.229248046875, 3.42578125, 3.622314453125, 3.81884765625, 4.015380859375, 4.2119140625, 4.408447265625, 4.60498046875, 4.801513671875, 4.998046875, 5.194580078125, 5.39111328125, 5.587646484375, 5.7841796875, 5.980712890625, 6.17724609375, 6.373779296875, 6.5703125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 6.0, 7.0, 5.0, 8.0, 15.0, 29.0, 73.0, 175.0, 324.0, 191.0, 61.0, 19.0, 14.0, 17.0, 17.0, 11.0, 8.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.0247039794921875, -0.988861083984375, -0.9530181884765625, -0.91717529296875, -0.8813323974609375, -0.845489501953125, -0.8096466064453125, -0.7738037109375, -0.7379608154296875, -0.702117919921875, -0.6662750244140625, -0.63043212890625, -0.5945892333984375, -0.558746337890625, -0.5229034423828125, -0.487060546875, -0.4512176513671875, -0.415374755859375, -0.3795318603515625, -0.34368896484375, -0.3078460693359375, -0.272003173828125, -0.2361602783203125, -0.2003173828125, -0.1644744873046875, -0.128631591796875, -0.0927886962890625, -0.05694580078125, -0.0211029052734375, 0.014739990234375, 0.0505828857421875, 0.08642578125, 0.1222686767578125, 0.158111572265625, 0.1939544677734375, 0.22979736328125, 0.2656402587890625, 0.301483154296875, 0.3373260498046875, 0.3731689453125, 0.4090118408203125, 0.444854736328125, 0.4806976318359375, 0.51654052734375, 0.5523834228515625, 0.588226318359375, 0.6240692138671875, 0.659912109375, 0.6957550048828125, 0.731597900390625, 0.7674407958984375, 0.80328369140625, 0.8391265869140625, 0.874969482421875, 0.9108123779296875, 0.9466552734375, 0.9824981689453125, 1.018341064453125, 1.0541839599609375, 1.09002685546875, 1.1258697509765625, 1.161712646484375, 1.1975555419921875, 1.2333984375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 9.0, 5.0, 11.0, 16.0, 20.0, 26.0, 47.0, 56.0, 95.0, 146.0, 251.0, 433.0, 855.0, 1726.0, 3815.0, 10514.0, 38926.0, 236856.0, 590091.0, 127067.0, 24145.0, 7500.0, 3005.0, 1325.0, 655.0, 386.0, 183.0, 122.0, 109.0, 57.0, 31.0, 16.0, 23.0, 11.0, 1.0, 8.0, 8.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8203125, -4.67572021484375, -4.5311279296875, -4.38653564453125, -4.241943359375, -4.09735107421875, -3.9527587890625, -3.80816650390625, -3.66357421875, -3.51898193359375, -3.3743896484375, -3.22979736328125, -3.085205078125, -2.94061279296875, -2.7960205078125, -2.65142822265625, -2.5068359375, -2.36224365234375, -2.2176513671875, -2.07305908203125, -1.928466796875, -1.78387451171875, -1.6392822265625, -1.49468994140625, -1.35009765625, -1.20550537109375, -1.0609130859375, -0.91632080078125, -0.771728515625, -0.62713623046875, -0.4825439453125, -0.33795166015625, -0.193359375, -0.04876708984375, 0.0958251953125, 0.24041748046875, 0.385009765625, 0.52960205078125, 0.6741943359375, 0.81878662109375, 0.96337890625, 1.10797119140625, 1.2525634765625, 1.39715576171875, 1.541748046875, 1.68634033203125, 1.8309326171875, 1.97552490234375, 2.1201171875, 2.26470947265625, 2.4093017578125, 2.55389404296875, 2.698486328125, 2.84307861328125, 2.9876708984375, 3.13226318359375, 3.27685546875, 3.42144775390625, 3.5660400390625, 3.71063232421875, 3.855224609375, 3.99981689453125, 4.1444091796875, 4.28900146484375, 4.43359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 8.0, 10.0, 10.0, 14.0, 4.0, 11.0, 17.0, 22.0, 28.0, 26.0, 28.0, 36.0, 42.0, 30.0, 48.0, 44.0, 45.0, 55.0, 49.0, 51.0, 53.0, 47.0, 33.0, 46.0, 42.0, 42.0, 28.0, 20.0, 27.0, 23.0, 19.0, 12.0, 7.0, 10.0, 7.0, 4.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.873046875, -2.788818359375, -2.70458984375, -2.620361328125, -2.5361328125, -2.451904296875, -2.36767578125, -2.283447265625, -2.19921875, -2.114990234375, -2.03076171875, -1.946533203125, -1.8623046875, -1.778076171875, -1.69384765625, -1.609619140625, -1.525390625, -1.441162109375, -1.35693359375, -1.272705078125, -1.1884765625, -1.104248046875, -1.02001953125, -0.935791015625, -0.8515625, -0.767333984375, -0.68310546875, -0.598876953125, -0.5146484375, -0.430419921875, -0.34619140625, -0.261962890625, -0.177734375, -0.093505859375, -0.00927734375, 0.074951171875, 0.1591796875, 0.243408203125, 0.32763671875, 0.411865234375, 0.49609375, 0.580322265625, 0.66455078125, 0.748779296875, 0.8330078125, 0.917236328125, 1.00146484375, 1.085693359375, 1.169921875, 1.254150390625, 1.33837890625, 1.422607421875, 1.5068359375, 1.591064453125, 1.67529296875, 1.759521484375, 1.84375, 1.927978515625, 2.01220703125, 2.096435546875, 2.1806640625, 2.264892578125, 2.34912109375, 2.433349609375, 2.517578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 8.0, 15.0, 16.0, 28.0, 42.0, 69.0, 89.0, 103.0, 190.0, 347.0, 623.0, 1221.0, 2809.0, 7336.0, 23432.0, 103993.0, 513816.0, 313979.0, 56547.0, 14657.0, 4962.0, 2037.0, 1006.0, 477.0, 242.0, 168.0, 115.0, 77.0, 55.0, 36.0, 19.0, 12.0, 9.0, 4.0, 4.0, 4.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.34039306640625, -5.1612548828125, -4.98211669921875, -4.802978515625, -4.62384033203125, -4.4447021484375, -4.26556396484375, -4.08642578125, -3.90728759765625, -3.7281494140625, -3.54901123046875, -3.369873046875, -3.19073486328125, -3.0115966796875, -2.83245849609375, -2.6533203125, -2.47418212890625, -2.2950439453125, -2.11590576171875, -1.936767578125, -1.75762939453125, -1.5784912109375, -1.39935302734375, -1.22021484375, -1.04107666015625, -0.8619384765625, -0.68280029296875, -0.503662109375, -0.32452392578125, -0.1453857421875, 0.03375244140625, 0.212890625, 0.39202880859375, 0.5711669921875, 0.75030517578125, 0.929443359375, 1.10858154296875, 1.2877197265625, 1.46685791015625, 1.64599609375, 1.82513427734375, 2.0042724609375, 2.18341064453125, 2.362548828125, 2.54168701171875, 2.7208251953125, 2.89996337890625, 3.0791015625, 3.25823974609375, 3.4373779296875, 3.61651611328125, 3.795654296875, 3.97479248046875, 4.1539306640625, 4.33306884765625, 4.51220703125, 4.69134521484375, 4.8704833984375, 5.04962158203125, 5.228759765625, 5.40789794921875, 5.5870361328125, 5.76617431640625, 5.9453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 5.0, 5.0, 6.0, 8.0, 11.0, 19.0, 18.0, 31.0, 56.0, 73.0, 137.0, 166.0, 189.0, 108.0, 66.0, 26.0, 18.0, 14.0, 9.0, 9.0, 2.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042629241943359375, -0.0004104003310203552, -0.0003945082426071167, -0.0003786161541938782, -0.00036272406578063965, -0.0003468319773674011, -0.0003309398889541626, -0.00031504780054092407, -0.00029915571212768555, -0.000283263623714447, -0.0002673715353012085, -0.00025147944688796997, -0.00023558735847473145, -0.00021969527006149292, -0.0002038031816482544, -0.00018791109323501587, -0.00017201900482177734, -0.00015612691640853882, -0.0001402348279953003, -0.00012434273958206177, -0.00010845065116882324, -9.255856275558472e-05, -7.666647434234619e-05, -6.0774385929107666e-05, -4.488229751586914e-05, -2.8990209102630615e-05, -1.309812068939209e-05, 2.7939677238464355e-06, 1.868605613708496e-05, 3.4578144550323486e-05, 5.047023296356201e-05, 6.636232137680054e-05, 8.225440979003906e-05, 9.814649820327759e-05, 0.00011403858661651611, 0.00012993067502975464, 0.00014582276344299316, 0.0001617148518562317, 0.00017760694026947021, 0.00019349902868270874, 0.00020939111709594727, 0.0002252832055091858, 0.00024117529392242432, 0.00025706738233566284, 0.00027295947074890137, 0.0002888515591621399, 0.0003047436475753784, 0.00032063573598861694, 0.00033652782440185547, 0.000352419912815094, 0.0003683120012283325, 0.00038420408964157104, 0.00040009617805480957, 0.0004159882664680481, 0.0004318803548812866, 0.00044777244329452515, 0.00046366453170776367, 0.0004795566201210022, 0.0004954487085342407, 0.0005113407969474792, 0.0005272328853607178, 0.0005431249737739563, 0.0005590170621871948, 0.0005749091506004333, 0.0005908012390136719]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 9.0, 2.0, 6.0, 17.0, 15.0, 25.0, 35.0, 51.0, 79.0, 74.0, 148.0, 220.0, 352.0, 547.0, 898.0, 1499.0, 2635.0, 5111.0, 10967.0, 25807.0, 73587.0, 235886.0, 411531.0, 181341.0, 57428.0, 21296.0, 8890.0, 4358.0, 2226.0, 1280.0, 806.0, 493.0, 274.0, 194.0, 143.0, 82.0, 45.0, 54.0, 43.0, 24.0, 14.0, 18.0, 12.0, 7.0, 6.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.0703125, -3.951934814453125, -3.83355712890625, -3.715179443359375, -3.5968017578125, -3.478424072265625, -3.36004638671875, -3.241668701171875, -3.123291015625, -3.004913330078125, -2.88653564453125, -2.768157958984375, -2.6497802734375, -2.531402587890625, -2.41302490234375, -2.294647216796875, -2.17626953125, -2.057891845703125, -1.93951416015625, -1.821136474609375, -1.7027587890625, -1.584381103515625, -1.46600341796875, -1.347625732421875, -1.229248046875, -1.110870361328125, -0.99249267578125, -0.874114990234375, -0.7557373046875, -0.637359619140625, -0.51898193359375, -0.400604248046875, -0.2822265625, -0.163848876953125, -0.04547119140625, 0.072906494140625, 0.1912841796875, 0.309661865234375, 0.42803955078125, 0.546417236328125, 0.664794921875, 0.783172607421875, 0.90155029296875, 1.019927978515625, 1.1383056640625, 1.256683349609375, 1.37506103515625, 1.493438720703125, 1.61181640625, 1.730194091796875, 1.84857177734375, 1.966949462890625, 2.0853271484375, 2.203704833984375, 2.32208251953125, 2.440460205078125, 2.558837890625, 2.677215576171875, 2.79559326171875, 2.913970947265625, 3.0323486328125, 3.150726318359375, 3.26910400390625, 3.387481689453125, 3.505859375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 6.0, 5.0, 2.0, 9.0, 9.0, 15.0, 18.0, 20.0, 24.0, 22.0, 39.0, 46.0, 45.0, 48.0, 64.0, 66.0, 86.0, 70.0, 62.0, 69.0, 43.0, 41.0, 30.0, 27.0, 32.0, 19.0, 17.0, 17.0, 7.0, 10.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.412322998046875, -2.34027099609375, -2.268218994140625, -2.1961669921875, -2.124114990234375, -2.05206298828125, -1.980010986328125, -1.907958984375, -1.835906982421875, -1.76385498046875, -1.691802978515625, -1.6197509765625, -1.547698974609375, -1.47564697265625, -1.403594970703125, -1.33154296875, -1.259490966796875, -1.18743896484375, -1.115386962890625, -1.0433349609375, -0.971282958984375, -0.89923095703125, -0.827178955078125, -0.755126953125, -0.683074951171875, -0.61102294921875, -0.538970947265625, -0.4669189453125, -0.394866943359375, -0.32281494140625, -0.250762939453125, -0.1787109375, -0.106658935546875, -0.03460693359375, 0.037445068359375, 0.1094970703125, 0.181549072265625, 0.25360107421875, 0.325653076171875, 0.397705078125, 0.469757080078125, 0.54180908203125, 0.613861083984375, 0.6859130859375, 0.757965087890625, 0.83001708984375, 0.902069091796875, 0.97412109375, 1.046173095703125, 1.11822509765625, 1.190277099609375, 1.2623291015625, 1.334381103515625, 1.40643310546875, 1.478485107421875, 1.550537109375, 1.622589111328125, 1.69464111328125, 1.766693115234375, 1.8387451171875, 1.910797119140625, 1.98284912109375, 2.054901123046875, 2.126953125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 8.0, 11.0, 20.0, 56.0, 131.0, 249.0, 299.0, 128.0, 61.0, 21.0, 9.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.60840606689453, -43.08407211303711, -41.55973815917969, -40.03540802001953, -38.51107406616211, -36.98674011230469, -35.462406158447266, -33.938072204589844, -32.41373825073242, -30.889404296875, -29.36507225036621, -27.84073829650879, -26.316404342651367, -24.792072296142578, -23.267738342285156, -21.743404388427734, -20.219072341918945, -18.694738388061523, -17.170406341552734, -15.646072387695312, -14.12173843383789, -12.597405433654785, -11.07307243347168, -9.548738479614258, -8.024405479431152, -6.500072002410889, -4.975738525390625, -3.4514055252075195, -1.9270720481872559, -0.4027385711669922, 1.1215944290161133, 2.645928382873535, 4.170261383056641, 5.694594860076904, 7.218928337097168, 8.743261337280273, 10.267595291137695, 11.7919282913208, 13.316261291503906, 14.840595245361328, 16.36492919921875, 17.889263153076172, 19.41359519958496, 20.937929153442383, 22.462263107299805, 23.986595153808594, 25.510929107666016, 27.035263061523438, 28.559595108032227, 30.08392906188965, 31.608261108398438, 33.13259506225586, 34.65692901611328, 36.1812629699707, 37.705596923828125, 39.22992706298828, 40.7542610168457, 42.278594970703125, 43.80292892456055, 45.32726287841797, 46.851593017578125, 48.37592697143555, 49.90026092529297, 51.42459487915039, 52.94892883300781]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 6.0, 10.0, 9.0, 10.0, 17.0, 29.0, 53.0, 78.0, 114.0, 122.0, 134.0, 125.0, 88.0, 73.0, 62.0, 22.0, 22.0, 6.0, 5.0, 8.0, 4.0, 7.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.738487243652344, -32.44294738769531, -31.147403717041016, -29.851863861083984, -28.55632209777832, -27.260780334472656, -25.965238571166992, -24.669696807861328, -23.374156951904297, -22.078615188598633, -20.78307342529297, -19.487533569335938, -18.191991806030273, -16.89645004272461, -15.600908279418945, -14.305367469787598, -13.009824752807617, -11.714282989501953, -10.418742179870605, -9.123200416564941, -7.8276591300964355, -6.53211784362793, -5.236576080322266, -3.941035270690918, -2.645493507385254, -1.3499521017074585, -0.054410696029663086, 1.2411308288574219, 2.5366721153259277, 3.8322134017944336, 5.127755165100098, 6.423295974731445, 7.718837738037109, 9.014379501342773, 10.309920310974121, 11.605462074279785, 12.901002883911133, 14.196544647216797, 15.492086410522461, 16.787628173828125, 18.083168029785156, 19.37870979309082, 20.674251556396484, 21.969791412353516, 23.26533317565918, 24.560874938964844, 25.856416702270508, 27.151958465576172, 28.447500228881836, 29.7430419921875, 31.038583755493164, 32.33412551879883, 33.62966537475586, 34.925209045410156, 36.22074890136719, 37.51628875732422, 38.811832427978516, 40.10737228393555, 41.402915954589844, 42.698455810546875, 43.99399948120117, 45.2895393371582, 46.5850830078125, 47.88062286376953, 49.17616271972656]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 15.0, 12.0, 16.0, 20.0, 27.0, 61.0, 67.0, 114.0, 143.0, 232.0, 366.0, 628.0, 1024.0, 2014.0, 3943.0, 9220.0, 32594.0, 490034.0, 3584747.0, 46749.0, 12025.0, 4767.0, 2313.0, 1158.0, 677.0, 469.0, 292.0, 167.0, 110.0, 67.0, 52.0, 31.0, 23.0, 22.0, 12.0, 10.0, 7.0, 6.0, 5.0, 9.0, 7.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1015625, -11.685791015625, -11.27001953125, -10.854248046875, -10.4384765625, -10.022705078125, -9.60693359375, -9.191162109375, -8.775390625, -8.359619140625, -7.94384765625, -7.528076171875, -7.1123046875, -6.696533203125, -6.28076171875, -5.864990234375, -5.44921875, -5.033447265625, -4.61767578125, -4.201904296875, -3.7861328125, -3.370361328125, -2.95458984375, -2.538818359375, -2.123046875, -1.707275390625, -1.29150390625, -0.875732421875, -0.4599609375, -0.044189453125, 0.37158203125, 0.787353515625, 1.203125, 1.618896484375, 2.03466796875, 2.450439453125, 2.8662109375, 3.281982421875, 3.69775390625, 4.113525390625, 4.529296875, 4.945068359375, 5.36083984375, 5.776611328125, 6.1923828125, 6.608154296875, 7.02392578125, 7.439697265625, 7.85546875, 8.271240234375, 8.68701171875, 9.102783203125, 9.5185546875, 9.934326171875, 10.35009765625, 10.765869140625, 11.181640625, 11.597412109375, 12.01318359375, 12.428955078125, 12.8447265625, 13.260498046875, 13.67626953125, 14.092041015625, 14.5078125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 6.0, 5.0, 10.0, 10.0, 8.0, 9.0, 18.0, 48.0, 130.0, 210.0, 260.0, 152.0, 54.0, 29.0, 17.0, 9.0, 9.0, 3.0, 5.0, 4.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92431640625, -0.8889999389648438, -0.8536834716796875, -0.8183670043945312, -0.783050537109375, -0.7477340698242188, -0.7124176025390625, -0.6771011352539062, -0.64178466796875, -0.6064682006835938, -0.5711517333984375, -0.5358352661132812, -0.500518798828125, -0.46520233154296875, -0.4298858642578125, -0.39456939697265625, -0.3592529296875, -0.32393646240234375, -0.2886199951171875, -0.25330352783203125, -0.217987060546875, -0.18267059326171875, -0.1473541259765625, -0.11203765869140625, -0.07672119140625, -0.04140472412109375, -0.0060882568359375, 0.02922821044921875, 0.064544677734375, 0.09986114501953125, 0.1351776123046875, 0.17049407958984375, 0.205810546875, 0.24112701416015625, 0.2764434814453125, 0.31175994873046875, 0.347076416015625, 0.38239288330078125, 0.4177093505859375, 0.45302581787109375, 0.48834228515625, 0.5236587524414062, 0.5589752197265625, 0.5942916870117188, 0.629608154296875, 0.6649246215820312, 0.7002410888671875, 0.7355575561523438, 0.7708740234375, 0.8061904907226562, 0.8415069580078125, 0.8768234252929688, 0.912139892578125, 0.9474563598632812, 0.9827728271484375, 1.0180892944335938, 1.05340576171875, 1.0887222290039062, 1.1240386962890625, 1.1593551635742188, 1.194671630859375, 1.2299880981445312, 1.2653045654296875, 1.3006210327148438, 1.3359375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 5.0, 10.0, 10.0, 11.0, 17.0, 25.0, 36.0, 66.0, 111.0, 236.0, 487.0, 1274.0, 3764.0, 13205.0, 70629.0, 2951443.0, 1080729.0, 55772.0, 11258.0, 3185.0, 1106.0, 440.0, 180.0, 96.0, 62.0, 24.0, 30.0, 22.0, 12.0, 10.0, 8.0, 8.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.5546875, -11.14111328125, -10.7275390625, -10.31396484375, -9.900390625, -9.48681640625, -9.0732421875, -8.65966796875, -8.24609375, -7.83251953125, -7.4189453125, -7.00537109375, -6.591796875, -6.17822265625, -5.7646484375, -5.35107421875, -4.9375, -4.52392578125, -4.1103515625, -3.69677734375, -3.283203125, -2.86962890625, -2.4560546875, -2.04248046875, -1.62890625, -1.21533203125, -0.8017578125, -0.38818359375, 0.025390625, 0.43896484375, 0.8525390625, 1.26611328125, 1.6796875, 2.09326171875, 2.5068359375, 2.92041015625, 3.333984375, 3.74755859375, 4.1611328125, 4.57470703125, 4.98828125, 5.40185546875, 5.8154296875, 6.22900390625, 6.642578125, 7.05615234375, 7.4697265625, 7.88330078125, 8.296875, 8.71044921875, 9.1240234375, 9.53759765625, 9.951171875, 10.36474609375, 10.7783203125, 11.19189453125, 11.60546875, 12.01904296875, 12.4326171875, 12.84619140625, 13.259765625, 13.67333984375, 14.0869140625, 14.50048828125, 14.9140625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 4.0, 5.0, 7.0, 10.0, 16.0, 12.0, 17.0, 30.0, 45.0, 71.0, 84.0, 142.0, 217.0, 497.0, 1566.0, 558.0, 277.0, 143.0, 104.0, 52.0, 61.0, 29.0, 23.0, 22.0, 13.0, 14.0, 9.0, 6.0, 6.0, 1.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1962890625, -1.1583404541015625, -1.120391845703125, -1.0824432373046875, -1.04449462890625, -1.0065460205078125, -0.968597412109375, -0.9306488037109375, -0.8927001953125, -0.8547515869140625, -0.816802978515625, -0.7788543701171875, -0.74090576171875, -0.7029571533203125, -0.665008544921875, -0.6270599365234375, -0.589111328125, -0.5511627197265625, -0.513214111328125, -0.4752655029296875, -0.43731689453125, -0.3993682861328125, -0.361419677734375, -0.3234710693359375, -0.2855224609375, -0.2475738525390625, -0.209625244140625, -0.1716766357421875, -0.13372802734375, -0.0957794189453125, -0.057830810546875, -0.0198822021484375, 0.01806640625, 0.0560150146484375, 0.093963623046875, 0.1319122314453125, 0.16986083984375, 0.2078094482421875, 0.245758056640625, 0.2837066650390625, 0.3216552734375, 0.3596038818359375, 0.397552490234375, 0.4355010986328125, 0.47344970703125, 0.5113983154296875, 0.549346923828125, 0.5872955322265625, 0.625244140625, 0.6631927490234375, 0.701141357421875, 0.7390899658203125, 0.77703857421875, 0.8149871826171875, 0.852935791015625, 0.8908843994140625, 0.9288330078125, 0.9667816162109375, 1.004730224609375, 1.0426788330078125, 1.08062744140625, 1.1185760498046875, 1.156524658203125, 1.1944732666015625, 1.232421875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 12.0, 26.0, 47.0, 78.0, 118.0, 188.0, 163.0, 139.0, 110.0, 48.0, 35.0, 14.0, 6.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.307052612304688, -8.938004493713379, -8.56895637512207, -8.199907302856445, -7.830859184265137, -7.461811065673828, -7.092762470245361, -6.7237138748168945, -6.354665756225586, -5.985617637634277, -5.6165690422058105, -5.247520446777344, -4.878472328186035, -4.509424209594727, -4.14037561416626, -3.771327257156372, -3.4022789001464844, -3.0332305431365967, -2.664182186126709, -2.2951338291168213, -1.9260854721069336, -1.557037115097046, -1.1879887580871582, -0.8189404010772705, -0.4498920440673828, -0.08084368705749512, 0.2882046699523926, 0.6572530269622803, 1.026301383972168, 1.3953497409820557, 1.7643980979919434, 2.133446455001831, 2.5024948120117188, 2.8715431690216064, 3.240591526031494, 3.609639883041382, 3.9786882400512695, 4.347736358642578, 4.716784954071045, 5.085833549499512, 5.45488166809082, 5.823929786682129, 6.192978382110596, 6.5620269775390625, 6.931075096130371, 7.30012321472168, 7.6691718101501465, 8.038220405578613, 8.407268524169922, 8.77631664276123, 9.145364761352539, 9.514413833618164, 9.883461952209473, 10.252510070800781, 10.621559143066406, 10.990607261657715, 11.359655380249023, 11.728703498840332, 12.09775161743164, 12.466800689697266, 12.835848808288574, 13.204896926879883, 13.573945999145508, 13.942994117736816, 14.312042236328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 7.0, 12.0, 11.0, 13.0, 15.0, 18.0, 23.0, 23.0, 17.0, 39.0, 36.0, 47.0, 42.0, 47.0, 38.0, 49.0, 51.0, 56.0, 49.0, 56.0, 37.0, 27.0, 45.0, 34.0, 29.0, 25.0, 26.0, 23.0, 19.0, 19.0, 12.0, 11.0, 6.0, 5.0, 8.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.416264057159424, -4.275505542755127, -4.134746551513672, -3.993988037109375, -3.853229522705078, -3.712470769882202, -3.571712017059326, -3.4309535026550293, -3.2901949882507324, -3.1494362354278564, -3.0086777210235596, -2.8679189682006836, -2.7271604537963867, -2.5864017009735107, -2.4456429481506348, -2.304884433746338, -2.164125680923462, -2.023366928100586, -1.882608413696289, -1.741849660873413, -1.6010911464691162, -1.4603323936462402, -1.3195737600326538, -1.1788151264190674, -1.038056492805481, -0.8972978591918945, -0.7565392255783081, -0.6157805323600769, -0.4750218987464905, -0.33426326513290405, -0.19350457191467285, -0.052745938301086426, 0.0880126953125, 0.22877134382724762, 0.36952999234199524, 0.510288655757904, 0.6510472893714905, 0.7918059229850769, 0.9325646162033081, 1.0733232498168945, 1.214081883430481, 1.3548405170440674, 1.4955991506576538, 1.6363577842712402, 1.7771165370941162, 1.917875051498413, 2.058633804321289, 2.199392318725586, 2.340151071548462, 2.480909824371338, 2.6216683387756348, 2.7624270915985107, 2.9031856060028076, 3.0439443588256836, 3.1847028732299805, 3.3254616260528564, 3.4662203788757324, 3.6069791316986084, 3.7477376461029053, 3.8884963989257812, 4.029254913330078, 4.170013427734375, 4.31077241897583, 4.451530933380127, 4.592289447784424]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 6.0, 6.0, 8.0, 8.0, 9.0, 20.0, 22.0, 23.0, 45.0, 41.0, 58.0, 91.0, 121.0, 168.0, 244.0, 374.0, 579.0, 1012.0, 1695.0, 3269.0, 6529.0, 15671.0, 52631.0, 290332.0, 532043.0, 99591.0, 24815.0, 9161.0, 4269.0, 2239.0, 1231.0, 775.0, 448.0, 292.0, 203.0, 144.0, 88.0, 86.0, 58.0, 46.0, 27.0, 25.0, 13.0, 10.0, 13.0, 5.0, 5.0, 5.0, 2.0, 5.0, 0.0, 0.0, 3.0, 2.0], "bins": [-7.8046875, -7.5765380859375, -7.348388671875, -7.1202392578125, -6.89208984375, -6.6639404296875, -6.435791015625, -6.2076416015625, -5.9794921875, -5.7513427734375, -5.523193359375, -5.2950439453125, -5.06689453125, -4.8387451171875, -4.610595703125, -4.3824462890625, -4.154296875, -3.9261474609375, -3.697998046875, -3.4698486328125, -3.24169921875, -3.0135498046875, -2.785400390625, -2.5572509765625, -2.3291015625, -2.1009521484375, -1.872802734375, -1.6446533203125, -1.41650390625, -1.1883544921875, -0.960205078125, -0.7320556640625, -0.50390625, -0.2757568359375, -0.047607421875, 0.1805419921875, 0.40869140625, 0.6368408203125, 0.864990234375, 1.0931396484375, 1.3212890625, 1.5494384765625, 1.777587890625, 2.0057373046875, 2.23388671875, 2.4620361328125, 2.690185546875, 2.9183349609375, 3.146484375, 3.3746337890625, 3.602783203125, 3.8309326171875, 4.05908203125, 4.2872314453125, 4.515380859375, 4.7435302734375, 4.9716796875, 5.1998291015625, 5.427978515625, 5.6561279296875, 5.88427734375, 6.1124267578125, 6.340576171875, 6.5687255859375, 6.796875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 6.0, 10.0, 7.0, 21.0, 34.0, 56.0, 126.0, 201.0, 199.0, 164.0, 86.0, 40.0, 18.0, 14.0, 7.0, 6.0, 0.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.08984375, -1.053802490234375, -1.01776123046875, -0.981719970703125, -0.9456787109375, -0.909637451171875, -0.87359619140625, -0.837554931640625, -0.801513671875, -0.765472412109375, -0.72943115234375, -0.693389892578125, -0.6573486328125, -0.621307373046875, -0.58526611328125, -0.549224853515625, -0.51318359375, -0.477142333984375, -0.44110107421875, -0.405059814453125, -0.3690185546875, -0.332977294921875, -0.29693603515625, -0.260894775390625, -0.224853515625, -0.188812255859375, -0.15277099609375, -0.116729736328125, -0.0806884765625, -0.044647216796875, -0.00860595703125, 0.027435302734375, 0.0634765625, 0.099517822265625, 0.13555908203125, 0.171600341796875, 0.2076416015625, 0.243682861328125, 0.27972412109375, 0.315765380859375, 0.351806640625, 0.387847900390625, 0.42388916015625, 0.459930419921875, 0.4959716796875, 0.532012939453125, 0.56805419921875, 0.604095458984375, 0.64013671875, 0.676177978515625, 0.71221923828125, 0.748260498046875, 0.7843017578125, 0.820343017578125, 0.85638427734375, 0.892425537109375, 0.928466796875, 0.964508056640625, 1.00054931640625, 1.036590576171875, 1.0726318359375, 1.108673095703125, 1.14471435546875, 1.180755615234375, 1.216796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 10.0, 14.0, 16.0, 27.0, 43.0, 60.0, 100.0, 150.0, 220.0, 411.0, 745.0, 1633.0, 3904.0, 12753.0, 56634.0, 301009.0, 508693.0, 125437.0, 25359.0, 6658.0, 2285.0, 1034.0, 526.0, 321.0, 178.0, 119.0, 70.0, 48.0, 26.0, 24.0, 15.0, 4.0, 10.0, 6.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.171875, -7.9102783203125, -7.648681640625, -7.3870849609375, -7.12548828125, -6.8638916015625, -6.602294921875, -6.3406982421875, -6.0791015625, -5.8175048828125, -5.555908203125, -5.2943115234375, -5.03271484375, -4.7711181640625, -4.509521484375, -4.2479248046875, -3.986328125, -3.7247314453125, -3.463134765625, -3.2015380859375, -2.93994140625, -2.6783447265625, -2.416748046875, -2.1551513671875, -1.8935546875, -1.6319580078125, -1.370361328125, -1.1087646484375, -0.84716796875, -0.5855712890625, -0.323974609375, -0.0623779296875, 0.19921875, 0.4608154296875, 0.722412109375, 0.9840087890625, 1.24560546875, 1.5072021484375, 1.768798828125, 2.0303955078125, 2.2919921875, 2.5535888671875, 2.815185546875, 3.0767822265625, 3.33837890625, 3.5999755859375, 3.861572265625, 4.1231689453125, 4.384765625, 4.6463623046875, 4.907958984375, 5.1695556640625, 5.43115234375, 5.6927490234375, 5.954345703125, 6.2159423828125, 6.4775390625, 6.7391357421875, 7.000732421875, 7.2623291015625, 7.52392578125, 7.7855224609375, 8.047119140625, 8.3087158203125, 8.5703125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 3.0, 8.0, 6.0, 6.0, 12.0, 9.0, 14.0, 21.0, 18.0, 14.0, 28.0, 30.0, 17.0, 31.0, 30.0, 28.0, 35.0, 38.0, 36.0, 48.0, 45.0, 40.0, 39.0, 50.0, 47.0, 35.0, 42.0, 30.0, 24.0, 28.0, 28.0, 18.0, 23.0, 24.0, 13.0, 14.0, 2.0, 10.0, 9.0, 12.0, 8.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.37890625, -2.30712890625, -2.2353515625, -2.16357421875, -2.091796875, -2.02001953125, -1.9482421875, -1.87646484375, -1.8046875, -1.73291015625, -1.6611328125, -1.58935546875, -1.517578125, -1.44580078125, -1.3740234375, -1.30224609375, -1.23046875, -1.15869140625, -1.0869140625, -1.01513671875, -0.943359375, -0.87158203125, -0.7998046875, -0.72802734375, -0.65625, -0.58447265625, -0.5126953125, -0.44091796875, -0.369140625, -0.29736328125, -0.2255859375, -0.15380859375, -0.08203125, -0.01025390625, 0.0615234375, 0.13330078125, 0.205078125, 0.27685546875, 0.3486328125, 0.42041015625, 0.4921875, 0.56396484375, 0.6357421875, 0.70751953125, 0.779296875, 0.85107421875, 0.9228515625, 0.99462890625, 1.06640625, 1.13818359375, 1.2099609375, 1.28173828125, 1.353515625, 1.42529296875, 1.4970703125, 1.56884765625, 1.640625, 1.71240234375, 1.7841796875, 1.85595703125, 1.927734375, 1.99951171875, 2.0712890625, 2.14306640625, 2.21484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 12.0, 13.0, 26.0, 39.0, 53.0, 108.0, 192.0, 319.0, 615.0, 1413.0, 3717.0, 11920.0, 50722.0, 280306.0, 538522.0, 124415.0, 25282.0, 6578.0, 2328.0, 954.0, 450.0, 244.0, 127.0, 77.0, 42.0, 23.0, 21.0, 7.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.3458251953125, -6.121337890625, -5.8968505859375, -5.67236328125, -5.4478759765625, -5.223388671875, -4.9989013671875, -4.7744140625, -4.5499267578125, -4.325439453125, -4.1009521484375, -3.87646484375, -3.6519775390625, -3.427490234375, -3.2030029296875, -2.978515625, -2.7540283203125, -2.529541015625, -2.3050537109375, -2.08056640625, -1.8560791015625, -1.631591796875, -1.4071044921875, -1.1826171875, -0.9581298828125, -0.733642578125, -0.5091552734375, -0.28466796875, -0.0601806640625, 0.164306640625, 0.3887939453125, 0.61328125, 0.8377685546875, 1.062255859375, 1.2867431640625, 1.51123046875, 1.7357177734375, 1.960205078125, 2.1846923828125, 2.4091796875, 2.6336669921875, 2.858154296875, 3.0826416015625, 3.30712890625, 3.5316162109375, 3.756103515625, 3.9805908203125, 4.205078125, 4.4295654296875, 4.654052734375, 4.8785400390625, 5.10302734375, 5.3275146484375, 5.552001953125, 5.7764892578125, 6.0009765625, 6.2254638671875, 6.449951171875, 6.6744384765625, 6.89892578125, 7.1234130859375, 7.347900390625, 7.5723876953125, 7.796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 0.0, 3.0, 4.0, 2.0, 8.0, 7.0, 9.0, 10.0, 18.0, 12.0, 27.0, 37.0, 40.0, 61.0, 65.0, 86.0, 86.0, 87.0, 91.0, 78.0, 54.0, 52.0, 32.0, 25.0, 20.0, 10.0, 11.0, 14.0, 8.0, 5.0, 5.0, 9.0, 3.0, 4.0, 1.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0006475448608398438, -0.000627368688583374, -0.0006071925163269043, -0.0005870163440704346, -0.0005668401718139648, -0.0005466639995574951, -0.0005264878273010254, -0.0005063116550445557, -0.00048613548278808594, -0.0004659593105316162, -0.0004457831382751465, -0.00042560696601867676, -0.00040543079376220703, -0.0003852546215057373, -0.0003650784492492676, -0.00034490227699279785, -0.0003247261047363281, -0.0003045499324798584, -0.00028437376022338867, -0.00026419758796691895, -0.00024402141571044922, -0.0002238452434539795, -0.00020366907119750977, -0.00018349289894104004, -0.0001633167266845703, -0.00014314055442810059, -0.00012296438217163086, -0.00010278820991516113, -8.26120376586914e-05, -6.243586540222168e-05, -4.225969314575195e-05, -2.2083520889282227e-05, -1.9073486328125e-06, 1.8268823623657227e-05, 3.844499588012695e-05, 5.862116813659668e-05, 7.87973403930664e-05, 9.897351264953613e-05, 0.00011914968490600586, 0.00013932585716247559, 0.0001595020294189453, 0.00017967820167541504, 0.00019985437393188477, 0.0002200305461883545, 0.00024020671844482422, 0.00026038289070129395, 0.00028055906295776367, 0.0003007352352142334, 0.0003209114074707031, 0.00034108757972717285, 0.0003612637519836426, 0.0003814399242401123, 0.00040161609649658203, 0.00042179226875305176, 0.0004419684410095215, 0.0004621446132659912, 0.00048232078552246094, 0.0005024969577789307, 0.0005226731300354004, 0.0005428493022918701, 0.0005630254745483398, 0.0005832016468048096, 0.0006033778190612793, 0.000623553991317749, 0.0006437301635742188]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 5.0, 8.0, 10.0, 14.0, 14.0, 26.0, 26.0, 42.0, 61.0, 70.0, 108.0, 152.0, 259.0, 380.0, 670.0, 1288.0, 2658.0, 5971.0, 15862.0, 49352.0, 187260.0, 492181.0, 208797.0, 53689.0, 17116.0, 6419.0, 2844.0, 1366.0, 711.0, 433.0, 263.0, 154.0, 100.0, 70.0, 55.0, 35.0, 29.0, 8.0, 14.0, 17.0, 6.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.33203125, -5.14520263671875, -4.9583740234375, -4.77154541015625, -4.584716796875, -4.39788818359375, -4.2110595703125, -4.02423095703125, -3.83740234375, -3.65057373046875, -3.4637451171875, -3.27691650390625, -3.090087890625, -2.90325927734375, -2.7164306640625, -2.52960205078125, -2.3427734375, -2.15594482421875, -1.9691162109375, -1.78228759765625, -1.595458984375, -1.40863037109375, -1.2218017578125, -1.03497314453125, -0.84814453125, -0.66131591796875, -0.4744873046875, -0.28765869140625, -0.100830078125, 0.08599853515625, 0.2728271484375, 0.45965576171875, 0.646484375, 0.83331298828125, 1.0201416015625, 1.20697021484375, 1.393798828125, 1.58062744140625, 1.7674560546875, 1.95428466796875, 2.14111328125, 2.32794189453125, 2.5147705078125, 2.70159912109375, 2.888427734375, 3.07525634765625, 3.2620849609375, 3.44891357421875, 3.6357421875, 3.82257080078125, 4.0093994140625, 4.19622802734375, 4.383056640625, 4.56988525390625, 4.7567138671875, 4.94354248046875, 5.13037109375, 5.31719970703125, 5.5040283203125, 5.69085693359375, 5.877685546875, 6.06451416015625, 6.2513427734375, 6.43817138671875, 6.625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 4.0, 4.0, 6.0, 7.0, 6.0, 9.0, 4.0, 8.0, 9.0, 10.0, 28.0, 22.0, 21.0, 25.0, 34.0, 49.0, 41.0, 59.0, 75.0, 61.0, 69.0, 64.0, 72.0, 53.0, 48.0, 42.0, 31.0, 23.0, 28.0, 23.0, 13.0, 15.0, 8.0, 5.0, 4.0, 6.0, 7.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1015625, -2.02484130859375, -1.9481201171875, -1.87139892578125, -1.794677734375, -1.71795654296875, -1.6412353515625, -1.56451416015625, -1.48779296875, -1.41107177734375, -1.3343505859375, -1.25762939453125, -1.180908203125, -1.10418701171875, -1.0274658203125, -0.95074462890625, -0.8740234375, -0.79730224609375, -0.7205810546875, -0.64385986328125, -0.567138671875, -0.49041748046875, -0.4136962890625, -0.33697509765625, -0.26025390625, -0.18353271484375, -0.1068115234375, -0.03009033203125, 0.046630859375, 0.12335205078125, 0.2000732421875, 0.27679443359375, 0.353515625, 0.43023681640625, 0.5069580078125, 0.58367919921875, 0.660400390625, 0.73712158203125, 0.8138427734375, 0.89056396484375, 0.96728515625, 1.04400634765625, 1.1207275390625, 1.19744873046875, 1.274169921875, 1.35089111328125, 1.4276123046875, 1.50433349609375, 1.5810546875, 1.65777587890625, 1.7344970703125, 1.81121826171875, 1.887939453125, 1.96466064453125, 2.0413818359375, 2.11810302734375, 2.19482421875, 2.27154541015625, 2.3482666015625, 2.42498779296875, 2.501708984375, 2.57843017578125, 2.6551513671875, 2.73187255859375, 2.80859375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 30.0, 100.0, 183.0, 273.0, 220.0, 110.0, 37.0, 25.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.46561431884766, -78.89002227783203, -76.3144302368164, -73.73883819580078, -71.16325378417969, -68.58766174316406, -66.01206970214844, -63.43647766113281, -60.86088562011719, -58.28529357910156, -55.70970153808594, -53.13411331176758, -50.55852127075195, -47.98292922973633, -45.40734100341797, -42.831748962402344, -40.25615692138672, -37.680564880371094, -35.10497283935547, -32.52938461303711, -29.953792572021484, -27.37820053100586, -24.802610397338867, -22.227020263671875, -19.65142822265625, -17.075836181640625, -14.500246047973633, -11.924654960632324, -9.349063873291016, -6.773472785949707, -4.197881698608398, -1.6222915649414062, 0.9533004760742188, 3.5288915634155273, 6.104482650756836, 8.680073738098145, 11.255664825439453, 13.831255912780762, 16.40684700012207, 18.982437133789062, 21.558029174804688, 24.133621215820312, 26.709211349487305, 29.284801483154297, 31.860393524169922, 34.43598556518555, 37.011573791503906, 39.58716583251953, 42.162757873535156, 44.73834991455078, 47.313941955566406, 49.889530181884766, 52.46512222290039, 55.040714263916016, 57.616302490234375, 60.19189453125, 62.767486572265625, 65.34307861328125, 67.91867065429688, 70.4942626953125, 73.06985473632812, 75.64543914794922, 78.22103118896484, 80.79662322998047, 83.3722152709961]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 10.0, 12.0, 10.0, 19.0, 17.0, 31.0, 27.0, 38.0, 45.0, 59.0, 42.0, 55.0, 41.0, 48.0, 58.0, 60.0, 56.0, 42.0, 53.0, 48.0, 41.0, 34.0, 33.0, 19.0, 15.0, 15.0, 18.0, 10.0, 14.0, 5.0, 6.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-30.312210083007812, -29.533628463745117, -28.755046844482422, -27.97646713256836, -27.197885513305664, -26.41930389404297, -25.640722274780273, -24.862140655517578, -24.083560943603516, -23.30497932434082, -22.526397705078125, -21.747817993164062, -20.969236373901367, -20.190654754638672, -19.412073135375977, -18.63349151611328, -17.854909896850586, -17.07632827758789, -16.297746658325195, -15.519165992736816, -14.740585327148438, -13.962003707885742, -13.183422088623047, -12.404840469360352, -11.626259803771973, -10.847678184509277, -10.069097518920898, -9.290515899658203, -8.511934280395508, -7.733353614807129, -6.954771995544434, -6.1761908531188965, -5.397609710693359, -4.619028568267822, -3.840447187423706, -3.06186580657959, -2.2832846641540527, -1.5047035217285156, -0.7261219024658203, 0.0524592399597168, 0.8310403823852539, 1.6096216440200806, 2.3882029056549072, 3.1667842864990234, 3.9453654289245605, 4.723946571350098, 5.502528190612793, 6.28110933303833, 7.059690475463867, 7.838271617889404, 8.616852760314941, 9.395434379577637, 10.174015045166016, 10.952596664428711, 11.731178283691406, 12.509759902954102, 13.28834056854248, 14.066922187805176, 14.845502853393555, 15.62408447265625, 16.402666091918945, 17.18124771118164, 17.959827423095703, 18.7384090423584, 19.516990661621094]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 7.0, 4.0, 13.0, 13.0, 26.0, 85.0, 216.0, 639.0, 3365.0, 71515.0, 4092623.0, 22930.0, 2085.0, 468.0, 153.0, 65.0, 40.0, 21.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.59375, -35.49658203125, -34.3994140625, -33.30224609375, -32.205078125, -31.10791015625, -30.0107421875, -28.91357421875, -27.81640625, -26.71923828125, -25.6220703125, -24.52490234375, -23.427734375, -22.33056640625, -21.2333984375, -20.13623046875, -19.0390625, -17.94189453125, -16.8447265625, -15.74755859375, -14.650390625, -13.55322265625, -12.4560546875, -11.35888671875, -10.26171875, -9.16455078125, -8.0673828125, -6.97021484375, -5.873046875, -4.77587890625, -3.6787109375, -2.58154296875, -1.484375, -0.38720703125, 0.7099609375, 1.80712890625, 2.904296875, 4.00146484375, 5.0986328125, 6.19580078125, 7.29296875, 8.39013671875, 9.4873046875, 10.58447265625, 11.681640625, 12.77880859375, 13.8759765625, 14.97314453125, 16.0703125, 17.16748046875, 18.2646484375, 19.36181640625, 20.458984375, 21.55615234375, 22.6533203125, 23.75048828125, 24.84765625, 25.94482421875, 27.0419921875, 28.13916015625, 29.236328125, 30.33349609375, 31.4306640625, 32.52783203125, 33.625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 2.0, 5.0, 21.0, 36.0, 57.0, 106.0, 160.0, 180.0, 140.0, 129.0, 70.0, 32.0, 21.0, 11.0, 10.0, 7.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3525390625, -1.3110809326171875, -1.269622802734375, -1.2281646728515625, -1.18670654296875, -1.1452484130859375, -1.103790283203125, -1.0623321533203125, -1.0208740234375, -0.9794158935546875, -0.937957763671875, -0.8964996337890625, -0.85504150390625, -0.8135833740234375, -0.772125244140625, -0.7306671142578125, -0.689208984375, -0.6477508544921875, -0.606292724609375, -0.5648345947265625, -0.52337646484375, -0.4819183349609375, -0.440460205078125, -0.3990020751953125, -0.3575439453125, -0.3160858154296875, -0.274627685546875, -0.2331695556640625, -0.19171142578125, -0.1502532958984375, -0.108795166015625, -0.0673370361328125, -0.02587890625, 0.0155792236328125, 0.057037353515625, 0.0984954833984375, 0.13995361328125, 0.1814117431640625, 0.222869873046875, 0.2643280029296875, 0.3057861328125, 0.3472442626953125, 0.388702392578125, 0.4301605224609375, 0.47161865234375, 0.5130767822265625, 0.554534912109375, 0.5959930419921875, 0.637451171875, 0.6789093017578125, 0.720367431640625, 0.7618255615234375, 0.80328369140625, 0.8447418212890625, 0.886199951171875, 0.9276580810546875, 0.9691162109375, 1.0105743408203125, 1.052032470703125, 1.0934906005859375, 1.13494873046875, 1.1764068603515625, 1.217864990234375, 1.2593231201171875, 1.30078125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 8.0, 11.0, 20.0, 30.0, 50.0, 58.0, 99.0, 197.0, 313.0, 614.0, 1298.0, 2718.0, 6477.0, 17603.0, 56734.0, 257600.0, 2901893.0, 781662.0, 116542.0, 31078.0, 10933.0, 4333.0, 1938.0, 900.0, 483.0, 279.0, 151.0, 100.0, 40.0, 31.0, 27.0, 17.0, 10.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.25390625, -7.01019287109375, -6.7664794921875, -6.52276611328125, -6.279052734375, -6.03533935546875, -5.7916259765625, -5.54791259765625, -5.30419921875, -5.06048583984375, -4.8167724609375, -4.57305908203125, -4.329345703125, -4.08563232421875, -3.8419189453125, -3.59820556640625, -3.3544921875, -3.11077880859375, -2.8670654296875, -2.62335205078125, -2.379638671875, -2.13592529296875, -1.8922119140625, -1.64849853515625, -1.40478515625, -1.16107177734375, -0.9173583984375, -0.67364501953125, -0.429931640625, -0.18621826171875, 0.0574951171875, 0.30120849609375, 0.544921875, 0.78863525390625, 1.0323486328125, 1.27606201171875, 1.519775390625, 1.76348876953125, 2.0072021484375, 2.25091552734375, 2.49462890625, 2.73834228515625, 2.9820556640625, 3.22576904296875, 3.469482421875, 3.71319580078125, 3.9569091796875, 4.20062255859375, 4.4443359375, 4.68804931640625, 4.9317626953125, 5.17547607421875, 5.419189453125, 5.66290283203125, 5.9066162109375, 6.15032958984375, 6.39404296875, 6.63775634765625, 6.8814697265625, 7.12518310546875, 7.368896484375, 7.61260986328125, 7.8563232421875, 8.10003662109375, 8.34375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 6.0, 3.0, 6.0, 3.0, 11.0, 9.0, 19.0, 18.0, 44.0, 56.0, 74.0, 114.0, 160.0, 285.0, 437.0, 1167.0, 737.0, 323.0, 201.0, 108.0, 85.0, 61.0, 36.0, 27.0, 24.0, 18.0, 8.0, 13.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2548828125, -1.20623779296875, -1.1575927734375, -1.10894775390625, -1.060302734375, -1.01165771484375, -0.9630126953125, -0.91436767578125, -0.86572265625, -0.81707763671875, -0.7684326171875, -0.71978759765625, -0.671142578125, -0.62249755859375, -0.5738525390625, -0.52520751953125, -0.4765625, -0.42791748046875, -0.3792724609375, -0.33062744140625, -0.281982421875, -0.23333740234375, -0.1846923828125, -0.13604736328125, -0.08740234375, -0.03875732421875, 0.0098876953125, 0.05853271484375, 0.107177734375, 0.15582275390625, 0.2044677734375, 0.25311279296875, 0.3017578125, 0.35040283203125, 0.3990478515625, 0.44769287109375, 0.496337890625, 0.54498291015625, 0.5936279296875, 0.64227294921875, 0.69091796875, 0.73956298828125, 0.7882080078125, 0.83685302734375, 0.885498046875, 0.93414306640625, 0.9827880859375, 1.03143310546875, 1.080078125, 1.12872314453125, 1.1773681640625, 1.22601318359375, 1.274658203125, 1.32330322265625, 1.3719482421875, 1.42059326171875, 1.46923828125, 1.51788330078125, 1.5665283203125, 1.61517333984375, 1.663818359375, 1.71246337890625, 1.7611083984375, 1.80975341796875, 1.8583984375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 6.0, 9.0, 11.0, 23.0, 33.0, 54.0, 80.0, 124.0, 114.0, 159.0, 121.0, 99.0, 52.0, 47.0, 32.0, 17.0, 9.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.756229400634766, -16.33051109313965, -15.904792785644531, -15.479074478149414, -15.05335521697998, -14.627636909484863, -14.201918601989746, -13.776200294494629, -13.350481033325195, -12.924762725830078, -12.499044418334961, -12.073326110839844, -11.64760684967041, -11.221888542175293, -10.796170234680176, -10.370451927185059, -9.944733619689941, -9.519015312194824, -9.093297004699707, -8.667577743530273, -8.241859436035156, -7.816141128540039, -7.390422821044922, -6.964704513549805, -6.538985729217529, -6.113267421722412, -5.687548637390137, -5.2618303298950195, -4.836112022399902, -4.410393238067627, -3.9846749305725098, -3.5589563846588135, -3.1332387924194336, -2.7075202465057373, -2.281801700592041, -1.8560833930969238, -1.4303648471832275, -1.0046463012695312, -0.5789279937744141, -0.15320944786071777, 0.2725090980529785, 0.69822758436203, 1.1239460706710815, 1.5496644973754883, 1.9753830432891846, 2.401101589202881, 2.826819896697998, 3.2525384426116943, 3.6782569885253906, 4.103975296020508, 4.529694080352783, 4.9554123878479, 5.381131172180176, 5.806849479675293, 6.23256778717041, 6.658286094665527, 7.084004878997803, 7.50972318649292, 7.935441970825195, 8.361160278320312, 8.78687858581543, 9.212596893310547, 9.638315200805664, 10.064034461975098, 10.489752769470215]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 9.0, 10.0, 14.0, 12.0, 19.0, 28.0, 19.0, 28.0, 38.0, 32.0, 43.0, 40.0, 40.0, 57.0, 40.0, 53.0, 48.0, 52.0, 47.0, 45.0, 49.0, 48.0, 33.0, 28.0, 33.0, 26.0, 24.0, 15.0, 15.0, 14.0, 9.0, 8.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83173942565918, -5.624623775482178, -5.417508125305176, -5.210392951965332, -5.00327730178833, -4.796161651611328, -4.589046478271484, -4.381930828094482, -4.1748151779174805, -3.9676995277404785, -3.7605841159820557, -3.553468704223633, -3.346353054046631, -3.139237403869629, -2.932121992111206, -2.725006580352783, -2.5178909301757812, -2.3107752799987793, -2.1036598682403564, -1.896544337272644, -1.6894288063049316, -1.4823132753372192, -1.2751977443695068, -1.0680822134017944, -0.860966682434082, -0.6538511514663696, -0.4467356204986572, -0.23962008953094482, -0.03250455856323242, 0.17461097240447998, 0.3817265033721924, 0.5888420343399048, 0.795957088470459, 1.0030726194381714, 1.2101881504058838, 1.4173036813735962, 1.6244192123413086, 1.831534743309021, 2.0386502742767334, 2.2457656860351562, 2.452881336212158, 2.65999698638916, 2.867112398147583, 3.074227809906006, 3.281343460083008, 3.4884591102600098, 3.6955745220184326, 3.9026899337768555, 4.109805583953857, 4.316921234130859, 4.524036407470703, 4.731152057647705, 4.938267707824707, 5.145383358001709, 5.352499008178711, 5.559614181518555, 5.766729831695557, 5.973845481872559, 6.180960655212402, 6.388076305389404, 6.595191955566406, 6.802307605743408, 7.00942325592041, 7.216538429260254, 7.423654079437256]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 17.0, 26.0, 37.0, 47.0, 84.0, 129.0, 162.0, 244.0, 387.0, 681.0, 1174.0, 2134.0, 4991.0, 14174.0, 51863.0, 218358.0, 504321.0, 183776.0, 44068.0, 12538.0, 4563.0, 1937.0, 1030.0, 656.0, 367.0, 237.0, 192.0, 106.0, 81.0, 51.0, 37.0, 29.0, 16.0, 12.0, 8.0, 7.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9453125, -6.7171630859375, -6.489013671875, -6.2608642578125, -6.03271484375, -5.8045654296875, -5.576416015625, -5.3482666015625, -5.1201171875, -4.8919677734375, -4.663818359375, -4.4356689453125, -4.20751953125, -3.9793701171875, -3.751220703125, -3.5230712890625, -3.294921875, -3.0667724609375, -2.838623046875, -2.6104736328125, -2.38232421875, -2.1541748046875, -1.926025390625, -1.6978759765625, -1.4697265625, -1.2415771484375, -1.013427734375, -0.7852783203125, -0.55712890625, -0.3289794921875, -0.100830078125, 0.1273193359375, 0.35546875, 0.5836181640625, 0.811767578125, 1.0399169921875, 1.26806640625, 1.4962158203125, 1.724365234375, 1.9525146484375, 2.1806640625, 2.4088134765625, 2.636962890625, 2.8651123046875, 3.09326171875, 3.3214111328125, 3.549560546875, 3.7777099609375, 4.005859375, 4.2340087890625, 4.462158203125, 4.6903076171875, 4.91845703125, 5.1466064453125, 5.374755859375, 5.6029052734375, 5.8310546875, 6.0592041015625, 6.287353515625, 6.5155029296875, 6.74365234375, 6.9718017578125, 7.199951171875, 7.4281005859375, 7.65625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 0.0, 4.0, 9.0, 7.0, 16.0, 19.0, 46.0, 78.0, 105.0, 129.0, 139.0, 138.0, 124.0, 63.0, 54.0, 30.0, 16.0, 11.0, 3.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.201171875, -1.16064453125, -1.1201171875, -1.07958984375, -1.0390625, -0.99853515625, -0.9580078125, -0.91748046875, -0.876953125, -0.83642578125, -0.7958984375, -0.75537109375, -0.71484375, -0.67431640625, -0.6337890625, -0.59326171875, -0.552734375, -0.51220703125, -0.4716796875, -0.43115234375, -0.390625, -0.35009765625, -0.3095703125, -0.26904296875, -0.228515625, -0.18798828125, -0.1474609375, -0.10693359375, -0.06640625, -0.02587890625, 0.0146484375, 0.05517578125, 0.095703125, 0.13623046875, 0.1767578125, 0.21728515625, 0.2578125, 0.29833984375, 0.3388671875, 0.37939453125, 0.419921875, 0.46044921875, 0.5009765625, 0.54150390625, 0.58203125, 0.62255859375, 0.6630859375, 0.70361328125, 0.744140625, 0.78466796875, 0.8251953125, 0.86572265625, 0.90625, 0.94677734375, 0.9873046875, 1.02783203125, 1.068359375, 1.10888671875, 1.1494140625, 1.18994140625, 1.23046875, 1.27099609375, 1.3115234375, 1.35205078125, 1.392578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 5.0, 5.0, 6.0, 14.0, 17.0, 12.0, 22.0, 16.0, 49.0, 56.0, 81.0, 112.0, 165.0, 280.0, 335.0, 599.0, 1041.0, 1880.0, 4198.0, 11347.0, 35562.0, 114740.0, 376299.0, 346923.0, 103910.0, 32170.0, 10332.0, 3856.0, 1828.0, 952.0, 557.0, 378.0, 236.0, 177.0, 112.0, 79.0, 67.0, 29.0, 23.0, 25.0, 19.0, 12.0, 11.0, 6.0, 6.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.62109375, -7.39666748046875, -7.1722412109375, -6.94781494140625, -6.723388671875, -6.49896240234375, -6.2745361328125, -6.05010986328125, -5.82568359375, -5.60125732421875, -5.3768310546875, -5.15240478515625, -4.927978515625, -4.70355224609375, -4.4791259765625, -4.25469970703125, -4.0302734375, -3.80584716796875, -3.5814208984375, -3.35699462890625, -3.132568359375, -2.90814208984375, -2.6837158203125, -2.45928955078125, -2.23486328125, -2.01043701171875, -1.7860107421875, -1.56158447265625, -1.337158203125, -1.11273193359375, -0.8883056640625, -0.66387939453125, -0.439453125, -0.21502685546875, 0.0093994140625, 0.23382568359375, 0.458251953125, 0.68267822265625, 0.9071044921875, 1.13153076171875, 1.35595703125, 1.58038330078125, 1.8048095703125, 2.02923583984375, 2.253662109375, 2.47808837890625, 2.7025146484375, 2.92694091796875, 3.1513671875, 3.37579345703125, 3.6002197265625, 3.82464599609375, 4.049072265625, 4.27349853515625, 4.4979248046875, 4.72235107421875, 4.94677734375, 5.17120361328125, 5.3956298828125, 5.62005615234375, 5.844482421875, 6.06890869140625, 6.2933349609375, 6.51776123046875, 6.7421875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 10.0, 10.0, 5.0, 10.0, 11.0, 16.0, 15.0, 23.0, 21.0, 22.0, 28.0, 26.0, 37.0, 24.0, 44.0, 50.0, 35.0, 41.0, 49.0, 49.0, 43.0, 49.0, 47.0, 39.0, 31.0, 33.0, 27.0, 36.0, 29.0, 19.0, 20.0, 15.0, 12.0, 15.0, 7.0, 7.0, 3.0, 9.0, 10.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.345703125, -3.244720458984375, -3.14373779296875, -3.042755126953125, -2.9417724609375, -2.840789794921875, -2.73980712890625, -2.638824462890625, -2.537841796875, -2.436859130859375, -2.33587646484375, -2.234893798828125, -2.1339111328125, -2.032928466796875, -1.93194580078125, -1.830963134765625, -1.72998046875, -1.628997802734375, -1.52801513671875, -1.427032470703125, -1.3260498046875, -1.225067138671875, -1.12408447265625, -1.023101806640625, -0.922119140625, -0.821136474609375, -0.72015380859375, -0.619171142578125, -0.5181884765625, -0.417205810546875, -0.31622314453125, -0.215240478515625, -0.1142578125, -0.013275146484375, 0.08770751953125, 0.188690185546875, 0.2896728515625, 0.390655517578125, 0.49163818359375, 0.592620849609375, 0.693603515625, 0.794586181640625, 0.89556884765625, 0.996551513671875, 1.0975341796875, 1.198516845703125, 1.29949951171875, 1.400482177734375, 1.50146484375, 1.602447509765625, 1.70343017578125, 1.804412841796875, 1.9053955078125, 2.006378173828125, 2.10736083984375, 2.208343505859375, 2.309326171875, 2.410308837890625, 2.51129150390625, 2.612274169921875, 2.7132568359375, 2.814239501953125, 2.91522216796875, 3.016204833984375, 3.1171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 3.0, 7.0, 8.0, 9.0, 18.0, 20.0, 33.0, 36.0, 62.0, 97.0, 164.0, 212.0, 310.0, 591.0, 1003.0, 1845.0, 3570.0, 8773.0, 25123.0, 89728.0, 354191.0, 405959.0, 108235.0, 29514.0, 10120.0, 4138.0, 1992.0, 1040.0, 677.0, 387.0, 226.0, 156.0, 99.0, 57.0, 49.0, 31.0, 28.0, 13.0, 11.0, 4.0, 4.0, 3.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.75, -5.590576171875, -5.43115234375, -5.271728515625, -5.1123046875, -4.952880859375, -4.79345703125, -4.634033203125, -4.474609375, -4.315185546875, -4.15576171875, -3.996337890625, -3.8369140625, -3.677490234375, -3.51806640625, -3.358642578125, -3.19921875, -3.039794921875, -2.88037109375, -2.720947265625, -2.5615234375, -2.402099609375, -2.24267578125, -2.083251953125, -1.923828125, -1.764404296875, -1.60498046875, -1.445556640625, -1.2861328125, -1.126708984375, -0.96728515625, -0.807861328125, -0.6484375, -0.489013671875, -0.32958984375, -0.170166015625, -0.0107421875, 0.148681640625, 0.30810546875, 0.467529296875, 0.626953125, 0.786376953125, 0.94580078125, 1.105224609375, 1.2646484375, 1.424072265625, 1.58349609375, 1.742919921875, 1.90234375, 2.061767578125, 2.22119140625, 2.380615234375, 2.5400390625, 2.699462890625, 2.85888671875, 3.018310546875, 3.177734375, 3.337158203125, 3.49658203125, 3.656005859375, 3.8154296875, 3.974853515625, 4.13427734375, 4.293701171875, 4.453125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 8.0, 2.0, 7.0, 11.0, 20.0, 17.0, 31.0, 18.0, 27.0, 37.0, 45.0, 52.0, 84.0, 101.0, 95.0, 83.0, 70.0, 40.0, 59.0, 26.0, 35.0, 22.0, 23.0, 13.0, 16.0, 8.0, 7.0, 9.0, 5.0, 5.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006237030029296875, -0.0006044134497642517, -0.0005851238965988159, -0.0005658343434333801, -0.0005465447902679443, -0.0005272552371025085, -0.0005079656839370728, -0.000488676130771637, -0.00046938657760620117, -0.0004500970244407654, -0.0004308074712753296, -0.0004115179181098938, -0.000392228364944458, -0.0003729388117790222, -0.0003536492586135864, -0.00033435970544815063, -0.00031507015228271484, -0.00029578059911727905, -0.00027649104595184326, -0.00025720149278640747, -0.00023791193962097168, -0.0002186223864555359, -0.0001993328332901001, -0.0001800432801246643, -0.00016075372695922852, -0.00014146417379379272, -0.00012217462062835693, -0.00010288506746292114, -8.359551429748535e-05, -6.430596113204956e-05, -4.501640796661377e-05, -2.572685480117798e-05, -6.4373016357421875e-06, 1.2852251529693604e-05, 3.2141804695129395e-05, 5.1431357860565186e-05, 7.072091102600098e-05, 9.001046419143677e-05, 0.00010930001735687256, 0.00012858957052230835, 0.00014787912368774414, 0.00016716867685317993, 0.00018645823001861572, 0.00020574778318405151, 0.0002250373363494873, 0.0002443268895149231, 0.0002636164426803589, 0.0002829059958457947, 0.00030219554901123047, 0.00032148510217666626, 0.00034077465534210205, 0.00036006420850753784, 0.00037935376167297363, 0.0003986433148384094, 0.0004179328680038452, 0.000437222421169281, 0.0004565119743347168, 0.0004758015275001526, 0.0004950910806655884, 0.0005143806338310242, 0.00053367018699646, 0.0005529597401618958, 0.0005722492933273315, 0.0005915388464927673, 0.0006108283996582031]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 9.0, 12.0, 14.0, 22.0, 16.0, 36.0, 54.0, 70.0, 123.0, 191.0, 332.0, 589.0, 1189.0, 2567.0, 6867.0, 23070.0, 119682.0, 621567.0, 219774.0, 36255.0, 9458.0, 3468.0, 1463.0, 713.0, 371.0, 219.0, 129.0, 100.0, 62.0, 37.0, 31.0, 19.0, 12.0, 7.0, 10.0, 7.0, 3.0, 2.0, 4.0, 0.0, 0.0, 2.0], "bins": [-9.703125, -9.45843505859375, -9.2137451171875, -8.96905517578125, -8.724365234375, -8.47967529296875, -8.2349853515625, -7.99029541015625, -7.74560546875, -7.50091552734375, -7.2562255859375, -7.01153564453125, -6.766845703125, -6.52215576171875, -6.2774658203125, -6.03277587890625, -5.7880859375, -5.54339599609375, -5.2987060546875, -5.05401611328125, -4.809326171875, -4.56463623046875, -4.3199462890625, -4.07525634765625, -3.83056640625, -3.58587646484375, -3.3411865234375, -3.09649658203125, -2.851806640625, -2.60711669921875, -2.3624267578125, -2.11773681640625, -1.873046875, -1.62835693359375, -1.3836669921875, -1.13897705078125, -0.894287109375, -0.64959716796875, -0.4049072265625, -0.16021728515625, 0.08447265625, 0.32916259765625, 0.5738525390625, 0.81854248046875, 1.063232421875, 1.30792236328125, 1.5526123046875, 1.79730224609375, 2.0419921875, 2.28668212890625, 2.5313720703125, 2.77606201171875, 3.020751953125, 3.26544189453125, 3.5101318359375, 3.75482177734375, 3.99951171875, 4.24420166015625, 4.4888916015625, 4.73358154296875, 4.978271484375, 5.22296142578125, 5.4676513671875, 5.71234130859375, 5.95703125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 3.0, 8.0, 9.0, 9.0, 24.0, 22.0, 41.0, 60.0, 73.0, 93.0, 131.0, 142.0, 94.0, 89.0, 51.0, 40.0, 37.0, 21.0, 13.0, 11.0, 5.0, 9.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9765625, -4.8265380859375, -4.676513671875, -4.5264892578125, -4.37646484375, -4.2264404296875, -4.076416015625, -3.9263916015625, -3.7763671875, -3.6263427734375, -3.476318359375, -3.3262939453125, -3.17626953125, -3.0262451171875, -2.876220703125, -2.7261962890625, -2.576171875, -2.4261474609375, -2.276123046875, -2.1260986328125, -1.97607421875, -1.8260498046875, -1.676025390625, -1.5260009765625, -1.3759765625, -1.2259521484375, -1.075927734375, -0.9259033203125, -0.77587890625, -0.6258544921875, -0.475830078125, -0.3258056640625, -0.17578125, -0.0257568359375, 0.124267578125, 0.2742919921875, 0.42431640625, 0.5743408203125, 0.724365234375, 0.8743896484375, 1.0244140625, 1.1744384765625, 1.324462890625, 1.4744873046875, 1.62451171875, 1.7745361328125, 1.924560546875, 2.0745849609375, 2.224609375, 2.3746337890625, 2.524658203125, 2.6746826171875, 2.82470703125, 2.9747314453125, 3.124755859375, 3.2747802734375, 3.4248046875, 3.5748291015625, 3.724853515625, 3.8748779296875, 4.02490234375, 4.1749267578125, 4.324951171875, 4.4749755859375, 4.625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 12.0, 18.0, 56.0, 111.0, 176.0, 201.0, 206.0, 120.0, 47.0, 27.0, 9.0, 7.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.3677978515625, -53.887420654296875, -51.40704345703125, -48.92666244506836, -46.446285247802734, -43.96590805053711, -41.48552703857422, -39.005149841308594, -36.52477264404297, -34.044395446777344, -31.564016342163086, -29.083637237548828, -26.603260040283203, -24.122882843017578, -21.64250373840332, -19.162124633789062, -16.681747436523438, -14.201369285583496, -11.720991134643555, -9.240612983703613, -6.760234832763672, -4.2798566818237305, -1.799478530883789, 0.6809005737304688, 3.1612777709960938, 5.641655921936035, 8.122034072875977, 10.602412223815918, 13.08279037475586, 15.5631685256958, 18.043546676635742, 20.52392578125, 23.004302978515625, 25.48468017578125, 27.965059280395508, 30.445438385009766, 32.92581558227539, 35.406192779541016, 37.886573791503906, 40.36695098876953, 42.847328186035156, 45.32770538330078, 47.808082580566406, 50.2884635925293, 52.76884078979492, 55.24921798706055, 57.72959899902344, 60.20997619628906, 62.69035339355469, 65.17073059082031, 67.65110778808594, 70.13148498535156, 72.61186218261719, 75.09224700927734, 77.57262420654297, 80.0530014038086, 82.53337860107422, 85.01375579833984, 87.49413299560547, 89.9745101928711, 92.45489501953125, 94.93527221679688, 97.4156494140625, 99.89602661132812, 102.37640380859375]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 5.0, 5.0, 9.0, 8.0, 9.0, 4.0, 10.0, 13.0, 15.0, 19.0, 28.0, 33.0, 23.0, 30.0, 34.0, 35.0, 39.0, 36.0, 43.0, 44.0, 45.0, 38.0, 48.0, 40.0, 36.0, 39.0, 38.0, 35.0, 34.0, 33.0, 17.0, 37.0, 15.0, 13.0, 15.0, 9.0, 15.0, 13.0, 15.0, 5.0, 4.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-23.49938201904297, -22.778366088867188, -22.057348251342773, -21.336332321166992, -20.61531639099121, -19.894298553466797, -19.173282623291016, -18.452266693115234, -17.731250762939453, -17.010234832763672, -16.289216995239258, -15.568201065063477, -14.847185134887695, -14.126168251037598, -13.4051513671875, -12.684135437011719, -11.963117599487305, -11.242100715637207, -10.521084785461426, -9.800067901611328, -9.079051971435547, -8.35803508758545, -7.637018203735352, -6.916001796722412, -6.194985389709473, -5.473968982696533, -4.752952575683594, -4.031935691833496, -3.3109192848205566, -2.589902877807617, -1.8688859939575195, -1.14786958694458, -0.4268512725830078, 0.2941652536392212, 1.0151817798614502, 1.7361984252929688, 2.457214832305908, 3.1782312393188477, 3.8992481231689453, 4.620264530181885, 5.341280937194824, 6.062297344207764, 6.783313751220703, 7.504330635070801, 8.225347518920898, 8.94636344909668, 9.667380332946777, 10.388397216796875, 11.109413146972656, 11.830430030822754, 12.551445960998535, 13.272462844848633, 13.993478775024414, 14.714495658874512, 15.43551254272461, 16.15652847290039, 16.877544403076172, 17.598560333251953, 18.319578170776367, 19.04059410095215, 19.76161003112793, 20.482627868652344, 21.203643798828125, 21.924659729003906, 22.64567756652832]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 12.0, 33.0, 39.0, 78.0, 159.0, 339.0, 866.0, 2921.0, 14627.0, 173050.0, 3883936.0, 103269.0, 10903.0, 2522.0, 830.0, 345.0, 155.0, 83.0, 47.0, 24.0, 13.0, 7.0, 7.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.65625, -11.2310791015625, -10.805908203125, -10.3807373046875, -9.95556640625, -9.5303955078125, -9.105224609375, -8.6800537109375, -8.2548828125, -7.8297119140625, -7.404541015625, -6.9793701171875, -6.55419921875, -6.1290283203125, -5.703857421875, -5.2786865234375, -4.853515625, -4.4283447265625, -4.003173828125, -3.5780029296875, -3.15283203125, -2.7276611328125, -2.302490234375, -1.8773193359375, -1.4521484375, -1.0269775390625, -0.601806640625, -0.1766357421875, 0.24853515625, 0.6737060546875, 1.098876953125, 1.5240478515625, 1.94921875, 2.3743896484375, 2.799560546875, 3.2247314453125, 3.64990234375, 4.0750732421875, 4.500244140625, 4.9254150390625, 5.3505859375, 5.7757568359375, 6.200927734375, 6.6260986328125, 7.05126953125, 7.4764404296875, 7.901611328125, 8.3267822265625, 8.751953125, 9.1771240234375, 9.602294921875, 10.0274658203125, 10.45263671875, 10.8778076171875, 11.302978515625, 11.7281494140625, 12.1533203125, 12.5784912109375, 13.003662109375, 13.4288330078125, 13.85400390625, 14.2791748046875, 14.704345703125, 15.1295166015625, 15.5546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 17.0, 23.0, 36.0, 56.0, 77.0, 120.0, 145.0, 127.0, 109.0, 90.0, 81.0, 49.0, 26.0, 14.0, 9.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.25390625, -1.2076873779296875, -1.161468505859375, -1.1152496337890625, -1.06903076171875, -1.0228118896484375, -0.976593017578125, -0.9303741455078125, -0.8841552734375, -0.8379364013671875, -0.791717529296875, -0.7454986572265625, -0.69927978515625, -0.6530609130859375, -0.606842041015625, -0.5606231689453125, -0.514404296875, -0.4681854248046875, -0.421966552734375, -0.3757476806640625, -0.32952880859375, -0.2833099365234375, -0.237091064453125, -0.1908721923828125, -0.1446533203125, -0.0984344482421875, -0.052215576171875, -0.0059967041015625, 0.04022216796875, 0.0864410400390625, 0.132659912109375, 0.1788787841796875, 0.22509765625, 0.2713165283203125, 0.317535400390625, 0.3637542724609375, 0.40997314453125, 0.4561920166015625, 0.502410888671875, 0.5486297607421875, 0.5948486328125, 0.6410675048828125, 0.687286376953125, 0.7335052490234375, 0.77972412109375, 0.8259429931640625, 0.872161865234375, 0.9183807373046875, 0.964599609375, 1.0108184814453125, 1.057037353515625, 1.1032562255859375, 1.14947509765625, 1.1956939697265625, 1.241912841796875, 1.2881317138671875, 1.3343505859375, 1.3805694580078125, 1.426788330078125, 1.4730072021484375, 1.51922607421875, 1.5654449462890625, 1.611663818359375, 1.6578826904296875, 1.7041015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 14.0, 12.0, 23.0, 19.0, 30.0, 62.0, 75.0, 147.0, 270.0, 569.0, 1317.0, 3019.0, 7816.0, 23661.0, 89311.0, 581511.0, 3131988.0, 272717.0, 55239.0, 16370.0, 5789.0, 2222.0, 994.0, 491.0, 243.0, 144.0, 92.0, 41.0, 32.0, 15.0, 14.0, 8.0, 7.0, 11.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.4608154296875, -8.234130859375, -8.0074462890625, -7.78076171875, -7.5540771484375, -7.327392578125, -7.1007080078125, -6.8740234375, -6.6473388671875, -6.420654296875, -6.1939697265625, -5.96728515625, -5.7406005859375, -5.513916015625, -5.2872314453125, -5.060546875, -4.8338623046875, -4.607177734375, -4.3804931640625, -4.15380859375, -3.9271240234375, -3.700439453125, -3.4737548828125, -3.2470703125, -3.0203857421875, -2.793701171875, -2.5670166015625, -2.34033203125, -2.1136474609375, -1.886962890625, -1.6602783203125, -1.43359375, -1.2069091796875, -0.980224609375, -0.7535400390625, -0.52685546875, -0.3001708984375, -0.073486328125, 0.1531982421875, 0.3798828125, 0.6065673828125, 0.833251953125, 1.0599365234375, 1.28662109375, 1.5133056640625, 1.739990234375, 1.9666748046875, 2.193359375, 2.4200439453125, 2.646728515625, 2.8734130859375, 3.10009765625, 3.3267822265625, 3.553466796875, 3.7801513671875, 4.0068359375, 4.2335205078125, 4.460205078125, 4.6868896484375, 4.91357421875, 5.1402587890625, 5.366943359375, 5.5936279296875, 5.8203125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 2.0, 1.0, 6.0, 7.0, 7.0, 11.0, 15.0, 17.0, 8.0, 29.0, 31.0, 38.0, 55.0, 84.0, 102.0, 131.0, 225.0, 324.0, 685.0, 996.0, 381.0, 258.0, 137.0, 142.0, 87.0, 56.0, 50.0, 32.0, 26.0, 29.0, 23.0, 10.0, 7.0, 10.0, 9.0, 8.0, 6.0, 8.0, 5.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0634765625, -1.0242462158203125, -0.985015869140625, -0.9457855224609375, -0.90655517578125, -0.8673248291015625, -0.828094482421875, -0.7888641357421875, -0.7496337890625, -0.7104034423828125, -0.671173095703125, -0.6319427490234375, -0.59271240234375, -0.5534820556640625, -0.514251708984375, -0.4750213623046875, -0.435791015625, -0.3965606689453125, -0.357330322265625, -0.3180999755859375, -0.27886962890625, -0.2396392822265625, -0.200408935546875, -0.1611785888671875, -0.1219482421875, -0.0827178955078125, -0.043487548828125, -0.0042572021484375, 0.03497314453125, 0.0742034912109375, 0.113433837890625, 0.1526641845703125, 0.19189453125, 0.2311248779296875, 0.270355224609375, 0.3095855712890625, 0.34881591796875, 0.3880462646484375, 0.427276611328125, 0.4665069580078125, 0.5057373046875, 0.5449676513671875, 0.584197998046875, 0.6234283447265625, 0.66265869140625, 0.7018890380859375, 0.741119384765625, 0.7803497314453125, 0.819580078125, 0.8588104248046875, 0.898040771484375, 0.9372711181640625, 0.97650146484375, 1.0157318115234375, 1.054962158203125, 1.0941925048828125, 1.1334228515625, 1.1726531982421875, 1.211883544921875, 1.2511138916015625, 1.29034423828125, 1.3295745849609375, 1.368804931640625, 1.4080352783203125, 1.447265625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 13.0, 33.0, 65.0, 137.0, 216.0, 205.0, 164.0, 91.0, 51.0, 18.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.177021026611328, -17.479427337646484, -16.781831741333008, -16.084238052368164, -15.38664436340332, -14.68904972076416, -13.991455078125, -13.293861389160156, -12.596266746520996, -11.898672103881836, -11.201078414916992, -10.503483772277832, -9.805889129638672, -9.108295440673828, -8.410700798034668, -7.713106632232666, -7.015512466430664, -6.317918300628662, -5.62032413482666, -4.9227294921875, -4.225135326385498, -3.527541160583496, -2.829946517944336, -2.132352352142334, -1.434758186340332, -0.7371639013290405, -0.03956961631774902, 0.658024787902832, 1.355618953704834, 2.053213119506836, 2.750807762145996, 3.448401927947998, 4.145998001098633, 4.843592166900635, 5.541186332702637, 6.238780975341797, 6.936375141143799, 7.633969306945801, 8.331563949584961, 9.029157638549805, 9.726752281188965, 10.424346923828125, 11.121940612792969, 11.819535255432129, 12.517129898071289, 13.214723587036133, 13.912318229675293, 14.609912872314453, 15.307506561279297, 16.00510025024414, 16.702695846557617, 17.40028953552246, 18.097883224487305, 18.79547882080078, 19.493072509765625, 20.19066619873047, 20.888259887695312, 21.585853576660156, 22.283449172973633, 22.981042861938477, 23.67863655090332, 24.376232147216797, 25.07382583618164, 25.771419525146484, 26.46901512145996]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 4.0, 9.0, 10.0, 23.0, 15.0, 23.0, 13.0, 18.0, 29.0, 28.0, 26.0, 21.0, 37.0, 32.0, 30.0, 47.0, 43.0, 36.0, 31.0, 33.0, 36.0, 39.0, 32.0, 38.0, 37.0, 36.0, 36.0, 36.0, 16.0, 31.0, 28.0, 15.0, 15.0, 17.0, 9.0, 8.0, 6.0, 12.0, 6.0, 3.0, 2.0, 6.0, 2.0, 2.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-5.330476760864258, -5.17071008682251, -5.01094388961792, -4.851177215576172, -4.691410541534424, -4.531644344329834, -4.371877670288086, -4.212111473083496, -4.052344799041748, -3.892578363418579, -3.732811689376831, -3.573045253753662, -3.413278818130493, -3.253512382507324, -3.093745708465576, -2.9339792728424072, -2.774212598800659, -2.6144461631774902, -2.454679489135742, -2.2949130535125732, -2.1351466178894043, -1.9753800630569458, -1.8156135082244873, -1.6558470726013184, -1.4960805177688599, -1.3363139629364014, -1.1765475273132324, -1.016780972480774, -0.8570144772529602, -0.6972479820251465, -0.537481427192688, -0.37771499156951904, -0.21794843673706055, -0.05818192660808563, 0.10158458352088928, 0.2613511085510254, 0.4211176037788391, 0.5808840990066528, 0.7406506538391113, 0.9004170894622803, 1.0601836442947388, 1.2199501991271973, 1.3797166347503662, 1.5394831895828247, 1.6992497444152832, 1.8590161800384521, 2.018782615661621, 2.178549289703369, 2.338315725326538, 2.498082160949707, 2.657848834991455, 2.817615270614624, 2.977381706237793, 3.137148380279541, 3.29691481590271, 3.456681251525879, 3.616447925567627, 3.776214361190796, 3.935981035232544, 4.095747470855713, 4.255514144897461, 4.415280342102051, 4.575047016143799, 4.734813690185547, 4.894579887390137]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 9.0, 9.0, 17.0, 31.0, 42.0, 65.0, 97.0, 134.0, 249.0, 335.0, 561.0, 1122.0, 2275.0, 5957.0, 17870.0, 61823.0, 215118.0, 452619.0, 204496.0, 58429.0, 16948.0, 5624.0, 2154.0, 1072.0, 573.0, 323.0, 220.0, 141.0, 95.0, 57.0, 37.0, 23.0, 9.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.03515625, -4.8375244140625, -4.639892578125, -4.4422607421875, -4.24462890625, -4.0469970703125, -3.849365234375, -3.6517333984375, -3.4541015625, -3.2564697265625, -3.058837890625, -2.8612060546875, -2.66357421875, -2.4659423828125, -2.268310546875, -2.0706787109375, -1.873046875, -1.6754150390625, -1.477783203125, -1.2801513671875, -1.08251953125, -0.8848876953125, -0.687255859375, -0.4896240234375, -0.2919921875, -0.0943603515625, 0.103271484375, 0.3009033203125, 0.49853515625, 0.6961669921875, 0.893798828125, 1.0914306640625, 1.2890625, 1.4866943359375, 1.684326171875, 1.8819580078125, 2.07958984375, 2.2772216796875, 2.474853515625, 2.6724853515625, 2.8701171875, 3.0677490234375, 3.265380859375, 3.4630126953125, 3.66064453125, 3.8582763671875, 4.055908203125, 4.2535400390625, 4.451171875, 4.6488037109375, 4.846435546875, 5.0440673828125, 5.24169921875, 5.4393310546875, 5.636962890625, 5.8345947265625, 6.0322265625, 6.2298583984375, 6.427490234375, 6.6251220703125, 6.82275390625, 7.0203857421875, 7.218017578125, 7.4156494140625, 7.61328125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 5.0, 4.0, 15.0, 22.0, 37.0, 54.0, 78.0, 101.0, 105.0, 113.0, 111.0, 86.0, 76.0, 73.0, 37.0, 40.0, 13.0, 14.0, 10.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.2269439697265625, -1.184356689453125, -1.1417694091796875, -1.09918212890625, -1.0565948486328125, -1.014007568359375, -0.9714202880859375, -0.9288330078125, -0.8862457275390625, -0.843658447265625, -0.8010711669921875, -0.75848388671875, -0.7158966064453125, -0.673309326171875, -0.6307220458984375, -0.588134765625, -0.5455474853515625, -0.502960205078125, -0.4603729248046875, -0.41778564453125, -0.3751983642578125, -0.332611083984375, -0.2900238037109375, -0.2474365234375, -0.2048492431640625, -0.162261962890625, -0.1196746826171875, -0.07708740234375, -0.0345001220703125, 0.008087158203125, 0.0506744384765625, 0.09326171875, 0.1358489990234375, 0.178436279296875, 0.2210235595703125, 0.26361083984375, 0.3061981201171875, 0.348785400390625, 0.3913726806640625, 0.4339599609375, 0.4765472412109375, 0.519134521484375, 0.5617218017578125, 0.60430908203125, 0.6468963623046875, 0.689483642578125, 0.7320709228515625, 0.774658203125, 0.8172454833984375, 0.859832763671875, 0.9024200439453125, 0.94500732421875, 0.9875946044921875, 1.030181884765625, 1.0727691650390625, 1.1153564453125, 1.1579437255859375, 1.200531005859375, 1.2431182861328125, 1.28570556640625, 1.3282928466796875, 1.370880126953125, 1.4134674072265625, 1.4560546875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 1.0, 1.0, 7.0, 7.0, 6.0, 23.0, 41.0, 47.0, 67.0, 116.0, 175.0, 263.0, 481.0, 857.0, 1805.0, 4445.0, 14240.0, 55587.0, 221524.0, 482711.0, 196978.0, 48762.0, 12772.0, 3927.0, 1624.0, 848.0, 478.0, 301.0, 164.0, 95.0, 69.0, 39.0, 36.0, 26.0, 11.0, 10.0, 6.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.26171875, -6.04913330078125, -5.8365478515625, -5.62396240234375, -5.411376953125, -5.19879150390625, -4.9862060546875, -4.77362060546875, -4.56103515625, -4.34844970703125, -4.1358642578125, -3.92327880859375, -3.710693359375, -3.49810791015625, -3.2855224609375, -3.07293701171875, -2.8603515625, -2.64776611328125, -2.4351806640625, -2.22259521484375, -2.010009765625, -1.79742431640625, -1.5848388671875, -1.37225341796875, -1.15966796875, -0.94708251953125, -0.7344970703125, -0.52191162109375, -0.309326171875, -0.09674072265625, 0.1158447265625, 0.32843017578125, 0.541015625, 0.75360107421875, 0.9661865234375, 1.17877197265625, 1.391357421875, 1.60394287109375, 1.8165283203125, 2.02911376953125, 2.24169921875, 2.45428466796875, 2.6668701171875, 2.87945556640625, 3.092041015625, 3.30462646484375, 3.5172119140625, 3.72979736328125, 3.9423828125, 4.15496826171875, 4.3675537109375, 4.58013916015625, 4.792724609375, 5.00531005859375, 5.2178955078125, 5.43048095703125, 5.64306640625, 5.85565185546875, 6.0682373046875, 6.28082275390625, 6.493408203125, 6.70599365234375, 6.9185791015625, 7.13116455078125, 7.34375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 7.0, 5.0, 10.0, 18.0, 13.0, 21.0, 29.0, 25.0, 27.0, 33.0, 36.0, 30.0, 59.0, 34.0, 44.0, 42.0, 46.0, 50.0, 38.0, 33.0, 45.0, 45.0, 36.0, 36.0, 35.0, 33.0, 26.0, 24.0, 14.0, 17.0, 13.0, 8.0, 8.0, 14.0, 9.0, 6.0, 5.0, 0.0, 6.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.486328125, -3.377777099609375, -3.26922607421875, -3.160675048828125, -3.0521240234375, -2.943572998046875, -2.83502197265625, -2.726470947265625, -2.617919921875, -2.509368896484375, -2.40081787109375, -2.292266845703125, -2.1837158203125, -2.075164794921875, -1.96661376953125, -1.858062744140625, -1.74951171875, -1.640960693359375, -1.53240966796875, -1.423858642578125, -1.3153076171875, -1.206756591796875, -1.09820556640625, -0.989654541015625, -0.881103515625, -0.772552490234375, -0.66400146484375, -0.555450439453125, -0.4468994140625, -0.338348388671875, -0.22979736328125, -0.121246337890625, -0.0126953125, 0.095855712890625, 0.20440673828125, 0.312957763671875, 0.4215087890625, 0.530059814453125, 0.63861083984375, 0.747161865234375, 0.855712890625, 0.964263916015625, 1.07281494140625, 1.181365966796875, 1.2899169921875, 1.398468017578125, 1.50701904296875, 1.615570068359375, 1.72412109375, 1.832672119140625, 1.94122314453125, 2.049774169921875, 2.1583251953125, 2.266876220703125, 2.37542724609375, 2.483978271484375, 2.592529296875, 2.701080322265625, 2.80963134765625, 2.918182373046875, 3.0267333984375, 3.135284423828125, 3.24383544921875, 3.352386474609375, 3.4609375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 5.0, 14.0, 15.0, 21.0, 31.0, 48.0, 89.0, 134.0, 256.0, 551.0, 1230.0, 2983.0, 8513.0, 27582.0, 107740.0, 421142.0, 359074.0, 84572.0, 22628.0, 7146.0, 2625.0, 1080.0, 501.0, 235.0, 137.0, 68.0, 44.0, 26.0, 25.0, 18.0, 15.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.8671875, -3.74603271484375, -3.6248779296875, -3.50372314453125, -3.382568359375, -3.26141357421875, -3.1402587890625, -3.01910400390625, -2.89794921875, -2.77679443359375, -2.6556396484375, -2.53448486328125, -2.413330078125, -2.29217529296875, -2.1710205078125, -2.04986572265625, -1.9287109375, -1.80755615234375, -1.6864013671875, -1.56524658203125, -1.444091796875, -1.32293701171875, -1.2017822265625, -1.08062744140625, -0.95947265625, -0.83831787109375, -0.7171630859375, -0.59600830078125, -0.474853515625, -0.35369873046875, -0.2325439453125, -0.11138916015625, 0.009765625, 0.13092041015625, 0.2520751953125, 0.37322998046875, 0.494384765625, 0.61553955078125, 0.7366943359375, 0.85784912109375, 0.97900390625, 1.10015869140625, 1.2213134765625, 1.34246826171875, 1.463623046875, 1.58477783203125, 1.7059326171875, 1.82708740234375, 1.9482421875, 2.06939697265625, 2.1905517578125, 2.31170654296875, 2.432861328125, 2.55401611328125, 2.6751708984375, 2.79632568359375, 2.91748046875, 3.03863525390625, 3.1597900390625, 3.28094482421875, 3.402099609375, 3.52325439453125, 3.6444091796875, 3.76556396484375, 3.88671875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 3.0, 6.0, 11.0, 9.0, 22.0, 24.0, 28.0, 26.0, 45.0, 51.0, 74.0, 83.0, 104.0, 112.0, 100.0, 77.0, 42.0, 40.0, 31.0, 31.0, 16.0, 14.0, 10.0, 10.0, 12.0, 2.0, 3.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0007815361022949219, -0.000759810209274292, -0.0007380843162536621, -0.0007163584232330322, -0.0006946325302124023, -0.0006729066371917725, -0.0006511807441711426, -0.0006294548511505127, -0.0006077289581298828, -0.0005860030651092529, -0.000564277172088623, -0.0005425512790679932, -0.0005208253860473633, -0.0004990994930267334, -0.0004773736000061035, -0.00045564770698547363, -0.00043392181396484375, -0.00041219592094421387, -0.000390470027923584, -0.0003687441349029541, -0.0003470182418823242, -0.00032529234886169434, -0.00030356645584106445, -0.00028184056282043457, -0.0002601146697998047, -0.0002383887767791748, -0.00021666288375854492, -0.00019493699073791504, -0.00017321109771728516, -0.00015148520469665527, -0.0001297593116760254, -0.00010803341865539551, -8.630752563476562e-05, -6.458163261413574e-05, -4.285573959350586e-05, -2.1129846572875977e-05, 5.960464477539062e-07, 2.232193946838379e-05, 4.404783248901367e-05, 6.577372550964355e-05, 8.749961853027344e-05, 0.00010922551155090332, 0.0001309514045715332, 0.00015267729759216309, 0.00017440319061279297, 0.00019612908363342285, 0.00021785497665405273, 0.00023958086967468262, 0.0002613067626953125, 0.0002830326557159424, 0.00030475854873657227, 0.00032648444175720215, 0.00034821033477783203, 0.0003699362277984619, 0.0003916621208190918, 0.0004133880138397217, 0.00043511390686035156, 0.00045683979988098145, 0.00047856569290161133, 0.0005002915859222412, 0.0005220174789428711, 0.000543743371963501, 0.0005654692649841309, 0.0005871951580047607, 0.0006089210510253906]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 5.0, 11.0, 22.0, 41.0, 67.0, 119.0, 192.0, 403.0, 882.0, 2310.0, 8414.0, 42480.0, 339791.0, 560785.0, 74364.0, 13294.0, 3266.0, 1070.0, 506.0, 246.0, 123.0, 77.0, 30.0, 18.0, 15.0, 7.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.87109375, -6.69097900390625, -6.5108642578125, -6.33074951171875, -6.150634765625, -5.97052001953125, -5.7904052734375, -5.61029052734375, -5.43017578125, -5.25006103515625, -5.0699462890625, -4.88983154296875, -4.709716796875, -4.52960205078125, -4.3494873046875, -4.16937255859375, -3.9892578125, -3.80914306640625, -3.6290283203125, -3.44891357421875, -3.268798828125, -3.08868408203125, -2.9085693359375, -2.72845458984375, -2.54833984375, -2.36822509765625, -2.1881103515625, -2.00799560546875, -1.827880859375, -1.64776611328125, -1.4676513671875, -1.28753662109375, -1.107421875, -0.92730712890625, -0.7471923828125, -0.56707763671875, -0.386962890625, -0.20684814453125, -0.0267333984375, 0.15338134765625, 0.33349609375, 0.51361083984375, 0.6937255859375, 0.87384033203125, 1.053955078125, 1.23406982421875, 1.4141845703125, 1.59429931640625, 1.7744140625, 1.95452880859375, 2.1346435546875, 2.31475830078125, 2.494873046875, 2.67498779296875, 2.8551025390625, 3.03521728515625, 3.21533203125, 3.39544677734375, 3.5755615234375, 3.75567626953125, 3.935791015625, 4.11590576171875, 4.2960205078125, 4.47613525390625, 4.65625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 6.0, 6.0, 6.0, 21.0, 33.0, 48.0, 74.0, 135.0, 155.0, 157.0, 127.0, 86.0, 51.0, 32.0, 24.0, 16.0, 10.0, 7.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.97265625, -5.82763671875, -5.6826171875, -5.53759765625, -5.392578125, -5.24755859375, -5.1025390625, -4.95751953125, -4.8125, -4.66748046875, -4.5224609375, -4.37744140625, -4.232421875, -4.08740234375, -3.9423828125, -3.79736328125, -3.65234375, -3.50732421875, -3.3623046875, -3.21728515625, -3.072265625, -2.92724609375, -2.7822265625, -2.63720703125, -2.4921875, -2.34716796875, -2.2021484375, -2.05712890625, -1.912109375, -1.76708984375, -1.6220703125, -1.47705078125, -1.33203125, -1.18701171875, -1.0419921875, -0.89697265625, -0.751953125, -0.60693359375, -0.4619140625, -0.31689453125, -0.171875, -0.02685546875, 0.1181640625, 0.26318359375, 0.408203125, 0.55322265625, 0.6982421875, 0.84326171875, 0.98828125, 1.13330078125, 1.2783203125, 1.42333984375, 1.568359375, 1.71337890625, 1.8583984375, 2.00341796875, 2.1484375, 2.29345703125, 2.4384765625, 2.58349609375, 2.728515625, 2.87353515625, 3.0185546875, 3.16357421875, 3.30859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 2.0, 6.0, 27.0, 39.0, 120.0, 218.0, 246.0, 206.0, 89.0, 35.0, 14.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.973995208740234, -52.52726745605469, -50.080543518066406, -47.633819580078125, -45.18709182739258, -42.74036407470703, -40.29364013671875, -37.84691619873047, -35.40018844604492, -32.953460693359375, -30.506736755371094, -28.06001091003418, -25.613285064697266, -23.16655921936035, -20.719833374023438, -18.273107528686523, -15.82638168334961, -13.379655838012695, -10.932929992675781, -8.486204147338867, -6.039478302001953, -3.592752456665039, -1.146026611328125, 1.300699234008789, 3.747425079345703, 6.194150924682617, 8.640876770019531, 11.087602615356445, 13.53432846069336, 15.981054306030273, 18.427780151367188, 20.8745059967041, 23.32122802734375, 25.767953872680664, 28.214679718017578, 30.661405563354492, 33.108131408691406, 35.55485534667969, 38.001583099365234, 40.44831085205078, 42.89503479003906, 45.341758728027344, 47.78848648071289, 50.23521423339844, 52.68193817138672, 55.128662109375, 57.57538986206055, 60.022117614746094, 62.468841552734375, 64.91556549072266, 67.36228942871094, 69.80902099609375, 72.25574493408203, 74.70246887207031, 77.14920043945312, 79.5959243774414, 82.04264831542969, 84.48937225341797, 86.93609619140625, 89.38282775878906, 91.82955169677734, 94.27627563476562, 96.72300720214844, 99.16973114013672, 101.616455078125]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 5.0, 6.0, 4.0, 6.0, 8.0, 9.0, 12.0, 7.0, 18.0, 19.0, 20.0, 28.0, 24.0, 28.0, 24.0, 37.0, 35.0, 40.0, 28.0, 47.0, 36.0, 49.0, 40.0, 34.0, 39.0, 39.0, 40.0, 48.0, 31.0, 32.0, 26.0, 32.0, 26.0, 16.0, 21.0, 15.0, 17.0, 9.0, 8.0, 10.0, 7.0, 7.0, 2.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.575660705566406, -18.952245712280273, -18.32883071899414, -17.705413818359375, -17.081998825073242, -16.45858383178711, -15.835168838500977, -15.211753845214844, -14.588337898254395, -13.964922904968262, -13.341506958007812, -12.71809196472168, -12.094676971435547, -11.471261024475098, -10.847846031188965, -10.224430084228516, -9.601015090942383, -8.97760009765625, -8.3541841506958, -7.730769157409668, -7.107353687286377, -6.483938217163086, -5.860523223876953, -5.237107753753662, -4.613692283630371, -3.99027681350708, -3.366861581802368, -2.7434463500976562, -2.1200308799743652, -1.4966154098510742, -0.8732001781463623, -0.2497849464416504, 0.3736305236816406, 0.9970458745956421, 1.6204612255096436, 2.2438764572143555, 2.8672919273376465, 3.4907073974609375, 4.11412239074707, 4.737537860870361, 5.360953330993652, 5.984368801116943, 6.607784271240234, 7.231199264526367, 7.854614734649658, 8.47803020477295, 9.101445198059082, 9.724861145019531, 10.348276138305664, 10.971691131591797, 11.595107078552246, 12.218522071838379, 12.841938018798828, 13.465353012084961, 14.088768005371094, 14.712182998657227, 15.335598945617676, 15.959013938903809, 16.582429885864258, 17.20584487915039, 17.829259872436523, 18.452674865722656, 19.076091766357422, 19.699506759643555, 20.322921752929688]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 11.0, 6.0, 13.0, 12.0, 24.0, 32.0, 45.0, 75.0, 126.0, 177.0, 369.0, 699.0, 1564.0, 3845.0, 11518.0, 47258.0, 464429.0, 3532101.0, 100663.0, 20262.0, 6364.0, 2435.0, 1056.0, 518.0, 267.0, 142.0, 106.0, 58.0, 42.0, 18.0, 19.0, 13.0, 4.0, 1.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.609375, -8.35015869140625, -8.0909423828125, -7.83172607421875, -7.572509765625, -7.31329345703125, -7.0540771484375, -6.79486083984375, -6.53564453125, -6.27642822265625, -6.0172119140625, -5.75799560546875, -5.498779296875, -5.23956298828125, -4.9803466796875, -4.72113037109375, -4.4619140625, -4.20269775390625, -3.9434814453125, -3.68426513671875, -3.425048828125, -3.16583251953125, -2.9066162109375, -2.64739990234375, -2.38818359375, -2.12896728515625, -1.8697509765625, -1.61053466796875, -1.351318359375, -1.09210205078125, -0.8328857421875, -0.57366943359375, -0.314453125, -0.05523681640625, 0.2039794921875, 0.46319580078125, 0.722412109375, 0.98162841796875, 1.2408447265625, 1.50006103515625, 1.75927734375, 2.01849365234375, 2.2777099609375, 2.53692626953125, 2.796142578125, 3.05535888671875, 3.3145751953125, 3.57379150390625, 3.8330078125, 4.09222412109375, 4.3514404296875, 4.61065673828125, 4.869873046875, 5.12908935546875, 5.3883056640625, 5.64752197265625, 5.90673828125, 6.16595458984375, 6.4251708984375, 6.68438720703125, 6.943603515625, 7.20281982421875, 7.4620361328125, 7.72125244140625, 7.98046875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 4.0, 6.0, 7.0, 16.0, 24.0, 40.0, 52.0, 74.0, 98.0, 97.0, 119.0, 103.0, 93.0, 70.0, 62.0, 53.0, 29.0, 26.0, 12.0, 12.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.236328125, -1.1918792724609375, -1.147430419921875, -1.1029815673828125, -1.05853271484375, -1.0140838623046875, -0.969635009765625, -0.9251861572265625, -0.8807373046875, -0.8362884521484375, -0.791839599609375, -0.7473907470703125, -0.70294189453125, -0.6584930419921875, -0.614044189453125, -0.5695953369140625, -0.525146484375, -0.4806976318359375, -0.436248779296875, -0.3917999267578125, -0.34735107421875, -0.3029022216796875, -0.258453369140625, -0.2140045166015625, -0.1695556640625, -0.1251068115234375, -0.080657958984375, -0.0362091064453125, 0.00823974609375, 0.0526885986328125, 0.097137451171875, 0.1415863037109375, 0.18603515625, 0.2304840087890625, 0.274932861328125, 0.3193817138671875, 0.36383056640625, 0.4082794189453125, 0.452728271484375, 0.4971771240234375, 0.5416259765625, 0.5860748291015625, 0.630523681640625, 0.6749725341796875, 0.71942138671875, 0.7638702392578125, 0.808319091796875, 0.8527679443359375, 0.897216796875, 0.9416656494140625, 0.986114501953125, 1.0305633544921875, 1.07501220703125, 1.1194610595703125, 1.163909912109375, 1.2083587646484375, 1.2528076171875, 1.2972564697265625, 1.341705322265625, 1.3861541748046875, 1.43060302734375, 1.4750518798828125, 1.519500732421875, 1.5639495849609375, 1.6083984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 1.0, 7.0, 4.0, 6.0, 11.0, 34.0, 31.0, 59.0, 117.0, 198.0, 331.0, 541.0, 1082.0, 2203.0, 4804.0, 11698.0, 31330.0, 100610.0, 544317.0, 3081597.0, 304543.0, 70148.0, 23490.0, 8968.0, 3955.0, 1909.0, 959.0, 532.0, 303.0, 190.0, 114.0, 79.0, 56.0, 17.0, 18.0, 9.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.00390625, -5.8341064453125, -5.664306640625, -5.4945068359375, -5.32470703125, -5.1549072265625, -4.985107421875, -4.8153076171875, -4.6455078125, -4.4757080078125, -4.305908203125, -4.1361083984375, -3.96630859375, -3.7965087890625, -3.626708984375, -3.4569091796875, -3.287109375, -3.1173095703125, -2.947509765625, -2.7777099609375, -2.60791015625, -2.4381103515625, -2.268310546875, -2.0985107421875, -1.9287109375, -1.7589111328125, -1.589111328125, -1.4193115234375, -1.24951171875, -1.0797119140625, -0.909912109375, -0.7401123046875, -0.5703125, -0.4005126953125, -0.230712890625, -0.0609130859375, 0.10888671875, 0.2786865234375, 0.448486328125, 0.6182861328125, 0.7880859375, 0.9578857421875, 1.127685546875, 1.2974853515625, 1.46728515625, 1.6370849609375, 1.806884765625, 1.9766845703125, 2.146484375, 2.3162841796875, 2.486083984375, 2.6558837890625, 2.82568359375, 2.9954833984375, 3.165283203125, 3.3350830078125, 3.5048828125, 3.6746826171875, 3.844482421875, 4.0142822265625, 4.18408203125, 4.3538818359375, 4.523681640625, 4.6934814453125, 4.86328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 5.0, 5.0, 6.0, 11.0, 17.0, 20.0, 29.0, 42.0, 62.0, 100.0, 149.0, 298.0, 666.0, 1531.0, 503.0, 240.0, 126.0, 73.0, 59.0, 37.0, 24.0, 19.0, 16.0, 5.0, 9.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.80078125, -1.741455078125, -1.68212890625, -1.622802734375, -1.5634765625, -1.504150390625, -1.44482421875, -1.385498046875, -1.326171875, -1.266845703125, -1.20751953125, -1.148193359375, -1.0888671875, -1.029541015625, -0.97021484375, -0.910888671875, -0.8515625, -0.792236328125, -0.73291015625, -0.673583984375, -0.6142578125, -0.554931640625, -0.49560546875, -0.436279296875, -0.376953125, -0.317626953125, -0.25830078125, -0.198974609375, -0.1396484375, -0.080322265625, -0.02099609375, 0.038330078125, 0.09765625, 0.156982421875, 0.21630859375, 0.275634765625, 0.3349609375, 0.394287109375, 0.45361328125, 0.512939453125, 0.572265625, 0.631591796875, 0.69091796875, 0.750244140625, 0.8095703125, 0.868896484375, 0.92822265625, 0.987548828125, 1.046875, 1.106201171875, 1.16552734375, 1.224853515625, 1.2841796875, 1.343505859375, 1.40283203125, 1.462158203125, 1.521484375, 1.580810546875, 1.64013671875, 1.699462890625, 1.7587890625, 1.818115234375, 1.87744140625, 1.936767578125, 1.99609375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 3.0, 5.0, 4.0, 7.0, 22.0, 34.0, 44.0, 83.0, 69.0, 104.0, 138.0, 129.0, 100.0, 96.0, 64.0, 40.0, 26.0, 11.0, 10.0, 5.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.698005676269531, -12.322754859924316, -11.947504043579102, -11.572253227233887, -11.197002410888672, -10.82175064086914, -10.446499824523926, -10.071249008178711, -9.695998191833496, -9.320747375488281, -8.945496559143066, -8.570245742797852, -8.19499397277832, -7.819743633270264, -7.444492340087891, -7.069241523742676, -6.693990707397461, -6.318739891052246, -5.943489074707031, -5.568237781524658, -5.192986965179443, -4.8177361488342285, -4.4424848556518555, -4.067234039306641, -3.691983222961426, -3.316732406616211, -2.941481351852417, -2.566230297088623, -2.190979480743408, -1.8157285451889038, -1.4404776096343994, -1.0652265548706055, -0.689976692199707, -0.31472575664520264, 0.06052517890930176, 0.43577611446380615, 0.8110270500183105, 1.186277985572815, 1.5615289211273193, 1.9367799758911133, 2.312030792236328, 2.687281608581543, 3.062532663345337, 3.437783718109131, 3.8130345344543457, 4.1882853507995605, 4.563536643981934, 4.938787460327148, 5.314038276672363, 5.689289093017578, 6.064539909362793, 6.439791202545166, 6.815042018890381, 7.190292835235596, 7.565544128417969, 7.940794944763184, 8.316045761108398, 8.691296577453613, 9.066547393798828, 9.441798210144043, 9.817049026489258, 10.192300796508789, 10.567551612854004, 10.942802429199219, 11.318053245544434]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 9.0, 12.0, 12.0, 20.0, 10.0, 16.0, 28.0, 34.0, 32.0, 36.0, 33.0, 38.0, 34.0, 45.0, 47.0, 51.0, 47.0, 52.0, 59.0, 66.0, 47.0, 35.0, 42.0, 43.0, 25.0, 21.0, 26.0, 15.0, 7.0, 15.0, 8.0, 10.0, 5.0, 1.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5156025886535645, -7.316101551055908, -7.116600513458252, -6.917099475860596, -6.7175984382629395, -6.518097400665283, -6.318596363067627, -6.119095325469971, -5.9195942878723145, -5.720093250274658, -5.520592212677002, -5.321091175079346, -5.1215901374816895, -4.922089099884033, -4.722588062286377, -4.523087024688721, -4.3235859870910645, -4.124084949493408, -3.924583911895752, -3.7250828742980957, -3.5255818367004395, -3.326080799102783, -3.126579761505127, -2.9270787239074707, -2.7275776863098145, -2.528076648712158, -2.328575611114502, -2.1290745735168457, -1.9295735359191895, -1.7300724983215332, -1.530571460723877, -1.3310704231262207, -1.1315698623657227, -0.9320688247680664, -0.7325677871704102, -0.5330667495727539, -0.33356571197509766, -0.1340646743774414, 0.06543636322021484, 0.2649374008178711, 0.46443843841552734, 0.6639394760131836, 0.8634405136108398, 1.062941551208496, 1.2624425888061523, 1.4619436264038086, 1.6614446640014648, 1.860945701599121, 2.0604467391967773, 2.2599477767944336, 2.45944881439209, 2.658949851989746, 2.8584508895874023, 3.0579519271850586, 3.257452964782715, 3.456954002380371, 3.6564550399780273, 3.8559560775756836, 4.05545711517334, 4.254958152770996, 4.454459190368652, 4.653960227966309, 4.853461265563965, 5.052962303161621, 5.252463340759277]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 11.0, 10.0, 14.0, 26.0, 28.0, 34.0, 75.0, 100.0, 200.0, 313.0, 612.0, 1132.0, 2493.0, 5923.0, 15888.0, 48630.0, 161365.0, 407332.0, 274614.0, 86436.0, 26758.0, 9300.0, 3665.0, 1673.0, 794.0, 465.0, 250.0, 148.0, 85.0, 61.0, 34.0, 25.0, 16.0, 14.0, 9.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.21484375, -5.03338623046875, -4.8519287109375, -4.67047119140625, -4.489013671875, -4.30755615234375, -4.1260986328125, -3.94464111328125, -3.76318359375, -3.58172607421875, -3.4002685546875, -3.21881103515625, -3.037353515625, -2.85589599609375, -2.6744384765625, -2.49298095703125, -2.3115234375, -2.13006591796875, -1.9486083984375, -1.76715087890625, -1.585693359375, -1.40423583984375, -1.2227783203125, -1.04132080078125, -0.85986328125, -0.67840576171875, -0.4969482421875, -0.31549072265625, -0.134033203125, 0.04742431640625, 0.2288818359375, 0.41033935546875, 0.591796875, 0.77325439453125, 0.9547119140625, 1.13616943359375, 1.317626953125, 1.49908447265625, 1.6805419921875, 1.86199951171875, 2.04345703125, 2.22491455078125, 2.4063720703125, 2.58782958984375, 2.769287109375, 2.95074462890625, 3.1322021484375, 3.31365966796875, 3.4951171875, 3.67657470703125, 3.8580322265625, 4.03948974609375, 4.220947265625, 4.40240478515625, 4.5838623046875, 4.76531982421875, 4.94677734375, 5.12823486328125, 5.3096923828125, 5.49114990234375, 5.672607421875, 5.85406494140625, 6.0355224609375, 6.21697998046875, 6.3984375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 7.0, 13.0, 15.0, 25.0, 42.0, 54.0, 68.0, 80.0, 80.0, 104.0, 104.0, 77.0, 76.0, 68.0, 40.0, 45.0, 39.0, 23.0, 16.0, 9.0, 8.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0302734375, -0.9894256591796875, -0.948577880859375, -0.9077301025390625, -0.86688232421875, -0.8260345458984375, -0.785186767578125, -0.7443389892578125, -0.7034912109375, -0.6626434326171875, -0.621795654296875, -0.5809478759765625, -0.54010009765625, -0.4992523193359375, -0.458404541015625, -0.4175567626953125, -0.376708984375, -0.3358612060546875, -0.295013427734375, -0.2541656494140625, -0.21331787109375, -0.1724700927734375, -0.131622314453125, -0.0907745361328125, -0.0499267578125, -0.0090789794921875, 0.031768798828125, 0.0726165771484375, 0.11346435546875, 0.1543121337890625, 0.195159912109375, 0.2360076904296875, 0.27685546875, 0.3177032470703125, 0.358551025390625, 0.3993988037109375, 0.44024658203125, 0.4810943603515625, 0.521942138671875, 0.5627899169921875, 0.6036376953125, 0.6444854736328125, 0.685333251953125, 0.7261810302734375, 0.76702880859375, 0.8078765869140625, 0.848724365234375, 0.8895721435546875, 0.930419921875, 0.9712677001953125, 1.012115478515625, 1.0529632568359375, 1.09381103515625, 1.1346588134765625, 1.175506591796875, 1.2163543701171875, 1.2572021484375, 1.2980499267578125, 1.338897705078125, 1.3797454833984375, 1.42059326171875, 1.4614410400390625, 1.502288818359375, 1.5431365966796875, 1.583984375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 6.0, 7.0, 23.0, 34.0, 41.0, 88.0, 140.0, 208.0, 427.0, 1108.0, 3058.0, 14260.0, 119195.0, 667959.0, 211947.0, 23168.0, 4294.0, 1385.0, 584.0, 279.0, 134.0, 90.0, 40.0, 23.0, 14.0, 9.0, 6.0, 10.0, 3.0, 2.0, 7.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1015625, -7.7725830078125, -7.443603515625, -7.1146240234375, -6.78564453125, -6.4566650390625, -6.127685546875, -5.7987060546875, -5.4697265625, -5.1407470703125, -4.811767578125, -4.4827880859375, -4.15380859375, -3.8248291015625, -3.495849609375, -3.1668701171875, -2.837890625, -2.5089111328125, -2.179931640625, -1.8509521484375, -1.52197265625, -1.1929931640625, -0.864013671875, -0.5350341796875, -0.2060546875, 0.1229248046875, 0.451904296875, 0.7808837890625, 1.10986328125, 1.4388427734375, 1.767822265625, 2.0968017578125, 2.42578125, 2.7547607421875, 3.083740234375, 3.4127197265625, 3.74169921875, 4.0706787109375, 4.399658203125, 4.7286376953125, 5.0576171875, 5.3865966796875, 5.715576171875, 6.0445556640625, 6.37353515625, 6.7025146484375, 7.031494140625, 7.3604736328125, 7.689453125, 8.0184326171875, 8.347412109375, 8.6763916015625, 9.00537109375, 9.3343505859375, 9.663330078125, 9.9923095703125, 10.3212890625, 10.6502685546875, 10.979248046875, 11.3082275390625, 11.63720703125, 11.9661865234375, 12.295166015625, 12.6241455078125, 12.953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 4.0, 8.0, 8.0, 15.0, 13.0, 15.0, 16.0, 24.0, 27.0, 37.0, 33.0, 29.0, 39.0, 35.0, 35.0, 55.0, 40.0, 35.0, 43.0, 49.0, 38.0, 40.0, 47.0, 40.0, 44.0, 37.0, 24.0, 24.0, 21.0, 25.0, 22.0, 16.0, 12.0, 9.0, 7.0, 7.0, 5.0, 8.0, 3.0, 9.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.57421875, -3.4591064453125, -3.343994140625, -3.2288818359375, -3.11376953125, -2.9986572265625, -2.883544921875, -2.7684326171875, -2.6533203125, -2.5382080078125, -2.423095703125, -2.3079833984375, -2.19287109375, -2.0777587890625, -1.962646484375, -1.8475341796875, -1.732421875, -1.6173095703125, -1.502197265625, -1.3870849609375, -1.27197265625, -1.1568603515625, -1.041748046875, -0.9266357421875, -0.8115234375, -0.6964111328125, -0.581298828125, -0.4661865234375, -0.35107421875, -0.2359619140625, -0.120849609375, -0.0057373046875, 0.109375, 0.2244873046875, 0.339599609375, 0.4547119140625, 0.56982421875, 0.6849365234375, 0.800048828125, 0.9151611328125, 1.0302734375, 1.1453857421875, 1.260498046875, 1.3756103515625, 1.49072265625, 1.6058349609375, 1.720947265625, 1.8360595703125, 1.951171875, 2.0662841796875, 2.181396484375, 2.2965087890625, 2.41162109375, 2.5267333984375, 2.641845703125, 2.7569580078125, 2.8720703125, 2.9871826171875, 3.102294921875, 3.2174072265625, 3.33251953125, 3.4476318359375, 3.562744140625, 3.6778564453125, 3.79296875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 6.0, 17.0, 16.0, 29.0, 37.0, 81.0, 167.0, 417.0, 1339.0, 4794.0, 26703.0, 511128.0, 472016.0, 25065.0, 4664.0, 1276.0, 433.0, 158.0, 82.0, 40.0, 17.0, 14.0, 8.0, 11.0, 8.0, 7.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.703125, -8.4310302734375, -8.158935546875, -7.8868408203125, -7.61474609375, -7.3426513671875, -7.070556640625, -6.7984619140625, -6.5263671875, -6.2542724609375, -5.982177734375, -5.7100830078125, -5.43798828125, -5.1658935546875, -4.893798828125, -4.6217041015625, -4.349609375, -4.0775146484375, -3.805419921875, -3.5333251953125, -3.26123046875, -2.9891357421875, -2.717041015625, -2.4449462890625, -2.1728515625, -1.9007568359375, -1.628662109375, -1.3565673828125, -1.08447265625, -0.8123779296875, -0.540283203125, -0.2681884765625, 0.00390625, 0.2760009765625, 0.548095703125, 0.8201904296875, 1.09228515625, 1.3643798828125, 1.636474609375, 1.9085693359375, 2.1806640625, 2.4527587890625, 2.724853515625, 2.9969482421875, 3.26904296875, 3.5411376953125, 3.813232421875, 4.0853271484375, 4.357421875, 4.6295166015625, 4.901611328125, 5.1737060546875, 5.44580078125, 5.7178955078125, 5.989990234375, 6.2620849609375, 6.5341796875, 6.8062744140625, 7.078369140625, 7.3504638671875, 7.62255859375, 7.8946533203125, 8.166748046875, 8.4388427734375, 8.7109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 11.0, 13.0, 11.0, 29.0, 36.0, 49.0, 49.0, 89.0, 132.0, 152.0, 132.0, 82.0, 44.0, 44.0, 27.0, 20.0, 13.0, 15.0, 12.0, 9.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.000980377197265625, -0.0009534060955047607, -0.0009264349937438965, -0.0008994638919830322, -0.000872492790222168, -0.0008455216884613037, -0.0008185505867004395, -0.0007915794849395752, -0.0007646083831787109, -0.0007376372814178467, -0.0007106661796569824, -0.0006836950778961182, -0.0006567239761352539, -0.0006297528743743896, -0.0006027817726135254, -0.0005758106708526611, -0.0005488395690917969, -0.0005218684673309326, -0.0004948973655700684, -0.0004679262638092041, -0.00044095516204833984, -0.0004139840602874756, -0.00038701295852661133, -0.00036004185676574707, -0.0003330707550048828, -0.00030609965324401855, -0.0002791285514831543, -0.00025215744972229004, -0.00022518634796142578, -0.00019821524620056152, -0.00017124414443969727, -0.000144273042678833, -0.00011730194091796875, -9.033083915710449e-05, -6.335973739624023e-05, -3.6388635635375977e-05, -9.417533874511719e-06, 1.755356788635254e-05, 4.45246696472168e-05, 7.149577140808105e-05, 9.846687316894531e-05, 0.00012543797492980957, 0.00015240907669067383, 0.00017938017845153809, 0.00020635128021240234, 0.0002333223819732666, 0.00026029348373413086, 0.0002872645854949951, 0.0003142356872558594, 0.00034120678901672363, 0.0003681778907775879, 0.00039514899253845215, 0.0004221200942993164, 0.00044909119606018066, 0.0004760622978210449, 0.0005030333995819092, 0.0005300045013427734, 0.0005569756031036377, 0.000583946704864502, 0.0006109178066253662, 0.0006378889083862305, 0.0006648600101470947, 0.000691831111907959, 0.0007188022136688232, 0.0007457733154296875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 6.0, 11.0, 19.0, 34.0, 44.0, 59.0, 128.0, 209.0, 378.0, 778.0, 2128.0, 7925.0, 54888.0, 789561.0, 171889.0, 14796.0, 3418.0, 1127.0, 502.0, 246.0, 154.0, 90.0, 45.0, 25.0, 18.0, 18.0, 9.0, 7.0, 7.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-8.4453125, -8.1788330078125, -7.912353515625, -7.6458740234375, -7.37939453125, -7.1129150390625, -6.846435546875, -6.5799560546875, -6.3134765625, -6.0469970703125, -5.780517578125, -5.5140380859375, -5.24755859375, -4.9810791015625, -4.714599609375, -4.4481201171875, -4.181640625, -3.9151611328125, -3.648681640625, -3.3822021484375, -3.11572265625, -2.8492431640625, -2.582763671875, -2.3162841796875, -2.0498046875, -1.7833251953125, -1.516845703125, -1.2503662109375, -0.98388671875, -0.7174072265625, -0.450927734375, -0.1844482421875, 0.08203125, 0.3485107421875, 0.614990234375, 0.8814697265625, 1.14794921875, 1.4144287109375, 1.680908203125, 1.9473876953125, 2.2138671875, 2.4803466796875, 2.746826171875, 3.0133056640625, 3.27978515625, 3.5462646484375, 3.812744140625, 4.0792236328125, 4.345703125, 4.6121826171875, 4.878662109375, 5.1451416015625, 5.41162109375, 5.6781005859375, 5.944580078125, 6.2110595703125, 6.4775390625, 6.7440185546875, 7.010498046875, 7.2769775390625, 7.54345703125, 7.8099365234375, 8.076416015625, 8.3428955078125, 8.609375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 8.0, 1.0, 8.0, 8.0, 15.0, 29.0, 22.0, 36.0, 56.0, 99.0, 133.0, 157.0, 147.0, 107.0, 69.0, 37.0, 23.0, 11.0, 14.0, 7.0, 7.0, 7.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.521484375, -3.377349853515625, -3.23321533203125, -3.089080810546875, -2.9449462890625, -2.800811767578125, -2.65667724609375, -2.512542724609375, -2.368408203125, -2.224273681640625, -2.08013916015625, -1.936004638671875, -1.7918701171875, -1.647735595703125, -1.50360107421875, -1.359466552734375, -1.21533203125, -1.071197509765625, -0.92706298828125, -0.782928466796875, -0.6387939453125, -0.494659423828125, -0.35052490234375, -0.206390380859375, -0.062255859375, 0.081878662109375, 0.22601318359375, 0.370147705078125, 0.5142822265625, 0.658416748046875, 0.80255126953125, 0.946685791015625, 1.0908203125, 1.234954833984375, 1.37908935546875, 1.523223876953125, 1.6673583984375, 1.811492919921875, 1.95562744140625, 2.099761962890625, 2.243896484375, 2.388031005859375, 2.53216552734375, 2.676300048828125, 2.8204345703125, 2.964569091796875, 3.10870361328125, 3.252838134765625, 3.39697265625, 3.541107177734375, 3.68524169921875, 3.829376220703125, 3.9735107421875, 4.117645263671875, 4.26177978515625, 4.405914306640625, 4.550048828125, 4.694183349609375, 4.83831787109375, 4.982452392578125, 5.1265869140625, 5.270721435546875, 5.41485595703125, 5.558990478515625, 5.703125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 12.0, 25.0, 41.0, 81.0, 127.0, 156.0, 178.0, 146.0, 113.0, 54.0, 24.0, 21.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.51190185546875, -52.71718215942383, -50.92246627807617, -49.12774658203125, -47.333030700683594, -45.53831100463867, -43.74359130859375, -41.948875427246094, -40.15415573120117, -38.35943603515625, -36.564720153808594, -34.77000045776367, -32.97528076171875, -31.180564880371094, -29.385845184326172, -27.591127395629883, -25.796409606933594, -24.001691818237305, -22.206974029541016, -20.412254333496094, -18.617536544799805, -16.822818756103516, -15.02810001373291, -13.233381271362305, -11.438663482666016, -9.643945693969727, -7.849226951599121, -6.054508686065674, -4.259790420532227, -2.4650726318359375, -0.670353889465332, 1.1243648529052734, 2.9190826416015625, 4.71380090713501, 6.508519172668457, 8.303237915039062, 10.097955703735352, 11.89267349243164, 13.687392234802246, 15.482110977172852, 17.27682876586914, 19.07154655456543, 20.86626434326172, 22.66098403930664, 24.45570182800293, 26.25041961669922, 28.04513931274414, 29.83985710144043, 31.63457489013672, 33.42929458618164, 35.2240104675293, 37.01873016357422, 38.813446044921875, 40.6081657409668, 42.40288543701172, 44.197601318359375, 45.9923210144043, 47.78704071044922, 49.581756591796875, 51.3764762878418, 53.17119598388672, 54.965911865234375, 56.7606315612793, 58.55535125732422, 60.350067138671875]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 7.0, 8.0, 9.0, 12.0, 10.0, 21.0, 22.0, 18.0, 50.0, 35.0, 48.0, 35.0, 46.0, 50.0, 28.0, 53.0, 57.0, 57.0, 55.0, 56.0, 42.0, 44.0, 37.0, 38.0, 30.0, 24.0, 15.0, 16.0, 27.0, 12.0, 5.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-29.059814453125, -28.28142738342285, -27.503042221069336, -26.724655151367188, -25.946269989013672, -25.167882919311523, -24.389495849609375, -23.61111068725586, -22.83272361755371, -22.054336547851562, -21.275951385498047, -20.4975643157959, -19.71917724609375, -18.940792083740234, -18.162405014038086, -17.384017944335938, -16.605632781982422, -15.82724666595459, -15.048860549926758, -14.27047348022461, -13.492087364196777, -12.713701248168945, -11.935314178466797, -11.156928062438965, -10.378541946411133, -9.6001558303833, -8.821769714355469, -8.04338264465332, -7.264996528625488, -6.486610412597656, -5.708223819732666, -4.929837226867676, -4.151451110839844, -3.3730647563934326, -2.5946784019470215, -1.8162920475006104, -1.0379056930541992, -0.2595193386077881, 0.518867015838623, 1.2972536087036133, 2.0756397247314453, 2.8540260791778564, 3.6324124336242676, 4.410799026489258, 5.18918514251709, 5.967571258544922, 6.745957851409912, 7.524344444274902, 8.302730560302734, 9.081116676330566, 9.859502792358398, 10.637889862060547, 11.416275978088379, 12.194662094116211, 12.97304916381836, 13.751435279846191, 14.529821395874023, 15.308207511901855, 16.086593627929688, 16.864980697631836, 17.643367767333984, 18.4217529296875, 19.20013999938965, 19.978527069091797, 20.756912231445312]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 8.0, 10.0, 27.0, 33.0, 34.0, 66.0, 117.0, 168.0, 306.0, 633.0, 1182.0, 2611.0, 6000.0, 16644.0, 57908.0, 309491.0, 3300148.0, 397420.0, 69231.0, 19497.0, 6967.0, 2863.0, 1382.0, 675.0, 329.0, 187.0, 116.0, 81.0, 44.0, 34.0, 22.0, 7.0, 12.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.56640625, -4.38775634765625, -4.2091064453125, -4.03045654296875, -3.851806640625, -3.67315673828125, -3.4945068359375, -3.31585693359375, -3.13720703125, -2.95855712890625, -2.7799072265625, -2.60125732421875, -2.422607421875, -2.24395751953125, -2.0653076171875, -1.88665771484375, -1.7080078125, -1.52935791015625, -1.3507080078125, -1.17205810546875, -0.993408203125, -0.81475830078125, -0.6361083984375, -0.45745849609375, -0.27880859375, -0.10015869140625, 0.0784912109375, 0.25714111328125, 0.435791015625, 0.61444091796875, 0.7930908203125, 0.97174072265625, 1.150390625, 1.32904052734375, 1.5076904296875, 1.68634033203125, 1.864990234375, 2.04364013671875, 2.2222900390625, 2.40093994140625, 2.57958984375, 2.75823974609375, 2.9368896484375, 3.11553955078125, 3.294189453125, 3.47283935546875, 3.6514892578125, 3.83013916015625, 4.0087890625, 4.18743896484375, 4.3660888671875, 4.54473876953125, 4.723388671875, 4.90203857421875, 5.0806884765625, 5.25933837890625, 5.43798828125, 5.61663818359375, 5.7952880859375, 5.97393798828125, 6.152587890625, 6.33123779296875, 6.5098876953125, 6.68853759765625, 6.8671875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 9.0, 11.0, 16.0, 29.0, 37.0, 62.0, 82.0, 79.0, 82.0, 98.0, 92.0, 78.0, 83.0, 63.0, 45.0, 40.0, 30.0, 24.0, 15.0, 12.0, 8.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.994140625, -0.951141357421875, -0.90814208984375, -0.865142822265625, -0.8221435546875, -0.779144287109375, -0.73614501953125, -0.693145751953125, -0.650146484375, -0.607147216796875, -0.56414794921875, -0.521148681640625, -0.4781494140625, -0.435150146484375, -0.39215087890625, -0.349151611328125, -0.30615234375, -0.263153076171875, -0.22015380859375, -0.177154541015625, -0.1341552734375, -0.091156005859375, -0.04815673828125, -0.005157470703125, 0.037841796875, 0.080841064453125, 0.12384033203125, 0.166839599609375, 0.2098388671875, 0.252838134765625, 0.29583740234375, 0.338836669921875, 0.3818359375, 0.424835205078125, 0.46783447265625, 0.510833740234375, 0.5538330078125, 0.596832275390625, 0.63983154296875, 0.682830810546875, 0.725830078125, 0.768829345703125, 0.81182861328125, 0.854827880859375, 0.8978271484375, 0.940826416015625, 0.98382568359375, 1.026824951171875, 1.06982421875, 1.112823486328125, 1.15582275390625, 1.198822021484375, 1.2418212890625, 1.284820556640625, 1.32781982421875, 1.370819091796875, 1.413818359375, 1.456817626953125, 1.49981689453125, 1.542816162109375, 1.5858154296875, 1.628814697265625, 1.67181396484375, 1.714813232421875, 1.7578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 10.0, 11.0, 21.0, 53.0, 91.0, 181.0, 501.0, 1645.0, 7149.0, 48280.0, 985122.0, 3048509.0, 88451.0, 10819.0, 2278.0, 685.0, 273.0, 105.0, 40.0, 30.0, 12.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.69921875, -7.36627197265625, -7.0333251953125, -6.70037841796875, -6.367431640625, -6.03448486328125, -5.7015380859375, -5.36859130859375, -5.03564453125, -4.70269775390625, -4.3697509765625, -4.03680419921875, -3.703857421875, -3.37091064453125, -3.0379638671875, -2.70501708984375, -2.3720703125, -2.03912353515625, -1.7061767578125, -1.37322998046875, -1.040283203125, -0.70733642578125, -0.3743896484375, -0.04144287109375, 0.29150390625, 0.62445068359375, 0.9573974609375, 1.29034423828125, 1.623291015625, 1.95623779296875, 2.2891845703125, 2.62213134765625, 2.955078125, 3.28802490234375, 3.6209716796875, 3.95391845703125, 4.286865234375, 4.61981201171875, 4.9527587890625, 5.28570556640625, 5.61865234375, 5.95159912109375, 6.2845458984375, 6.61749267578125, 6.950439453125, 7.28338623046875, 7.6163330078125, 7.94927978515625, 8.2822265625, 8.61517333984375, 8.9481201171875, 9.28106689453125, 9.614013671875, 9.94696044921875, 10.2799072265625, 10.61285400390625, 10.94580078125, 11.27874755859375, 11.6116943359375, 11.94464111328125, 12.277587890625, 12.61053466796875, 12.9434814453125, 13.27642822265625, 13.609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 7.0, 6.0, 5.0, 15.0, 10.0, 21.0, 26.0, 40.0, 51.0, 85.0, 107.0, 179.0, 242.0, 438.0, 926.0, 762.0, 403.0, 227.0, 169.0, 87.0, 75.0, 38.0, 44.0, 27.0, 12.0, 21.0, 13.0, 10.0, 7.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.06640625, -1.999481201171875, -1.93255615234375, -1.865631103515625, -1.7987060546875, -1.731781005859375, -1.66485595703125, -1.597930908203125, -1.531005859375, -1.464080810546875, -1.39715576171875, -1.330230712890625, -1.2633056640625, -1.196380615234375, -1.12945556640625, -1.062530517578125, -0.99560546875, -0.928680419921875, -0.86175537109375, -0.794830322265625, -0.7279052734375, -0.660980224609375, -0.59405517578125, -0.527130126953125, -0.460205078125, -0.393280029296875, -0.32635498046875, -0.259429931640625, -0.1925048828125, -0.125579833984375, -0.05865478515625, 0.008270263671875, 0.0751953125, 0.142120361328125, 0.20904541015625, 0.275970458984375, 0.3428955078125, 0.409820556640625, 0.47674560546875, 0.543670654296875, 0.610595703125, 0.677520751953125, 0.74444580078125, 0.811370849609375, 0.8782958984375, 0.945220947265625, 1.01214599609375, 1.079071044921875, 1.14599609375, 1.212921142578125, 1.27984619140625, 1.346771240234375, 1.4136962890625, 1.480621337890625, 1.54754638671875, 1.614471435546875, 1.681396484375, 1.748321533203125, 1.81524658203125, 1.882171630859375, 1.9490966796875, 2.016021728515625, 2.08294677734375, 2.149871826171875, 2.216796875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 8.0, 18.0, 46.0, 85.0, 123.0, 175.0, 190.0, 157.0, 109.0, 51.0, 28.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.930633544921875, -34.016761779785156, -33.10288619995117, -32.18901443481445, -31.275142669677734, -30.361268997192383, -29.44739532470703, -28.533523559570312, -27.61964988708496, -26.70577621459961, -25.79190444946289, -24.87803077697754, -23.96415901184082, -23.05028533935547, -22.13641357421875, -21.2225399017334, -20.308666229248047, -19.394792556762695, -18.480920791625977, -17.567047119140625, -16.653175354003906, -15.739301681518555, -14.82542896270752, -13.911556243896484, -12.997684478759766, -12.08381175994873, -11.169939041137695, -10.256065368652344, -9.342192649841309, -8.428319931030273, -7.514447212219238, -6.600574016571045, -5.686700820922852, -4.772828102111816, -3.858954906463623, -2.945082187652588, -2.0312092304229736, -1.1173362731933594, -0.20346355438232422, 0.7104096412658691, 1.6242823600769043, 2.5381553173065186, 3.452028274536133, 4.365900993347168, 5.279773712158203, 6.1936469078063965, 7.107519626617432, 8.021392822265625, 8.93526554107666, 9.849138259887695, 10.76301097869873, 11.676883697509766, 12.590757369995117, 13.504630088806152, 14.418502807617188, 15.332376480102539, 16.246248245239258, 17.16012191772461, 18.073993682861328, 18.98786735534668, 19.9017391204834, 20.81561279296875, 21.72948455810547, 22.64335823059082, 23.557231903076172]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 4.0, 3.0, 5.0, 7.0, 10.0, 11.0, 11.0, 15.0, 17.0, 15.0, 12.0, 23.0, 27.0, 37.0, 32.0, 33.0, 52.0, 39.0, 57.0, 46.0, 50.0, 38.0, 51.0, 39.0, 33.0, 37.0, 38.0, 31.0, 32.0, 26.0, 29.0, 23.0, 22.0, 19.0, 15.0, 6.0, 5.0, 12.0, 13.0, 6.0, 7.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-9.607721328735352, -9.32905101776123, -9.05038070678711, -8.771709442138672, -8.49303913116455, -8.21436882019043, -7.935698509216309, -7.657027721405029, -7.37835693359375, -7.099686622619629, -6.82101583480835, -6.5423455238342285, -6.263674736022949, -5.985004425048828, -5.706334114074707, -5.427663326263428, -5.148993015289307, -4.8703227043151855, -4.591651916503906, -4.312981605529785, -4.034310817718506, -3.7556405067443848, -3.4769699573516846, -3.1982994079589844, -2.919628858566284, -2.640958309173584, -2.362287759780884, -2.0836172103881836, -1.804946780204773, -1.5262762308120728, -1.247605800628662, -0.9689352512359619, -0.6902647018432617, -0.4115941822528839, -0.1329236626625061, 0.14574682712554932, 0.4244173765182495, 0.7030879259109497, 0.9817583560943604, 1.2604289054870605, 1.5390994548797607, 1.817770004272461, 2.096440553665161, 2.3751111030578613, 2.6537814140319824, 2.9324522018432617, 3.211122512817383, 3.489793062210083, 3.768463611602783, 4.047133922576904, 4.325804710388184, 4.604475021362305, 4.883145809173584, 5.161816120147705, 5.440486907958984, 5.7191572189331055, 5.997827529907227, 6.276497840881348, 6.555168628692627, 6.833838939666748, 7.112509727478027, 7.391180038452148, 7.6698503494262695, 7.948521137237549, 8.227191925048828]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 10.0, 11.0, 17.0, 16.0, 21.0, 48.0, 65.0, 94.0, 136.0, 214.0, 319.0, 514.0, 904.0, 1701.0, 3430.0, 7572.0, 16856.0, 39470.0, 95152.0, 258326.0, 375550.0, 143823.0, 58572.0, 24791.0, 10882.0, 4773.0, 2340.0, 1200.0, 668.0, 363.0, 226.0, 153.0, 102.0, 78.0, 49.0, 43.0, 32.0, 11.0, 12.0, 4.0, 7.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-6.1796875, -6.013671875, -5.84765625, -5.681640625, -5.515625, -5.349609375, -5.18359375, -5.017578125, -4.8515625, -4.685546875, -4.51953125, -4.353515625, -4.1875, -4.021484375, -3.85546875, -3.689453125, -3.5234375, -3.357421875, -3.19140625, -3.025390625, -2.859375, -2.693359375, -2.52734375, -2.361328125, -2.1953125, -2.029296875, -1.86328125, -1.697265625, -1.53125, -1.365234375, -1.19921875, -1.033203125, -0.8671875, -0.701171875, -0.53515625, -0.369140625, -0.203125, -0.037109375, 0.12890625, 0.294921875, 0.4609375, 0.626953125, 0.79296875, 0.958984375, 1.125, 1.291015625, 1.45703125, 1.623046875, 1.7890625, 1.955078125, 2.12109375, 2.287109375, 2.453125, 2.619140625, 2.78515625, 2.951171875, 3.1171875, 3.283203125, 3.44921875, 3.615234375, 3.78125, 3.947265625, 4.11328125, 4.279296875, 4.4453125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 1.0, 6.0, 1.0, 5.0, 11.0, 15.0, 28.0, 24.0, 53.0, 55.0, 69.0, 73.0, 83.0, 83.0, 90.0, 80.0, 68.0, 55.0, 48.0, 45.0, 26.0, 30.0, 18.0, 12.0, 9.0, 12.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9013671875, -0.862274169921875, -0.82318115234375, -0.784088134765625, -0.7449951171875, -0.705902099609375, -0.66680908203125, -0.627716064453125, -0.588623046875, -0.549530029296875, -0.51043701171875, -0.471343994140625, -0.4322509765625, -0.393157958984375, -0.35406494140625, -0.314971923828125, -0.27587890625, -0.236785888671875, -0.19769287109375, -0.158599853515625, -0.1195068359375, -0.080413818359375, -0.04132080078125, -0.002227783203125, 0.036865234375, 0.075958251953125, 0.11505126953125, 0.154144287109375, 0.1932373046875, 0.232330322265625, 0.27142333984375, 0.310516357421875, 0.349609375, 0.388702392578125, 0.42779541015625, 0.466888427734375, 0.5059814453125, 0.545074462890625, 0.58416748046875, 0.623260498046875, 0.662353515625, 0.701446533203125, 0.74053955078125, 0.779632568359375, 0.8187255859375, 0.857818603515625, 0.89691162109375, 0.936004638671875, 0.97509765625, 1.014190673828125, 1.05328369140625, 1.092376708984375, 1.1314697265625, 1.170562744140625, 1.20965576171875, 1.248748779296875, 1.287841796875, 1.326934814453125, 1.36602783203125, 1.405120849609375, 1.4442138671875, 1.483306884765625, 1.52239990234375, 1.561492919921875, 1.6005859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 12.0, 16.0, 22.0, 20.0, 32.0, 43.0, 78.0, 117.0, 179.0, 324.0, 591.0, 1220.0, 2782.0, 7400.0, 22119.0, 77308.0, 309194.0, 462895.0, 114935.0, 32224.0, 10005.0, 3628.0, 1622.0, 747.0, 392.0, 248.0, 133.0, 89.0, 60.0, 41.0, 16.0, 21.0, 11.0, 7.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.859375, -6.64605712890625, -6.4327392578125, -6.21942138671875, -6.006103515625, -5.79278564453125, -5.5794677734375, -5.36614990234375, -5.15283203125, -4.93951416015625, -4.7261962890625, -4.51287841796875, -4.299560546875, -4.08624267578125, -3.8729248046875, -3.65960693359375, -3.4462890625, -3.23297119140625, -3.0196533203125, -2.80633544921875, -2.593017578125, -2.37969970703125, -2.1663818359375, -1.95306396484375, -1.73974609375, -1.52642822265625, -1.3131103515625, -1.09979248046875, -0.886474609375, -0.67315673828125, -0.4598388671875, -0.24652099609375, -0.033203125, 0.18011474609375, 0.3934326171875, 0.60675048828125, 0.820068359375, 1.03338623046875, 1.2467041015625, 1.46002197265625, 1.67333984375, 1.88665771484375, 2.0999755859375, 2.31329345703125, 2.526611328125, 2.73992919921875, 2.9532470703125, 3.16656494140625, 3.3798828125, 3.59320068359375, 3.8065185546875, 4.01983642578125, 4.233154296875, 4.44647216796875, 4.6597900390625, 4.87310791015625, 5.08642578125, 5.29974365234375, 5.5130615234375, 5.72637939453125, 5.939697265625, 6.15301513671875, 6.3663330078125, 6.57965087890625, 6.79296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 2.0, 2.0, 9.0, 11.0, 10.0, 12.0, 20.0, 25.0, 13.0, 30.0, 34.0, 32.0, 41.0, 34.0, 51.0, 44.0, 55.0, 54.0, 49.0, 46.0, 40.0, 59.0, 58.0, 42.0, 43.0, 33.0, 19.0, 18.0, 20.0, 24.0, 15.0, 16.0, 11.0, 8.0, 3.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.125, -3.991943359375, -3.85888671875, -3.725830078125, -3.5927734375, -3.459716796875, -3.32666015625, -3.193603515625, -3.060546875, -2.927490234375, -2.79443359375, -2.661376953125, -2.5283203125, -2.395263671875, -2.26220703125, -2.129150390625, -1.99609375, -1.863037109375, -1.72998046875, -1.596923828125, -1.4638671875, -1.330810546875, -1.19775390625, -1.064697265625, -0.931640625, -0.798583984375, -0.66552734375, -0.532470703125, -0.3994140625, -0.266357421875, -0.13330078125, -0.000244140625, 0.1328125, 0.265869140625, 0.39892578125, 0.531982421875, 0.6650390625, 0.798095703125, 0.93115234375, 1.064208984375, 1.197265625, 1.330322265625, 1.46337890625, 1.596435546875, 1.7294921875, 1.862548828125, 1.99560546875, 2.128662109375, 2.26171875, 2.394775390625, 2.52783203125, 2.660888671875, 2.7939453125, 2.927001953125, 3.06005859375, 3.193115234375, 3.326171875, 3.459228515625, 3.59228515625, 3.725341796875, 3.8583984375, 3.991455078125, 4.12451171875, 4.257568359375, 4.390625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 7.0, 12.0, 2.0, 11.0, 14.0, 21.0, 38.0, 80.0, 142.0, 328.0, 847.0, 2631.0, 10930.0, 105393.0, 804143.0, 108592.0, 11139.0, 2669.0, 866.0, 326.0, 131.0, 82.0, 36.0, 31.0, 15.0, 18.0, 12.0, 7.0, 7.0, 2.0, 1.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-11.2578125, -10.9576416015625, -10.657470703125, -10.3572998046875, -10.05712890625, -9.7569580078125, -9.456787109375, -9.1566162109375, -8.8564453125, -8.5562744140625, -8.256103515625, -7.9559326171875, -7.65576171875, -7.3555908203125, -7.055419921875, -6.7552490234375, -6.455078125, -6.1549072265625, -5.854736328125, -5.5545654296875, -5.25439453125, -4.9542236328125, -4.654052734375, -4.3538818359375, -4.0537109375, -3.7535400390625, -3.453369140625, -3.1531982421875, -2.85302734375, -2.5528564453125, -2.252685546875, -1.9525146484375, -1.65234375, -1.3521728515625, -1.052001953125, -0.7518310546875, -0.45166015625, -0.1514892578125, 0.148681640625, 0.4488525390625, 0.7490234375, 1.0491943359375, 1.349365234375, 1.6495361328125, 1.94970703125, 2.2498779296875, 2.550048828125, 2.8502197265625, 3.150390625, 3.4505615234375, 3.750732421875, 4.0509033203125, 4.35107421875, 4.6512451171875, 4.951416015625, 5.2515869140625, 5.5517578125, 5.8519287109375, 6.152099609375, 6.4522705078125, 6.75244140625, 7.0526123046875, 7.352783203125, 7.6529541015625, 7.953125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 5.0, 9.0, 3.0, 7.0, 12.0, 10.0, 39.0, 47.0, 61.0, 104.0, 204.0, 200.0, 115.0, 59.0, 43.0, 32.0, 26.0, 11.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014801025390625, -0.0014390945434570312, -0.0013980865478515625, -0.0013570785522460938, -0.001316070556640625, -0.0012750625610351562, -0.0012340545654296875, -0.0011930465698242188, -0.00115203857421875, -0.0011110305786132812, -0.0010700225830078125, -0.0010290145874023438, -0.000988006591796875, -0.0009469985961914062, -0.0009059906005859375, -0.0008649826049804688, -0.000823974609375, -0.0007829666137695312, -0.0007419586181640625, -0.0007009506225585938, -0.000659942626953125, -0.0006189346313476562, -0.0005779266357421875, -0.0005369186401367188, -0.00049591064453125, -0.00045490264892578125, -0.0004138946533203125, -0.00037288665771484375, -0.000331878662109375, -0.00029087066650390625, -0.0002498626708984375, -0.00020885467529296875, -0.0001678466796875, -0.00012683868408203125, -8.58306884765625e-05, -4.482269287109375e-05, -3.814697265625e-06, 3.719329833984375e-05, 7.82012939453125e-05, 0.00011920928955078125, 0.00016021728515625, 0.00020122528076171875, 0.0002422332763671875, 0.00028324127197265625, 0.000324249267578125, 0.00036525726318359375, 0.0004062652587890625, 0.00044727325439453125, 0.00048828125, 0.0005292892456054688, 0.0005702972412109375, 0.0006113052368164062, 0.000652313232421875, 0.0006933212280273438, 0.0007343292236328125, 0.0007753372192382812, 0.00081634521484375, 0.0008573532104492188, 0.0008983612060546875, 0.0009393692016601562, 0.000980377197265625, 0.0010213851928710938, 0.0010623931884765625, 0.0011034011840820312, 0.0011444091796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 7.0, 4.0, 6.0, 19.0, 24.0, 64.0, 144.0, 410.0, 1426.0, 10552.0, 750193.0, 277985.0, 6211.0, 985.0, 296.0, 131.0, 51.0, 18.0, 17.0, 3.0, 6.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8984375, -15.3665771484375, -14.834716796875, -14.3028564453125, -13.77099609375, -13.2391357421875, -12.707275390625, -12.1754150390625, -11.6435546875, -11.1116943359375, -10.579833984375, -10.0479736328125, -9.51611328125, -8.9842529296875, -8.452392578125, -7.9205322265625, -7.388671875, -6.8568115234375, -6.324951171875, -5.7930908203125, -5.26123046875, -4.7293701171875, -4.197509765625, -3.6656494140625, -3.1337890625, -2.6019287109375, -2.070068359375, -1.5382080078125, -1.00634765625, -0.4744873046875, 0.057373046875, 0.5892333984375, 1.12109375, 1.6529541015625, 2.184814453125, 2.7166748046875, 3.24853515625, 3.7803955078125, 4.312255859375, 4.8441162109375, 5.3759765625, 5.9078369140625, 6.439697265625, 6.9715576171875, 7.50341796875, 8.0352783203125, 8.567138671875, 9.0989990234375, 9.630859375, 10.1627197265625, 10.694580078125, 11.2264404296875, 11.75830078125, 12.2901611328125, 12.822021484375, 13.3538818359375, 13.8857421875, 14.4176025390625, 14.949462890625, 15.4813232421875, 16.01318359375, 16.5450439453125, 17.076904296875, 17.6087646484375, 18.140625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 6.0, 12.0, 23.0, 34.0, 35.0, 57.0, 103.0, 164.0, 162.0, 130.0, 82.0, 53.0, 36.0, 30.0, 20.0, 22.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.484375, -3.33526611328125, -3.1861572265625, -3.03704833984375, -2.887939453125, -2.73883056640625, -2.5897216796875, -2.44061279296875, -2.29150390625, -2.14239501953125, -1.9932861328125, -1.84417724609375, -1.695068359375, -1.54595947265625, -1.3968505859375, -1.24774169921875, -1.0986328125, -0.94952392578125, -0.8004150390625, -0.65130615234375, -0.502197265625, -0.35308837890625, -0.2039794921875, -0.05487060546875, 0.09423828125, 0.24334716796875, 0.3924560546875, 0.54156494140625, 0.690673828125, 0.83978271484375, 0.9888916015625, 1.13800048828125, 1.287109375, 1.43621826171875, 1.5853271484375, 1.73443603515625, 1.883544921875, 2.03265380859375, 2.1817626953125, 2.33087158203125, 2.47998046875, 2.62908935546875, 2.7781982421875, 2.92730712890625, 3.076416015625, 3.22552490234375, 3.3746337890625, 3.52374267578125, 3.6728515625, 3.82196044921875, 3.9710693359375, 4.12017822265625, 4.269287109375, 4.41839599609375, 4.5675048828125, 4.71661376953125, 4.86572265625, 5.01483154296875, 5.1639404296875, 5.31304931640625, 5.462158203125, 5.61126708984375, 5.7603759765625, 5.90948486328125, 6.05859375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 8.0, 15.0, 30.0, 43.0, 81.0, 121.0, 132.0, 178.0, 139.0, 108.0, 54.0, 41.0, 22.0, 16.0, 7.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-82.56271362304688, -80.7380142211914, -78.9133071899414, -77.08860778808594, -75.26390838623047, -73.439208984375, -71.614501953125, -69.78980255126953, -67.96510314941406, -66.1404037475586, -64.3156967163086, -62.490997314453125, -60.666297912597656, -58.84159469604492, -57.01689147949219, -55.19219207763672, -53.36748504638672, -51.542781829833984, -49.718082427978516, -47.89337921142578, -46.06867980957031, -44.24397659301758, -42.419273376464844, -40.594573974609375, -38.76987075805664, -36.945167541503906, -35.12046813964844, -33.2957649230957, -31.4710636138916, -29.6463623046875, -27.821659088134766, -25.996957778930664, -24.172256469726562, -22.34755516052246, -20.52285385131836, -18.698150634765625, -16.873449325561523, -15.048748016357422, -13.224045753479004, -11.399343490600586, -9.574642181396484, -7.749940395355225, -5.925238609313965, -4.100536823272705, -2.2758350372314453, -0.45113372802734375, 1.3735685348510742, 3.198270797729492, 5.022972106933594, 6.8476738929748535, 8.672375679016113, 10.497077941894531, 12.321779251098633, 14.146480560302734, 15.971182823181152, 17.79588508605957, 19.620586395263672, 21.445287704467773, 23.269989013671875, 25.09469223022461, 26.91939353942871, 28.744094848632812, 30.568798065185547, 32.39350128173828, 34.21820068359375]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 2.0, 9.0, 10.0, 17.0, 13.0, 19.0, 19.0, 25.0, 30.0, 32.0, 55.0, 49.0, 43.0, 45.0, 41.0, 49.0, 45.0, 60.0, 52.0, 58.0, 36.0, 41.0, 50.0, 25.0, 32.0, 23.0, 29.0, 20.0, 14.0, 13.0, 13.0, 6.0, 7.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.374053955078125, -27.538291931152344, -26.702529907226562, -25.86676788330078, -25.031005859375, -24.19524383544922, -23.359481811523438, -22.523719787597656, -21.687957763671875, -20.852195739746094, -20.016433715820312, -19.18067169189453, -18.34490966796875, -17.50914764404297, -16.673385620117188, -15.837623596191406, -15.001862525939941, -14.16610050201416, -13.330338478088379, -12.494576454162598, -11.658814430236816, -10.823053359985352, -9.98729133605957, -9.151529312133789, -8.315767288208008, -7.480005264282227, -6.644243240356445, -5.808481216430664, -4.972719192504883, -4.13695764541626, -3.3011956214904785, -2.4654335975646973, -1.6296710968017578, -0.7939091324806213, 0.04185283184051514, 0.8776147365570068, 1.713376760482788, 2.5491385459899902, 3.3849005699157715, 4.220662593841553, 5.056424617767334, 5.892186641693115, 6.7279486656188965, 7.5637102127075195, 8.3994722366333, 9.235234260559082, 10.070996284484863, 10.906758308410645, 11.742520332336426, 12.578282356262207, 13.414044380187988, 14.24980640411377, 15.08556842803955, 15.921329498291016, 16.757091522216797, 17.592853546142578, 18.42861557006836, 19.26437759399414, 20.100139617919922, 20.935901641845703, 21.771663665771484, 22.607425689697266, 23.443187713623047, 24.278949737548828, 25.11471176147461]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 11.0, 6.0, 12.0, 13.0, 13.0, 38.0, 45.0, 64.0, 60.0, 121.0, 184.0, 273.0, 477.0, 800.0, 1329.0, 2512.0, 4834.0, 10369.0, 24408.0, 67668.0, 274844.0, 3208545.0, 449966.0, 91416.0, 30948.0, 12633.0, 5791.0, 3010.0, 1552.0, 871.0, 531.0, 313.0, 217.0, 115.0, 94.0, 54.0, 41.0, 24.0, 31.0, 13.0, 11.0, 4.0, 6.0, 4.0, 5.0, 1.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0], "bins": [-5.1328125, -4.98016357421875, -4.8275146484375, -4.67486572265625, -4.522216796875, -4.36956787109375, -4.2169189453125, -4.06427001953125, -3.91162109375, -3.75897216796875, -3.6063232421875, -3.45367431640625, -3.301025390625, -3.14837646484375, -2.9957275390625, -2.84307861328125, -2.6904296875, -2.53778076171875, -2.3851318359375, -2.23248291015625, -2.079833984375, -1.92718505859375, -1.7745361328125, -1.62188720703125, -1.46923828125, -1.31658935546875, -1.1639404296875, -1.01129150390625, -0.858642578125, -0.70599365234375, -0.5533447265625, -0.40069580078125, -0.248046875, -0.09539794921875, 0.0572509765625, 0.20989990234375, 0.362548828125, 0.51519775390625, 0.6678466796875, 0.82049560546875, 0.97314453125, 1.12579345703125, 1.2784423828125, 1.43109130859375, 1.583740234375, 1.73638916015625, 1.8890380859375, 2.04168701171875, 2.1943359375, 2.34698486328125, 2.4996337890625, 2.65228271484375, 2.804931640625, 2.95758056640625, 3.1102294921875, 3.26287841796875, 3.41552734375, 3.56817626953125, 3.7208251953125, 3.87347412109375, 4.026123046875, 4.17877197265625, 4.3314208984375, 4.48406982421875, 4.63671875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 6.0, 7.0, 11.0, 16.0, 24.0, 32.0, 47.0, 54.0, 75.0, 79.0, 79.0, 71.0, 90.0, 82.0, 81.0, 47.0, 52.0, 41.0, 26.0, 34.0, 17.0, 17.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.068359375, -1.0237884521484375, -0.979217529296875, -0.9346466064453125, -0.89007568359375, -0.8455047607421875, -0.800933837890625, -0.7563629150390625, -0.7117919921875, -0.6672210693359375, -0.622650146484375, -0.5780792236328125, -0.53350830078125, -0.4889373779296875, -0.444366455078125, -0.3997955322265625, -0.355224609375, -0.3106536865234375, -0.266082763671875, -0.2215118408203125, -0.17694091796875, -0.1323699951171875, -0.087799072265625, -0.0432281494140625, 0.0013427734375, 0.0459136962890625, 0.090484619140625, 0.1350555419921875, 0.17962646484375, 0.2241973876953125, 0.268768310546875, 0.3133392333984375, 0.35791015625, 0.4024810791015625, 0.447052001953125, 0.4916229248046875, 0.53619384765625, 0.5807647705078125, 0.625335693359375, 0.6699066162109375, 0.7144775390625, 0.7590484619140625, 0.803619384765625, 0.8481903076171875, 0.89276123046875, 0.9373321533203125, 0.981903076171875, 1.0264739990234375, 1.071044921875, 1.1156158447265625, 1.160186767578125, 1.2047576904296875, 1.24932861328125, 1.2938995361328125, 1.338470458984375, 1.3830413818359375, 1.4276123046875, 1.4721832275390625, 1.516754150390625, 1.5613250732421875, 1.60589599609375, 1.6504669189453125, 1.695037841796875, 1.7396087646484375, 1.7841796875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 10.0, 5.0, 9.0, 21.0, 48.0, 100.0, 188.0, 391.0, 852.0, 1993.0, 4632.0, 12509.0, 40569.0, 163176.0, 1927973.0, 1819187.0, 162554.0, 39744.0, 12450.0, 4435.0, 1905.0, 778.0, 417.0, 184.0, 71.0, 29.0, 20.0, 17.0, 8.0, 6.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9140625, -6.71649169921875, -6.5189208984375, -6.32135009765625, -6.123779296875, -5.92620849609375, -5.7286376953125, -5.53106689453125, -5.33349609375, -5.13592529296875, -4.9383544921875, -4.74078369140625, -4.543212890625, -4.34564208984375, -4.1480712890625, -3.95050048828125, -3.7529296875, -3.55535888671875, -3.3577880859375, -3.16021728515625, -2.962646484375, -2.76507568359375, -2.5675048828125, -2.36993408203125, -2.17236328125, -1.97479248046875, -1.7772216796875, -1.57965087890625, -1.382080078125, -1.18450927734375, -0.9869384765625, -0.78936767578125, -0.591796875, -0.39422607421875, -0.1966552734375, 0.00091552734375, 0.198486328125, 0.39605712890625, 0.5936279296875, 0.79119873046875, 0.98876953125, 1.18634033203125, 1.3839111328125, 1.58148193359375, 1.779052734375, 1.97662353515625, 2.1741943359375, 2.37176513671875, 2.5693359375, 2.76690673828125, 2.9644775390625, 3.16204833984375, 3.359619140625, 3.55718994140625, 3.7547607421875, 3.95233154296875, 4.14990234375, 4.34747314453125, 4.5450439453125, 4.74261474609375, 4.940185546875, 5.13775634765625, 5.3353271484375, 5.53289794921875, 5.73046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 5.0, 2.0, 7.0, 6.0, 8.0, 10.0, 11.0, 11.0, 12.0, 26.0, 32.0, 19.0, 47.0, 59.0, 92.0, 128.0, 178.0, 326.0, 542.0, 1086.0, 505.0, 260.0, 179.0, 137.0, 95.0, 70.0, 54.0, 36.0, 37.0, 20.0, 19.0, 14.0, 7.0, 4.0, 10.0, 2.0, 8.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.111328125, -2.0564727783203125, -2.001617431640625, -1.9467620849609375, -1.89190673828125, -1.8370513916015625, -1.782196044921875, -1.7273406982421875, -1.6724853515625, -1.6176300048828125, -1.562774658203125, -1.5079193115234375, -1.45306396484375, -1.3982086181640625, -1.343353271484375, -1.2884979248046875, -1.233642578125, -1.1787872314453125, -1.123931884765625, -1.0690765380859375, -1.01422119140625, -0.9593658447265625, -0.904510498046875, -0.8496551513671875, -0.7947998046875, -0.7399444580078125, -0.685089111328125, -0.6302337646484375, -0.57537841796875, -0.5205230712890625, -0.465667724609375, -0.4108123779296875, -0.35595703125, -0.3011016845703125, -0.246246337890625, -0.1913909912109375, -0.13653564453125, -0.0816802978515625, -0.026824951171875, 0.0280303955078125, 0.0828857421875, 0.1377410888671875, 0.192596435546875, 0.2474517822265625, 0.30230712890625, 0.3571624755859375, 0.412017822265625, 0.4668731689453125, 0.521728515625, 0.5765838623046875, 0.631439208984375, 0.6862945556640625, 0.74114990234375, 0.7960052490234375, 0.850860595703125, 0.9057159423828125, 0.9605712890625, 1.0154266357421875, 1.070281982421875, 1.1251373291015625, 1.17999267578125, 1.2348480224609375, 1.289703369140625, 1.3445587158203125, 1.3994140625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 7.0, 15.0, 17.0, 18.0, 38.0, 48.0, 63.0, 98.0, 108.0, 128.0, 97.0, 102.0, 71.0, 61.0, 58.0, 28.0, 16.0, 12.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.273287773132324, -14.823166847229004, -14.373045921325684, -13.922924995422363, -13.47280502319336, -13.022684097290039, -12.572563171386719, -12.122442245483398, -11.672321319580078, -11.222200393676758, -10.772079467773438, -10.321958541870117, -9.871837615966797, -9.421716690063477, -8.971596717834473, -8.521475791931152, -8.071354866027832, -7.621233940124512, -7.171113014221191, -6.720992565155029, -6.270871639251709, -5.820750713348389, -5.370630264282227, -4.920509338378906, -4.470388412475586, -4.020267486572266, -3.5701467990875244, -3.120026111602783, -2.669905185699463, -2.2197842597961426, -1.7696635723114014, -1.3195428848266602, -0.8694219589233398, -0.4193011522293091, 0.03081965446472168, 0.48094046115875244, 0.9310612678527832, 1.3811821937561035, 1.8313028812408447, 2.281423568725586, 2.7315444946289062, 3.1816654205322266, 3.6317861080169678, 4.081906795501709, 4.532027721405029, 4.98214864730835, 5.432269096374512, 5.882390022277832, 6.332510948181152, 6.782631874084473, 7.232752799987793, 7.682873249053955, 8.132993698120117, 8.583114624023438, 9.033235549926758, 9.483356475830078, 9.933477401733398, 10.383598327636719, 10.833719253540039, 11.28384017944336, 11.73396110534668, 12.18408203125, 12.634202003479004, 13.084322929382324, 13.534443855285645]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 9.0, 6.0, 8.0, 14.0, 18.0, 20.0, 22.0, 22.0, 24.0, 28.0, 37.0, 24.0, 32.0, 49.0, 33.0, 34.0, 43.0, 56.0, 47.0, 43.0, 46.0, 34.0, 31.0, 33.0, 34.0, 31.0, 35.0, 28.0, 23.0, 20.0, 13.0, 17.0, 11.0, 11.0, 9.0, 8.0, 4.0, 4.0, 3.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0], "bins": [-7.420932769775391, -7.196844577789307, -6.9727559089660645, -6.7486677169799805, -6.5245795249938965, -6.3004913330078125, -6.07640266418457, -5.852314472198486, -5.628226280212402, -5.404138088226318, -5.180049419403076, -4.955961227416992, -4.731873035430908, -4.507784843444824, -4.283696174621582, -4.059607982635498, -3.835519313812256, -3.6114308834075928, -3.387342691421509, -3.1632542610168457, -2.9391660690307617, -2.7150776386260986, -2.4909892082214355, -2.2669010162353516, -2.0428125858306885, -1.818724274635315, -1.5946359634399414, -1.3705475330352783, -1.1464592218399048, -0.9223709106445312, -0.6982824802398682, -0.47419416904449463, -0.2501058578491211, -0.02601751685142517, 0.19807082414627075, 0.42215919494628906, 0.6462475061416626, 0.8703358173370361, 1.0944242477416992, 1.3185125589370728, 1.5426008701324463, 1.7666891813278198, 1.9907774925231934, 2.2148659229278564, 2.4389543533325195, 2.6630425453186035, 2.8871309757232666, 3.1112194061279297, 3.3353075981140137, 3.5593960285186768, 3.7834842205047607, 4.007572650909424, 4.231660842895508, 4.45574951171875, 4.679837703704834, 4.903925895690918, 5.12801456451416, 5.352102756500244, 5.576191425323486, 5.80027961730957, 6.024367809295654, 6.248456001281738, 6.4725446701049805, 6.6966328620910645, 6.920721054077148]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 3.0, 6.0, 8.0, 18.0, 31.0, 28.0, 64.0, 90.0, 137.0, 215.0, 300.0, 540.0, 924.0, 1695.0, 3164.0, 6074.0, 12542.0, 26088.0, 55276.0, 119336.0, 265692.0, 296746.0, 137012.0, 63740.0, 29593.0, 14332.0, 6999.0, 3448.0, 1901.0, 1007.0, 608.0, 356.0, 195.0, 114.0, 90.0, 74.0, 39.0, 25.0, 17.0, 10.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.97265625, -4.81768798828125, -4.6627197265625, -4.50775146484375, -4.352783203125, -4.19781494140625, -4.0428466796875, -3.88787841796875, -3.73291015625, -3.57794189453125, -3.4229736328125, -3.26800537109375, -3.113037109375, -2.95806884765625, -2.8031005859375, -2.64813232421875, -2.4931640625, -2.33819580078125, -2.1832275390625, -2.02825927734375, -1.873291015625, -1.71832275390625, -1.5633544921875, -1.40838623046875, -1.25341796875, -1.09844970703125, -0.9434814453125, -0.78851318359375, -0.633544921875, -0.47857666015625, -0.3236083984375, -0.16864013671875, -0.013671875, 0.14129638671875, 0.2962646484375, 0.45123291015625, 0.606201171875, 0.76116943359375, 0.9161376953125, 1.07110595703125, 1.22607421875, 1.38104248046875, 1.5360107421875, 1.69097900390625, 1.845947265625, 2.00091552734375, 2.1558837890625, 2.31085205078125, 2.4658203125, 2.62078857421875, 2.7757568359375, 2.93072509765625, 3.085693359375, 3.24066162109375, 3.3956298828125, 3.55059814453125, 3.70556640625, 3.86053466796875, 4.0155029296875, 4.17047119140625, 4.325439453125, 4.48040771484375, 4.6353759765625, 4.79034423828125, 4.9453125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 13.0, 12.0, 16.0, 23.0, 33.0, 31.0, 51.0, 46.0, 62.0, 60.0, 66.0, 92.0, 62.0, 75.0, 63.0, 62.0, 44.0, 45.0, 38.0, 31.0, 24.0, 12.0, 13.0, 12.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8173828125, -0.776611328125, -0.73583984375, -0.695068359375, -0.654296875, -0.613525390625, -0.57275390625, -0.531982421875, -0.4912109375, -0.450439453125, -0.40966796875, -0.368896484375, -0.328125, -0.287353515625, -0.24658203125, -0.205810546875, -0.1650390625, -0.124267578125, -0.08349609375, -0.042724609375, -0.001953125, 0.038818359375, 0.07958984375, 0.120361328125, 0.1611328125, 0.201904296875, 0.24267578125, 0.283447265625, 0.32421875, 0.364990234375, 0.40576171875, 0.446533203125, 0.4873046875, 0.528076171875, 0.56884765625, 0.609619140625, 0.650390625, 0.691162109375, 0.73193359375, 0.772705078125, 0.8134765625, 0.854248046875, 0.89501953125, 0.935791015625, 0.9765625, 1.017333984375, 1.05810546875, 1.098876953125, 1.1396484375, 1.180419921875, 1.22119140625, 1.261962890625, 1.302734375, 1.343505859375, 1.38427734375, 1.425048828125, 1.4658203125, 1.506591796875, 1.54736328125, 1.588134765625, 1.62890625, 1.669677734375, 1.71044921875, 1.751220703125, 1.7919921875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 11.0, 11.0, 13.0, 22.0, 19.0, 34.0, 73.0, 101.0, 165.0, 263.0, 432.0, 854.0, 2119.0, 8335.0, 53929.0, 435585.0, 473931.0, 59244.0, 9036.0, 2249.0, 887.0, 454.0, 275.0, 170.0, 89.0, 67.0, 55.0, 32.0, 23.0, 26.0, 14.0, 13.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6484375, -10.31591796875, -9.9833984375, -9.65087890625, -9.318359375, -8.98583984375, -8.6533203125, -8.32080078125, -7.98828125, -7.65576171875, -7.3232421875, -6.99072265625, -6.658203125, -6.32568359375, -5.9931640625, -5.66064453125, -5.328125, -4.99560546875, -4.6630859375, -4.33056640625, -3.998046875, -3.66552734375, -3.3330078125, -3.00048828125, -2.66796875, -2.33544921875, -2.0029296875, -1.67041015625, -1.337890625, -1.00537109375, -0.6728515625, -0.34033203125, -0.0078125, 0.32470703125, 0.6572265625, 0.98974609375, 1.322265625, 1.65478515625, 1.9873046875, 2.31982421875, 2.65234375, 2.98486328125, 3.3173828125, 3.64990234375, 3.982421875, 4.31494140625, 4.6474609375, 4.97998046875, 5.3125, 5.64501953125, 5.9775390625, 6.31005859375, 6.642578125, 6.97509765625, 7.3076171875, 7.64013671875, 7.97265625, 8.30517578125, 8.6376953125, 8.97021484375, 9.302734375, 9.63525390625, 9.9677734375, 10.30029296875, 10.6328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 7.0, 5.0, 2.0, 15.0, 12.0, 14.0, 9.0, 19.0, 27.0, 37.0, 31.0, 52.0, 31.0, 33.0, 55.0, 43.0, 56.0, 45.0, 45.0, 46.0, 46.0, 39.0, 34.0, 36.0, 22.0, 49.0, 41.0, 30.0, 19.0, 30.0, 12.0, 19.0, 12.0, 15.0, 5.0, 2.0, 4.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.93304443359375, -3.7957763671875, -3.65850830078125, -3.521240234375, -3.38397216796875, -3.2467041015625, -3.10943603515625, -2.97216796875, -2.83489990234375, -2.6976318359375, -2.56036376953125, -2.423095703125, -2.28582763671875, -2.1485595703125, -2.01129150390625, -1.8740234375, -1.73675537109375, -1.5994873046875, -1.46221923828125, -1.324951171875, -1.18768310546875, -1.0504150390625, -0.91314697265625, -0.77587890625, -0.63861083984375, -0.5013427734375, -0.36407470703125, -0.226806640625, -0.08953857421875, 0.0477294921875, 0.18499755859375, 0.322265625, 0.45953369140625, 0.5968017578125, 0.73406982421875, 0.871337890625, 1.00860595703125, 1.1458740234375, 1.28314208984375, 1.42041015625, 1.55767822265625, 1.6949462890625, 1.83221435546875, 1.969482421875, 2.10675048828125, 2.2440185546875, 2.38128662109375, 2.5185546875, 2.65582275390625, 2.7930908203125, 2.93035888671875, 3.067626953125, 3.20489501953125, 3.3421630859375, 3.47943115234375, 3.61669921875, 3.75396728515625, 3.8912353515625, 4.02850341796875, 4.165771484375, 4.30303955078125, 4.4403076171875, 4.57757568359375, 4.71484375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 10.0, 14.0, 14.0, 17.0, 43.0, 83.0, 128.0, 215.0, 450.0, 932.0, 2573.0, 9168.0, 72736.0, 800379.0, 142804.0, 13410.0, 3243.0, 1219.0, 536.0, 267.0, 128.0, 75.0, 47.0, 22.0, 20.0, 12.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.59375, -11.2855224609375, -10.977294921875, -10.6690673828125, -10.36083984375, -10.0526123046875, -9.744384765625, -9.4361572265625, -9.1279296875, -8.8197021484375, -8.511474609375, -8.2032470703125, -7.89501953125, -7.5867919921875, -7.278564453125, -6.9703369140625, -6.662109375, -6.3538818359375, -6.045654296875, -5.7374267578125, -5.42919921875, -5.1209716796875, -4.812744140625, -4.5045166015625, -4.1962890625, -3.8880615234375, -3.579833984375, -3.2716064453125, -2.96337890625, -2.6551513671875, -2.346923828125, -2.0386962890625, -1.73046875, -1.4222412109375, -1.114013671875, -0.8057861328125, -0.49755859375, -0.1893310546875, 0.118896484375, 0.4271240234375, 0.7353515625, 1.0435791015625, 1.351806640625, 1.6600341796875, 1.96826171875, 2.2764892578125, 2.584716796875, 2.8929443359375, 3.201171875, 3.5093994140625, 3.817626953125, 4.1258544921875, 4.43408203125, 4.7423095703125, 5.050537109375, 5.3587646484375, 5.6669921875, 5.9752197265625, 6.283447265625, 6.5916748046875, 6.89990234375, 7.2081298828125, 7.516357421875, 7.8245849609375, 8.1328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 6.0, 2.0, 21.0, 35.0, 75.0, 167.0, 351.0, 159.0, 79.0, 53.0, 25.0, 12.0, 12.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00199127197265625, -0.0019215643405914307, -0.0018518567085266113, -0.001782149076461792, -0.0017124414443969727, -0.0016427338123321533, -0.001573026180267334, -0.0015033185482025146, -0.0014336109161376953, -0.001363903284072876, -0.0012941956520080566, -0.0012244880199432373, -0.001154780387878418, -0.0010850727558135986, -0.0010153651237487793, -0.00094565749168396, -0.0008759498596191406, -0.0008062422275543213, -0.000736534595489502, -0.0006668269634246826, -0.0005971193313598633, -0.0005274116992950439, -0.0004577040672302246, -0.0003879964351654053, -0.00031828880310058594, -0.0002485811710357666, -0.00017887353897094727, -0.00010916590690612793, -3.9458274841308594e-05, 3.0249357223510742e-05, 9.995698928833008e-05, 0.00016966462135314941, 0.00023937225341796875, 0.0003090798854827881, 0.0003787875175476074, 0.00044849514961242676, 0.0005182027816772461, 0.0005879104137420654, 0.0006576180458068848, 0.0007273256778717041, 0.0007970333099365234, 0.0008667409420013428, 0.0009364485740661621, 0.0010061562061309814, 0.0010758638381958008, 0.0011455714702606201, 0.0012152791023254395, 0.0012849867343902588, 0.0013546943664550781, 0.0014244019985198975, 0.0014941096305847168, 0.0015638172626495361, 0.0016335248947143555, 0.0017032325267791748, 0.0017729401588439941, 0.0018426477909088135, 0.0019123554229736328, 0.001982063055038452, 0.0020517706871032715, 0.002121478319168091, 0.00219118595123291, 0.0022608935832977295, 0.002330601215362549, 0.002400308847427368, 0.0024700164794921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 4.0, 10.0, 20.0, 26.0, 51.0, 121.0, 220.0, 535.0, 1512.0, 6682.0, 84407.0, 906704.0, 41502.0, 4706.0, 1234.0, 407.0, 204.0, 80.0, 46.0, 31.0, 16.0, 17.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.65625, -12.2257080078125, -11.795166015625, -11.3646240234375, -10.93408203125, -10.5035400390625, -10.072998046875, -9.6424560546875, -9.2119140625, -8.7813720703125, -8.350830078125, -7.9202880859375, -7.48974609375, -7.0592041015625, -6.628662109375, -6.1981201171875, -5.767578125, -5.3370361328125, -4.906494140625, -4.4759521484375, -4.04541015625, -3.6148681640625, -3.184326171875, -2.7537841796875, -2.3232421875, -1.8927001953125, -1.462158203125, -1.0316162109375, -0.60107421875, -0.1705322265625, 0.260009765625, 0.6905517578125, 1.12109375, 1.5516357421875, 1.982177734375, 2.4127197265625, 2.84326171875, 3.2738037109375, 3.704345703125, 4.1348876953125, 4.5654296875, 4.9959716796875, 5.426513671875, 5.8570556640625, 6.28759765625, 6.7181396484375, 7.148681640625, 7.5792236328125, 8.009765625, 8.4403076171875, 8.870849609375, 9.3013916015625, 9.73193359375, 10.1624755859375, 10.593017578125, 11.0235595703125, 11.4541015625, 11.8846435546875, 12.315185546875, 12.7457275390625, 13.17626953125, 13.6068115234375, 14.037353515625, 14.4678955078125, 14.8984375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 15.0, 25.0, 40.0, 81.0, 115.0, 226.0, 178.0, 110.0, 76.0, 42.0, 22.0, 12.0, 7.0, 7.0, 6.0, 4.0, 1.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.0703125, -6.85552978515625, -6.6407470703125, -6.42596435546875, -6.211181640625, -5.99639892578125, -5.7816162109375, -5.56683349609375, -5.35205078125, -5.13726806640625, -4.9224853515625, -4.70770263671875, -4.492919921875, -4.27813720703125, -4.0633544921875, -3.84857177734375, -3.6337890625, -3.41900634765625, -3.2042236328125, -2.98944091796875, -2.774658203125, -2.55987548828125, -2.3450927734375, -2.13031005859375, -1.91552734375, -1.70074462890625, -1.4859619140625, -1.27117919921875, -1.056396484375, -0.84161376953125, -0.6268310546875, -0.41204833984375, -0.197265625, 0.01751708984375, 0.2322998046875, 0.44708251953125, 0.661865234375, 0.87664794921875, 1.0914306640625, 1.30621337890625, 1.52099609375, 1.73577880859375, 1.9505615234375, 2.16534423828125, 2.380126953125, 2.59490966796875, 2.8096923828125, 3.02447509765625, 3.2392578125, 3.45404052734375, 3.6688232421875, 3.88360595703125, 4.098388671875, 4.31317138671875, 4.5279541015625, 4.74273681640625, 4.95751953125, 5.17230224609375, 5.3870849609375, 5.60186767578125, 5.816650390625, 6.03143310546875, 6.2462158203125, 6.46099853515625, 6.67578125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 6.0, 6.0, 2.0, 15.0, 28.0, 38.0, 60.0, 78.0, 99.0, 122.0, 140.0, 109.0, 97.0, 71.0, 56.0, 33.0, 18.0, 12.0, 3.0, 9.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.527965545654297, -30.051647186279297, -28.575326919555664, -27.09900665283203, -25.62268829345703, -24.14636993408203, -22.6700496673584, -21.193729400634766, -19.717411041259766, -18.241092681884766, -16.764772415161133, -15.288453102111816, -13.8121337890625, -12.335814476013184, -10.859495162963867, -9.38317584991455, -7.906856536865234, -6.430537223815918, -4.954217910766602, -3.477898597717285, -2.0015792846679688, -0.5252599716186523, 0.9510593414306641, 2.4273786544799805, 3.903697967529297, 5.380017280578613, 6.85633659362793, 8.332655906677246, 9.808975219726562, 11.285294532775879, 12.761613845825195, 14.237933158874512, 15.714248657226562, 17.190567016601562, 18.666887283325195, 20.143207550048828, 21.619525909423828, 23.095844268798828, 24.57216453552246, 26.048484802246094, 27.524803161621094, 29.001121520996094, 30.477441787719727, 31.95376205444336, 33.43008041381836, 34.90639877319336, 36.382720947265625, 37.859039306640625, 39.335357666015625, 40.811676025390625, 42.287994384765625, 43.76431655883789, 45.24063491821289, 46.71695327758789, 48.193275451660156, 49.669593811035156, 51.145912170410156, 52.622230529785156, 54.098548889160156, 55.57487106323242, 57.05118942260742, 58.52750778198242, 60.00382995605469, 61.48014831542969, 62.95646667480469]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 4.0, 9.0, 12.0, 11.0, 10.0, 13.0, 11.0, 18.0, 34.0, 18.0, 23.0, 29.0, 33.0, 31.0, 42.0, 33.0, 35.0, 37.0, 31.0, 54.0, 36.0, 42.0, 42.0, 30.0, 42.0, 47.0, 32.0, 34.0, 33.0, 29.0, 20.0, 25.0, 17.0, 17.0, 10.0, 11.0, 8.0, 5.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.010038375854492, -22.29205322265625, -21.574066162109375, -20.8560791015625, -20.138093948364258, -19.420108795166016, -18.70212173461914, -17.984134674072266, -17.266149520874023, -16.54816436767578, -15.830177307128906, -15.112191200256348, -14.394205093383789, -13.67621898651123, -12.958232879638672, -12.240246772766113, -11.522260665893555, -10.804274559020996, -10.086288452148438, -9.368302345275879, -8.65031623840332, -7.932330131530762, -7.214344024658203, -6.4963579177856445, -5.778371810913086, -5.060385704040527, -4.342399597167969, -3.62441349029541, -2.9064273834228516, -2.188441276550293, -1.4704551696777344, -0.7524690628051758, -0.034481048583984375, 0.6835050582885742, 1.4014911651611328, 2.1194772720336914, 2.83746337890625, 3.5554494857788086, 4.273435592651367, 4.991421699523926, 5.709407806396484, 6.427393913269043, 7.145380020141602, 7.86336612701416, 8.581352233886719, 9.299338340759277, 10.017324447631836, 10.735310554504395, 11.453296661376953, 12.171282768249512, 12.88926887512207, 13.607254981994629, 14.325241088867188, 15.043227195739746, 15.761213302612305, 16.479198455810547, 17.197185516357422, 17.915172576904297, 18.63315773010254, 19.35114288330078, 20.069129943847656, 20.78711700439453, 21.505102157592773, 22.223087310791016, 22.94107437133789]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 2.0, 5.0, 7.0, 12.0, 21.0, 32.0, 45.0, 80.0, 137.0, 299.0, 577.0, 1455.0, 4097.0, 13904.0, 57775.0, 473668.0, 3427544.0, 171025.0, 31203.0, 8125.0, 2507.0, 936.0, 393.0, 190.0, 115.0, 52.0, 29.0, 21.0, 9.0, 11.0, 2.0, 8.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7421875, -8.4796142578125, -8.217041015625, -7.9544677734375, -7.69189453125, -7.4293212890625, -7.166748046875, -6.9041748046875, -6.6416015625, -6.3790283203125, -6.116455078125, -5.8538818359375, -5.59130859375, -5.3287353515625, -5.066162109375, -4.8035888671875, -4.541015625, -4.2784423828125, -4.015869140625, -3.7532958984375, -3.49072265625, -3.2281494140625, -2.965576171875, -2.7030029296875, -2.4404296875, -2.1778564453125, -1.915283203125, -1.6527099609375, -1.39013671875, -1.1275634765625, -0.864990234375, -0.6024169921875, -0.33984375, -0.0772705078125, 0.185302734375, 0.4478759765625, 0.71044921875, 0.9730224609375, 1.235595703125, 1.4981689453125, 1.7607421875, 2.0233154296875, 2.285888671875, 2.5484619140625, 2.81103515625, 3.0736083984375, 3.336181640625, 3.5987548828125, 3.861328125, 4.1239013671875, 4.386474609375, 4.6490478515625, 4.91162109375, 5.1741943359375, 5.436767578125, 5.6993408203125, 5.9619140625, 6.2244873046875, 6.487060546875, 6.7496337890625, 7.01220703125, 7.2747802734375, 7.537353515625, 7.7999267578125, 8.0625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 6.0, 9.0, 12.0, 12.0, 18.0, 24.0, 31.0, 33.0, 37.0, 42.0, 48.0, 50.0, 69.0, 66.0, 74.0, 54.0, 61.0, 66.0, 47.0, 48.0, 35.0, 33.0, 18.0, 39.0, 16.0, 16.0, 8.0, 11.0, 3.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98681640625, -0.9483108520507812, -0.9098052978515625, -0.8712997436523438, -0.832794189453125, -0.7942886352539062, -0.7557830810546875, -0.7172775268554688, -0.67877197265625, -0.6402664184570312, -0.6017608642578125, -0.5632553100585938, -0.524749755859375, -0.48624420166015625, -0.4477386474609375, -0.40923309326171875, -0.3707275390625, -0.33222198486328125, -0.2937164306640625, -0.25521087646484375, -0.216705322265625, -0.17819976806640625, -0.1396942138671875, -0.10118865966796875, -0.06268310546875, -0.02417755126953125, 0.0143280029296875, 0.05283355712890625, 0.091339111328125, 0.12984466552734375, 0.1683502197265625, 0.20685577392578125, 0.245361328125, 0.28386688232421875, 0.3223724365234375, 0.36087799072265625, 0.399383544921875, 0.43788909912109375, 0.4763946533203125, 0.5149002075195312, 0.55340576171875, 0.5919113159179688, 0.6304168701171875, 0.6689224243164062, 0.707427978515625, 0.7459335327148438, 0.7844390869140625, 0.8229446411132812, 0.8614501953125, 0.8999557495117188, 0.9384613037109375, 0.9769668579101562, 1.015472412109375, 1.0539779663085938, 1.0924835205078125, 1.1309890747070312, 1.16949462890625, 1.2080001831054688, 1.2465057373046875, 1.2850112915039062, 1.323516845703125, 1.3620223999023438, 1.4005279541015625, 1.4390335083007812, 1.4775390625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 12.0, 14.0, 22.0, 28.0, 35.0, 58.0, 100.0, 117.0, 212.0, 378.0, 679.0, 1371.0, 2876.0, 6586.0, 16362.0, 46483.0, 157413.0, 904161.0, 2629876.0, 305319.0, 78195.0, 25717.0, 9904.0, 4205.0, 1930.0, 948.0, 490.0, 299.0, 165.0, 106.0, 67.0, 37.0, 26.0, 23.0, 23.0, 11.0, 7.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-5.89453125, -5.7271728515625, -5.559814453125, -5.3924560546875, -5.22509765625, -5.0577392578125, -4.890380859375, -4.7230224609375, -4.5556640625, -4.3883056640625, -4.220947265625, -4.0535888671875, -3.88623046875, -3.7188720703125, -3.551513671875, -3.3841552734375, -3.216796875, -3.0494384765625, -2.882080078125, -2.7147216796875, -2.54736328125, -2.3800048828125, -2.212646484375, -2.0452880859375, -1.8779296875, -1.7105712890625, -1.543212890625, -1.3758544921875, -1.20849609375, -1.0411376953125, -0.873779296875, -0.7064208984375, -0.5390625, -0.3717041015625, -0.204345703125, -0.0369873046875, 0.13037109375, 0.2977294921875, 0.465087890625, 0.6324462890625, 0.7998046875, 0.9671630859375, 1.134521484375, 1.3018798828125, 1.46923828125, 1.6365966796875, 1.803955078125, 1.9713134765625, 2.138671875, 2.3060302734375, 2.473388671875, 2.6407470703125, 2.80810546875, 2.9754638671875, 3.142822265625, 3.3101806640625, 3.4775390625, 3.6448974609375, 3.812255859375, 3.9796142578125, 4.14697265625, 4.3143310546875, 4.481689453125, 4.6490478515625, 4.81640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 8.0, 6.0, 8.0, 18.0, 21.0, 15.0, 29.0, 39.0, 60.0, 81.0, 154.0, 221.0, 449.0, 1015.0, 843.0, 418.0, 245.0, 131.0, 93.0, 76.0, 47.0, 28.0, 23.0, 13.0, 8.0, 9.0, 7.0, 8.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.83221435546875, -2.7406005859375, -2.64898681640625, -2.557373046875, -2.46575927734375, -2.3741455078125, -2.28253173828125, -2.19091796875, -2.09930419921875, -2.0076904296875, -1.91607666015625, -1.824462890625, -1.73284912109375, -1.6412353515625, -1.54962158203125, -1.4580078125, -1.36639404296875, -1.2747802734375, -1.18316650390625, -1.091552734375, -0.99993896484375, -0.9083251953125, -0.81671142578125, -0.72509765625, -0.63348388671875, -0.5418701171875, -0.45025634765625, -0.358642578125, -0.26702880859375, -0.1754150390625, -0.08380126953125, 0.0078125, 0.09942626953125, 0.1910400390625, 0.28265380859375, 0.374267578125, 0.46588134765625, 0.5574951171875, 0.64910888671875, 0.74072265625, 0.83233642578125, 0.9239501953125, 1.01556396484375, 1.107177734375, 1.19879150390625, 1.2904052734375, 1.38201904296875, 1.4736328125, 1.56524658203125, 1.6568603515625, 1.74847412109375, 1.840087890625, 1.93170166015625, 2.0233154296875, 2.11492919921875, 2.20654296875, 2.29815673828125, 2.3897705078125, 2.48138427734375, 2.572998046875, 2.66461181640625, 2.7562255859375, 2.84783935546875, 2.939453125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 16.0, 17.0, 31.0, 54.0, 81.0, 89.0, 129.0, 113.0, 101.0, 101.0, 78.0, 66.0, 37.0, 31.0, 18.0, 12.0, 7.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.346874237060547, -19.683998107910156, -19.0211238861084, -18.358247756958008, -17.695371627807617, -17.03249740600586, -16.36962127685547, -15.706746101379395, -15.04387092590332, -14.380995750427246, -13.718119621276855, -13.055244445800781, -12.392369270324707, -11.729494094848633, -11.066617965698242, -10.403742790222168, -9.740866661071777, -9.077991485595703, -8.415115356445312, -7.752240180969238, -7.089365005493164, -6.426489353179932, -5.763613700866699, -5.100738525390625, -4.437862873077393, -3.7749874591827393, -3.112112045288086, -2.4492363929748535, -1.7863609790802002, -1.1234855651855469, -0.46060991287231445, 0.20226526260375977, 0.8651409149169922, 1.5280163288116455, 2.190891742706299, 2.8537673950195312, 3.5166428089141846, 4.179518222808838, 4.84239387512207, 5.5052690505981445, 6.168144702911377, 6.831020355224609, 7.493895530700684, 8.156770706176758, 8.819646835327148, 9.482522010803223, 10.145397186279297, 10.808273315429688, 11.471148490905762, 12.134023666381836, 12.796899795532227, 13.4597749710083, 14.122650146484375, 14.785526275634766, 15.44840145111084, 16.111276626586914, 16.774152755737305, 17.437028884887695, 18.099903106689453, 18.762779235839844, 19.425655364990234, 20.088529586791992, 20.751405715942383, 21.41427993774414, 22.07715606689453]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 2.0, 10.0, 11.0, 3.0, 19.0, 12.0, 20.0, 24.0, 22.0, 26.0, 21.0, 25.0, 29.0, 23.0, 39.0, 40.0, 49.0, 41.0, 35.0, 43.0, 36.0, 41.0, 39.0, 31.0, 35.0, 46.0, 31.0, 30.0, 25.0, 30.0, 21.0, 13.0, 24.0, 15.0, 13.0, 13.0, 15.0, 14.0, 6.0, 7.0, 5.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.615211486816406, -9.32125473022461, -9.027297973632812, -8.7333402633667, -8.439383506774902, -8.145426750183105, -7.851469993591309, -7.557513236999512, -7.263556003570557, -6.96959924697876, -6.675642013549805, -6.381685256958008, -6.087728500366211, -5.793771266937256, -5.499814510345459, -5.205857276916504, -4.911900520324707, -4.61794376373291, -4.323986530303955, -4.030029773712158, -3.7360727787017822, -3.4421157836914062, -3.1481590270996094, -2.8542020320892334, -2.5602450370788574, -2.2662880420684814, -1.972331166267395, -1.6783742904663086, -1.3844172954559326, -1.0904603004455566, -0.7965034246444702, -0.5025465488433838, -0.20859050750732422, 0.08536642789840698, 0.3793233633041382, 0.6732802987098694, 0.9672372341156006, 1.2611942291259766, 1.555151104927063, 1.8491079807281494, 2.1430649757385254, 2.4370219707489014, 2.7309789657592773, 3.024935722351074, 3.31889271736145, 3.612849712371826, 3.906806468963623, 4.200763702392578, 4.494720458984375, 4.788677215576172, 5.082634449005127, 5.376591205596924, 5.670548439025879, 5.964505195617676, 6.258461952209473, 6.5524187088012695, 6.846375942230225, 7.1403326988220215, 7.434289932250977, 7.728246688842773, 8.02220344543457, 8.316160202026367, 8.61011791229248, 8.904074668884277, 9.198031425476074]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 11.0, 13.0, 19.0, 22.0, 46.0, 72.0, 94.0, 139.0, 259.0, 361.0, 563.0, 910.0, 1508.0, 2616.0, 4153.0, 7256.0, 12388.0, 21949.0, 39180.0, 74059.0, 286151.0, 399812.0, 92428.0, 44480.0, 25264.0, 14382.0, 8227.0, 4920.0, 2781.0, 1702.0, 989.0, 626.0, 392.0, 283.0, 163.0, 111.0, 60.0, 49.0, 27.0, 20.0, 24.0, 17.0, 5.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4140625, -4.26751708984375, -4.1209716796875, -3.97442626953125, -3.827880859375, -3.68133544921875, -3.5347900390625, -3.38824462890625, -3.24169921875, -3.09515380859375, -2.9486083984375, -2.80206298828125, -2.655517578125, -2.50897216796875, -2.3624267578125, -2.21588134765625, -2.0693359375, -1.92279052734375, -1.7762451171875, -1.62969970703125, -1.483154296875, -1.33660888671875, -1.1900634765625, -1.04351806640625, -0.89697265625, -0.75042724609375, -0.6038818359375, -0.45733642578125, -0.310791015625, -0.16424560546875, -0.0177001953125, 0.12884521484375, 0.275390625, 0.42193603515625, 0.5684814453125, 0.71502685546875, 0.861572265625, 1.00811767578125, 1.1546630859375, 1.30120849609375, 1.44775390625, 1.59429931640625, 1.7408447265625, 1.88739013671875, 2.033935546875, 2.18048095703125, 2.3270263671875, 2.47357177734375, 2.6201171875, 2.76666259765625, 2.9132080078125, 3.05975341796875, 3.206298828125, 3.35284423828125, 3.4993896484375, 3.64593505859375, 3.79248046875, 3.93902587890625, 4.0855712890625, 4.23211669921875, 4.378662109375, 4.52520751953125, 4.6717529296875, 4.81829833984375, 4.96484375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 4.0, 6.0, 9.0, 5.0, 6.0, 10.0, 14.0, 21.0, 18.0, 30.0, 33.0, 38.0, 42.0, 49.0, 51.0, 47.0, 59.0, 45.0, 77.0, 65.0, 45.0, 45.0, 42.0, 40.0, 38.0, 32.0, 33.0, 28.0, 20.0, 15.0, 10.0, 13.0, 7.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78515625, -0.747955322265625, -0.71075439453125, -0.673553466796875, -0.6363525390625, -0.599151611328125, -0.56195068359375, -0.524749755859375, -0.487548828125, -0.450347900390625, -0.41314697265625, -0.375946044921875, -0.3387451171875, -0.301544189453125, -0.26434326171875, -0.227142333984375, -0.18994140625, -0.152740478515625, -0.11553955078125, -0.078338623046875, -0.0411376953125, -0.003936767578125, 0.03326416015625, 0.070465087890625, 0.107666015625, 0.144866943359375, 0.18206787109375, 0.219268798828125, 0.2564697265625, 0.293670654296875, 0.33087158203125, 0.368072509765625, 0.4052734375, 0.442474365234375, 0.47967529296875, 0.516876220703125, 0.5540771484375, 0.591278076171875, 0.62847900390625, 0.665679931640625, 0.702880859375, 0.740081787109375, 0.77728271484375, 0.814483642578125, 0.8516845703125, 0.888885498046875, 0.92608642578125, 0.963287353515625, 1.00048828125, 1.037689208984375, 1.07489013671875, 1.112091064453125, 1.1492919921875, 1.186492919921875, 1.22369384765625, 1.260894775390625, 1.298095703125, 1.335296630859375, 1.37249755859375, 1.409698486328125, 1.4468994140625, 1.484100341796875, 1.52130126953125, 1.558502197265625, 1.595703125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 1.0, 2.0, 12.0, 7.0, 29.0, 18.0, 24.0, 45.0, 53.0, 83.0, 130.0, 171.0, 225.0, 425.0, 766.0, 1756.0, 5154.0, 20412.0, 100301.0, 757165.0, 126263.0, 25323.0, 6117.0, 1870.0, 843.0, 473.0, 261.0, 175.0, 136.0, 83.0, 63.0, 37.0, 36.0, 24.0, 24.0, 13.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.3359375, -9.997802734375, -9.65966796875, -9.321533203125, -8.9833984375, -8.645263671875, -8.30712890625, -7.968994140625, -7.630859375, -7.292724609375, -6.95458984375, -6.616455078125, -6.2783203125, -5.940185546875, -5.60205078125, -5.263916015625, -4.92578125, -4.587646484375, -4.24951171875, -3.911376953125, -3.5732421875, -3.235107421875, -2.89697265625, -2.558837890625, -2.220703125, -1.882568359375, -1.54443359375, -1.206298828125, -0.8681640625, -0.530029296875, -0.19189453125, 0.146240234375, 0.484375, 0.822509765625, 1.16064453125, 1.498779296875, 1.8369140625, 2.175048828125, 2.51318359375, 2.851318359375, 3.189453125, 3.527587890625, 3.86572265625, 4.203857421875, 4.5419921875, 4.880126953125, 5.21826171875, 5.556396484375, 5.89453125, 6.232666015625, 6.57080078125, 6.908935546875, 7.2470703125, 7.585205078125, 7.92333984375, 8.261474609375, 8.599609375, 8.937744140625, 9.27587890625, 9.614013671875, 9.9521484375, 10.290283203125, 10.62841796875, 10.966552734375, 11.3046875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 2.0, 3.0, 7.0, 5.0, 11.0, 13.0, 13.0, 12.0, 13.0, 16.0, 27.0, 34.0, 31.0, 30.0, 35.0, 49.0, 49.0, 39.0, 44.0, 40.0, 61.0, 51.0, 54.0, 40.0, 42.0, 39.0, 36.0, 35.0, 38.0, 24.0, 23.0, 14.0, 8.0, 9.0, 11.0, 10.0, 5.0, 3.0, 3.0, 4.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.65625, -4.508056640625, -4.35986328125, -4.211669921875, -4.0634765625, -3.915283203125, -3.76708984375, -3.618896484375, -3.470703125, -3.322509765625, -3.17431640625, -3.026123046875, -2.8779296875, -2.729736328125, -2.58154296875, -2.433349609375, -2.28515625, -2.136962890625, -1.98876953125, -1.840576171875, -1.6923828125, -1.544189453125, -1.39599609375, -1.247802734375, -1.099609375, -0.951416015625, -0.80322265625, -0.655029296875, -0.5068359375, -0.358642578125, -0.21044921875, -0.062255859375, 0.0859375, 0.234130859375, 0.38232421875, 0.530517578125, 0.6787109375, 0.826904296875, 0.97509765625, 1.123291015625, 1.271484375, 1.419677734375, 1.56787109375, 1.716064453125, 1.8642578125, 2.012451171875, 2.16064453125, 2.308837890625, 2.45703125, 2.605224609375, 2.75341796875, 2.901611328125, 3.0498046875, 3.197998046875, 3.34619140625, 3.494384765625, 3.642578125, 3.790771484375, 3.93896484375, 4.087158203125, 4.2353515625, 4.383544921875, 4.53173828125, 4.679931640625, 4.828125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 11.0, 21.0, 26.0, 53.0, 70.0, 133.0, 429.0, 1388.0, 8449.0, 87626.0, 890544.0, 52484.0, 5575.0, 1096.0, 327.0, 125.0, 76.0, 38.0, 18.0, 16.0, 13.0, 9.0, 9.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0078125, -10.6334228515625, -10.259033203125, -9.8846435546875, -9.51025390625, -9.1358642578125, -8.761474609375, -8.3870849609375, -8.0126953125, -7.6383056640625, -7.263916015625, -6.8895263671875, -6.51513671875, -6.1407470703125, -5.766357421875, -5.3919677734375, -5.017578125, -4.6431884765625, -4.268798828125, -3.8944091796875, -3.52001953125, -3.1456298828125, -2.771240234375, -2.3968505859375, -2.0224609375, -1.6480712890625, -1.273681640625, -0.8992919921875, -0.52490234375, -0.1505126953125, 0.223876953125, 0.5982666015625, 0.97265625, 1.3470458984375, 1.721435546875, 2.0958251953125, 2.47021484375, 2.8446044921875, 3.218994140625, 3.5933837890625, 3.9677734375, 4.3421630859375, 4.716552734375, 5.0909423828125, 5.46533203125, 5.8397216796875, 6.214111328125, 6.5885009765625, 6.962890625, 7.3372802734375, 7.711669921875, 8.0860595703125, 8.46044921875, 8.8348388671875, 9.209228515625, 9.5836181640625, 9.9580078125, 10.3323974609375, 10.706787109375, 11.0811767578125, 11.45556640625, 11.8299560546875, 12.204345703125, 12.5787353515625, 12.953125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 20.0, 18.0, 25.0, 27.0, 38.0, 41.0, 163.0, 322.0, 130.0, 58.0, 34.0, 22.0, 27.0, 9.0, 5.0, 4.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.001850128173828125, -0.0018065646290779114, -0.0017630010843276978, -0.0017194375395774841, -0.0016758739948272705, -0.0016323104500770569, -0.0015887469053268433, -0.0015451833605766296, -0.001501619815826416, -0.0014580562710762024, -0.0014144927263259888, -0.0013709291815757751, -0.0013273656368255615, -0.001283802092075348, -0.0012402385473251343, -0.0011966750025749207, -0.001153111457824707, -0.0011095479130744934, -0.0010659843683242798, -0.0010224208235740662, -0.0009788572788238525, -0.0009352937340736389, -0.0008917301893234253, -0.0008481666445732117, -0.000804603099822998, -0.0007610395550727844, -0.0007174760103225708, -0.0006739124655723572, -0.0006303489208221436, -0.0005867853760719299, -0.0005432218313217163, -0.0004996582865715027, -0.00045609474182128906, -0.00041253119707107544, -0.0003689676523208618, -0.0003254041075706482, -0.00028184056282043457, -0.00023827701807022095, -0.00019471347332000732, -0.0001511499285697937, -0.00010758638381958008, -6.402283906936646e-05, -2.0459294319152832e-05, 2.310425043106079e-05, 6.666779518127441e-05, 0.00011023133993148804, 0.00015379488468170166, 0.00019735842943191528, 0.0002409219741821289, 0.00028448551893234253, 0.00032804906368255615, 0.0003716126084327698, 0.0004151761531829834, 0.000458739697933197, 0.0005023032426834106, 0.0005458667874336243, 0.0005894303321838379, 0.0006329938769340515, 0.0006765574216842651, 0.0007201209664344788, 0.0007636845111846924, 0.000807248055934906, 0.0008508116006851196, 0.0008943751454353333, 0.0009379386901855469]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 7.0, 20.0, 24.0, 56.0, 88.0, 157.0, 357.0, 981.0, 5297.0, 78868.0, 921461.0, 36593.0, 3226.0, 744.0, 310.0, 136.0, 87.0, 36.0, 29.0, 20.0, 14.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4921875, -11.0565185546875, -10.620849609375, -10.1851806640625, -9.74951171875, -9.3138427734375, -8.878173828125, -8.4425048828125, -8.0068359375, -7.5711669921875, -7.135498046875, -6.6998291015625, -6.26416015625, -5.8284912109375, -5.392822265625, -4.9571533203125, -4.521484375, -4.0858154296875, -3.650146484375, -3.2144775390625, -2.77880859375, -2.3431396484375, -1.907470703125, -1.4718017578125, -1.0361328125, -0.6004638671875, -0.164794921875, 0.2708740234375, 0.70654296875, 1.1422119140625, 1.577880859375, 2.0135498046875, 2.44921875, 2.8848876953125, 3.320556640625, 3.7562255859375, 4.19189453125, 4.6275634765625, 5.063232421875, 5.4989013671875, 5.9345703125, 6.3702392578125, 6.805908203125, 7.2415771484375, 7.67724609375, 8.1129150390625, 8.548583984375, 8.9842529296875, 9.419921875, 9.8555908203125, 10.291259765625, 10.7269287109375, 11.16259765625, 11.5982666015625, 12.033935546875, 12.4696044921875, 12.9052734375, 13.3409423828125, 13.776611328125, 14.2122802734375, 14.64794921875, 15.0836181640625, 15.519287109375, 15.9549560546875, 16.390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 6.0, 6.0, 7.0, 13.0, 7.0, 10.0, 15.0, 19.0, 22.0, 41.0, 65.0, 138.0, 193.0, 171.0, 82.0, 44.0, 24.0, 22.0, 18.0, 16.0, 12.0, 12.0, 11.0, 4.0, 8.0, 4.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.08203125, -3.93988037109375, -3.7977294921875, -3.65557861328125, -3.513427734375, -3.37127685546875, -3.2291259765625, -3.08697509765625, -2.94482421875, -2.80267333984375, -2.6605224609375, -2.51837158203125, -2.376220703125, -2.23406982421875, -2.0919189453125, -1.94976806640625, -1.8076171875, -1.66546630859375, -1.5233154296875, -1.38116455078125, -1.239013671875, -1.09686279296875, -0.9547119140625, -0.81256103515625, -0.67041015625, -0.52825927734375, -0.3861083984375, -0.24395751953125, -0.101806640625, 0.04034423828125, 0.1824951171875, 0.32464599609375, 0.466796875, 0.60894775390625, 0.7510986328125, 0.89324951171875, 1.035400390625, 1.17755126953125, 1.3197021484375, 1.46185302734375, 1.60400390625, 1.74615478515625, 1.8883056640625, 2.03045654296875, 2.172607421875, 2.31475830078125, 2.4569091796875, 2.59906005859375, 2.7412109375, 2.88336181640625, 3.0255126953125, 3.16766357421875, 3.309814453125, 3.45196533203125, 3.5941162109375, 3.73626708984375, 3.87841796875, 4.02056884765625, 4.1627197265625, 4.30487060546875, 4.447021484375, 4.58917236328125, 4.7313232421875, 4.87347412109375, 5.015625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 6.0, 9.0, 26.0, 80.0, 161.0, 236.0, 228.0, 142.0, 68.0, 29.0, 11.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-80.44749450683594, -77.3449478149414, -74.24240112304688, -71.13985443115234, -68.03730773925781, -64.93476867675781, -61.832218170166016, -58.72967529296875, -55.62712860107422, -52.52458190917969, -49.422035217285156, -46.319488525390625, -43.21694564819336, -40.11439895629883, -37.0118522644043, -33.90930938720703, -30.806758880615234, -27.704212188720703, -24.601667404174805, -21.499120712280273, -18.396575927734375, -15.294029235839844, -12.191482543945312, -9.088937759399414, -5.986391067504883, -2.883845090866089, 0.21870088577270508, 3.321247100830078, 6.423792839050293, 9.526338577270508, 12.628885269165039, 15.731430053710938, 18.83397674560547, 21.9365234375, 25.0390682220459, 28.14161491394043, 31.244159698486328, 34.34670639038086, 37.44925308227539, 40.551795959472656, 43.65434265136719, 46.75688934326172, 49.85943603515625, 52.96198272705078, 56.06452560424805, 59.16707229614258, 62.26961898803711, 65.37216186523438, 68.47471618652344, 71.57726287841797, 74.6798095703125, 77.78235626220703, 80.88490295410156, 83.98744201660156, 87.08999633789062, 90.19253540039062, 93.29508209228516, 96.39762878417969, 99.50017547607422, 102.60272216796875, 105.70526885986328, 108.80781555175781, 111.91035461425781, 115.01290130615234, 118.11544799804688]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 4.0, 11.0, 13.0, 10.0, 9.0, 20.0, 16.0, 23.0, 23.0, 22.0, 31.0, 33.0, 31.0, 38.0, 55.0, 29.0, 47.0, 39.0, 44.0, 38.0, 41.0, 47.0, 34.0, 45.0, 40.0, 39.0, 31.0, 34.0, 21.0, 15.0, 18.0, 16.0, 16.0, 16.0, 11.0, 7.0, 5.0, 3.0, 4.0, 6.0, 3.0, 2.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-24.649288177490234, -23.865467071533203, -23.081645965576172, -22.29782485961914, -21.51400375366211, -20.730182647705078, -19.946361541748047, -19.162540435791016, -18.378719329833984, -17.594898223876953, -16.811077117919922, -16.02725601196289, -15.24343490600586, -14.459613800048828, -13.675793647766113, -12.891972541809082, -12.108152389526367, -11.324331283569336, -10.540510177612305, -9.756689071655273, -8.972867965698242, -8.189046859741211, -7.405226707458496, -6.621405601501465, -5.837584495544434, -5.053763389587402, -4.269942283630371, -3.486121654510498, -2.702300548553467, -1.9184794425964355, -1.1346588134765625, -0.35083770751953125, 0.4329833984375, 1.2168043851852417, 2.0006253719329834, 2.7844462394714355, 3.568267345428467, 4.352088451385498, 5.135909080505371, 5.919730186462402, 6.703551292419434, 7.487372398376465, 8.271193504333496, 9.055013656616211, 9.838834762573242, 10.622655868530273, 11.406476974487305, 12.190298080444336, 12.974119186401367, 13.757940292358398, 14.54176139831543, 15.325582504272461, 16.109403610229492, 16.893224716186523, 17.677043914794922, 18.460865020751953, 19.244686126708984, 20.028507232666016, 20.812328338623047, 21.596149444580078, 22.37997055053711, 23.16379165649414, 23.947612762451172, 24.731433868408203, 25.515254974365234]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 3.0, 9.0, 16.0, 25.0, 30.0, 40.0, 82.0, 109.0, 191.0, 332.0, 588.0, 1048.0, 2060.0, 4309.0, 9408.0, 23961.0, 69361.0, 331414.0, 3310059.0, 329792.0, 69781.0, 23620.0, 9420.0, 4210.0, 2010.0, 1064.0, 545.0, 314.0, 165.0, 121.0, 63.0, 35.0, 33.0, 19.0, 12.0, 12.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.4921875, -7.2811279296875, -7.070068359375, -6.8590087890625, -6.64794921875, -6.4368896484375, -6.225830078125, -6.0147705078125, -5.8037109375, -5.5926513671875, -5.381591796875, -5.1705322265625, -4.95947265625, -4.7484130859375, -4.537353515625, -4.3262939453125, -4.115234375, -3.9041748046875, -3.693115234375, -3.4820556640625, -3.27099609375, -3.0599365234375, -2.848876953125, -2.6378173828125, -2.4267578125, -2.2156982421875, -2.004638671875, -1.7935791015625, -1.58251953125, -1.3714599609375, -1.160400390625, -0.9493408203125, -0.73828125, -0.5272216796875, -0.316162109375, -0.1051025390625, 0.10595703125, 0.3170166015625, 0.528076171875, 0.7391357421875, 0.9501953125, 1.1612548828125, 1.372314453125, 1.5833740234375, 1.79443359375, 2.0054931640625, 2.216552734375, 2.4276123046875, 2.638671875, 2.8497314453125, 3.060791015625, 3.2718505859375, 3.48291015625, 3.6939697265625, 3.905029296875, 4.1160888671875, 4.3271484375, 4.5382080078125, 4.749267578125, 4.9603271484375, 5.17138671875, 5.3824462890625, 5.593505859375, 5.8045654296875, 6.015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 1.0, 7.0, 7.0, 10.0, 19.0, 22.0, 30.0, 43.0, 42.0, 40.0, 48.0, 54.0, 73.0, 60.0, 64.0, 62.0, 62.0, 75.0, 45.0, 41.0, 56.0, 37.0, 26.0, 18.0, 17.0, 13.0, 6.0, 10.0, 7.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.12109375, -1.0735015869140625, -1.025909423828125, -0.9783172607421875, -0.93072509765625, -0.8831329345703125, -0.835540771484375, -0.7879486083984375, -0.7403564453125, -0.6927642822265625, -0.645172119140625, -0.5975799560546875, -0.54998779296875, -0.5023956298828125, -0.454803466796875, -0.4072113037109375, -0.359619140625, -0.3120269775390625, -0.264434814453125, -0.2168426513671875, -0.16925048828125, -0.1216583251953125, -0.074066162109375, -0.0264739990234375, 0.0211181640625, 0.0687103271484375, 0.116302490234375, 0.1638946533203125, 0.21148681640625, 0.2590789794921875, 0.306671142578125, 0.3542633056640625, 0.40185546875, 0.4494476318359375, 0.497039794921875, 0.5446319580078125, 0.59222412109375, 0.6398162841796875, 0.687408447265625, 0.7350006103515625, 0.7825927734375, 0.8301849365234375, 0.877777099609375, 0.9253692626953125, 0.97296142578125, 1.0205535888671875, 1.068145751953125, 1.1157379150390625, 1.163330078125, 1.2109222412109375, 1.258514404296875, 1.3061065673828125, 1.35369873046875, 1.4012908935546875, 1.448883056640625, 1.4964752197265625, 1.5440673828125, 1.5916595458984375, 1.639251708984375, 1.6868438720703125, 1.73443603515625, 1.7820281982421875, 1.829620361328125, 1.8772125244140625, 1.9248046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 10.0, 5.0, 19.0, 20.0, 61.0, 82.0, 180.0, 389.0, 794.0, 1856.0, 4622.0, 12678.0, 41223.0, 188084.0, 2901714.0, 895106.0, 105325.0, 27106.0, 8964.0, 3336.0, 1432.0, 630.0, 284.0, 152.0, 82.0, 37.0, 29.0, 18.0, 16.0, 10.0, 8.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.88671875, -7.646484375, -7.40625, -7.166015625, -6.92578125, -6.685546875, -6.4453125, -6.205078125, -5.96484375, -5.724609375, -5.484375, -5.244140625, -5.00390625, -4.763671875, -4.5234375, -4.283203125, -4.04296875, -3.802734375, -3.5625, -3.322265625, -3.08203125, -2.841796875, -2.6015625, -2.361328125, -2.12109375, -1.880859375, -1.640625, -1.400390625, -1.16015625, -0.919921875, -0.6796875, -0.439453125, -0.19921875, 0.041015625, 0.28125, 0.521484375, 0.76171875, 1.001953125, 1.2421875, 1.482421875, 1.72265625, 1.962890625, 2.203125, 2.443359375, 2.68359375, 2.923828125, 3.1640625, 3.404296875, 3.64453125, 3.884765625, 4.125, 4.365234375, 4.60546875, 4.845703125, 5.0859375, 5.326171875, 5.56640625, 5.806640625, 6.046875, 6.287109375, 6.52734375, 6.767578125, 7.0078125, 7.248046875, 7.48828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 6.0, 3.0, 6.0, 9.0, 11.0, 18.0, 22.0, 36.0, 50.0, 71.0, 91.0, 129.0, 221.0, 374.0, 927.0, 1002.0, 404.0, 221.0, 137.0, 96.0, 58.0, 47.0, 34.0, 24.0, 23.0, 15.0, 7.0, 9.0, 5.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.43450927734375, -2.3533935546875, -2.27227783203125, -2.191162109375, -2.11004638671875, -2.0289306640625, -1.94781494140625, -1.86669921875, -1.78558349609375, -1.7044677734375, -1.62335205078125, -1.542236328125, -1.46112060546875, -1.3800048828125, -1.29888916015625, -1.2177734375, -1.13665771484375, -1.0555419921875, -0.97442626953125, -0.893310546875, -0.81219482421875, -0.7310791015625, -0.64996337890625, -0.56884765625, -0.48773193359375, -0.4066162109375, -0.32550048828125, -0.244384765625, -0.16326904296875, -0.0821533203125, -0.00103759765625, 0.080078125, 0.16119384765625, 0.2423095703125, 0.32342529296875, 0.404541015625, 0.48565673828125, 0.5667724609375, 0.64788818359375, 0.72900390625, 0.81011962890625, 0.8912353515625, 0.97235107421875, 1.053466796875, 1.13458251953125, 1.2156982421875, 1.29681396484375, 1.3779296875, 1.45904541015625, 1.5401611328125, 1.62127685546875, 1.702392578125, 1.78350830078125, 1.8646240234375, 1.94573974609375, 2.02685546875, 2.10797119140625, 2.1890869140625, 2.27020263671875, 2.351318359375, 2.43243408203125, 2.5135498046875, 2.59466552734375, 2.67578125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 7.0, 12.0, 24.0, 54.0, 70.0, 131.0, 160.0, 184.0, 135.0, 105.0, 66.0, 25.0, 16.0, 10.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.0424747467041, -24.178417205810547, -23.31435775756836, -22.450300216674805, -21.58624267578125, -20.722183227539062, -19.858125686645508, -18.994068145751953, -18.1300106048584, -17.265953063964844, -16.401893615722656, -15.537836074829102, -14.673778533935547, -13.809720039367676, -12.945661544799805, -12.08160400390625, -11.217545509338379, -10.353487014770508, -9.489429473876953, -8.625370979309082, -7.761313438415527, -6.897254943847656, -6.033196926116943, -5.1691389083862305, -4.305080890655518, -3.4410228729248047, -2.576964855194092, -1.7129065990447998, -0.8488485813140869, 0.015209674835205078, 0.879267692565918, 1.7433257102966309, 2.6073837280273438, 3.4714417457580566, 4.3354997634887695, 5.199558258056641, 6.063615798950195, 6.927674293518066, 7.791732311248779, 8.655790328979492, 9.519847869873047, 10.383906364440918, 11.247963905334473, 12.112022399902344, 12.976079940795898, 13.84013843536377, 14.70419692993164, 15.568254470825195, 16.43231201171875, 17.296369552612305, 18.160429000854492, 19.024486541748047, 19.8885440826416, 20.752601623535156, 21.616661071777344, 22.4807186126709, 23.344778060913086, 24.20883560180664, 25.072895050048828, 25.936952590942383, 26.801010131835938, 27.665069580078125, 28.52912712097168, 29.393184661865234, 30.25724220275879]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 8.0, 8.0, 12.0, 14.0, 13.0, 10.0, 16.0, 16.0, 14.0, 17.0, 20.0, 17.0, 28.0, 33.0, 35.0, 27.0, 39.0, 42.0, 34.0, 40.0, 37.0, 27.0, 39.0, 35.0, 29.0, 35.0, 31.0, 43.0, 26.0, 27.0, 21.0, 24.0, 23.0, 26.0, 18.0, 18.0, 12.0, 10.0, 10.0, 8.0, 6.0, 12.0, 6.0, 6.0, 4.0, 2.0, 5.0, 4.0, 0.0, 5.0, 0.0, 1.0], "bins": [-8.33156967163086, -8.085251808166504, -7.838934421539307, -7.592616558074951, -7.346298694610596, -7.099981307983398, -6.853663444519043, -6.6073455810546875, -6.361027717590332, -6.114709854125977, -5.868392467498779, -5.622074604034424, -5.375756740570068, -5.129439353942871, -4.883121490478516, -4.63680362701416, -4.390485763549805, -4.144167900085449, -3.897850275039673, -3.6515326499938965, -3.405214786529541, -3.1588971614837646, -2.9125795364379883, -2.666261672973633, -2.4199442863464355, -2.173626661300659, -1.9273087978363037, -1.6809911727905273, -1.4346733093261719, -1.1883556842803955, -0.9420379400253296, -0.6957201957702637, -0.4494023323059082, -0.20308460295200348, 0.043233126401901245, 0.2895508408546448, 0.5358685851097107, 0.7821862697601318, 1.0285040140151978, 1.2748217582702637, 1.5211395025253296, 1.7674572467803955, 2.013774871826172, 2.2600927352905273, 2.5064103603363037, 2.75272798538208, 2.9990458488464355, 3.245363712310791, 3.4916813373565674, 3.7379989624023438, 3.984316825866699, 4.230634689331055, 4.476952075958252, 4.723269939422607, 4.969587802886963, 5.21590518951416, 5.462223052978516, 5.708540916442871, 5.954858303070068, 6.201176166534424, 6.447494029998779, 6.693811416625977, 6.940129280090332, 7.1864471435546875, 7.432765007019043]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 14.0, 10.0, 22.0, 25.0, 36.0, 35.0, 62.0, 90.0, 150.0, 188.0, 337.0, 536.0, 820.0, 1355.0, 2294.0, 4023.0, 6886.0, 12077.0, 22398.0, 44646.0, 124769.0, 477713.0, 224612.0, 60743.0, 28859.0, 15217.0, 8485.0, 4851.0, 2843.0, 1751.0, 965.0, 612.0, 349.0, 238.0, 155.0, 128.0, 87.0, 47.0, 46.0, 18.0, 17.0, 10.0, 8.0, 7.0, 7.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.23828125, -4.09552001953125, -3.9527587890625, -3.80999755859375, -3.667236328125, -3.52447509765625, -3.3817138671875, -3.23895263671875, -3.09619140625, -2.95343017578125, -2.8106689453125, -2.66790771484375, -2.525146484375, -2.38238525390625, -2.2396240234375, -2.09686279296875, -1.9541015625, -1.81134033203125, -1.6685791015625, -1.52581787109375, -1.383056640625, -1.24029541015625, -1.0975341796875, -0.95477294921875, -0.81201171875, -0.66925048828125, -0.5264892578125, -0.38372802734375, -0.240966796875, -0.09820556640625, 0.0445556640625, 0.18731689453125, 0.330078125, 0.47283935546875, 0.6156005859375, 0.75836181640625, 0.901123046875, 1.04388427734375, 1.1866455078125, 1.32940673828125, 1.47216796875, 1.61492919921875, 1.7576904296875, 1.90045166015625, 2.043212890625, 2.18597412109375, 2.3287353515625, 2.47149658203125, 2.6142578125, 2.75701904296875, 2.8997802734375, 3.04254150390625, 3.185302734375, 3.32806396484375, 3.4708251953125, 3.61358642578125, 3.75634765625, 3.89910888671875, 4.0418701171875, 4.18463134765625, 4.327392578125, 4.47015380859375, 4.6129150390625, 4.75567626953125, 4.8984375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 9.0, 8.0, 13.0, 6.0, 9.0, 18.0, 23.0, 23.0, 32.0, 36.0, 38.0, 46.0, 60.0, 52.0, 53.0, 59.0, 56.0, 56.0, 59.0, 56.0, 44.0, 46.0, 47.0, 38.0, 31.0, 21.0, 18.0, 12.0, 9.0, 10.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1572265625, -1.1114959716796875, -1.065765380859375, -1.0200347900390625, -0.97430419921875, -0.9285736083984375, -0.882843017578125, -0.8371124267578125, -0.7913818359375, -0.7456512451171875, -0.699920654296875, -0.6541900634765625, -0.60845947265625, -0.5627288818359375, -0.516998291015625, -0.4712677001953125, -0.425537109375, -0.3798065185546875, -0.334075927734375, -0.2883453369140625, -0.24261474609375, -0.1968841552734375, -0.151153564453125, -0.1054229736328125, -0.0596923828125, -0.0139617919921875, 0.031768798828125, 0.0774993896484375, 0.12322998046875, 0.1689605712890625, 0.214691162109375, 0.2604217529296875, 0.30615234375, 0.3518829345703125, 0.397613525390625, 0.4433441162109375, 0.48907470703125, 0.5348052978515625, 0.580535888671875, 0.6262664794921875, 0.6719970703125, 0.7177276611328125, 0.763458251953125, 0.8091888427734375, 0.85491943359375, 0.9006500244140625, 0.946380615234375, 0.9921112060546875, 1.037841796875, 1.0835723876953125, 1.129302978515625, 1.1750335693359375, 1.22076416015625, 1.2664947509765625, 1.312225341796875, 1.3579559326171875, 1.4036865234375, 1.4494171142578125, 1.495147705078125, 1.5408782958984375, 1.58660888671875, 1.6323394775390625, 1.678070068359375, 1.7238006591796875, 1.76953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 2.0, 2.0, 2.0, 1.0, 11.0, 8.0, 19.0, 10.0, 30.0, 43.0, 61.0, 90.0, 139.0, 226.0, 359.0, 720.0, 1527.0, 3209.0, 7481.0, 17868.0, 44741.0, 230119.0, 630112.0, 67507.0, 25379.0, 10305.0, 4429.0, 1909.0, 925.0, 532.0, 281.0, 166.0, 104.0, 65.0, 47.0, 37.0, 29.0, 21.0, 11.0, 6.0, 9.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.20703125, -6.96832275390625, -6.7296142578125, -6.49090576171875, -6.252197265625, -6.01348876953125, -5.7747802734375, -5.53607177734375, -5.29736328125, -5.05865478515625, -4.8199462890625, -4.58123779296875, -4.342529296875, -4.10382080078125, -3.8651123046875, -3.62640380859375, -3.3876953125, -3.14898681640625, -2.9102783203125, -2.67156982421875, -2.432861328125, -2.19415283203125, -1.9554443359375, -1.71673583984375, -1.47802734375, -1.23931884765625, -1.0006103515625, -0.76190185546875, -0.523193359375, -0.28448486328125, -0.0457763671875, 0.19293212890625, 0.431640625, 0.67034912109375, 0.9090576171875, 1.14776611328125, 1.386474609375, 1.62518310546875, 1.8638916015625, 2.10260009765625, 2.34130859375, 2.58001708984375, 2.8187255859375, 3.05743408203125, 3.296142578125, 3.53485107421875, 3.7735595703125, 4.01226806640625, 4.2509765625, 4.48968505859375, 4.7283935546875, 4.96710205078125, 5.205810546875, 5.44451904296875, 5.6832275390625, 5.92193603515625, 6.16064453125, 6.39935302734375, 6.6380615234375, 6.87677001953125, 7.115478515625, 7.35418701171875, 7.5928955078125, 7.83160400390625, 8.0703125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 4.0, 5.0, 3.0, 12.0, 12.0, 17.0, 32.0, 21.0, 37.0, 35.0, 55.0, 33.0, 55.0, 74.0, 63.0, 73.0, 69.0, 54.0, 66.0, 65.0, 35.0, 30.0, 26.0, 30.0, 16.0, 15.0, 10.0, 14.0, 5.0, 7.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.453125, -6.22943115234375, -6.0057373046875, -5.78204345703125, -5.558349609375, -5.33465576171875, -5.1109619140625, -4.88726806640625, -4.66357421875, -4.43988037109375, -4.2161865234375, -3.99249267578125, -3.768798828125, -3.54510498046875, -3.3214111328125, -3.09771728515625, -2.8740234375, -2.65032958984375, -2.4266357421875, -2.20294189453125, -1.979248046875, -1.75555419921875, -1.5318603515625, -1.30816650390625, -1.08447265625, -0.86077880859375, -0.6370849609375, -0.41339111328125, -0.189697265625, 0.03399658203125, 0.2576904296875, 0.48138427734375, 0.705078125, 0.92877197265625, 1.1524658203125, 1.37615966796875, 1.599853515625, 1.82354736328125, 2.0472412109375, 2.27093505859375, 2.49462890625, 2.71832275390625, 2.9420166015625, 3.16571044921875, 3.389404296875, 3.61309814453125, 3.8367919921875, 4.06048583984375, 4.2841796875, 4.50787353515625, 4.7315673828125, 4.95526123046875, 5.178955078125, 5.40264892578125, 5.6263427734375, 5.85003662109375, 6.07373046875, 6.29742431640625, 6.5211181640625, 6.74481201171875, 6.968505859375, 7.19219970703125, 7.4158935546875, 7.63958740234375, 7.86328125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 4.0, 12.0, 15.0, 24.0, 59.0, 89.0, 151.0, 307.0, 561.0, 1055.0, 2404.0, 5432.0, 13626.0, 36147.0, 116073.0, 648559.0, 153305.0, 43176.0, 15875.0, 6357.0, 2792.0, 1228.0, 591.0, 327.0, 163.0, 95.0, 53.0, 32.0, 15.0, 9.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.525390625, -3.42041015625, -3.3154296875, -3.21044921875, -3.10546875, -3.00048828125, -2.8955078125, -2.79052734375, -2.685546875, -2.58056640625, -2.4755859375, -2.37060546875, -2.265625, -2.16064453125, -2.0556640625, -1.95068359375, -1.845703125, -1.74072265625, -1.6357421875, -1.53076171875, -1.42578125, -1.32080078125, -1.2158203125, -1.11083984375, -1.005859375, -0.90087890625, -0.7958984375, -0.69091796875, -0.5859375, -0.48095703125, -0.3759765625, -0.27099609375, -0.166015625, -0.06103515625, 0.0439453125, 0.14892578125, 0.25390625, 0.35888671875, 0.4638671875, 0.56884765625, 0.673828125, 0.77880859375, 0.8837890625, 0.98876953125, 1.09375, 1.19873046875, 1.3037109375, 1.40869140625, 1.513671875, 1.61865234375, 1.7236328125, 1.82861328125, 1.93359375, 2.03857421875, 2.1435546875, 2.24853515625, 2.353515625, 2.45849609375, 2.5634765625, 2.66845703125, 2.7734375, 2.87841796875, 2.9833984375, 3.08837890625, 3.193359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 3.0, 2.0, 4.0, 6.0, 10.0, 7.0, 11.0, 20.0, 18.0, 25.0, 39.0, 102.0, 249.0, 250.0, 94.0, 40.0, 23.0, 20.0, 17.0, 15.0, 6.0, 12.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0011625289916992188, -0.0011319443583488464, -0.0011013597249984741, -0.0010707750916481018, -0.0010401904582977295, -0.0010096058249473572, -0.0009790211915969849, -0.0009484365582466125, -0.0009178519248962402, -0.0008872672915458679, -0.0008566826581954956, -0.0008260980248451233, -0.000795513391494751, -0.0007649287581443787, -0.0007343441247940063, -0.000703759491443634, -0.0006731748580932617, -0.0006425902247428894, -0.0006120055913925171, -0.0005814209580421448, -0.0005508363246917725, -0.0005202516913414001, -0.0004896670579910278, -0.0004590824246406555, -0.0004284977912902832, -0.0003979131579399109, -0.0003673285245895386, -0.00033674389123916626, -0.00030615925788879395, -0.00027557462453842163, -0.0002449899911880493, -0.000214405357837677, -0.0001838207244873047, -0.00015323609113693237, -0.00012265145778656006, -9.206682443618774e-05, -6.148219108581543e-05, -3.0897557735443115e-05, -3.129243850708008e-07, 3.0271708965301514e-05, 6.085634231567383e-05, 9.144097566604614e-05, 0.00012202560901641846, 0.00015261024236679077, 0.00018319487571716309, 0.0002137795090675354, 0.0002443641424179077, 0.00027494877576828003, 0.00030553340911865234, 0.00033611804246902466, 0.00036670267581939697, 0.0003972873091697693, 0.0004278719425201416, 0.0004584565758705139, 0.0004890412092208862, 0.0005196258425712585, 0.0005502104759216309, 0.0005807951092720032, 0.0006113797426223755, 0.0006419643759727478, 0.0006725490093231201, 0.0007031336426734924, 0.0007337182760238647, 0.0007643029093742371, 0.0007948875427246094]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 7.0, 14.0, 16.0, 40.0, 58.0, 127.0, 262.0, 651.0, 1769.0, 6604.0, 32369.0, 345985.0, 604680.0, 43918.0, 8568.0, 2134.0, 720.0, 311.0, 141.0, 73.0, 45.0, 23.0, 15.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83203125, -4.64678955078125, -4.4615478515625, -4.27630615234375, -4.091064453125, -3.90582275390625, -3.7205810546875, -3.53533935546875, -3.35009765625, -3.16485595703125, -2.9796142578125, -2.79437255859375, -2.609130859375, -2.42388916015625, -2.2386474609375, -2.05340576171875, -1.8681640625, -1.68292236328125, -1.4976806640625, -1.31243896484375, -1.127197265625, -0.94195556640625, -0.7567138671875, -0.57147216796875, -0.38623046875, -0.20098876953125, -0.0157470703125, 0.16949462890625, 0.354736328125, 0.53997802734375, 0.7252197265625, 0.91046142578125, 1.095703125, 1.28094482421875, 1.4661865234375, 1.65142822265625, 1.836669921875, 2.02191162109375, 2.2071533203125, 2.39239501953125, 2.57763671875, 2.76287841796875, 2.9481201171875, 3.13336181640625, 3.318603515625, 3.50384521484375, 3.6890869140625, 3.87432861328125, 4.0595703125, 4.24481201171875, 4.4300537109375, 4.61529541015625, 4.800537109375, 4.98577880859375, 5.1710205078125, 5.35626220703125, 5.54150390625, 5.72674560546875, 5.9119873046875, 6.09722900390625, 6.282470703125, 6.46771240234375, 6.6529541015625, 6.83819580078125, 7.0234375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 7.0, 8.0, 14.0, 14.0, 20.0, 28.0, 38.0, 70.0, 118.0, 197.0, 212.0, 109.0, 62.0, 42.0, 19.0, 9.0, 12.0, 6.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.9296875, -5.77362060546875, -5.6175537109375, -5.46148681640625, -5.305419921875, -5.14935302734375, -4.9932861328125, -4.83721923828125, -4.68115234375, -4.52508544921875, -4.3690185546875, -4.21295166015625, -4.056884765625, -3.90081787109375, -3.7447509765625, -3.58868408203125, -3.4326171875, -3.27655029296875, -3.1204833984375, -2.96441650390625, -2.808349609375, -2.65228271484375, -2.4962158203125, -2.34014892578125, -2.18408203125, -2.02801513671875, -1.8719482421875, -1.71588134765625, -1.559814453125, -1.40374755859375, -1.2476806640625, -1.09161376953125, -0.935546875, -0.77947998046875, -0.6234130859375, -0.46734619140625, -0.311279296875, -0.15521240234375, 0.0008544921875, 0.15692138671875, 0.31298828125, 0.46905517578125, 0.6251220703125, 0.78118896484375, 0.937255859375, 1.09332275390625, 1.2493896484375, 1.40545654296875, 1.5615234375, 1.71759033203125, 1.8736572265625, 2.02972412109375, 2.185791015625, 2.34185791015625, 2.4979248046875, 2.65399169921875, 2.81005859375, 2.96612548828125, 3.1221923828125, 3.27825927734375, 3.434326171875, 3.59039306640625, 3.7464599609375, 3.90252685546875, 4.05859375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 2.0, 5.0, 12.0, 24.0, 32.0, 67.0, 95.0, 140.0, 140.0, 147.0, 144.0, 98.0, 57.0, 20.0, 13.0, 6.0, 1.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.44891357421875, -36.419551849365234, -34.39019012451172, -32.36082458496094, -30.331462860107422, -28.302101135253906, -26.272737503051758, -24.24337387084961, -22.214012145996094, -20.184650421142578, -18.15528678894043, -16.12592315673828, -14.096561431884766, -12.067198753356934, -10.037836074829102, -8.00847339630127, -5.9791107177734375, -3.9497480392456055, -1.9203853607177734, 0.1089773178100586, 2.1383399963378906, 4.167702674865723, 6.197065353393555, 8.226428031921387, 10.255790710449219, 12.28515338897705, 14.314516067504883, 16.34387969970703, 18.373241424560547, 20.402603149414062, 22.43196678161621, 24.46133041381836, 26.490692138671875, 28.52005386352539, 30.54941749572754, 32.57878112792969, 34.6081428527832, 36.63750457763672, 38.6668701171875, 40.696231842041016, 42.72559356689453, 44.75495529174805, 46.78431701660156, 48.813682556152344, 50.84304428100586, 52.872406005859375, 54.901771545410156, 56.93113327026367, 58.96049499511719, 60.9898567199707, 63.01921844482422, 65.048583984375, 67.07794189453125, 69.10730743408203, 71.13667297363281, 73.16603088378906, 75.19539642333984, 77.22476196289062, 79.25411987304688, 81.28348541259766, 83.31285095214844, 85.34220886230469, 87.37157440185547, 89.40093231201172, 91.4302978515625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 6.0, 10.0, 6.0, 8.0, 7.0, 19.0, 14.0, 19.0, 19.0, 24.0, 33.0, 26.0, 27.0, 34.0, 35.0, 35.0, 36.0, 53.0, 32.0, 37.0, 43.0, 28.0, 41.0, 47.0, 42.0, 27.0, 30.0, 33.0, 24.0, 24.0, 28.0, 19.0, 21.0, 16.0, 15.0, 11.0, 6.0, 8.0, 5.0, 8.0, 6.0, 8.0, 3.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.90359115600586, -22.145753860473633, -21.387914657592773, -20.630077362060547, -19.87224006652832, -19.114402770996094, -18.356563568115234, -17.598726272583008, -16.84088897705078, -16.083051681518555, -15.325213432312012, -14.567375183105469, -13.809537887573242, -13.0516996383667, -12.293861389160156, -11.53602409362793, -10.77818489074707, -10.020346641540527, -9.2625093460083, -8.504671096801758, -7.746833324432373, -6.988995552062988, -6.231157302856445, -5.4733195304870605, -4.715481758117676, -3.957643985748291, -3.199805974960327, -2.4419679641723633, -1.6841301918029785, -0.9262924194335938, -0.16845417022705078, 0.589383602142334, 1.3472232818603516, 2.1050610542297363, 2.8628990650177, 3.620737075805664, 4.378574848175049, 5.136412620544434, 5.894250869750977, 6.652088642120361, 7.409926414489746, 8.167764663696289, 8.925601959228516, 9.683440208435059, 10.441278457641602, 11.199115753173828, 11.956954002380371, 12.714792251586914, 13.47262954711914, 14.230467796325684, 14.98830509185791, 15.746143341064453, 16.50398063659668, 17.261817932128906, 18.019657135009766, 18.777494430541992, 19.53533172607422, 20.293169021606445, 21.051008224487305, 21.80884552001953, 22.566682815551758, 23.324520111083984, 24.082359313964844, 24.84019660949707, 25.59803581237793]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 12.0, 20.0, 24.0, 20.0, 37.0, 65.0, 74.0, 121.0, 225.0, 368.0, 532.0, 928.0, 1603.0, 2787.0, 5321.0, 10740.0, 24023.0, 62826.0, 223818.0, 3096346.0, 584195.0, 110670.0, 37200.0, 15631.0, 7461.0, 3819.0, 2065.0, 1224.0, 747.0, 466.0, 292.0, 195.0, 139.0, 84.0, 63.0, 33.0, 32.0, 20.0, 11.0, 7.0, 12.0, 5.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1875, -5.98626708984375, -5.7850341796875, -5.58380126953125, -5.382568359375, -5.18133544921875, -4.9801025390625, -4.77886962890625, -4.57763671875, -4.37640380859375, -4.1751708984375, -3.97393798828125, -3.772705078125, -3.57147216796875, -3.3702392578125, -3.16900634765625, -2.9677734375, -2.76654052734375, -2.5653076171875, -2.36407470703125, -2.162841796875, -1.96160888671875, -1.7603759765625, -1.55914306640625, -1.35791015625, -1.15667724609375, -0.9554443359375, -0.75421142578125, -0.552978515625, -0.35174560546875, -0.1505126953125, 0.05072021484375, 0.251953125, 0.45318603515625, 0.6544189453125, 0.85565185546875, 1.056884765625, 1.25811767578125, 1.4593505859375, 1.66058349609375, 1.86181640625, 2.06304931640625, 2.2642822265625, 2.46551513671875, 2.666748046875, 2.86798095703125, 3.0692138671875, 3.27044677734375, 3.4716796875, 3.67291259765625, 3.8741455078125, 4.07537841796875, 4.276611328125, 4.47784423828125, 4.6790771484375, 4.88031005859375, 5.08154296875, 5.28277587890625, 5.4840087890625, 5.68524169921875, 5.886474609375, 6.08770751953125, 6.2889404296875, 6.49017333984375, 6.69140625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 15.0, 9.0, 16.0, 13.0, 21.0, 19.0, 38.0, 31.0, 48.0, 44.0, 49.0, 43.0, 67.0, 57.0, 50.0, 73.0, 50.0, 43.0, 50.0, 36.0, 48.0, 36.0, 30.0, 28.0, 15.0, 13.0, 10.0, 10.0, 6.0, 7.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1064453125, -1.0593414306640625, -1.012237548828125, -0.9651336669921875, -0.91802978515625, -0.8709259033203125, -0.823822021484375, -0.7767181396484375, -0.7296142578125, -0.6825103759765625, -0.635406494140625, -0.5883026123046875, -0.54119873046875, -0.4940948486328125, -0.446990966796875, -0.3998870849609375, -0.352783203125, -0.3056793212890625, -0.258575439453125, -0.2114715576171875, -0.16436767578125, -0.1172637939453125, -0.070159912109375, -0.0230560302734375, 0.0240478515625, 0.0711517333984375, 0.118255615234375, 0.1653594970703125, 0.21246337890625, 0.2595672607421875, 0.306671142578125, 0.3537750244140625, 0.40087890625, 0.4479827880859375, 0.495086669921875, 0.5421905517578125, 0.58929443359375, 0.6363983154296875, 0.683502197265625, 0.7306060791015625, 0.7777099609375, 0.8248138427734375, 0.871917724609375, 0.9190216064453125, 0.96612548828125, 1.0132293701171875, 1.060333251953125, 1.1074371337890625, 1.154541015625, 1.2016448974609375, 1.248748779296875, 1.2958526611328125, 1.34295654296875, 1.3900604248046875, 1.437164306640625, 1.4842681884765625, 1.5313720703125, 1.5784759521484375, 1.625579833984375, 1.6726837158203125, 1.71978759765625, 1.7668914794921875, 1.813995361328125, 1.8610992431640625, 1.908203125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 18.0, 25.0, 30.0, 61.0, 117.0, 190.0, 276.0, 545.0, 828.0, 1644.0, 3103.0, 6831.0, 16272.0, 47463.0, 181875.0, 2711887.0, 1027852.0, 131910.0, 37880.0, 13719.0, 5724.0, 2759.0, 1356.0, 771.0, 463.0, 277.0, 144.0, 97.0, 71.0, 37.0, 24.0, 10.0, 12.0, 3.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.61328125, -7.34979248046875, -7.0863037109375, -6.82281494140625, -6.559326171875, -6.29583740234375, -6.0323486328125, -5.76885986328125, -5.50537109375, -5.24188232421875, -4.9783935546875, -4.71490478515625, -4.451416015625, -4.18792724609375, -3.9244384765625, -3.66094970703125, -3.3974609375, -3.13397216796875, -2.8704833984375, -2.60699462890625, -2.343505859375, -2.08001708984375, -1.8165283203125, -1.55303955078125, -1.28955078125, -1.02606201171875, -0.7625732421875, -0.49908447265625, -0.235595703125, 0.02789306640625, 0.2913818359375, 0.55487060546875, 0.818359375, 1.08184814453125, 1.3453369140625, 1.60882568359375, 1.872314453125, 2.13580322265625, 2.3992919921875, 2.66278076171875, 2.92626953125, 3.18975830078125, 3.4532470703125, 3.71673583984375, 3.980224609375, 4.24371337890625, 4.5072021484375, 4.77069091796875, 5.0341796875, 5.29766845703125, 5.5611572265625, 5.82464599609375, 6.088134765625, 6.35162353515625, 6.6151123046875, 6.87860107421875, 7.14208984375, 7.40557861328125, 7.6690673828125, 7.93255615234375, 8.196044921875, 8.45953369140625, 8.7230224609375, 8.98651123046875, 9.25]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 7.0, 8.0, 15.0, 21.0, 31.0, 55.0, 87.0, 117.0, 213.0, 438.0, 1624.0, 690.0, 289.0, 148.0, 88.0, 67.0, 49.0, 35.0, 23.0, 15.0, 13.0, 7.0, 7.0, 6.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.609375, -3.4837646484375, -3.358154296875, -3.2325439453125, -3.10693359375, -2.9813232421875, -2.855712890625, -2.7301025390625, -2.6044921875, -2.4788818359375, -2.353271484375, -2.2276611328125, -2.10205078125, -1.9764404296875, -1.850830078125, -1.7252197265625, -1.599609375, -1.4739990234375, -1.348388671875, -1.2227783203125, -1.09716796875, -0.9715576171875, -0.845947265625, -0.7203369140625, -0.5947265625, -0.4691162109375, -0.343505859375, -0.2178955078125, -0.09228515625, 0.0333251953125, 0.158935546875, 0.2845458984375, 0.41015625, 0.5357666015625, 0.661376953125, 0.7869873046875, 0.91259765625, 1.0382080078125, 1.163818359375, 1.2894287109375, 1.4150390625, 1.5406494140625, 1.666259765625, 1.7918701171875, 1.91748046875, 2.0430908203125, 2.168701171875, 2.2943115234375, 2.419921875, 2.5455322265625, 2.671142578125, 2.7967529296875, 2.92236328125, 3.0479736328125, 3.173583984375, 3.2991943359375, 3.4248046875, 3.5504150390625, 3.676025390625, 3.8016357421875, 3.92724609375, 4.0528564453125, 4.178466796875, 4.3040771484375, 4.4296875]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 21.0, 67.0, 140.0, 275.0, 254.0, 148.0, 65.0, 22.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.699344635009766, -39.0065803527832, -37.31381607055664, -35.62105178833008, -33.92829132080078, -32.23552703857422, -30.542762756347656, -28.849998474121094, -27.15723419189453, -25.46446990966797, -23.771705627441406, -22.078943252563477, -20.386178970336914, -18.69341468811035, -17.000652313232422, -15.30788803100586, -13.615123748779297, -11.922359466552734, -10.229596138000488, -8.536832809448242, -6.84406852722168, -5.151304244995117, -3.458540916442871, -1.765777587890625, -0.0730133056640625, 1.6197504997253418, 3.312514305114746, 5.00527811050415, 6.698041915893555, 8.390806198120117, 10.083569526672363, 11.77633285522461, 13.469100952148438, 15.161865234375, 16.854629516601562, 18.547391891479492, 20.240156173706055, 21.932920455932617, 23.625682830810547, 25.31844711303711, 27.011211395263672, 28.703975677490234, 30.396739959716797, 32.08950424194336, 33.782264709472656, 35.47502899169922, 37.16779327392578, 38.860557556152344, 40.553321838378906, 42.24608612060547, 43.93885040283203, 45.631614685058594, 47.324378967285156, 49.01714324951172, 50.709903717041016, 52.40266799926758, 54.09543228149414, 55.7881965637207, 57.480960845947266, 59.17372512817383, 60.866485595703125, 62.55924987792969, 64.25201416015625, 65.94477844238281, 67.63754272460938]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 10.0, 13.0, 17.0, 22.0, 19.0, 25.0, 42.0, 46.0, 53.0, 54.0, 53.0, 67.0, 60.0, 59.0, 73.0, 59.0, 53.0, 57.0, 49.0, 41.0, 36.0, 22.0, 25.0, 22.0, 6.0, 2.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.989720344543457, -14.430143356323242, -13.870567321777344, -13.310990333557129, -12.751413345336914, -12.191837310791016, -11.6322603225708, -11.072683334350586, -10.513107299804688, -9.953530311584473, -9.393954277038574, -8.83437728881836, -8.274800300598145, -7.715223789215088, -7.155647277832031, -6.596070289611816, -6.036493301391602, -5.476916790008545, -4.91733980178833, -4.357763290405273, -3.7981865406036377, -3.238609790802002, -2.6790332794189453, -2.1194565296173096, -1.5598797798156738, -1.000303030014038, -0.4407263994216919, 0.1188502311706543, 0.67842698097229, 1.2380037307739258, 1.7975802421569824, 2.357156991958618, 2.9167346954345703, 3.476311445236206, 4.035888195037842, 4.595464706420898, 5.155041694641113, 5.71461820602417, 6.274194717407227, 6.833771705627441, 7.393348217010498, 7.952924728393555, 8.51250171661377, 9.072078704833984, 9.631654739379883, 10.191231727600098, 10.750808715820312, 11.310384750366211, 11.869961738586426, 12.42953872680664, 12.989114761352539, 13.548691749572754, 14.108268737792969, 14.667844772338867, 15.227421760559082, 15.786998748779297, 16.346574783325195, 16.906150817871094, 17.465728759765625, 18.025304794311523, 18.584880828857422, 19.144458770751953, 19.70403480529785, 20.26361083984375, 20.82318878173828]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 14.0, 12.0, 30.0, 47.0, 86.0, 131.0, 189.0, 327.0, 595.0, 1146.0, 2030.0, 3989.0, 7780.0, 15782.0, 30580.0, 57972.0, 108948.0, 229863.0, 294794.0, 140030.0, 73343.0, 39595.0, 20343.0, 10238.0, 5055.0, 2586.0, 1354.0, 693.0, 387.0, 245.0, 133.0, 92.0, 56.0, 41.0, 21.0, 11.0, 6.0, 7.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.51953125, -4.36981201171875, -4.2200927734375, -4.07037353515625, -3.920654296875, -3.77093505859375, -3.6212158203125, -3.47149658203125, -3.32177734375, -3.17205810546875, -3.0223388671875, -2.87261962890625, -2.722900390625, -2.57318115234375, -2.4234619140625, -2.27374267578125, -2.1240234375, -1.97430419921875, -1.8245849609375, -1.67486572265625, -1.525146484375, -1.37542724609375, -1.2257080078125, -1.07598876953125, -0.92626953125, -0.77655029296875, -0.6268310546875, -0.47711181640625, -0.327392578125, -0.17767333984375, -0.0279541015625, 0.12176513671875, 0.271484375, 0.42120361328125, 0.5709228515625, 0.72064208984375, 0.870361328125, 1.02008056640625, 1.1697998046875, 1.31951904296875, 1.46923828125, 1.61895751953125, 1.7686767578125, 1.91839599609375, 2.068115234375, 2.21783447265625, 2.3675537109375, 2.51727294921875, 2.6669921875, 2.81671142578125, 2.9664306640625, 3.11614990234375, 3.265869140625, 3.41558837890625, 3.5653076171875, 3.71502685546875, 3.86474609375, 4.01446533203125, 4.1641845703125, 4.31390380859375, 4.463623046875, 4.61334228515625, 4.7630615234375, 4.91278076171875, 5.0625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 2.0, 11.0, 9.0, 7.0, 14.0, 14.0, 18.0, 24.0, 22.0, 32.0, 27.0, 45.0, 34.0, 45.0, 50.0, 42.0, 46.0, 44.0, 63.0, 46.0, 54.0, 60.0, 51.0, 22.0, 34.0, 28.0, 30.0, 18.0, 20.0, 15.0, 16.0, 15.0, 7.0, 9.0, 4.0, 7.0, 4.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2265625, -1.1812896728515625, -1.136016845703125, -1.0907440185546875, -1.04547119140625, -1.0001983642578125, -0.954925537109375, -0.9096527099609375, -0.8643798828125, -0.8191070556640625, -0.773834228515625, -0.7285614013671875, -0.68328857421875, -0.6380157470703125, -0.592742919921875, -0.5474700927734375, -0.502197265625, -0.4569244384765625, -0.411651611328125, -0.3663787841796875, -0.32110595703125, -0.2758331298828125, -0.230560302734375, -0.1852874755859375, -0.1400146484375, -0.0947418212890625, -0.049468994140625, -0.0041961669921875, 0.04107666015625, 0.0863494873046875, 0.131622314453125, 0.1768951416015625, 0.22216796875, 0.2674407958984375, 0.312713623046875, 0.3579864501953125, 0.40325927734375, 0.4485321044921875, 0.493804931640625, 0.5390777587890625, 0.5843505859375, 0.6296234130859375, 0.674896240234375, 0.7201690673828125, 0.76544189453125, 0.8107147216796875, 0.855987548828125, 0.9012603759765625, 0.946533203125, 0.9918060302734375, 1.037078857421875, 1.0823516845703125, 1.12762451171875, 1.1728973388671875, 1.218170166015625, 1.2634429931640625, 1.3087158203125, 1.3539886474609375, 1.399261474609375, 1.4445343017578125, 1.48980712890625, 1.5350799560546875, 1.580352783203125, 1.6256256103515625, 1.6708984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 7.0, 18.0, 19.0, 30.0, 55.0, 65.0, 102.0, 151.0, 226.0, 356.0, 556.0, 1074.0, 2752.0, 12265.0, 98630.0, 694053.0, 205105.0, 25454.0, 4269.0, 1421.0, 740.0, 406.0, 249.0, 164.0, 109.0, 74.0, 60.0, 34.0, 16.0, 17.0, 19.0, 10.0, 1.0, 5.0, 6.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.679443359375, -11.24169921875, -10.803955078125, -10.3662109375, -9.928466796875, -9.49072265625, -9.052978515625, -8.615234375, -8.177490234375, -7.73974609375, -7.302001953125, -6.8642578125, -6.426513671875, -5.98876953125, -5.551025390625, -5.11328125, -4.675537109375, -4.23779296875, -3.800048828125, -3.3623046875, -2.924560546875, -2.48681640625, -2.049072265625, -1.611328125, -1.173583984375, -0.73583984375, -0.298095703125, 0.1396484375, 0.577392578125, 1.01513671875, 1.452880859375, 1.890625, 2.328369140625, 2.76611328125, 3.203857421875, 3.6416015625, 4.079345703125, 4.51708984375, 4.954833984375, 5.392578125, 5.830322265625, 6.26806640625, 6.705810546875, 7.1435546875, 7.581298828125, 8.01904296875, 8.456787109375, 8.89453125, 9.332275390625, 9.77001953125, 10.207763671875, 10.6455078125, 11.083251953125, 11.52099609375, 11.958740234375, 12.396484375, 12.834228515625, 13.27197265625, 13.709716796875, 14.1474609375, 14.585205078125, 15.02294921875, 15.460693359375, 15.8984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 2.0, 9.0, 11.0, 7.0, 3.0, 13.0, 16.0, 16.0, 18.0, 14.0, 28.0, 34.0, 31.0, 36.0, 53.0, 52.0, 54.0, 54.0, 50.0, 60.0, 74.0, 52.0, 34.0, 42.0, 37.0, 32.0, 26.0, 29.0, 16.0, 31.0, 15.0, 15.0, 6.0, 8.0, 5.0, 6.0, 2.0, 5.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.53515625, -6.28314208984375, -6.0311279296875, -5.77911376953125, -5.527099609375, -5.27508544921875, -5.0230712890625, -4.77105712890625, -4.51904296875, -4.26702880859375, -4.0150146484375, -3.76300048828125, -3.510986328125, -3.25897216796875, -3.0069580078125, -2.75494384765625, -2.5029296875, -2.25091552734375, -1.9989013671875, -1.74688720703125, -1.494873046875, -1.24285888671875, -0.9908447265625, -0.73883056640625, -0.48681640625, -0.23480224609375, 0.0172119140625, 0.26922607421875, 0.521240234375, 0.77325439453125, 1.0252685546875, 1.27728271484375, 1.529296875, 1.78131103515625, 2.0333251953125, 2.28533935546875, 2.537353515625, 2.78936767578125, 3.0413818359375, 3.29339599609375, 3.54541015625, 3.79742431640625, 4.0494384765625, 4.30145263671875, 4.553466796875, 4.80548095703125, 5.0574951171875, 5.30950927734375, 5.5615234375, 5.81353759765625, 6.0655517578125, 6.31756591796875, 6.569580078125, 6.82159423828125, 7.0736083984375, 7.32562255859375, 7.57763671875, 7.82965087890625, 8.0816650390625, 8.33367919921875, 8.585693359375, 8.83770751953125, 9.0897216796875, 9.34173583984375, 9.59375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 2.0, 5.0, 7.0, 11.0, 14.0, 11.0, 30.0, 42.0, 99.0, 161.0, 393.0, 1018.0, 3061.0, 12482.0, 74637.0, 603511.0, 298016.0, 43457.0, 8081.0, 2147.0, 743.0, 306.0, 140.0, 64.0, 44.0, 24.0, 13.0, 3.0, 11.0, 7.0, 4.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.40625, -8.17181396484375, -7.9373779296875, -7.70294189453125, -7.468505859375, -7.23406982421875, -6.9996337890625, -6.76519775390625, -6.53076171875, -6.29632568359375, -6.0618896484375, -5.82745361328125, -5.593017578125, -5.35858154296875, -5.1241455078125, -4.88970947265625, -4.6552734375, -4.42083740234375, -4.1864013671875, -3.95196533203125, -3.717529296875, -3.48309326171875, -3.2486572265625, -3.01422119140625, -2.77978515625, -2.54534912109375, -2.3109130859375, -2.07647705078125, -1.842041015625, -1.60760498046875, -1.3731689453125, -1.13873291015625, -0.904296875, -0.66986083984375, -0.4354248046875, -0.20098876953125, 0.033447265625, 0.26788330078125, 0.5023193359375, 0.73675537109375, 0.97119140625, 1.20562744140625, 1.4400634765625, 1.67449951171875, 1.908935546875, 2.14337158203125, 2.3778076171875, 2.61224365234375, 2.8466796875, 3.08111572265625, 3.3155517578125, 3.54998779296875, 3.784423828125, 4.01885986328125, 4.2532958984375, 4.48773193359375, 4.72216796875, 4.95660400390625, 5.1910400390625, 5.42547607421875, 5.659912109375, 5.89434814453125, 6.1287841796875, 6.36322021484375, 6.59765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 8.0, 9.0, 8.0, 5.0, 9.0, 12.0, 10.0, 17.0, 23.0, 35.0, 38.0, 38.0, 39.0, 51.0, 92.0, 156.0, 153.0, 65.0, 38.0, 38.0, 29.0, 30.0, 18.0, 7.0, 14.0, 8.0, 9.0, 6.0, 7.0, 4.0, 8.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0011463165283203125, -0.001116037368774414, -0.0010857582092285156, -0.0010554790496826172, -0.0010251998901367188, -0.0009949207305908203, -0.0009646415710449219, -0.0009343624114990234, -0.000904083251953125, -0.0008738040924072266, -0.0008435249328613281, -0.0008132457733154297, -0.0007829666137695312, -0.0007526874542236328, -0.0007224082946777344, -0.0006921291351318359, -0.0006618499755859375, -0.0006315708160400391, -0.0006012916564941406, -0.0005710124969482422, -0.0005407333374023438, -0.0005104541778564453, -0.0004801750183105469, -0.00044989585876464844, -0.00041961669921875, -0.00038933753967285156, -0.0003590583801269531, -0.0003287792205810547, -0.00029850006103515625, -0.0002682209014892578, -0.00023794174194335938, -0.00020766258239746094, -0.0001773834228515625, -0.00014710426330566406, -0.00011682510375976562, -8.654594421386719e-05, -5.626678466796875e-05, -2.5987625122070312e-05, 4.291534423828125e-06, 3.457069396972656e-05, 6.4849853515625e-05, 9.512901306152344e-05, 0.00012540817260742188, 0.0001556873321533203, 0.00018596649169921875, 0.0002162456512451172, 0.0002465248107910156, 0.00027680397033691406, 0.0003070831298828125, 0.00033736228942871094, 0.0003676414489746094, 0.0003979206085205078, 0.00042819976806640625, 0.0004584789276123047, 0.0004887580871582031, 0.0005190372467041016, 0.00054931640625, 0.0005795955657958984, 0.0006098747253417969, 0.0006401538848876953, 0.0006704330444335938, 0.0007007122039794922, 0.0007309913635253906, 0.0007612705230712891, 0.0007915496826171875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 12.0, 13.0, 23.0, 37.0, 47.0, 97.0, 177.0, 297.0, 635.0, 1481.0, 5784.0, 51151.0, 695683.0, 267940.0, 19947.0, 3189.0, 998.0, 457.0, 232.0, 147.0, 76.0, 46.0, 30.0, 18.0, 9.0, 9.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.03125, -10.72314453125, -10.4150390625, -10.10693359375, -9.798828125, -9.49072265625, -9.1826171875, -8.87451171875, -8.56640625, -8.25830078125, -7.9501953125, -7.64208984375, -7.333984375, -7.02587890625, -6.7177734375, -6.40966796875, -6.1015625, -5.79345703125, -5.4853515625, -5.17724609375, -4.869140625, -4.56103515625, -4.2529296875, -3.94482421875, -3.63671875, -3.32861328125, -3.0205078125, -2.71240234375, -2.404296875, -2.09619140625, -1.7880859375, -1.47998046875, -1.171875, -0.86376953125, -0.5556640625, -0.24755859375, 0.060546875, 0.36865234375, 0.6767578125, 0.98486328125, 1.29296875, 1.60107421875, 1.9091796875, 2.21728515625, 2.525390625, 2.83349609375, 3.1416015625, 3.44970703125, 3.7578125, 4.06591796875, 4.3740234375, 4.68212890625, 4.990234375, 5.29833984375, 5.6064453125, 5.91455078125, 6.22265625, 6.53076171875, 6.8388671875, 7.14697265625, 7.455078125, 7.76318359375, 8.0712890625, 8.37939453125, 8.6875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 11.0, 7.0, 13.0, 14.0, 18.0, 22.0, 29.0, 30.0, 40.0, 43.0, 62.0, 82.0, 104.0, 99.0, 102.0, 66.0, 62.0, 47.0, 21.0, 28.0, 22.0, 19.0, 20.0, 4.0, 11.0, 13.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.9676513671875, -3.810302734375, -3.6529541015625, -3.49560546875, -3.3382568359375, -3.180908203125, -3.0235595703125, -2.8662109375, -2.7088623046875, -2.551513671875, -2.3941650390625, -2.23681640625, -2.0794677734375, -1.922119140625, -1.7647705078125, -1.607421875, -1.4500732421875, -1.292724609375, -1.1353759765625, -0.97802734375, -0.8206787109375, -0.663330078125, -0.5059814453125, -0.3486328125, -0.1912841796875, -0.033935546875, 0.1234130859375, 0.28076171875, 0.4381103515625, 0.595458984375, 0.7528076171875, 0.91015625, 1.0675048828125, 1.224853515625, 1.3822021484375, 1.53955078125, 1.6968994140625, 1.854248046875, 2.0115966796875, 2.1689453125, 2.3262939453125, 2.483642578125, 2.6409912109375, 2.79833984375, 2.9556884765625, 3.113037109375, 3.2703857421875, 3.427734375, 3.5850830078125, 3.742431640625, 3.8997802734375, 4.05712890625, 4.2144775390625, 4.371826171875, 4.5291748046875, 4.6865234375, 4.8438720703125, 5.001220703125, 5.1585693359375, 5.31591796875, 5.4732666015625, 5.630615234375, 5.7879638671875, 5.9453125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 14.0, 50.0, 154.0, 254.0, 266.0, 170.0, 71.0, 20.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.91348266601562, -92.36012268066406, -87.8067626953125, -83.25340270996094, -78.70004272460938, -74.14668273925781, -69.59332275390625, -65.03996276855469, -60.486602783203125, -55.93324279785156, -51.3798828125, -46.82652282714844, -42.273162841796875, -37.71980285644531, -33.16644287109375, -28.613082885742188, -24.059722900390625, -19.506362915039062, -14.9530029296875, -10.399642944335938, -5.846282958984375, -1.2929229736328125, 3.26043701171875, 7.8137969970703125, 12.367156982421875, 16.920516967773438, 21.473876953125, 26.027236938476562, 30.580596923828125, 35.13395690917969, 39.68731689453125, 44.24067687988281, 48.79405212402344, 53.347412109375, 57.90077209472656, 62.454132080078125, 67.00749206542969, 71.56085205078125, 76.11421203613281, 80.66757202148438, 85.22093200683594, 89.7742919921875, 94.32765197753906, 98.88101196289062, 103.43437194824219, 107.98773193359375, 112.54109191894531, 117.09445190429688, 121.64781188964844, 126.201171875, 130.75453186035156, 135.30789184570312, 139.8612518310547, 144.41461181640625, 148.9679718017578, 153.52133178710938, 158.07469177246094, 162.6280517578125, 167.18141174316406, 171.73477172851562, 176.2881317138672, 180.84149169921875, 185.3948516845703, 189.94821166992188, 194.50157165527344]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 3.0, 6.0, 12.0, 6.0, 9.0, 18.0, 3.0, 21.0, 25.0, 22.0, 26.0, 31.0, 36.0, 45.0, 32.0, 45.0, 36.0, 52.0, 30.0, 38.0, 40.0, 55.0, 41.0, 46.0, 46.0, 34.0, 26.0, 31.0, 34.0, 34.0, 20.0, 19.0, 17.0, 16.0, 13.0, 10.0, 8.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-43.56036376953125, -42.34282684326172, -41.12529373168945, -39.90776062011719, -38.690223693847656, -37.472686767578125, -36.25515365600586, -35.037620544433594, -33.82008361816406, -32.60254669189453, -31.385013580322266, -30.167478561401367, -28.94994354248047, -27.73240852355957, -26.514873504638672, -25.297338485717773, -24.079803466796875, -22.862268447875977, -21.644733428955078, -20.42719841003418, -19.20966339111328, -17.992128372192383, -16.774593353271484, -15.557058334350586, -14.339523315429688, -13.121988296508789, -11.90445327758789, -10.686918258666992, -9.469383239746094, -8.251848220825195, -7.034313201904297, -5.816778182983398, -4.599239349365234, -3.381704330444336, -2.1641693115234375, -0.9466342926025391, 0.2709007263183594, 1.4884357452392578, 2.7059707641601562, 3.9235057830810547, 5.141040802001953, 6.358575820922852, 7.57611083984375, 8.793645858764648, 10.011180877685547, 11.228715896606445, 12.446250915527344, 13.663785934448242, 14.88132095336914, 16.09885597229004, 17.316390991210938, 18.533926010131836, 19.751461029052734, 20.968996047973633, 22.18653106689453, 23.40406608581543, 24.621601104736328, 25.839136123657227, 27.056671142578125, 28.274206161499023, 29.491741180419922, 30.70927619934082, 31.92681121826172, 33.14434814453125, 34.361881256103516]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 10.0, 21.0, 26.0, 28.0, 64.0, 98.0, 147.0, 221.0, 409.0, 684.0, 1245.0, 2272.0, 4426.0, 8994.0, 19625.0, 47435.0, 139210.0, 699112.0, 2852800.0, 280413.0, 79909.0, 30427.0, 13410.0, 6214.0, 3141.0, 1681.0, 907.0, 549.0, 304.0, 187.0, 101.0, 81.0, 43.0, 31.0, 20.0, 7.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5859375, -5.3809814453125, -5.176025390625, -4.9710693359375, -4.76611328125, -4.5611572265625, -4.356201171875, -4.1512451171875, -3.9462890625, -3.7413330078125, -3.536376953125, -3.3314208984375, -3.12646484375, -2.9215087890625, -2.716552734375, -2.5115966796875, -2.306640625, -2.1016845703125, -1.896728515625, -1.6917724609375, -1.48681640625, -1.2818603515625, -1.076904296875, -0.8719482421875, -0.6669921875, -0.4620361328125, -0.257080078125, -0.0521240234375, 0.15283203125, 0.3577880859375, 0.562744140625, 0.7677001953125, 0.97265625, 1.1776123046875, 1.382568359375, 1.5875244140625, 1.79248046875, 1.9974365234375, 2.202392578125, 2.4073486328125, 2.6123046875, 2.8172607421875, 3.022216796875, 3.2271728515625, 3.43212890625, 3.6370849609375, 3.842041015625, 4.0469970703125, 4.251953125, 4.4569091796875, 4.661865234375, 4.8668212890625, 5.07177734375, 5.2767333984375, 5.481689453125, 5.6866455078125, 5.8916015625, 6.0965576171875, 6.301513671875, 6.5064697265625, 6.71142578125, 6.9163818359375, 7.121337890625, 7.3262939453125, 7.53125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 2.0, 9.0, 6.0, 12.0, 16.0, 13.0, 18.0, 14.0, 31.0, 29.0, 33.0, 46.0, 41.0, 48.0, 56.0, 64.0, 52.0, 64.0, 61.0, 46.0, 56.0, 43.0, 32.0, 40.0, 34.0, 31.0, 27.0, 22.0, 11.0, 11.0, 12.0, 11.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5458984375, -1.4888458251953125, -1.431793212890625, -1.3747406005859375, -1.31768798828125, -1.2606353759765625, -1.203582763671875, -1.1465301513671875, -1.0894775390625, -1.0324249267578125, -0.975372314453125, -0.9183197021484375, -0.86126708984375, -0.8042144775390625, -0.747161865234375, -0.6901092529296875, -0.633056640625, -0.5760040283203125, -0.518951416015625, -0.4618988037109375, -0.40484619140625, -0.3477935791015625, -0.290740966796875, -0.2336883544921875, -0.1766357421875, -0.1195831298828125, -0.062530517578125, -0.0054779052734375, 0.05157470703125, 0.1086273193359375, 0.165679931640625, 0.2227325439453125, 0.27978515625, 0.3368377685546875, 0.393890380859375, 0.4509429931640625, 0.50799560546875, 0.5650482177734375, 0.622100830078125, 0.6791534423828125, 0.7362060546875, 0.7932586669921875, 0.850311279296875, 0.9073638916015625, 0.96441650390625, 1.0214691162109375, 1.078521728515625, 1.1355743408203125, 1.192626953125, 1.2496795654296875, 1.306732177734375, 1.3637847900390625, 1.42083740234375, 1.4778900146484375, 1.534942626953125, 1.5919952392578125, 1.6490478515625, 1.7061004638671875, 1.763153076171875, 1.8202056884765625, 1.87725830078125, 1.9343109130859375, 1.991363525390625, 2.0484161376953125, 2.10546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 6.0, 6.0, 18.0, 19.0, 35.0, 44.0, 55.0, 80.0, 149.0, 187.0, 284.0, 443.0, 642.0, 1033.0, 1797.0, 3207.0, 5524.0, 11008.0, 23697.0, 55802.0, 154452.0, 587420.0, 2646144.0, 473982.0, 134150.0, 49698.0, 21600.0, 10167.0, 5163.0, 2943.0, 1646.0, 967.0, 660.0, 445.0, 269.0, 179.0, 114.0, 81.0, 44.0, 42.0, 25.0, 21.0, 9.0, 10.0, 6.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-7.29296875, -7.087158203125, -6.88134765625, -6.675537109375, -6.4697265625, -6.263916015625, -6.05810546875, -5.852294921875, -5.646484375, -5.440673828125, -5.23486328125, -5.029052734375, -4.8232421875, -4.617431640625, -4.41162109375, -4.205810546875, -4.0, -3.794189453125, -3.58837890625, -3.382568359375, -3.1767578125, -2.970947265625, -2.76513671875, -2.559326171875, -2.353515625, -2.147705078125, -1.94189453125, -1.736083984375, -1.5302734375, -1.324462890625, -1.11865234375, -0.912841796875, -0.70703125, -0.501220703125, -0.29541015625, -0.089599609375, 0.1162109375, 0.322021484375, 0.52783203125, 0.733642578125, 0.939453125, 1.145263671875, 1.35107421875, 1.556884765625, 1.7626953125, 1.968505859375, 2.17431640625, 2.380126953125, 2.5859375, 2.791748046875, 2.99755859375, 3.203369140625, 3.4091796875, 3.614990234375, 3.82080078125, 4.026611328125, 4.232421875, 4.438232421875, 4.64404296875, 4.849853515625, 5.0556640625, 5.261474609375, 5.46728515625, 5.673095703125, 5.87890625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 19.0, 25.0, 31.0, 53.0, 59.0, 98.0, 144.0, 268.0, 522.0, 1400.0, 600.0, 306.0, 183.0, 140.0, 67.0, 31.0, 35.0, 17.0, 9.0, 9.0, 10.0, 4.0, 8.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.8310546875, -4.662109375, -4.4931640625, -4.32421875, -4.1552734375, -3.986328125, -3.8173828125, -3.6484375, -3.4794921875, -3.310546875, -3.1416015625, -2.97265625, -2.8037109375, -2.634765625, -2.4658203125, -2.296875, -2.1279296875, -1.958984375, -1.7900390625, -1.62109375, -1.4521484375, -1.283203125, -1.1142578125, -0.9453125, -0.7763671875, -0.607421875, -0.4384765625, -0.26953125, -0.1005859375, 0.068359375, 0.2373046875, 0.40625, 0.5751953125, 0.744140625, 0.9130859375, 1.08203125, 1.2509765625, 1.419921875, 1.5888671875, 1.7578125, 1.9267578125, 2.095703125, 2.2646484375, 2.43359375, 2.6025390625, 2.771484375, 2.9404296875, 3.109375, 3.2783203125, 3.447265625, 3.6162109375, 3.78515625, 3.9541015625, 4.123046875, 4.2919921875, 4.4609375, 4.6298828125, 4.798828125, 4.9677734375, 5.13671875, 5.3056640625, 5.474609375, 5.6435546875, 5.8125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 5.0, 11.0, 11.0, 25.0, 44.0, 85.0, 103.0, 147.0, 163.0, 143.0, 106.0, 63.0, 43.0, 20.0, 17.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.86811065673828, -59.44182205200195, -58.01553726196289, -56.58924865722656, -55.1629638671875, -53.73667526245117, -52.310386657714844, -50.88410186767578, -49.45781326293945, -48.031524658203125, -46.60523986816406, -45.178951263427734, -43.75266647338867, -42.326377868652344, -40.90009307861328, -39.47380447387695, -38.047515869140625, -36.6212272644043, -35.194942474365234, -33.768653869628906, -32.342369079589844, -30.916080474853516, -29.48979377746582, -28.063507080078125, -26.637222290039062, -25.210935592651367, -23.784648895263672, -22.358360290527344, -20.93207359313965, -19.505786895751953, -18.079500198364258, -16.653213500976562, -15.226924896240234, -13.800638198852539, -12.374350547790527, -10.948063850402832, -9.52177619934082, -8.095489501953125, -6.66920280456543, -5.242915153503418, -3.8166284561157227, -2.390341281890869, -0.9640543460845947, 0.4622325897216797, 1.8885197639465332, 3.3148069381713867, 4.741093635559082, 6.167381286621094, 7.593667984008789, 9.019954681396484, 10.446242332458496, 11.872529029846191, 13.298816680908203, 14.725103378295898, 16.151390075683594, 17.577678680419922, 19.003963470458984, 20.43025016784668, 21.856536865234375, 23.282825469970703, 24.7091121673584, 26.135398864746094, 27.56168556213379, 28.987972259521484, 30.414260864257812]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 7.0, 11.0, 12.0, 18.0, 18.0, 32.0, 30.0, 43.0, 48.0, 42.0, 44.0, 55.0, 60.0, 57.0, 56.0, 67.0, 65.0, 39.0, 42.0, 46.0, 38.0, 36.0, 29.0, 21.0, 29.0, 16.0, 19.0, 4.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234235763549805, -23.45902442932129, -22.68381118774414, -21.908599853515625, -21.13338851928711, -20.358177185058594, -19.582963943481445, -18.80775260925293, -18.03253936767578, -17.257328033447266, -16.482114791870117, -15.706903457641602, -14.931692123413086, -14.156479835510254, -13.381267547607422, -12.606056213378906, -11.83084487915039, -11.055632591247559, -10.280421257019043, -9.505208969116211, -8.729997634887695, -7.954785346984863, -7.179573059082031, -6.404361248016357, -5.629149436950684, -4.85393762588501, -4.078725814819336, -3.303513526916504, -2.52830171585083, -1.7530899047851562, -0.9778776168823242, -0.2026658058166504, 0.5725479125976562, 1.3477598428726196, 2.122971773147583, 2.898183822631836, 3.6733956336975098, 4.448607444763184, 5.223819732666016, 5.9990315437316895, 6.774243354797363, 7.549455165863037, 8.324666976928711, 9.099879264831543, 9.875091552734375, 10.65030288696289, 11.425515174865723, 12.200727462768555, 12.97593879699707, 13.751151084899902, 14.526362419128418, 15.30157470703125, 16.076786041259766, 16.85199737548828, 17.62721061706543, 18.402421951293945, 19.177635192871094, 19.95284652709961, 20.728059768676758, 21.503271102905273, 22.27848243713379, 23.053695678710938, 23.828907012939453, 24.60411834716797, 25.379329681396484]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 11.0, 7.0, 26.0, 38.0, 53.0, 96.0, 132.0, 267.0, 479.0, 889.0, 1905.0, 4332.0, 10463.0, 25017.0, 63080.0, 154707.0, 301489.0, 271107.0, 127209.0, 51245.0, 20713.0, 8348.0, 3550.0, 1658.0, 782.0, 375.0, 222.0, 116.0, 88.0, 44.0, 32.0, 18.0, 14.0, 8.0, 6.0, 3.0, 7.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.65625, -6.4654541015625, -6.274658203125, -6.0838623046875, -5.89306640625, -5.7022705078125, -5.511474609375, -5.3206787109375, -5.1298828125, -4.9390869140625, -4.748291015625, -4.5574951171875, -4.36669921875, -4.1759033203125, -3.985107421875, -3.7943115234375, -3.603515625, -3.4127197265625, -3.221923828125, -3.0311279296875, -2.84033203125, -2.6495361328125, -2.458740234375, -2.2679443359375, -2.0771484375, -1.8863525390625, -1.695556640625, -1.5047607421875, -1.31396484375, -1.1231689453125, -0.932373046875, -0.7415771484375, -0.55078125, -0.3599853515625, -0.169189453125, 0.0216064453125, 0.21240234375, 0.4031982421875, 0.593994140625, 0.7847900390625, 0.9755859375, 1.1663818359375, 1.357177734375, 1.5479736328125, 1.73876953125, 1.9295654296875, 2.120361328125, 2.3111572265625, 2.501953125, 2.6927490234375, 2.883544921875, 3.0743408203125, 3.26513671875, 3.4559326171875, 3.646728515625, 3.8375244140625, 4.0283203125, 4.2191162109375, 4.409912109375, 4.6007080078125, 4.79150390625, 4.9822998046875, 5.173095703125, 5.3638916015625, 5.5546875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 10.0, 10.0, 19.0, 23.0, 25.0, 30.0, 37.0, 37.0, 43.0, 44.0, 62.0, 60.0, 68.0, 58.0, 69.0, 73.0, 55.0, 44.0, 39.0, 36.0, 37.0, 34.0, 23.0, 18.0, 13.0, 17.0, 5.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0], "bins": [-2.931640625, -2.8571014404296875, -2.782562255859375, -2.7080230712890625, -2.63348388671875, -2.5589447021484375, -2.484405517578125, -2.4098663330078125, -2.3353271484375, -2.2607879638671875, -2.186248779296875, -2.1117095947265625, -2.03717041015625, -1.9626312255859375, -1.888092041015625, -1.8135528564453125, -1.739013671875, -1.6644744873046875, -1.589935302734375, -1.5153961181640625, -1.44085693359375, -1.3663177490234375, -1.291778564453125, -1.2172393798828125, -1.1427001953125, -1.0681610107421875, -0.993621826171875, -0.9190826416015625, -0.84454345703125, -0.7700042724609375, -0.695465087890625, -0.6209259033203125, -0.54638671875, -0.4718475341796875, -0.397308349609375, -0.3227691650390625, -0.24822998046875, -0.1736907958984375, -0.099151611328125, -0.0246124267578125, 0.0499267578125, 0.1244659423828125, 0.199005126953125, 0.2735443115234375, 0.34808349609375, 0.4226226806640625, 0.497161865234375, 0.5717010498046875, 0.646240234375, 0.7207794189453125, 0.795318603515625, 0.8698577880859375, 0.94439697265625, 1.0189361572265625, 1.093475341796875, 1.1680145263671875, 1.2425537109375, 1.3170928955078125, 1.391632080078125, 1.4661712646484375, 1.54071044921875, 1.6152496337890625, 1.689788818359375, 1.7643280029296875, 1.8388671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 4.0, 17.0, 15.0, 17.0, 30.0, 22.0, 46.0, 64.0, 79.0, 124.0, 208.0, 333.0, 474.0, 1022.0, 2416.0, 11847.0, 118623.0, 718011.0, 173280.0, 16179.0, 2992.0, 1126.0, 594.0, 355.0, 179.0, 147.0, 104.0, 82.0, 40.0, 27.0, 17.0, 24.0, 14.0, 11.0, 7.0, 7.0, 5.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -19.1939697265625, -18.669189453125, -18.1444091796875, -17.61962890625, -17.0948486328125, -16.570068359375, -16.0452880859375, -15.5205078125, -14.9957275390625, -14.470947265625, -13.9461669921875, -13.42138671875, -12.8966064453125, -12.371826171875, -11.8470458984375, -11.322265625, -10.7974853515625, -10.272705078125, -9.7479248046875, -9.22314453125, -8.6983642578125, -8.173583984375, -7.6488037109375, -7.1240234375, -6.5992431640625, -6.074462890625, -5.5496826171875, -5.02490234375, -4.5001220703125, -3.975341796875, -3.4505615234375, -2.92578125, -2.4010009765625, -1.876220703125, -1.3514404296875, -0.82666015625, -0.3018798828125, 0.222900390625, 0.7476806640625, 1.2724609375, 1.7972412109375, 2.322021484375, 2.8468017578125, 3.37158203125, 3.8963623046875, 4.421142578125, 4.9459228515625, 5.470703125, 5.9954833984375, 6.520263671875, 7.0450439453125, 7.56982421875, 8.0946044921875, 8.619384765625, 9.1441650390625, 9.6689453125, 10.1937255859375, 10.718505859375, 11.2432861328125, 11.76806640625, 12.2928466796875, 12.817626953125, 13.3424072265625, 13.8671875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 4.0, 6.0, 7.0, 13.0, 10.0, 12.0, 21.0, 22.0, 28.0, 33.0, 36.0, 27.0, 31.0, 47.0, 45.0, 49.0, 49.0, 54.0, 52.0, 56.0, 44.0, 48.0, 38.0, 44.0, 39.0, 23.0, 27.0, 31.0, 15.0, 25.0, 13.0, 10.0, 7.0, 10.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.84375, -9.4541015625, -9.064453125, -8.6748046875, -8.28515625, -7.8955078125, -7.505859375, -7.1162109375, -6.7265625, -6.3369140625, -5.947265625, -5.5576171875, -5.16796875, -4.7783203125, -4.388671875, -3.9990234375, -3.609375, -3.2197265625, -2.830078125, -2.4404296875, -2.05078125, -1.6611328125, -1.271484375, -0.8818359375, -0.4921875, -0.1025390625, 0.287109375, 0.6767578125, 1.06640625, 1.4560546875, 1.845703125, 2.2353515625, 2.625, 3.0146484375, 3.404296875, 3.7939453125, 4.18359375, 4.5732421875, 4.962890625, 5.3525390625, 5.7421875, 6.1318359375, 6.521484375, 6.9111328125, 7.30078125, 7.6904296875, 8.080078125, 8.4697265625, 8.859375, 9.2490234375, 9.638671875, 10.0283203125, 10.41796875, 10.8076171875, 11.197265625, 11.5869140625, 11.9765625, 12.3662109375, 12.755859375, 13.1455078125, 13.53515625, 13.9248046875, 14.314453125, 14.7041015625, 15.09375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 4.0, 5.0, 7.0, 8.0, 11.0, 19.0, 20.0, 37.0, 67.0, 145.0, 223.0, 506.0, 1243.0, 3681.0, 14384.0, 84800.0, 531893.0, 348831.0, 48825.0, 9389.0, 2624.0, 962.0, 417.0, 196.0, 103.0, 50.0, 31.0, 23.0, 18.0, 5.0, 6.0, 4.0, 7.0, 1.0, 8.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.03125, -7.80084228515625, -7.5704345703125, -7.34002685546875, -7.109619140625, -6.87921142578125, -6.6488037109375, -6.41839599609375, -6.18798828125, -5.95758056640625, -5.7271728515625, -5.49676513671875, -5.266357421875, -5.03594970703125, -4.8055419921875, -4.57513427734375, -4.3447265625, -4.11431884765625, -3.8839111328125, -3.65350341796875, -3.423095703125, -3.19268798828125, -2.9622802734375, -2.73187255859375, -2.50146484375, -2.27105712890625, -2.0406494140625, -1.81024169921875, -1.579833984375, -1.34942626953125, -1.1190185546875, -0.88861083984375, -0.658203125, -0.42779541015625, -0.1973876953125, 0.03302001953125, 0.263427734375, 0.49383544921875, 0.7242431640625, 0.95465087890625, 1.18505859375, 1.41546630859375, 1.6458740234375, 1.87628173828125, 2.106689453125, 2.33709716796875, 2.5675048828125, 2.79791259765625, 3.0283203125, 3.25872802734375, 3.4891357421875, 3.71954345703125, 3.949951171875, 4.18035888671875, 4.4107666015625, 4.64117431640625, 4.87158203125, 5.10198974609375, 5.3323974609375, 5.56280517578125, 5.793212890625, 6.02362060546875, 6.2540283203125, 6.48443603515625, 6.71484375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 8.0, 8.0, 14.0, 20.0, 36.0, 34.0, 66.0, 71.0, 96.0, 115.0, 122.0, 109.0, 72.0, 59.0, 42.0, 35.0, 31.0, 15.0, 14.0, 9.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00133514404296875, -0.0012937039136886597, -0.0012522637844085693, -0.001210823655128479, -0.0011693835258483887, -0.0011279433965682983, -0.001086503267288208, -0.0010450631380081177, -0.0010036230087280273, -0.000962182879447937, -0.0009207427501678467, -0.0008793026208877563, -0.000837862491607666, -0.0007964223623275757, -0.0007549822330474854, -0.000713542103767395, -0.0006721019744873047, -0.0006306618452072144, -0.000589221715927124, -0.0005477815866470337, -0.0005063414573669434, -0.00046490132808685303, -0.0004234611988067627, -0.00038202106952667236, -0.00034058094024658203, -0.0002991408109664917, -0.00025770068168640137, -0.00021626055240631104, -0.0001748204231262207, -0.00013338029384613037, -9.194016456604004e-05, -5.050003528594971e-05, -9.059906005859375e-06, 3.238022327423096e-05, 7.382035255432129e-05, 0.00011526048183441162, 0.00015670061111450195, 0.00019814074039459229, 0.00023958086967468262, 0.00028102099895477295, 0.0003224611282348633, 0.0003639012575149536, 0.00040534138679504395, 0.0004467815160751343, 0.0004882216453552246, 0.0005296617746353149, 0.0005711019039154053, 0.0006125420331954956, 0.0006539821624755859, 0.0006954222917556763, 0.0007368624210357666, 0.0007783025503158569, 0.0008197426795959473, 0.0008611828088760376, 0.0009026229381561279, 0.0009440630674362183, 0.0009855031967163086, 0.001026943325996399, 0.0010683834552764893, 0.0011098235845565796, 0.00115126371383667, 0.0011927038431167603, 0.0012341439723968506, 0.001275584101676941, 0.0013170242309570312]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 6.0, 5.0, 14.0, 10.0, 15.0, 30.0, 36.0, 43.0, 82.0, 94.0, 176.0, 267.0, 556.0, 1224.0, 3158.0, 10106.0, 50640.0, 353924.0, 519405.0, 86172.0, 15307.0, 4202.0, 1477.0, 654.0, 334.0, 219.0, 130.0, 89.0, 61.0, 36.0, 22.0, 14.0, 13.0, 13.0, 8.0, 3.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0], "bins": [-8.328125, -8.1097412109375, -7.891357421875, -7.6729736328125, -7.45458984375, -7.2362060546875, -7.017822265625, -6.7994384765625, -6.5810546875, -6.3626708984375, -6.144287109375, -5.9259033203125, -5.70751953125, -5.4891357421875, -5.270751953125, -5.0523681640625, -4.833984375, -4.6156005859375, -4.397216796875, -4.1788330078125, -3.96044921875, -3.7420654296875, -3.523681640625, -3.3052978515625, -3.0869140625, -2.8685302734375, -2.650146484375, -2.4317626953125, -2.21337890625, -1.9949951171875, -1.776611328125, -1.5582275390625, -1.33984375, -1.1214599609375, -0.903076171875, -0.6846923828125, -0.46630859375, -0.2479248046875, -0.029541015625, 0.1888427734375, 0.4072265625, 0.6256103515625, 0.843994140625, 1.0623779296875, 1.28076171875, 1.4991455078125, 1.717529296875, 1.9359130859375, 2.154296875, 2.3726806640625, 2.591064453125, 2.8094482421875, 3.02783203125, 3.2462158203125, 3.464599609375, 3.6829833984375, 3.9013671875, 4.1197509765625, 4.338134765625, 4.5565185546875, 4.77490234375, 4.9932861328125, 5.211669921875, 5.4300537109375, 5.6484375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 3.0, 5.0, 12.0, 7.0, 13.0, 12.0, 22.0, 27.0, 36.0, 28.0, 53.0, 55.0, 69.0, 95.0, 75.0, 77.0, 63.0, 50.0, 54.0, 46.0, 39.0, 33.0, 18.0, 18.0, 20.0, 8.0, 10.0, 14.0, 8.0, 6.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -4.06414794921875, -3.9173583984375, -3.77056884765625, -3.623779296875, -3.47698974609375, -3.3302001953125, -3.18341064453125, -3.03662109375, -2.88983154296875, -2.7430419921875, -2.59625244140625, -2.449462890625, -2.30267333984375, -2.1558837890625, -2.00909423828125, -1.8623046875, -1.71551513671875, -1.5687255859375, -1.42193603515625, -1.275146484375, -1.12835693359375, -0.9815673828125, -0.83477783203125, -0.68798828125, -0.54119873046875, -0.3944091796875, -0.24761962890625, -0.100830078125, 0.04595947265625, 0.1927490234375, 0.33953857421875, 0.486328125, 0.63311767578125, 0.7799072265625, 0.92669677734375, 1.073486328125, 1.22027587890625, 1.3670654296875, 1.51385498046875, 1.66064453125, 1.80743408203125, 1.9542236328125, 2.10101318359375, 2.247802734375, 2.39459228515625, 2.5413818359375, 2.68817138671875, 2.8349609375, 2.98175048828125, 3.1285400390625, 3.27532958984375, 3.422119140625, 3.56890869140625, 3.7156982421875, 3.86248779296875, 4.00927734375, 4.15606689453125, 4.3028564453125, 4.44964599609375, 4.596435546875, 4.74322509765625, 4.8900146484375, 5.03680419921875, 5.18359375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 28.0, 122.0, 233.0, 301.0, 204.0, 77.0, 21.0, 8.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.5889892578125, -258.0293273925781, -252.4696807861328, -246.9100341796875, -241.35037231445312, -235.7907257080078, -230.2310791015625, -224.67141723632812, -219.1117706298828, -213.5521240234375, -207.99246215820312, -202.4328155517578, -196.8731689453125, -191.31350708007812, -185.7538604736328, -180.1942138671875, -174.63455200195312, -169.0749053955078, -163.51524353027344, -157.95559692382812, -152.39593505859375, -146.83628845214844, -141.27664184570312, -135.71697998046875, -130.15733337402344, -124.5976791381836, -119.03802490234375, -113.47837829589844, -107.9187240600586, -102.35906982421875, -96.79942321777344, -91.2397689819336, -85.68009948730469, -80.12044525146484, -74.560791015625, -69.00114440917969, -63.441490173339844, -57.8818359375, -52.32218551635742, -46.762535095214844, -41.202880859375, -35.643226623535156, -30.083576202392578, -24.523923873901367, -18.964271545410156, -13.404619216918945, -7.844966888427734, -2.2853164672851562, 3.2743377685546875, 8.833990097045898, 14.39364242553711, 19.95329475402832, 25.51294708251953, 31.072599411010742, 36.63225173950195, 42.19190216064453, 47.751556396484375, 53.31121063232422, 58.8708610534668, 64.43051147460938, 69.99016571044922, 75.54981994628906, 81.10946655273438, 86.66912078857422, 92.22877502441406]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 4.0, 4.0, 7.0, 9.0, 12.0, 15.0, 21.0, 24.0, 26.0, 24.0, 21.0, 45.0, 25.0, 31.0, 40.0, 45.0, 43.0, 44.0, 47.0, 51.0, 47.0, 48.0, 47.0, 29.0, 44.0, 32.0, 31.0, 29.0, 24.0, 21.0, 21.0, 23.0, 14.0, 10.0, 10.0, 8.0, 8.0, 4.0, 3.0, 3.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-53.82587814331055, -52.183006286621094, -50.54013442993164, -48.89726257324219, -47.25439453125, -45.61151885986328, -43.968650817871094, -42.32577896118164, -40.68290710449219, -39.040035247802734, -37.39716339111328, -35.75429153442383, -34.111419677734375, -32.46855163574219, -30.825679779052734, -29.18280792236328, -27.539936065673828, -25.897064208984375, -24.254192352294922, -22.6113224029541, -20.96845054626465, -19.325578689575195, -17.682708740234375, -16.039836883544922, -14.396965026855469, -12.754093170166016, -11.111222267150879, -9.468351364135742, -7.825479507446289, -6.182607650756836, -4.539736747741699, -2.8968658447265625, -1.2539901733398438, 0.38888120651245117, 2.031752586364746, 3.674623966217041, 5.317495346069336, 6.960367202758789, 8.603238105773926, 10.246109008789062, 11.888980865478516, 13.531852722167969, 15.174723625183105, 16.817594528198242, 18.460466384887695, 20.10333824157715, 21.74620819091797, 23.389080047607422, 25.031951904296875, 26.674823760986328, 28.31769561767578, 29.9605655670166, 31.603437423706055, 33.246307373046875, 34.88917922973633, 36.53205108642578, 38.174922943115234, 39.81779479980469, 41.46066665649414, 43.103538513183594, 44.74640655517578, 46.3892822265625, 48.03215026855469, 49.67502212524414, 51.317893981933594]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 2.0, 4.0, 6.0, 3.0, 5.0, 13.0, 19.0, 23.0, 40.0, 24.0, 41.0, 70.0, 99.0, 156.0, 231.0, 416.0, 700.0, 1325.0, 2849.0, 8480.0, 42727.0, 3930640.0, 179088.0, 18099.0, 4853.0, 1985.0, 920.0, 515.0, 325.0, 164.0, 134.0, 85.0, 65.0, 53.0, 34.0, 23.0, 10.0, 11.0, 10.0, 4.0, 6.0, 4.0, 8.0, 5.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.171875, -16.647705078125, -16.12353515625, -15.599365234375, -15.0751953125, -14.551025390625, -14.02685546875, -13.502685546875, -12.978515625, -12.454345703125, -11.93017578125, -11.406005859375, -10.8818359375, -10.357666015625, -9.83349609375, -9.309326171875, -8.78515625, -8.260986328125, -7.73681640625, -7.212646484375, -6.6884765625, -6.164306640625, -5.64013671875, -5.115966796875, -4.591796875, -4.067626953125, -3.54345703125, -3.019287109375, -2.4951171875, -1.970947265625, -1.44677734375, -0.922607421875, -0.3984375, 0.125732421875, 0.64990234375, 1.174072265625, 1.6982421875, 2.222412109375, 2.74658203125, 3.270751953125, 3.794921875, 4.319091796875, 4.84326171875, 5.367431640625, 5.8916015625, 6.415771484375, 6.93994140625, 7.464111328125, 7.98828125, 8.512451171875, 9.03662109375, 9.560791015625, 10.0849609375, 10.609130859375, 11.13330078125, 11.657470703125, 12.181640625, 12.705810546875, 13.22998046875, 13.754150390625, 14.2783203125, 14.802490234375, 15.32666015625, 15.850830078125, 16.375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 6.0, 11.0, 13.0, 17.0, 26.0, 36.0, 23.0, 37.0, 41.0, 47.0, 65.0, 57.0, 79.0, 65.0, 72.0, 58.0, 43.0, 51.0, 38.0, 50.0, 39.0, 24.0, 16.0, 18.0, 11.0, 17.0, 9.0, 9.0, 3.0, 5.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6640625, -2.5823974609375, -2.500732421875, -2.4190673828125, -2.33740234375, -2.2557373046875, -2.174072265625, -2.0924072265625, -2.0107421875, -1.9290771484375, -1.847412109375, -1.7657470703125, -1.68408203125, -1.6024169921875, -1.520751953125, -1.4390869140625, -1.357421875, -1.2757568359375, -1.194091796875, -1.1124267578125, -1.03076171875, -0.9490966796875, -0.867431640625, -0.7857666015625, -0.7041015625, -0.6224365234375, -0.540771484375, -0.4591064453125, -0.37744140625, -0.2957763671875, -0.214111328125, -0.1324462890625, -0.05078125, 0.0308837890625, 0.112548828125, 0.1942138671875, 0.27587890625, 0.3575439453125, 0.439208984375, 0.5208740234375, 0.6025390625, 0.6842041015625, 0.765869140625, 0.8475341796875, 0.92919921875, 1.0108642578125, 1.092529296875, 1.1741943359375, 1.255859375, 1.3375244140625, 1.419189453125, 1.5008544921875, 1.58251953125, 1.6641845703125, 1.745849609375, 1.8275146484375, 1.9091796875, 1.9908447265625, 2.072509765625, 2.1541748046875, 2.23583984375, 2.3175048828125, 2.399169921875, 2.4808349609375, 2.5625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 8.0, 4.0, 11.0, 8.0, 7.0, 10.0, 11.0, 16.0, 27.0, 20.0, 31.0, 35.0, 53.0, 101.0, 152.0, 212.0, 340.0, 615.0, 1367.0, 3727.0, 13637.0, 110706.0, 3983876.0, 63257.0, 10237.0, 3075.0, 1198.0, 592.0, 323.0, 204.0, 128.0, 85.0, 57.0, 41.0, 22.0, 24.0, 16.0, 13.0, 9.0, 10.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.359375, -19.73095703125, -19.1025390625, -18.47412109375, -17.845703125, -17.21728515625, -16.5888671875, -15.96044921875, -15.33203125, -14.70361328125, -14.0751953125, -13.44677734375, -12.818359375, -12.18994140625, -11.5615234375, -10.93310546875, -10.3046875, -9.67626953125, -9.0478515625, -8.41943359375, -7.791015625, -7.16259765625, -6.5341796875, -5.90576171875, -5.27734375, -4.64892578125, -4.0205078125, -3.39208984375, -2.763671875, -2.13525390625, -1.5068359375, -0.87841796875, -0.25, 0.37841796875, 1.0068359375, 1.63525390625, 2.263671875, 2.89208984375, 3.5205078125, 4.14892578125, 4.77734375, 5.40576171875, 6.0341796875, 6.66259765625, 7.291015625, 7.91943359375, 8.5478515625, 9.17626953125, 9.8046875, 10.43310546875, 11.0615234375, 11.68994140625, 12.318359375, 12.94677734375, 13.5751953125, 14.20361328125, 14.83203125, 15.46044921875, 16.0888671875, 16.71728515625, 17.345703125, 17.97412109375, 18.6025390625, 19.23095703125, 19.859375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 14.0, 22.0, 32.0, 73.0, 236.0, 3179.0, 305.0, 105.0, 31.0, 22.0, 14.0, 13.0, 7.0, 2.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.25, -5.126739501953125, -5.00347900390625, -4.880218505859375, -4.7569580078125, -4.633697509765625, -4.51043701171875, -4.387176513671875, -4.263916015625, -4.140655517578125, -4.01739501953125, -3.894134521484375, -3.7708740234375, -3.647613525390625, -3.52435302734375, -3.401092529296875, -3.27783203125, -3.154571533203125, -3.03131103515625, -2.908050537109375, -2.7847900390625, -2.661529541015625, -2.53826904296875, -2.415008544921875, -2.291748046875, -2.168487548828125, -2.04522705078125, -1.921966552734375, -1.7987060546875, -1.675445556640625, -1.55218505859375, -1.428924560546875, -1.3056640625, -1.182403564453125, -1.05914306640625, -0.935882568359375, -0.8126220703125, -0.689361572265625, -0.56610107421875, -0.442840576171875, -0.319580078125, -0.196319580078125, -0.07305908203125, 0.050201416015625, 0.1734619140625, 0.296722412109375, 0.41998291015625, 0.543243408203125, 0.66650390625, 0.789764404296875, 0.91302490234375, 1.036285400390625, 1.1595458984375, 1.282806396484375, 1.40606689453125, 1.529327392578125, 1.652587890625, 1.775848388671875, 1.89910888671875, 2.022369384765625, 2.1456298828125, 2.268890380859375, 2.39215087890625, 2.515411376953125, 2.638671875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 3.0, 2.0, 8.0, 7.0, 19.0, 18.0, 34.0, 39.0, 55.0, 55.0, 87.0, 94.0, 97.0, 74.0, 77.0, 58.0, 85.0, 53.0, 42.0, 19.0, 27.0, 14.0, 11.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.951854228973389, -6.653461456298828, -6.355068683624268, -6.056675910949707, -5.758283615112305, -5.459890842437744, -5.161498069763184, -4.863105773925781, -4.5647125244140625, -4.266319751739502, -3.9679272174835205, -3.66953444480896, -3.3711419105529785, -3.072749137878418, -2.7743563652038574, -2.475963830947876, -2.1775712966918945, -1.8791786432266235, -1.5807859897613525, -1.282393217086792, -0.984000563621521, -0.68560791015625, -0.38721513748168945, -0.08882260322570801, 0.20957016944885254, 0.5079628229141235, 0.8063555359840393, 1.104748249053955, 1.403140902519226, 1.701533555984497, 1.9999263286590576, 2.298318862915039, 2.5967111587524414, 2.895103931427002, 3.1934964656829834, 3.491889238357544, 3.7902817726135254, 4.088674545288086, 4.3870673179626465, 4.685460090637207, 4.983852386474609, 5.28224515914917, 5.5806379318237305, 5.879030227661133, 6.177423000335693, 6.475815773010254, 6.7742085456848145, 7.072601318359375, 7.3709940910339355, 7.669386863708496, 7.967779636383057, 8.266172409057617, 8.56456470489502, 8.862957000732422, 9.16135025024414, 9.459742546081543, 9.758135795593262, 10.056528091430664, 10.354921340942383, 10.653313636779785, 10.951706886291504, 11.250099182128906, 11.548492431640625, 11.846884727478027, 12.14527702331543]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 6.0, 10.0, 10.0, 7.0, 7.0, 20.0, 6.0, 20.0, 13.0, 27.0, 20.0, 17.0, 35.0, 37.0, 27.0, 22.0, 30.0, 45.0, 34.0, 34.0, 37.0, 42.0, 42.0, 43.0, 35.0, 33.0, 32.0, 34.0, 30.0, 36.0, 34.0, 25.0, 20.0, 24.0, 16.0, 20.0, 16.0, 8.0, 6.0, 8.0, 9.0, 6.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.181201934814453, -5.010282039642334, -4.839362144470215, -4.6684417724609375, -4.497521877288818, -4.326601982116699, -4.155681610107422, -3.9847617149353027, -3.8138418197631836, -3.6429219245910645, -3.472001791000366, -3.301081657409668, -3.130161762237549, -2.9592418670654297, -2.7883217334747314, -2.617401599884033, -2.446481704711914, -2.275561809539795, -2.1046416759490967, -1.933721661567688, -1.7628016471862793, -1.5918816328048706, -1.420961618423462, -1.2500416040420532, -1.0791215896606445, -0.9082015752792358, -0.7372815608978271, -0.5663615465164185, -0.39544153213500977, -0.22452151775360107, -0.05360150337219238, 0.11731851100921631, 0.2882380485534668, 0.4591580629348755, 0.6300780773162842, 0.8009980916976929, 0.9719181060791016, 1.1428381204605103, 1.313758134841919, 1.4846781492233276, 1.6555981636047363, 1.826518177986145, 1.9974381923675537, 2.168358325958252, 2.339278221130371, 2.5101981163024902, 2.6811182498931885, 2.8520383834838867, 3.022958278656006, 3.193878173828125, 3.3647983074188232, 3.5357184410095215, 3.7066383361816406, 3.8775582313537598, 4.048478126525879, 4.219398498535156, 4.390318393707275, 4.5612382888793945, 4.732158660888672, 4.903078556060791, 5.07399845123291, 5.244918346405029, 5.415838241577148, 5.586758613586426, 5.757678508758545]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 7.0, 5.0, 11.0, 17.0, 15.0, 30.0, 35.0, 63.0, 137.0, 240.0, 445.0, 874.0, 1977.0, 4425.0, 10534.0, 24528.0, 56450.0, 120274.0, 213510.0, 254683.0, 184849.0, 96909.0, 44675.0, 19097.0, 8227.0, 3502.0, 1522.0, 701.0, 344.0, 177.0, 105.0, 68.0, 33.0, 26.0, 14.0, 15.0, 8.0, 4.0, 4.0, 4.0, 4.0, 0.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.0546875, -4.8984375, -4.7421875, -4.5859375, -4.4296875, -4.2734375, -4.1171875, -3.9609375, -3.8046875, -3.6484375, -3.4921875, -3.3359375, -3.1796875, -3.0234375, -2.8671875, -2.7109375, -2.5546875, -2.3984375, -2.2421875, -2.0859375, -1.9296875, -1.7734375, -1.6171875, -1.4609375, -1.3046875, -1.1484375, -0.9921875, -0.8359375, -0.6796875, -0.5234375, -0.3671875, -0.2109375, -0.0546875, 0.1015625, 0.2578125, 0.4140625, 0.5703125, 0.7265625, 0.8828125, 1.0390625, 1.1953125, 1.3515625, 1.5078125, 1.6640625, 1.8203125, 1.9765625, 2.1328125, 2.2890625, 2.4453125, 2.6015625, 2.7578125, 2.9140625, 3.0703125, 3.2265625, 3.3828125, 3.5390625, 3.6953125, 3.8515625, 4.0078125, 4.1640625, 4.3203125, 4.4765625, 4.6328125, 4.7890625, 4.9453125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 8.0, 7.0, 10.0, 14.0, 10.0, 16.0, 23.0, 19.0, 25.0, 36.0, 31.0, 43.0, 53.0, 61.0, 47.0, 57.0, 51.0, 46.0, 67.0, 50.0, 48.0, 45.0, 31.0, 34.0, 23.0, 24.0, 29.0, 26.0, 17.0, 13.0, 10.0, 11.0, 6.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.591796875, -2.515289306640625, -2.43878173828125, -2.362274169921875, -2.2857666015625, -2.209259033203125, -2.13275146484375, -2.056243896484375, -1.979736328125, -1.903228759765625, -1.82672119140625, -1.750213623046875, -1.6737060546875, -1.597198486328125, -1.52069091796875, -1.444183349609375, -1.36767578125, -1.291168212890625, -1.21466064453125, -1.138153076171875, -1.0616455078125, -0.985137939453125, -0.90863037109375, -0.832122802734375, -0.755615234375, -0.679107666015625, -0.60260009765625, -0.526092529296875, -0.4495849609375, -0.373077392578125, -0.29656982421875, -0.220062255859375, -0.1435546875, -0.067047119140625, 0.00946044921875, 0.085968017578125, 0.1624755859375, 0.238983154296875, 0.31549072265625, 0.391998291015625, 0.468505859375, 0.545013427734375, 0.62152099609375, 0.698028564453125, 0.7745361328125, 0.851043701171875, 0.92755126953125, 1.004058837890625, 1.08056640625, 1.157073974609375, 1.23358154296875, 1.310089111328125, 1.3865966796875, 1.463104248046875, 1.53961181640625, 1.616119384765625, 1.692626953125, 1.769134521484375, 1.84564208984375, 1.922149658203125, 1.9986572265625, 2.075164794921875, 2.15167236328125, 2.228179931640625, 2.3046875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 7.0, 10.0, 22.0, 22.0, 21.0, 37.0, 43.0, 47.0, 80.0, 100.0, 132.0, 198.0, 262.0, 391.0, 613.0, 1166.0, 2707.0, 10749.0, 78299.0, 531240.0, 364478.0, 45867.0, 7174.0, 2130.0, 965.0, 554.0, 345.0, 238.0, 194.0, 117.0, 84.0, 68.0, 58.0, 30.0, 30.0, 22.0, 12.0, 13.0, 10.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.265625, -10.8885498046875, -10.511474609375, -10.1343994140625, -9.75732421875, -9.3802490234375, -9.003173828125, -8.6260986328125, -8.2490234375, -7.8719482421875, -7.494873046875, -7.1177978515625, -6.74072265625, -6.3636474609375, -5.986572265625, -5.6094970703125, -5.232421875, -4.8553466796875, -4.478271484375, -4.1011962890625, -3.72412109375, -3.3470458984375, -2.969970703125, -2.5928955078125, -2.2158203125, -1.8387451171875, -1.461669921875, -1.0845947265625, -0.70751953125, -0.3304443359375, 0.046630859375, 0.4237060546875, 0.80078125, 1.1778564453125, 1.554931640625, 1.9320068359375, 2.30908203125, 2.6861572265625, 3.063232421875, 3.4403076171875, 3.8173828125, 4.1944580078125, 4.571533203125, 4.9486083984375, 5.32568359375, 5.7027587890625, 6.079833984375, 6.4569091796875, 6.833984375, 7.2110595703125, 7.588134765625, 7.9652099609375, 8.34228515625, 8.7193603515625, 9.096435546875, 9.4735107421875, 9.8505859375, 10.2276611328125, 10.604736328125, 10.9818115234375, 11.35888671875, 11.7359619140625, 12.113037109375, 12.4901123046875, 12.8671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 4.0, 8.0, 7.0, 7.0, 10.0, 8.0, 9.0, 23.0, 19.0, 9.0, 17.0, 20.0, 23.0, 30.0, 41.0, 40.0, 36.0, 44.0, 48.0, 46.0, 53.0, 52.0, 56.0, 36.0, 38.0, 50.0, 36.0, 47.0, 37.0, 27.0, 21.0, 23.0, 15.0, 15.0, 13.0, 8.0, 5.0, 4.0, 4.0, 7.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.0078125, -10.6402587890625, -10.272705078125, -9.9051513671875, -9.53759765625, -9.1700439453125, -8.802490234375, -8.4349365234375, -8.0673828125, -7.6998291015625, -7.332275390625, -6.9647216796875, -6.59716796875, -6.2296142578125, -5.862060546875, -5.4945068359375, -5.126953125, -4.7593994140625, -4.391845703125, -4.0242919921875, -3.65673828125, -3.2891845703125, -2.921630859375, -2.5540771484375, -2.1865234375, -1.8189697265625, -1.451416015625, -1.0838623046875, -0.71630859375, -0.3487548828125, 0.018798828125, 0.3863525390625, 0.75390625, 1.1214599609375, 1.489013671875, 1.8565673828125, 2.22412109375, 2.5916748046875, 2.959228515625, 3.3267822265625, 3.6943359375, 4.0618896484375, 4.429443359375, 4.7969970703125, 5.16455078125, 5.5321044921875, 5.899658203125, 6.2672119140625, 6.634765625, 7.0023193359375, 7.369873046875, 7.7374267578125, 8.10498046875, 8.4725341796875, 8.840087890625, 9.2076416015625, 9.5751953125, 9.9427490234375, 10.310302734375, 10.6778564453125, 11.04541015625, 11.4129638671875, 11.780517578125, 12.1480712890625, 12.515625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 22.0, 23.0, 32.0, 59.0, 77.0, 153.0, 217.0, 352.0, 608.0, 1262.0, 2613.0, 6274.0, 18719.0, 75779.0, 352650.0, 448965.0, 103078.0, 24079.0, 7280.0, 3019.0, 1425.0, 820.0, 397.0, 249.0, 140.0, 99.0, 34.0, 26.0, 25.0, 23.0, 17.0, 6.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.966796875, -3.814788818359375, -3.66278076171875, -3.510772705078125, -3.3587646484375, -3.206756591796875, -3.05474853515625, -2.902740478515625, -2.750732421875, -2.598724365234375, -2.44671630859375, -2.294708251953125, -2.1427001953125, -1.990692138671875, -1.83868408203125, -1.686676025390625, -1.53466796875, -1.382659912109375, -1.23065185546875, -1.078643798828125, -0.9266357421875, -0.774627685546875, -0.62261962890625, -0.470611572265625, -0.318603515625, -0.166595458984375, -0.01458740234375, 0.137420654296875, 0.2894287109375, 0.441436767578125, 0.59344482421875, 0.745452880859375, 0.8974609375, 1.049468994140625, 1.20147705078125, 1.353485107421875, 1.5054931640625, 1.657501220703125, 1.80950927734375, 1.961517333984375, 2.113525390625, 2.265533447265625, 2.41754150390625, 2.569549560546875, 2.7215576171875, 2.873565673828125, 3.02557373046875, 3.177581787109375, 3.32958984375, 3.481597900390625, 3.63360595703125, 3.785614013671875, 3.9376220703125, 4.089630126953125, 4.24163818359375, 4.393646240234375, 4.545654296875, 4.697662353515625, 4.84967041015625, 5.001678466796875, 5.1536865234375, 5.305694580078125, 5.45770263671875, 5.609710693359375, 5.76171875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 8.0, 10.0, 4.0, 8.0, 8.0, 10.0, 13.0, 17.0, 19.0, 15.0, 29.0, 32.0, 39.0, 44.0, 50.0, 68.0, 53.0, 54.0, 69.0, 63.0, 54.0, 58.0, 49.0, 39.0, 25.0, 27.0, 30.0, 19.0, 12.0, 10.0, 9.0, 11.0, 9.0, 2.0, 9.0, 8.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0005936622619628906, -0.0005734935402870178, -0.000553324818611145, -0.0005331560969352722, -0.0005129873752593994, -0.0004928186535835266, -0.0004726499319076538, -0.000452481210231781, -0.0004323124885559082, -0.0004121437668800354, -0.0003919750452041626, -0.0003718063235282898, -0.000351637601852417, -0.0003314688801765442, -0.0003113001585006714, -0.0002911314368247986, -0.0002709627151489258, -0.000250793993473053, -0.00023062527179718018, -0.00021045655012130737, -0.00019028782844543457, -0.00017011910676956177, -0.00014995038509368896, -0.00012978166341781616, -0.00010961294174194336, -8.944422006607056e-05, -6.927549839019775e-05, -4.910677671432495e-05, -2.893805503845215e-05, -8.769333362579346e-06, 1.1399388313293457e-05, 3.156810998916626e-05, 5.173683166503906e-05, 7.190555334091187e-05, 9.207427501678467e-05, 0.00011224299669265747, 0.00013241171836853027, 0.00015258044004440308, 0.00017274916172027588, 0.00019291788339614868, 0.00021308660507202148, 0.0002332553267478943, 0.0002534240484237671, 0.0002735927700996399, 0.0002937614917755127, 0.0003139302134513855, 0.0003340989351272583, 0.0003542676568031311, 0.0003744363784790039, 0.0003946051001548767, 0.0004147738218307495, 0.0004349425435066223, 0.0004551112651824951, 0.0004752799868583679, 0.0004954487085342407, 0.0005156174302101135, 0.0005357861518859863, 0.0005559548735618591, 0.0005761235952377319, 0.0005962923169136047, 0.0006164610385894775, 0.0006366297602653503, 0.0006567984819412231, 0.000676967203617096, 0.0006971359252929688]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 4.0, 3.0, 7.0, 7.0, 16.0, 17.0, 25.0, 45.0, 88.0, 168.0, 324.0, 771.0, 1837.0, 5914.0, 30137.0, 346579.0, 596100.0, 53706.0, 8575.0, 2471.0, 898.0, 407.0, 215.0, 93.0, 54.0, 38.0, 13.0, 16.0, 11.0, 7.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28515625, -7.03509521484375, -6.7850341796875, -6.53497314453125, -6.284912109375, -6.03485107421875, -5.7847900390625, -5.53472900390625, -5.28466796875, -5.03460693359375, -4.7845458984375, -4.53448486328125, -4.284423828125, -4.03436279296875, -3.7843017578125, -3.53424072265625, -3.2841796875, -3.03411865234375, -2.7840576171875, -2.53399658203125, -2.283935546875, -2.03387451171875, -1.7838134765625, -1.53375244140625, -1.28369140625, -1.03363037109375, -0.7835693359375, -0.53350830078125, -0.283447265625, -0.03338623046875, 0.2166748046875, 0.46673583984375, 0.716796875, 0.96685791015625, 1.2169189453125, 1.46697998046875, 1.717041015625, 1.96710205078125, 2.2171630859375, 2.46722412109375, 2.71728515625, 2.96734619140625, 3.2174072265625, 3.46746826171875, 3.717529296875, 3.96759033203125, 4.2176513671875, 4.46771240234375, 4.7177734375, 4.96783447265625, 5.2178955078125, 5.46795654296875, 5.718017578125, 5.96807861328125, 6.2181396484375, 6.46820068359375, 6.71826171875, 6.96832275390625, 7.2183837890625, 7.46844482421875, 7.718505859375, 7.96856689453125, 8.2186279296875, 8.46868896484375, 8.71875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 5.0, 2.0, 6.0, 14.0, 17.0, 18.0, 18.0, 26.0, 34.0, 55.0, 56.0, 68.0, 59.0, 93.0, 79.0, 84.0, 60.0, 70.0, 49.0, 32.0, 38.0, 26.0, 27.0, 15.0, 11.0, 3.0, 8.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.936279296875, -3.78662109375, -3.636962890625, -3.4873046875, -3.337646484375, -3.18798828125, -3.038330078125, -2.888671875, -2.739013671875, -2.58935546875, -2.439697265625, -2.2900390625, -2.140380859375, -1.99072265625, -1.841064453125, -1.69140625, -1.541748046875, -1.39208984375, -1.242431640625, -1.0927734375, -0.943115234375, -0.79345703125, -0.643798828125, -0.494140625, -0.344482421875, -0.19482421875, -0.045166015625, 0.1044921875, 0.254150390625, 0.40380859375, 0.553466796875, 0.703125, 0.852783203125, 1.00244140625, 1.152099609375, 1.3017578125, 1.451416015625, 1.60107421875, 1.750732421875, 1.900390625, 2.050048828125, 2.19970703125, 2.349365234375, 2.4990234375, 2.648681640625, 2.79833984375, 2.947998046875, 3.09765625, 3.247314453125, 3.39697265625, 3.546630859375, 3.6962890625, 3.845947265625, 3.99560546875, 4.145263671875, 4.294921875, 4.444580078125, 4.59423828125, 4.743896484375, 4.8935546875, 5.043212890625, 5.19287109375, 5.342529296875, 5.4921875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 22.0, 107.0, 263.0, 319.0, 190.0, 81.0, 11.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-100.46893310546875, -94.2789077758789, -88.0888900756836, -81.89886474609375, -75.7088394165039, -69.51881408691406, -63.32879638671875, -57.138771057128906, -50.94874954223633, -44.75872802734375, -38.568702697753906, -32.37868118286133, -26.188657760620117, -19.998634338378906, -13.808612823486328, -7.618587493896484, -1.4285659790039062, 4.7614569664001465, 10.9514799118042, 17.141502380371094, 23.331525802612305, 29.521549224853516, 35.711570739746094, 41.90159606933594, 48.091617584228516, 54.281639099121094, 60.47166442871094, 66.66168212890625, 72.8517074584961, 79.04173278808594, 85.23175048828125, 91.42178344726562, 97.61180114746094, 103.80182647705078, 109.9918441772461, 116.18186950683594, 122.37189483642578, 128.56192016601562, 134.75193786621094, 140.94195556640625, 147.13198852539062, 153.32200622558594, 159.5120391845703, 165.70205688476562, 171.89207458496094, 178.0821075439453, 184.27212524414062, 190.462158203125, 196.65216064453125, 202.84217834472656, 209.03221130371094, 215.22222900390625, 221.41224670410156, 227.60227966308594, 233.79229736328125, 239.98233032226562, 246.17234802246094, 252.36236572265625, 258.5523986816406, 264.742431640625, 270.93243408203125, 277.1224670410156, 283.3125, 289.50250244140625, 295.6925354003906]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 10.0, 17.0, 12.0, 12.0, 15.0, 19.0, 7.0, 16.0, 22.0, 14.0, 24.0, 35.0, 24.0, 39.0, 35.0, 38.0, 42.0, 39.0, 36.0, 62.0, 50.0, 40.0, 47.0, 32.0, 38.0, 27.0, 34.0, 24.0, 18.0, 29.0, 21.0, 10.0, 19.0, 9.0, 15.0, 6.0, 12.0, 9.0, 9.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-49.288211822509766, -47.75959396362305, -46.23097610473633, -44.70235824584961, -43.17374038696289, -41.64512252807617, -40.11650848388672, -38.587890625, -37.05927276611328, -35.53065490722656, -34.002037048339844, -32.473419189453125, -30.944801330566406, -29.416183471679688, -27.8875675201416, -26.358949661254883, -24.83032989501953, -23.301712036132812, -21.773094177246094, -20.244476318359375, -18.715858459472656, -17.187240600585938, -15.658624649047852, -14.130006790161133, -12.601388931274414, -11.072771072387695, -9.544153213500977, -8.015536308288574, -6.4869184494018555, -4.958300590515137, -3.4296836853027344, -1.9010658264160156, -0.3724517822265625, 1.1561658382415771, 2.684783458709717, 4.213400840759277, 5.742018699645996, 7.270636558532715, 8.799253463745117, 10.327871322631836, 11.856489181518555, 13.385107040405273, 14.913724899291992, 16.442340850830078, 17.970958709716797, 19.499576568603516, 21.028194427490234, 22.556812286376953, 24.085430145263672, 25.61404800415039, 27.14266586303711, 28.671283721923828, 30.199901580810547, 31.728519439697266, 33.25713348388672, 34.78575134277344, 36.314369201660156, 37.842987060546875, 39.371604919433594, 40.90022277832031, 42.42884063720703, 43.95745849609375, 45.48607635498047, 47.01469421386719, 48.543312072753906]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 6.0, 7.0, 10.0, 14.0, 26.0, 31.0, 28.0, 45.0, 73.0, 85.0, 151.0, 175.0, 308.0, 460.0, 851.0, 1583.0, 3373.0, 8819.0, 31727.0, 251785.0, 3804673.0, 65143.0, 14652.0, 5095.0, 2197.0, 1128.0, 634.0, 388.0, 251.0, 169.0, 107.0, 65.0, 63.0, 29.0, 32.0, 20.0, 19.0, 12.0, 7.0, 10.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-12.5234375, -12.1678466796875, -11.812255859375, -11.4566650390625, -11.10107421875, -10.7454833984375, -10.389892578125, -10.0343017578125, -9.6787109375, -9.3231201171875, -8.967529296875, -8.6119384765625, -8.25634765625, -7.9007568359375, -7.545166015625, -7.1895751953125, -6.833984375, -6.4783935546875, -6.122802734375, -5.7672119140625, -5.41162109375, -5.0560302734375, -4.700439453125, -4.3448486328125, -3.9892578125, -3.6336669921875, -3.278076171875, -2.9224853515625, -2.56689453125, -2.2113037109375, -1.855712890625, -1.5001220703125, -1.14453125, -0.7889404296875, -0.433349609375, -0.0777587890625, 0.27783203125, 0.6334228515625, 0.989013671875, 1.3446044921875, 1.7001953125, 2.0557861328125, 2.411376953125, 2.7669677734375, 3.12255859375, 3.4781494140625, 3.833740234375, 4.1893310546875, 4.544921875, 4.9005126953125, 5.256103515625, 5.6116943359375, 5.96728515625, 6.3228759765625, 6.678466796875, 7.0340576171875, 7.3896484375, 7.7452392578125, 8.100830078125, 8.4564208984375, 8.81201171875, 9.1676025390625, 9.523193359375, 9.8787841796875, 10.234375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 10.0, 9.0, 13.0, 12.0, 10.0, 9.0, 16.0, 19.0, 26.0, 23.0, 36.0, 44.0, 36.0, 41.0, 54.0, 55.0, 59.0, 57.0, 34.0, 60.0, 41.0, 33.0, 49.0, 40.0, 29.0, 22.0, 22.0, 19.0, 20.0, 20.0, 16.0, 9.0, 9.0, 6.0, 5.0, 5.0, 6.0, 4.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.12109375, -2.0571746826171875, -1.993255615234375, -1.9293365478515625, -1.86541748046875, -1.8014984130859375, -1.737579345703125, -1.6736602783203125, -1.6097412109375, -1.5458221435546875, -1.481903076171875, -1.4179840087890625, -1.35406494140625, -1.2901458740234375, -1.226226806640625, -1.1623077392578125, -1.098388671875, -1.0344696044921875, -0.970550537109375, -0.9066314697265625, -0.84271240234375, -0.7787933349609375, -0.714874267578125, -0.6509552001953125, -0.5870361328125, -0.5231170654296875, -0.459197998046875, -0.3952789306640625, -0.33135986328125, -0.2674407958984375, -0.203521728515625, -0.1396026611328125, -0.07568359375, -0.0117645263671875, 0.052154541015625, 0.1160736083984375, 0.17999267578125, 0.2439117431640625, 0.307830810546875, 0.3717498779296875, 0.4356689453125, 0.4995880126953125, 0.563507080078125, 0.6274261474609375, 0.69134521484375, 0.7552642822265625, 0.819183349609375, 0.8831024169921875, 0.947021484375, 1.0109405517578125, 1.074859619140625, 1.1387786865234375, 1.20269775390625, 1.2666168212890625, 1.330535888671875, 1.3944549560546875, 1.4583740234375, 1.5222930908203125, 1.586212158203125, 1.6501312255859375, 1.71405029296875, 1.7779693603515625, 1.841888427734375, 1.9058074951171875, 1.9697265625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 9.0, 9.0, 12.0, 6.0, 10.0, 19.0, 30.0, 43.0, 53.0, 86.0, 122.0, 202.0, 299.0, 462.0, 751.0, 1318.0, 2415.0, 4744.0, 10583.0, 29326.0, 125003.0, 3687783.0, 259177.0, 44623.0, 14073.0, 5940.0, 2999.0, 1685.0, 885.0, 609.0, 329.0, 240.0, 129.0, 95.0, 59.0, 39.0, 31.0, 21.0, 21.0, 14.0, 5.0, 4.0, 5.0, 4.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0], "bins": [-9.953125, -9.6484375, -9.34375, -9.0390625, -8.734375, -8.4296875, -8.125, -7.8203125, -7.515625, -7.2109375, -6.90625, -6.6015625, -6.296875, -5.9921875, -5.6875, -5.3828125, -5.078125, -4.7734375, -4.46875, -4.1640625, -3.859375, -3.5546875, -3.25, -2.9453125, -2.640625, -2.3359375, -2.03125, -1.7265625, -1.421875, -1.1171875, -0.8125, -0.5078125, -0.203125, 0.1015625, 0.40625, 0.7109375, 1.015625, 1.3203125, 1.625, 1.9296875, 2.234375, 2.5390625, 2.84375, 3.1484375, 3.453125, 3.7578125, 4.0625, 4.3671875, 4.671875, 4.9765625, 5.28125, 5.5859375, 5.890625, 6.1953125, 6.5, 6.8046875, 7.109375, 7.4140625, 7.71875, 8.0234375, 8.328125, 8.6328125, 8.9375, 9.2421875, 9.546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 9.0, 9.0, 13.0, 22.0, 28.0, 39.0, 77.0, 147.0, 462.0, 2733.0, 230.0, 108.0, 69.0, 30.0, 27.0, 13.0, 17.0, 13.0, 5.0, 9.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.17578125, -2.086151123046875, -1.99652099609375, -1.906890869140625, -1.8172607421875, -1.727630615234375, -1.63800048828125, -1.548370361328125, -1.458740234375, -1.369110107421875, -1.27947998046875, -1.189849853515625, -1.1002197265625, -1.010589599609375, -0.92095947265625, -0.831329345703125, -0.74169921875, -0.652069091796875, -0.56243896484375, -0.472808837890625, -0.3831787109375, -0.293548583984375, -0.20391845703125, -0.114288330078125, -0.024658203125, 0.064971923828125, 0.15460205078125, 0.244232177734375, 0.3338623046875, 0.423492431640625, 0.51312255859375, 0.602752685546875, 0.6923828125, 0.782012939453125, 0.87164306640625, 0.961273193359375, 1.0509033203125, 1.140533447265625, 1.23016357421875, 1.319793701171875, 1.409423828125, 1.499053955078125, 1.58868408203125, 1.678314208984375, 1.7679443359375, 1.857574462890625, 1.94720458984375, 2.036834716796875, 2.12646484375, 2.216094970703125, 2.30572509765625, 2.395355224609375, 2.4849853515625, 2.574615478515625, 2.66424560546875, 2.753875732421875, 2.843505859375, 2.933135986328125, 3.02276611328125, 3.112396240234375, 3.2020263671875, 3.291656494140625, 3.38128662109375, 3.470916748046875, 3.560546875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 6.0, 11.0, 31.0, 39.0, 54.0, 81.0, 102.0, 119.0, 128.0, 130.0, 104.0, 80.0, 44.0, 27.0, 16.0, 10.0, 10.0, 0.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.040060997009277, -7.573615550994873, -7.107170104980469, -6.640725135803223, -6.174279689788818, -5.707834243774414, -5.241389274597168, -4.774943828582764, -4.308498382568359, -3.842052936553955, -3.37560772895813, -2.9091625213623047, -2.4427170753479004, -1.976271629333496, -1.509826421737671, -1.0433812141418457, -0.5769357681274414, -0.11049044132232666, 0.3559548854827881, 0.8224002122879028, 1.2888455390930176, 1.7552909851074219, 2.221736192703247, 2.6881814002990723, 3.1546268463134766, 3.621072292327881, 4.087517738342285, 4.553962707519531, 5.0204081535339355, 5.48685359954834, 5.953298568725586, 6.41974401473999, 6.886190414428711, 7.352635860443115, 7.8190813064575195, 8.285526275634766, 8.751972198486328, 9.218417167663574, 9.68486213684082, 10.151308059692383, 10.617753028869629, 11.084197998046875, 11.550643920898438, 12.017088890075684, 12.48353385925293, 12.949979782104492, 13.416424751281738, 13.882869720458984, 14.349315643310547, 14.815760612487793, 15.282206535339355, 15.748651504516602, 16.215097427368164, 16.681541442871094, 17.147987365722656, 17.61443328857422, 18.08087921142578, 18.547325134277344, 19.013769149780273, 19.480215072631836, 19.9466609954834, 20.413105010986328, 20.87955093383789, 21.345996856689453, 21.812440872192383]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 11.0, 12.0, 16.0, 24.0, 13.0, 22.0, 22.0, 23.0, 36.0, 39.0, 41.0, 34.0, 45.0, 42.0, 45.0, 48.0, 35.0, 37.0, 51.0, 47.0, 47.0, 38.0, 40.0, 35.0, 37.0, 33.0, 21.0, 14.0, 15.0, 14.0, 13.0, 3.0, 3.0, 9.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.148445129394531, -6.9387922286987305, -6.72913932800293, -6.519486427307129, -6.309833526611328, -6.100180625915527, -5.890527725219727, -5.680874824523926, -5.471221923828125, -5.261569023132324, -5.051916122436523, -4.842263221740723, -4.632610321044922, -4.422957420349121, -4.21330451965332, -4.0036516189575195, -3.793998956680298, -3.584346055984497, -3.3746931552886963, -3.1650402545928955, -2.9553873538970947, -2.745734691619873, -2.5360817909240723, -2.3264288902282715, -2.1167759895324707, -1.90712308883667, -1.6974701881408691, -1.4878172874450684, -1.2781643867492676, -1.0685116052627563, -0.8588587045669556, -0.6492058038711548, -0.43955278396606445, -0.22989989817142487, -0.02024701237678528, 0.18940585851669312, 0.3990587592124939, 0.6087116003036499, 0.8183645009994507, 1.0280174016952515, 1.2376703023910522, 1.447323203086853, 1.6569761037826538, 1.866628885269165, 2.076281785964966, 2.2859346866607666, 2.4955875873565674, 2.705240488052368, 2.914893388748169, 3.1245462894439697, 3.3341991901397705, 3.5438520908355713, 3.753504991531372, 3.9631576538085938, 4.1728105545043945, 4.382463455200195, 4.592116355895996, 4.801769256591797, 5.011422157287598, 5.221075057983398, 5.430727958679199, 5.640380859375, 5.850033760070801, 6.059686660766602, 6.269339561462402]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 7.0, 3.0, 11.0, 13.0, 13.0, 30.0, 33.0, 55.0, 78.0, 140.0, 201.0, 343.0, 519.0, 903.0, 1467.0, 2513.0, 4355.0, 7528.0, 13336.0, 24002.0, 42488.0, 73196.0, 118966.0, 169632.0, 189221.0, 154154.0, 102564.0, 61494.0, 35205.0, 19772.0, 11234.0, 6228.0, 3587.0, 2080.0, 1219.0, 744.0, 463.0, 267.0, 171.0, 121.0, 58.0, 43.0, 37.0, 24.0, 16.0, 6.0, 4.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-2.845703125, -2.7548828125, -2.6640625, -2.5732421875, -2.482421875, -2.3916015625, -2.30078125, -2.2099609375, -2.119140625, -2.0283203125, -1.9375, -1.8466796875, -1.755859375, -1.6650390625, -1.57421875, -1.4833984375, -1.392578125, -1.3017578125, -1.2109375, -1.1201171875, -1.029296875, -0.9384765625, -0.84765625, -0.7568359375, -0.666015625, -0.5751953125, -0.484375, -0.3935546875, -0.302734375, -0.2119140625, -0.12109375, -0.0302734375, 0.060546875, 0.1513671875, 0.2421875, 0.3330078125, 0.423828125, 0.5146484375, 0.60546875, 0.6962890625, 0.787109375, 0.8779296875, 0.96875, 1.0595703125, 1.150390625, 1.2412109375, 1.33203125, 1.4228515625, 1.513671875, 1.6044921875, 1.6953125, 1.7861328125, 1.876953125, 1.9677734375, 2.05859375, 2.1494140625, 2.240234375, 2.3310546875, 2.421875, 2.5126953125, 2.603515625, 2.6943359375, 2.78515625, 2.8759765625, 2.966796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 4.0, 6.0, 9.0, 9.0, 11.0, 18.0, 16.0, 16.0, 24.0, 27.0, 30.0, 35.0, 32.0, 42.0, 50.0, 57.0, 59.0, 55.0, 56.0, 69.0, 40.0, 38.0, 39.0, 35.0, 45.0, 35.0, 28.0, 27.0, 23.0, 14.0, 13.0, 5.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.16632080078125, -2.0904541015625, -2.01458740234375, -1.938720703125, -1.86285400390625, -1.7869873046875, -1.71112060546875, -1.63525390625, -1.55938720703125, -1.4835205078125, -1.40765380859375, -1.331787109375, -1.25592041015625, -1.1800537109375, -1.10418701171875, -1.0283203125, -0.95245361328125, -0.8765869140625, -0.80072021484375, -0.724853515625, -0.64898681640625, -0.5731201171875, -0.49725341796875, -0.42138671875, -0.34552001953125, -0.2696533203125, -0.19378662109375, -0.117919921875, -0.04205322265625, 0.0338134765625, 0.10968017578125, 0.185546875, 0.26141357421875, 0.3372802734375, 0.41314697265625, 0.489013671875, 0.56488037109375, 0.6407470703125, 0.71661376953125, 0.79248046875, 0.86834716796875, 0.9442138671875, 1.02008056640625, 1.095947265625, 1.17181396484375, 1.2476806640625, 1.32354736328125, 1.3994140625, 1.47528076171875, 1.5511474609375, 1.62701416015625, 1.702880859375, 1.77874755859375, 1.8546142578125, 1.93048095703125, 2.00634765625, 2.08221435546875, 2.1580810546875, 2.23394775390625, 2.309814453125, 2.38568115234375, 2.4615478515625, 2.53741455078125, 2.61328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 7.0, 6.0, 14.0, 8.0, 8.0, 20.0, 28.0, 40.0, 66.0, 62.0, 81.0, 114.0, 141.0, 213.0, 348.0, 493.0, 769.0, 1360.0, 3205.0, 13173.0, 102252.0, 655854.0, 235639.0, 25024.0, 5019.0, 1803.0, 869.0, 531.0, 376.0, 280.0, 191.0, 136.0, 117.0, 73.0, 48.0, 41.0, 40.0, 15.0, 26.0, 15.0, 9.0, 6.0, 6.0, 8.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.96875, -9.643798828125, -9.31884765625, -8.993896484375, -8.6689453125, -8.343994140625, -8.01904296875, -7.694091796875, -7.369140625, -7.044189453125, -6.71923828125, -6.394287109375, -6.0693359375, -5.744384765625, -5.41943359375, -5.094482421875, -4.76953125, -4.444580078125, -4.11962890625, -3.794677734375, -3.4697265625, -3.144775390625, -2.81982421875, -2.494873046875, -2.169921875, -1.844970703125, -1.52001953125, -1.195068359375, -0.8701171875, -0.545166015625, -0.22021484375, 0.104736328125, 0.4296875, 0.754638671875, 1.07958984375, 1.404541015625, 1.7294921875, 2.054443359375, 2.37939453125, 2.704345703125, 3.029296875, 3.354248046875, 3.67919921875, 4.004150390625, 4.3291015625, 4.654052734375, 4.97900390625, 5.303955078125, 5.62890625, 5.953857421875, 6.27880859375, 6.603759765625, 6.9287109375, 7.253662109375, 7.57861328125, 7.903564453125, 8.228515625, 8.553466796875, 8.87841796875, 9.203369140625, 9.5283203125, 9.853271484375, 10.17822265625, 10.503173828125, 10.828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 6.0, 7.0, 11.0, 8.0, 14.0, 21.0, 24.0, 22.0, 23.0, 21.0, 29.0, 38.0, 46.0, 32.0, 41.0, 53.0, 45.0, 41.0, 43.0, 34.0, 37.0, 32.0, 35.0, 51.0, 29.0, 47.0, 35.0, 25.0, 16.0, 21.0, 13.0, 28.0, 18.0, 12.0, 5.0, 5.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.90625, -9.5888671875, -9.271484375, -8.9541015625, -8.63671875, -8.3193359375, -8.001953125, -7.6845703125, -7.3671875, -7.0498046875, -6.732421875, -6.4150390625, -6.09765625, -5.7802734375, -5.462890625, -5.1455078125, -4.828125, -4.5107421875, -4.193359375, -3.8759765625, -3.55859375, -3.2412109375, -2.923828125, -2.6064453125, -2.2890625, -1.9716796875, -1.654296875, -1.3369140625, -1.01953125, -0.7021484375, -0.384765625, -0.0673828125, 0.25, 0.5673828125, 0.884765625, 1.2021484375, 1.51953125, 1.8369140625, 2.154296875, 2.4716796875, 2.7890625, 3.1064453125, 3.423828125, 3.7412109375, 4.05859375, 4.3759765625, 4.693359375, 5.0107421875, 5.328125, 5.6455078125, 5.962890625, 6.2802734375, 6.59765625, 6.9150390625, 7.232421875, 7.5498046875, 7.8671875, 8.1845703125, 8.501953125, 8.8193359375, 9.13671875, 9.4541015625, 9.771484375, 10.0888671875, 10.40625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 9.0, 2.0, 11.0, 15.0, 25.0, 45.0, 77.0, 137.0, 265.0, 659.0, 2172.0, 13492.0, 261851.0, 722542.0, 41315.0, 3991.0, 1084.0, 401.0, 224.0, 94.0, 59.0, 27.0, 16.0, 16.0, 7.0, 6.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8359375, -6.584716796875, -6.33349609375, -6.082275390625, -5.8310546875, -5.579833984375, -5.32861328125, -5.077392578125, -4.826171875, -4.574951171875, -4.32373046875, -4.072509765625, -3.8212890625, -3.570068359375, -3.31884765625, -3.067626953125, -2.81640625, -2.565185546875, -2.31396484375, -2.062744140625, -1.8115234375, -1.560302734375, -1.30908203125, -1.057861328125, -0.806640625, -0.555419921875, -0.30419921875, -0.052978515625, 0.1982421875, 0.449462890625, 0.70068359375, 0.951904296875, 1.203125, 1.454345703125, 1.70556640625, 1.956787109375, 2.2080078125, 2.459228515625, 2.71044921875, 2.961669921875, 3.212890625, 3.464111328125, 3.71533203125, 3.966552734375, 4.2177734375, 4.468994140625, 4.72021484375, 4.971435546875, 5.22265625, 5.473876953125, 5.72509765625, 5.976318359375, 6.2275390625, 6.478759765625, 6.72998046875, 6.981201171875, 7.232421875, 7.483642578125, 7.73486328125, 7.986083984375, 8.2373046875, 8.488525390625, 8.73974609375, 8.990966796875, 9.2421875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 3.0, 9.0, 6.0, 10.0, 18.0, 17.0, 25.0, 30.0, 41.0, 47.0, 38.0, 56.0, 71.0, 88.0, 87.0, 70.0, 73.0, 56.0, 52.0, 37.0, 32.0, 21.0, 26.0, 23.0, 11.0, 13.0, 8.0, 7.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005917549133300781, -0.0005691573023796082, -0.0005465596914291382, -0.0005239620804786682, -0.0005013644695281982, -0.00047876685857772827, -0.0004561692476272583, -0.00043357163667678833, -0.00041097402572631836, -0.0003883764147758484, -0.0003657788038253784, -0.00034318119287490845, -0.0003205835819244385, -0.0002979859709739685, -0.00027538836002349854, -0.00025279074907302856, -0.0002301931381225586, -0.00020759552717208862, -0.00018499791622161865, -0.00016240030527114868, -0.0001398026943206787, -0.00011720508337020874, -9.460747241973877e-05, -7.20098614692688e-05, -4.941225051879883e-05, -2.6814639568328857e-05, -4.217028617858887e-06, 1.8380582332611084e-05, 4.0978193283081055e-05, 6.357580423355103e-05, 8.6173415184021e-05, 0.00010877102613449097, 0.00013136863708496094, 0.0001539662480354309, 0.00017656385898590088, 0.00019916146993637085, 0.00022175908088684082, 0.0002443566918373108, 0.00026695430278778076, 0.00028955191373825073, 0.0003121495246887207, 0.0003347471356391907, 0.00035734474658966064, 0.0003799423575401306, 0.0004025399684906006, 0.00042513757944107056, 0.00044773519039154053, 0.0004703328013420105, 0.0004929304122924805, 0.0005155280232429504, 0.0005381256341934204, 0.0005607232451438904, 0.0005833208560943604, 0.0006059184670448303, 0.0006285160779953003, 0.0006511136889457703, 0.0006737112998962402, 0.0006963089108467102, 0.0007189065217971802, 0.0007415041327476501, 0.0007641017436981201, 0.0007866993546485901, 0.0008092969655990601, 0.00083189457654953, 0.0008544921875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 7.0, 8.0, 12.0, 30.0, 71.0, 156.0, 360.0, 1025.0, 4922.0, 138653.0, 876302.0, 23615.0, 2313.0, 651.0, 243.0, 89.0, 44.0, 21.0, 14.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.03125, -13.664794921875, -13.29833984375, -12.931884765625, -12.5654296875, -12.198974609375, -11.83251953125, -11.466064453125, -11.099609375, -10.733154296875, -10.36669921875, -10.000244140625, -9.6337890625, -9.267333984375, -8.90087890625, -8.534423828125, -8.16796875, -7.801513671875, -7.43505859375, -7.068603515625, -6.7021484375, -6.335693359375, -5.96923828125, -5.602783203125, -5.236328125, -4.869873046875, -4.50341796875, -4.136962890625, -3.7705078125, -3.404052734375, -3.03759765625, -2.671142578125, -2.3046875, -1.938232421875, -1.57177734375, -1.205322265625, -0.8388671875, -0.472412109375, -0.10595703125, 0.260498046875, 0.626953125, 0.993408203125, 1.35986328125, 1.726318359375, 2.0927734375, 2.459228515625, 2.82568359375, 3.192138671875, 3.55859375, 3.925048828125, 4.29150390625, 4.657958984375, 5.0244140625, 5.390869140625, 5.75732421875, 6.123779296875, 6.490234375, 6.856689453125, 7.22314453125, 7.589599609375, 7.9560546875, 8.322509765625, 8.68896484375, 9.055419921875, 9.421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 9.0, 18.0, 26.0, 34.0, 83.0, 110.0, 143.0, 164.0, 140.0, 111.0, 68.0, 36.0, 27.0, 13.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.7972412109375, -7.531982421875, -7.2667236328125, -7.00146484375, -6.7362060546875, -6.470947265625, -6.2056884765625, -5.9404296875, -5.6751708984375, -5.409912109375, -5.1446533203125, -4.87939453125, -4.6141357421875, -4.348876953125, -4.0836181640625, -3.818359375, -3.5531005859375, -3.287841796875, -3.0225830078125, -2.75732421875, -2.4920654296875, -2.226806640625, -1.9615478515625, -1.6962890625, -1.4310302734375, -1.165771484375, -0.9005126953125, -0.63525390625, -0.3699951171875, -0.104736328125, 0.1605224609375, 0.42578125, 0.6910400390625, 0.956298828125, 1.2215576171875, 1.48681640625, 1.7520751953125, 2.017333984375, 2.2825927734375, 2.5478515625, 2.8131103515625, 3.078369140625, 3.3436279296875, 3.60888671875, 3.8741455078125, 4.139404296875, 4.4046630859375, 4.669921875, 4.9351806640625, 5.200439453125, 5.4656982421875, 5.73095703125, 5.9962158203125, 6.261474609375, 6.5267333984375, 6.7919921875, 7.0572509765625, 7.322509765625, 7.5877685546875, 7.85302734375, 8.1182861328125, 8.383544921875, 8.6488037109375, 8.9140625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 12.0, 20.0, 59.0, 140.0, 243.0, 245.0, 170.0, 72.0, 29.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.7281494140625, -47.39817428588867, -43.06819534301758, -38.73822021484375, -34.408241271972656, -30.078266143798828, -25.748291015625, -21.41831398010254, -17.088336944580078, -12.758359909057617, -8.428383827209473, -4.098407745361328, 0.2315692901611328, 4.561546325683594, 8.891521453857422, 13.221498489379883, 17.551475524902344, 21.881452560424805, 26.211429595947266, 30.541404724121094, 34.87138366699219, 39.201358795166016, 43.531333923339844, 47.86131286621094, 52.191287994384766, 56.521263122558594, 60.85124206542969, 65.18121337890625, 69.51119232177734, 73.84117126464844, 78.171142578125, 82.5011215209961, 86.83110046386719, 91.16107940673828, 95.49105072021484, 99.82102966308594, 104.15100860595703, 108.48098754882812, 112.81095886230469, 117.14093780517578, 121.47091674804688, 125.80089569091797, 130.13087463378906, 134.46084594726562, 138.7908172607422, 143.1208038330078, 147.45077514648438, 151.78074645996094, 156.1107177734375, 160.44068908691406, 164.7706756591797, 169.10064697265625, 173.4306182861328, 177.76060485839844, 182.090576171875, 186.42054748535156, 190.7505340576172, 195.08050537109375, 199.41049194335938, 203.74046325683594, 208.0704345703125, 212.40042114257812, 216.7303924560547, 221.06036376953125, 225.39035034179688]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 1.0, 5.0, 6.0, 8.0, 5.0, 12.0, 16.0, 13.0, 19.0, 23.0, 38.0, 37.0, 38.0, 47.0, 56.0, 53.0, 54.0, 59.0, 67.0, 58.0, 53.0, 43.0, 48.0, 35.0, 36.0, 32.0, 22.0, 19.0, 26.0, 11.0, 16.0, 12.0, 10.0, 6.0, 4.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.68544387817383, -55.88404083251953, -54.08263397216797, -52.28123092651367, -50.479827880859375, -48.67842483520508, -46.87702178955078, -45.07561492919922, -43.27421188354492, -41.472808837890625, -39.67140197753906, -37.869998931884766, -36.06859588623047, -34.26719284057617, -32.465789794921875, -30.664382934570312, -28.862979888916016, -27.06157684326172, -25.26017189025879, -23.45876693725586, -21.657363891601562, -19.855960845947266, -18.054555892944336, -16.253150939941406, -14.45174789428711, -12.650343894958496, -10.848939895629883, -9.04753589630127, -7.246131896972656, -5.444727897644043, -3.6433238983154297, -1.8419198989868164, -0.04051971435546875, 1.7608842849731445, 3.562288284301758, 5.363692283630371, 7.165096282958984, 8.966500282287598, 10.767904281616211, 12.569308280944824, 14.370712280273438, 16.172115325927734, 17.973520278930664, 19.774925231933594, 21.57632827758789, 23.377731323242188, 25.179136276245117, 26.980541229248047, 28.781944274902344, 30.58334732055664, 32.38475036621094, 34.1861572265625, 35.9875602722168, 37.788963317871094, 39.590370178222656, 41.39177322387695, 43.19317626953125, 44.99457931518555, 46.795982360839844, 48.597389221191406, 50.3987922668457, 52.2001953125, 54.00160217285156, 55.80300521850586, 57.604408264160156]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 6.0, 6.0, 10.0, 12.0, 17.0, 26.0, 34.0, 56.0, 71.0, 95.0, 141.0, 208.0, 365.0, 535.0, 837.0, 1587.0, 2756.0, 5737.0, 13439.0, 40741.0, 659353.0, 3398746.0, 42934.0, 13707.0, 5782.0, 2931.0, 1607.0, 919.0, 528.0, 379.0, 231.0, 149.0, 91.0, 62.0, 49.0, 35.0, 30.0, 15.0, 11.0, 11.0, 5.0, 6.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-8.3359375, -8.08343505859375, -7.8309326171875, -7.57843017578125, -7.325927734375, -7.07342529296875, -6.8209228515625, -6.56842041015625, -6.31591796875, -6.06341552734375, -5.8109130859375, -5.55841064453125, -5.305908203125, -5.05340576171875, -4.8009033203125, -4.54840087890625, -4.2958984375, -4.04339599609375, -3.7908935546875, -3.53839111328125, -3.285888671875, -3.03338623046875, -2.7808837890625, -2.52838134765625, -2.27587890625, -2.02337646484375, -1.7708740234375, -1.51837158203125, -1.265869140625, -1.01336669921875, -0.7608642578125, -0.50836181640625, -0.255859375, -0.00335693359375, 0.2491455078125, 0.50164794921875, 0.754150390625, 1.00665283203125, 1.2591552734375, 1.51165771484375, 1.76416015625, 2.01666259765625, 2.2691650390625, 2.52166748046875, 2.774169921875, 3.02667236328125, 3.2791748046875, 3.53167724609375, 3.7841796875, 4.03668212890625, 4.2891845703125, 4.54168701171875, 4.794189453125, 5.04669189453125, 5.2991943359375, 5.55169677734375, 5.80419921875, 6.05670166015625, 6.3092041015625, 6.56170654296875, 6.814208984375, 7.06671142578125, 7.3192138671875, 7.57171630859375, 7.82421875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 5.0, 4.0, 5.0, 11.0, 14.0, 10.0, 6.0, 16.0, 15.0, 16.0, 26.0, 27.0, 46.0, 35.0, 46.0, 59.0, 64.0, 74.0, 55.0, 41.0, 55.0, 58.0, 53.0, 34.0, 50.0, 27.0, 23.0, 29.0, 21.0, 18.0, 13.0, 11.0, 12.0, 9.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.6875, -2.60540771484375, -2.5233154296875, -2.44122314453125, -2.359130859375, -2.27703857421875, -2.1949462890625, -2.11285400390625, -2.03076171875, -1.94866943359375, -1.8665771484375, -1.78448486328125, -1.702392578125, -1.62030029296875, -1.5382080078125, -1.45611572265625, -1.3740234375, -1.29193115234375, -1.2098388671875, -1.12774658203125, -1.045654296875, -0.96356201171875, -0.8814697265625, -0.79937744140625, -0.71728515625, -0.63519287109375, -0.5531005859375, -0.47100830078125, -0.388916015625, -0.30682373046875, -0.2247314453125, -0.14263916015625, -0.060546875, 0.02154541015625, 0.1036376953125, 0.18572998046875, 0.267822265625, 0.34991455078125, 0.4320068359375, 0.51409912109375, 0.59619140625, 0.67828369140625, 0.7603759765625, 0.84246826171875, 0.924560546875, 1.00665283203125, 1.0887451171875, 1.17083740234375, 1.2529296875, 1.33502197265625, 1.4171142578125, 1.49920654296875, 1.581298828125, 1.66339111328125, 1.7454833984375, 1.82757568359375, 1.90966796875, 1.99176025390625, 2.0738525390625, 2.15594482421875, 2.238037109375, 2.32012939453125, 2.4022216796875, 2.48431396484375, 2.56640625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 6.0, 12.0, 10.0, 19.0, 20.0, 19.0, 31.0, 34.0, 50.0, 51.0, 85.0, 140.0, 161.0, 238.0, 343.0, 645.0, 950.0, 1797.0, 4506.0, 14953.0, 92733.0, 3971806.0, 82910.0, 14074.0, 4166.0, 1747.0, 963.0, 545.0, 344.0, 213.0, 179.0, 126.0, 96.0, 95.0, 53.0, 32.0, 30.0, 25.0, 19.0, 12.0, 11.0, 10.0, 9.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-13.1640625, -12.745849609375, -12.32763671875, -11.909423828125, -11.4912109375, -11.072998046875, -10.65478515625, -10.236572265625, -9.818359375, -9.400146484375, -8.98193359375, -8.563720703125, -8.1455078125, -7.727294921875, -7.30908203125, -6.890869140625, -6.47265625, -6.054443359375, -5.63623046875, -5.218017578125, -4.7998046875, -4.381591796875, -3.96337890625, -3.545166015625, -3.126953125, -2.708740234375, -2.29052734375, -1.872314453125, -1.4541015625, -1.035888671875, -0.61767578125, -0.199462890625, 0.21875, 0.636962890625, 1.05517578125, 1.473388671875, 1.8916015625, 2.309814453125, 2.72802734375, 3.146240234375, 3.564453125, 3.982666015625, 4.40087890625, 4.819091796875, 5.2373046875, 5.655517578125, 6.07373046875, 6.491943359375, 6.91015625, 7.328369140625, 7.74658203125, 8.164794921875, 8.5830078125, 9.001220703125, 9.41943359375, 9.837646484375, 10.255859375, 10.674072265625, 11.09228515625, 11.510498046875, 11.9287109375, 12.346923828125, 12.76513671875, 13.183349609375, 13.6015625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 5.0, 8.0, 8.0, 11.0, 24.0, 28.0, 84.0, 223.0, 3255.0, 241.0, 87.0, 41.0, 17.0, 11.0, 11.0, 8.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.609375, -3.50482177734375, -3.4002685546875, -3.29571533203125, -3.191162109375, -3.08660888671875, -2.9820556640625, -2.87750244140625, -2.77294921875, -2.66839599609375, -2.5638427734375, -2.45928955078125, -2.354736328125, -2.25018310546875, -2.1456298828125, -2.04107666015625, -1.9365234375, -1.83197021484375, -1.7274169921875, -1.62286376953125, -1.518310546875, -1.41375732421875, -1.3092041015625, -1.20465087890625, -1.10009765625, -0.99554443359375, -0.8909912109375, -0.78643798828125, -0.681884765625, -0.57733154296875, -0.4727783203125, -0.36822509765625, -0.263671875, -0.15911865234375, -0.0545654296875, 0.04998779296875, 0.154541015625, 0.25909423828125, 0.3636474609375, 0.46820068359375, 0.57275390625, 0.67730712890625, 0.7818603515625, 0.88641357421875, 0.990966796875, 1.09552001953125, 1.2000732421875, 1.30462646484375, 1.4091796875, 1.51373291015625, 1.6182861328125, 1.72283935546875, 1.827392578125, 1.93194580078125, 2.0364990234375, 2.14105224609375, 2.24560546875, 2.35015869140625, 2.4547119140625, 2.55926513671875, 2.663818359375, 2.76837158203125, 2.8729248046875, 2.97747802734375, 3.08203125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 6.0, 13.0, 10.0, 12.0, 42.0, 53.0, 51.0, 65.0, 82.0, 84.0, 98.0, 106.0, 88.0, 78.0, 57.0, 43.0, 33.0, 22.0, 19.0, 13.0, 6.0, 5.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.741270065307617, -7.433234214782715, -7.125197887420654, -6.817161560058594, -6.509125709533691, -6.201089859008789, -5.8930535316467285, -5.585017204284668, -5.276981353759766, -4.968945503234863, -4.660909175872803, -4.352872848510742, -4.04483699798584, -3.7368009090423584, -3.428764820098877, -3.1207287311553955, -2.812692642211914, -2.5046565532684326, -2.196620464324951, -1.8885843753814697, -1.5805482864379883, -1.2725121974945068, -0.9644761085510254, -0.656440019607544, -0.3484039306640625, -0.040367841720581055, 0.2676682472229004, 0.5757043361663818, 0.8837404251098633, 1.1917765140533447, 1.4998126029968262, 1.8078486919403076, 2.1158857345581055, 2.423921823501587, 2.7319579124450684, 3.03999400138855, 3.3480300903320312, 3.6560661792755127, 3.964102268218994, 4.272138595581055, 4.580174446105957, 4.888210296630859, 5.19624662399292, 5.5042829513549805, 5.812318801879883, 6.120354652404785, 6.428390979766846, 6.736427307128906, 7.044463157653809, 7.352499008178711, 7.6605353355407715, 7.968571662902832, 8.276607513427734, 8.584643363952637, 8.892679214477539, 9.200716018676758, 9.50875186920166, 9.816787719726562, 10.124824523925781, 10.432860374450684, 10.740896224975586, 11.048932075500488, 11.35696792602539, 11.66500473022461, 11.973040580749512]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 5.0, 12.0, 9.0, 13.0, 12.0, 15.0, 20.0, 20.0, 22.0, 19.0, 22.0, 29.0, 27.0, 35.0, 22.0, 34.0, 36.0, 41.0, 39.0, 48.0, 30.0, 33.0, 39.0, 45.0, 45.0, 27.0, 44.0, 34.0, 28.0, 29.0, 21.0, 19.0, 15.0, 19.0, 19.0, 10.0, 9.0, 13.0, 7.0, 5.0, 5.0, 3.0, 5.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.128503799438477, -4.966505527496338, -4.804506778717041, -4.642508506774902, -4.4805097579956055, -4.318511486053467, -4.156513214111328, -3.9945147037506104, -3.8325161933898926, -3.670517683029175, -3.508519172668457, -3.3465209007263184, -3.1845223903656006, -3.022523880004883, -2.860525608062744, -2.6985270977020264, -2.5365285873413086, -2.374530076980591, -2.212531566619873, -2.0505332946777344, -1.8885347843170166, -1.7265362739562988, -1.5645378828048706, -1.4025394916534424, -1.2405409812927246, -1.0785424709320068, -0.9165440797805786, -0.7545456290245056, -0.5925471782684326, -0.4305487275123596, -0.2685502767562866, -0.1065518856048584, 0.055446624755859375, 0.21744507551193237, 0.37944352626800537, 0.5414419770240784, 0.7034404277801514, 0.8654388785362244, 1.0274373292922974, 1.1894357204437256, 1.3514342308044434, 1.5134327411651611, 1.6754311323165894, 1.8374295234680176, 1.9994280338287354, 2.161426544189453, 2.323424816131592, 2.4854233264923096, 2.6474218368530273, 2.809420347213745, 2.971418857574463, 3.1334171295166016, 3.2954156398773193, 3.457414150238037, 3.619412422180176, 3.7814109325408936, 3.9434094429016113, 4.10540771484375, 4.267406463623047, 4.4294047355651855, 4.591403007507324, 4.753401756286621, 4.91540002822876, 5.077398300170898, 5.239397048950195]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 11.0, 5.0, 8.0, 20.0, 30.0, 52.0, 67.0, 107.0, 193.0, 303.0, 510.0, 882.0, 1676.0, 3100.0, 6072.0, 12122.0, 24301.0, 48481.0, 96455.0, 182544.0, 264066.0, 195882.0, 104642.0, 53196.0, 26731.0, 13012.0, 6546.0, 3366.0, 1743.0, 998.0, 543.0, 342.0, 200.0, 134.0, 78.0, 48.0, 26.0, 20.0, 13.0, 6.0, 6.0, 9.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.130859375, -3.021240234375, -2.91162109375, -2.802001953125, -2.6923828125, -2.582763671875, -2.47314453125, -2.363525390625, -2.25390625, -2.144287109375, -2.03466796875, -1.925048828125, -1.8154296875, -1.705810546875, -1.59619140625, -1.486572265625, -1.376953125, -1.267333984375, -1.15771484375, -1.048095703125, -0.9384765625, -0.828857421875, -0.71923828125, -0.609619140625, -0.5, -0.390380859375, -0.28076171875, -0.171142578125, -0.0615234375, 0.048095703125, 0.15771484375, 0.267333984375, 0.376953125, 0.486572265625, 0.59619140625, 0.705810546875, 0.8154296875, 0.925048828125, 1.03466796875, 1.144287109375, 1.25390625, 1.363525390625, 1.47314453125, 1.582763671875, 1.6923828125, 1.802001953125, 1.91162109375, 2.021240234375, 2.130859375, 2.240478515625, 2.35009765625, 2.459716796875, 2.5693359375, 2.678955078125, 2.78857421875, 2.898193359375, 3.0078125, 3.117431640625, 3.22705078125, 3.336669921875, 3.4462890625, 3.555908203125, 3.66552734375, 3.775146484375, 3.884765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 10.0, 4.0, 4.0, 6.0, 11.0, 6.0, 11.0, 10.0, 15.0, 23.0, 22.0, 24.0, 36.0, 36.0, 41.0, 42.0, 46.0, 43.0, 66.0, 55.0, 39.0, 39.0, 53.0, 45.0, 50.0, 47.0, 37.0, 21.0, 24.0, 22.0, 19.0, 24.0, 18.0, 12.0, 8.0, 7.0, 3.0, 9.0, 4.0, 1.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.49609375, -2.41802978515625, -2.3399658203125, -2.26190185546875, -2.183837890625, -2.10577392578125, -2.0277099609375, -1.94964599609375, -1.87158203125, -1.79351806640625, -1.7154541015625, -1.63739013671875, -1.559326171875, -1.48126220703125, -1.4031982421875, -1.32513427734375, -1.2470703125, -1.16900634765625, -1.0909423828125, -1.01287841796875, -0.934814453125, -0.85675048828125, -0.7786865234375, -0.70062255859375, -0.62255859375, -0.54449462890625, -0.4664306640625, -0.38836669921875, -0.310302734375, -0.23223876953125, -0.1541748046875, -0.07611083984375, 0.001953125, 0.08001708984375, 0.1580810546875, 0.23614501953125, 0.314208984375, 0.39227294921875, 0.4703369140625, 0.54840087890625, 0.62646484375, 0.70452880859375, 0.7825927734375, 0.86065673828125, 0.938720703125, 1.01678466796875, 1.0948486328125, 1.17291259765625, 1.2509765625, 1.32904052734375, 1.4071044921875, 1.48516845703125, 1.563232421875, 1.64129638671875, 1.7193603515625, 1.79742431640625, 1.87548828125, 1.95355224609375, 2.0316162109375, 2.10968017578125, 2.187744140625, 2.26580810546875, 2.3438720703125, 2.42193603515625, 2.5]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 2.0, 13.0, 15.0, 27.0, 51.0, 92.0, 165.0, 276.0, 560.0, 1208.0, 4589.0, 124823.0, 891642.0, 21088.0, 2310.0, 796.0, 411.0, 197.0, 120.0, 71.0, 34.0, 27.0, 18.0, 9.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.03125, -15.397216796875, -14.76318359375, -14.129150390625, -13.4951171875, -12.861083984375, -12.22705078125, -11.593017578125, -10.958984375, -10.324951171875, -9.69091796875, -9.056884765625, -8.4228515625, -7.788818359375, -7.15478515625, -6.520751953125, -5.88671875, -5.252685546875, -4.61865234375, -3.984619140625, -3.3505859375, -2.716552734375, -2.08251953125, -1.448486328125, -0.814453125, -0.180419921875, 0.45361328125, 1.087646484375, 1.7216796875, 2.355712890625, 2.98974609375, 3.623779296875, 4.2578125, 4.891845703125, 5.52587890625, 6.159912109375, 6.7939453125, 7.427978515625, 8.06201171875, 8.696044921875, 9.330078125, 9.964111328125, 10.59814453125, 11.232177734375, 11.8662109375, 12.500244140625, 13.13427734375, 13.768310546875, 14.40234375, 15.036376953125, 15.67041015625, 16.304443359375, 16.9384765625, 17.572509765625, 18.20654296875, 18.840576171875, 19.474609375, 20.108642578125, 20.74267578125, 21.376708984375, 22.0107421875, 22.644775390625, 23.27880859375, 23.912841796875, 24.546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 3.0, 10.0, 9.0, 6.0, 20.0, 21.0, 26.0, 27.0, 34.0, 49.0, 44.0, 44.0, 58.0, 71.0, 57.0, 65.0, 48.0, 52.0, 50.0, 57.0, 49.0, 42.0, 35.0, 14.0, 24.0, 15.0, 17.0, 12.0, 5.0, 8.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.03125, -15.516845703125, -15.00244140625, -14.488037109375, -13.9736328125, -13.459228515625, -12.94482421875, -12.430419921875, -11.916015625, -11.401611328125, -10.88720703125, -10.372802734375, -9.8583984375, -9.343994140625, -8.82958984375, -8.315185546875, -7.80078125, -7.286376953125, -6.77197265625, -6.257568359375, -5.7431640625, -5.228759765625, -4.71435546875, -4.199951171875, -3.685546875, -3.171142578125, -2.65673828125, -2.142333984375, -1.6279296875, -1.113525390625, -0.59912109375, -0.084716796875, 0.4296875, 0.944091796875, 1.45849609375, 1.972900390625, 2.4873046875, 3.001708984375, 3.51611328125, 4.030517578125, 4.544921875, 5.059326171875, 5.57373046875, 6.088134765625, 6.6025390625, 7.116943359375, 7.63134765625, 8.145751953125, 8.66015625, 9.174560546875, 9.68896484375, 10.203369140625, 10.7177734375, 11.232177734375, 11.74658203125, 12.260986328125, 12.775390625, 13.289794921875, 13.80419921875, 14.318603515625, 14.8330078125, 15.347412109375, 15.86181640625, 16.376220703125, 16.890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 9.0, 5.0, 8.0, 16.0, 14.0, 27.0, 27.0, 62.0, 75.0, 105.0, 215.0, 354.0, 795.0, 2206.0, 11357.0, 156276.0, 794569.0, 72244.0, 7122.0, 1666.0, 627.0, 301.0, 167.0, 83.0, 46.0, 43.0, 36.0, 26.0, 17.0, 14.0, 16.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8203125, -6.609619140625, -6.39892578125, -6.188232421875, -5.9775390625, -5.766845703125, -5.55615234375, -5.345458984375, -5.134765625, -4.924072265625, -4.71337890625, -4.502685546875, -4.2919921875, -4.081298828125, -3.87060546875, -3.659912109375, -3.44921875, -3.238525390625, -3.02783203125, -2.817138671875, -2.6064453125, -2.395751953125, -2.18505859375, -1.974365234375, -1.763671875, -1.552978515625, -1.34228515625, -1.131591796875, -0.9208984375, -0.710205078125, -0.49951171875, -0.288818359375, -0.078125, 0.132568359375, 0.34326171875, 0.553955078125, 0.7646484375, 0.975341796875, 1.18603515625, 1.396728515625, 1.607421875, 1.818115234375, 2.02880859375, 2.239501953125, 2.4501953125, 2.660888671875, 2.87158203125, 3.082275390625, 3.29296875, 3.503662109375, 3.71435546875, 3.925048828125, 4.1357421875, 4.346435546875, 4.55712890625, 4.767822265625, 4.978515625, 5.189208984375, 5.39990234375, 5.610595703125, 5.8212890625, 6.031982421875, 6.24267578125, 6.453369140625, 6.6640625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 14.0, 9.0, 21.0, 15.0, 22.0, 36.0, 31.0, 58.0, 66.0, 65.0, 88.0, 96.0, 109.0, 72.0, 65.0, 43.0, 29.0, 41.0, 26.0, 27.0, 10.0, 7.0, 10.0, 10.0, 4.0, 2.0, 4.0, 6.0, 0.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006222724914550781, -0.0006018355488777161, -0.000581398606300354, -0.0005609616637229919, -0.0005405247211456299, -0.0005200877785682678, -0.0004996508359909058, -0.0004792138934135437, -0.00045877695083618164, -0.0004383400082588196, -0.0004179030656814575, -0.00039746612310409546, -0.0003770291805267334, -0.00035659223794937134, -0.0003361552953720093, -0.0003157183527946472, -0.00029528141021728516, -0.0002748444676399231, -0.00025440752506256104, -0.00023397058248519897, -0.00021353363990783691, -0.00019309669733047485, -0.0001726597547531128, -0.00015222281217575073, -0.00013178586959838867, -0.00011134892702102661, -9.091198444366455e-05, -7.047504186630249e-05, -5.003809928894043e-05, -2.960115671157837e-05, -9.164214134216309e-06, 1.1272728443145752e-05, 3.170967102050781e-05, 5.214661359786987e-05, 7.258355617523193e-05, 9.3020498752594e-05, 0.00011345744132995605, 0.00013389438390731812, 0.00015433132648468018, 0.00017476826906204224, 0.0001952052116394043, 0.00021564215421676636, 0.00023607909679412842, 0.0002565160393714905, 0.00027695298194885254, 0.0002973899245262146, 0.00031782686710357666, 0.0003382638096809387, 0.0003587007522583008, 0.00037913769483566284, 0.0003995746374130249, 0.00042001157999038696, 0.000440448522567749, 0.0004608854651451111, 0.00048132240772247314, 0.0005017593502998352, 0.0005221962928771973, 0.0005426332354545593, 0.0005630701780319214, 0.0005835071206092834, 0.0006039440631866455, 0.0006243810057640076, 0.0006448179483413696, 0.0006652548909187317, 0.0006856918334960938]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 2.0, 2.0, 11.0, 9.0, 13.0, 15.0, 17.0, 21.0, 42.0, 48.0, 68.0, 122.0, 213.0, 314.0, 562.0, 1032.0, 2485.0, 8219.0, 44091.0, 382620.0, 530277.0, 62123.0, 10367.0, 3011.0, 1252.0, 665.0, 329.0, 186.0, 142.0, 82.0, 56.0, 28.0, 33.0, 22.0, 14.0, 10.0, 8.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0], "bins": [-5.30078125, -5.14056396484375, -4.9803466796875, -4.82012939453125, -4.659912109375, -4.49969482421875, -4.3394775390625, -4.17926025390625, -4.01904296875, -3.85882568359375, -3.6986083984375, -3.53839111328125, -3.378173828125, -3.21795654296875, -3.0577392578125, -2.89752197265625, -2.7373046875, -2.57708740234375, -2.4168701171875, -2.25665283203125, -2.096435546875, -1.93621826171875, -1.7760009765625, -1.61578369140625, -1.45556640625, -1.29534912109375, -1.1351318359375, -0.97491455078125, -0.814697265625, -0.65447998046875, -0.4942626953125, -0.33404541015625, -0.173828125, -0.01361083984375, 0.1466064453125, 0.30682373046875, 0.467041015625, 0.62725830078125, 0.7874755859375, 0.94769287109375, 1.10791015625, 1.26812744140625, 1.4283447265625, 1.58856201171875, 1.748779296875, 1.90899658203125, 2.0692138671875, 2.22943115234375, 2.3896484375, 2.54986572265625, 2.7100830078125, 2.87030029296875, 3.030517578125, 3.19073486328125, 3.3509521484375, 3.51116943359375, 3.67138671875, 3.83160400390625, 3.9918212890625, 4.15203857421875, 4.312255859375, 4.47247314453125, 4.6326904296875, 4.79290771484375, 4.953125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 16.0, 18.0, 23.0, 45.0, 65.0, 63.0, 99.0, 86.0, 97.0, 102.0, 87.0, 81.0, 58.0, 51.0, 24.0, 27.0, 17.0, 9.0, 8.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.04296875, -3.8651123046875, -3.687255859375, -3.5093994140625, -3.33154296875, -3.1536865234375, -2.975830078125, -2.7979736328125, -2.6201171875, -2.4422607421875, -2.264404296875, -2.0865478515625, -1.90869140625, -1.7308349609375, -1.552978515625, -1.3751220703125, -1.197265625, -1.0194091796875, -0.841552734375, -0.6636962890625, -0.48583984375, -0.3079833984375, -0.130126953125, 0.0477294921875, 0.2255859375, 0.4034423828125, 0.581298828125, 0.7591552734375, 0.93701171875, 1.1148681640625, 1.292724609375, 1.4705810546875, 1.6484375, 1.8262939453125, 2.004150390625, 2.1820068359375, 2.35986328125, 2.5377197265625, 2.715576171875, 2.8934326171875, 3.0712890625, 3.2491455078125, 3.427001953125, 3.6048583984375, 3.78271484375, 3.9605712890625, 4.138427734375, 4.3162841796875, 4.494140625, 4.6719970703125, 4.849853515625, 5.0277099609375, 5.20556640625, 5.3834228515625, 5.561279296875, 5.7391357421875, 5.9169921875, 6.0948486328125, 6.272705078125, 6.4505615234375, 6.62841796875, 6.8062744140625, 6.984130859375, 7.1619873046875, 7.33984375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 17.0, 44.0, 150.0, 228.0, 286.0, 162.0, 67.0, 25.0, 14.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-205.98831176757812, -201.43031311035156, -196.87232971191406, -192.3143310546875, -187.75633239746094, -183.19833374023438, -178.64035034179688, -174.0823516845703, -169.52435302734375, -164.9663543701172, -160.4083709716797, -155.85037231445312, -151.29237365722656, -146.734375, -142.1763916015625, -137.61839294433594, -133.06040954589844, -128.50241088867188, -123.94441986083984, -119.38642883300781, -114.82843017578125, -110.27043914794922, -105.71244812011719, -101.15444946289062, -96.5964584350586, -92.03846740722656, -87.48046875, -82.92247772216797, -78.36448669433594, -73.80648803710938, -69.24849700927734, -64.69050598144531, -60.13251495361328, -55.574520111083984, -51.01652526855469, -46.458534240722656, -41.90053939819336, -37.34254455566406, -32.78455352783203, -28.226558685302734, -23.668563842773438, -19.11056900024414, -14.552576065063477, -9.994582176208496, -5.436588287353516, -0.8785934448242188, 3.6793994903564453, 8.23739242553711, 12.795387268066406, 17.353382110595703, 21.911375045776367, 26.46936798095703, 31.027362823486328, 35.585357666015625, 40.143348693847656, 44.70134353637695, 49.25933837890625, 53.81733322143555, 58.375328063964844, 62.933319091796875, 67.49131774902344, 72.04930877685547, 76.6072998046875, 81.16529846191406, 85.7232894897461]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 12.0, 10.0, 11.0, 13.0, 21.0, 15.0, 30.0, 27.0, 45.0, 33.0, 39.0, 44.0, 37.0, 54.0, 64.0, 56.0, 59.0, 63.0, 46.0, 41.0, 45.0, 30.0, 41.0, 32.0, 28.0, 24.0, 5.0, 16.0, 11.0, 12.0, 9.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-69.10728454589844, -67.03999328613281, -64.97269439697266, -62.90540313720703, -60.838111877441406, -58.770816802978516, -56.703521728515625, -54.63623046875, -52.568939208984375, -50.501644134521484, -48.43435287475586, -46.36705780029297, -44.299766540527344, -42.23247146606445, -40.16517639160156, -38.09788513183594, -36.03059005737305, -33.963294982910156, -31.89600372314453, -29.82870864868164, -27.761417388916016, -25.694122314453125, -23.626829147338867, -21.55953598022461, -19.49224281311035, -17.424949645996094, -15.357656478881836, -13.290362358093262, -11.223069190979004, -9.155776023864746, -7.088481903076172, -5.021188735961914, -2.953899383544922, -0.886605978012085, 1.180687427520752, 3.247981071472168, 5.315274238586426, 7.382567405700684, 9.449861526489258, 11.517154693603516, 13.584447860717773, 15.651741027832031, 17.71903419494629, 19.786327362060547, 21.853622436523438, 23.920913696289062, 25.988208770751953, 28.05550193786621, 30.12279510498047, 32.19009017944336, 34.257381439208984, 36.324676513671875, 38.3919677734375, 40.45926284790039, 42.52655792236328, 44.593849182128906, 46.66114044189453, 48.72843551635742, 50.79572677612305, 52.86302185058594, 54.93031311035156, 56.99760818481445, 59.064903259277344, 61.13219451904297, 63.19948959350586]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 6.0, 8.0, 20.0, 10.0, 25.0, 20.0, 35.0, 41.0, 58.0, 92.0, 115.0, 165.0, 275.0, 438.0, 665.0, 1029.0, 2045.0, 4324.0, 10457.0, 35939.0, 331323.0, 3713725.0, 65616.0, 15706.0, 5900.0, 2603.0, 1433.0, 765.0, 502.0, 317.0, 193.0, 135.0, 86.0, 60.0, 48.0, 31.0, 14.0, 11.0, 15.0, 12.0, 5.0, 9.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.5546875, -9.248291015625, -8.94189453125, -8.635498046875, -8.3291015625, -8.022705078125, -7.71630859375, -7.409912109375, -7.103515625, -6.797119140625, -6.49072265625, -6.184326171875, -5.8779296875, -5.571533203125, -5.26513671875, -4.958740234375, -4.65234375, -4.345947265625, -4.03955078125, -3.733154296875, -3.4267578125, -3.120361328125, -2.81396484375, -2.507568359375, -2.201171875, -1.894775390625, -1.58837890625, -1.281982421875, -0.9755859375, -0.669189453125, -0.36279296875, -0.056396484375, 0.25, 0.556396484375, 0.86279296875, 1.169189453125, 1.4755859375, 1.781982421875, 2.08837890625, 2.394775390625, 2.701171875, 3.007568359375, 3.31396484375, 3.620361328125, 3.9267578125, 4.233154296875, 4.53955078125, 4.845947265625, 5.15234375, 5.458740234375, 5.76513671875, 6.071533203125, 6.3779296875, 6.684326171875, 6.99072265625, 7.297119140625, 7.603515625, 7.909912109375, 8.21630859375, 8.522705078125, 8.8291015625, 9.135498046875, 9.44189453125, 9.748291015625, 10.0546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 8.0, 6.0, 10.0, 12.0, 19.0, 17.0, 19.0, 26.0, 34.0, 34.0, 33.0, 40.0, 36.0, 48.0, 64.0, 52.0, 59.0, 46.0, 47.0, 56.0, 51.0, 37.0, 36.0, 35.0, 28.0, 18.0, 31.0, 20.0, 13.0, 10.0, 16.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.341796875, -2.262969970703125, -2.18414306640625, -2.105316162109375, -2.0264892578125, -1.947662353515625, -1.86883544921875, -1.790008544921875, -1.711181640625, -1.632354736328125, -1.55352783203125, -1.474700927734375, -1.3958740234375, -1.317047119140625, -1.23822021484375, -1.159393310546875, -1.08056640625, -1.001739501953125, -0.92291259765625, -0.844085693359375, -0.7652587890625, -0.686431884765625, -0.60760498046875, -0.528778076171875, -0.449951171875, -0.371124267578125, -0.29229736328125, -0.213470458984375, -0.1346435546875, -0.055816650390625, 0.02301025390625, 0.101837158203125, 0.1806640625, 0.259490966796875, 0.33831787109375, 0.417144775390625, 0.4959716796875, 0.574798583984375, 0.65362548828125, 0.732452392578125, 0.811279296875, 0.890106201171875, 0.96893310546875, 1.047760009765625, 1.1265869140625, 1.205413818359375, 1.28424072265625, 1.363067626953125, 1.44189453125, 1.520721435546875, 1.59954833984375, 1.678375244140625, 1.7572021484375, 1.836029052734375, 1.91485595703125, 1.993682861328125, 2.072509765625, 2.151336669921875, 2.23016357421875, 2.308990478515625, 2.3878173828125, 2.466644287109375, 2.54547119140625, 2.624298095703125, 2.703125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 13.0, 5.0, 8.0, 9.0, 18.0, 18.0, 34.0, 50.0, 60.0, 87.0, 121.0, 222.0, 421.0, 699.0, 1251.0, 2429.0, 5182.0, 13504.0, 47190.0, 362084.0, 3612137.0, 108568.0, 24305.0, 8322.0, 3548.0, 1699.0, 860.0, 550.0, 321.0, 205.0, 120.0, 55.0, 62.0, 38.0, 24.0, 17.0, 16.0, 8.0, 4.0, 10.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.4296875, -8.1683349609375, -7.906982421875, -7.6456298828125, -7.38427734375, -7.1229248046875, -6.861572265625, -6.6002197265625, -6.3388671875, -6.0775146484375, -5.816162109375, -5.5548095703125, -5.29345703125, -5.0321044921875, -4.770751953125, -4.5093994140625, -4.248046875, -3.9866943359375, -3.725341796875, -3.4639892578125, -3.20263671875, -2.9412841796875, -2.679931640625, -2.4185791015625, -2.1572265625, -1.8958740234375, -1.634521484375, -1.3731689453125, -1.11181640625, -0.8504638671875, -0.589111328125, -0.3277587890625, -0.06640625, 0.1949462890625, 0.456298828125, 0.7176513671875, 0.97900390625, 1.2403564453125, 1.501708984375, 1.7630615234375, 2.0244140625, 2.2857666015625, 2.547119140625, 2.8084716796875, 3.06982421875, 3.3311767578125, 3.592529296875, 3.8538818359375, 4.115234375, 4.3765869140625, 4.637939453125, 4.8992919921875, 5.16064453125, 5.4219970703125, 5.683349609375, 5.9447021484375, 6.2060546875, 6.4674072265625, 6.728759765625, 6.9901123046875, 7.25146484375, 7.5128173828125, 7.774169921875, 8.0355224609375, 8.296875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 7.0, 13.0, 11.0, 23.0, 31.0, 45.0, 70.0, 145.0, 386.0, 2543.0, 393.0, 165.0, 83.0, 44.0, 21.0, 22.0, 14.0, 14.0, 11.0, 7.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.759765625, -3.636566162109375, -3.51336669921875, -3.390167236328125, -3.2669677734375, -3.143768310546875, -3.02056884765625, -2.897369384765625, -2.774169921875, -2.650970458984375, -2.52777099609375, -2.404571533203125, -2.2813720703125, -2.158172607421875, -2.03497314453125, -1.911773681640625, -1.78857421875, -1.665374755859375, -1.54217529296875, -1.418975830078125, -1.2957763671875, -1.172576904296875, -1.04937744140625, -0.926177978515625, -0.802978515625, -0.679779052734375, -0.55657958984375, -0.433380126953125, -0.3101806640625, -0.186981201171875, -0.06378173828125, 0.059417724609375, 0.1826171875, 0.305816650390625, 0.42901611328125, 0.552215576171875, 0.6754150390625, 0.798614501953125, 0.92181396484375, 1.045013427734375, 1.168212890625, 1.291412353515625, 1.41461181640625, 1.537811279296875, 1.6610107421875, 1.784210205078125, 1.90740966796875, 2.030609130859375, 2.15380859375, 2.277008056640625, 2.40020751953125, 2.523406982421875, 2.6466064453125, 2.769805908203125, 2.89300537109375, 3.016204833984375, 3.139404296875, 3.262603759765625, 3.38580322265625, 3.509002685546875, 3.6322021484375, 3.755401611328125, 3.87860107421875, 4.001800537109375, 4.125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 11.0, 8.0, 14.0, 40.0, 67.0, 84.0, 118.0, 123.0, 147.0, 108.0, 96.0, 60.0, 53.0, 23.0, 16.0, 15.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.594886779785156, -21.943449020385742, -21.29201316833496, -20.640575408935547, -19.989139556884766, -19.33770179748535, -18.686264038085938, -18.034828186035156, -17.383390426635742, -16.731952667236328, -16.080516815185547, -15.429079055786133, -14.777642250061035, -14.126205444335938, -13.474767684936523, -12.823330879211426, -12.171894073486328, -11.52045726776123, -10.869020462036133, -10.217582702636719, -9.566145896911621, -8.914709091186523, -8.26327133178711, -7.611834526062012, -6.960397720336914, -6.308960914611816, -5.6575236320495605, -5.006086349487305, -4.354649543762207, -3.7032124996185303, -3.0517754554748535, -2.4003381729125977, -1.7489013671875, -1.0974643230438232, -0.4460272789001465, 0.20540976524353027, 0.856846809387207, 1.5082838535308838, 2.1597208976745605, 2.8111581802368164, 3.462594985961914, 4.114031791687012, 4.765469074249268, 5.416906356811523, 6.068343162536621, 6.719779968261719, 7.371217250823975, 8.02265453338623, 8.674091339111328, 9.325528144836426, 9.976964950561523, 10.628402709960938, 11.279839515686035, 11.931276321411133, 12.582714080810547, 13.234150886535645, 13.885587692260742, 14.53702449798584, 15.188461303710938, 15.839899063110352, 16.491336822509766, 17.142772674560547, 17.79421043395996, 18.445648193359375, 19.097084045410156]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 5.0, 8.0, 7.0, 10.0, 6.0, 9.0, 14.0, 13.0, 11.0, 23.0, 25.0, 15.0, 26.0, 24.0, 33.0, 30.0, 37.0, 27.0, 34.0, 46.0, 25.0, 45.0, 45.0, 36.0, 37.0, 34.0, 34.0, 32.0, 34.0, 31.0, 22.0, 32.0, 22.0, 24.0, 20.0, 17.0, 18.0, 15.0, 11.0, 11.0, 10.0, 14.0, 9.0, 3.0, 4.0, 3.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-8.285606384277344, -8.016773223876953, -7.747940540313721, -7.47910737991333, -7.210274696350098, -6.941441535949707, -6.672608375549316, -6.403775691986084, -6.134943008422852, -5.866109848022461, -5.5972771644592285, -5.328444004058838, -5.0596113204956055, -4.790778160095215, -4.521944999694824, -4.253112316131592, -3.984279155731201, -3.7154462337493896, -3.446613311767578, -3.1777801513671875, -2.908947467803955, -2.6401143074035645, -2.371281385421753, -2.1024484634399414, -1.8336155414581299, -1.5647826194763184, -1.2959496974945068, -1.0271166563034058, -0.7582837343215942, -0.4894508123397827, -0.22061777114868164, 0.04821515083312988, 0.3170480728149414, 0.5858809947967529, 0.8547139763832092, 1.1235469579696655, 1.392379879951477, 1.6612128019332886, 1.9300458431243896, 2.198878765106201, 2.4677116870880127, 2.736544609069824, 3.0053775310516357, 3.2742104530334473, 3.543043613433838, 3.8118762969970703, 4.080709457397461, 4.349542617797852, 4.618375301361084, 4.887208461761475, 5.156041145324707, 5.424874305725098, 5.69370698928833, 5.962540149688721, 6.231372833251953, 6.500205993652344, 6.769039154052734, 7.037872314453125, 7.306704998016357, 7.575538158416748, 7.8443708419799805, 8.113204002380371, 8.382037162780762, 8.650869369506836, 8.919702529907227]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 11.0, 11.0, 19.0, 20.0, 48.0, 58.0, 78.0, 151.0, 224.0, 378.0, 667.0, 1179.0, 1984.0, 3850.0, 7136.0, 13769.0, 26956.0, 52789.0, 102200.0, 215282.0, 301635.0, 157958.0, 78563.0, 40121.0, 20579.0, 10569.0, 5390.0, 2989.0, 1647.0, 898.0, 564.0, 295.0, 195.0, 127.0, 69.0, 54.0, 29.0, 26.0, 13.0, 8.0, 4.0, 6.0, 4.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.4921875, -4.3388671875, -4.185546875, -4.0322265625, -3.87890625, -3.7255859375, -3.572265625, -3.4189453125, -3.265625, -3.1123046875, -2.958984375, -2.8056640625, -2.65234375, -2.4990234375, -2.345703125, -2.1923828125, -2.0390625, -1.8857421875, -1.732421875, -1.5791015625, -1.42578125, -1.2724609375, -1.119140625, -0.9658203125, -0.8125, -0.6591796875, -0.505859375, -0.3525390625, -0.19921875, -0.0458984375, 0.107421875, 0.2607421875, 0.4140625, 0.5673828125, 0.720703125, 0.8740234375, 1.02734375, 1.1806640625, 1.333984375, 1.4873046875, 1.640625, 1.7939453125, 1.947265625, 2.1005859375, 2.25390625, 2.4072265625, 2.560546875, 2.7138671875, 2.8671875, 3.0205078125, 3.173828125, 3.3271484375, 3.48046875, 3.6337890625, 3.787109375, 3.9404296875, 4.09375, 4.2470703125, 4.400390625, 4.5537109375, 4.70703125, 4.8603515625, 5.013671875, 5.1669921875, 5.3203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 4.0, 2.0, 8.0, 9.0, 11.0, 18.0, 17.0, 27.0, 31.0, 32.0, 40.0, 46.0, 53.0, 51.0, 57.0, 47.0, 52.0, 54.0, 74.0, 58.0, 58.0, 44.0, 37.0, 31.0, 28.0, 20.0, 25.0, 11.0, 14.0, 7.0, 4.0, 9.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.865234375, -2.771759033203125, -2.67828369140625, -2.584808349609375, -2.4913330078125, -2.397857666015625, -2.30438232421875, -2.210906982421875, -2.117431640625, -2.023956298828125, -1.93048095703125, -1.837005615234375, -1.7435302734375, -1.650054931640625, -1.55657958984375, -1.463104248046875, -1.36962890625, -1.276153564453125, -1.18267822265625, -1.089202880859375, -0.9957275390625, -0.902252197265625, -0.80877685546875, -0.715301513671875, -0.621826171875, -0.528350830078125, -0.43487548828125, -0.341400146484375, -0.2479248046875, -0.154449462890625, -0.06097412109375, 0.032501220703125, 0.1259765625, 0.219451904296875, 0.31292724609375, 0.406402587890625, 0.4998779296875, 0.593353271484375, 0.68682861328125, 0.780303955078125, 0.873779296875, 0.967254638671875, 1.06072998046875, 1.154205322265625, 1.2476806640625, 1.341156005859375, 1.43463134765625, 1.528106689453125, 1.62158203125, 1.715057373046875, 1.80853271484375, 1.902008056640625, 1.9954833984375, 2.088958740234375, 2.18243408203125, 2.275909423828125, 2.369384765625, 2.462860107421875, 2.55633544921875, 2.649810791015625, 2.7432861328125, 2.836761474609375, 2.93023681640625, 3.023712158203125, 3.1171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 5.0, 6.0, 7.0, 11.0, 19.0, 17.0, 29.0, 46.0, 54.0, 83.0, 147.0, 241.0, 417.0, 743.0, 1645.0, 4854.0, 32676.0, 665575.0, 317137.0, 18673.0, 3391.0, 1229.0, 629.0, 311.0, 200.0, 125.0, 102.0, 51.0, 43.0, 21.0, 15.0, 15.0, 14.0, 3.0, 5.0, 4.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-19.78125, -19.244873046875, -18.70849609375, -18.172119140625, -17.6357421875, -17.099365234375, -16.56298828125, -16.026611328125, -15.490234375, -14.953857421875, -14.41748046875, -13.881103515625, -13.3447265625, -12.808349609375, -12.27197265625, -11.735595703125, -11.19921875, -10.662841796875, -10.12646484375, -9.590087890625, -9.0537109375, -8.517333984375, -7.98095703125, -7.444580078125, -6.908203125, -6.371826171875, -5.83544921875, -5.299072265625, -4.7626953125, -4.226318359375, -3.68994140625, -3.153564453125, -2.6171875, -2.080810546875, -1.54443359375, -1.008056640625, -0.4716796875, 0.064697265625, 0.60107421875, 1.137451171875, 1.673828125, 2.210205078125, 2.74658203125, 3.282958984375, 3.8193359375, 4.355712890625, 4.89208984375, 5.428466796875, 5.96484375, 6.501220703125, 7.03759765625, 7.573974609375, 8.1103515625, 8.646728515625, 9.18310546875, 9.719482421875, 10.255859375, 10.792236328125, 11.32861328125, 11.864990234375, 12.4013671875, 12.937744140625, 13.47412109375, 14.010498046875, 14.546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 7.0, 8.0, 8.0, 4.0, 11.0, 14.0, 12.0, 17.0, 15.0, 26.0, 35.0, 33.0, 37.0, 50.0, 47.0, 45.0, 55.0, 61.0, 38.0, 53.0, 55.0, 55.0, 47.0, 47.0, 38.0, 25.0, 29.0, 24.0, 26.0, 20.0, 12.0, 15.0, 9.0, 5.0, 4.0, 7.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.9765625, -12.5902099609375, -12.203857421875, -11.8175048828125, -11.43115234375, -11.0447998046875, -10.658447265625, -10.2720947265625, -9.8857421875, -9.4993896484375, -9.113037109375, -8.7266845703125, -8.34033203125, -7.9539794921875, -7.567626953125, -7.1812744140625, -6.794921875, -6.4085693359375, -6.022216796875, -5.6358642578125, -5.24951171875, -4.8631591796875, -4.476806640625, -4.0904541015625, -3.7041015625, -3.3177490234375, -2.931396484375, -2.5450439453125, -2.15869140625, -1.7723388671875, -1.385986328125, -0.9996337890625, -0.61328125, -0.2269287109375, 0.159423828125, 0.5457763671875, 0.93212890625, 1.3184814453125, 1.704833984375, 2.0911865234375, 2.4775390625, 2.8638916015625, 3.250244140625, 3.6365966796875, 4.02294921875, 4.4093017578125, 4.795654296875, 5.1820068359375, 5.568359375, 5.9547119140625, 6.341064453125, 6.7274169921875, 7.11376953125, 7.5001220703125, 7.886474609375, 8.2728271484375, 8.6591796875, 9.0455322265625, 9.431884765625, 9.8182373046875, 10.20458984375, 10.5909423828125, 10.977294921875, 11.3636474609375, 11.75]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 9.0, 23.0, 23.0, 34.0, 63.0, 155.0, 389.0, 978.0, 3608.0, 25627.0, 474224.0, 511617.0, 26301.0, 3746.0, 1029.0, 365.0, 173.0, 72.0, 42.0, 23.0, 14.0, 12.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8671875, -5.6416015625, -5.416015625, -5.1904296875, -4.96484375, -4.7392578125, -4.513671875, -4.2880859375, -4.0625, -3.8369140625, -3.611328125, -3.3857421875, -3.16015625, -2.9345703125, -2.708984375, -2.4833984375, -2.2578125, -2.0322265625, -1.806640625, -1.5810546875, -1.35546875, -1.1298828125, -0.904296875, -0.6787109375, -0.453125, -0.2275390625, -0.001953125, 0.2236328125, 0.44921875, 0.6748046875, 0.900390625, 1.1259765625, 1.3515625, 1.5771484375, 1.802734375, 2.0283203125, 2.25390625, 2.4794921875, 2.705078125, 2.9306640625, 3.15625, 3.3818359375, 3.607421875, 3.8330078125, 4.05859375, 4.2841796875, 4.509765625, 4.7353515625, 4.9609375, 5.1865234375, 5.412109375, 5.6376953125, 5.86328125, 6.0888671875, 6.314453125, 6.5400390625, 6.765625, 6.9912109375, 7.216796875, 7.4423828125, 7.66796875, 7.8935546875, 8.119140625, 8.3447265625, 8.5703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 8.0, 10.0, 18.0, 15.0, 35.0, 40.0, 53.0, 77.0, 108.0, 206.0, 133.0, 94.0, 71.0, 39.0, 26.0, 27.0, 20.0, 9.0, 9.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016841888427734375, -0.0016369819641113281, -0.0015897750854492188, -0.0015425682067871094, -0.001495361328125, -0.0014481544494628906, -0.0014009475708007812, -0.0013537406921386719, -0.0013065338134765625, -0.0012593269348144531, -0.0012121200561523438, -0.0011649131774902344, -0.001117706298828125, -0.0010704994201660156, -0.0010232925415039062, -0.0009760856628417969, -0.0009288787841796875, -0.0008816719055175781, -0.0008344650268554688, -0.0007872581481933594, -0.00074005126953125, -0.0006928443908691406, -0.0006456375122070312, -0.0005984306335449219, -0.0005512237548828125, -0.0005040168762207031, -0.00045680999755859375, -0.0004096031188964844, -0.000362396240234375, -0.0003151893615722656, -0.00026798248291015625, -0.00022077560424804688, -0.0001735687255859375, -0.00012636184692382812, -7.915496826171875e-05, -3.1948089599609375e-05, 1.52587890625e-05, 6.246566772460938e-05, 0.00010967254638671875, 0.00015687942504882812, 0.0002040863037109375, 0.0002512931823730469, 0.00029850006103515625, 0.0003457069396972656, 0.000392913818359375, 0.0004401206970214844, 0.00048732757568359375, 0.0005345344543457031, 0.0005817413330078125, 0.0006289482116699219, 0.0006761550903320312, 0.0007233619689941406, 0.00077056884765625, 0.0008177757263183594, 0.0008649826049804688, 0.0009121894836425781, 0.0009593963623046875, 0.0010066032409667969, 0.0010538101196289062, 0.0011010169982910156, 0.001148223876953125, 0.0011954307556152344, 0.0012426376342773438, 0.0012898445129394531, 0.0013370513916015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 8.0, 7.0, 7.0, 10.0, 23.0, 24.0, 44.0, 95.0, 156.0, 283.0, 635.0, 1678.0, 5776.0, 41102.0, 737044.0, 240691.0, 15824.0, 3163.0, 1013.0, 463.0, 203.0, 126.0, 50.0, 54.0, 22.0, 20.0, 9.0, 3.0, 5.0, 8.0, 1.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.60546875, -7.38037109375, -7.1552734375, -6.93017578125, -6.705078125, -6.47998046875, -6.2548828125, -6.02978515625, -5.8046875, -5.57958984375, -5.3544921875, -5.12939453125, -4.904296875, -4.67919921875, -4.4541015625, -4.22900390625, -4.00390625, -3.77880859375, -3.5537109375, -3.32861328125, -3.103515625, -2.87841796875, -2.6533203125, -2.42822265625, -2.203125, -1.97802734375, -1.7529296875, -1.52783203125, -1.302734375, -1.07763671875, -0.8525390625, -0.62744140625, -0.40234375, -0.17724609375, 0.0478515625, 0.27294921875, 0.498046875, 0.72314453125, 0.9482421875, 1.17333984375, 1.3984375, 1.62353515625, 1.8486328125, 2.07373046875, 2.298828125, 2.52392578125, 2.7490234375, 2.97412109375, 3.19921875, 3.42431640625, 3.6494140625, 3.87451171875, 4.099609375, 4.32470703125, 4.5498046875, 4.77490234375, 5.0, 5.22509765625, 5.4501953125, 5.67529296875, 5.900390625, 6.12548828125, 6.3505859375, 6.57568359375, 6.80078125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 8.0, 8.0, 11.0, 15.0, 27.0, 34.0, 31.0, 43.0, 70.0, 78.0, 99.0, 113.0, 94.0, 64.0, 75.0, 55.0, 50.0, 29.0, 19.0, 22.0, 14.0, 7.0, 9.0, 9.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.41796875, -5.273193359375, -5.12841796875, -4.983642578125, -4.8388671875, -4.694091796875, -4.54931640625, -4.404541015625, -4.259765625, -4.114990234375, -3.97021484375, -3.825439453125, -3.6806640625, -3.535888671875, -3.39111328125, -3.246337890625, -3.1015625, -2.956787109375, -2.81201171875, -2.667236328125, -2.5224609375, -2.377685546875, -2.23291015625, -2.088134765625, -1.943359375, -1.798583984375, -1.65380859375, -1.509033203125, -1.3642578125, -1.219482421875, -1.07470703125, -0.929931640625, -0.78515625, -0.640380859375, -0.49560546875, -0.350830078125, -0.2060546875, -0.061279296875, 0.08349609375, 0.228271484375, 0.373046875, 0.517822265625, 0.66259765625, 0.807373046875, 0.9521484375, 1.096923828125, 1.24169921875, 1.386474609375, 1.53125, 1.676025390625, 1.82080078125, 1.965576171875, 2.1103515625, 2.255126953125, 2.39990234375, 2.544677734375, 2.689453125, 2.834228515625, 2.97900390625, 3.123779296875, 3.2685546875, 3.413330078125, 3.55810546875, 3.702880859375, 3.84765625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 1.0, 4.0, 8.0, 14.0, 39.0, 69.0, 174.0, 218.0, 240.0, 146.0, 59.0, 20.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-196.76458740234375, -192.5618896484375, -188.35919189453125, -184.15650939941406, -179.9538116455078, -175.75111389160156, -171.5484161376953, -167.34571838378906, -163.14303588867188, -158.94033813476562, -154.73764038085938, -150.5349578857422, -146.33226013183594, -142.1295623779297, -137.92686462402344, -133.7241668701172, -129.52146911621094, -125.31877136230469, -121.11608123779297, -116.91338348388672, -112.710693359375, -108.50799560546875, -104.3052978515625, -100.10260009765625, -95.89990997314453, -91.69721221923828, -87.49452209472656, -83.29182434082031, -79.08912658691406, -74.88643646240234, -70.6837387084961, -66.48104858398438, -62.27833557128906, -58.07564163208008, -53.872947692871094, -49.670249938964844, -45.46755599975586, -41.264862060546875, -37.062164306640625, -32.85947036743164, -28.656776428222656, -24.454082489013672, -20.251386642456055, -16.048690795898438, -11.845996856689453, -7.643302917480469, -3.4406070709228516, 0.7620887756347656, 4.96478271484375, 9.16747760772705, 13.370172500610352, 17.57286834716797, 21.775562286376953, 25.978256225585938, 30.180952072143555, 34.38364791870117, 38.586341857910156, 42.78903579711914, 46.991729736328125, 51.194427490234375, 55.39712142944336, 59.599815368652344, 63.802513122558594, 68.00520324707031, 72.20790100097656]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 5.0, 6.0, 3.0, 15.0, 4.0, 9.0, 16.0, 22.0, 23.0, 15.0, 17.0, 19.0, 26.0, 25.0, 31.0, 24.0, 38.0, 40.0, 35.0, 45.0, 36.0, 55.0, 52.0, 48.0, 46.0, 41.0, 41.0, 27.0, 29.0, 39.0, 24.0, 14.0, 24.0, 12.0, 14.0, 16.0, 12.0, 10.0, 8.0, 6.0, 8.0, 10.0, 3.0, 2.0, 3.0, 6.0, 0.0, 0.0, 2.0, 2.0], "bins": [-48.197967529296875, -46.828712463378906, -45.45945739746094, -44.09020233154297, -42.720947265625, -41.35169219970703, -39.98243713378906, -38.613182067871094, -37.243927001953125, -35.874671936035156, -34.50541687011719, -33.13616180419922, -31.76690673828125, -30.39765167236328, -29.028396606445312, -27.659141540527344, -26.289886474609375, -24.920631408691406, -23.551376342773438, -22.18212127685547, -20.8128662109375, -19.44361114501953, -18.074356079101562, -16.705101013183594, -15.335845947265625, -13.966590881347656, -12.597335815429688, -11.228080749511719, -9.85882568359375, -8.489570617675781, -7.1203155517578125, -5.751060485839844, -4.381805419921875, -3.0125503540039062, -1.6432952880859375, -0.27404022216796875, 1.09521484375, 2.4644699096679688, 3.8337249755859375, 5.202980041503906, 6.572235107421875, 7.941490173339844, 9.310745239257812, 10.680000305175781, 12.04925537109375, 13.418510437011719, 14.787765502929688, 16.157020568847656, 17.526275634765625, 18.895530700683594, 20.264785766601562, 21.63404083251953, 23.0032958984375, 24.37255096435547, 25.741806030273438, 27.111061096191406, 28.480316162109375, 29.849571228027344, 31.218826293945312, 32.58808135986328, 33.95733642578125, 35.32659149169922, 36.69584655761719, 38.065101623535156, 39.434356689453125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 13.0, 17.0, 21.0, 34.0, 49.0, 70.0, 110.0, 164.0, 275.0, 478.0, 802.0, 1482.0, 2652.0, 5157.0, 11167.0, 26353.0, 73857.0, 275669.0, 1906227.0, 1547193.0, 232736.0, 64902.0, 24217.0, 10175.0, 4756.0, 2451.0, 1278.0, 717.0, 443.0, 262.0, 191.0, 118.0, 74.0, 55.0, 30.0, 28.0, 20.0, 12.0, 9.0, 6.0, 1.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5859375, -4.4423828125, -4.298828125, -4.1552734375, -4.01171875, -3.8681640625, -3.724609375, -3.5810546875, -3.4375, -3.2939453125, -3.150390625, -3.0068359375, -2.86328125, -2.7197265625, -2.576171875, -2.4326171875, -2.2890625, -2.1455078125, -2.001953125, -1.8583984375, -1.71484375, -1.5712890625, -1.427734375, -1.2841796875, -1.140625, -0.9970703125, -0.853515625, -0.7099609375, -0.56640625, -0.4228515625, -0.279296875, -0.1357421875, 0.0078125, 0.1513671875, 0.294921875, 0.4384765625, 0.58203125, 0.7255859375, 0.869140625, 1.0126953125, 1.15625, 1.2998046875, 1.443359375, 1.5869140625, 1.73046875, 1.8740234375, 2.017578125, 2.1611328125, 2.3046875, 2.4482421875, 2.591796875, 2.7353515625, 2.87890625, 3.0224609375, 3.166015625, 3.3095703125, 3.453125, 3.5966796875, 3.740234375, 3.8837890625, 4.02734375, 4.1708984375, 4.314453125, 4.4580078125, 4.6015625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 7.0, 8.0, 7.0, 19.0, 19.0, 19.0, 25.0, 34.0, 32.0, 38.0, 58.0, 57.0, 53.0, 58.0, 61.0, 55.0, 58.0, 60.0, 54.0, 43.0, 43.0, 39.0, 33.0, 26.0, 12.0, 15.0, 19.0, 15.0, 10.0, 9.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.27734375, -2.189971923828125, -2.10260009765625, -2.015228271484375, -1.9278564453125, -1.840484619140625, -1.75311279296875, -1.665740966796875, -1.578369140625, -1.490997314453125, -1.40362548828125, -1.316253662109375, -1.2288818359375, -1.141510009765625, -1.05413818359375, -0.966766357421875, -0.87939453125, -0.792022705078125, -0.70465087890625, -0.617279052734375, -0.5299072265625, -0.442535400390625, -0.35516357421875, -0.267791748046875, -0.180419921875, -0.093048095703125, -0.00567626953125, 0.081695556640625, 0.1690673828125, 0.256439208984375, 0.34381103515625, 0.431182861328125, 0.5185546875, 0.605926513671875, 0.69329833984375, 0.780670166015625, 0.8680419921875, 0.955413818359375, 1.04278564453125, 1.130157470703125, 1.217529296875, 1.304901123046875, 1.39227294921875, 1.479644775390625, 1.5670166015625, 1.654388427734375, 1.74176025390625, 1.829132080078125, 1.91650390625, 2.003875732421875, 2.09124755859375, 2.178619384765625, 2.2659912109375, 2.353363037109375, 2.44073486328125, 2.528106689453125, 2.615478515625, 2.702850341796875, 2.79022216796875, 2.877593994140625, 2.9649658203125, 3.052337646484375, 3.13970947265625, 3.227081298828125, 3.314453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 11.0, 11.0, 10.0, 9.0, 30.0, 47.0, 62.0, 73.0, 137.0, 261.0, 602.0, 1315.0, 3364.0, 10790.0, 47544.0, 362514.0, 3323509.0, 379673.0, 47879.0, 10814.0, 3292.0, 1217.0, 507.0, 235.0, 145.0, 67.0, 52.0, 28.0, 22.0, 16.0, 5.0, 15.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -8.032470703125, -7.76025390625, -7.488037109375, -7.2158203125, -6.943603515625, -6.67138671875, -6.399169921875, -6.126953125, -5.854736328125, -5.58251953125, -5.310302734375, -5.0380859375, -4.765869140625, -4.49365234375, -4.221435546875, -3.94921875, -3.677001953125, -3.40478515625, -3.132568359375, -2.8603515625, -2.588134765625, -2.31591796875, -2.043701171875, -1.771484375, -1.499267578125, -1.22705078125, -0.954833984375, -0.6826171875, -0.410400390625, -0.13818359375, 0.134033203125, 0.40625, 0.678466796875, 0.95068359375, 1.222900390625, 1.4951171875, 1.767333984375, 2.03955078125, 2.311767578125, 2.583984375, 2.856201171875, 3.12841796875, 3.400634765625, 3.6728515625, 3.945068359375, 4.21728515625, 4.489501953125, 4.76171875, 5.033935546875, 5.30615234375, 5.578369140625, 5.8505859375, 6.122802734375, 6.39501953125, 6.667236328125, 6.939453125, 7.211669921875, 7.48388671875, 7.756103515625, 8.0283203125, 8.300537109375, 8.57275390625, 8.844970703125, 9.1171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 8.0, 7.0, 6.0, 9.0, 19.0, 22.0, 32.0, 27.0, 57.0, 79.0, 116.0, 172.0, 289.0, 495.0, 803.0, 774.0, 448.0, 262.0, 145.0, 104.0, 49.0, 42.0, 34.0, 21.0, 15.0, 12.0, 5.0, 8.0, 7.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2578125, -7.98974609375, -7.7216796875, -7.45361328125, -7.185546875, -6.91748046875, -6.6494140625, -6.38134765625, -6.11328125, -5.84521484375, -5.5771484375, -5.30908203125, -5.041015625, -4.77294921875, -4.5048828125, -4.23681640625, -3.96875, -3.70068359375, -3.4326171875, -3.16455078125, -2.896484375, -2.62841796875, -2.3603515625, -2.09228515625, -1.82421875, -1.55615234375, -1.2880859375, -1.02001953125, -0.751953125, -0.48388671875, -0.2158203125, 0.05224609375, 0.3203125, 0.58837890625, 0.8564453125, 1.12451171875, 1.392578125, 1.66064453125, 1.9287109375, 2.19677734375, 2.46484375, 2.73291015625, 3.0009765625, 3.26904296875, 3.537109375, 3.80517578125, 4.0732421875, 4.34130859375, 4.609375, 4.87744140625, 5.1455078125, 5.41357421875, 5.681640625, 5.94970703125, 6.2177734375, 6.48583984375, 6.75390625, 7.02197265625, 7.2900390625, 7.55810546875, 7.826171875, 8.09423828125, 8.3623046875, 8.63037109375, 8.8984375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 2.0, 8.0, 7.0, 14.0, 28.0, 35.0, 79.0, 150.0, 192.0, 193.0, 128.0, 77.0, 33.0, 25.0, 10.0, 1.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.24327087402344, -75.37190246582031, -72.50053405761719, -69.62916564941406, -66.7577896118164, -63.88642120361328, -61.015052795410156, -58.14368438720703, -55.27231216430664, -52.400943756103516, -49.529571533203125, -46.658203125, -43.786834716796875, -40.915462493896484, -38.04409408569336, -35.17272186279297, -32.301353454589844, -29.429983139038086, -26.558612823486328, -23.687244415283203, -20.815874099731445, -17.944503784179688, -15.073135375976562, -12.201765060424805, -9.330394744873047, -6.459024906158447, -3.5876550674438477, -0.7162857055664062, 2.1550846099853516, 5.026454925537109, 7.897823333740234, 10.769193649291992, 13.640556335449219, 16.511926651000977, 19.383296966552734, 22.25466537475586, 25.126035690307617, 27.997406005859375, 30.8687744140625, 33.740142822265625, 36.611515045166016, 39.48288345336914, 42.35425567626953, 45.225624084472656, 48.09699249267578, 50.96836471557617, 53.8397331237793, 56.71110534667969, 59.58247375488281, 62.45384216308594, 65.32521057128906, 68.19657897949219, 71.06795501708984, 73.93932342529297, 76.8106918334961, 79.68206024169922, 82.55343627929688, 85.4248046875, 88.29617309570312, 91.16754150390625, 94.0389175415039, 96.91028594970703, 99.78165435791016, 102.65302276611328, 105.5243911743164]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 4.0, 6.0, 7.0, 8.0, 11.0, 9.0, 11.0, 9.0, 16.0, 17.0, 30.0, 25.0, 23.0, 24.0, 24.0, 42.0, 30.0, 49.0, 50.0, 44.0, 41.0, 37.0, 32.0, 34.0, 38.0, 47.0, 33.0, 30.0, 44.0, 33.0, 26.0, 31.0, 16.0, 19.0, 17.0, 13.0, 12.0, 13.0, 10.0, 3.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-34.006317138671875, -32.975563049316406, -31.944805145263672, -30.91404914855957, -29.88329315185547, -28.8525390625, -27.8217830657959, -26.791027069091797, -25.760271072387695, -24.729515075683594, -23.698759078979492, -22.66800308227539, -21.637248992919922, -20.606491088867188, -19.57573699951172, -18.544981002807617, -17.514225006103516, -16.483469009399414, -15.452713012695312, -14.421957969665527, -13.391201972961426, -12.360445976257324, -11.329690933227539, -10.298934936523438, -9.268178939819336, -8.237422943115234, -7.206667423248291, -6.175911903381348, -5.145155906677246, -4.1143999099731445, -3.083644390106201, -2.052888870239258, -1.0221366882324219, 0.008619070053100586, 1.039374828338623, 2.0701305866241455, 3.100886344909668, 4.1316423416137695, 5.162397861480713, 6.193153381347656, 7.223909378051758, 8.25466537475586, 9.285421371459961, 10.316176414489746, 11.346932411193848, 12.37768840789795, 13.408443450927734, 14.439199447631836, 15.469955444335938, 16.50071144104004, 17.53146743774414, 18.562223434448242, 19.592979431152344, 20.623733520507812, 21.654489517211914, 22.685245513916016, 23.716001510620117, 24.74675750732422, 25.77751350402832, 26.808269500732422, 27.83902359008789, 28.869781494140625, 29.900535583496094, 30.931291580200195, 31.962047576904297]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 9.0, 6.0, 11.0, 17.0, 26.0, 35.0, 83.0, 120.0, 187.0, 330.0, 554.0, 933.0, 1551.0, 2972.0, 5745.0, 11324.0, 23313.0, 51120.0, 134884.0, 400691.0, 260800.0, 83822.0, 35628.0, 16612.0, 8219.0, 4129.0, 2242.0, 1274.0, 788.0, 478.0, 238.0, 166.0, 96.0, 51.0, 34.0, 33.0, 13.0, 8.0, 6.0, 7.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-7.4453125, -7.2532958984375, -7.061279296875, -6.8692626953125, -6.67724609375, -6.4852294921875, -6.293212890625, -6.1011962890625, -5.9091796875, -5.7171630859375, -5.525146484375, -5.3331298828125, -5.14111328125, -4.9490966796875, -4.757080078125, -4.5650634765625, -4.373046875, -4.1810302734375, -3.989013671875, -3.7969970703125, -3.60498046875, -3.4129638671875, -3.220947265625, -3.0289306640625, -2.8369140625, -2.6448974609375, -2.452880859375, -2.2608642578125, -2.06884765625, -1.8768310546875, -1.684814453125, -1.4927978515625, -1.30078125, -1.1087646484375, -0.916748046875, -0.7247314453125, -0.53271484375, -0.3406982421875, -0.148681640625, 0.0433349609375, 0.2353515625, 0.4273681640625, 0.619384765625, 0.8114013671875, 1.00341796875, 1.1954345703125, 1.387451171875, 1.5794677734375, 1.771484375, 1.9635009765625, 2.155517578125, 2.3475341796875, 2.53955078125, 2.7315673828125, 2.923583984375, 3.1156005859375, 3.3076171875, 3.4996337890625, 3.691650390625, 3.8836669921875, 4.07568359375, 4.2677001953125, 4.459716796875, 4.6517333984375, 4.84375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 9.0, 6.0, 10.0, 6.0, 13.0, 17.0, 23.0, 29.0, 45.0, 34.0, 46.0, 54.0, 69.0, 61.0, 61.0, 74.0, 69.0, 55.0, 63.0, 50.0, 35.0, 39.0, 28.0, 27.0, 21.0, 14.0, 14.0, 7.0, 12.0, 7.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.66015625, -2.5592041015625, -2.458251953125, -2.3572998046875, -2.25634765625, -2.1553955078125, -2.054443359375, -1.9534912109375, -1.8525390625, -1.7515869140625, -1.650634765625, -1.5496826171875, -1.44873046875, -1.3477783203125, -1.246826171875, -1.1458740234375, -1.044921875, -0.9439697265625, -0.843017578125, -0.7420654296875, -0.64111328125, -0.5401611328125, -0.439208984375, -0.3382568359375, -0.2373046875, -0.1363525390625, -0.035400390625, 0.0655517578125, 0.16650390625, 0.2674560546875, 0.368408203125, 0.4693603515625, 0.5703125, 0.6712646484375, 0.772216796875, 0.8731689453125, 0.97412109375, 1.0750732421875, 1.176025390625, 1.2769775390625, 1.3779296875, 1.4788818359375, 1.579833984375, 1.6807861328125, 1.78173828125, 1.8826904296875, 1.983642578125, 2.0845947265625, 2.185546875, 2.2864990234375, 2.387451171875, 2.4884033203125, 2.58935546875, 2.6903076171875, 2.791259765625, 2.8922119140625, 2.9931640625, 3.0941162109375, 3.195068359375, 3.2960205078125, 3.39697265625, 3.4979248046875, 3.598876953125, 3.6998291015625, 3.80078125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 11.0, 7.0, 16.0, 20.0, 22.0, 24.0, 68.0, 104.0, 161.0, 281.0, 513.0, 1009.0, 2784.0, 12463.0, 190457.0, 802911.0, 30299.0, 4413.0, 1489.0, 663.0, 327.0, 159.0, 122.0, 75.0, 54.0, 32.0, 18.0, 13.0, 13.0, 6.0, 6.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3125, -14.6796875, -14.046875, -13.4140625, -12.78125, -12.1484375, -11.515625, -10.8828125, -10.25, -9.6171875, -8.984375, -8.3515625, -7.71875, -7.0859375, -6.453125, -5.8203125, -5.1875, -4.5546875, -3.921875, -3.2890625, -2.65625, -2.0234375, -1.390625, -0.7578125, -0.125, 0.5078125, 1.140625, 1.7734375, 2.40625, 3.0390625, 3.671875, 4.3046875, 4.9375, 5.5703125, 6.203125, 6.8359375, 7.46875, 8.1015625, 8.734375, 9.3671875, 10.0, 10.6328125, 11.265625, 11.8984375, 12.53125, 13.1640625, 13.796875, 14.4296875, 15.0625, 15.6953125, 16.328125, 16.9609375, 17.59375, 18.2265625, 18.859375, 19.4921875, 20.125, 20.7578125, 21.390625, 22.0234375, 22.65625, 23.2890625, 23.921875, 24.5546875, 25.1875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 8.0, 4.0, 16.0, 18.0, 18.0, 20.0, 19.0, 25.0, 36.0, 38.0, 31.0, 42.0, 42.0, 51.0, 47.0, 47.0, 48.0, 61.0, 57.0, 62.0, 44.0, 36.0, 35.0, 25.0, 25.0, 15.0, 23.0, 17.0, 10.0, 11.0, 12.0, 12.0, 6.0, 8.0, 6.0, 6.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.6640625, -11.2681884765625, -10.872314453125, -10.4764404296875, -10.08056640625, -9.6846923828125, -9.288818359375, -8.8929443359375, -8.4970703125, -8.1011962890625, -7.705322265625, -7.3094482421875, -6.91357421875, -6.5177001953125, -6.121826171875, -5.7259521484375, -5.330078125, -4.9342041015625, -4.538330078125, -4.1424560546875, -3.74658203125, -3.3507080078125, -2.954833984375, -2.5589599609375, -2.1630859375, -1.7672119140625, -1.371337890625, -0.9754638671875, -0.57958984375, -0.1837158203125, 0.212158203125, 0.6080322265625, 1.00390625, 1.3997802734375, 1.795654296875, 2.1915283203125, 2.58740234375, 2.9832763671875, 3.379150390625, 3.7750244140625, 4.1708984375, 4.5667724609375, 4.962646484375, 5.3585205078125, 5.75439453125, 6.1502685546875, 6.546142578125, 6.9420166015625, 7.337890625, 7.7337646484375, 8.129638671875, 8.5255126953125, 8.92138671875, 9.3172607421875, 9.713134765625, 10.1090087890625, 10.5048828125, 10.9007568359375, 11.296630859375, 11.6925048828125, 12.08837890625, 12.4842529296875, 12.880126953125, 13.2760009765625, 13.671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 4.0, 5.0, 4.0, 5.0, 5.0, 15.0, 14.0, 16.0, 35.0, 54.0, 108.0, 242.0, 615.0, 2291.0, 14340.0, 226018.0, 772012.0, 27443.0, 3842.0, 856.0, 325.0, 127.0, 61.0, 44.0, 16.0, 26.0, 7.0, 8.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5, -8.1749267578125, -7.849853515625, -7.5247802734375, -7.19970703125, -6.8746337890625, -6.549560546875, -6.2244873046875, -5.8994140625, -5.5743408203125, -5.249267578125, -4.9241943359375, -4.59912109375, -4.2740478515625, -3.948974609375, -3.6239013671875, -3.298828125, -2.9737548828125, -2.648681640625, -2.3236083984375, -1.99853515625, -1.6734619140625, -1.348388671875, -1.0233154296875, -0.6982421875, -0.3731689453125, -0.048095703125, 0.2769775390625, 0.60205078125, 0.9271240234375, 1.252197265625, 1.5772705078125, 1.90234375, 2.2274169921875, 2.552490234375, 2.8775634765625, 3.20263671875, 3.5277099609375, 3.852783203125, 4.1778564453125, 4.5029296875, 4.8280029296875, 5.153076171875, 5.4781494140625, 5.80322265625, 6.1282958984375, 6.453369140625, 6.7784423828125, 7.103515625, 7.4285888671875, 7.753662109375, 8.0787353515625, 8.40380859375, 8.7288818359375, 9.053955078125, 9.3790283203125, 9.7041015625, 10.0291748046875, 10.354248046875, 10.6793212890625, 11.00439453125, 11.3294677734375, 11.654541015625, 11.9796142578125, 12.3046875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 5.0, 9.0, 8.0, 8.0, 10.0, 23.0, 36.0, 46.0, 70.0, 119.0, 277.0, 150.0, 80.0, 53.0, 20.0, 17.0, 16.0, 11.0, 13.0, 12.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017442703247070312, -0.0016854554414749146, -0.0016266405582427979, -0.0015678256750106812, -0.0015090107917785645, -0.0014501959085464478, -0.001391381025314331, -0.0013325661420822144, -0.0012737512588500977, -0.001214936375617981, -0.0011561214923858643, -0.0010973066091537476, -0.0010384917259216309, -0.0009796768426895142, -0.0009208619594573975, -0.0008620470762252808, -0.0008032321929931641, -0.0007444173097610474, -0.0006856024265289307, -0.000626787543296814, -0.0005679726600646973, -0.0005091577768325806, -0.00045034289360046387, -0.00039152801036834717, -0.00033271312713623047, -0.00027389824390411377, -0.00021508336067199707, -0.00015626847743988037, -9.745359420776367e-05, -3.863871097564697e-05, 2.0176172256469727e-05, 7.899105548858643e-05, 0.00013780593872070312, 0.00019662082195281982, 0.0002554357051849365, 0.0003142505884170532, 0.0003730654716491699, 0.0004318803548812866, 0.0004906952381134033, 0.00054951012134552, 0.0006083250045776367, 0.0006671398878097534, 0.0007259547710418701, 0.0007847696542739868, 0.0008435845375061035, 0.0009023994207382202, 0.0009612143039703369, 0.0010200291872024536, 0.0010788440704345703, 0.001137658953666687, 0.0011964738368988037, 0.0012552887201309204, 0.0013141036033630371, 0.0013729184865951538, 0.0014317333698272705, 0.0014905482530593872, 0.001549363136291504, 0.0016081780195236206, 0.0016669929027557373, 0.001725807785987854, 0.0017846226692199707, 0.0018434375524520874, 0.001902252435684204, 0.001961067318916321, 0.0020198822021484375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 2.0, 1.0, 9.0, 8.0, 8.0, 8.0, 17.0, 26.0, 42.0, 45.0, 57.0, 103.0, 154.0, 210.0, 335.0, 509.0, 1029.0, 1828.0, 3946.0, 11409.0, 50100.0, 600061.0, 326356.0, 35765.0, 9265.0, 3396.0, 1709.0, 802.0, 488.0, 276.0, 194.0, 101.0, 86.0, 56.0, 43.0, 21.0, 15.0, 15.0, 14.0, 15.0, 13.0, 4.0, 5.0, 0.0, 2.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.47265625, -6.28173828125, -6.0908203125, -5.89990234375, -5.708984375, -5.51806640625, -5.3271484375, -5.13623046875, -4.9453125, -4.75439453125, -4.5634765625, -4.37255859375, -4.181640625, -3.99072265625, -3.7998046875, -3.60888671875, -3.41796875, -3.22705078125, -3.0361328125, -2.84521484375, -2.654296875, -2.46337890625, -2.2724609375, -2.08154296875, -1.890625, -1.69970703125, -1.5087890625, -1.31787109375, -1.126953125, -0.93603515625, -0.7451171875, -0.55419921875, -0.36328125, -0.17236328125, 0.0185546875, 0.20947265625, 0.400390625, 0.59130859375, 0.7822265625, 0.97314453125, 1.1640625, 1.35498046875, 1.5458984375, 1.73681640625, 1.927734375, 2.11865234375, 2.3095703125, 2.50048828125, 2.69140625, 2.88232421875, 3.0732421875, 3.26416015625, 3.455078125, 3.64599609375, 3.8369140625, 4.02783203125, 4.21875, 4.40966796875, 4.6005859375, 4.79150390625, 4.982421875, 5.17333984375, 5.3642578125, 5.55517578125, 5.74609375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 8.0, 10.0, 10.0, 8.0, 12.0, 20.0, 29.0, 29.0, 47.0, 74.0, 114.0, 124.0, 105.0, 109.0, 81.0, 53.0, 39.0, 30.0, 20.0, 24.0, 11.0, 12.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.04888916015625, -4.8477783203125, -4.64666748046875, -4.445556640625, -4.24444580078125, -4.0433349609375, -3.84222412109375, -3.64111328125, -3.44000244140625, -3.2388916015625, -3.03778076171875, -2.836669921875, -2.63555908203125, -2.4344482421875, -2.23333740234375, -2.0322265625, -1.83111572265625, -1.6300048828125, -1.42889404296875, -1.227783203125, -1.02667236328125, -0.8255615234375, -0.62445068359375, -0.42333984375, -0.22222900390625, -0.0211181640625, 0.17999267578125, 0.381103515625, 0.58221435546875, 0.7833251953125, 0.98443603515625, 1.185546875, 1.38665771484375, 1.5877685546875, 1.78887939453125, 1.989990234375, 2.19110107421875, 2.3922119140625, 2.59332275390625, 2.79443359375, 2.99554443359375, 3.1966552734375, 3.39776611328125, 3.598876953125, 3.79998779296875, 4.0010986328125, 4.20220947265625, 4.4033203125, 4.60443115234375, 4.8055419921875, 5.00665283203125, 5.207763671875, 5.40887451171875, 5.6099853515625, 5.81109619140625, 6.01220703125, 6.21331787109375, 6.4144287109375, 6.61553955078125, 6.816650390625, 7.01776123046875, 7.2188720703125, 7.41998291015625, 7.62109375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 18.0, 27.0, 78.0, 104.0, 182.0, 240.0, 162.0, 84.0, 54.0, 14.0, 10.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.79753112792969, -91.1848373413086, -87.57213592529297, -83.95944213867188, -80.34674072265625, -76.73404693603516, -73.12134552001953, -69.50865173339844, -65.89595031738281, -62.28325271606445, -58.670555114746094, -55.057857513427734, -51.445159912109375, -47.83246612548828, -44.219764709472656, -40.60707092285156, -36.9943733215332, -33.381675720214844, -29.768978118896484, -26.156280517578125, -22.543582916259766, -18.93088722229004, -15.31818962097168, -11.70549201965332, -8.092794418334961, -4.480096817016602, -0.8673996925354004, 2.745297431945801, 6.35799503326416, 9.970691680908203, 13.583389282226562, 17.196086883544922, 20.80878448486328, 24.42148208618164, 28.0341796875, 31.64687728881836, 35.25957489013672, 38.87226867675781, 42.48497009277344, 46.09766387939453, 49.710365295410156, 53.323062896728516, 56.935760498046875, 60.548458099365234, 64.1611557006836, 67.77384948730469, 71.38655090332031, 74.9992446899414, 78.6119384765625, 82.2246322631836, 85.83733367919922, 89.45002746582031, 93.06272888183594, 96.67542266845703, 100.28812408447266, 103.90081787109375, 107.51351928710938, 111.12621307373047, 114.7389144897461, 118.35160827636719, 121.96430969238281, 125.5770034790039, 129.189697265625, 132.80239868164062, 136.41510009765625]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 10.0, 21.0, 14.0, 14.0, 17.0, 32.0, 45.0, 54.0, 58.0, 59.0, 60.0, 83.0, 94.0, 94.0, 64.0, 59.0, 51.0, 33.0, 44.0, 33.0, 17.0, 19.0, 18.0, 4.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-107.73379516601562, -105.35274505615234, -102.9717025756836, -100.59065246582031, -98.20960998535156, -95.82855987548828, -93.44751739501953, -91.06646728515625, -88.6854248046875, -86.30437469482422, -83.92333221435547, -81.54228210449219, -79.16123962402344, -76.78018951416016, -74.3991470336914, -72.01809692382812, -69.63704681396484, -67.25599670410156, -64.87495422363281, -62.4939079284668, -60.11286163330078, -57.7318115234375, -55.350765228271484, -52.96971893310547, -50.58867263793945, -48.20762634277344, -45.82658004760742, -43.445533752441406, -41.064483642578125, -38.683441162109375, -36.302391052246094, -33.92134475708008, -31.540302276611328, -29.159255981445312, -26.778209686279297, -24.39716148376465, -22.016115188598633, -19.635068893432617, -17.25402069091797, -14.872974395751953, -12.491928100585938, -10.110881805419922, -7.72983455657959, -5.348787784576416, -2.967741012573242, -0.5866947174072266, 1.7943525314331055, 4.1753997802734375, 6.556446075439453, 8.937492370605469, 11.3185396194458, 13.699586868286133, 16.08063316345215, 18.461679458618164, 20.842727661132812, 23.223773956298828, 25.604820251464844, 27.98586654663086, 30.366912841796875, 32.74795913696289, 35.129005432128906, 37.51005554199219, 39.8911018371582, 42.27214813232422, 44.653194427490234]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 6.0, 17.0, 18.0, 13.0, 16.0, 36.0, 34.0, 47.0, 76.0, 78.0, 133.0, 226.0, 472.0, 2231.0, 31538.0, 3626337.0, 520772.0, 10067.0, 1117.0, 350.0, 209.0, 116.0, 89.0, 69.0, 49.0, 31.0, 30.0, 27.0, 18.0, 13.0, 8.0, 6.0, 6.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.984375, -17.4677734375, -16.951171875, -16.4345703125, -15.91796875, -15.4013671875, -14.884765625, -14.3681640625, -13.8515625, -13.3349609375, -12.818359375, -12.3017578125, -11.78515625, -11.2685546875, -10.751953125, -10.2353515625, -9.71875, -9.2021484375, -8.685546875, -8.1689453125, -7.65234375, -7.1357421875, -6.619140625, -6.1025390625, -5.5859375, -5.0693359375, -4.552734375, -4.0361328125, -3.51953125, -3.0029296875, -2.486328125, -1.9697265625, -1.453125, -0.9365234375, -0.419921875, 0.0966796875, 0.61328125, 1.1298828125, 1.646484375, 2.1630859375, 2.6796875, 3.1962890625, 3.712890625, 4.2294921875, 4.74609375, 5.2626953125, 5.779296875, 6.2958984375, 6.8125, 7.3291015625, 7.845703125, 8.3623046875, 8.87890625, 9.3955078125, 9.912109375, 10.4287109375, 10.9453125, 11.4619140625, 11.978515625, 12.4951171875, 13.01171875, 13.5283203125, 14.044921875, 14.5615234375, 15.078125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 9.0, 17.0, 17.0, 32.0, 43.0, 65.0, 72.0, 103.0, 122.0, 97.0, 125.0, 86.0, 56.0, 52.0, 43.0, 30.0, 16.0, 9.0, 7.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.95703125, -7.791748046875, -7.62646484375, -7.461181640625, -7.2958984375, -7.130615234375, -6.96533203125, -6.800048828125, -6.634765625, -6.469482421875, -6.30419921875, -6.138916015625, -5.9736328125, -5.808349609375, -5.64306640625, -5.477783203125, -5.3125, -5.147216796875, -4.98193359375, -4.816650390625, -4.6513671875, -4.486083984375, -4.32080078125, -4.155517578125, -3.990234375, -3.824951171875, -3.65966796875, -3.494384765625, -3.3291015625, -3.163818359375, -2.99853515625, -2.833251953125, -2.66796875, -2.502685546875, -2.33740234375, -2.172119140625, -2.0068359375, -1.841552734375, -1.67626953125, -1.510986328125, -1.345703125, -1.180419921875, -1.01513671875, -0.849853515625, -0.6845703125, -0.519287109375, -0.35400390625, -0.188720703125, -0.0234375, 0.141845703125, 0.30712890625, 0.472412109375, 0.6376953125, 0.802978515625, 0.96826171875, 1.133544921875, 1.298828125, 1.464111328125, 1.62939453125, 1.794677734375, 1.9599609375, 2.125244140625, 2.29052734375, 2.455810546875, 2.62109375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 10.0, 25.0, 35.0, 45.0, 103.0, 209.0, 392.0, 885.0, 2385.0, 7395.0, 26101.0, 123185.0, 1190340.0, 2556944.0, 229228.0, 40044.0, 10930.0, 3494.0, 1358.0, 547.0, 290.0, 134.0, 63.0, 50.0, 23.0, 23.0, 11.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.90625, -6.67730712890625, -6.4483642578125, -6.21942138671875, -5.990478515625, -5.76153564453125, -5.5325927734375, -5.30364990234375, -5.07470703125, -4.84576416015625, -4.6168212890625, -4.38787841796875, -4.158935546875, -3.92999267578125, -3.7010498046875, -3.47210693359375, -3.2431640625, -3.01422119140625, -2.7852783203125, -2.55633544921875, -2.327392578125, -2.09844970703125, -1.8695068359375, -1.64056396484375, -1.41162109375, -1.18267822265625, -0.9537353515625, -0.72479248046875, -0.495849609375, -0.26690673828125, -0.0379638671875, 0.19097900390625, 0.419921875, 0.64886474609375, 0.8778076171875, 1.10675048828125, 1.335693359375, 1.56463623046875, 1.7935791015625, 2.02252197265625, 2.25146484375, 2.48040771484375, 2.7093505859375, 2.93829345703125, 3.167236328125, 3.39617919921875, 3.6251220703125, 3.85406494140625, 4.0830078125, 4.31195068359375, 4.5408935546875, 4.76983642578125, 4.998779296875, 5.22772216796875, 5.4566650390625, 5.68560791015625, 5.91455078125, 6.14349365234375, 6.3724365234375, 6.60137939453125, 6.830322265625, 7.05926513671875, 7.2882080078125, 7.51715087890625, 7.74609375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 5.0, 3.0, 8.0, 10.0, 10.0, 13.0, 13.0, 35.0, 36.0, 64.0, 66.0, 81.0, 121.0, 190.0, 269.0, 427.0, 589.0, 613.0, 483.0, 332.0, 196.0, 159.0, 96.0, 69.0, 47.0, 28.0, 17.0, 22.0, 15.0, 11.0, 2.0, 11.0, 9.0, 7.0, 6.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.74609375, -5.542236328125, -5.33837890625, -5.134521484375, -4.9306640625, -4.726806640625, -4.52294921875, -4.319091796875, -4.115234375, -3.911376953125, -3.70751953125, -3.503662109375, -3.2998046875, -3.095947265625, -2.89208984375, -2.688232421875, -2.484375, -2.280517578125, -2.07666015625, -1.872802734375, -1.6689453125, -1.465087890625, -1.26123046875, -1.057373046875, -0.853515625, -0.649658203125, -0.44580078125, -0.241943359375, -0.0380859375, 0.165771484375, 0.36962890625, 0.573486328125, 0.77734375, 0.981201171875, 1.18505859375, 1.388916015625, 1.5927734375, 1.796630859375, 2.00048828125, 2.204345703125, 2.408203125, 2.612060546875, 2.81591796875, 3.019775390625, 3.2236328125, 3.427490234375, 3.63134765625, 3.835205078125, 4.0390625, 4.242919921875, 4.44677734375, 4.650634765625, 4.8544921875, 5.058349609375, 5.26220703125, 5.466064453125, 5.669921875, 5.873779296875, 6.07763671875, 6.281494140625, 6.4853515625, 6.689208984375, 6.89306640625, 7.096923828125, 7.30078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 4.0, 4.0, 5.0, 9.0, 17.0, 33.0, 93.0, 191.0, 262.0, 244.0, 87.0, 31.0, 9.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.6290283203125, -130.35536193847656, -127.08169555664062, -123.80802917480469, -120.53436279296875, -117.26069641113281, -113.98703002929688, -110.71336364746094, -107.439697265625, -104.16603088378906, -100.89236450195312, -97.61869812011719, -94.34503173828125, -91.07136535644531, -87.79769897460938, -84.52403259277344, -81.2503662109375, -77.97669982910156, -74.70303344726562, -71.42936706542969, -68.15570068359375, -64.88203430175781, -61.608367919921875, -58.33470153808594, -55.06103515625, -51.78736877441406, -48.513702392578125, -45.24003601074219, -41.96636962890625, -38.69270324707031, -35.419036865234375, -32.14537048339844, -28.8717041015625, -25.598037719726562, -22.324371337890625, -19.050704956054688, -15.77703857421875, -12.503372192382812, -9.229705810546875, -5.9560394287109375, -2.682373046875, 0.5912933349609375, 3.864959716796875, 7.1386260986328125, 10.41229248046875, 13.685958862304688, 16.959625244140625, 20.233291625976562, 23.5069580078125, 26.780624389648438, 30.054290771484375, 33.32795715332031, 36.60162353515625, 39.87528991699219, 43.148956298828125, 46.42262268066406, 49.6962890625, 52.96995544433594, 56.243621826171875, 59.51728820800781, 62.79095458984375, 66.06462097167969, 69.33828735351562, 72.61195373535156, 75.8856201171875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 7.0, 7.0, 7.0, 8.0, 14.0, 9.0, 18.0, 23.0, 19.0, 28.0, 31.0, 36.0, 35.0, 38.0, 47.0, 47.0, 36.0, 49.0, 41.0, 41.0, 48.0, 49.0, 38.0, 42.0, 38.0, 29.0, 33.0, 21.0, 21.0, 24.0, 20.0, 15.0, 15.0, 11.0, 8.0, 6.0, 7.0, 7.0, 4.0, 5.0, 1.0, 3.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-30.170644760131836, -29.19820785522461, -28.22576904296875, -27.253332138061523, -26.280895233154297, -25.308456420898438, -24.33601951599121, -23.363582611083984, -22.391143798828125, -21.4187068939209, -20.44626808166504, -19.473831176757812, -18.501394271850586, -17.52895736694336, -16.5565185546875, -15.584081649780273, -14.611644744873047, -13.639206886291504, -12.666769981384277, -11.694332122802734, -10.721895217895508, -9.749457359313965, -8.777019500732422, -7.804582118988037, -6.832144737243652, -5.859707355499268, -4.887269973754883, -3.91483211517334, -2.942394733428955, -1.9699573516845703, -0.9975194931030273, -0.025082111358642578, 0.9473533630371094, 1.9197908639907837, 2.892228364944458, 3.864665985107422, 4.837103366851807, 5.809540748596191, 6.781978607177734, 7.754415988922119, 8.726853370666504, 9.699291229248047, 10.671728134155273, 11.644165992736816, 12.61660385131836, 13.589040756225586, 14.561478614807129, 15.533916473388672, 16.5063533782959, 17.478790283203125, 18.451229095458984, 19.42366600036621, 20.396102905273438, 21.368541717529297, 22.340978622436523, 23.31341552734375, 24.28585433959961, 25.258291244506836, 26.230730056762695, 27.203166961669922, 28.17560386657715, 29.148040771484375, 30.120479583740234, 31.09291648864746, 32.06535339355469]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 7.0, 10.0, 18.0, 22.0, 39.0, 60.0, 102.0, 179.0, 285.0, 518.0, 1004.0, 1883.0, 4019.0, 8922.0, 21513.0, 59443.0, 232645.0, 500646.0, 145426.0, 42205.0, 16121.0, 6851.0, 3132.0, 1551.0, 848.0, 450.0, 238.0, 151.0, 109.0, 50.0, 36.0, 27.0, 7.0, 15.0, 7.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.33203125, -6.108642578125, -5.88525390625, -5.661865234375, -5.4384765625, -5.215087890625, -4.99169921875, -4.768310546875, -4.544921875, -4.321533203125, -4.09814453125, -3.874755859375, -3.6513671875, -3.427978515625, -3.20458984375, -2.981201171875, -2.7578125, -2.534423828125, -2.31103515625, -2.087646484375, -1.8642578125, -1.640869140625, -1.41748046875, -1.194091796875, -0.970703125, -0.747314453125, -0.52392578125, -0.300537109375, -0.0771484375, 0.146240234375, 0.36962890625, 0.593017578125, 0.81640625, 1.039794921875, 1.26318359375, 1.486572265625, 1.7099609375, 1.933349609375, 2.15673828125, 2.380126953125, 2.603515625, 2.826904296875, 3.05029296875, 3.273681640625, 3.4970703125, 3.720458984375, 3.94384765625, 4.167236328125, 4.390625, 4.614013671875, 4.83740234375, 5.060791015625, 5.2841796875, 5.507568359375, 5.73095703125, 5.954345703125, 6.177734375, 6.401123046875, 6.62451171875, 6.847900390625, 7.0712890625, 7.294677734375, 7.51806640625, 7.741455078125, 7.96484375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 8.0, 11.0, 21.0, 14.0, 22.0, 28.0, 28.0, 47.0, 42.0, 66.0, 58.0, 67.0, 70.0, 78.0, 71.0, 65.0, 56.0, 51.0, 45.0, 31.0, 24.0, 26.0, 20.0, 21.0, 7.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.1796875, -5.061920166015625, -4.94415283203125, -4.826385498046875, -4.7086181640625, -4.590850830078125, -4.47308349609375, -4.355316162109375, -4.237548828125, -4.119781494140625, -4.00201416015625, -3.884246826171875, -3.7664794921875, -3.648712158203125, -3.53094482421875, -3.413177490234375, -3.29541015625, -3.177642822265625, -3.05987548828125, -2.942108154296875, -2.8243408203125, -2.706573486328125, -2.58880615234375, -2.471038818359375, -2.353271484375, -2.235504150390625, -2.11773681640625, -1.999969482421875, -1.8822021484375, -1.764434814453125, -1.64666748046875, -1.528900146484375, -1.4111328125, -1.293365478515625, -1.17559814453125, -1.057830810546875, -0.9400634765625, -0.822296142578125, -0.70452880859375, -0.586761474609375, -0.468994140625, -0.351226806640625, -0.23345947265625, -0.115692138671875, 0.0020751953125, 0.119842529296875, 0.23760986328125, 0.355377197265625, 0.47314453125, 0.590911865234375, 0.70867919921875, 0.826446533203125, 0.9442138671875, 1.061981201171875, 1.17974853515625, 1.297515869140625, 1.415283203125, 1.533050537109375, 1.65081787109375, 1.768585205078125, 1.8863525390625, 2.004119873046875, 2.12188720703125, 2.239654541015625, 2.357421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 6.0, 12.0, 12.0, 16.0, 21.0, 33.0, 48.0, 65.0, 102.0, 162.0, 282.0, 453.0, 822.0, 1801.0, 5019.0, 19742.0, 139277.0, 773262.0, 85541.0, 14528.0, 4071.0, 1501.0, 718.0, 388.0, 240.0, 146.0, 93.0, 59.0, 36.0, 30.0, 20.0, 14.0, 11.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.1015625, -12.6971435546875, -12.292724609375, -11.8883056640625, -11.48388671875, -11.0794677734375, -10.675048828125, -10.2706298828125, -9.8662109375, -9.4617919921875, -9.057373046875, -8.6529541015625, -8.24853515625, -7.8441162109375, -7.439697265625, -7.0352783203125, -6.630859375, -6.2264404296875, -5.822021484375, -5.4176025390625, -5.01318359375, -4.6087646484375, -4.204345703125, -3.7999267578125, -3.3955078125, -2.9910888671875, -2.586669921875, -2.1822509765625, -1.77783203125, -1.3734130859375, -0.968994140625, -0.5645751953125, -0.16015625, 0.2442626953125, 0.648681640625, 1.0531005859375, 1.45751953125, 1.8619384765625, 2.266357421875, 2.6707763671875, 3.0751953125, 3.4796142578125, 3.884033203125, 4.2884521484375, 4.69287109375, 5.0972900390625, 5.501708984375, 5.9061279296875, 6.310546875, 6.7149658203125, 7.119384765625, 7.5238037109375, 7.92822265625, 8.3326416015625, 8.737060546875, 9.1414794921875, 9.5458984375, 9.9503173828125, 10.354736328125, 10.7591552734375, 11.16357421875, 11.5679931640625, 11.972412109375, 12.3768310546875, 12.78125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 8.0, 9.0, 13.0, 12.0, 9.0, 19.0, 30.0, 38.0, 37.0, 30.0, 52.0, 58.0, 60.0, 63.0, 73.0, 56.0, 65.0, 50.0, 56.0, 51.0, 49.0, 43.0, 23.0, 24.0, 15.0, 14.0, 8.0, 8.0, 10.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.2421875, -14.763916015625, -14.28564453125, -13.807373046875, -13.3291015625, -12.850830078125, -12.37255859375, -11.894287109375, -11.416015625, -10.937744140625, -10.45947265625, -9.981201171875, -9.5029296875, -9.024658203125, -8.54638671875, -8.068115234375, -7.58984375, -7.111572265625, -6.63330078125, -6.155029296875, -5.6767578125, -5.198486328125, -4.72021484375, -4.241943359375, -3.763671875, -3.285400390625, -2.80712890625, -2.328857421875, -1.8505859375, -1.372314453125, -0.89404296875, -0.415771484375, 0.0625, 0.540771484375, 1.01904296875, 1.497314453125, 1.9755859375, 2.453857421875, 2.93212890625, 3.410400390625, 3.888671875, 4.366943359375, 4.84521484375, 5.323486328125, 5.8017578125, 6.280029296875, 6.75830078125, 7.236572265625, 7.71484375, 8.193115234375, 8.67138671875, 9.149658203125, 9.6279296875, 10.106201171875, 10.58447265625, 11.062744140625, 11.541015625, 12.019287109375, 12.49755859375, 12.975830078125, 13.4541015625, 13.932373046875, 14.41064453125, 14.888916015625, 15.3671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 5.0, 3.0, 11.0, 14.0, 21.0, 50.0, 61.0, 148.0, 258.0, 778.0, 3354.0, 25169.0, 661329.0, 336395.0, 17335.0, 2498.0, 581.0, 237.0, 131.0, 49.0, 33.0, 23.0, 17.0, 7.0, 7.0, 4.0, 8.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.65625, -9.3629150390625, -9.069580078125, -8.7762451171875, -8.48291015625, -8.1895751953125, -7.896240234375, -7.6029052734375, -7.3095703125, -7.0162353515625, -6.722900390625, -6.4295654296875, -6.13623046875, -5.8428955078125, -5.549560546875, -5.2562255859375, -4.962890625, -4.6695556640625, -4.376220703125, -4.0828857421875, -3.78955078125, -3.4962158203125, -3.202880859375, -2.9095458984375, -2.6162109375, -2.3228759765625, -2.029541015625, -1.7362060546875, -1.44287109375, -1.1495361328125, -0.856201171875, -0.5628662109375, -0.26953125, 0.0238037109375, 0.317138671875, 0.6104736328125, 0.90380859375, 1.1971435546875, 1.490478515625, 1.7838134765625, 2.0771484375, 2.3704833984375, 2.663818359375, 2.9571533203125, 3.25048828125, 3.5438232421875, 3.837158203125, 4.1304931640625, 4.423828125, 4.7171630859375, 5.010498046875, 5.3038330078125, 5.59716796875, 5.8905029296875, 6.183837890625, 6.4771728515625, 6.7705078125, 7.0638427734375, 7.357177734375, 7.6505126953125, 7.94384765625, 8.2371826171875, 8.530517578125, 8.8238525390625, 9.1171875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 6.0, 0.0, 3.0, 4.0, 6.0, 6.0, 6.0, 5.0, 9.0, 15.0, 13.0, 22.0, 30.0, 38.0, 66.0, 73.0, 106.0, 148.0, 116.0, 98.0, 68.0, 41.0, 24.0, 22.0, 16.0, 10.0, 17.0, 8.0, 8.0, 5.0, 3.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011930465698242188, -0.0011573880910873413, -0.0011217296123504639, -0.0010860711336135864, -0.001050412654876709, -0.0010147541761398315, -0.000979095697402954, -0.0009434372186660767, -0.0009077787399291992, -0.0008721202611923218, -0.0008364617824554443, -0.0008008033037185669, -0.0007651448249816895, -0.000729486346244812, -0.0006938278675079346, -0.0006581693887710571, -0.0006225109100341797, -0.0005868524312973022, -0.0005511939525604248, -0.0005155354738235474, -0.0004798769950866699, -0.0004442185163497925, -0.00040856003761291504, -0.0003729015588760376, -0.00033724308013916016, -0.0003015846014022827, -0.0002659261226654053, -0.00023026764392852783, -0.0001946091651916504, -0.00015895068645477295, -0.0001232922077178955, -8.763372898101807e-05, -5.1975250244140625e-05, -1.6316771507263184e-05, 1.9341707229614258e-05, 5.50001859664917e-05, 9.065866470336914e-05, 0.00012631714344024658, 0.00016197562217712402, 0.00019763410091400146, 0.0002332925796508789, 0.00026895105838775635, 0.0003046095371246338, 0.00034026801586151123, 0.00037592649459838867, 0.0004115849733352661, 0.00044724345207214355, 0.000482901930809021, 0.0005185604095458984, 0.0005542188882827759, 0.0005898773670196533, 0.0006255358457565308, 0.0006611943244934082, 0.0006968528032302856, 0.0007325112819671631, 0.0007681697607040405, 0.000803828239440918, 0.0008394867181777954, 0.0008751451969146729, 0.0009108036756515503, 0.0009464621543884277, 0.0009821206331253052, 0.0010177791118621826, 0.00105343759059906, 0.0010890960693359375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 8.0, 8.0, 18.0, 20.0, 59.0, 75.0, 139.0, 268.0, 576.0, 1517.0, 5155.0, 30091.0, 421761.0, 546806.0, 33634.0, 5542.0, 1661.0, 642.0, 279.0, 120.0, 79.0, 39.0, 26.0, 12.0, 5.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.50390625, -6.28729248046875, -6.0706787109375, -5.85406494140625, -5.637451171875, -5.42083740234375, -5.2042236328125, -4.98760986328125, -4.77099609375, -4.55438232421875, -4.3377685546875, -4.12115478515625, -3.904541015625, -3.68792724609375, -3.4713134765625, -3.25469970703125, -3.0380859375, -2.82147216796875, -2.6048583984375, -2.38824462890625, -2.171630859375, -1.95501708984375, -1.7384033203125, -1.52178955078125, -1.30517578125, -1.08856201171875, -0.8719482421875, -0.65533447265625, -0.438720703125, -0.22210693359375, -0.0054931640625, 0.21112060546875, 0.427734375, 0.64434814453125, 0.8609619140625, 1.07757568359375, 1.294189453125, 1.51080322265625, 1.7274169921875, 1.94403076171875, 2.16064453125, 2.37725830078125, 2.5938720703125, 2.81048583984375, 3.027099609375, 3.24371337890625, 3.4603271484375, 3.67694091796875, 3.8935546875, 4.11016845703125, 4.3267822265625, 4.54339599609375, 4.760009765625, 4.97662353515625, 5.1932373046875, 5.40985107421875, 5.62646484375, 5.84307861328125, 6.0596923828125, 6.27630615234375, 6.492919921875, 6.70953369140625, 6.9261474609375, 7.14276123046875, 7.359375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 6.0, 5.0, 6.0, 7.0, 8.0, 12.0, 11.0, 28.0, 27.0, 49.0, 50.0, 72.0, 84.0, 110.0, 117.0, 90.0, 93.0, 54.0, 40.0, 37.0, 22.0, 15.0, 11.0, 14.0, 4.0, 7.0, 9.0, 4.0, 10.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-6.9765625, -6.8154296875, -6.654296875, -6.4931640625, -6.33203125, -6.1708984375, -6.009765625, -5.8486328125, -5.6875, -5.5263671875, -5.365234375, -5.2041015625, -5.04296875, -4.8818359375, -4.720703125, -4.5595703125, -4.3984375, -4.2373046875, -4.076171875, -3.9150390625, -3.75390625, -3.5927734375, -3.431640625, -3.2705078125, -3.109375, -2.9482421875, -2.787109375, -2.6259765625, -2.46484375, -2.3037109375, -2.142578125, -1.9814453125, -1.8203125, -1.6591796875, -1.498046875, -1.3369140625, -1.17578125, -1.0146484375, -0.853515625, -0.6923828125, -0.53125, -0.3701171875, -0.208984375, -0.0478515625, 0.11328125, 0.2744140625, 0.435546875, 0.5966796875, 0.7578125, 0.9189453125, 1.080078125, 1.2412109375, 1.40234375, 1.5634765625, 1.724609375, 1.8857421875, 2.046875, 2.2080078125, 2.369140625, 2.5302734375, 2.69140625, 2.8525390625, 3.013671875, 3.1748046875, 3.3359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 7.0, 6.0, 10.0, 12.0, 34.0, 72.0, 108.0, 188.0, 178.0, 124.0, 96.0, 67.0, 37.0, 13.0, 12.0, 5.0, 5.0, 3.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.44009399414062, -93.96033477783203, -91.48058319091797, -89.00082397460938, -86.52106475830078, -84.04130554199219, -81.56155395507812, -79.08179473876953, -76.60203552246094, -74.12227630615234, -71.64252471923828, -69.16276550292969, -66.6830062866211, -64.2032470703125, -61.72349548339844, -59.243736267089844, -56.76398468017578, -54.28422927856445, -51.80447006225586, -49.32471466064453, -46.84495544433594, -44.36520004272461, -41.88544464111328, -39.40568542480469, -36.92593002319336, -34.44617462158203, -31.966415405273438, -29.48666000366211, -27.00690269470215, -24.527145385742188, -22.04738998413086, -19.5676326751709, -17.087871551513672, -14.608114242553711, -12.128357887268066, -9.648601531982422, -7.168844223022461, -4.6890869140625, -2.2093305587768555, 0.27042579650878906, 2.75018310546875, 5.229939937591553, 7.7096967697143555, 10.189453125, 12.669210433959961, 15.148967742919922, 17.62872314453125, 20.10848045349121, 22.588237762451172, 25.067995071411133, 27.547752380371094, 30.027507781982422, 32.50726318359375, 34.987022399902344, 37.46677780151367, 39.946533203125, 42.426292419433594, 44.90604782104492, 47.385807037353516, 49.865562438964844, 52.34532165527344, 54.825077056884766, 57.304832458496094, 59.78459167480469, 62.264347076416016]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 3.0, 4.0, 10.0, 6.0, 6.0, 13.0, 13.0, 23.0, 22.0, 15.0, 29.0, 36.0, 27.0, 35.0, 54.0, 52.0, 52.0, 69.0, 42.0, 54.0, 58.0, 53.0, 40.0, 32.0, 38.0, 23.0, 37.0, 25.0, 20.0, 23.0, 16.0, 11.0, 17.0, 14.0, 8.0, 8.0, 3.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.702449798583984, -49.21373748779297, -47.72502136230469, -46.23630905151367, -44.747596740722656, -43.258880615234375, -41.77016830444336, -40.281455993652344, -38.79273986816406, -37.30402755737305, -35.815311431884766, -34.32659912109375, -32.837886810302734, -31.349170684814453, -29.860458374023438, -28.37174415588379, -26.883031845092773, -25.394317626953125, -23.90560531616211, -22.41689109802246, -20.928176879882812, -19.439464569091797, -17.95075035095215, -16.4620361328125, -14.973322868347168, -13.484609603881836, -11.995895385742188, -10.507182121276855, -9.018468856811523, -7.529754638671875, -6.041041374206543, -4.5523271560668945, -3.0636138916015625, -1.5749002695083618, -0.08618664741516113, 1.40252685546875, 2.8912405967712402, 4.3799543380737305, 5.8686676025390625, 7.357381820678711, 8.846095085144043, 10.334808349609375, 11.823522567749023, 13.312235832214355, 14.800949096679688, 16.289663314819336, 17.778377532958984, 19.26708984375, 20.75580406188965, 22.244518280029297, 23.733230590820312, 25.22194480895996, 26.71065902709961, 28.199371337890625, 29.688085556030273, 31.176799774169922, 32.66551208496094, 34.15422439575195, 35.642940521240234, 37.13165283203125, 38.620365142822266, 40.10908126831055, 41.59779357910156, 43.086509704589844, 44.57522201538086]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 3.0, 5.0, 5.0, 4.0, 8.0, 5.0, 12.0, 24.0, 19.0, 28.0, 39.0, 61.0, 141.0, 317.0, 852.0, 2637.0, 9657.0, 46021.0, 298387.0, 2590726.0, 1094431.0, 120251.0, 22486.0, 5416.0, 1544.0, 577.0, 258.0, 133.0, 62.0, 48.0, 20.0, 29.0, 21.0, 17.0, 7.0, 8.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6328125, -6.430419921875, -6.22802734375, -6.025634765625, -5.8232421875, -5.620849609375, -5.41845703125, -5.216064453125, -5.013671875, -4.811279296875, -4.60888671875, -4.406494140625, -4.2041015625, -4.001708984375, -3.79931640625, -3.596923828125, -3.39453125, -3.192138671875, -2.98974609375, -2.787353515625, -2.5849609375, -2.382568359375, -2.18017578125, -1.977783203125, -1.775390625, -1.572998046875, -1.37060546875, -1.168212890625, -0.9658203125, -0.763427734375, -0.56103515625, -0.358642578125, -0.15625, 0.046142578125, 0.24853515625, 0.450927734375, 0.6533203125, 0.855712890625, 1.05810546875, 1.260498046875, 1.462890625, 1.665283203125, 1.86767578125, 2.070068359375, 2.2724609375, 2.474853515625, 2.67724609375, 2.879638671875, 3.08203125, 3.284423828125, 3.48681640625, 3.689208984375, 3.8916015625, 4.093994140625, 4.29638671875, 4.498779296875, 4.701171875, 4.903564453125, 5.10595703125, 5.308349609375, 5.5107421875, 5.713134765625, 5.91552734375, 6.117919921875, 6.3203125]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 15.0, 18.0, 26.0, 45.0, 59.0, 95.0, 99.0, 133.0, 148.0, 120.0, 88.0, 54.0, 44.0, 31.0, 17.0, 9.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.453125, -9.2596435546875, -9.066162109375, -8.8726806640625, -8.67919921875, -8.4857177734375, -8.292236328125, -8.0987548828125, -7.9052734375, -7.7117919921875, -7.518310546875, -7.3248291015625, -7.13134765625, -6.9378662109375, -6.744384765625, -6.5509033203125, -6.357421875, -6.1639404296875, -5.970458984375, -5.7769775390625, -5.58349609375, -5.3900146484375, -5.196533203125, -5.0030517578125, -4.8095703125, -4.6160888671875, -4.422607421875, -4.2291259765625, -4.03564453125, -3.8421630859375, -3.648681640625, -3.4552001953125, -3.26171875, -3.0682373046875, -2.874755859375, -2.6812744140625, -2.48779296875, -2.2943115234375, -2.100830078125, -1.9073486328125, -1.7138671875, -1.5203857421875, -1.326904296875, -1.1334228515625, -0.93994140625, -0.7464599609375, -0.552978515625, -0.3594970703125, -0.166015625, 0.0274658203125, 0.220947265625, 0.4144287109375, 0.60791015625, 0.8013916015625, 0.994873046875, 1.1883544921875, 1.3818359375, 1.5753173828125, 1.768798828125, 1.9622802734375, 2.15576171875, 2.3492431640625, 2.542724609375, 2.7362060546875, 2.9296875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 9.0, 9.0, 14.0, 12.0, 22.0, 38.0, 46.0, 79.0, 165.0, 299.0, 597.0, 1383.0, 3957.0, 15194.0, 83510.0, 766530.0, 2903331.0, 350394.0, 51484.0, 11401.0, 3280.0, 1222.0, 568.0, 283.0, 171.0, 85.0, 58.0, 42.0, 33.0, 17.0, 15.0, 7.0, 13.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.80859375, -7.55120849609375, -7.2938232421875, -7.03643798828125, -6.779052734375, -6.52166748046875, -6.2642822265625, -6.00689697265625, -5.74951171875, -5.49212646484375, -5.2347412109375, -4.97735595703125, -4.719970703125, -4.46258544921875, -4.2052001953125, -3.94781494140625, -3.6904296875, -3.43304443359375, -3.1756591796875, -2.91827392578125, -2.660888671875, -2.40350341796875, -2.1461181640625, -1.88873291015625, -1.63134765625, -1.37396240234375, -1.1165771484375, -0.85919189453125, -0.601806640625, -0.34442138671875, -0.0870361328125, 0.17034912109375, 0.427734375, 0.68511962890625, 0.9425048828125, 1.19989013671875, 1.457275390625, 1.71466064453125, 1.9720458984375, 2.22943115234375, 2.48681640625, 2.74420166015625, 3.0015869140625, 3.25897216796875, 3.516357421875, 3.77374267578125, 4.0311279296875, 4.28851318359375, 4.5458984375, 4.80328369140625, 5.0606689453125, 5.31805419921875, 5.575439453125, 5.83282470703125, 6.0902099609375, 6.34759521484375, 6.60498046875, 6.86236572265625, 7.1197509765625, 7.37713623046875, 7.634521484375, 7.89190673828125, 8.1492919921875, 8.40667724609375, 8.6640625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 2.0, 13.0, 12.0, 22.0, 31.0, 39.0, 52.0, 70.0, 101.0, 184.0, 261.0, 323.0, 464.0, 591.0, 539.0, 407.0, 286.0, 198.0, 116.0, 89.0, 72.0, 59.0, 31.0, 31.0, 17.0, 14.0, 12.0, 7.0, 6.0, 2.0, 8.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.62109375, -7.35540771484375, -7.0897216796875, -6.82403564453125, -6.558349609375, -6.29266357421875, -6.0269775390625, -5.76129150390625, -5.49560546875, -5.22991943359375, -4.9642333984375, -4.69854736328125, -4.432861328125, -4.16717529296875, -3.9014892578125, -3.63580322265625, -3.3701171875, -3.10443115234375, -2.8387451171875, -2.57305908203125, -2.307373046875, -2.04168701171875, -1.7760009765625, -1.51031494140625, -1.24462890625, -0.97894287109375, -0.7132568359375, -0.44757080078125, -0.181884765625, 0.08380126953125, 0.3494873046875, 0.61517333984375, 0.880859375, 1.14654541015625, 1.4122314453125, 1.67791748046875, 1.943603515625, 2.20928955078125, 2.4749755859375, 2.74066162109375, 3.00634765625, 3.27203369140625, 3.5377197265625, 3.80340576171875, 4.069091796875, 4.33477783203125, 4.6004638671875, 4.86614990234375, 5.1318359375, 5.39752197265625, 5.6632080078125, 5.92889404296875, 6.194580078125, 6.46026611328125, 6.7259521484375, 6.99163818359375, 7.25732421875, 7.52301025390625, 7.7886962890625, 8.05438232421875, 8.320068359375, 8.58575439453125, 8.8514404296875, 9.11712646484375, 9.3828125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 18.0, 34.0, 93.0, 172.0, 200.0, 182.0, 132.0, 87.0, 41.0, 20.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-118.06639099121094, -114.4468765258789, -110.8273696899414, -107.20785522460938, -103.58834838867188, -99.96883392333984, -96.34931945800781, -92.72981262207031, -89.11029815673828, -85.49078369140625, -81.87127685546875, -78.25176239013672, -74.63224792480469, -71.01274108886719, -67.39322662353516, -63.77371597290039, -60.154205322265625, -56.53469467163086, -52.915184020996094, -49.29566955566406, -45.6761589050293, -42.05664825439453, -38.4371337890625, -34.817623138427734, -31.19811248779297, -27.578601837158203, -23.959089279174805, -20.339576721191406, -16.72006607055664, -13.100555419921875, -9.481042861938477, -5.861530303955078, -2.2420196533203125, 1.3774919509887695, 4.997003555297852, 8.616515159606934, 12.236026763916016, 15.855537414550781, 19.47504997253418, 23.094562530517578, 26.714073181152344, 30.33358383178711, 33.953094482421875, 37.572608947753906, 41.19211959838867, 44.81163024902344, 48.43114471435547, 52.050655364990234, 55.670166015625, 59.289676666259766, 62.90918731689453, 66.52870178222656, 70.14820861816406, 73.7677230834961, 77.38723754882812, 81.00674438476562, 84.62625885009766, 88.24577331542969, 91.86528015136719, 95.48479461669922, 99.10430908203125, 102.72381591796875, 106.34333038330078, 109.96284484863281, 113.58235168457031]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 6.0, 10.0, 7.0, 13.0, 31.0, 31.0, 33.0, 48.0, 51.0, 62.0, 87.0, 84.0, 76.0, 83.0, 87.0, 53.0, 65.0, 55.0, 26.0, 21.0, 21.0, 22.0, 11.0, 15.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.94514465332031, -38.58870315551758, -36.23226547241211, -33.875823974609375, -31.519386291503906, -29.162944793701172, -26.80650520324707, -24.45006561279297, -22.093626022338867, -19.737186431884766, -17.380746841430664, -15.024306297302246, -12.667866706848145, -10.311427116394043, -7.954986572265625, -5.598546981811523, -3.242107391357422, -0.8856675624847412, 1.4707722663879395, 3.827212333679199, 6.183651924133301, 8.540091514587402, 10.89653205871582, 13.252971649169922, 15.609411239624023, 17.965850830078125, 20.322290420532227, 22.678730010986328, 25.035171508789062, 27.39160919189453, 29.748050689697266, 32.1044921875, 34.46092987060547, 36.8173713684082, 39.17380905151367, 41.530250549316406, 43.886688232421875, 46.24312973022461, 48.599571228027344, 50.95600891113281, 53.31244659423828, 55.668888092041016, 58.025325775146484, 60.38176727294922, 62.73820495605469, 65.09464263916016, 67.45108795166016, 69.80752563476562, 72.16397094726562, 74.5204086303711, 76.8768539428711, 79.23329162597656, 81.58972930908203, 83.9461669921875, 86.3026123046875, 88.65904998779297, 91.01548767089844, 93.3719253540039, 95.7283706665039, 98.08480834960938, 100.44124603271484, 102.79768371582031, 105.15412902832031, 107.51056671142578, 109.86700439453125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 11.0, 14.0, 21.0, 30.0, 33.0, 63.0, 82.0, 138.0, 228.0, 344.0, 588.0, 1076.0, 1960.0, 3884.0, 7780.0, 16566.0, 36016.0, 81207.0, 214114.0, 375745.0, 178538.0, 70102.0, 31186.0, 14329.0, 6926.0, 3390.0, 1764.0, 960.0, 540.0, 314.0, 205.0, 131.0, 89.0, 62.0, 37.0, 26.0, 20.0, 6.0, 7.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.6402587890625, -5.448486328125, -5.2567138671875, -5.06494140625, -4.8731689453125, -4.681396484375, -4.4896240234375, -4.2978515625, -4.1060791015625, -3.914306640625, -3.7225341796875, -3.53076171875, -3.3389892578125, -3.147216796875, -2.9554443359375, -2.763671875, -2.5718994140625, -2.380126953125, -2.1883544921875, -1.99658203125, -1.8048095703125, -1.613037109375, -1.4212646484375, -1.2294921875, -1.0377197265625, -0.845947265625, -0.6541748046875, -0.46240234375, -0.2706298828125, -0.078857421875, 0.1129150390625, 0.3046875, 0.4964599609375, 0.688232421875, 0.8800048828125, 1.07177734375, 1.2635498046875, 1.455322265625, 1.6470947265625, 1.8388671875, 2.0306396484375, 2.222412109375, 2.4141845703125, 2.60595703125, 2.7977294921875, 2.989501953125, 3.1812744140625, 3.373046875, 3.5648193359375, 3.756591796875, 3.9483642578125, 4.14013671875, 4.3319091796875, 4.523681640625, 4.7154541015625, 4.9072265625, 5.0989990234375, 5.290771484375, 5.4825439453125, 5.67431640625, 5.8660888671875, 6.057861328125, 6.2496337890625, 6.44140625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 6.0, 6.0, 19.0, 15.0, 16.0, 15.0, 25.0, 21.0, 31.0, 43.0, 32.0, 49.0, 36.0, 45.0, 45.0, 59.0, 51.0, 39.0, 50.0, 56.0, 49.0, 40.0, 35.0, 42.0, 24.0, 20.0, 17.0, 20.0, 12.0, 12.0, 18.0, 12.0, 6.0, 10.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.12225341796875, -2.0355224609375, -1.94879150390625, -1.862060546875, -1.77532958984375, -1.6885986328125, -1.60186767578125, -1.51513671875, -1.42840576171875, -1.3416748046875, -1.25494384765625, -1.168212890625, -1.08148193359375, -0.9947509765625, -0.90802001953125, -0.8212890625, -0.73455810546875, -0.6478271484375, -0.56109619140625, -0.474365234375, -0.38763427734375, -0.3009033203125, -0.21417236328125, -0.12744140625, -0.04071044921875, 0.0460205078125, 0.13275146484375, 0.219482421875, 0.30621337890625, 0.3929443359375, 0.47967529296875, 0.56640625, 0.65313720703125, 0.7398681640625, 0.82659912109375, 0.913330078125, 1.00006103515625, 1.0867919921875, 1.17352294921875, 1.26025390625, 1.34698486328125, 1.4337158203125, 1.52044677734375, 1.607177734375, 1.69390869140625, 1.7806396484375, 1.86737060546875, 1.9541015625, 2.04083251953125, 2.1275634765625, 2.21429443359375, 2.301025390625, 2.38775634765625, 2.4744873046875, 2.56121826171875, 2.64794921875, 2.73468017578125, 2.8214111328125, 2.90814208984375, 2.994873046875, 3.08160400390625, 3.1683349609375, 3.25506591796875, 3.341796875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 8.0, 4.0, 3.0, 6.0, 8.0, 7.0, 7.0, 18.0, 30.0, 34.0, 50.0, 75.0, 102.0, 196.0, 299.0, 457.0, 750.0, 1371.0, 2612.0, 6977.0, 29235.0, 259129.0, 677599.0, 51988.0, 10029.0, 3505.0, 1683.0, 887.0, 526.0, 325.0, 221.0, 130.0, 105.0, 63.0, 40.0, 26.0, 18.0, 13.0, 8.0, 6.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5234375, -14.0252685546875, -13.527099609375, -13.0289306640625, -12.53076171875, -12.0325927734375, -11.534423828125, -11.0362548828125, -10.5380859375, -10.0399169921875, -9.541748046875, -9.0435791015625, -8.54541015625, -8.0472412109375, -7.549072265625, -7.0509033203125, -6.552734375, -6.0545654296875, -5.556396484375, -5.0582275390625, -4.56005859375, -4.0618896484375, -3.563720703125, -3.0655517578125, -2.5673828125, -2.0692138671875, -1.571044921875, -1.0728759765625, -0.57470703125, -0.0765380859375, 0.421630859375, 0.9197998046875, 1.41796875, 1.9161376953125, 2.414306640625, 2.9124755859375, 3.41064453125, 3.9088134765625, 4.406982421875, 4.9051513671875, 5.4033203125, 5.9014892578125, 6.399658203125, 6.8978271484375, 7.39599609375, 7.8941650390625, 8.392333984375, 8.8905029296875, 9.388671875, 9.8868408203125, 10.385009765625, 10.8831787109375, 11.38134765625, 11.8795166015625, 12.377685546875, 12.8758544921875, 13.3740234375, 13.8721923828125, 14.370361328125, 14.8685302734375, 15.36669921875, 15.8648681640625, 16.363037109375, 16.8612060546875, 17.359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 5.0, 7.0, 7.0, 14.0, 7.0, 15.0, 19.0, 21.0, 33.0, 40.0, 28.0, 42.0, 48.0, 60.0, 52.0, 55.0, 62.0, 64.0, 60.0, 39.0, 69.0, 39.0, 41.0, 25.0, 26.0, 34.0, 15.0, 14.0, 14.0, 9.0, 11.0, 11.0, 2.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.0078125, -14.5013427734375, -13.994873046875, -13.4884033203125, -12.98193359375, -12.4754638671875, -11.968994140625, -11.4625244140625, -10.9560546875, -10.4495849609375, -9.943115234375, -9.4366455078125, -8.93017578125, -8.4237060546875, -7.917236328125, -7.4107666015625, -6.904296875, -6.3978271484375, -5.891357421875, -5.3848876953125, -4.87841796875, -4.3719482421875, -3.865478515625, -3.3590087890625, -2.8525390625, -2.3460693359375, -1.839599609375, -1.3331298828125, -0.82666015625, -0.3201904296875, 0.186279296875, 0.6927490234375, 1.19921875, 1.7056884765625, 2.212158203125, 2.7186279296875, 3.22509765625, 3.7315673828125, 4.238037109375, 4.7445068359375, 5.2509765625, 5.7574462890625, 6.263916015625, 6.7703857421875, 7.27685546875, 7.7833251953125, 8.289794921875, 8.7962646484375, 9.302734375, 9.8092041015625, 10.315673828125, 10.8221435546875, 11.32861328125, 11.8350830078125, 12.341552734375, 12.8480224609375, 13.3544921875, 13.8609619140625, 14.367431640625, 14.8739013671875, 15.38037109375, 15.8868408203125, 16.393310546875, 16.8997802734375, 17.40625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 3.0, 3.0, 8.0, 5.0, 8.0, 13.0, 13.0, 24.0, 33.0, 48.0, 72.0, 98.0, 220.0, 334.0, 725.0, 1381.0, 3446.0, 12025.0, 57768.0, 531001.0, 371730.0, 52219.0, 11142.0, 3389.0, 1378.0, 617.0, 326.0, 204.0, 101.0, 66.0, 43.0, 37.0, 18.0, 19.0, 12.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.77734375, -4.6002197265625, -4.423095703125, -4.2459716796875, -4.06884765625, -3.8917236328125, -3.714599609375, -3.5374755859375, -3.3603515625, -3.1832275390625, -3.006103515625, -2.8289794921875, -2.65185546875, -2.4747314453125, -2.297607421875, -2.1204833984375, -1.943359375, -1.7662353515625, -1.589111328125, -1.4119873046875, -1.23486328125, -1.0577392578125, -0.880615234375, -0.7034912109375, -0.5263671875, -0.3492431640625, -0.172119140625, 0.0050048828125, 0.18212890625, 0.3592529296875, 0.536376953125, 0.7135009765625, 0.890625, 1.0677490234375, 1.244873046875, 1.4219970703125, 1.59912109375, 1.7762451171875, 1.953369140625, 2.1304931640625, 2.3076171875, 2.4847412109375, 2.661865234375, 2.8389892578125, 3.01611328125, 3.1932373046875, 3.370361328125, 3.5474853515625, 3.724609375, 3.9017333984375, 4.078857421875, 4.2559814453125, 4.43310546875, 4.6102294921875, 4.787353515625, 4.9644775390625, 5.1416015625, 5.3187255859375, 5.495849609375, 5.6729736328125, 5.85009765625, 6.0272216796875, 6.204345703125, 6.3814697265625, 6.55859375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 9.0, 7.0, 8.0, 15.0, 17.0, 24.0, 16.0, 27.0, 34.0, 53.0, 71.0, 112.0, 150.0, 133.0, 84.0, 47.0, 38.0, 47.0, 25.0, 18.0, 17.0, 12.0, 8.0, 7.0, 4.0, 4.0, 3.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013093948364257812, -0.0012603700160980225, -0.0012113451957702637, -0.0011623203754425049, -0.001113295555114746, -0.0010642707347869873, -0.0010152459144592285, -0.0009662210941314697, -0.0009171962738037109, -0.0008681714534759521, -0.0008191466331481934, -0.0007701218128204346, -0.0007210969924926758, -0.000672072172164917, -0.0006230473518371582, -0.0005740225315093994, -0.0005249977111816406, -0.00047597289085388184, -0.00042694807052612305, -0.00037792325019836426, -0.00032889842987060547, -0.0002798736095428467, -0.0002308487892150879, -0.0001818239688873291, -0.0001327991485595703, -8.377432823181152e-05, -3.4749507904052734e-05, 1.4275312423706055e-05, 6.330013275146484e-05, 0.00011232495307922363, 0.00016134977340698242, 0.0002103745937347412, 0.0002593994140625, 0.0003084242343902588, 0.0003574490547180176, 0.00040647387504577637, 0.00045549869537353516, 0.0005045235157012939, 0.0005535483360290527, 0.0006025731563568115, 0.0006515979766845703, 0.0007006227970123291, 0.0007496476173400879, 0.0007986724376678467, 0.0008476972579956055, 0.0008967220783233643, 0.000945746898651123, 0.0009947717189788818, 0.0010437965393066406, 0.0010928213596343994, 0.0011418461799621582, 0.001190871000289917, 0.0012398958206176758, 0.0012889206409454346, 0.0013379454612731934, 0.0013869702816009521, 0.001435995101928711, 0.0014850199222564697, 0.0015340447425842285, 0.0015830695629119873, 0.001632094383239746, 0.0016811192035675049, 0.0017301440238952637, 0.0017791688442230225, 0.0018281936645507812]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 3.0, 10.0, 16.0, 19.0, 23.0, 59.0, 70.0, 98.0, 202.0, 356.0, 714.0, 1389.0, 3602.0, 12556.0, 89492.0, 791108.0, 125794.0, 15582.0, 4221.0, 1551.0, 764.0, 397.0, 181.0, 109.0, 79.0, 54.0, 33.0, 19.0, 16.0, 11.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.50726318359375, -5.2918701171875, -5.07647705078125, -4.861083984375, -4.64569091796875, -4.4302978515625, -4.21490478515625, -3.99951171875, -3.78411865234375, -3.5687255859375, -3.35333251953125, -3.137939453125, -2.92254638671875, -2.7071533203125, -2.49176025390625, -2.2763671875, -2.06097412109375, -1.8455810546875, -1.63018798828125, -1.414794921875, -1.19940185546875, -0.9840087890625, -0.76861572265625, -0.55322265625, -0.33782958984375, -0.1224365234375, 0.09295654296875, 0.308349609375, 0.52374267578125, 0.7391357421875, 0.95452880859375, 1.169921875, 1.38531494140625, 1.6007080078125, 1.81610107421875, 2.031494140625, 2.24688720703125, 2.4622802734375, 2.67767333984375, 2.89306640625, 3.10845947265625, 3.3238525390625, 3.53924560546875, 3.754638671875, 3.97003173828125, 4.1854248046875, 4.40081787109375, 4.6162109375, 4.83160400390625, 5.0469970703125, 5.26239013671875, 5.477783203125, 5.69317626953125, 5.9085693359375, 6.12396240234375, 6.33935546875, 6.55474853515625, 6.7701416015625, 6.98553466796875, 7.200927734375, 7.41632080078125, 7.6317138671875, 7.84710693359375, 8.0625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 5.0, 5.0, 14.0, 18.0, 14.0, 14.0, 27.0, 35.0, 44.0, 41.0, 63.0, 82.0, 79.0, 91.0, 95.0, 76.0, 67.0, 51.0, 34.0, 36.0, 20.0, 15.0, 18.0, 16.0, 12.0, 8.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.12890625, -4.97039794921875, -4.8118896484375, -4.65338134765625, -4.494873046875, -4.33636474609375, -4.1778564453125, -4.01934814453125, -3.86083984375, -3.70233154296875, -3.5438232421875, -3.38531494140625, -3.226806640625, -3.06829833984375, -2.9097900390625, -2.75128173828125, -2.5927734375, -2.43426513671875, -2.2757568359375, -2.11724853515625, -1.958740234375, -1.80023193359375, -1.6417236328125, -1.48321533203125, -1.32470703125, -1.16619873046875, -1.0076904296875, -0.84918212890625, -0.690673828125, -0.53216552734375, -0.3736572265625, -0.21514892578125, -0.056640625, 0.10186767578125, 0.2603759765625, 0.41888427734375, 0.577392578125, 0.73590087890625, 0.8944091796875, 1.05291748046875, 1.21142578125, 1.36993408203125, 1.5284423828125, 1.68695068359375, 1.845458984375, 2.00396728515625, 2.1624755859375, 2.32098388671875, 2.4794921875, 2.63800048828125, 2.7965087890625, 2.95501708984375, 3.113525390625, 3.27203369140625, 3.4305419921875, 3.58905029296875, 3.74755859375, 3.90606689453125, 4.0645751953125, 4.22308349609375, 4.381591796875, 4.54010009765625, 4.6986083984375, 4.85711669921875, 5.015625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 7.0, 9.0, 25.0, 44.0, 87.0, 147.0, 256.0, 169.0, 114.0, 67.0, 26.0, 23.0, 8.0, 5.0, 6.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-102.94600677490234, -99.47513580322266, -96.00425720214844, -92.53338623046875, -89.06251525878906, -85.59163665771484, -82.12076568603516, -78.64988708496094, -75.17901611328125, -71.70814514160156, -68.23726654052734, -64.76639556884766, -61.2955207824707, -57.82464599609375, -54.35377502441406, -50.88290023803711, -47.412025451660156, -43.9411506652832, -40.47027587890625, -36.99940490722656, -33.52853012084961, -30.057655334472656, -26.586782455444336, -23.115909576416016, -19.645034790039062, -16.17416000366211, -12.703287124633789, -9.232413291931152, -5.761539459228516, -2.2906646728515625, 1.1802082061767578, 4.651081085205078, 8.1219482421875, 11.592822074890137, 15.063695907592773, 18.534568786621094, 22.005443572998047, 25.476318359375, 28.94719123840332, 32.41806411743164, 35.888938903808594, 39.35981369018555, 42.8306884765625, 46.30155944824219, 49.77243423461914, 53.243309020996094, 56.71417999267578, 60.185054779052734, 63.65592956542969, 67.12680053710938, 70.5976791381836, 74.06855010986328, 77.5394287109375, 81.01029968261719, 84.48117065429688, 87.95204162597656, 91.42292022705078, 94.89379119873047, 98.36466979980469, 101.83554077148438, 105.30641174316406, 108.77729034423828, 112.24816131591797, 115.71903991699219, 119.18991088867188]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 9.0, 8.0, 9.0, 17.0, 24.0, 21.0, 18.0, 23.0, 22.0, 35.0, 41.0, 27.0, 54.0, 48.0, 58.0, 63.0, 68.0, 56.0, 45.0, 54.0, 37.0, 38.0, 35.0, 36.0, 31.0, 11.0, 25.0, 22.0, 13.0, 10.0, 11.0, 6.0, 5.0, 2.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.33470153808594, -62.552001953125, -60.76930618286133, -58.986610412597656, -57.20391082763672, -55.42121124267578, -53.63851547241211, -51.85581970214844, -50.0731201171875, -48.29042053222656, -46.50772476196289, -44.72502899169922, -42.94232940673828, -41.159629821777344, -39.37693405151367, -37.59423828125, -35.81153869628906, -34.028839111328125, -32.24614334106445, -30.46344566345215, -28.680747985839844, -26.89805030822754, -25.115352630615234, -23.33265495300293, -21.549957275390625, -19.76725959777832, -17.984561920166016, -16.20186424255371, -14.419166564941406, -12.636468887329102, -10.853771209716797, -9.071073532104492, -7.288372039794922, -5.505674362182617, -3.7229766845703125, -1.9402790069580078, -0.15758132934570312, 1.6251163482666016, 3.4078140258789062, 5.190511703491211, 6.973209381103516, 8.75590705871582, 10.538604736328125, 12.32130241394043, 14.104000091552734, 15.886697769165039, 17.669395446777344, 19.45209312438965, 21.234790802001953, 23.017488479614258, 24.800186157226562, 26.582883834838867, 28.365581512451172, 30.148279190063477, 31.93097686767578, 33.71367645263672, 35.49637222290039, 37.27906799316406, 39.061767578125, 40.84446716308594, 42.62716293334961, 44.40985870361328, 46.19255828857422, 47.975257873535156, 49.75795364379883]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 13.0, 14.0, 28.0, 48.0, 70.0, 126.0, 280.0, 595.0, 1492.0, 4420.0, 16777.0, 87234.0, 838224.0, 2847185.0, 337344.0, 45630.0, 9872.0, 2838.0, 988.0, 450.0, 221.0, 123.0, 73.0, 64.0, 41.0, 27.0, 21.0, 7.0, 12.0, 17.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 7.0, 6.0, 4.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.39453125, -4.18841552734375, -3.9822998046875, -3.77618408203125, -3.570068359375, -3.36395263671875, -3.1578369140625, -2.95172119140625, -2.74560546875, -2.53948974609375, -2.3333740234375, -2.12725830078125, -1.921142578125, -1.71502685546875, -1.5089111328125, -1.30279541015625, -1.0966796875, -0.89056396484375, -0.6844482421875, -0.47833251953125, -0.272216796875, -0.06610107421875, 0.1400146484375, 0.34613037109375, 0.55224609375, 0.75836181640625, 0.9644775390625, 1.17059326171875, 1.376708984375, 1.58282470703125, 1.7889404296875, 1.99505615234375, 2.201171875, 2.40728759765625, 2.6134033203125, 2.81951904296875, 3.025634765625, 3.23175048828125, 3.4378662109375, 3.64398193359375, 3.85009765625, 4.05621337890625, 4.2623291015625, 4.46844482421875, 4.674560546875, 4.88067626953125, 5.0867919921875, 5.29290771484375, 5.4990234375, 5.70513916015625, 5.9112548828125, 6.11737060546875, 6.323486328125, 6.52960205078125, 6.7357177734375, 6.94183349609375, 7.14794921875, 7.35406494140625, 7.5601806640625, 7.76629638671875, 7.972412109375, 8.17852783203125, 8.3846435546875, 8.59075927734375, 8.796875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 10.0, 6.0, 12.0, 13.0, 11.0, 21.0, 21.0, 23.0, 32.0, 33.0, 36.0, 45.0, 45.0, 47.0, 63.0, 60.0, 54.0, 56.0, 50.0, 61.0, 43.0, 29.0, 41.0, 30.0, 39.0, 31.0, 14.0, 18.0, 10.0, 17.0, 7.0, 6.0, 6.0, 0.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.822265625, -3.725006103515625, -3.62774658203125, -3.530487060546875, -3.4332275390625, -3.335968017578125, -3.23870849609375, -3.141448974609375, -3.044189453125, -2.946929931640625, -2.84967041015625, -2.752410888671875, -2.6551513671875, -2.557891845703125, -2.46063232421875, -2.363372802734375, -2.26611328125, -2.168853759765625, -2.07159423828125, -1.974334716796875, -1.8770751953125, -1.779815673828125, -1.68255615234375, -1.585296630859375, -1.488037109375, -1.390777587890625, -1.29351806640625, -1.196258544921875, -1.0989990234375, -1.001739501953125, -0.90447998046875, -0.807220458984375, -0.7099609375, -0.612701416015625, -0.51544189453125, -0.418182373046875, -0.3209228515625, -0.223663330078125, -0.12640380859375, -0.029144287109375, 0.068115234375, 0.165374755859375, 0.26263427734375, 0.359893798828125, 0.4571533203125, 0.554412841796875, 0.65167236328125, 0.748931884765625, 0.84619140625, 0.943450927734375, 1.04071044921875, 1.137969970703125, 1.2352294921875, 1.332489013671875, 1.42974853515625, 1.527008056640625, 1.624267578125, 1.721527099609375, 1.81878662109375, 1.916046142578125, 2.0133056640625, 2.110565185546875, 2.20782470703125, 2.305084228515625, 2.40234375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 7.0, 7.0, 8.0, 14.0, 29.0, 52.0, 94.0, 173.0, 304.0, 703.0, 1764.0, 6374.0, 37294.0, 412534.0, 3335267.0, 357643.0, 33260.0, 5874.0, 1563.0, 653.0, 307.0, 160.0, 75.0, 53.0, 28.0, 12.0, 12.0, 7.0, 7.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.03125, -6.703857421875, -6.37646484375, -6.049072265625, -5.7216796875, -5.394287109375, -5.06689453125, -4.739501953125, -4.412109375, -4.084716796875, -3.75732421875, -3.429931640625, -3.1025390625, -2.775146484375, -2.44775390625, -2.120361328125, -1.79296875, -1.465576171875, -1.13818359375, -0.810791015625, -0.4833984375, -0.156005859375, 0.17138671875, 0.498779296875, 0.826171875, 1.153564453125, 1.48095703125, 1.808349609375, 2.1357421875, 2.463134765625, 2.79052734375, 3.117919921875, 3.4453125, 3.772705078125, 4.10009765625, 4.427490234375, 4.7548828125, 5.082275390625, 5.40966796875, 5.737060546875, 6.064453125, 6.391845703125, 6.71923828125, 7.046630859375, 7.3740234375, 7.701416015625, 8.02880859375, 8.356201171875, 8.68359375, 9.010986328125, 9.33837890625, 9.665771484375, 9.9931640625, 10.320556640625, 10.64794921875, 10.975341796875, 11.302734375, 11.630126953125, 11.95751953125, 12.284912109375, 12.6123046875, 12.939697265625, 13.26708984375, 13.594482421875, 13.921875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 9.0, 7.0, 5.0, 16.0, 16.0, 22.0, 38.0, 53.0, 68.0, 116.0, 167.0, 259.0, 393.0, 604.0, 675.0, 546.0, 369.0, 238.0, 150.0, 103.0, 78.0, 38.0, 30.0, 25.0, 13.0, 16.0, 12.0, 2.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6640625, -9.3658447265625, -9.067626953125, -8.7694091796875, -8.47119140625, -8.1729736328125, -7.874755859375, -7.5765380859375, -7.2783203125, -6.9801025390625, -6.681884765625, -6.3836669921875, -6.08544921875, -5.7872314453125, -5.489013671875, -5.1907958984375, -4.892578125, -4.5943603515625, -4.296142578125, -3.9979248046875, -3.69970703125, -3.4014892578125, -3.103271484375, -2.8050537109375, -2.5068359375, -2.2086181640625, -1.910400390625, -1.6121826171875, -1.31396484375, -1.0157470703125, -0.717529296875, -0.4193115234375, -0.12109375, 0.1771240234375, 0.475341796875, 0.7735595703125, 1.07177734375, 1.3699951171875, 1.668212890625, 1.9664306640625, 2.2646484375, 2.5628662109375, 2.861083984375, 3.1593017578125, 3.45751953125, 3.7557373046875, 4.053955078125, 4.3521728515625, 4.650390625, 4.9486083984375, 5.246826171875, 5.5450439453125, 5.84326171875, 6.1414794921875, 6.439697265625, 6.7379150390625, 7.0361328125, 7.3343505859375, 7.632568359375, 7.9307861328125, 8.22900390625, 8.5272216796875, 8.825439453125, 9.1236572265625, 9.421875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 10.0, 16.0, 55.0, 110.0, 146.0, 224.0, 207.0, 107.0, 62.0, 18.0, 12.0, 8.0, 2.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-131.54518127441406, -127.95063018798828, -124.3560791015625, -120.76152801513672, -117.16697692871094, -113.57243347167969, -109.9778823852539, -106.38333129882812, -102.78878021240234, -99.19422912597656, -95.59967803955078, -92.005126953125, -88.41058349609375, -84.81602478027344, -81.22148132324219, -77.6269302368164, -74.03237915039062, -70.43782806396484, -66.84327697753906, -63.24872970581055, -59.654178619384766, -56.059627532958984, -52.46508026123047, -48.87052917480469, -45.275978088378906, -41.681427001953125, -38.086875915527344, -34.49232864379883, -30.897777557373047, -27.303226470947266, -23.708677291870117, -20.11412811279297, -16.519569396972656, -12.925019264221191, -9.330469131469727, -5.735918998718262, -2.141368865966797, 1.4531822204589844, 5.047731399536133, 8.642280578613281, 12.236831665039062, 15.831381797790527, 19.425931930541992, 23.02048110961914, 26.615032196044922, 30.209583282470703, 33.80413055419922, 37.398681640625, 40.99323272705078, 44.58778381347656, 48.182334899902344, 51.77688217163086, 55.37143325805664, 58.96598434448242, 62.56053161621094, 66.15508270263672, 69.7496337890625, 73.34418487548828, 76.93873596191406, 80.53328704833984, 84.12783813476562, 87.72238159179688, 91.31693267822266, 94.91148376464844, 98.50603485107422]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 1.0, 1.0, 5.0, 4.0, 3.0, 5.0, 5.0, 9.0, 7.0, 8.0, 10.0, 11.0, 10.0, 15.0, 18.0, 16.0, 27.0, 25.0, 23.0, 39.0, 24.0, 32.0, 44.0, 42.0, 42.0, 45.0, 35.0, 37.0, 43.0, 45.0, 40.0, 36.0, 34.0, 34.0, 30.0, 29.0, 20.0, 22.0, 18.0, 21.0, 11.0, 14.0, 15.0, 11.0, 8.0, 6.0, 5.0, 3.0, 6.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-35.279869079589844, -34.17880630493164, -33.07774353027344, -31.9766788482666, -30.875614166259766, -29.774551391601562, -28.67348861694336, -27.572423934936523, -26.471359252929688, -25.370296478271484, -24.26923179626465, -23.168169021606445, -22.06710433959961, -20.966041564941406, -19.864978790283203, -18.763914108276367, -17.662851333618164, -16.56178855895996, -15.460723876953125, -14.359661102294922, -13.258596420288086, -12.157533645629883, -11.056469917297363, -9.955406188964844, -8.854342460632324, -7.753278732299805, -6.652215003967285, -5.551151752471924, -4.450088024139404, -3.3490242958068848, -2.2479610443115234, -1.146897315979004, -0.045833587646484375, 1.0552300214767456, 2.1562936305999756, 3.257357120513916, 4.3584208488464355, 5.459484577178955, 6.560547828674316, 7.661611557006836, 8.762675285339355, 9.863739013671875, 10.964802742004395, 12.065866470336914, 13.166929244995117, 14.267993927001953, 15.369056701660156, 16.47011947631836, 17.571184158325195, 18.6722469329834, 19.773311614990234, 20.874374389648438, 21.975439071655273, 23.076501846313477, 24.177566528320312, 25.278629302978516, 26.37969207763672, 27.480754852294922, 28.581819534301758, 29.68288230895996, 30.783946990966797, 31.885009765625, 32.9860725402832, 34.087135314941406, 35.188201904296875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 15.0, 8.0, 9.0, 26.0, 37.0, 72.0, 125.0, 181.0, 373.0, 767.0, 1517.0, 3265.0, 7815.0, 21664.0, 78441.0, 433526.0, 396328.0, 70697.0, 20081.0, 7478.0, 3119.0, 1480.0, 717.0, 343.0, 185.0, 115.0, 61.0, 35.0, 24.0, 18.0, 13.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.609375, -10.3223876953125, -10.035400390625, -9.7484130859375, -9.46142578125, -9.1744384765625, -8.887451171875, -8.6004638671875, -8.3134765625, -8.0264892578125, -7.739501953125, -7.4525146484375, -7.16552734375, -6.8785400390625, -6.591552734375, -6.3045654296875, -6.017578125, -5.7305908203125, -5.443603515625, -5.1566162109375, -4.86962890625, -4.5826416015625, -4.295654296875, -4.0086669921875, -3.7216796875, -3.4346923828125, -3.147705078125, -2.8607177734375, -2.57373046875, -2.2867431640625, -1.999755859375, -1.7127685546875, -1.42578125, -1.1387939453125, -0.851806640625, -0.5648193359375, -0.27783203125, 0.0091552734375, 0.296142578125, 0.5831298828125, 0.8701171875, 1.1571044921875, 1.444091796875, 1.7310791015625, 2.01806640625, 2.3050537109375, 2.592041015625, 2.8790283203125, 3.166015625, 3.4530029296875, 3.739990234375, 4.0269775390625, 4.31396484375, 4.6009521484375, 4.887939453125, 5.1749267578125, 5.4619140625, 5.7489013671875, 6.035888671875, 6.3228759765625, 6.60986328125, 6.8968505859375, 7.183837890625, 7.4708251953125, 7.7578125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 2.0, 6.0, 6.0, 10.0, 11.0, 13.0, 13.0, 17.0, 17.0, 18.0, 28.0, 24.0, 34.0, 29.0, 31.0, 35.0, 56.0, 43.0, 47.0, 46.0, 44.0, 50.0, 45.0, 37.0, 40.0, 34.0, 43.0, 33.0, 18.0, 32.0, 19.0, 22.0, 16.0, 17.0, 21.0, 6.0, 8.0, 10.0, 6.0, 5.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-3.09375, -3.009185791015625, -2.92462158203125, -2.840057373046875, -2.7554931640625, -2.670928955078125, -2.58636474609375, -2.501800537109375, -2.417236328125, -2.332672119140625, -2.24810791015625, -2.163543701171875, -2.0789794921875, -1.994415283203125, -1.90985107421875, -1.825286865234375, -1.74072265625, -1.656158447265625, -1.57159423828125, -1.487030029296875, -1.4024658203125, -1.317901611328125, -1.23333740234375, -1.148773193359375, -1.064208984375, -0.979644775390625, -0.89508056640625, -0.810516357421875, -0.7259521484375, -0.641387939453125, -0.55682373046875, -0.472259521484375, -0.3876953125, -0.303131103515625, -0.21856689453125, -0.134002685546875, -0.0494384765625, 0.035125732421875, 0.11968994140625, 0.204254150390625, 0.288818359375, 0.373382568359375, 0.45794677734375, 0.542510986328125, 0.6270751953125, 0.711639404296875, 0.79620361328125, 0.880767822265625, 0.96533203125, 1.049896240234375, 1.13446044921875, 1.219024658203125, 1.3035888671875, 1.388153076171875, 1.47271728515625, 1.557281494140625, 1.641845703125, 1.726409912109375, 1.81097412109375, 1.895538330078125, 1.9801025390625, 2.064666748046875, 2.14923095703125, 2.233795166015625, 2.318359375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 14.0, 13.0, 18.0, 36.0, 56.0, 82.0, 138.0, 273.0, 436.0, 892.0, 2059.0, 6634.0, 37976.0, 759987.0, 214698.0, 18117.0, 4121.0, 1430.0, 652.0, 369.0, 216.0, 123.0, 71.0, 40.0, 30.0, 22.0, 17.0, 7.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.6875, -20.10986328125, -19.5322265625, -18.95458984375, -18.376953125, -17.79931640625, -17.2216796875, -16.64404296875, -16.06640625, -15.48876953125, -14.9111328125, -14.33349609375, -13.755859375, -13.17822265625, -12.6005859375, -12.02294921875, -11.4453125, -10.86767578125, -10.2900390625, -9.71240234375, -9.134765625, -8.55712890625, -7.9794921875, -7.40185546875, -6.82421875, -6.24658203125, -5.6689453125, -5.09130859375, -4.513671875, -3.93603515625, -3.3583984375, -2.78076171875, -2.203125, -1.62548828125, -1.0478515625, -0.47021484375, 0.107421875, 0.68505859375, 1.2626953125, 1.84033203125, 2.41796875, 2.99560546875, 3.5732421875, 4.15087890625, 4.728515625, 5.30615234375, 5.8837890625, 6.46142578125, 7.0390625, 7.61669921875, 8.1943359375, 8.77197265625, 9.349609375, 9.92724609375, 10.5048828125, 11.08251953125, 11.66015625, 12.23779296875, 12.8154296875, 13.39306640625, 13.970703125, 14.54833984375, 15.1259765625, 15.70361328125, 16.28125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 1.0, 5.0, 4.0, 3.0, 7.0, 6.0, 14.0, 10.0, 14.0, 18.0, 16.0, 13.0, 22.0, 27.0, 27.0, 35.0, 46.0, 45.0, 52.0, 45.0, 41.0, 55.0, 51.0, 43.0, 58.0, 42.0, 29.0, 39.0, 34.0, 24.0, 34.0, 23.0, 23.0, 14.0, 14.0, 7.0, 10.0, 13.0, 8.0, 6.0, 4.0, 4.0, 2.0, 4.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.2109375, -10.8250732421875, -10.439208984375, -10.0533447265625, -9.66748046875, -9.2816162109375, -8.895751953125, -8.5098876953125, -8.1240234375, -7.7381591796875, -7.352294921875, -6.9664306640625, -6.58056640625, -6.1947021484375, -5.808837890625, -5.4229736328125, -5.037109375, -4.6512451171875, -4.265380859375, -3.8795166015625, -3.49365234375, -3.1077880859375, -2.721923828125, -2.3360595703125, -1.9501953125, -1.5643310546875, -1.178466796875, -0.7926025390625, -0.40673828125, -0.0208740234375, 0.364990234375, 0.7508544921875, 1.13671875, 1.5225830078125, 1.908447265625, 2.2943115234375, 2.68017578125, 3.0660400390625, 3.451904296875, 3.8377685546875, 4.2236328125, 4.6094970703125, 4.995361328125, 5.3812255859375, 5.76708984375, 6.1529541015625, 6.538818359375, 6.9246826171875, 7.310546875, 7.6964111328125, 8.082275390625, 8.4681396484375, 8.85400390625, 9.2398681640625, 9.625732421875, 10.0115966796875, 10.3974609375, 10.7833251953125, 11.169189453125, 11.5550537109375, 11.94091796875, 12.3267822265625, 12.712646484375, 13.0985107421875, 13.484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 10.0, 6.0, 10.0, 13.0, 25.0, 25.0, 29.0, 43.0, 63.0, 87.0, 123.0, 256.0, 478.0, 1174.0, 3226.0, 12879.0, 86006.0, 798849.0, 122148.0, 16587.0, 3873.0, 1396.0, 527.0, 263.0, 130.0, 78.0, 44.0, 30.0, 33.0, 18.0, 17.0, 21.0, 17.0, 11.0, 9.0, 5.0, 4.0, 4.0, 3.0, 8.0, 7.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.3515625, -6.1292724609375, -5.906982421875, -5.6846923828125, -5.46240234375, -5.2401123046875, -5.017822265625, -4.7955322265625, -4.5732421875, -4.3509521484375, -4.128662109375, -3.9063720703125, -3.68408203125, -3.4617919921875, -3.239501953125, -3.0172119140625, -2.794921875, -2.5726318359375, -2.350341796875, -2.1280517578125, -1.90576171875, -1.6834716796875, -1.461181640625, -1.2388916015625, -1.0166015625, -0.7943115234375, -0.572021484375, -0.3497314453125, -0.12744140625, 0.0948486328125, 0.317138671875, 0.5394287109375, 0.76171875, 0.9840087890625, 1.206298828125, 1.4285888671875, 1.65087890625, 1.8731689453125, 2.095458984375, 2.3177490234375, 2.5400390625, 2.7623291015625, 2.984619140625, 3.2069091796875, 3.42919921875, 3.6514892578125, 3.873779296875, 4.0960693359375, 4.318359375, 4.5406494140625, 4.762939453125, 4.9852294921875, 5.20751953125, 5.4298095703125, 5.652099609375, 5.8743896484375, 6.0966796875, 6.3189697265625, 6.541259765625, 6.7635498046875, 6.98583984375, 7.2081298828125, 7.430419921875, 7.6527099609375, 7.875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 10.0, 10.0, 5.0, 10.0, 11.0, 17.0, 22.0, 21.0, 34.0, 49.0, 68.0, 92.0, 119.0, 136.0, 92.0, 65.0, 44.0, 35.0, 31.0, 27.0, 13.0, 10.0, 9.0, 3.0, 11.0, 4.0, 5.0, 4.0, 8.0, 1.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0011415481567382812, -0.0011045336723327637, -0.001067519187927246, -0.0010305047035217285, -0.000993490219116211, -0.0009564757347106934, -0.0009194612503051758, -0.0008824467658996582, -0.0008454322814941406, -0.000808417797088623, -0.0007714033126831055, -0.0007343888282775879, -0.0006973743438720703, -0.0006603598594665527, -0.0006233453750610352, -0.0005863308906555176, -0.00054931640625, -0.0005123019218444824, -0.00047528743743896484, -0.00043827295303344727, -0.0004012584686279297, -0.0003642439842224121, -0.00032722949981689453, -0.00029021501541137695, -0.0002532005310058594, -0.0002161860466003418, -0.00017917156219482422, -0.00014215707778930664, -0.00010514259338378906, -6.812810897827148e-05, -3.1113624572753906e-05, 5.900859832763672e-06, 4.291534423828125e-05, 7.992982864379883e-05, 0.0001169443130493164, 0.00015395879745483398, 0.00019097328186035156, 0.00022798776626586914, 0.0002650022506713867, 0.0003020167350769043, 0.0003390312194824219, 0.00037604570388793945, 0.00041306018829345703, 0.0004500746726989746, 0.0004870891571044922, 0.0005241036415100098, 0.0005611181259155273, 0.0005981326103210449, 0.0006351470947265625, 0.0006721615791320801, 0.0007091760635375977, 0.0007461905479431152, 0.0007832050323486328, 0.0008202195167541504, 0.000857234001159668, 0.0008942484855651855, 0.0009312629699707031, 0.0009682774543762207, 0.0010052919387817383, 0.0010423064231872559, 0.0010793209075927734, 0.001116335391998291, 0.0011533498764038086, 0.0011903643608093262, 0.0012273788452148438]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 9.0, 11.0, 6.0, 16.0, 15.0, 34.0, 42.0, 79.0, 154.0, 244.0, 385.0, 814.0, 1806.0, 4498.0, 15057.0, 73878.0, 695523.0, 211806.0, 31124.0, 7830.0, 2704.0, 1185.0, 597.0, 293.0, 163.0, 107.0, 50.0, 40.0, 31.0, 21.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.43572998046875, -4.2698974609375, -4.10406494140625, -3.938232421875, -3.77239990234375, -3.6065673828125, -3.44073486328125, -3.27490234375, -3.10906982421875, -2.9432373046875, -2.77740478515625, -2.611572265625, -2.44573974609375, -2.2799072265625, -2.11407470703125, -1.9482421875, -1.78240966796875, -1.6165771484375, -1.45074462890625, -1.284912109375, -1.11907958984375, -0.9532470703125, -0.78741455078125, -0.62158203125, -0.45574951171875, -0.2899169921875, -0.12408447265625, 0.041748046875, 0.20758056640625, 0.3734130859375, 0.53924560546875, 0.705078125, 0.87091064453125, 1.0367431640625, 1.20257568359375, 1.368408203125, 1.53424072265625, 1.7000732421875, 1.86590576171875, 2.03173828125, 2.19757080078125, 2.3634033203125, 2.52923583984375, 2.695068359375, 2.86090087890625, 3.0267333984375, 3.19256591796875, 3.3583984375, 3.52423095703125, 3.6900634765625, 3.85589599609375, 4.021728515625, 4.18756103515625, 4.3533935546875, 4.51922607421875, 4.68505859375, 4.85089111328125, 5.0167236328125, 5.18255615234375, 5.348388671875, 5.51422119140625, 5.6800537109375, 5.84588623046875, 6.01171875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 6.0, 5.0, 6.0, 8.0, 9.0, 8.0, 7.0, 14.0, 17.0, 24.0, 18.0, 21.0, 34.0, 54.0, 57.0, 88.0, 81.0, 55.0, 88.0, 68.0, 68.0, 48.0, 37.0, 37.0, 31.0, 20.0, 15.0, 12.0, 18.0, 10.0, 6.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.5859375, -3.483062744140625, -3.38018798828125, -3.277313232421875, -3.1744384765625, -3.071563720703125, -2.96868896484375, -2.865814208984375, -2.762939453125, -2.660064697265625, -2.55718994140625, -2.454315185546875, -2.3514404296875, -2.248565673828125, -2.14569091796875, -2.042816162109375, -1.93994140625, -1.837066650390625, -1.73419189453125, -1.631317138671875, -1.5284423828125, -1.425567626953125, -1.32269287109375, -1.219818115234375, -1.116943359375, -1.014068603515625, -0.91119384765625, -0.808319091796875, -0.7054443359375, -0.602569580078125, -0.49969482421875, -0.396820068359375, -0.2939453125, -0.191070556640625, -0.08819580078125, 0.014678955078125, 0.1175537109375, 0.220428466796875, 0.32330322265625, 0.426177978515625, 0.529052734375, 0.631927490234375, 0.73480224609375, 0.837677001953125, 0.9405517578125, 1.043426513671875, 1.14630126953125, 1.249176025390625, 1.35205078125, 1.454925537109375, 1.55780029296875, 1.660675048828125, 1.7635498046875, 1.866424560546875, 1.96929931640625, 2.072174072265625, 2.175048828125, 2.277923583984375, 2.38079833984375, 2.483673095703125, 2.5865478515625, 2.689422607421875, 2.79229736328125, 2.895172119140625, 2.998046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 14.0, 20.0, 55.0, 87.0, 159.0, 260.0, 177.0, 95.0, 61.0, 23.0, 9.0, 11.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-114.03837585449219, -110.83909606933594, -107.63981628417969, -104.4405288696289, -101.24124908447266, -98.0419692993164, -94.84268188476562, -91.64340209960938, -88.44412231445312, -85.24484252929688, -82.04556274414062, -78.84627532958984, -75.6469955444336, -72.44771575927734, -69.24842834472656, -66.04914855957031, -62.84986877441406, -59.65058898925781, -56.4513053894043, -53.25202178955078, -50.05274200439453, -46.85346221923828, -43.654178619384766, -40.45489501953125, -37.255615234375, -34.05633544921875, -30.857051849365234, -27.65777015686035, -24.45848846435547, -21.259206771850586, -18.059925079345703, -14.86064338684082, -11.661361694335938, -8.462080001831055, -5.262798309326172, -2.063516616821289, 1.1357650756835938, 4.335046768188477, 7.534328460693359, 10.733610153198242, 13.932891845703125, 17.132173538208008, 20.33145523071289, 23.530736923217773, 26.730018615722656, 29.92930030822754, 33.12858200073242, 36.32786560058594, 39.52714538574219, 42.72642517089844, 45.92570877075195, 49.12499237060547, 52.32427215576172, 55.52355194091797, 58.722835540771484, 61.922119140625, 65.12139892578125, 68.3206787109375, 71.51995849609375, 74.71924591064453, 77.91852569580078, 81.11780548095703, 84.31709289550781, 87.51637268066406, 90.71565246582031]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 5.0, 8.0, 11.0, 13.0, 21.0, 14.0, 17.0, 18.0, 17.0, 18.0, 35.0, 28.0, 29.0, 38.0, 33.0, 44.0, 51.0, 69.0, 70.0, 68.0, 52.0, 37.0, 45.0, 35.0, 19.0, 23.0, 18.0, 29.0, 14.0, 11.0, 16.0, 14.0, 11.0, 8.0, 13.0, 6.0, 7.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-49.53173828125, -47.95938491821289, -46.38703155517578, -44.81467819213867, -43.24232482910156, -41.66997146606445, -40.097618103027344, -38.5252685546875, -36.952911376953125, -35.380558013916016, -33.808204650878906, -32.2358512878418, -30.663497924804688, -29.091144561767578, -27.5187931060791, -25.946439743041992, -24.374088287353516, -22.801734924316406, -21.229381561279297, -19.657028198242188, -18.084674835205078, -16.51232147216797, -14.939970016479492, -13.367616653442383, -11.795263290405273, -10.222909927368164, -8.650556564331055, -7.078204154968262, -5.505850791931152, -3.933497428894043, -2.36114501953125, -0.7887916564941406, 0.7835617065429688, 2.355914831161499, 3.9282679557800293, 5.5006208419799805, 7.07297420501709, 8.6453275680542, 10.217679977416992, 11.790033340454102, 13.362386703491211, 14.93474006652832, 16.50709342956543, 18.079444885253906, 19.651798248291016, 21.224151611328125, 22.796504974365234, 24.368858337402344, 25.941211700439453, 27.513565063476562, 29.085918426513672, 30.65827178955078, 32.23062515258789, 33.802978515625, 35.375328063964844, 36.94768524169922, 38.52003479003906, 40.09238815307617, 41.66474151611328, 43.23709487915039, 44.8094482421875, 46.38180160522461, 47.95415496826172, 49.52650451660156, 51.09886169433594]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 9.0, 9.0, 16.0, 21.0, 25.0, 32.0, 55.0, 67.0, 141.0, 282.0, 658.0, 1704.0, 6283.0, 32917.0, 401991.0, 3428621.0, 286394.0, 26828.0, 5413.0, 1544.0, 568.0, 267.0, 176.0, 73.0, 55.0, 36.0, 22.0, 19.0, 13.0, 15.0, 7.0, 6.0, 4.0, 1.0, 5.0, 2.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0390625, -7.7750244140625, -7.510986328125, -7.2469482421875, -6.98291015625, -6.7188720703125, -6.454833984375, -6.1907958984375, -5.9267578125, -5.6627197265625, -5.398681640625, -5.1346435546875, -4.87060546875, -4.6065673828125, -4.342529296875, -4.0784912109375, -3.814453125, -3.5504150390625, -3.286376953125, -3.0223388671875, -2.75830078125, -2.4942626953125, -2.230224609375, -1.9661865234375, -1.7021484375, -1.4381103515625, -1.174072265625, -0.9100341796875, -0.64599609375, -0.3819580078125, -0.117919921875, 0.1461181640625, 0.41015625, 0.6741943359375, 0.938232421875, 1.2022705078125, 1.46630859375, 1.7303466796875, 1.994384765625, 2.2584228515625, 2.5224609375, 2.7864990234375, 3.050537109375, 3.3145751953125, 3.57861328125, 3.8426513671875, 4.106689453125, 4.3707275390625, 4.634765625, 4.8988037109375, 5.162841796875, 5.4268798828125, 5.69091796875, 5.9549560546875, 6.218994140625, 6.4830322265625, 6.7470703125, 7.0111083984375, 7.275146484375, 7.5391845703125, 7.80322265625, 8.0672607421875, 8.331298828125, 8.5953369140625, 8.859375]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 7.0, 15.0, 9.0, 10.0, 12.0, 29.0, 20.0, 28.0, 35.0, 26.0, 47.0, 53.0, 45.0, 54.0, 70.0, 54.0, 66.0, 61.0, 48.0, 67.0, 37.0, 29.0, 41.0, 23.0, 32.0, 24.0, 10.0, 10.0, 12.0, 7.0, 8.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.576171875, -3.468994140625, -3.36181640625, -3.254638671875, -3.1474609375, -3.040283203125, -2.93310546875, -2.825927734375, -2.71875, -2.611572265625, -2.50439453125, -2.397216796875, -2.2900390625, -2.182861328125, -2.07568359375, -1.968505859375, -1.861328125, -1.754150390625, -1.64697265625, -1.539794921875, -1.4326171875, -1.325439453125, -1.21826171875, -1.111083984375, -1.00390625, -0.896728515625, -0.78955078125, -0.682373046875, -0.5751953125, -0.468017578125, -0.36083984375, -0.253662109375, -0.146484375, -0.039306640625, 0.06787109375, 0.175048828125, 0.2822265625, 0.389404296875, 0.49658203125, 0.603759765625, 0.7109375, 0.818115234375, 0.92529296875, 1.032470703125, 1.1396484375, 1.246826171875, 1.35400390625, 1.461181640625, 1.568359375, 1.675537109375, 1.78271484375, 1.889892578125, 1.9970703125, 2.104248046875, 2.21142578125, 2.318603515625, 2.42578125, 2.532958984375, 2.64013671875, 2.747314453125, 2.8544921875, 2.961669921875, 3.06884765625, 3.176025390625, 3.283203125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 6.0, 9.0, 11.0, 10.0, 19.0, 32.0, 45.0, 93.0, 211.0, 431.0, 1164.0, 3200.0, 14469.0, 158962.0, 3666349.0, 321821.0, 20565.0, 4198.0, 1468.0, 629.0, 301.0, 130.0, 71.0, 30.0, 20.0, 10.0, 13.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.5078125, -15.0841064453125, -14.660400390625, -14.2366943359375, -13.81298828125, -13.3892822265625, -12.965576171875, -12.5418701171875, -12.1181640625, -11.6944580078125, -11.270751953125, -10.8470458984375, -10.42333984375, -9.9996337890625, -9.575927734375, -9.1522216796875, -8.728515625, -8.3048095703125, -7.881103515625, -7.4573974609375, -7.03369140625, -6.6099853515625, -6.186279296875, -5.7625732421875, -5.3388671875, -4.9151611328125, -4.491455078125, -4.0677490234375, -3.64404296875, -3.2203369140625, -2.796630859375, -2.3729248046875, -1.94921875, -1.5255126953125, -1.101806640625, -0.6781005859375, -0.25439453125, 0.1693115234375, 0.593017578125, 1.0167236328125, 1.4404296875, 1.8641357421875, 2.287841796875, 2.7115478515625, 3.13525390625, 3.5589599609375, 3.982666015625, 4.4063720703125, 4.830078125, 5.2537841796875, 5.677490234375, 6.1011962890625, 6.52490234375, 6.9486083984375, 7.372314453125, 7.7960205078125, 8.2197265625, 8.6434326171875, 9.067138671875, 9.4908447265625, 9.91455078125, 10.3382568359375, 10.761962890625, 11.1856689453125, 11.609375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 5.0, 7.0, 6.0, 15.0, 19.0, 30.0, 52.0, 97.0, 131.0, 238.0, 472.0, 852.0, 914.0, 556.0, 289.0, 141.0, 89.0, 50.0, 37.0, 27.0, 14.0, 11.0, 4.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.4609375, -9.0982666015625, -8.735595703125, -8.3729248046875, -8.01025390625, -7.6475830078125, -7.284912109375, -6.9222412109375, -6.5595703125, -6.1968994140625, -5.834228515625, -5.4715576171875, -5.10888671875, -4.7462158203125, -4.383544921875, -4.0208740234375, -3.658203125, -3.2955322265625, -2.932861328125, -2.5701904296875, -2.20751953125, -1.8448486328125, -1.482177734375, -1.1195068359375, -0.7568359375, -0.3941650390625, -0.031494140625, 0.3311767578125, 0.69384765625, 1.0565185546875, 1.419189453125, 1.7818603515625, 2.14453125, 2.5072021484375, 2.869873046875, 3.2325439453125, 3.59521484375, 3.9578857421875, 4.320556640625, 4.6832275390625, 5.0458984375, 5.4085693359375, 5.771240234375, 6.1339111328125, 6.49658203125, 6.8592529296875, 7.221923828125, 7.5845947265625, 7.947265625, 8.3099365234375, 8.672607421875, 9.0352783203125, 9.39794921875, 9.7606201171875, 10.123291015625, 10.4859619140625, 10.8486328125, 11.2113037109375, 11.573974609375, 11.9366455078125, 12.29931640625, 12.6619873046875, 13.024658203125, 13.3873291015625, 13.75]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 8.0, 10.0, 21.0, 76.0, 231.0, 383.0, 189.0, 58.0, 11.0, 9.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.48670959472656, -85.29113006591797, -80.09555053710938, -74.89997100830078, -69.70439147949219, -64.50880432128906, -59.31322479248047, -54.117645263671875, -48.92206573486328, -43.72648620605469, -38.530906677246094, -33.335323333740234, -28.13974380493164, -22.944164276123047, -17.74858283996582, -12.553001403808594, -7.357421875, -2.16184139251709, 3.0337390899658203, 8.22931957244873, 13.42490005493164, 18.620479583740234, 23.81606101989746, 29.011642456054688, 34.20722198486328, 39.402801513671875, 44.59838104248047, 49.79396438598633, 54.98954391479492, 60.185123443603516, 65.38070678710938, 70.57628631591797, 75.77188110351562, 80.96746063232422, 86.16304016113281, 91.3586196899414, 96.55419921875, 101.74978637695312, 106.94536590576172, 112.14094543457031, 117.3365249633789, 122.5321044921875, 127.7276840209961, 132.9232635498047, 138.1188507080078, 143.31442260742188, 148.510009765625, 153.70559692382812, 158.9011688232422, 164.0967559814453, 169.29232788085938, 174.4879150390625, 179.68348693847656, 184.8790740966797, 190.07464599609375, 195.27023315429688, 200.4658203125, 205.66140747070312, 210.8569793701172, 216.0525665283203, 221.24813842773438, 226.4437255859375, 231.63929748535156, 236.8348846435547, 242.03045654296875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 13.0, 9.0, 20.0, 29.0, 37.0, 39.0, 71.0, 71.0, 73.0, 75.0, 101.0, 86.0, 98.0, 69.0, 42.0, 54.0, 28.0, 21.0, 23.0, 13.0, 8.0, 3.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.41293334960938, -79.10778045654297, -76.80261993408203, -74.49746704101562, -72.19230651855469, -69.88715362548828, -67.58200073242188, -65.27684020996094, -62.97168731689453, -60.66653060913086, -58.36137390136719, -56.05622100830078, -53.75106430053711, -51.44590759277344, -49.14075469970703, -46.83559799194336, -44.53044128417969, -42.225284576416016, -39.920127868652344, -37.61497497558594, -35.309818267822266, -33.004661560058594, -30.699506759643555, -28.394351959228516, -26.089195251464844, -23.784038543701172, -21.478883743286133, -19.173728942871094, -16.868572235107422, -14.563416481018066, -12.258260726928711, -9.953105926513672, -7.647956848144531, -5.342801094055176, -3.0376453399658203, -0.7324895858764648, 1.5726661682128906, 3.877821922302246, 6.182977676391602, 8.48813247680664, 10.793289184570312, 13.098444938659668, 15.403600692749023, 17.708755493164062, 20.013912200927734, 22.319068908691406, 24.624223709106445, 26.929378509521484, 29.234535217285156, 31.539691925048828, 33.8448486328125, 36.150001525878906, 38.45515823364258, 40.76031494140625, 43.065467834472656, 45.37062454223633, 47.67578125, 49.98093795776367, 52.286094665527344, 54.59124755859375, 56.89640426635742, 59.201560974121094, 61.5067138671875, 63.81187057495117, 66.11702728271484]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 3.0, 10.0, 17.0, 17.0, 27.0, 51.0, 70.0, 144.0, 234.0, 490.0, 1094.0, 2647.0, 7596.0, 28303.0, 180002.0, 612421.0, 175227.0, 27896.0, 7483.0, 2669.0, 1092.0, 490.0, 258.0, 115.0, 63.0, 34.0, 25.0, 16.0, 15.0, 11.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-9.421875, -9.1636962890625, -8.905517578125, -8.6473388671875, -8.38916015625, -8.1309814453125, -7.872802734375, -7.6146240234375, -7.3564453125, -7.0982666015625, -6.840087890625, -6.5819091796875, -6.32373046875, -6.0655517578125, -5.807373046875, -5.5491943359375, -5.291015625, -5.0328369140625, -4.774658203125, -4.5164794921875, -4.25830078125, -4.0001220703125, -3.741943359375, -3.4837646484375, -3.2255859375, -2.9674072265625, -2.709228515625, -2.4510498046875, -2.19287109375, -1.9346923828125, -1.676513671875, -1.4183349609375, -1.16015625, -0.9019775390625, -0.643798828125, -0.3856201171875, -0.12744140625, 0.1307373046875, 0.388916015625, 0.6470947265625, 0.9052734375, 1.1634521484375, 1.421630859375, 1.6798095703125, 1.93798828125, 2.1961669921875, 2.454345703125, 2.7125244140625, 2.970703125, 3.2288818359375, 3.487060546875, 3.7452392578125, 4.00341796875, 4.2615966796875, 4.519775390625, 4.7779541015625, 5.0361328125, 5.2943115234375, 5.552490234375, 5.8106689453125, 6.06884765625, 6.3270263671875, 6.585205078125, 6.8433837890625, 7.1015625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 9.0, 1.0, 7.0, 11.0, 12.0, 21.0, 20.0, 22.0, 39.0, 43.0, 45.0, 47.0, 52.0, 42.0, 65.0, 66.0, 66.0, 69.0, 61.0, 48.0, 46.0, 44.0, 26.0, 35.0, 19.0, 16.0, 13.0, 14.0, 16.0, 11.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5546875, -4.431060791015625, -4.30743408203125, -4.183807373046875, -4.0601806640625, -3.936553955078125, -3.81292724609375, -3.689300537109375, -3.565673828125, -3.442047119140625, -3.31842041015625, -3.194793701171875, -3.0711669921875, -2.947540283203125, -2.82391357421875, -2.700286865234375, -2.57666015625, -2.453033447265625, -2.32940673828125, -2.205780029296875, -2.0821533203125, -1.958526611328125, -1.83489990234375, -1.711273193359375, -1.587646484375, -1.464019775390625, -1.34039306640625, -1.216766357421875, -1.0931396484375, -0.969512939453125, -0.84588623046875, -0.722259521484375, -0.5986328125, -0.475006103515625, -0.35137939453125, -0.227752685546875, -0.1041259765625, 0.019500732421875, 0.14312744140625, 0.266754150390625, 0.390380859375, 0.514007568359375, 0.63763427734375, 0.761260986328125, 0.8848876953125, 1.008514404296875, 1.13214111328125, 1.255767822265625, 1.37939453125, 1.503021240234375, 1.62664794921875, 1.750274658203125, 1.8739013671875, 1.997528076171875, 2.12115478515625, 2.244781494140625, 2.368408203125, 2.492034912109375, 2.61566162109375, 2.739288330078125, 2.8629150390625, 2.986541748046875, 3.11016845703125, 3.233795166015625, 3.357421875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 11.0, 5.0, 12.0, 10.0, 15.0, 24.0, 38.0, 39.0, 81.0, 128.0, 221.0, 466.0, 899.0, 2032.0, 5398.0, 23404.0, 200642.0, 710201.0, 85551.0, 12622.0, 3667.0, 1514.0, 636.0, 374.0, 200.0, 128.0, 65.0, 48.0, 21.0, 21.0, 25.0, 7.0, 10.0, 5.0, 10.0, 4.0, 8.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.390625, -10.1044921875, -9.818359375, -9.5322265625, -9.24609375, -8.9599609375, -8.673828125, -8.3876953125, -8.1015625, -7.8154296875, -7.529296875, -7.2431640625, -6.95703125, -6.6708984375, -6.384765625, -6.0986328125, -5.8125, -5.5263671875, -5.240234375, -4.9541015625, -4.66796875, -4.3818359375, -4.095703125, -3.8095703125, -3.5234375, -3.2373046875, -2.951171875, -2.6650390625, -2.37890625, -2.0927734375, -1.806640625, -1.5205078125, -1.234375, -0.9482421875, -0.662109375, -0.3759765625, -0.08984375, 0.1962890625, 0.482421875, 0.7685546875, 1.0546875, 1.3408203125, 1.626953125, 1.9130859375, 2.19921875, 2.4853515625, 2.771484375, 3.0576171875, 3.34375, 3.6298828125, 3.916015625, 4.2021484375, 4.48828125, 4.7744140625, 5.060546875, 5.3466796875, 5.6328125, 5.9189453125, 6.205078125, 6.4912109375, 6.77734375, 7.0634765625, 7.349609375, 7.6357421875, 7.921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 5.0, 10.0, 10.0, 14.0, 17.0, 17.0, 23.0, 26.0, 33.0, 29.0, 49.0, 42.0, 42.0, 49.0, 52.0, 65.0, 49.0, 51.0, 63.0, 59.0, 49.0, 42.0, 35.0, 35.0, 30.0, 29.0, 18.0, 14.0, 11.0, 8.0, 8.0, 3.0, 6.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.15625, -10.744384765625, -10.33251953125, -9.920654296875, -9.5087890625, -9.096923828125, -8.68505859375, -8.273193359375, -7.861328125, -7.449462890625, -7.03759765625, -6.625732421875, -6.2138671875, -5.802001953125, -5.39013671875, -4.978271484375, -4.56640625, -4.154541015625, -3.74267578125, -3.330810546875, -2.9189453125, -2.507080078125, -2.09521484375, -1.683349609375, -1.271484375, -0.859619140625, -0.44775390625, -0.035888671875, 0.3759765625, 0.787841796875, 1.19970703125, 1.611572265625, 2.0234375, 2.435302734375, 2.84716796875, 3.259033203125, 3.6708984375, 4.082763671875, 4.49462890625, 4.906494140625, 5.318359375, 5.730224609375, 6.14208984375, 6.553955078125, 6.9658203125, 7.377685546875, 7.78955078125, 8.201416015625, 8.61328125, 9.025146484375, 9.43701171875, 9.848876953125, 10.2607421875, 10.672607421875, 11.08447265625, 11.496337890625, 11.908203125, 12.320068359375, 12.73193359375, 13.143798828125, 13.5556640625, 13.967529296875, 14.37939453125, 14.791259765625, 15.203125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 7.0, 11.0, 12.0, 23.0, 23.0, 37.0, 69.0, 110.0, 195.0, 335.0, 681.0, 1406.0, 3078.0, 7960.0, 24655.0, 96366.0, 573921.0, 256613.0, 56888.0, 15980.0, 5688.0, 2302.0, 1004.0, 500.0, 284.0, 143.0, 90.0, 48.0, 36.0, 22.0, 15.0, 9.0, 5.0, 6.0, 5.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-3.279296875, -3.187744140625, -3.09619140625, -3.004638671875, -2.9130859375, -2.821533203125, -2.72998046875, -2.638427734375, -2.546875, -2.455322265625, -2.36376953125, -2.272216796875, -2.1806640625, -2.089111328125, -1.99755859375, -1.906005859375, -1.814453125, -1.722900390625, -1.63134765625, -1.539794921875, -1.4482421875, -1.356689453125, -1.26513671875, -1.173583984375, -1.08203125, -0.990478515625, -0.89892578125, -0.807373046875, -0.7158203125, -0.624267578125, -0.53271484375, -0.441162109375, -0.349609375, -0.258056640625, -0.16650390625, -0.074951171875, 0.0166015625, 0.108154296875, 0.19970703125, 0.291259765625, 0.3828125, 0.474365234375, 0.56591796875, 0.657470703125, 0.7490234375, 0.840576171875, 0.93212890625, 1.023681640625, 1.115234375, 1.206787109375, 1.29833984375, 1.389892578125, 1.4814453125, 1.572998046875, 1.66455078125, 1.756103515625, 1.84765625, 1.939208984375, 2.03076171875, 2.122314453125, 2.2138671875, 2.305419921875, 2.39697265625, 2.488525390625, 2.580078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 14.0, 20.0, 35.0, 36.0, 77.0, 80.0, 162.0, 169.0, 154.0, 98.0, 48.0, 27.0, 20.0, 14.0, 4.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0016031265258789062, -0.001564227044582367, -0.0015253275632858276, -0.0014864280819892883, -0.001447528600692749, -0.0014086291193962097, -0.0013697296380996704, -0.001330830156803131, -0.0012919306755065918, -0.0012530311942100525, -0.0012141317129135132, -0.0011752322316169739, -0.0011363327503204346, -0.0010974332690238953, -0.001058533787727356, -0.0010196343064308167, -0.0009807348251342773, -0.000941835343837738, -0.0009029358625411987, -0.0008640363812446594, -0.0008251368999481201, -0.0007862374186515808, -0.0007473379373550415, -0.0007084384560585022, -0.0006695389747619629, -0.0006306394934654236, -0.0005917400121688843, -0.000552840530872345, -0.0005139410495758057, -0.00047504156827926636, -0.00043614208698272705, -0.00039724260568618774, -0.00035834312438964844, -0.00031944364309310913, -0.0002805441617965698, -0.00024164468050003052, -0.0002027451992034912, -0.0001638457179069519, -0.0001249462366104126, -8.604675531387329e-05, -4.7147274017333984e-05, -8.247792720794678e-06, 3.065168857574463e-05, 6.955116987228394e-05, 0.00010845065116882324, 0.00014735013246536255, 0.00018624961376190186, 0.00022514909505844116, 0.00026404857635498047, 0.0003029480576515198, 0.0003418475389480591, 0.0003807470202445984, 0.0004196465015411377, 0.000458545982837677, 0.0004974454641342163, 0.0005363449454307556, 0.0005752444267272949, 0.0006141439080238342, 0.0006530433893203735, 0.0006919428706169128, 0.0007308423519134521, 0.0007697418332099915, 0.0008086413145065308, 0.0008475407958030701, 0.0008864402770996094]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 8.0, 9.0, 7.0, 10.0, 19.0, 27.0, 30.0, 34.0, 61.0, 81.0, 129.0, 220.0, 353.0, 609.0, 1166.0, 2269.0, 4922.0, 12168.0, 33327.0, 104995.0, 499042.0, 266421.0, 78548.0, 25708.0, 9982.0, 4124.0, 1981.0, 954.0, 533.0, 299.0, 155.0, 121.0, 79.0, 50.0, 32.0, 21.0, 19.0, 10.0, 9.0, 4.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.234375, -2.157012939453125, -2.07965087890625, -2.002288818359375, -1.9249267578125, -1.847564697265625, -1.77020263671875, -1.692840576171875, -1.615478515625, -1.538116455078125, -1.46075439453125, -1.383392333984375, -1.3060302734375, -1.228668212890625, -1.15130615234375, -1.073944091796875, -0.99658203125, -0.919219970703125, -0.84185791015625, -0.764495849609375, -0.6871337890625, -0.609771728515625, -0.53240966796875, -0.455047607421875, -0.377685546875, -0.300323486328125, -0.22296142578125, -0.145599365234375, -0.0682373046875, 0.009124755859375, 0.08648681640625, 0.163848876953125, 0.2412109375, 0.318572998046875, 0.39593505859375, 0.473297119140625, 0.5506591796875, 0.628021240234375, 0.70538330078125, 0.782745361328125, 0.860107421875, 0.937469482421875, 1.01483154296875, 1.092193603515625, 1.1695556640625, 1.246917724609375, 1.32427978515625, 1.401641845703125, 1.47900390625, 1.556365966796875, 1.63372802734375, 1.711090087890625, 1.7884521484375, 1.865814208984375, 1.94317626953125, 2.020538330078125, 2.097900390625, 2.175262451171875, 2.25262451171875, 2.329986572265625, 2.4073486328125, 2.484710693359375, 2.56207275390625, 2.639434814453125, 2.716796875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 3.0, 4.0, 3.0, 3.0, 9.0, 5.0, 4.0, 11.0, 12.0, 17.0, 10.0, 17.0, 30.0, 27.0, 35.0, 55.0, 52.0, 52.0, 67.0, 79.0, 84.0, 66.0, 60.0, 53.0, 43.0, 35.0, 27.0, 26.0, 22.0, 19.0, 14.0, 13.0, 7.0, 6.0, 8.0, 4.0, 5.0, 2.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0], "bins": [-2.78125, -2.705596923828125, -2.62994384765625, -2.554290771484375, -2.4786376953125, -2.402984619140625, -2.32733154296875, -2.251678466796875, -2.176025390625, -2.100372314453125, -2.02471923828125, -1.949066162109375, -1.8734130859375, -1.797760009765625, -1.72210693359375, -1.646453857421875, -1.57080078125, -1.495147705078125, -1.41949462890625, -1.343841552734375, -1.2681884765625, -1.192535400390625, -1.11688232421875, -1.041229248046875, -0.965576171875, -0.889923095703125, -0.81427001953125, -0.738616943359375, -0.6629638671875, -0.587310791015625, -0.51165771484375, -0.436004638671875, -0.3603515625, -0.284698486328125, -0.20904541015625, -0.133392333984375, -0.0577392578125, 0.017913818359375, 0.09356689453125, 0.169219970703125, 0.244873046875, 0.320526123046875, 0.39617919921875, 0.471832275390625, 0.5474853515625, 0.623138427734375, 0.69879150390625, 0.774444580078125, 0.85009765625, 0.925750732421875, 1.00140380859375, 1.077056884765625, 1.1527099609375, 1.228363037109375, 1.30401611328125, 1.379669189453125, 1.455322265625, 1.530975341796875, 1.60662841796875, 1.682281494140625, 1.7579345703125, 1.833587646484375, 1.90924072265625, 1.984893798828125, 2.060546875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 5.0, 11.0, 24.0, 68.0, 138.0, 306.0, 217.0, 104.0, 53.0, 28.0, 11.0, 12.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-129.7572784423828, -126.91883087158203, -124.08038330078125, -121.241943359375, -118.40349578857422, -115.56504821777344, -112.72660827636719, -109.8881607055664, -107.04971313476562, -104.21126556396484, -101.37281799316406, -98.53437805175781, -95.69593048095703, -92.85748291015625, -90.01904296875, -87.18059539794922, -84.34214782714844, -81.50370025634766, -78.66525268554688, -75.82681274414062, -72.98836517333984, -70.14991760253906, -67.31147766113281, -64.47303009033203, -61.63458251953125, -58.79613494873047, -55.95769119262695, -53.11924743652344, -50.280799865722656, -47.442352294921875, -44.60390853881836, -41.765464782714844, -38.927024841308594, -36.08857727050781, -33.2501335144043, -30.41168785095215, -27.5732421875, -24.73479652404785, -21.896350860595703, -19.057905197143555, -16.219459533691406, -13.381013870239258, -10.54256820678711, -7.704122543334961, -4.8656768798828125, -2.027231216430664, 0.8112144470214844, 3.649660110473633, 6.488105773925781, 9.32655143737793, 12.164997100830078, 15.003442764282227, 17.841888427734375, 20.680334091186523, 23.518779754638672, 26.35722541809082, 29.19567108154297, 32.03411865234375, 34.872562408447266, 37.71100616455078, 40.54945373535156, 43.387901306152344, 46.22634506225586, 49.064788818359375, 51.903236389160156]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 2.0, 5.0, 3.0, 2.0, 8.0, 3.0, 9.0, 6.0, 4.0, 9.0, 15.0, 19.0, 22.0, 23.0, 23.0, 19.0, 20.0, 27.0, 30.0, 40.0, 56.0, 57.0, 66.0, 65.0, 62.0, 56.0, 35.0, 41.0, 32.0, 37.0, 42.0, 23.0, 25.0, 15.0, 18.0, 9.0, 12.0, 7.0, 2.0, 14.0, 9.0, 7.0, 4.0, 3.0, 2.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0], "bins": [-46.52021026611328, -45.20225143432617, -43.88429641723633, -42.56633758544922, -41.248382568359375, -39.930423736572266, -38.61246871948242, -37.29450988769531, -35.97655487060547, -34.65859603881836, -33.340641021728516, -32.022682189941406, -30.704727172851562, -29.386770248413086, -28.06881332397461, -26.7508544921875, -25.432897567749023, -24.114940643310547, -22.79698371887207, -21.479026794433594, -20.161069869995117, -18.84311294555664, -17.52515411376953, -16.207199096679688, -14.889241218566895, -13.571284294128418, -12.253327369689941, -10.935369491577148, -9.617412567138672, -8.299455642700195, -6.981498718261719, -5.663541793823242, -4.345584869384766, -3.027627944946289, -1.7096707820892334, -0.39171361923217773, 0.9262433052062988, 2.2442002296447754, 3.56215763092041, 4.880114555358887, 6.198071479797363, 7.51602840423584, 8.833985328674316, 10.15194320678711, 11.469900131225586, 12.787857055664062, 14.105813980102539, 15.423770904541016, 16.741727828979492, 18.05968475341797, 19.377641677856445, 20.695598602294922, 22.0135555267334, 23.331512451171875, 24.649471282958984, 25.967426300048828, 27.285385131835938, 28.603342056274414, 29.92129898071289, 31.239255905151367, 32.557212829589844, 33.87517166137695, 35.1931266784668, 36.511085510253906, 37.82904052734375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 13.0, 8.0, 16.0, 36.0, 67.0, 107.0, 252.0, 592.0, 2121.0, 9660.0, 72116.0, 2269406.0, 1770245.0, 58893.0, 7871.0, 1709.0, 560.0, 261.0, 138.0, 75.0, 37.0, 31.0, 18.0, 12.0, 13.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.28125, -8.0048828125, -7.728515625, -7.4521484375, -7.17578125, -6.8994140625, -6.623046875, -6.3466796875, -6.0703125, -5.7939453125, -5.517578125, -5.2412109375, -4.96484375, -4.6884765625, -4.412109375, -4.1357421875, -3.859375, -3.5830078125, -3.306640625, -3.0302734375, -2.75390625, -2.4775390625, -2.201171875, -1.9248046875, -1.6484375, -1.3720703125, -1.095703125, -0.8193359375, -0.54296875, -0.2666015625, 0.009765625, 0.2861328125, 0.5625, 0.8388671875, 1.115234375, 1.3916015625, 1.66796875, 1.9443359375, 2.220703125, 2.4970703125, 2.7734375, 3.0498046875, 3.326171875, 3.6025390625, 3.87890625, 4.1552734375, 4.431640625, 4.7080078125, 4.984375, 5.2607421875, 5.537109375, 5.8134765625, 6.08984375, 6.3662109375, 6.642578125, 6.9189453125, 7.1953125, 7.4716796875, 7.748046875, 8.0244140625, 8.30078125, 8.5771484375, 8.853515625, 9.1298828125, 9.40625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 3.0, 8.0, 8.0, 15.0, 20.0, 30.0, 26.0, 35.0, 40.0, 61.0, 40.0, 66.0, 72.0, 75.0, 64.0, 67.0, 63.0, 56.0, 56.0, 37.0, 35.0, 27.0, 23.0, 27.0, 22.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.388671875, -3.258453369140625, -3.12823486328125, -2.998016357421875, -2.8677978515625, -2.737579345703125, -2.60736083984375, -2.477142333984375, -2.346923828125, -2.216705322265625, -2.08648681640625, -1.956268310546875, -1.8260498046875, -1.695831298828125, -1.56561279296875, -1.435394287109375, -1.30517578125, -1.174957275390625, -1.04473876953125, -0.914520263671875, -0.7843017578125, -0.654083251953125, -0.52386474609375, -0.393646240234375, -0.263427734375, -0.133209228515625, -0.00299072265625, 0.127227783203125, 0.2574462890625, 0.387664794921875, 0.51788330078125, 0.648101806640625, 0.7783203125, 0.908538818359375, 1.03875732421875, 1.168975830078125, 1.2991943359375, 1.429412841796875, 1.55963134765625, 1.689849853515625, 1.820068359375, 1.950286865234375, 2.08050537109375, 2.210723876953125, 2.3409423828125, 2.471160888671875, 2.60137939453125, 2.731597900390625, 2.86181640625, 2.992034912109375, 3.12225341796875, 3.252471923828125, 3.3826904296875, 3.512908935546875, 3.64312744140625, 3.773345947265625, 3.903564453125, 4.033782958984375, 4.16400146484375, 4.294219970703125, 4.4244384765625, 4.554656982421875, 4.68487548828125, 4.815093994140625, 4.9453125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 5.0, 5.0, 11.0, 9.0, 16.0, 27.0, 42.0, 63.0, 101.0, 215.0, 610.0, 2269.0, 16550.0, 379125.0, 3684897.0, 100649.0, 7481.0, 1381.0, 424.0, 171.0, 82.0, 55.0, 24.0, 16.0, 14.0, 7.0, 9.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-16.40625, -15.9993896484375, -15.592529296875, -15.1856689453125, -14.77880859375, -14.3719482421875, -13.965087890625, -13.5582275390625, -13.1513671875, -12.7445068359375, -12.337646484375, -11.9307861328125, -11.52392578125, -11.1170654296875, -10.710205078125, -10.3033447265625, -9.896484375, -9.4896240234375, -9.082763671875, -8.6759033203125, -8.26904296875, -7.8621826171875, -7.455322265625, -7.0484619140625, -6.6416015625, -6.2347412109375, -5.827880859375, -5.4210205078125, -5.01416015625, -4.6072998046875, -4.200439453125, -3.7935791015625, -3.38671875, -2.9798583984375, -2.572998046875, -2.1661376953125, -1.75927734375, -1.3524169921875, -0.945556640625, -0.5386962890625, -0.1318359375, 0.2750244140625, 0.681884765625, 1.0887451171875, 1.49560546875, 1.9024658203125, 2.309326171875, 2.7161865234375, 3.123046875, 3.5299072265625, 3.936767578125, 4.3436279296875, 4.75048828125, 5.1573486328125, 5.564208984375, 5.9710693359375, 6.3779296875, 6.7847900390625, 7.191650390625, 7.5985107421875, 8.00537109375, 8.4122314453125, 8.819091796875, 9.2259521484375, 9.6328125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 11.0, 7.0, 5.0, 5.0, 10.0, 17.0, 15.0, 19.0, 34.0, 44.0, 83.0, 92.0, 151.0, 202.0, 320.0, 518.0, 691.0, 553.0, 392.0, 280.0, 181.0, 131.0, 87.0, 57.0, 49.0, 28.0, 12.0, 23.0, 15.0, 9.0, 7.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.921875, -6.722412109375, -6.52294921875, -6.323486328125, -6.1240234375, -5.924560546875, -5.72509765625, -5.525634765625, -5.326171875, -5.126708984375, -4.92724609375, -4.727783203125, -4.5283203125, -4.328857421875, -4.12939453125, -3.929931640625, -3.73046875, -3.531005859375, -3.33154296875, -3.132080078125, -2.9326171875, -2.733154296875, -2.53369140625, -2.334228515625, -2.134765625, -1.935302734375, -1.73583984375, -1.536376953125, -1.3369140625, -1.137451171875, -0.93798828125, -0.738525390625, -0.5390625, -0.339599609375, -0.14013671875, 0.059326171875, 0.2587890625, 0.458251953125, 0.65771484375, 0.857177734375, 1.056640625, 1.256103515625, 1.45556640625, 1.655029296875, 1.8544921875, 2.053955078125, 2.25341796875, 2.452880859375, 2.65234375, 2.851806640625, 3.05126953125, 3.250732421875, 3.4501953125, 3.649658203125, 3.84912109375, 4.048583984375, 4.248046875, 4.447509765625, 4.64697265625, 4.846435546875, 5.0458984375, 5.245361328125, 5.44482421875, 5.644287109375, 5.84375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 10.0, 16.0, 25.0, 65.0, 112.0, 154.0, 183.0, 152.0, 120.0, 66.0, 32.0, 18.0, 12.0, 12.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.47664642333984, -62.42560958862305, -60.374576568603516, -58.32353973388672, -56.27250289916992, -54.221466064453125, -52.170433044433594, -50.1193962097168, -48.068359375, -46.0173225402832, -43.96628952026367, -41.915252685546875, -39.86421585083008, -37.81317901611328, -35.76214599609375, -33.71110916137695, -31.660076141357422, -29.609041213989258, -27.55800437927246, -25.506969451904297, -23.4559326171875, -21.404897689819336, -19.353862762451172, -17.302825927734375, -15.251791000366211, -13.20075511932373, -11.14971923828125, -9.098684310913086, -7.0476484298706055, -4.996612548828125, -2.945577621459961, -0.8945417404174805, 1.156494140625, 3.2075297832489014, 5.258565425872803, 7.309600830078125, 9.360636711120605, 11.411672592163086, 13.46270751953125, 15.51374340057373, 17.56477928161621, 19.615814208984375, 21.666851043701172, 23.717885971069336, 25.7689208984375, 27.819957733154297, 29.87099266052246, 31.922027587890625, 33.97306442260742, 36.02410125732422, 38.07513427734375, 40.12617111206055, 42.177207946777344, 44.228240966796875, 46.27927780151367, 48.33031463623047, 50.38134765625, 52.4323844909668, 54.48341751098633, 56.534454345703125, 58.58549118041992, 60.63652801513672, 62.68756103515625, 64.73859405517578, 66.78963470458984]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 4.0, 2.0, 5.0, 5.0, 10.0, 9.0, 9.0, 11.0, 8.0, 16.0, 13.0, 16.0, 19.0, 24.0, 16.0, 22.0, 21.0, 22.0, 36.0, 39.0, 52.0, 46.0, 51.0, 47.0, 42.0, 40.0, 53.0, 38.0, 45.0, 30.0, 24.0, 26.0, 27.0, 24.0, 32.0, 16.0, 18.0, 10.0, 8.0, 8.0, 12.0, 11.0, 7.0, 7.0, 6.0, 6.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.314151763916016, -25.468732833862305, -24.62331199645996, -23.77789306640625, -22.932472229003906, -22.087053298950195, -21.241634368896484, -20.39621353149414, -19.55079460144043, -18.70537567138672, -17.859954833984375, -17.014535903930664, -16.169116973876953, -15.32369613647461, -14.478277206420898, -13.632857322692871, -12.787437438964844, -11.942017555236816, -11.096597671508789, -10.251178741455078, -9.40575885772705, -8.560338973999023, -7.714919567108154, -6.869500160217285, -6.024080276489258, -5.1786603927612305, -4.333240985870361, -3.487821340560913, -2.642401695251465, -1.7969818115234375, -0.9515624046325684, -0.10614299774169922, 0.7392787933349609, 1.5846984386444092, 2.4301180839538574, 3.2755377292633057, 4.120957374572754, 4.966377258300781, 5.81179666519165, 6.6572160720825195, 7.502635955810547, 8.348055839538574, 9.193475723266602, 10.038894653320312, 10.88431453704834, 11.729734420776367, 12.575153350830078, 13.420573234558105, 14.265993118286133, 15.11141300201416, 15.956832885742188, 16.8022518157959, 17.64767074584961, 18.493091583251953, 19.338510513305664, 20.183929443359375, 21.02935028076172, 21.87476921081543, 22.720190048217773, 23.565608978271484, 24.411029815673828, 25.25644874572754, 26.10186767578125, 26.947288513183594, 27.792707443237305]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 8.0, 21.0, 36.0, 60.0, 83.0, 139.0, 266.0, 490.0, 950.0, 2113.0, 5511.0, 18338.0, 90885.0, 490052.0, 358148.0, 60284.0, 13427.0, 4287.0, 1721.0, 775.0, 405.0, 205.0, 135.0, 70.0, 44.0, 27.0, 21.0, 15.0, 4.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.234375, -8.0111083984375, -7.787841796875, -7.5645751953125, -7.34130859375, -7.1180419921875, -6.894775390625, -6.6715087890625, -6.4482421875, -6.2249755859375, -6.001708984375, -5.7784423828125, -5.55517578125, -5.3319091796875, -5.108642578125, -4.8853759765625, -4.662109375, -4.4388427734375, -4.215576171875, -3.9923095703125, -3.76904296875, -3.5457763671875, -3.322509765625, -3.0992431640625, -2.8759765625, -2.6527099609375, -2.429443359375, -2.2061767578125, -1.98291015625, -1.7596435546875, -1.536376953125, -1.3131103515625, -1.08984375, -0.8665771484375, -0.643310546875, -0.4200439453125, -0.19677734375, 0.0264892578125, 0.249755859375, 0.4730224609375, 0.6962890625, 0.9195556640625, 1.142822265625, 1.3660888671875, 1.58935546875, 1.8126220703125, 2.035888671875, 2.2591552734375, 2.482421875, 2.7056884765625, 2.928955078125, 3.1522216796875, 3.37548828125, 3.5987548828125, 3.822021484375, 4.0452880859375, 4.2685546875, 4.4918212890625, 4.715087890625, 4.9383544921875, 5.16162109375, 5.3848876953125, 5.608154296875, 5.8314208984375, 6.0546875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 8.0, 2.0, 7.0, 12.0, 19.0, 26.0, 26.0, 40.0, 35.0, 63.0, 65.0, 63.0, 61.0, 72.0, 80.0, 63.0, 59.0, 70.0, 45.0, 45.0, 34.0, 31.0, 30.0, 16.0, 15.0, 12.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.40234375, -5.2479248046875, -5.093505859375, -4.9390869140625, -4.78466796875, -4.6302490234375, -4.475830078125, -4.3214111328125, -4.1669921875, -4.0125732421875, -3.858154296875, -3.7037353515625, -3.54931640625, -3.3948974609375, -3.240478515625, -3.0860595703125, -2.931640625, -2.7772216796875, -2.622802734375, -2.4683837890625, -2.31396484375, -2.1595458984375, -2.005126953125, -1.8507080078125, -1.6962890625, -1.5418701171875, -1.387451171875, -1.2330322265625, -1.07861328125, -0.9241943359375, -0.769775390625, -0.6153564453125, -0.4609375, -0.3065185546875, -0.152099609375, 0.0023193359375, 0.15673828125, 0.3111572265625, 0.465576171875, 0.6199951171875, 0.7744140625, 0.9288330078125, 1.083251953125, 1.2376708984375, 1.39208984375, 1.5465087890625, 1.700927734375, 1.8553466796875, 2.009765625, 2.1641845703125, 2.318603515625, 2.4730224609375, 2.62744140625, 2.7818603515625, 2.936279296875, 3.0906982421875, 3.2451171875, 3.3995361328125, 3.553955078125, 3.7083740234375, 3.86279296875, 4.0172119140625, 4.171630859375, 4.3260498046875, 4.48046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 7.0, 5.0, 4.0, 10.0, 14.0, 27.0, 29.0, 43.0, 59.0, 83.0, 151.0, 234.0, 379.0, 770.0, 1574.0, 4552.0, 17868.0, 126092.0, 759959.0, 112439.0, 16767.0, 4208.0, 1539.0, 692.0, 345.0, 230.0, 154.0, 91.0, 63.0, 45.0, 34.0, 20.0, 28.0, 9.0, 10.0, 3.0, 3.0, 6.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.859375, -7.5833740234375, -7.307373046875, -7.0313720703125, -6.75537109375, -6.4793701171875, -6.203369140625, -5.9273681640625, -5.6513671875, -5.3753662109375, -5.099365234375, -4.8233642578125, -4.54736328125, -4.2713623046875, -3.995361328125, -3.7193603515625, -3.443359375, -3.1673583984375, -2.891357421875, -2.6153564453125, -2.33935546875, -2.0633544921875, -1.787353515625, -1.5113525390625, -1.2353515625, -0.9593505859375, -0.683349609375, -0.4073486328125, -0.13134765625, 0.1446533203125, 0.420654296875, 0.6966552734375, 0.97265625, 1.2486572265625, 1.524658203125, 1.8006591796875, 2.07666015625, 2.3526611328125, 2.628662109375, 2.9046630859375, 3.1806640625, 3.4566650390625, 3.732666015625, 4.0086669921875, 4.28466796875, 4.5606689453125, 4.836669921875, 5.1126708984375, 5.388671875, 5.6646728515625, 5.940673828125, 6.2166748046875, 6.49267578125, 6.7686767578125, 7.044677734375, 7.3206787109375, 7.5966796875, 7.8726806640625, 8.148681640625, 8.4246826171875, 8.70068359375, 8.9766845703125, 9.252685546875, 9.5286865234375, 9.8046875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 7.0, 10.0, 6.0, 13.0, 15.0, 24.0, 29.0, 36.0, 37.0, 30.0, 40.0, 48.0, 69.0, 57.0, 60.0, 60.0, 63.0, 63.0, 62.0, 47.0, 42.0, 27.0, 28.0, 22.0, 25.0, 15.0, 16.0, 8.0, 5.0, 14.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.4609375, -13.9930419921875, -13.525146484375, -13.0572509765625, -12.58935546875, -12.1214599609375, -11.653564453125, -11.1856689453125, -10.7177734375, -10.2498779296875, -9.781982421875, -9.3140869140625, -8.84619140625, -8.3782958984375, -7.910400390625, -7.4425048828125, -6.974609375, -6.5067138671875, -6.038818359375, -5.5709228515625, -5.10302734375, -4.6351318359375, -4.167236328125, -3.6993408203125, -3.2314453125, -2.7635498046875, -2.295654296875, -1.8277587890625, -1.35986328125, -0.8919677734375, -0.424072265625, 0.0438232421875, 0.51171875, 0.9796142578125, 1.447509765625, 1.9154052734375, 2.38330078125, 2.8511962890625, 3.319091796875, 3.7869873046875, 4.2548828125, 4.7227783203125, 5.190673828125, 5.6585693359375, 6.12646484375, 6.5943603515625, 7.062255859375, 7.5301513671875, 7.998046875, 8.4659423828125, 8.933837890625, 9.4017333984375, 9.86962890625, 10.3375244140625, 10.805419921875, 11.2733154296875, 11.7412109375, 12.2091064453125, 12.677001953125, 13.1448974609375, 13.61279296875, 14.0806884765625, 14.548583984375, 15.0164794921875, 15.484375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 8.0, 11.0, 23.0, 35.0, 60.0, 66.0, 159.0, 266.0, 524.0, 1129.0, 2611.0, 6457.0, 17990.0, 66241.0, 613587.0, 267596.0, 48038.0, 14347.0, 5265.0, 2122.0, 913.0, 499.0, 224.0, 148.0, 78.0, 40.0, 28.0, 18.0, 18.0, 9.0, 10.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.767578125, -2.67498779296875, -2.5823974609375, -2.48980712890625, -2.397216796875, -2.30462646484375, -2.2120361328125, -2.11944580078125, -2.02685546875, -1.93426513671875, -1.8416748046875, -1.74908447265625, -1.656494140625, -1.56390380859375, -1.4713134765625, -1.37872314453125, -1.2861328125, -1.19354248046875, -1.1009521484375, -1.00836181640625, -0.915771484375, -0.82318115234375, -0.7305908203125, -0.63800048828125, -0.54541015625, -0.45281982421875, -0.3602294921875, -0.26763916015625, -0.175048828125, -0.08245849609375, 0.0101318359375, 0.10272216796875, 0.1953125, 0.28790283203125, 0.3804931640625, 0.47308349609375, 0.565673828125, 0.65826416015625, 0.7508544921875, 0.84344482421875, 0.93603515625, 1.02862548828125, 1.1212158203125, 1.21380615234375, 1.306396484375, 1.39898681640625, 1.4915771484375, 1.58416748046875, 1.6767578125, 1.76934814453125, 1.8619384765625, 1.95452880859375, 2.047119140625, 2.13970947265625, 2.2322998046875, 2.32489013671875, 2.41748046875, 2.51007080078125, 2.6026611328125, 2.69525146484375, 2.787841796875, 2.88043212890625, 2.9730224609375, 3.06561279296875, 3.158203125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 4.0, 2.0, 10.0, 7.0, 12.0, 16.0, 18.0, 24.0, 43.0, 59.0, 92.0, 120.0, 140.0, 128.0, 106.0, 55.0, 43.0, 37.0, 18.0, 12.0, 7.0, 7.0, 8.0, 6.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007724761962890625, -0.0007454901933670044, -0.0007185041904449463, -0.0006915181875228882, -0.0006645321846008301, -0.000637546181678772, -0.0006105601787567139, -0.0005835741758346558, -0.0005565881729125977, -0.0005296021699905396, -0.0005026161670684814, -0.00047563016414642334, -0.00044864416122436523, -0.00042165815830230713, -0.000394672155380249, -0.0003676861524581909, -0.0003407001495361328, -0.0003137141466140747, -0.0002867281436920166, -0.0002597421407699585, -0.0002327561378479004, -0.00020577013492584229, -0.00017878413200378418, -0.00015179812908172607, -0.00012481212615966797, -9.782612323760986e-05, -7.084012031555176e-05, -4.385411739349365e-05, -1.6868114471435547e-05, 1.0117888450622559e-05, 3.7103891372680664e-05, 6.408989429473877e-05, 9.107589721679688e-05, 0.00011806190013885498, 0.00014504790306091309, 0.0001720339059829712, 0.0001990199089050293, 0.0002260059118270874, 0.0002529919147491455, 0.0002799779176712036, 0.0003069639205932617, 0.0003339499235153198, 0.00036093592643737793, 0.00038792192935943604, 0.00041490793228149414, 0.00044189393520355225, 0.00046887993812561035, 0.0004958659410476685, 0.0005228519439697266, 0.0005498379468917847, 0.0005768239498138428, 0.0006038099527359009, 0.000630795955657959, 0.0006577819585800171, 0.0006847679615020752, 0.0007117539644241333, 0.0007387399673461914, 0.0007657259702682495, 0.0007927119731903076, 0.0008196979761123657, 0.0008466839790344238, 0.0008736699819564819, 0.00090065598487854, 0.0009276419878005981, 0.0009546279907226562]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 10.0, 12.0, 14.0, 29.0, 40.0, 53.0, 88.0, 174.0, 276.0, 499.0, 947.0, 2074.0, 4851.0, 12757.0, 41243.0, 200911.0, 661881.0, 85897.0, 22898.0, 7854.0, 3125.0, 1341.0, 682.0, 367.0, 202.0, 119.0, 68.0, 44.0, 35.0, 19.0, 8.0, 5.0, 8.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.744140625, -2.6534423828125, -2.562744140625, -2.4720458984375, -2.38134765625, -2.2906494140625, -2.199951171875, -2.1092529296875, -2.0185546875, -1.9278564453125, -1.837158203125, -1.7464599609375, -1.65576171875, -1.5650634765625, -1.474365234375, -1.3836669921875, -1.29296875, -1.2022705078125, -1.111572265625, -1.0208740234375, -0.93017578125, -0.8394775390625, -0.748779296875, -0.6580810546875, -0.5673828125, -0.4766845703125, -0.385986328125, -0.2952880859375, -0.20458984375, -0.1138916015625, -0.023193359375, 0.0675048828125, 0.158203125, 0.2489013671875, 0.339599609375, 0.4302978515625, 0.52099609375, 0.6116943359375, 0.702392578125, 0.7930908203125, 0.8837890625, 0.9744873046875, 1.065185546875, 1.1558837890625, 1.24658203125, 1.3372802734375, 1.427978515625, 1.5186767578125, 1.609375, 1.7000732421875, 1.790771484375, 1.8814697265625, 1.97216796875, 2.0628662109375, 2.153564453125, 2.2442626953125, 2.3349609375, 2.4256591796875, 2.516357421875, 2.6070556640625, 2.69775390625, 2.7884521484375, 2.879150390625, 2.9698486328125, 3.060546875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 2.0, 7.0, 6.0, 2.0, 7.0, 5.0, 18.0, 28.0, 30.0, 34.0, 59.0, 75.0, 113.0, 123.0, 106.0, 101.0, 69.0, 52.0, 40.0, 31.0, 18.0, 11.0, 11.0, 12.0, 8.0, 7.0, 2.0, 1.0, 5.0, 6.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.912109375, -2.799102783203125, -2.68609619140625, -2.573089599609375, -2.4600830078125, -2.347076416015625, -2.23406982421875, -2.121063232421875, -2.008056640625, -1.895050048828125, -1.78204345703125, -1.669036865234375, -1.5560302734375, -1.443023681640625, -1.33001708984375, -1.217010498046875, -1.10400390625, -0.990997314453125, -0.87799072265625, -0.764984130859375, -0.6519775390625, -0.538970947265625, -0.42596435546875, -0.312957763671875, -0.199951171875, -0.086944580078125, 0.02606201171875, 0.139068603515625, 0.2520751953125, 0.365081787109375, 0.47808837890625, 0.591094970703125, 0.7041015625, 0.817108154296875, 0.93011474609375, 1.043121337890625, 1.1561279296875, 1.269134521484375, 1.38214111328125, 1.495147705078125, 1.608154296875, 1.721160888671875, 1.83416748046875, 1.947174072265625, 2.0601806640625, 2.173187255859375, 2.28619384765625, 2.399200439453125, 2.51220703125, 2.625213623046875, 2.73822021484375, 2.851226806640625, 2.9642333984375, 3.077239990234375, 3.19024658203125, 3.303253173828125, 3.416259765625, 3.529266357421875, 3.64227294921875, 3.755279541015625, 3.8682861328125, 3.981292724609375, 4.09429931640625, 4.207305908203125, 4.3203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 5.0, 5.0, 15.0, 16.0, 33.0, 77.0, 200.0, 364.0, 136.0, 75.0, 28.0, 10.0, 9.0, 6.0, 3.0, 7.0, 2.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.33690643310547, -60.508365631103516, -57.6798210144043, -54.851280212402344, -52.022735595703125, -49.19419479370117, -46.36565399169922, -43.537109375, -40.70856857299805, -37.880027770996094, -35.051483154296875, -32.22294235229492, -29.394399642944336, -26.56585693359375, -23.737316131591797, -20.90877342224121, -18.080230712890625, -15.251688003540039, -12.42314624786377, -9.5946044921875, -6.766061782836914, -3.937519073486328, -1.108978271484375, 1.719564437866211, 4.548107147216797, 7.376649379730225, 10.205191612243652, 13.033733367919922, 15.862276077270508, 18.690818786621094, 21.519359588623047, 24.347902297973633, 27.176437377929688, 30.004980087280273, 32.83352279663086, 35.66206359863281, 38.49060821533203, 41.319149017333984, 44.14768981933594, 46.976234436035156, 49.80477523803711, 52.63331604003906, 55.46186065673828, 58.290401458740234, 61.11894226074219, 63.947486877441406, 66.77603149414062, 69.60456848144531, 72.43311309814453, 75.26165771484375, 78.09019470214844, 80.91873931884766, 83.74728393554688, 86.57582092285156, 89.40436553955078, 92.23291015625, 95.06144714355469, 97.8899917602539, 100.7185287475586, 103.54707336425781, 106.37561798095703, 109.20416259765625, 112.03269958496094, 114.86124420166016, 117.68978881835938]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 5.0, 7.0, 7.0, 7.0, 10.0, 8.0, 15.0, 12.0, 16.0, 15.0, 20.0, 15.0, 20.0, 16.0, 29.0, 28.0, 35.0, 50.0, 51.0, 81.0, 88.0, 73.0, 47.0, 46.0, 40.0, 27.0, 27.0, 27.0, 22.0, 23.0, 21.0, 19.0, 14.0, 11.0, 10.0, 8.0, 6.0, 9.0, 4.0, 10.0, 5.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-47.214622497558594, -45.79095458984375, -44.367286682128906, -42.94361877441406, -41.51995086669922, -40.096282958984375, -38.67261505126953, -37.24894714355469, -35.825279235839844, -34.401611328125, -32.977943420410156, -31.554275512695312, -30.13060760498047, -28.706939697265625, -27.283273696899414, -25.85960578918457, -24.43593978881836, -23.012271881103516, -21.588603973388672, -20.164936065673828, -18.741268157958984, -17.31760025024414, -15.89393424987793, -14.470266342163086, -13.046598434448242, -11.622930526733398, -10.199262619018555, -8.775595664978027, -7.351927757263184, -5.92825984954834, -4.5045928955078125, -3.0809249877929688, -1.6572608947753906, -0.23359322547912598, 1.1900744438171387, 2.613741874694824, 4.037409782409668, 5.461077690124512, 6.884744644165039, 8.308412551879883, 9.732080459594727, 11.15574836730957, 12.579416275024414, 14.003083229064941, 15.426751136779785, 16.850418090820312, 18.274085998535156, 19.69775390625, 21.121421813964844, 22.545089721679688, 23.96875762939453, 25.392425537109375, 26.81609344482422, 28.239761352539062, 29.663427352905273, 31.087095260620117, 32.510765075683594, 33.93443298339844, 35.35810089111328, 36.781768798828125, 38.20543670654297, 39.62910461425781, 41.052772521972656, 42.4764404296875, 43.90010452270508]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 7.0, 6.0, 14.0, 9.0, 23.0, 37.0, 66.0, 111.0, 249.0, 541.0, 1414.0, 4066.0, 16520.0, 100887.0, 1287162.0, 2545860.0, 202007.0, 26053.0, 6021.0, 1799.0, 737.0, 307.0, 134.0, 90.0, 48.0, 38.0, 16.0, 14.0, 6.0, 5.0, 9.0, 2.0, 0.0, 4.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.75390625, -6.5438232421875, -6.333740234375, -6.1236572265625, -5.91357421875, -5.7034912109375, -5.493408203125, -5.2833251953125, -5.0732421875, -4.8631591796875, -4.653076171875, -4.4429931640625, -4.23291015625, -4.0228271484375, -3.812744140625, -3.6026611328125, -3.392578125, -3.1824951171875, -2.972412109375, -2.7623291015625, -2.55224609375, -2.3421630859375, -2.132080078125, -1.9219970703125, -1.7119140625, -1.5018310546875, -1.291748046875, -1.0816650390625, -0.87158203125, -0.6614990234375, -0.451416015625, -0.2413330078125, -0.03125, 0.1788330078125, 0.388916015625, 0.5989990234375, 0.80908203125, 1.0191650390625, 1.229248046875, 1.4393310546875, 1.6494140625, 1.8594970703125, 2.069580078125, 2.2796630859375, 2.48974609375, 2.6998291015625, 2.909912109375, 3.1199951171875, 3.330078125, 3.5401611328125, 3.750244140625, 3.9603271484375, 4.17041015625, 4.3804931640625, 4.590576171875, 4.8006591796875, 5.0107421875, 5.2208251953125, 5.430908203125, 5.6409912109375, 5.85107421875, 6.0611572265625, 6.271240234375, 6.4813232421875, 6.69140625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 6.0, 3.0, 15.0, 11.0, 20.0, 16.0, 15.0, 14.0, 23.0, 29.0, 26.0, 24.0, 38.0, 36.0, 30.0, 28.0, 54.0, 37.0, 47.0, 49.0, 54.0, 55.0, 37.0, 39.0, 39.0, 37.0, 32.0, 24.0, 26.0, 20.0, 9.0, 21.0, 15.0, 17.0, 6.0, 12.0, 5.0, 7.0, 5.0, 2.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.9765625, -2.88128662109375, -2.7860107421875, -2.69073486328125, -2.595458984375, -2.50018310546875, -2.4049072265625, -2.30963134765625, -2.21435546875, -2.11907958984375, -2.0238037109375, -1.92852783203125, -1.833251953125, -1.73797607421875, -1.6427001953125, -1.54742431640625, -1.4521484375, -1.35687255859375, -1.2615966796875, -1.16632080078125, -1.071044921875, -0.97576904296875, -0.8804931640625, -0.78521728515625, -0.68994140625, -0.59466552734375, -0.4993896484375, -0.40411376953125, -0.308837890625, -0.21356201171875, -0.1182861328125, -0.02301025390625, 0.072265625, 0.16754150390625, 0.2628173828125, 0.35809326171875, 0.453369140625, 0.54864501953125, 0.6439208984375, 0.73919677734375, 0.83447265625, 0.92974853515625, 1.0250244140625, 1.12030029296875, 1.215576171875, 1.31085205078125, 1.4061279296875, 1.50140380859375, 1.5966796875, 1.69195556640625, 1.7872314453125, 1.88250732421875, 1.977783203125, 2.07305908203125, 2.1683349609375, 2.26361083984375, 2.35888671875, 2.45416259765625, 2.5494384765625, 2.64471435546875, 2.739990234375, 2.83526611328125, 2.9305419921875, 3.02581787109375, 3.12109375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 8.0, 4.0, 10.0, 13.0, 27.0, 18.0, 23.0, 55.0, 79.0, 130.0, 213.0, 389.0, 1079.0, 3785.0, 18080.0, 175038.0, 3271282.0, 670819.0, 43010.0, 7015.0, 1841.0, 630.0, 299.0, 151.0, 69.0, 60.0, 35.0, 35.0, 13.0, 14.0, 14.0, 8.0, 10.0, 6.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.8515625, -8.5633544921875, -8.275146484375, -7.9869384765625, -7.69873046875, -7.4105224609375, -7.122314453125, -6.8341064453125, -6.5458984375, -6.2576904296875, -5.969482421875, -5.6812744140625, -5.39306640625, -5.1048583984375, -4.816650390625, -4.5284423828125, -4.240234375, -3.9520263671875, -3.663818359375, -3.3756103515625, -3.08740234375, -2.7991943359375, -2.510986328125, -2.2227783203125, -1.9345703125, -1.6463623046875, -1.358154296875, -1.0699462890625, -0.78173828125, -0.4935302734375, -0.205322265625, 0.0828857421875, 0.37109375, 0.6593017578125, 0.947509765625, 1.2357177734375, 1.52392578125, 1.8121337890625, 2.100341796875, 2.3885498046875, 2.6767578125, 2.9649658203125, 3.253173828125, 3.5413818359375, 3.82958984375, 4.1177978515625, 4.406005859375, 4.6942138671875, 4.982421875, 5.2706298828125, 5.558837890625, 5.8470458984375, 6.13525390625, 6.4234619140625, 6.711669921875, 6.9998779296875, 7.2880859375, 7.5762939453125, 7.864501953125, 8.1527099609375, 8.44091796875, 8.7291259765625, 9.017333984375, 9.3055419921875, 9.59375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 3.0, 11.0, 10.0, 13.0, 14.0, 23.0, 24.0, 24.0, 72.0, 87.0, 88.0, 145.0, 201.0, 317.0, 440.0, 571.0, 550.0, 425.0, 326.0, 197.0, 151.0, 98.0, 73.0, 47.0, 47.0, 25.0, 22.0, 11.0, 17.0, 5.0, 6.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.81640625, -5.60797119140625, -5.3995361328125, -5.19110107421875, -4.982666015625, -4.77423095703125, -4.5657958984375, -4.35736083984375, -4.14892578125, -3.94049072265625, -3.7320556640625, -3.52362060546875, -3.315185546875, -3.10675048828125, -2.8983154296875, -2.68988037109375, -2.4814453125, -2.27301025390625, -2.0645751953125, -1.85614013671875, -1.647705078125, -1.43927001953125, -1.2308349609375, -1.02239990234375, -0.81396484375, -0.60552978515625, -0.3970947265625, -0.18865966796875, 0.019775390625, 0.22821044921875, 0.4366455078125, 0.64508056640625, 0.853515625, 1.06195068359375, 1.2703857421875, 1.47882080078125, 1.687255859375, 1.89569091796875, 2.1041259765625, 2.31256103515625, 2.52099609375, 2.72943115234375, 2.9378662109375, 3.14630126953125, 3.354736328125, 3.56317138671875, 3.7716064453125, 3.98004150390625, 4.1884765625, 4.39691162109375, 4.6053466796875, 4.81378173828125, 5.022216796875, 5.23065185546875, 5.4390869140625, 5.64752197265625, 5.85595703125, 6.06439208984375, 6.2728271484375, 6.48126220703125, 6.689697265625, 6.89813232421875, 7.1065673828125, 7.31500244140625, 7.5234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 8.0, 7.0, 9.0, 11.0, 17.0, 45.0, 77.0, 92.0, 142.0, 154.0, 152.0, 121.0, 69.0, 43.0, 17.0, 12.0, 10.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.10871124267578, -47.25234603881836, -45.39598083496094, -43.53961944580078, -41.68325424194336, -39.82688903808594, -37.970523834228516, -36.114158630371094, -34.25779724121094, -32.401432037353516, -30.545068740844727, -28.688703536987305, -26.832340240478516, -24.975975036621094, -23.119609832763672, -21.263246536254883, -19.40688133239746, -17.55051612854004, -15.69415283203125, -13.837787628173828, -11.981424331665039, -10.125059127807617, -8.268694877624512, -6.412330627441406, -4.555966377258301, -2.6996021270751953, -0.8432376384735107, 1.0131268501281738, 2.8694911003112793, 4.725855827331543, 6.582220077514648, 8.438584327697754, 10.29494857788086, 12.151312828063965, 14.00767707824707, 15.864042282104492, 17.72040557861328, 19.576770782470703, 21.433135986328125, 23.289499282836914, 25.145862579345703, 27.002227783203125, 28.858591079711914, 30.714956283569336, 32.571319580078125, 34.42768478393555, 36.28404998779297, 38.140411376953125, 39.99678039550781, 41.853145599365234, 43.709510803222656, 45.56587219238281, 47.422237396240234, 49.278602600097656, 51.13496780395508, 52.9913330078125, 54.847694396972656, 56.70405960083008, 58.5604248046875, 60.416786193847656, 62.27315139770508, 64.1295166015625, 65.98587799072266, 67.84224700927734, 69.6986083984375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 5.0, 16.0, 4.0, 14.0, 7.0, 20.0, 22.0, 17.0, 14.0, 26.0, 36.0, 36.0, 42.0, 40.0, 37.0, 40.0, 39.0, 45.0, 42.0, 26.0, 40.0, 44.0, 47.0, 40.0, 42.0, 29.0, 32.0, 28.0, 32.0, 20.0, 23.0, 14.0, 11.0, 13.0, 7.0, 9.0, 9.0, 7.0, 2.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.73577117919922, -27.777189254760742, -26.818607330322266, -25.86002540588379, -24.901443481445312, -23.94286346435547, -22.984281539916992, -22.025699615478516, -21.06711769104004, -20.108535766601562, -19.149953842163086, -18.19137191772461, -17.232791900634766, -16.274208068847656, -15.315628051757812, -14.357046127319336, -13.39846420288086, -12.439882278442383, -11.481300354003906, -10.522719383239746, -9.56413745880127, -8.605555534362793, -7.646974086761475, -6.688392639160156, -5.72981071472168, -4.771228790283203, -3.8126473426818848, -2.8540656566619873, -1.8954839706420898, -0.9369020462036133, 0.021679401397705078, 0.9802608489990234, 1.9388427734375, 2.8974244594573975, 3.856006145477295, 4.814587593078613, 5.77316951751709, 6.731751441955566, 7.690332889556885, 8.648914337158203, 9.60749626159668, 10.566078186035156, 11.524660110473633, 12.483241081237793, 13.44182300567627, 14.400404930114746, 15.358985900878906, 16.317567825317383, 17.27614974975586, 18.234731674194336, 19.193313598632812, 20.15189552307129, 21.110477447509766, 22.06905746459961, 23.027639389038086, 23.986221313476562, 24.94480323791504, 25.903385162353516, 26.861967086791992, 27.82054901123047, 28.779129028320312, 29.737712860107422, 30.696292877197266, 31.654874801635742, 32.61345672607422]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 2.0, 6.0, 8.0, 4.0, 14.0, 13.0, 21.0, 44.0, 62.0, 101.0, 178.0, 304.0, 661.0, 1521.0, 3946.0, 12663.0, 52513.0, 316086.0, 532092.0, 98046.0, 20437.0, 5870.0, 2133.0, 885.0, 392.0, 224.0, 133.0, 68.0, 48.0, 21.0, 24.0, 12.0, 15.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.92523193359375, -7.6864013671875, -7.44757080078125, -7.208740234375, -6.96990966796875, -6.7310791015625, -6.49224853515625, -6.25341796875, -6.01458740234375, -5.7757568359375, -5.53692626953125, -5.298095703125, -5.05926513671875, -4.8204345703125, -4.58160400390625, -4.3427734375, -4.10394287109375, -3.8651123046875, -3.62628173828125, -3.387451171875, -3.14862060546875, -2.9097900390625, -2.67095947265625, -2.43212890625, -2.19329833984375, -1.9544677734375, -1.71563720703125, -1.476806640625, -1.23797607421875, -0.9991455078125, -0.76031494140625, -0.521484375, -0.28265380859375, -0.0438232421875, 0.19500732421875, 0.433837890625, 0.67266845703125, 0.9114990234375, 1.15032958984375, 1.38916015625, 1.62799072265625, 1.8668212890625, 2.10565185546875, 2.344482421875, 2.58331298828125, 2.8221435546875, 3.06097412109375, 3.2998046875, 3.53863525390625, 3.7774658203125, 4.01629638671875, 4.255126953125, 4.49395751953125, 4.7327880859375, 4.97161865234375, 5.21044921875, 5.44927978515625, 5.6881103515625, 5.92694091796875, 6.165771484375, 6.40460205078125, 6.6434326171875, 6.88226318359375, 7.12109375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 11.0, 6.0, 7.0, 15.0, 13.0, 23.0, 16.0, 14.0, 32.0, 33.0, 32.0, 45.0, 44.0, 47.0, 40.0, 50.0, 52.0, 48.0, 57.0, 50.0, 40.0, 58.0, 39.0, 31.0, 24.0, 35.0, 32.0, 17.0, 15.0, 12.0, 13.0, 12.0, 6.0, 9.0, 8.0, 5.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.548828125, -3.43603515625, -3.3232421875, -3.21044921875, -3.09765625, -2.98486328125, -2.8720703125, -2.75927734375, -2.646484375, -2.53369140625, -2.4208984375, -2.30810546875, -2.1953125, -2.08251953125, -1.9697265625, -1.85693359375, -1.744140625, -1.63134765625, -1.5185546875, -1.40576171875, -1.29296875, -1.18017578125, -1.0673828125, -0.95458984375, -0.841796875, -0.72900390625, -0.6162109375, -0.50341796875, -0.390625, -0.27783203125, -0.1650390625, -0.05224609375, 0.060546875, 0.17333984375, 0.2861328125, 0.39892578125, 0.51171875, 0.62451171875, 0.7373046875, 0.85009765625, 0.962890625, 1.07568359375, 1.1884765625, 1.30126953125, 1.4140625, 1.52685546875, 1.6396484375, 1.75244140625, 1.865234375, 1.97802734375, 2.0908203125, 2.20361328125, 2.31640625, 2.42919921875, 2.5419921875, 2.65478515625, 2.767578125, 2.88037109375, 2.9931640625, 3.10595703125, 3.21875, 3.33154296875, 3.4443359375, 3.55712890625, 3.669921875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 8.0, 3.0, 4.0, 5.0, 10.0, 13.0, 18.0, 27.0, 41.0, 40.0, 65.0, 74.0, 98.0, 152.0, 262.0, 359.0, 644.0, 1235.0, 2445.0, 6362.0, 22720.0, 129427.0, 751575.0, 102634.0, 19268.0, 5883.0, 2308.0, 1142.0, 619.0, 344.0, 240.0, 151.0, 88.0, 73.0, 62.0, 38.0, 36.0, 14.0, 24.0, 15.0, 8.0, 6.0, 7.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6015625, -8.3443603515625, -8.087158203125, -7.8299560546875, -7.57275390625, -7.3155517578125, -7.058349609375, -6.8011474609375, -6.5439453125, -6.2867431640625, -6.029541015625, -5.7723388671875, -5.51513671875, -5.2579345703125, -5.000732421875, -4.7435302734375, -4.486328125, -4.2291259765625, -3.971923828125, -3.7147216796875, -3.45751953125, -3.2003173828125, -2.943115234375, -2.6859130859375, -2.4287109375, -2.1715087890625, -1.914306640625, -1.6571044921875, -1.39990234375, -1.1427001953125, -0.885498046875, -0.6282958984375, -0.37109375, -0.1138916015625, 0.143310546875, 0.4005126953125, 0.65771484375, 0.9149169921875, 1.172119140625, 1.4293212890625, 1.6865234375, 1.9437255859375, 2.200927734375, 2.4581298828125, 2.71533203125, 2.9725341796875, 3.229736328125, 3.4869384765625, 3.744140625, 4.0013427734375, 4.258544921875, 4.5157470703125, 4.77294921875, 5.0301513671875, 5.287353515625, 5.5445556640625, 5.8017578125, 6.0589599609375, 6.316162109375, 6.5733642578125, 6.83056640625, 7.0877685546875, 7.344970703125, 7.6021728515625, 7.859375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 6.0, 5.0, 10.0, 1.0, 8.0, 5.0, 15.0, 12.0, 19.0, 23.0, 33.0, 31.0, 47.0, 48.0, 51.0, 51.0, 66.0, 55.0, 76.0, 61.0, 50.0, 55.0, 52.0, 40.0, 40.0, 25.0, 24.0, 20.0, 11.0, 12.0, 8.0, 12.0, 4.0, 4.0, 5.0, 2.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.6484375, -13.1614990234375, -12.674560546875, -12.1876220703125, -11.70068359375, -11.2137451171875, -10.726806640625, -10.2398681640625, -9.7529296875, -9.2659912109375, -8.779052734375, -8.2921142578125, -7.80517578125, -7.3182373046875, -6.831298828125, -6.3443603515625, -5.857421875, -5.3704833984375, -4.883544921875, -4.3966064453125, -3.90966796875, -3.4227294921875, -2.935791015625, -2.4488525390625, -1.9619140625, -1.4749755859375, -0.988037109375, -0.5010986328125, -0.01416015625, 0.4727783203125, 0.959716796875, 1.4466552734375, 1.93359375, 2.4205322265625, 2.907470703125, 3.3944091796875, 3.88134765625, 4.3682861328125, 4.855224609375, 5.3421630859375, 5.8291015625, 6.3160400390625, 6.802978515625, 7.2899169921875, 7.77685546875, 8.2637939453125, 8.750732421875, 9.2376708984375, 9.724609375, 10.2115478515625, 10.698486328125, 11.1854248046875, 11.67236328125, 12.1593017578125, 12.646240234375, 13.1331787109375, 13.6201171875, 14.1070556640625, 14.593994140625, 15.0809326171875, 15.56787109375, 16.0548095703125, 16.541748046875, 17.0286865234375, 17.515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 7.0, 2.0, 4.0, 15.0, 12.0, 23.0, 30.0, 24.0, 39.0, 76.0, 112.0, 164.0, 274.0, 571.0, 1143.0, 2858.0, 7689.0, 25240.0, 127451.0, 756669.0, 94553.0, 20335.0, 6586.0, 2412.0, 1050.0, 520.0, 230.0, 160.0, 84.0, 62.0, 39.0, 32.0, 17.0, 15.0, 12.0, 9.0, 6.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.900390625, -2.816131591796875, -2.73187255859375, -2.647613525390625, -2.5633544921875, -2.479095458984375, -2.39483642578125, -2.310577392578125, -2.226318359375, -2.142059326171875, -2.05780029296875, -1.973541259765625, -1.8892822265625, -1.805023193359375, -1.72076416015625, -1.636505126953125, -1.55224609375, -1.467987060546875, -1.38372802734375, -1.299468994140625, -1.2152099609375, -1.130950927734375, -1.04669189453125, -0.962432861328125, -0.878173828125, -0.793914794921875, -0.70965576171875, -0.625396728515625, -0.5411376953125, -0.456878662109375, -0.37261962890625, -0.288360595703125, -0.2041015625, -0.119842529296875, -0.03558349609375, 0.048675537109375, 0.1329345703125, 0.217193603515625, 0.30145263671875, 0.385711669921875, 0.469970703125, 0.554229736328125, 0.63848876953125, 0.722747802734375, 0.8070068359375, 0.891265869140625, 0.97552490234375, 1.059783935546875, 1.14404296875, 1.228302001953125, 1.31256103515625, 1.396820068359375, 1.4810791015625, 1.565338134765625, 1.64959716796875, 1.733856201171875, 1.818115234375, 1.902374267578125, 1.98663330078125, 2.070892333984375, 2.1551513671875, 2.239410400390625, 2.32366943359375, 2.407928466796875, 2.4921875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 10.0, 9.0, 15.0, 21.0, 28.0, 43.0, 86.0, 135.0, 207.0, 172.0, 92.0, 67.0, 31.0, 24.0, 8.0, 13.0, 10.0, 4.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0011234283447265625, -0.0010900646448135376, -0.0010567009449005127, -0.0010233372449874878, -0.0009899735450744629, -0.000956609845161438, -0.0009232461452484131, -0.0008898824453353882, -0.0008565187454223633, -0.0008231550455093384, -0.0007897913455963135, -0.0007564276456832886, -0.0007230639457702637, -0.0006897002458572388, -0.0006563365459442139, -0.000622972846031189, -0.0005896091461181641, -0.0005562454462051392, -0.0005228817462921143, -0.0004895180463790894, -0.00045615434646606445, -0.00042279064655303955, -0.00038942694664001465, -0.00035606324672698975, -0.00032269954681396484, -0.00028933584690093994, -0.00025597214698791504, -0.00022260844707489014, -0.00018924474716186523, -0.00015588104724884033, -0.00012251734733581543, -8.915364742279053e-05, -5.5789947509765625e-05, -2.2426247596740723e-05, 1.093745231628418e-05, 4.430115222930908e-05, 7.766485214233398e-05, 0.00011102855205535889, 0.0001443922519683838, 0.0001777559518814087, 0.0002111196517944336, 0.0002444833517074585, 0.0002778470516204834, 0.0003112107515335083, 0.0003445744514465332, 0.0003779381513595581, 0.000411301851272583, 0.0004446655511856079, 0.0004780292510986328, 0.0005113929510116577, 0.0005447566509246826, 0.0005781203508377075, 0.0006114840507507324, 0.0006448477506637573, 0.0006782114505767822, 0.0007115751504898071, 0.000744938850402832, 0.0007783025503158569, 0.0008116662502288818, 0.0008450299501419067, 0.0008783936500549316, 0.0009117573499679565, 0.0009451210498809814, 0.0009784847497940063, 0.0010118484497070312]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 8.0, 3.0, 5.0, 12.0, 20.0, 33.0, 43.0, 77.0, 123.0, 181.0, 326.0, 493.0, 909.0, 1744.0, 3716.0, 8607.0, 22847.0, 72390.0, 504492.0, 324996.0, 69330.0, 22127.0, 8464.0, 3571.0, 1757.0, 896.0, 510.0, 302.0, 182.0, 117.0, 82.0, 60.0, 39.0, 30.0, 22.0, 11.0, 11.0, 7.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.072265625, -2.013031005859375, -1.95379638671875, -1.894561767578125, -1.8353271484375, -1.776092529296875, -1.71685791015625, -1.657623291015625, -1.598388671875, -1.539154052734375, -1.47991943359375, -1.420684814453125, -1.3614501953125, -1.302215576171875, -1.24298095703125, -1.183746337890625, -1.12451171875, -1.065277099609375, -1.00604248046875, -0.946807861328125, -0.8875732421875, -0.828338623046875, -0.76910400390625, -0.709869384765625, -0.650634765625, -0.591400146484375, -0.53216552734375, -0.472930908203125, -0.4136962890625, -0.354461669921875, -0.29522705078125, -0.235992431640625, -0.1767578125, -0.117523193359375, -0.05828857421875, 0.000946044921875, 0.0601806640625, 0.119415283203125, 0.17864990234375, 0.237884521484375, 0.297119140625, 0.356353759765625, 0.41558837890625, 0.474822998046875, 0.5340576171875, 0.593292236328125, 0.65252685546875, 0.711761474609375, 0.77099609375, 0.830230712890625, 0.88946533203125, 0.948699951171875, 1.0079345703125, 1.067169189453125, 1.12640380859375, 1.185638427734375, 1.244873046875, 1.304107666015625, 1.36334228515625, 1.422576904296875, 1.4818115234375, 1.541046142578125, 1.60028076171875, 1.659515380859375, 1.71875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 10.0, 8.0, 7.0, 8.0, 11.0, 22.0, 28.0, 39.0, 46.0, 57.0, 62.0, 81.0, 75.0, 92.0, 87.0, 69.0, 54.0, 41.0, 25.0, 27.0, 27.0, 23.0, 16.0, 16.0, 12.0, 9.0, 9.0, 2.0, 5.0, 4.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.22265625, -2.148406982421875, -2.07415771484375, -1.999908447265625, -1.9256591796875, -1.851409912109375, -1.77716064453125, -1.702911376953125, -1.628662109375, -1.554412841796875, -1.48016357421875, -1.405914306640625, -1.3316650390625, -1.257415771484375, -1.18316650390625, -1.108917236328125, -1.03466796875, -0.960418701171875, -0.88616943359375, -0.811920166015625, -0.7376708984375, -0.663421630859375, -0.58917236328125, -0.514923095703125, -0.440673828125, -0.366424560546875, -0.29217529296875, -0.217926025390625, -0.1436767578125, -0.069427490234375, 0.00482177734375, 0.079071044921875, 0.1533203125, 0.227569580078125, 0.30181884765625, 0.376068115234375, 0.4503173828125, 0.524566650390625, 0.59881591796875, 0.673065185546875, 0.747314453125, 0.821563720703125, 0.89581298828125, 0.970062255859375, 1.0443115234375, 1.118560791015625, 1.19281005859375, 1.267059326171875, 1.34130859375, 1.415557861328125, 1.48980712890625, 1.564056396484375, 1.6383056640625, 1.712554931640625, 1.78680419921875, 1.861053466796875, 1.935302734375, 2.009552001953125, 2.08380126953125, 2.158050537109375, 2.2322998046875, 2.306549072265625, 2.38079833984375, 2.455047607421875, 2.529296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 15.0, 28.0, 82.0, 192.0, 424.0, 150.0, 51.0, 28.0, 11.0, 8.0, 3.0, 1.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-134.7137451171875, -131.00860595703125, -127.30345916748047, -123.59832000732422, -119.89318084716797, -116.18803405761719, -112.48289489746094, -108.77775573730469, -105.07261657714844, -101.36747741699219, -97.6623306274414, -93.95719146728516, -90.2520523071289, -86.54690551757812, -82.84176635742188, -79.13662719726562, -75.43148040771484, -71.7263412475586, -68.02119445800781, -64.31605529785156, -60.61091613769531, -56.9057731628418, -53.20063018798828, -49.49549102783203, -45.790348052978516, -42.085205078125, -38.38006591796875, -34.674922943115234, -30.96978187561035, -27.26464080810547, -23.559497833251953, -19.85435676574707, -16.149215698242188, -12.444074630737305, -8.738932609558105, -5.033790588378906, -1.3286495208740234, 2.3764915466308594, 6.081634521484375, 9.786775588989258, 13.49191665649414, 17.197057723999023, 20.902198791503906, 24.607341766357422, 28.312482833862305, 32.01762390136719, 35.7227668762207, 39.42790985107422, 43.13304901123047, 46.838191986083984, 50.543331146240234, 54.24847412109375, 57.95361328125, 61.658756256103516, 65.36389923095703, 69.06903839111328, 72.77418518066406, 76.47932434082031, 80.1844711303711, 83.88961029052734, 87.5947494506836, 91.29989624023438, 95.00503540039062, 98.71017456054688, 102.41531372070312]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 9.0, 3.0, 7.0, 9.0, 10.0, 12.0, 13.0, 13.0, 19.0, 27.0, 28.0, 33.0, 27.0, 33.0, 38.0, 58.0, 73.0, 105.0, 114.0, 66.0, 44.0, 25.0, 27.0, 30.0, 30.0, 16.0, 26.0, 11.0, 15.0, 14.0, 9.0, 9.0, 8.0, 5.0, 9.0, 2.0, 5.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.213958740234375, -49.490150451660156, -47.7663459777832, -46.042537689208984, -44.318729400634766, -42.59492492675781, -40.871116638183594, -39.147308349609375, -37.423500061035156, -35.69969177246094, -33.975887298583984, -32.252079010009766, -30.528270721435547, -28.80446434020996, -27.080657958984375, -25.356849670410156, -23.633045196533203, -21.909238815307617, -20.1854305267334, -18.461624145507812, -16.737815856933594, -15.014009475708008, -13.290203094482422, -11.56639575958252, -9.842588424682617, -8.118781089782715, -6.394974231719971, -4.671167373657227, -2.947360038757324, -1.2235527038574219, 0.5002536773681641, 2.2240610122680664, 3.9478721618652344, 5.671679496765137, 7.395486354827881, 9.119293212890625, 10.843100547790527, 12.56690788269043, 14.290714263916016, 16.014522552490234, 17.73832893371582, 19.462135314941406, 21.185943603515625, 22.90974998474121, 24.633556365966797, 26.357364654541016, 28.0811710357666, 29.804977416992188, 31.528785705566406, 33.252593994140625, 34.97639846801758, 36.7002067565918, 38.424015045166016, 40.14781951904297, 41.87162780761719, 43.595436096191406, 45.319244384765625, 47.043052673339844, 48.7668571472168, 50.490665435791016, 52.214473724365234, 53.93827819824219, 55.662086486816406, 57.385894775390625, 59.10969924926758]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 8.0, 6.0, 13.0, 18.0, 29.0, 48.0, 73.0, 121.0, 183.0, 350.0, 691.0, 1576.0, 4173.0, 12860.0, 52938.0, 326773.0, 2147083.0, 1407051.0, 191501.0, 34427.0, 8672.0, 3011.0, 1246.0, 595.0, 318.0, 170.0, 120.0, 71.0, 43.0, 24.0, 19.0, 20.0, 10.0, 7.0, 9.0, 8.0, 6.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.62445068359375, -6.3778076171875, -6.13116455078125, -5.884521484375, -5.63787841796875, -5.3912353515625, -5.14459228515625, -4.89794921875, -4.65130615234375, -4.4046630859375, -4.15802001953125, -3.911376953125, -3.66473388671875, -3.4180908203125, -3.17144775390625, -2.9248046875, -2.67816162109375, -2.4315185546875, -2.18487548828125, -1.938232421875, -1.69158935546875, -1.4449462890625, -1.19830322265625, -0.95166015625, -0.70501708984375, -0.4583740234375, -0.21173095703125, 0.034912109375, 0.28155517578125, 0.5281982421875, 0.77484130859375, 1.021484375, 1.26812744140625, 1.5147705078125, 1.76141357421875, 2.008056640625, 2.25469970703125, 2.5013427734375, 2.74798583984375, 2.99462890625, 3.24127197265625, 3.4879150390625, 3.73455810546875, 3.981201171875, 4.22784423828125, 4.4744873046875, 4.72113037109375, 4.9677734375, 5.21441650390625, 5.4610595703125, 5.70770263671875, 5.954345703125, 6.20098876953125, 6.4476318359375, 6.69427490234375, 6.94091796875, 7.18756103515625, 7.4342041015625, 7.68084716796875, 7.927490234375, 8.17413330078125, 8.4207763671875, 8.66741943359375, 8.9140625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 12.0, 10.0, 8.0, 13.0, 16.0, 9.0, 17.0, 14.0, 24.0, 27.0, 22.0, 33.0, 39.0, 29.0, 36.0, 41.0, 42.0, 49.0, 37.0, 44.0, 37.0, 57.0, 45.0, 50.0, 38.0, 31.0, 38.0, 30.0, 24.0, 18.0, 12.0, 21.0, 16.0, 7.0, 8.0, 4.0, 5.0, 6.0, 3.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.09765625, -3.003173828125, -2.90869140625, -2.814208984375, -2.7197265625, -2.625244140625, -2.53076171875, -2.436279296875, -2.341796875, -2.247314453125, -2.15283203125, -2.058349609375, -1.9638671875, -1.869384765625, -1.77490234375, -1.680419921875, -1.5859375, -1.491455078125, -1.39697265625, -1.302490234375, -1.2080078125, -1.113525390625, -1.01904296875, -0.924560546875, -0.830078125, -0.735595703125, -0.64111328125, -0.546630859375, -0.4521484375, -0.357666015625, -0.26318359375, -0.168701171875, -0.07421875, 0.020263671875, 0.11474609375, 0.209228515625, 0.3037109375, 0.398193359375, 0.49267578125, 0.587158203125, 0.681640625, 0.776123046875, 0.87060546875, 0.965087890625, 1.0595703125, 1.154052734375, 1.24853515625, 1.343017578125, 1.4375, 1.531982421875, 1.62646484375, 1.720947265625, 1.8154296875, 1.909912109375, 2.00439453125, 2.098876953125, 2.193359375, 2.287841796875, 2.38232421875, 2.476806640625, 2.5712890625, 2.665771484375, 2.76025390625, 2.854736328125, 2.94921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 5.0, 7.0, 4.0, 8.0, 17.0, 17.0, 30.0, 45.0, 71.0, 132.0, 205.0, 396.0, 843.0, 2022.0, 6413.0, 67242.0, 3853691.0, 247153.0, 11091.0, 2687.0, 1061.0, 495.0, 260.0, 142.0, 83.0, 45.0, 36.0, 19.0, 10.0, 13.0, 8.0, 6.0, 1.0, 5.0, 1.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.6171875, -19.921875, -19.2265625, -18.53125, -17.8359375, -17.140625, -16.4453125, -15.75, -15.0546875, -14.359375, -13.6640625, -12.96875, -12.2734375, -11.578125, -10.8828125, -10.1875, -9.4921875, -8.796875, -8.1015625, -7.40625, -6.7109375, -6.015625, -5.3203125, -4.625, -3.9296875, -3.234375, -2.5390625, -1.84375, -1.1484375, -0.453125, 0.2421875, 0.9375, 1.6328125, 2.328125, 3.0234375, 3.71875, 4.4140625, 5.109375, 5.8046875, 6.5, 7.1953125, 7.890625, 8.5859375, 9.28125, 9.9765625, 10.671875, 11.3671875, 12.0625, 12.7578125, 13.453125, 14.1484375, 14.84375, 15.5390625, 16.234375, 16.9296875, 17.625, 18.3203125, 19.015625, 19.7109375, 20.40625, 21.1015625, 21.796875, 22.4921875, 23.1875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 16.0, 17.0, 33.0, 36.0, 59.0, 109.0, 147.0, 284.0, 387.0, 586.0, 716.0, 627.0, 376.0, 239.0, 146.0, 102.0, 76.0, 35.0, 21.0, 14.0, 16.0, 9.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6875, -13.22314453125, -12.7587890625, -12.29443359375, -11.830078125, -11.36572265625, -10.9013671875, -10.43701171875, -9.97265625, -9.50830078125, -9.0439453125, -8.57958984375, -8.115234375, -7.65087890625, -7.1865234375, -6.72216796875, -6.2578125, -5.79345703125, -5.3291015625, -4.86474609375, -4.400390625, -3.93603515625, -3.4716796875, -3.00732421875, -2.54296875, -2.07861328125, -1.6142578125, -1.14990234375, -0.685546875, -0.22119140625, 0.2431640625, 0.70751953125, 1.171875, 1.63623046875, 2.1005859375, 2.56494140625, 3.029296875, 3.49365234375, 3.9580078125, 4.42236328125, 4.88671875, 5.35107421875, 5.8154296875, 6.27978515625, 6.744140625, 7.20849609375, 7.6728515625, 8.13720703125, 8.6015625, 9.06591796875, 9.5302734375, 9.99462890625, 10.458984375, 10.92333984375, 11.3876953125, 11.85205078125, 12.31640625, 12.78076171875, 13.2451171875, 13.70947265625, 14.173828125, 14.63818359375, 15.1025390625, 15.56689453125, 16.03125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 9.0, 4.0, 12.0, 22.0, 53.0, 101.0, 133.0, 238.0, 201.0, 98.0, 51.0, 29.0, 10.0, 13.0, 9.0, 7.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-222.80076599121094, -217.55882263183594, -212.31687927246094, -207.07493591308594, -201.83299255371094, -196.591064453125, -191.34912109375, -186.107177734375, -180.865234375, -175.623291015625, -170.38134765625, -165.139404296875, -159.8974609375, -154.655517578125, -149.41357421875, -144.17164611816406, -138.9296875, -133.687744140625, -128.44580078125, -123.203857421875, -117.96192169189453, -112.71997833251953, -107.47803497314453, -102.23609924316406, -96.99415588378906, -91.75221252441406, -86.51026916503906, -81.26832580566406, -76.0263900756836, -70.7844467163086, -65.5425033569336, -60.30056381225586, -55.058624267578125, -49.816680908203125, -44.57474136352539, -39.33279800415039, -34.090858459472656, -28.848915100097656, -23.606971740722656, -18.365032196044922, -13.123088836669922, -7.8811469078063965, -2.639204978942871, 2.6027374267578125, 7.84467887878418, 13.086620330810547, 18.328563690185547, 23.57050323486328, 28.81244659423828, 34.05438995361328, 39.296329498291016, 44.538272857666016, 49.78021240234375, 55.02215576171875, 60.26409912109375, 65.50604248046875, 70.74798583984375, 75.98992919921875, 81.23187255859375, 86.47381591796875, 91.71575164794922, 96.95769500732422, 102.19963836669922, 107.44157409667969, 112.68351745605469]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 17.0, 25.0, 21.0, 32.0, 35.0, 51.0, 55.0, 81.0, 71.0, 99.0, 85.0, 78.0, 73.0, 64.0, 49.0, 42.0, 31.0, 22.0, 17.0, 13.0, 15.0, 8.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-109.1646728515625, -106.04253387451172, -102.92040252685547, -99.79826354980469, -96.67613220214844, -93.55399322509766, -90.43185424804688, -87.30972290039062, -84.18758392333984, -81.06544494628906, -77.94331359863281, -74.82117462158203, -71.69904327392578, -68.576904296875, -65.45477294921875, -62.33263397216797, -59.21049880981445, -56.08836364746094, -52.96622848510742, -49.844093322753906, -46.721954345703125, -43.59981918334961, -40.477684020996094, -37.35554504394531, -34.23341369628906, -31.111278533935547, -27.9891414642334, -24.867006301879883, -21.744869232177734, -18.62273406982422, -15.500598907470703, -12.378461837768555, -9.256324768066406, -6.134188652038574, -3.0120530128479004, 0.11008262634277344, 3.2322187423706055, 6.3543548583984375, 9.476490020751953, 12.598627090454102, 15.720762252807617, 18.842897415161133, 21.96503448486328, 25.087169647216797, 28.209304809570312, 31.33144187927246, 34.453575134277344, 37.575714111328125, 40.69784927368164, 43.819984436035156, 46.94211959838867, 50.06425476074219, 53.18639373779297, 56.308528900146484, 59.4306640625, 62.55280303955078, 65.67493438720703, 68.79707336425781, 71.91920471191406, 75.04134368896484, 78.1634750366211, 81.28561401367188, 84.40774536132812, 87.5298843383789, 90.65202331542969]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 7.0, 13.0, 23.0, 17.0, 29.0, 62.0, 101.0, 182.0, 233.0, 500.0, 895.0, 1697.0, 3750.0, 9136.0, 26375.0, 95505.0, 532492.0, 286830.0, 60010.0, 17967.0, 6749.0, 2873.0, 1402.0, 720.0, 399.0, 206.0, 158.0, 75.0, 48.0, 26.0, 19.0, 11.0, 11.0, 8.0, 3.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-6.3046875, -6.10662841796875, -5.9085693359375, -5.71051025390625, -5.512451171875, -5.31439208984375, -5.1163330078125, -4.91827392578125, -4.72021484375, -4.52215576171875, -4.3240966796875, -4.12603759765625, -3.927978515625, -3.72991943359375, -3.5318603515625, -3.33380126953125, -3.1357421875, -2.93768310546875, -2.7396240234375, -2.54156494140625, -2.343505859375, -2.14544677734375, -1.9473876953125, -1.74932861328125, -1.55126953125, -1.35321044921875, -1.1551513671875, -0.95709228515625, -0.759033203125, -0.56097412109375, -0.3629150390625, -0.16485595703125, 0.033203125, 0.23126220703125, 0.4293212890625, 0.62738037109375, 0.825439453125, 1.02349853515625, 1.2215576171875, 1.41961669921875, 1.61767578125, 1.81573486328125, 2.0137939453125, 2.21185302734375, 2.409912109375, 2.60797119140625, 2.8060302734375, 3.00408935546875, 3.2021484375, 3.40020751953125, 3.5982666015625, 3.79632568359375, 3.994384765625, 4.19244384765625, 4.3905029296875, 4.58856201171875, 4.78662109375, 4.98468017578125, 5.1827392578125, 5.38079833984375, 5.578857421875, 5.77691650390625, 5.9749755859375, 6.17303466796875, 6.37109375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 8.0, 8.0, 6.0, 4.0, 10.0, 12.0, 11.0, 20.0, 19.0, 28.0, 26.0, 33.0, 26.0, 38.0, 57.0, 60.0, 56.0, 51.0, 56.0, 54.0, 57.0, 63.0, 39.0, 37.0, 30.0, 32.0, 30.0, 22.0, 20.0, 17.0, 18.0, 16.0, 12.0, 5.0, 5.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.17578125, -5.0106201171875, -4.845458984375, -4.6802978515625, -4.51513671875, -4.3499755859375, -4.184814453125, -4.0196533203125, -3.8544921875, -3.6893310546875, -3.524169921875, -3.3590087890625, -3.19384765625, -3.0286865234375, -2.863525390625, -2.6983642578125, -2.533203125, -2.3680419921875, -2.202880859375, -2.0377197265625, -1.87255859375, -1.7073974609375, -1.542236328125, -1.3770751953125, -1.2119140625, -1.0467529296875, -0.881591796875, -0.7164306640625, -0.55126953125, -0.3861083984375, -0.220947265625, -0.0557861328125, 0.109375, 0.2745361328125, 0.439697265625, 0.6048583984375, 0.77001953125, 0.9351806640625, 1.100341796875, 1.2655029296875, 1.4306640625, 1.5958251953125, 1.760986328125, 1.9261474609375, 2.09130859375, 2.2564697265625, 2.421630859375, 2.5867919921875, 2.751953125, 2.9171142578125, 3.082275390625, 3.2474365234375, 3.41259765625, 3.5777587890625, 3.742919921875, 3.9080810546875, 4.0732421875, 4.2384033203125, 4.403564453125, 4.5687255859375, 4.73388671875, 4.8990478515625, 5.064208984375, 5.2293701171875, 5.39453125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 3.0, 6.0, 10.0, 20.0, 18.0, 29.0, 38.0, 55.0, 106.0, 156.0, 332.0, 591.0, 1612.0, 6048.0, 40699.0, 886302.0, 97014.0, 11195.0, 2505.0, 856.0, 406.0, 212.0, 126.0, 59.0, 51.0, 27.0, 14.0, 15.0, 12.0, 8.0, 9.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-12.2890625, -11.9539794921875, -11.618896484375, -11.2838134765625, -10.94873046875, -10.6136474609375, -10.278564453125, -9.9434814453125, -9.6083984375, -9.2733154296875, -8.938232421875, -8.6031494140625, -8.26806640625, -7.9329833984375, -7.597900390625, -7.2628173828125, -6.927734375, -6.5926513671875, -6.257568359375, -5.9224853515625, -5.58740234375, -5.2523193359375, -4.917236328125, -4.5821533203125, -4.2470703125, -3.9119873046875, -3.576904296875, -3.2418212890625, -2.90673828125, -2.5716552734375, -2.236572265625, -1.9014892578125, -1.56640625, -1.2313232421875, -0.896240234375, -0.5611572265625, -0.22607421875, 0.1090087890625, 0.444091796875, 0.7791748046875, 1.1142578125, 1.4493408203125, 1.784423828125, 2.1195068359375, 2.45458984375, 2.7896728515625, 3.124755859375, 3.4598388671875, 3.794921875, 4.1300048828125, 4.465087890625, 4.8001708984375, 5.13525390625, 5.4703369140625, 5.805419921875, 6.1405029296875, 6.4755859375, 6.8106689453125, 7.145751953125, 7.4808349609375, 7.81591796875, 8.1510009765625, 8.486083984375, 8.8211669921875, 9.15625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 2.0, 2.0, 2.0, 4.0, 6.0, 4.0, 6.0, 10.0, 7.0, 7.0, 12.0, 7.0, 22.0, 17.0, 19.0, 13.0, 30.0, 25.0, 33.0, 30.0, 39.0, 41.0, 64.0, 52.0, 73.0, 73.0, 50.0, 49.0, 39.0, 38.0, 21.0, 21.0, 19.0, 20.0, 23.0, 18.0, 20.0, 16.0, 12.0, 8.0, 6.0, 7.0, 5.0, 10.0, 7.0, 9.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-18.0, -17.480712890625, -16.96142578125, -16.442138671875, -15.9228515625, -15.403564453125, -14.88427734375, -14.364990234375, -13.845703125, -13.326416015625, -12.80712890625, -12.287841796875, -11.7685546875, -11.249267578125, -10.72998046875, -10.210693359375, -9.69140625, -9.172119140625, -8.65283203125, -8.133544921875, -7.6142578125, -7.094970703125, -6.57568359375, -6.056396484375, -5.537109375, -5.017822265625, -4.49853515625, -3.979248046875, -3.4599609375, -2.940673828125, -2.42138671875, -1.902099609375, -1.3828125, -0.863525390625, -0.34423828125, 0.175048828125, 0.6943359375, 1.213623046875, 1.73291015625, 2.252197265625, 2.771484375, 3.290771484375, 3.81005859375, 4.329345703125, 4.8486328125, 5.367919921875, 5.88720703125, 6.406494140625, 6.92578125, 7.445068359375, 7.96435546875, 8.483642578125, 9.0029296875, 9.522216796875, 10.04150390625, 10.560791015625, 11.080078125, 11.599365234375, 12.11865234375, 12.637939453125, 13.1572265625, 13.676513671875, 14.19580078125, 14.715087890625, 15.234375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 13.0, 11.0, 23.0, 29.0, 39.0, 74.0, 97.0, 190.0, 286.0, 548.0, 1331.0, 3545.0, 11864.0, 55834.0, 835249.0, 111677.0, 19042.0, 5150.0, 1848.0, 769.0, 372.0, 209.0, 128.0, 63.0, 43.0, 34.0, 19.0, 24.0, 7.0, 9.0, 7.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.00390625, -1.947723388671875, -1.89154052734375, -1.835357666015625, -1.7791748046875, -1.722991943359375, -1.66680908203125, -1.610626220703125, -1.554443359375, -1.498260498046875, -1.44207763671875, -1.385894775390625, -1.3297119140625, -1.273529052734375, -1.21734619140625, -1.161163330078125, -1.10498046875, -1.048797607421875, -0.99261474609375, -0.936431884765625, -0.8802490234375, -0.824066162109375, -0.76788330078125, -0.711700439453125, -0.655517578125, -0.599334716796875, -0.54315185546875, -0.486968994140625, -0.4307861328125, -0.374603271484375, -0.31842041015625, -0.262237548828125, -0.2060546875, -0.149871826171875, -0.09368896484375, -0.037506103515625, 0.0186767578125, 0.074859619140625, 0.13104248046875, 0.187225341796875, 0.243408203125, 0.299591064453125, 0.35577392578125, 0.411956787109375, 0.4681396484375, 0.524322509765625, 0.58050537109375, 0.636688232421875, 0.69287109375, 0.749053955078125, 0.80523681640625, 0.861419677734375, 0.9176025390625, 0.973785400390625, 1.02996826171875, 1.086151123046875, 1.142333984375, 1.198516845703125, 1.25469970703125, 1.310882568359375, 1.3670654296875, 1.423248291015625, 1.47943115234375, 1.535614013671875, 1.591796875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 4.0, 2.0, 5.0, 12.0, 5.0, 13.0, 24.0, 16.0, 26.0, 26.0, 41.0, 47.0, 79.0, 101.0, 129.0, 102.0, 84.0, 74.0, 48.0, 34.0, 24.0, 19.0, 15.0, 11.0, 11.0, 7.0, 7.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040411949157714844, -0.00039057061076164246, -0.0003770217299461365, -0.0003634728491306305, -0.0003499239683151245, -0.00033637508749961853, -0.00032282620668411255, -0.00030927732586860657, -0.0002957284450531006, -0.0002821795642375946, -0.0002686306834220886, -0.00025508180260658264, -0.00024153292179107666, -0.00022798404097557068, -0.0002144351601600647, -0.00020088627934455872, -0.00018733739852905273, -0.00017378851771354675, -0.00016023963689804077, -0.0001466907560825348, -0.0001331418752670288, -0.00011959299445152283, -0.00010604411363601685, -9.249523282051086e-05, -7.894635200500488e-05, -6.53974711894989e-05, -5.184859037399292e-05, -3.829970955848694e-05, -2.4750828742980957e-05, -1.1201947927474976e-05, 2.346932888031006e-06, 1.5895813703536987e-05, 2.944469451904297e-05, 4.299357533454895e-05, 5.654245615005493e-05, 7.009133696556091e-05, 8.36402177810669e-05, 9.718909859657288e-05, 0.00011073797941207886, 0.00012428686022758484, 0.00013783574104309082, 0.0001513846218585968, 0.00016493350267410278, 0.00017848238348960876, 0.00019203126430511475, 0.00020558014512062073, 0.0002191290259361267, 0.0002326779067516327, 0.00024622678756713867, 0.00025977566838264465, 0.00027332454919815063, 0.0002868734300136566, 0.0003004223108291626, 0.0003139711916446686, 0.00032752007246017456, 0.00034106895327568054, 0.0003546178340911865, 0.0003681667149066925, 0.0003817155957221985, 0.00039526447653770447, 0.00040881335735321045, 0.00042236223816871643, 0.0004359111189842224, 0.0004494599997997284, 0.0004630088806152344]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 10.0, 4.0, 8.0, 17.0, 20.0, 21.0, 27.0, 35.0, 53.0, 75.0, 137.0, 187.0, 294.0, 551.0, 834.0, 1552.0, 3213.0, 7542.0, 19814.0, 71761.0, 773468.0, 121446.0, 28654.0, 10132.0, 4131.0, 1949.0, 1031.0, 571.0, 355.0, 209.0, 149.0, 106.0, 60.0, 44.0, 30.0, 15.0, 13.0, 6.0, 9.0, 6.0, 3.0, 7.0, 1.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-1.830078125, -1.77874755859375, -1.7274169921875, -1.67608642578125, -1.624755859375, -1.57342529296875, -1.5220947265625, -1.47076416015625, -1.41943359375, -1.36810302734375, -1.3167724609375, -1.26544189453125, -1.214111328125, -1.16278076171875, -1.1114501953125, -1.06011962890625, -1.0087890625, -0.95745849609375, -0.9061279296875, -0.85479736328125, -0.803466796875, -0.75213623046875, -0.7008056640625, -0.64947509765625, -0.59814453125, -0.54681396484375, -0.4954833984375, -0.44415283203125, -0.392822265625, -0.34149169921875, -0.2901611328125, -0.23883056640625, -0.1875, -0.13616943359375, -0.0848388671875, -0.03350830078125, 0.017822265625, 0.06915283203125, 0.1204833984375, 0.17181396484375, 0.22314453125, 0.27447509765625, 0.3258056640625, 0.37713623046875, 0.428466796875, 0.47979736328125, 0.5311279296875, 0.58245849609375, 0.6337890625, 0.68511962890625, 0.7364501953125, 0.78778076171875, 0.839111328125, 0.89044189453125, 0.9417724609375, 0.99310302734375, 1.04443359375, 1.09576416015625, 1.1470947265625, 1.19842529296875, 1.249755859375, 1.30108642578125, 1.3524169921875, 1.40374755859375, 1.455078125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 6.0, 8.0, 5.0, 11.0, 18.0, 23.0, 26.0, 34.0, 56.0, 59.0, 67.0, 89.0, 79.0, 87.0, 85.0, 67.0, 62.0, 45.0, 32.0, 29.0, 31.0, 11.0, 17.0, 13.0, 7.0, 7.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9326171875, -1.8752593994140625, -1.817901611328125, -1.7605438232421875, -1.70318603515625, -1.6458282470703125, -1.588470458984375, -1.5311126708984375, -1.4737548828125, -1.4163970947265625, -1.359039306640625, -1.3016815185546875, -1.24432373046875, -1.1869659423828125, -1.129608154296875, -1.0722503662109375, -1.014892578125, -0.9575347900390625, -0.900177001953125, -0.8428192138671875, -0.78546142578125, -0.7281036376953125, -0.670745849609375, -0.6133880615234375, -0.5560302734375, -0.4986724853515625, -0.441314697265625, -0.3839569091796875, -0.32659912109375, -0.2692413330078125, -0.211883544921875, -0.1545257568359375, -0.09716796875, -0.0398101806640625, 0.017547607421875, 0.0749053955078125, 0.13226318359375, 0.1896209716796875, 0.246978759765625, 0.3043365478515625, 0.3616943359375, 0.4190521240234375, 0.476409912109375, 0.5337677001953125, 0.59112548828125, 0.6484832763671875, 0.705841064453125, 0.7631988525390625, 0.820556640625, 0.8779144287109375, 0.935272216796875, 0.9926300048828125, 1.04998779296875, 1.1073455810546875, 1.164703369140625, 1.2220611572265625, 1.2794189453125, 1.3367767333984375, 1.394134521484375, 1.4514923095703125, 1.50885009765625, 1.5662078857421875, 1.623565673828125, 1.6809234619140625, 1.73828125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 7.0, 9.0, 13.0, 31.0, 65.0, 105.0, 431.0, 213.0, 66.0, 30.0, 11.0, 5.0, 6.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.72777557373047, -117.690185546875, -114.65259552001953, -111.61500549316406, -108.57740783691406, -105.5398178100586, -102.50222778320312, -99.46463775634766, -96.42704772949219, -93.38945770263672, -90.35186767578125, -87.31427001953125, -84.27667999267578, -81.23908996582031, -78.20149993896484, -75.16390991210938, -72.12631225585938, -69.0887222290039, -66.05113220214844, -63.0135383605957, -59.97594451904297, -56.9383544921875, -53.90076446533203, -50.86317443847656, -47.82558059692383, -44.78799057006836, -41.750396728515625, -38.712806701660156, -35.67521667480469, -32.63762283325195, -29.600032806396484, -26.562440872192383, -23.524856567382812, -20.48726463317871, -17.44967269897461, -14.41208267211914, -11.374490737915039, -8.336898803710938, -5.299308776855469, -2.261716842651367, 0.7758750915527344, 3.8134665489196777, 6.851058006286621, 9.888648986816406, 12.926240921020508, 15.96383285522461, 19.001422882080078, 22.03901481628418, 25.07660675048828, 28.114198684692383, 31.151790618896484, 34.18938064575195, 37.22697448730469, 40.264564514160156, 43.302154541015625, 46.339744567871094, 49.37733840942383, 52.4149284362793, 55.45252227783203, 58.4901123046875, 61.52770233154297, 64.56529235839844, 67.60289001464844, 70.6404800415039, 73.67807006835938]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 4.0, 2.0, 6.0, 11.0, 3.0, 15.0, 17.0, 24.0, 20.0, 23.0, 35.0, 37.0, 79.0, 123.0, 172.0, 138.0, 74.0, 41.0, 28.0, 21.0, 26.0, 21.0, 22.0, 12.0, 10.0, 8.0, 10.0, 6.0, 6.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.70097351074219, -54.47761154174805, -52.254249572753906, -50.0308837890625, -47.80752182006836, -45.58415985107422, -43.36079406738281, -41.13743209838867, -38.91407012939453, -36.69070816040039, -34.46734619140625, -32.243980407714844, -30.020618438720703, -27.797256469726562, -25.57389259338379, -23.350528717041016, -21.127166748046875, -18.903804779052734, -16.68044090270996, -14.457077980041504, -12.233715057373047, -10.01035213470459, -7.786989212036133, -5.563626289367676, -3.3402633666992188, -1.1169004440307617, 1.1064624786376953, 3.3298254013061523, 5.553188323974609, 7.776551246643066, 9.999914169311523, 12.22327709197998, 14.446632385253906, 16.669994354248047, 18.89335823059082, 21.116722106933594, 23.340084075927734, 25.563446044921875, 27.78680992126465, 30.010173797607422, 32.23353576660156, 34.4568977355957, 36.680259704589844, 38.90362548828125, 41.12698745727539, 43.35034942626953, 45.57371520996094, 47.79707717895508, 50.02043914794922, 52.24380111694336, 54.4671630859375, 56.690528869628906, 58.91389083862305, 61.13725280761719, 63.360618591308594, 65.58397674560547, 67.80734252929688, 70.03070831298828, 72.25406646728516, 74.47743225097656, 76.70079040527344, 78.92415618896484, 81.14752197265625, 83.37088012695312, 85.59424591064453]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 8.0, 12.0, 11.0, 10.0, 21.0, 19.0, 24.0, 27.0, 33.0, 51.0, 56.0, 131.0, 223.0, 72.0, 57.0, 42.0, 49.0, 27.0, 21.0, 27.0, 18.0, 13.0, 13.0, 4.0, 8.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.15234375, -5.9486083984375, -5.744873046875, -5.5411376953125, -5.33740234375, -5.1336669921875, -4.929931640625, -4.7261962890625, -4.5224609375, -4.3187255859375, -4.114990234375, -3.9112548828125, -3.70751953125, -3.5037841796875, -3.300048828125, -3.0963134765625, -2.892578125, -2.6888427734375, -2.485107421875, -2.2813720703125, -2.07763671875, -1.8739013671875, -1.670166015625, -1.4664306640625, -1.2626953125, -1.0589599609375, -0.855224609375, -0.6514892578125, -0.44775390625, -0.2440185546875, -0.040283203125, 0.1634521484375, 0.3671875, 0.5709228515625, 0.774658203125, 0.9783935546875, 1.18212890625, 1.3858642578125, 1.589599609375, 1.7933349609375, 1.9970703125, 2.2008056640625, 2.404541015625, 2.6082763671875, 2.81201171875, 3.0157470703125, 3.219482421875, 3.4232177734375, 3.626953125, 3.8306884765625, 4.034423828125, 4.2381591796875, 4.44189453125, 4.6456298828125, 4.849365234375, 5.0531005859375, 5.2568359375, 5.4605712890625, 5.664306640625, 5.8680419921875, 6.07177734375, 6.2755126953125, 6.479248046875, 6.6829833984375, 6.88671875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 6.0, 16.0, 35.0, 54.0, 64.0, 99.0, 189.0, 639.0, 2668.0, 22094.0, 8347694.0, 12133.0, 1922.0, 501.0, 182.0, 99.0, 58.0, 26.0, 23.0, 13.0, 11.0, 9.0, 7.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.262577056884766, -56.704315185546875, -55.14605712890625, -53.58779525756836, -52.02953338623047, -50.47127151489258, -48.91300964355469, -47.35475158691406, -45.79648971557617, -44.23822784423828, -42.679969787597656, -41.121707916259766, -39.563446044921875, -38.005184173583984, -36.446922302246094, -34.88866424560547, -33.33040237426758, -31.772140502929688, -30.21388053894043, -28.655620574951172, -27.09735870361328, -25.53909683227539, -23.980836868286133, -22.422576904296875, -20.864315032958984, -19.306053161621094, -17.747793197631836, -16.189533233642578, -14.631271362304688, -13.073010444641113, -11.514749526977539, -9.956488609313965, -8.39822769165039, -6.839966773986816, -5.281705856323242, -3.723444938659668, -2.1651840209960938, -0.6069231033325195, 0.9513378143310547, 2.509598731994629, 4.067859649658203, 5.626120567321777, 7.184381484985352, 8.742642402648926, 10.3009033203125, 11.859164237976074, 13.417425155639648, 14.975686073303223, 16.533946990966797, 18.092208862304688, 19.650468826293945, 21.208728790283203, 22.766990661621094, 24.325252532958984, 25.883512496948242, 27.4417724609375, 29.00003433227539, 30.55829620361328, 32.116554260253906, 33.6748161315918, 35.23307800292969, 36.79133987426758, 38.34960174560547, 39.907859802246094, 41.466121673583984]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 3.0, 3.0, 5.0, 8.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.58476638793945, -54.015106201171875, -52.44544219970703, -50.87578201293945, -49.30611801147461, -47.73645782470703, -46.16679382324219, -44.59713363647461, -43.02747344970703, -41.45781326293945, -39.88814926147461, -38.31848907470703, -36.74882507324219, -35.17916488647461, -33.60950469970703, -32.03984069824219, -30.470176696777344, -28.900514602661133, -27.330852508544922, -25.761192321777344, -24.1915283203125, -22.621868133544922, -21.05220603942871, -19.4825439453125, -17.91288185119629, -16.343219757080078, -14.773557662963867, -13.203896522521973, -11.634234428405762, -10.06457233428955, -8.494911193847656, -6.925249099731445, -5.3555908203125, -3.785928964614868, -2.2162671089172363, -0.6466054916381836, 0.9230566024780273, 2.4927186965942383, 4.062379837036133, 5.632041931152344, 7.201704025268555, 8.771366119384766, 10.341028213500977, 11.910689353942871, 13.480351448059082, 15.050013542175293, 16.619674682617188, 18.1893367767334, 19.75899887084961, 21.32866096496582, 22.89832305908203, 24.46798324584961, 26.037647247314453, 27.60730743408203, 29.176969528198242, 30.746631622314453, 32.31629180908203, 33.88595199584961, 35.45561599731445, 37.02527618408203, 38.594940185546875, 40.16460037231445, 41.73426055908203, 43.303924560546875, 44.87358856201172]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 11.0, 19.0, 22.0, 35.0, 53.0, 72.0, 102.0, 118.0, 111.0, 112.0, 106.0, 82.0, 65.0, 32.0, 25.0, 16.0, 9.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5, -7.27679443359375, -7.0535888671875, -6.83038330078125, -6.607177734375, -6.38397216796875, -6.1607666015625, -5.93756103515625, -5.71435546875, -5.49114990234375, -5.2679443359375, -5.04473876953125, -4.821533203125, -4.59832763671875, -4.3751220703125, -4.15191650390625, -3.9287109375, -3.70550537109375, -3.4822998046875, -3.25909423828125, -3.035888671875, -2.81268310546875, -2.5894775390625, -2.36627197265625, -2.14306640625, -1.91986083984375, -1.6966552734375, -1.47344970703125, -1.250244140625, -1.02703857421875, -0.8038330078125, -0.58062744140625, -0.357421875, -0.13421630859375, 0.0889892578125, 0.31219482421875, 0.535400390625, 0.75860595703125, 0.9818115234375, 1.20501708984375, 1.42822265625, 1.65142822265625, 1.8746337890625, 2.09783935546875, 2.321044921875, 2.54425048828125, 2.7674560546875, 2.99066162109375, 3.2138671875, 3.43707275390625, 3.6602783203125, 3.88348388671875, 4.106689453125, 4.32989501953125, 4.5531005859375, 4.77630615234375, 4.99951171875, 5.22271728515625, 5.4459228515625, 5.66912841796875, 5.892333984375, 6.11553955078125, 6.3387451171875, 6.56195068359375, 6.78515625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 9.0, 10.0, 21.0, 33.0, 55.0, 69.0, 134.0, 263.0, 429.0, 837.0, 1930.0, 4268.0, 9701.0, 23755.0, 60081.0, 139191.0, 156424.0, 74448.0, 30098.0, 12387.0, 5279.0, 2357.0, 1137.0, 595.0, 291.0, 196.0, 96.0, 67.0, 32.0, 25.0, 15.0, 14.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.421875, -27.563720703125, -26.70556640625, -25.847412109375, -24.9892578125, -24.131103515625, -23.27294921875, -22.414794921875, -21.556640625, -20.698486328125, -19.84033203125, -18.982177734375, -18.1240234375, -17.265869140625, -16.40771484375, -15.549560546875, -14.69140625, -13.833251953125, -12.97509765625, -12.116943359375, -11.2587890625, -10.400634765625, -9.54248046875, -8.684326171875, -7.826171875, -6.968017578125, -6.10986328125, -5.251708984375, -4.3935546875, -3.535400390625, -2.67724609375, -1.819091796875, -0.9609375, -0.102783203125, 0.75537109375, 1.613525390625, 2.4716796875, 3.329833984375, 4.18798828125, 5.046142578125, 5.904296875, 6.762451171875, 7.62060546875, 8.478759765625, 9.3369140625, 10.195068359375, 11.05322265625, 11.911376953125, 12.76953125, 13.627685546875, 14.48583984375, 15.343994140625, 16.2021484375, 17.060302734375, 17.91845703125, 18.776611328125, 19.634765625, 20.492919921875, 21.35107421875, 22.209228515625, 23.0673828125, 23.925537109375, 24.78369140625, 25.641845703125, 26.5]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 10.0, 11.0, 16.0, 24.0, 30.0, 31.0, 30.0, 29.0, 44.0, 55.0, 62.0, 85.0, 64.0, 70.0, 76.0, 60.0, 55.0, 40.0, 41.0, 32.0, 26.0, 20.0, 18.0, 16.0, 11.0, 10.0, 7.0, 5.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.7138671875, -5.548828125, -5.3837890625, -5.21875, -5.0537109375, -4.888671875, -4.7236328125, -4.55859375, -4.3935546875, -4.228515625, -4.0634765625, -3.8984375, -3.7333984375, -3.568359375, -3.4033203125, -3.23828125, -3.0732421875, -2.908203125, -2.7431640625, -2.578125, -2.4130859375, -2.248046875, -2.0830078125, -1.91796875, -1.7529296875, -1.587890625, -1.4228515625, -1.2578125, -1.0927734375, -0.927734375, -0.7626953125, -0.59765625, -0.4326171875, -0.267578125, -0.1025390625, 0.0625, 0.2275390625, 0.392578125, 0.5576171875, 0.72265625, 0.8876953125, 1.052734375, 1.2177734375, 1.3828125, 1.5478515625, 1.712890625, 1.8779296875, 2.04296875, 2.2080078125, 2.373046875, 2.5380859375, 2.703125, 2.8681640625, 3.033203125, 3.1982421875, 3.36328125, 3.5283203125, 3.693359375, 3.8583984375, 4.0234375, 4.1884765625, 4.353515625, 4.5185546875, 4.68359375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 6.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 17.0, 19.0, 39.0, 53.0, 62.0, 63.0, 62.0, 68.0, 35.0, 13.0, 10.0, 6.0, 6.0, 4.0, 6.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.748912811279297, -27.527360916137695, -26.305809020996094, -25.084259033203125, -23.862707138061523, -22.641155242919922, -21.419605255126953, -20.19805335998535, -18.97650146484375, -17.75494956970215, -16.533397674560547, -15.311847686767578, -14.090295791625977, -12.868743896484375, -11.64719295501709, -10.425642013549805, -9.204090118408203, -7.98253870010376, -6.760987281799316, -5.539435863494873, -4.31788444519043, -3.0963330268859863, -1.874781608581543, -0.6532306671142578, 0.5683212280273438, 1.789872646331787, 3.0114240646362305, 4.232975482940674, 5.454526901245117, 6.6760783195495605, 7.897629737854004, 9.119180679321289, 10.340736389160156, 11.562288284301758, 12.783839225769043, 14.005390167236328, 15.22694206237793, 16.44849395751953, 17.6700439453125, 18.8915958404541, 20.113147735595703, 21.334699630737305, 22.556251525878906, 23.777801513671875, 24.999353408813477, 26.220905303955078, 27.442455291748047, 28.66400718688965, 29.88555908203125, 31.10711097717285, 32.32866287231445, 33.55021286010742, 34.771766662597656, 35.993316650390625, 37.214866638183594, 38.43641662597656, 39.6579704284668, 40.879520416259766, 42.10107421875, 43.32262420654297, 44.54417419433594, 45.76572799682617, 46.98727798461914, 48.208831787109375, 49.430381774902344]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 7.0, 7.0, 5.0, 4.0, 13.0, 19.0, 18.0, 48.0, 42.0, 39.0, 56.0, 56.0, 40.0, 27.0, 25.0, 27.0, 9.0, 7.0, 3.0, 3.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.539997100830078, -23.715524673461914, -22.89105224609375, -22.066579818725586, -21.242107391357422, -20.417633056640625, -19.59316062927246, -18.768688201904297, -17.944215774536133, -17.11974334716797, -16.295270919799805, -15.470797538757324, -14.64632511138916, -13.821852684020996, -12.997379302978516, -12.172906875610352, -11.348434448242188, -10.523962020874023, -9.69948959350586, -8.875016212463379, -8.050543785095215, -7.226071357727051, -6.4015984535217285, -5.577125549316406, -4.752653121948242, -3.928180456161499, -3.103707790374756, -2.2792351245880127, -1.4547624588012695, -0.6302900314331055, 0.1941828727722168, 1.018655776977539, 1.843130111694336, 2.667602777481079, 3.4920754432678223, 4.3165483474731445, 5.141020774841309, 5.965493202209473, 6.789966106414795, 7.614439010620117, 8.438911437988281, 9.263383865356445, 10.08785629272461, 10.91232967376709, 11.736802101135254, 12.561274528503418, 13.385747909545898, 14.210220336914062, 15.034692764282227, 15.85916519165039, 16.683637619018555, 17.50811004638672, 18.332584381103516, 19.157054901123047, 19.981529235839844, 20.806001663208008, 21.630474090576172, 22.454946517944336, 23.2794189453125, 24.103891372680664, 24.928363800048828, 25.752838134765625, 26.57731056213379, 27.401782989501953, 28.226255416870117]}, "eval/loss": 1.6549711227416992, "eval/wer": 1.0372272907576359, "eval/runtime": 899.3827, "eval/samples_per_second": 2.938, "eval/steps_per_second": 0.368} \ No newline at end of file