diff --git "a/wandb/run-20220301_123331-3cwoccr3/files/wandb-summary.json" "b/wandb/run-20220301_123331-3cwoccr3/files/wandb-summary.json" --- "a/wandb/run-20220301_123331-3cwoccr3/files/wandb-summary.json" +++ "b/wandb/run-20220301_123331-3cwoccr3/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 4.4712, "train/learning_rate": 1.776e-05, "train/epoch": 1.0, "train/global_step": 297, "_runtime": 6038, "_timestamp": 1646144049, "_step": 298, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 80.0, 454.0, 412.0, 63.0, 7.0], "bins": [-318.0708923339844, -312.8525390625, -307.6341552734375, -302.4158020019531, -297.19744873046875, -291.97906494140625, -286.7607116699219, -281.5423583984375, -276.323974609375, -271.1056213378906, -265.8872375488281, -260.66888427734375, -255.45053100585938, -250.23216247558594, -245.0137939453125, -239.79544067382812, -234.57708740234375, -229.3587188720703, -224.14036560058594, -218.9219970703125, -213.70364379882812, -208.4852752685547, -203.26690673828125, -198.04855346679688, -192.83018493652344, -187.61181640625, -182.39346313476562, -177.1750946044922, -171.95672607421875, -166.73837280273438, -161.52000427246094, -156.3016357421875, -151.0832977294922, -145.86492919921875, -140.64657592773438, -135.42820739746094, -130.2098388671875, -124.99148559570312, -119.77311706542969, -114.55475616455078, -109.33639526367188, -104.11803436279297, -98.89967346191406, -93.68130493164062, -88.46294403076172, -83.24458312988281, -78.02621459960938, -72.80785369873047, -67.58949279785156, -62.371131896972656, -57.152767181396484, -51.93440246582031, -46.716041564941406, -41.4976806640625, -36.27931594848633, -31.060951232910156, -25.842588424682617, -20.624225616455078, -15.405862808227539, -10.1875, -4.969137191772461, 0.24922561645507812, 5.467588424682617, 10.685953140258789, 15.904314041137695]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 6.0, 7.0, 3.0, 10.0, 11.0, 9.0, 19.0, 15.0, 18.0, 23.0, 24.0, 31.0, 39.0, 35.0, 50.0, 48.0, 32.0, 32.0, 55.0, 49.0, 46.0, 44.0, 40.0, 48.0, 49.0, 35.0, 35.0, 17.0, 25.0, 20.0, 24.0, 21.0, 10.0, 11.0, 17.0, 12.0, 11.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-53.798095703125, -52.326568603515625, -50.855045318603516, -49.38351821899414, -47.911991119384766, -46.440467834472656, -44.96894073486328, -43.497413635253906, -42.0258903503418, -40.55436325073242, -39.08283996582031, -37.61131286621094, -36.13978576660156, -34.66826248168945, -33.19673538208008, -31.725210189819336, -30.25368309020996, -28.78215789794922, -27.310630798339844, -25.8391056060791, -24.36758041381836, -22.896053314208984, -21.424528121948242, -19.9530029296875, -18.481475830078125, -17.009950637817383, -15.538424491882324, -14.066898345947266, -12.595373153686523, -11.123847007751465, -9.652320861816406, -8.180795669555664, -6.709270477294922, -5.2377448081970215, -3.766218900680542, -2.2946929931640625, -0.8231673240661621, 0.6483583450317383, 2.119884490966797, 3.591409683227539, 5.062935829162598, 6.534461498260498, 8.005987167358398, 9.477513313293457, 10.949039459228516, 12.420564651489258, 13.892090797424316, 15.363615989685059, 16.835142135620117, 18.30666732788086, 19.778194427490234, 21.249719619750977, 22.72124481201172, 24.192771911621094, 25.664297103881836, 27.135822296142578, 28.607349395751953, 30.078874588012695, 31.55040168762207, 33.02192687988281, 34.49345397949219, 35.9649772644043, 37.43650436401367, 38.90802764892578, 40.379554748535156]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 9.0, 4.0, 11.0, 7.0, 11.0, 16.0, 21.0, 21.0, 19.0, 34.0, 36.0, 43.0, 53.0, 50.0, 49.0, 59.0, 40.0, 65.0, 44.0, 51.0, 36.0, 53.0, 32.0, 36.0, 40.0, 33.0, 17.0, 18.0, 20.0, 20.0, 15.0, 8.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6640625, -2.56243896484375, -2.4608154296875, -2.35919189453125, -2.257568359375, -2.15594482421875, -2.0543212890625, -1.95269775390625, -1.85107421875, -1.74945068359375, -1.6478271484375, -1.54620361328125, -1.444580078125, -1.34295654296875, -1.2413330078125, -1.13970947265625, -1.0380859375, -0.93646240234375, -0.8348388671875, -0.73321533203125, -0.631591796875, -0.52996826171875, -0.4283447265625, -0.32672119140625, -0.22509765625, -0.12347412109375, -0.0218505859375, 0.07977294921875, 0.181396484375, 0.28302001953125, 0.3846435546875, 0.48626708984375, 0.587890625, 0.68951416015625, 0.7911376953125, 0.89276123046875, 0.994384765625, 1.09600830078125, 1.1976318359375, 1.29925537109375, 1.40087890625, 1.50250244140625, 1.6041259765625, 1.70574951171875, 1.807373046875, 1.90899658203125, 2.0106201171875, 2.11224365234375, 2.2138671875, 2.31549072265625, 2.4171142578125, 2.51873779296875, 2.620361328125, 2.72198486328125, 2.8236083984375, 2.92523193359375, 3.02685546875, 3.12847900390625, 3.2301025390625, 3.33172607421875, 3.433349609375, 3.53497314453125, 3.6365966796875, 3.73822021484375, 3.83984375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 14.0, 15.0, 31.0, 36.0, 71.0, 96.0, 141.0, 272.0, 431.0, 785.0, 1472.0, 3077.0, 8438.0, 35158.0, 282709.0, 2640571.0, 1102198.0, 91797.0, 16868.0, 5230.0, 2197.0, 1143.0, 627.0, 311.0, 223.0, 139.0, 83.0, 62.0, 28.0, 16.0, 12.0, 8.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-13.3515625, -13.0157470703125, -12.679931640625, -12.3441162109375, -12.00830078125, -11.6724853515625, -11.336669921875, -11.0008544921875, -10.6650390625, -10.3292236328125, -9.993408203125, -9.6575927734375, -9.32177734375, -8.9859619140625, -8.650146484375, -8.3143310546875, -7.978515625, -7.6427001953125, -7.306884765625, -6.9710693359375, -6.63525390625, -6.2994384765625, -5.963623046875, -5.6278076171875, -5.2919921875, -4.9561767578125, -4.620361328125, -4.2845458984375, -3.94873046875, -3.6129150390625, -3.277099609375, -2.9412841796875, -2.60546875, -2.2696533203125, -1.933837890625, -1.5980224609375, -1.26220703125, -0.9263916015625, -0.590576171875, -0.2547607421875, 0.0810546875, 0.4168701171875, 0.752685546875, 1.0885009765625, 1.42431640625, 1.7601318359375, 2.095947265625, 2.4317626953125, 2.767578125, 3.1033935546875, 3.439208984375, 3.7750244140625, 4.11083984375, 4.4466552734375, 4.782470703125, 5.1182861328125, 5.4541015625, 5.7899169921875, 6.125732421875, 6.4615478515625, 6.79736328125, 7.1331787109375, 7.468994140625, 7.8048095703125, 8.140625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 12.0, 5.0, 9.0, 21.0, 15.0, 35.0, 44.0, 46.0, 61.0, 90.0, 149.0, 188.0, 275.0, 374.0, 517.0, 519.0, 462.0, 355.0, 266.0, 194.0, 133.0, 86.0, 68.0, 41.0, 32.0, 21.0, 15.0, 11.0, 8.0, 8.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.4921875, -11.1356201171875, -10.779052734375, -10.4224853515625, -10.06591796875, -9.7093505859375, -9.352783203125, -8.9962158203125, -8.6396484375, -8.2830810546875, -7.926513671875, -7.5699462890625, -7.21337890625, -6.8568115234375, -6.500244140625, -6.1436767578125, -5.787109375, -5.4305419921875, -5.073974609375, -4.7174072265625, -4.36083984375, -4.0042724609375, -3.647705078125, -3.2911376953125, -2.9345703125, -2.5780029296875, -2.221435546875, -1.8648681640625, -1.50830078125, -1.1517333984375, -0.795166015625, -0.4385986328125, -0.08203125, 0.2745361328125, 0.631103515625, 0.9876708984375, 1.34423828125, 1.7008056640625, 2.057373046875, 2.4139404296875, 2.7705078125, 3.1270751953125, 3.483642578125, 3.8402099609375, 4.19677734375, 4.5533447265625, 4.909912109375, 5.2664794921875, 5.623046875, 5.9796142578125, 6.336181640625, 6.6927490234375, 7.04931640625, 7.4058837890625, 7.762451171875, 8.1190185546875, 8.4755859375, 8.8321533203125, 9.188720703125, 9.5452880859375, 9.90185546875, 10.2584228515625, 10.614990234375, 10.9715576171875, 11.328125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 12.0, 17.0, 24.0, 41.0, 55.0, 88.0, 124.0, 161.0, 314.0, 490.0, 991.0, 2279.0, 8063.0, 299143.0, 3807389.0, 66341.0, 5035.0, 1750.0, 788.0, 416.0, 246.0, 162.0, 112.0, 60.0, 56.0, 30.0, 19.0, 17.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.59375, -34.380859375, -33.16796875, -31.955078125, -30.7421875, -29.529296875, -28.31640625, -27.103515625, -25.890625, -24.677734375, -23.46484375, -22.251953125, -21.0390625, -19.826171875, -18.61328125, -17.400390625, -16.1875, -14.974609375, -13.76171875, -12.548828125, -11.3359375, -10.123046875, -8.91015625, -7.697265625, -6.484375, -5.271484375, -4.05859375, -2.845703125, -1.6328125, -0.419921875, 0.79296875, 2.005859375, 3.21875, 4.431640625, 5.64453125, 6.857421875, 8.0703125, 9.283203125, 10.49609375, 11.708984375, 12.921875, 14.134765625, 15.34765625, 16.560546875, 17.7734375, 18.986328125, 20.19921875, 21.412109375, 22.625, 23.837890625, 25.05078125, 26.263671875, 27.4765625, 28.689453125, 29.90234375, 31.115234375, 32.328125, 33.541015625, 34.75390625, 35.966796875, 37.1796875, 38.392578125, 39.60546875, 40.818359375, 42.03125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 10.0, 40.0, 97.0, 209.0, 276.0, 201.0, 117.0, 37.0, 14.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.43179321289062, -77.31104278564453, -75.19029235839844, -73.06954956054688, -70.94879913330078, -68.82804870605469, -66.7072982788086, -64.5865478515625, -62.46580505371094, -60.345054626464844, -58.224308013916016, -56.10355758666992, -53.982810974121094, -51.862060546875, -49.741310119628906, -47.62056350708008, -45.499813079833984, -43.37906265258789, -41.25831604003906, -39.13756561279297, -37.01681900024414, -34.89606857299805, -32.77532196044922, -30.654571533203125, -28.533823013305664, -26.413074493408203, -24.292325973510742, -22.17157745361328, -20.050827026367188, -17.93008041381836, -15.809329986572266, -13.688581466674805, -11.567832946777344, -9.447084426879883, -7.326335430145264, -5.2055864334106445, -3.0848379135131836, -0.9640893936157227, 1.1566600799560547, 3.2774085998535156, 5.398157119750977, 7.5189056396484375, 9.639654159545898, 11.760403633117676, 13.881152153015137, 16.00189971923828, 18.122650146484375, 20.243398666381836, 22.364147186279297, 24.484895706176758, 26.60564422607422, 28.726394653320312, 30.84714126586914, 32.967891693115234, 35.08863830566406, 37.209388732910156, 39.33013916015625, 41.450889587402344, 43.57163619995117, 45.692386627197266, 47.813133239746094, 49.93388366699219, 52.05463409423828, 54.17538070678711, 56.29612731933594]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 6.0, 10.0, 6.0, 7.0, 9.0, 12.0, 11.0, 14.0, 7.0, 22.0, 14.0, 23.0, 29.0, 20.0, 27.0, 26.0, 42.0, 30.0, 37.0, 39.0, 45.0, 31.0, 35.0, 29.0, 38.0, 23.0, 44.0, 30.0, 33.0, 32.0, 49.0, 35.0, 20.0, 28.0, 18.0, 14.0, 18.0, 25.0, 15.0, 12.0, 10.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-35.123512268066406, -34.12685012817383, -33.13018798828125, -32.13352584838867, -31.136863708496094, -30.140201568603516, -29.143539428710938, -28.14687728881836, -27.15021514892578, -26.153553009033203, -25.156890869140625, -24.160228729248047, -23.16356658935547, -22.16690444946289, -21.170242309570312, -20.173580169677734, -19.176916122436523, -18.180253982543945, -17.183591842651367, -16.18692970275879, -15.190267562866211, -14.193605422973633, -13.196942329406738, -12.20028018951416, -11.203618049621582, -10.206955909729004, -9.210293769836426, -8.213630676269531, -7.216969013214111, -6.220306873321533, -5.223644256591797, -4.226982116699219, -3.230318069458008, -2.2336559295654297, -1.2369935512542725, -0.24033117294311523, 0.7563309669494629, 1.752993106842041, 2.7496557235717773, 3.7463178634643555, 4.742980003356934, 5.739642143249512, 6.73630428314209, 7.732966899871826, 8.729629516601562, 9.72629165649414, 10.722953796386719, 11.719615936279297, 12.716278076171875, 13.712940216064453, 14.709602355957031, 15.70626449584961, 16.702926635742188, 17.699588775634766, 18.696250915527344, 19.692913055419922, 20.6895751953125, 21.686237335205078, 22.682899475097656, 23.679561614990234, 24.676223754882812, 25.67288589477539, 26.66954803466797, 27.666210174560547, 28.662874221801758]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 10.0, 10.0, 12.0, 19.0, 18.0, 22.0, 22.0, 27.0, 25.0, 23.0, 34.0, 50.0, 36.0, 34.0, 39.0, 42.0, 66.0, 37.0, 48.0, 46.0, 34.0, 28.0, 39.0, 30.0, 28.0, 35.0, 19.0, 24.0, 19.0, 23.0, 20.0, 12.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.703125, -2.61004638671875, -2.5169677734375, -2.42388916015625, -2.330810546875, -2.23773193359375, -2.1446533203125, -2.05157470703125, -1.95849609375, -1.86541748046875, -1.7723388671875, -1.67926025390625, -1.586181640625, -1.49310302734375, -1.4000244140625, -1.30694580078125, -1.2138671875, -1.12078857421875, -1.0277099609375, -0.93463134765625, -0.841552734375, -0.74847412109375, -0.6553955078125, -0.56231689453125, -0.46923828125, -0.37615966796875, -0.2830810546875, -0.19000244140625, -0.096923828125, -0.00384521484375, 0.0892333984375, 0.18231201171875, 0.275390625, 0.36846923828125, 0.4615478515625, 0.55462646484375, 0.647705078125, 0.74078369140625, 0.8338623046875, 0.92694091796875, 1.02001953125, 1.11309814453125, 1.2061767578125, 1.29925537109375, 1.392333984375, 1.48541259765625, 1.5784912109375, 1.67156982421875, 1.7646484375, 1.85772705078125, 1.9508056640625, 2.04388427734375, 2.136962890625, 2.23004150390625, 2.3231201171875, 2.41619873046875, 2.50927734375, 2.60235595703125, 2.6954345703125, 2.78851318359375, 2.881591796875, 2.97467041015625, 3.0677490234375, 3.16082763671875, 3.25390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 14.0, 15.0, 23.0, 30.0, 52.0, 64.0, 113.0, 133.0, 196.0, 287.0, 462.0, 679.0, 1058.0, 1498.0, 2315.0, 3654.0, 5690.0, 9052.0, 14721.0, 24835.0, 41765.0, 73576.0, 141417.0, 293402.0, 199972.0, 97923.0, 54501.0, 31077.0, 18649.0, 11343.0, 7104.0, 4453.0, 2967.0, 1758.0, 1260.0, 808.0, 543.0, 360.0, 231.0, 166.0, 109.0, 95.0, 53.0, 43.0, 25.0, 18.0, 12.0, 9.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0], "bins": [-0.60888671875, -0.5908355712890625, -0.572784423828125, -0.5547332763671875, -0.53668212890625, -0.5186309814453125, -0.500579833984375, -0.4825286865234375, -0.4644775390625, -0.4464263916015625, -0.428375244140625, -0.4103240966796875, -0.39227294921875, -0.3742218017578125, -0.356170654296875, -0.3381195068359375, -0.320068359375, -0.3020172119140625, -0.283966064453125, -0.2659149169921875, -0.24786376953125, -0.2298126220703125, -0.211761474609375, -0.1937103271484375, -0.1756591796875, -0.1576080322265625, -0.139556884765625, -0.1215057373046875, -0.10345458984375, -0.0854034423828125, -0.067352294921875, -0.0493011474609375, -0.03125, -0.0131988525390625, 0.004852294921875, 0.0229034423828125, 0.04095458984375, 0.0590057373046875, 0.077056884765625, 0.0951080322265625, 0.1131591796875, 0.1312103271484375, 0.149261474609375, 0.1673126220703125, 0.18536376953125, 0.2034149169921875, 0.221466064453125, 0.2395172119140625, 0.257568359375, 0.2756195068359375, 0.293670654296875, 0.3117218017578125, 0.32977294921875, 0.3478240966796875, 0.365875244140625, 0.3839263916015625, 0.4019775390625, 0.4200286865234375, 0.438079833984375, 0.4561309814453125, 0.47418212890625, 0.4922332763671875, 0.510284423828125, 0.5283355712890625, 0.54638671875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 7.0, 13.0, 10.0, 11.0, 11.0, 6.0, 17.0, 20.0, 22.0, 21.0, 28.0, 27.0, 29.0, 48.0, 39.0, 36.0, 33.0, 34.0, 53.0, 41.0, 1065.0, 39.0, 31.0, 37.0, 29.0, 41.0, 34.0, 25.0, 21.0, 21.0, 17.0, 21.0, 19.0, 26.0, 17.0, 7.0, 3.0, 10.0, 10.0, 12.0, 4.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.71875, -1.6635589599609375, -1.608367919921875, -1.5531768798828125, -1.49798583984375, -1.4427947998046875, -1.387603759765625, -1.3324127197265625, -1.2772216796875, -1.2220306396484375, -1.166839599609375, -1.1116485595703125, -1.05645751953125, -1.0012664794921875, -0.946075439453125, -0.8908843994140625, -0.835693359375, -0.7805023193359375, -0.725311279296875, -0.6701202392578125, -0.61492919921875, -0.5597381591796875, -0.504547119140625, -0.4493560791015625, -0.3941650390625, -0.3389739990234375, -0.283782958984375, -0.2285919189453125, -0.17340087890625, -0.1182098388671875, -0.063018798828125, -0.0078277587890625, 0.04736328125, 0.1025543212890625, 0.157745361328125, 0.2129364013671875, 0.26812744140625, 0.3233184814453125, 0.378509521484375, 0.4337005615234375, 0.4888916015625, 0.5440826416015625, 0.599273681640625, 0.6544647216796875, 0.70965576171875, 0.7648468017578125, 0.820037841796875, 0.8752288818359375, 0.930419921875, 0.9856109619140625, 1.040802001953125, 1.0959930419921875, 1.15118408203125, 1.2063751220703125, 1.261566162109375, 1.3167572021484375, 1.3719482421875, 1.4271392822265625, 1.482330322265625, 1.5375213623046875, 1.59271240234375, 1.6479034423828125, 1.703094482421875, 1.7582855224609375, 1.8134765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 16.0, 18.0, 23.0, 31.0, 40.0, 61.0, 75.0, 134.0, 165.0, 257.0, 337.0, 500.0, 768.0, 1104.0, 1613.0, 2353.0, 3652.0, 5617.0, 8786.0, 14016.0, 21586.0, 35538.0, 59947.0, 109962.0, 217283.0, 1306879.0, 129964.0, 68845.0, 39267.0, 24056.0, 15183.0, 9893.0, 6430.0, 4139.0, 2755.0, 1840.0, 1223.0, 899.0, 608.0, 365.0, 263.0, 194.0, 123.0, 97.0, 70.0, 42.0, 39.0, 27.0, 11.0, 11.0, 12.0, 5.0, 2.0, 5.0, 0.0, 2.0], "bins": [-0.52783203125, -0.5118980407714844, -0.49596405029296875, -0.4800300598144531, -0.4640960693359375, -0.4481620788574219, -0.43222808837890625, -0.4162940979003906, -0.400360107421875, -0.3844261169433594, -0.36849212646484375, -0.3525581359863281, -0.3366241455078125, -0.3206901550292969, -0.30475616455078125, -0.2888221740722656, -0.27288818359375, -0.2569541931152344, -0.24102020263671875, -0.22508621215820312, -0.2091522216796875, -0.19321823120117188, -0.17728424072265625, -0.16135025024414062, -0.145416259765625, -0.12948226928710938, -0.11354827880859375, -0.09761428833007812, -0.0816802978515625, -0.06574630737304688, -0.04981231689453125, -0.033878326416015625, -0.0179443359375, -0.002010345458984375, 0.01392364501953125, 0.029857635498046875, 0.0457916259765625, 0.061725616455078125, 0.07765960693359375, 0.09359359741210938, 0.109527587890625, 0.12546157836914062, 0.14139556884765625, 0.15732955932617188, 0.1732635498046875, 0.18919754028320312, 0.20513153076171875, 0.22106552124023438, 0.23699951171875, 0.2529335021972656, 0.26886749267578125, 0.2848014831542969, 0.3007354736328125, 0.3166694641113281, 0.33260345458984375, 0.3485374450683594, 0.364471435546875, 0.3804054260253906, 0.39633941650390625, 0.4122734069824219, 0.4282073974609375, 0.4441413879394531, 0.46007537841796875, 0.4760093688964844, 0.491943359375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 3.0, 10.0, 11.0, 13.0, 11.0, 16.0, 22.0, 32.0, 43.0, 19.0, 50.0, 45.0, 59.0, 53.0, 59.0, 65.0, 64.0, 53.0, 46.0, 44.0, 40.0, 41.0, 26.0, 31.0, 22.0, 20.0, 16.0, 19.0, 14.0, 8.0, 6.0, 8.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003750324249267578, -0.00036242231726646423, -0.00034981220960617065, -0.0003372021019458771, -0.0003245919942855835, -0.0003119818866252899, -0.00029937177896499634, -0.00028676167130470276, -0.0002741515636444092, -0.0002615414559841156, -0.000248931348323822, -0.00023632124066352844, -0.00022371113300323486, -0.00021110102534294128, -0.0001984909176826477, -0.00018588081002235413, -0.00017327070236206055, -0.00016066059470176697, -0.0001480504870414734, -0.0001354403793811798, -0.00012283027172088623, -0.00011022016406059265, -9.761005640029907e-05, -8.499994874000549e-05, -7.238984107971191e-05, -5.9779733419418335e-05, -4.7169625759124756e-05, -3.455951809883118e-05, -2.1949410438537598e-05, -9.339302778244019e-06, 3.2708048820495605e-06, 1.588091254234314e-05, 2.849102020263672e-05, 4.11011278629303e-05, 5.371123552322388e-05, 6.632134318351746e-05, 7.893145084381104e-05, 9.154155850410461e-05, 0.0001041516661643982, 0.00011676177382469177, 0.00012937188148498535, 0.00014198198914527893, 0.0001545920968055725, 0.0001672022044658661, 0.00017981231212615967, 0.00019242241978645325, 0.00020503252744674683, 0.0002176426351070404, 0.00023025274276733398, 0.00024286285042762756, 0.00025547295808792114, 0.0002680830657482147, 0.0002806931734085083, 0.0002933032810688019, 0.00030591338872909546, 0.00031852349638938904, 0.0003311336040496826, 0.0003437437117099762, 0.0003563538193702698, 0.00036896392703056335, 0.00038157403469085693, 0.0003941841423511505, 0.0004067942500114441, 0.00041940435767173767, 0.00043201446533203125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 8.0, 6.0, 14.0, 9.0, 19.0, 27.0, 21.0, 32.0, 31.0, 41.0, 55.0, 74.0, 87.0, 136.0, 139.0, 224.0, 276.0, 429.0, 641.0, 1682.0, 740219.0, 301040.0, 1208.0, 556.0, 402.0, 285.0, 199.0, 170.0, 90.0, 93.0, 59.0, 60.0, 36.0, 52.0, 37.0, 25.0, 20.0, 14.0, 7.0, 3.0, 2.0, 6.0, 8.0, 1.0, 1.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.006404876708984375, -0.006190836429595947, -0.0059767961502075195, -0.005762755870819092, -0.005548715591430664, -0.005334675312042236, -0.005120635032653809, -0.004906594753265381, -0.004692554473876953, -0.004478514194488525, -0.004264473915100098, -0.00405043363571167, -0.003836393356323242, -0.0036223530769348145, -0.0034083127975463867, -0.003194272518157959, -0.0029802322387695312, -0.0027661919593811035, -0.0025521516799926758, -0.002338111400604248, -0.0021240711212158203, -0.0019100308418273926, -0.0016959905624389648, -0.0014819502830505371, -0.0012679100036621094, -0.0010538697242736816, -0.0008398294448852539, -0.0006257891654968262, -0.00041174888610839844, -0.0001977086067199707, 1.633167266845703e-05, 0.00023037195205688477, 0.0004444122314453125, 0.0006584525108337402, 0.000872492790222168, 0.0010865330696105957, 0.0013005733489990234, 0.0015146136283874512, 0.001728653907775879, 0.0019426941871643066, 0.0021567344665527344, 0.002370774745941162, 0.00258481502532959, 0.0027988553047180176, 0.0030128955841064453, 0.003226935863494873, 0.0034409761428833008, 0.0036550164222717285, 0.0038690567016601562, 0.004083096981048584, 0.004297137260437012, 0.0045111775398254395, 0.004725217819213867, 0.004939258098602295, 0.005153298377990723, 0.00536733865737915, 0.005581378936767578, 0.005795419216156006, 0.006009459495544434, 0.006223499774932861, 0.006437540054321289, 0.006651580333709717, 0.0068656206130981445, 0.007079660892486572, 0.007293701171875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 14.0, 109.0, 338.0, 352.0, 153.0, 40.0, 7.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008666588691994548, -0.0008439445518888533, -0.0008212301763705909, -0.0007985158590599895, -0.0007758014835417271, -0.0007530871662311256, -0.0007303728489205241, -0.0007076584734022617, -0.0006849440978839993, -0.0006622297805733979, -0.0006395154050551355, -0.000616801087744534, -0.0005940867122262716, -0.0005713723949156702, -0.0005486580776050687, -0.0005259437020868063, -0.0005032293847762048, -0.0004805150383617729, -0.00045780069194734097, -0.0004350863746367395, -0.0004123719991184771, -0.00038965768180787563, -0.0003669433353934437, -0.0003442289889790118, -0.00032151464256457984, -0.0002988002961501479, -0.000276085949735716, -0.00025337160332128406, -0.00023065727145876735, -0.00020794292504433542, -0.00018522859318181872, -0.0001625142467673868, -0.00013979995856061578, -0.00011708561214618385, -9.437127300770953e-05, -7.165693386923522e-05, -4.894258745480329e-05, -2.622824104037136e-05, -3.513909177854657e-06, 1.9200437236577272e-05, 4.19147836510092e-05, 6.462913006544113e-05, 8.734346920391545e-05, 0.00011005780834238976, 0.0001327721547568217, 0.00015548650117125362, 0.00017820083303377032, 0.00020091517944820225, 0.00022362952586263418, 0.0002463438722770661, 0.00026905821869149804, 0.0002917725360020995, 0.0003144869115203619, 0.0003372012288309634, 0.0003599155752453953, 0.00038262992165982723, 0.00040534426807425916, 0.0004280586144886911, 0.000450772960903123, 0.00047348730731755495, 0.0004962016246281564, 0.0005189160001464188, 0.0005416303174570203, 0.0005643446929752827, 0.0005870590102858841]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 12.0, 10.0, 11.0, 16.0, 16.0, 19.0, 22.0, 23.0, 29.0, 34.0, 35.0, 31.0, 42.0, 34.0, 32.0, 39.0, 37.0, 45.0, 36.0, 46.0, 40.0, 34.0, 48.0, 35.0, 34.0, 28.0, 29.0, 24.0, 23.0, 17.0, 12.0, 17.0, 16.0, 13.0, 8.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0002161264419555664, -0.00020975247025489807, -0.00020337849855422974, -0.0001970045268535614, -0.00019063055515289307, -0.00018425658345222473, -0.0001778826117515564, -0.00017150864005088806, -0.00016513466835021973, -0.0001587606966495514, -0.00015238672494888306, -0.00014601275324821472, -0.0001396387815475464, -0.00013326480984687805, -0.00012689083814620972, -0.00012051686644554138, -0.00011414289474487305, -0.00010776892304420471, -0.00010139495134353638, -9.502097964286804e-05, -8.864700794219971e-05, -8.227303624153137e-05, -7.589906454086304e-05, -6.95250928401947e-05, -6.315112113952637e-05, -5.677714943885803e-05, -5.04031777381897e-05, -4.402920603752136e-05, -3.765523433685303e-05, -3.128126263618469e-05, -2.4907290935516357e-05, -1.8533319234848022e-05, -1.2159347534179688e-05, -5.7853758335113525e-06, 5.885958671569824e-07, 6.962567567825317e-06, 1.3336539268493652e-05, 1.9710510969161987e-05, 2.6084482669830322e-05, 3.245845437049866e-05, 3.883242607116699e-05, 4.520639777183533e-05, 5.158036947250366e-05, 5.7954341173172e-05, 6.432831287384033e-05, 7.070228457450867e-05, 7.7076256275177e-05, 8.345022797584534e-05, 8.982419967651367e-05, 9.619817137718201e-05, 0.00010257214307785034, 0.00010894611477851868, 0.00011532008647918701, 0.00012169405817985535, 0.00012806802988052368, 0.00013444200158119202, 0.00014081597328186035, 0.0001471899449825287, 0.00015356391668319702, 0.00015993788838386536, 0.0001663118600845337, 0.00017268583178520203, 0.00017905980348587036, 0.0001854337751865387, 0.00019180774688720703]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 10.0, 10.0, 12.0, 19.0, 18.0, 22.0, 22.0, 27.0, 25.0, 23.0, 34.0, 50.0, 36.0, 34.0, 39.0, 42.0, 66.0, 37.0, 48.0, 46.0, 34.0, 28.0, 39.0, 30.0, 28.0, 35.0, 19.0, 24.0, 19.0, 23.0, 20.0, 12.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.703125, -2.61004638671875, -2.5169677734375, -2.42388916015625, -2.330810546875, -2.23773193359375, -2.1446533203125, -2.05157470703125, -1.95849609375, -1.86541748046875, -1.7723388671875, -1.67926025390625, -1.586181640625, -1.49310302734375, -1.4000244140625, -1.30694580078125, -1.2138671875, -1.12078857421875, -1.0277099609375, -0.93463134765625, -0.841552734375, -0.74847412109375, -0.6553955078125, -0.56231689453125, -0.46923828125, -0.37615966796875, -0.2830810546875, -0.19000244140625, -0.096923828125, -0.00384521484375, 0.0892333984375, 0.18231201171875, 0.275390625, 0.36846923828125, 0.4615478515625, 0.55462646484375, 0.647705078125, 0.74078369140625, 0.8338623046875, 0.92694091796875, 1.02001953125, 1.11309814453125, 1.2061767578125, 1.29925537109375, 1.392333984375, 1.48541259765625, 1.5784912109375, 1.67156982421875, 1.7646484375, 1.85772705078125, 1.9508056640625, 2.04388427734375, 2.136962890625, 2.23004150390625, 2.3231201171875, 2.41619873046875, 2.50927734375, 2.60235595703125, 2.6954345703125, 2.78851318359375, 2.881591796875, 2.97467041015625, 3.0677490234375, 3.16082763671875, 3.25390625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 15.0, 7.0, 6.0, 15.0, 22.0, 27.0, 42.0, 49.0, 77.0, 80.0, 118.0, 158.0, 216.0, 287.0, 391.0, 525.0, 690.0, 959.0, 1416.0, 1998.0, 2914.0, 4560.0, 8134.0, 18683.0, 74228.0, 524615.0, 328589.0, 45808.0, 14245.0, 6803.0, 3938.0, 2528.0, 1769.0, 1258.0, 875.0, 686.0, 433.0, 372.0, 259.0, 207.0, 137.0, 104.0, 73.0, 59.0, 49.0, 34.0, 30.0, 23.0, 16.0, 9.0, 7.0, 9.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0], "bins": [-12.0859375, -11.70654296875, -11.3271484375, -10.94775390625, -10.568359375, -10.18896484375, -9.8095703125, -9.43017578125, -9.05078125, -8.67138671875, -8.2919921875, -7.91259765625, -7.533203125, -7.15380859375, -6.7744140625, -6.39501953125, -6.015625, -5.63623046875, -5.2568359375, -4.87744140625, -4.498046875, -4.11865234375, -3.7392578125, -3.35986328125, -2.98046875, -2.60107421875, -2.2216796875, -1.84228515625, -1.462890625, -1.08349609375, -0.7041015625, -0.32470703125, 0.0546875, 0.43408203125, 0.8134765625, 1.19287109375, 1.572265625, 1.95166015625, 2.3310546875, 2.71044921875, 3.08984375, 3.46923828125, 3.8486328125, 4.22802734375, 4.607421875, 4.98681640625, 5.3662109375, 5.74560546875, 6.125, 6.50439453125, 6.8837890625, 7.26318359375, 7.642578125, 8.02197265625, 8.4013671875, 8.78076171875, 9.16015625, 9.53955078125, 9.9189453125, 10.29833984375, 10.677734375, 11.05712890625, 11.4365234375, 11.81591796875, 12.1953125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 8.0, 4.0, 8.0, 8.0, 15.0, 6.0, 15.0, 19.0, 17.0, 17.0, 12.0, 29.0, 31.0, 26.0, 27.0, 28.0, 42.0, 51.0, 79.0, 126.0, 216.0, 1334.0, 254.0, 169.0, 81.0, 69.0, 54.0, 44.0, 33.0, 34.0, 25.0, 32.0, 17.0, 25.0, 16.0, 14.0, 12.0, 8.0, 10.0, 8.0, 3.0, 4.0, 8.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-10.0078125, -9.73602294921875, -9.4642333984375, -9.19244384765625, -8.920654296875, -8.64886474609375, -8.3770751953125, -8.10528564453125, -7.83349609375, -7.56170654296875, -7.2899169921875, -7.01812744140625, -6.746337890625, -6.47454833984375, -6.2027587890625, -5.93096923828125, -5.6591796875, -5.38739013671875, -5.1156005859375, -4.84381103515625, -4.572021484375, -4.30023193359375, -4.0284423828125, -3.75665283203125, -3.48486328125, -3.21307373046875, -2.9412841796875, -2.66949462890625, -2.397705078125, -2.12591552734375, -1.8541259765625, -1.58233642578125, -1.310546875, -1.03875732421875, -0.7669677734375, -0.49517822265625, -0.223388671875, 0.04840087890625, 0.3201904296875, 0.59197998046875, 0.86376953125, 1.13555908203125, 1.4073486328125, 1.67913818359375, 1.950927734375, 2.22271728515625, 2.4945068359375, 2.76629638671875, 3.0380859375, 3.30987548828125, 3.5816650390625, 3.85345458984375, 4.125244140625, 4.39703369140625, 4.6688232421875, 4.94061279296875, 5.21240234375, 5.48419189453125, 5.7559814453125, 6.02777099609375, 6.299560546875, 6.57135009765625, 6.8431396484375, 7.11492919921875, 7.38671875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 1.0, 11.0, 12.0, 9.0, 20.0, 29.0, 21.0, 24.0, 27.0, 40.0, 46.0, 74.0, 145.0, 273.0, 705.0, 3459.0, 1715582.0, 1420627.0, 3054.0, 738.0, 287.0, 121.0, 79.0, 51.0, 33.0, 36.0, 29.0, 22.0, 31.0, 17.0, 14.0, 12.0, 10.0, 12.0, 6.0, 4.0, 7.0, 7.0, 2.0, 3.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.515625, -29.385009765625, -28.25439453125, -27.123779296875, -25.9931640625, -24.862548828125, -23.73193359375, -22.601318359375, -21.470703125, -20.340087890625, -19.20947265625, -18.078857421875, -16.9482421875, -15.817626953125, -14.68701171875, -13.556396484375, -12.42578125, -11.295166015625, -10.16455078125, -9.033935546875, -7.9033203125, -6.772705078125, -5.64208984375, -4.511474609375, -3.380859375, -2.250244140625, -1.11962890625, 0.010986328125, 1.1416015625, 2.272216796875, 3.40283203125, 4.533447265625, 5.6640625, 6.794677734375, 7.92529296875, 9.055908203125, 10.1865234375, 11.317138671875, 12.44775390625, 13.578369140625, 14.708984375, 15.839599609375, 16.97021484375, 18.100830078125, 19.2314453125, 20.362060546875, 21.49267578125, 22.623291015625, 23.75390625, 24.884521484375, 26.01513671875, 27.145751953125, 28.2763671875, 29.406982421875, 30.53759765625, 31.668212890625, 32.798828125, 33.929443359375, 35.06005859375, 36.190673828125, 37.3212890625, 38.451904296875, 39.58251953125, 40.713134765625, 41.84375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 995.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.60826110839844, -154.34991455078125, -143.09158325195312, -131.83323669433594, -120.57490539550781, -109.31655883789062, -98.05821990966797, -86.79988098144531, -75.54154205322266, -64.283203125, -53.024864196777344, -41.76652145385742, -30.508182525634766, -19.24984359741211, -7.9915008544921875, 3.2668380737304688, 14.525177001953125, 25.78351593017578, 37.04185485839844, 48.30019760131836, 59.558536529541016, 70.81687927246094, 82.0752182006836, 93.33355712890625, 104.5918960571289, 115.85023498535156, 127.10857391357422, 138.36691284179688, 149.62525939941406, 160.8835906982422, 172.14193725585938, 183.4002685546875, 194.65859985351562, 205.9169464111328, 217.17527770996094, 228.43362426757812, 239.69195556640625, 250.95030212402344, 262.2086486816406, 273.46697998046875, 284.7253112792969, 295.983642578125, 307.24200439453125, 318.5003356933594, 329.7586669921875, 341.0169982910156, 352.2753601074219, 363.53369140625, 374.79205322265625, 386.0503845214844, 397.3087463378906, 408.56707763671875, 419.8254089355469, 431.083740234375, 442.34210205078125, 453.6004333496094, 464.8587646484375, 476.1170959472656, 487.3754577636719, 498.6337890625, 509.8921203613281, 521.1504516601562, 532.4088134765625, 543.6671142578125, 554.9254760742188]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 9.0, 6.0, 6.0, 13.0, 12.0, 15.0, 22.0, 21.0, 23.0, 25.0, 16.0, 26.0, 27.0, 32.0, 41.0, 23.0, 42.0, 40.0, 51.0, 31.0, 37.0, 46.0, 48.0, 36.0, 36.0, 38.0, 39.0, 34.0, 29.0, 15.0, 25.0, 24.0, 13.0, 14.0, 13.0, 13.0, 15.0, 11.0, 6.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.403093338012695, -29.32271385192871, -28.242334365844727, -27.161954879760742, -26.081575393676758, -25.001195907592773, -23.92081642150879, -22.840436935424805, -21.76005744934082, -20.679677963256836, -19.59929847717285, -18.518918991088867, -17.438539505004883, -16.3581600189209, -15.277780532836914, -14.19740104675293, -13.117021560668945, -12.036642074584961, -10.956262588500977, -9.875883102416992, -8.795503616333008, -7.715124130249023, -6.634744644165039, -5.554365158081055, -4.47398567199707, -3.393606185913086, -2.3132266998291016, -1.2328472137451172, -0.1524677276611328, 0.9279117584228516, 2.008291244506836, 3.0886707305908203, 4.1690521240234375, 5.249431610107422, 6.329811096191406, 7.410190582275391, 8.490570068359375, 9.57094955444336, 10.651329040527344, 11.731708526611328, 12.812088012695312, 13.892467498779297, 14.972846984863281, 16.053226470947266, 17.13360595703125, 18.213985443115234, 19.29436492919922, 20.374744415283203, 21.455123901367188, 22.535503387451172, 23.615882873535156, 24.69626235961914, 25.776641845703125, 26.85702133178711, 27.937400817871094, 29.017780303955078, 30.098159790039062, 31.178539276123047, 32.25891876220703, 33.339298248291016, 34.419677734375, 35.500057220458984, 36.58043670654297, 37.66081619262695, 38.74119567871094]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 6.0, 4.0, 6.0, 9.0, 7.0, 19.0, 14.0, 19.0, 19.0, 31.0, 27.0, 20.0, 35.0, 38.0, 36.0, 41.0, 51.0, 43.0, 45.0, 55.0, 40.0, 31.0, 50.0, 35.0, 33.0, 36.0, 33.0, 43.0, 19.0, 26.0, 20.0, 23.0, 16.0, 15.0, 5.0, 14.0, 8.0, 1.0, 6.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.98828125, -2.883819580078125, -2.77935791015625, -2.674896240234375, -2.5704345703125, -2.465972900390625, -2.36151123046875, -2.257049560546875, -2.152587890625, -2.048126220703125, -1.94366455078125, -1.839202880859375, -1.7347412109375, -1.630279541015625, -1.52581787109375, -1.421356201171875, -1.31689453125, -1.212432861328125, -1.10797119140625, -1.003509521484375, -0.8990478515625, -0.794586181640625, -0.69012451171875, -0.585662841796875, -0.481201171875, -0.376739501953125, -0.27227783203125, -0.167816162109375, -0.0633544921875, 0.041107177734375, 0.14556884765625, 0.250030517578125, 0.3544921875, 0.458953857421875, 0.56341552734375, 0.667877197265625, 0.7723388671875, 0.876800537109375, 0.98126220703125, 1.085723876953125, 1.190185546875, 1.294647216796875, 1.39910888671875, 1.503570556640625, 1.6080322265625, 1.712493896484375, 1.81695556640625, 1.921417236328125, 2.02587890625, 2.130340576171875, 2.23480224609375, 2.339263916015625, 2.4437255859375, 2.548187255859375, 2.65264892578125, 2.757110595703125, 2.861572265625, 2.966033935546875, 3.07049560546875, 3.174957275390625, 3.2794189453125, 3.383880615234375, 3.48834228515625, 3.592803955078125, 3.697265625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 8.0, 14.0, 20.0, 22.0, 24.0, 25.0, 36.0, 62.0, 85.0, 113.0, 152.0, 223.0, 379.0, 545.0, 939.0, 1706.0, 3381.0, 7613.0, 20143.0, 80579.0, 767996.0, 2834246.0, 392817.0, 54125.0, 15548.0, 6358.0, 2947.0, 1597.0, 865.0, 552.0, 338.0, 223.0, 161.0, 120.0, 76.0, 59.0, 38.0, 41.0, 24.0, 15.0, 16.0, 10.0, 15.0, 5.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-12.7890625, -12.39404296875, -11.9990234375, -11.60400390625, -11.208984375, -10.81396484375, -10.4189453125, -10.02392578125, -9.62890625, -9.23388671875, -8.8388671875, -8.44384765625, -8.048828125, -7.65380859375, -7.2587890625, -6.86376953125, -6.46875, -6.07373046875, -5.6787109375, -5.28369140625, -4.888671875, -4.49365234375, -4.0986328125, -3.70361328125, -3.30859375, -2.91357421875, -2.5185546875, -2.12353515625, -1.728515625, -1.33349609375, -0.9384765625, -0.54345703125, -0.1484375, 0.24658203125, 0.6416015625, 1.03662109375, 1.431640625, 1.82666015625, 2.2216796875, 2.61669921875, 3.01171875, 3.40673828125, 3.8017578125, 4.19677734375, 4.591796875, 4.98681640625, 5.3818359375, 5.77685546875, 6.171875, 6.56689453125, 6.9619140625, 7.35693359375, 7.751953125, 8.14697265625, 8.5419921875, 8.93701171875, 9.33203125, 9.72705078125, 10.1220703125, 10.51708984375, 10.912109375, 11.30712890625, 11.7021484375, 12.09716796875, 12.4921875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 10.0, 17.0, 19.0, 34.0, 38.0, 53.0, 92.0, 115.0, 157.0, 254.0, 329.0, 441.0, 575.0, 510.0, 425.0, 325.0, 223.0, 112.0, 107.0, 82.0, 47.0, 34.0, 21.0, 15.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.4375, -17.96337890625, -17.4892578125, -17.01513671875, -16.541015625, -16.06689453125, -15.5927734375, -15.11865234375, -14.64453125, -14.17041015625, -13.6962890625, -13.22216796875, -12.748046875, -12.27392578125, -11.7998046875, -11.32568359375, -10.8515625, -10.37744140625, -9.9033203125, -9.42919921875, -8.955078125, -8.48095703125, -8.0068359375, -7.53271484375, -7.05859375, -6.58447265625, -6.1103515625, -5.63623046875, -5.162109375, -4.68798828125, -4.2138671875, -3.73974609375, -3.265625, -2.79150390625, -2.3173828125, -1.84326171875, -1.369140625, -0.89501953125, -0.4208984375, 0.05322265625, 0.52734375, 1.00146484375, 1.4755859375, 1.94970703125, 2.423828125, 2.89794921875, 3.3720703125, 3.84619140625, 4.3203125, 4.79443359375, 5.2685546875, 5.74267578125, 6.216796875, 6.69091796875, 7.1650390625, 7.63916015625, 8.11328125, 8.58740234375, 9.0615234375, 9.53564453125, 10.009765625, 10.48388671875, 10.9580078125, 11.43212890625, 11.90625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 8.0, 2.0, 5.0, 10.0, 18.0, 11.0, 15.0, 36.0, 28.0, 48.0, 57.0, 84.0, 135.0, 223.0, 462.0, 1715.0, 30783.0, 3972984.0, 183463.0, 2806.0, 617.0, 275.0, 167.0, 91.0, 78.0, 46.0, 39.0, 22.0, 13.0, 10.0, 13.0, 3.0, 5.0, 6.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -33.919921875, -32.27734375, -30.634765625, -28.9921875, -27.349609375, -25.70703125, -24.064453125, -22.421875, -20.779296875, -19.13671875, -17.494140625, -15.8515625, -14.208984375, -12.56640625, -10.923828125, -9.28125, -7.638671875, -5.99609375, -4.353515625, -2.7109375, -1.068359375, 0.57421875, 2.216796875, 3.859375, 5.501953125, 7.14453125, 8.787109375, 10.4296875, 12.072265625, 13.71484375, 15.357421875, 17.0, 18.642578125, 20.28515625, 21.927734375, 23.5703125, 25.212890625, 26.85546875, 28.498046875, 30.140625, 31.783203125, 33.42578125, 35.068359375, 36.7109375, 38.353515625, 39.99609375, 41.638671875, 43.28125, 44.923828125, 46.56640625, 48.208984375, 49.8515625, 51.494140625, 53.13671875, 54.779296875, 56.421875, 58.064453125, 59.70703125, 61.349609375, 62.9921875, 64.634765625, 66.27734375, 67.919921875, 69.5625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 212.0, 719.0, 81.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.40779876708984, -74.5325927734375, -65.65739440917969, -56.78219223022461, -47.90699005126953, -39.03178787231445, -30.156585693359375, -21.281383514404297, -12.406181335449219, -3.5309791564941406, 5.3442230224609375, 14.219425201416016, 23.094627380371094, 31.969829559326172, 40.84503173828125, 49.72023391723633, 58.595436096191406, 67.47064208984375, 76.34584045410156, 85.22103881835938, 94.09624481201172, 102.97145080566406, 111.84664916992188, 120.72184753417969, 129.5970458984375, 138.4722442626953, 147.34744262695312, 156.22265625, 165.0978546142578, 173.97305297851562, 182.8482666015625, 191.7234649658203, 200.59866333007812, 209.47386169433594, 218.34906005859375, 227.22427368164062, 236.09947204589844, 244.97467041015625, 253.84988403320312, 262.7250671386719, 271.60028076171875, 280.4754943847656, 289.3506774902344, 298.22589111328125, 307.10107421875, 315.9762878417969, 324.85150146484375, 333.7266845703125, 342.6018981933594, 351.47711181640625, 360.352294921875, 369.2275085449219, 378.10272216796875, 386.9779052734375, 395.8531188964844, 404.7283020019531, 413.603515625, 422.4787292480469, 431.3539123535156, 440.2291259765625, 449.10430908203125, 457.9795227050781, 466.854736328125, 475.72991943359375, 484.6051330566406]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 1.0, 6.0, 10.0, 12.0, 14.0, 7.0, 14.0, 17.0, 18.0, 22.0, 24.0, 24.0, 27.0, 35.0, 36.0, 36.0, 39.0, 45.0, 37.0, 31.0, 37.0, 41.0, 26.0, 29.0, 37.0, 44.0, 43.0, 28.0, 28.0, 30.0, 31.0, 22.0, 21.0, 20.0, 22.0, 12.0, 12.0, 13.0, 6.0, 11.0, 6.0, 7.0, 7.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.00556182861328, -37.77153396606445, -36.53750228881836, -35.30347442626953, -34.06944274902344, -32.83541488647461, -31.60138511657715, -30.367355346679688, -29.133325576782227, -27.899295806884766, -26.665266036987305, -25.431236267089844, -24.197208404541016, -22.963176727294922, -21.729148864746094, -20.495119094848633, -19.261089324951172, -18.02705955505371, -16.79302978515625, -15.559000968933105, -14.324971199035645, -13.090941429138184, -11.856912612915039, -10.622882843017578, -9.388853073120117, -8.154823303222656, -6.9207940101623535, -5.686764717102051, -4.45273494720459, -3.218705177307129, -1.9846758842468262, -0.7506465911865234, 0.4833831787109375, 1.7174127101898193, 2.951442241668701, 4.185471534729004, 5.419501304626465, 6.653531074523926, 7.8875603675842285, 9.121589660644531, 10.355619430541992, 11.589649200439453, 12.823678970336914, 14.057707786560059, 15.29173755645752, 16.525768280029297, 17.759796142578125, 18.993825912475586, 20.227855682373047, 21.461885452270508, 22.69591522216797, 23.92994499206543, 25.16397476196289, 26.39800262451172, 27.63203239440918, 28.86606216430664, 30.1000919342041, 31.334121704101562, 32.56814956665039, 33.802181243896484, 35.03620910644531, 36.270240783691406, 37.504268646240234, 38.73829650878906, 39.972328186035156]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 7.0, 10.0, 13.0, 16.0, 17.0, 14.0, 18.0, 33.0, 18.0, 20.0, 31.0, 29.0, 22.0, 35.0, 45.0, 50.0, 40.0, 45.0, 42.0, 36.0, 41.0, 24.0, 34.0, 23.0, 35.0, 28.0, 36.0, 29.0, 32.0, 22.0, 15.0, 24.0, 12.0, 13.0, 9.0, 12.0, 9.0, 10.0, 7.0, 5.0, 3.0, 0.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.115234375, -3.020172119140625, -2.92510986328125, -2.830047607421875, -2.7349853515625, -2.639923095703125, -2.54486083984375, -2.449798583984375, -2.354736328125, -2.259674072265625, -2.16461181640625, -2.069549560546875, -1.9744873046875, -1.879425048828125, -1.78436279296875, -1.689300537109375, -1.59423828125, -1.499176025390625, -1.40411376953125, -1.309051513671875, -1.2139892578125, -1.118927001953125, -1.02386474609375, -0.928802490234375, -0.833740234375, -0.738677978515625, -0.64361572265625, -0.548553466796875, -0.4534912109375, -0.358428955078125, -0.26336669921875, -0.168304443359375, -0.0732421875, 0.021820068359375, 0.11688232421875, 0.211944580078125, 0.3070068359375, 0.402069091796875, 0.49713134765625, 0.592193603515625, 0.687255859375, 0.782318115234375, 0.87738037109375, 0.972442626953125, 1.0675048828125, 1.162567138671875, 1.25762939453125, 1.352691650390625, 1.44775390625, 1.542816162109375, 1.63787841796875, 1.732940673828125, 1.8280029296875, 1.923065185546875, 2.01812744140625, 2.113189697265625, 2.208251953125, 2.303314208984375, 2.39837646484375, 2.493438720703125, 2.5885009765625, 2.683563232421875, 2.77862548828125, 2.873687744140625, 2.96875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 6.0, 11.0, 23.0, 24.0, 39.0, 60.0, 61.0, 90.0, 144.0, 177.0, 305.0, 364.0, 604.0, 820.0, 1177.0, 1616.0, 2455.0, 3547.0, 5150.0, 7467.0, 11074.0, 16508.0, 24536.0, 37284.0, 60119.0, 101381.0, 196629.0, 246265.0, 126017.0, 72019.0, 44424.0, 28772.0, 19034.0, 12721.0, 8665.0, 5893.0, 3987.0, 2762.0, 1908.0, 1372.0, 913.0, 657.0, 431.0, 342.0, 207.0, 156.0, 105.0, 73.0, 51.0, 29.0, 30.0, 21.0, 16.0, 11.0, 4.0, 4.0, 2.0, 3.0], "bins": [-0.57568359375, -0.5583343505859375, -0.540985107421875, -0.5236358642578125, -0.50628662109375, -0.4889373779296875, -0.471588134765625, -0.4542388916015625, -0.4368896484375, -0.4195404052734375, -0.402191162109375, -0.3848419189453125, -0.36749267578125, -0.3501434326171875, -0.332794189453125, -0.3154449462890625, -0.298095703125, -0.2807464599609375, -0.263397216796875, -0.2460479736328125, -0.22869873046875, -0.2113494873046875, -0.194000244140625, -0.1766510009765625, -0.1593017578125, -0.1419525146484375, -0.124603271484375, -0.1072540283203125, -0.08990478515625, -0.0725555419921875, -0.055206298828125, -0.0378570556640625, -0.0205078125, -0.0031585693359375, 0.014190673828125, 0.0315399169921875, 0.04888916015625, 0.0662384033203125, 0.083587646484375, 0.1009368896484375, 0.1182861328125, 0.1356353759765625, 0.152984619140625, 0.1703338623046875, 0.18768310546875, 0.2050323486328125, 0.222381591796875, 0.2397308349609375, 0.257080078125, 0.2744293212890625, 0.291778564453125, 0.3091278076171875, 0.32647705078125, 0.3438262939453125, 0.361175537109375, 0.3785247802734375, 0.3958740234375, 0.4132232666015625, 0.430572509765625, 0.4479217529296875, 0.46527099609375, 0.4826202392578125, 0.499969482421875, 0.5173187255859375, 0.53466796875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 8.0, 11.0, 9.0, 9.0, 12.0, 17.0, 18.0, 26.0, 12.0, 22.0, 26.0, 32.0, 32.0, 31.0, 32.0, 37.0, 36.0, 45.0, 43.0, 1069.0, 34.0, 46.0, 35.0, 32.0, 40.0, 44.0, 20.0, 30.0, 25.0, 29.0, 24.0, 22.0, 18.0, 21.0, 11.0, 13.0, 11.0, 8.0, 9.0, 7.0, 7.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.115234375, -2.048980712890625, -1.98272705078125, -1.916473388671875, -1.8502197265625, -1.783966064453125, -1.71771240234375, -1.651458740234375, -1.585205078125, -1.518951416015625, -1.45269775390625, -1.386444091796875, -1.3201904296875, -1.253936767578125, -1.18768310546875, -1.121429443359375, -1.05517578125, -0.988922119140625, -0.92266845703125, -0.856414794921875, -0.7901611328125, -0.723907470703125, -0.65765380859375, -0.591400146484375, -0.525146484375, -0.458892822265625, -0.39263916015625, -0.326385498046875, -0.2601318359375, -0.193878173828125, -0.12762451171875, -0.061370849609375, 0.0048828125, 0.071136474609375, 0.13739013671875, 0.203643798828125, 0.2698974609375, 0.336151123046875, 0.40240478515625, 0.468658447265625, 0.534912109375, 0.601165771484375, 0.66741943359375, 0.733673095703125, 0.7999267578125, 0.866180419921875, 0.93243408203125, 0.998687744140625, 1.06494140625, 1.131195068359375, 1.19744873046875, 1.263702392578125, 1.3299560546875, 1.396209716796875, 1.46246337890625, 1.528717041015625, 1.594970703125, 1.661224365234375, 1.72747802734375, 1.793731689453125, 1.8599853515625, 1.926239013671875, 1.99249267578125, 2.058746337890625, 2.125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 12.0, 14.0, 20.0, 36.0, 43.0, 57.0, 97.0, 103.0, 161.0, 238.0, 297.0, 508.0, 679.0, 1033.0, 1518.0, 2183.0, 3437.0, 5009.0, 7887.0, 12434.0, 19109.0, 31127.0, 50550.0, 87443.0, 171097.0, 1331590.0, 158034.0, 82435.0, 47741.0, 29323.0, 18852.0, 11526.0, 7760.0, 4825.0, 3181.0, 2178.0, 1412.0, 982.0, 652.0, 463.0, 332.0, 232.0, 154.0, 105.0, 64.0, 59.0, 43.0, 32.0, 20.0, 15.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.56982421875, -0.5517044067382812, -0.5335845947265625, -0.5154647827148438, -0.497344970703125, -0.47922515869140625, -0.4611053466796875, -0.44298553466796875, -0.42486572265625, -0.40674591064453125, -0.3886260986328125, -0.37050628662109375, -0.352386474609375, -0.33426666259765625, -0.3161468505859375, -0.29802703857421875, -0.2799072265625, -0.26178741455078125, -0.2436676025390625, -0.22554779052734375, -0.207427978515625, -0.18930816650390625, -0.1711883544921875, -0.15306854248046875, -0.13494873046875, -0.11682891845703125, -0.0987091064453125, -0.08058929443359375, -0.062469482421875, -0.04434967041015625, -0.0262298583984375, -0.00811004638671875, 0.010009765625, 0.02812957763671875, 0.0462493896484375, 0.06436920166015625, 0.082489013671875, 0.10060882568359375, 0.1187286376953125, 0.13684844970703125, 0.15496826171875, 0.17308807373046875, 0.1912078857421875, 0.20932769775390625, 0.227447509765625, 0.24556732177734375, 0.2636871337890625, 0.28180694580078125, 0.2999267578125, 0.31804656982421875, 0.3361663818359375, 0.35428619384765625, 0.372406005859375, 0.39052581787109375, 0.4086456298828125, 0.42676544189453125, 0.44488525390625, 0.46300506591796875, 0.4811248779296875, 0.49924468994140625, 0.517364501953125, 0.5354843139648438, 0.5536041259765625, 0.5717239379882812, 0.58984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 2.0, 7.0, 3.0, 10.0, 10.0, 7.0, 23.0, 13.0, 19.0, 17.0, 17.0, 32.0, 22.0, 41.0, 41.0, 52.0, 57.0, 67.0, 57.0, 70.0, 61.0, 58.0, 38.0, 48.0, 36.0, 30.0, 23.0, 28.0, 17.0, 11.0, 15.0, 11.0, 10.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004892349243164062, -0.00047062337398529053, -0.0004520118236541748, -0.0004334002733230591, -0.00041478872299194336, -0.00039617717266082764, -0.0003775656223297119, -0.0003589540719985962, -0.00034034252166748047, -0.00032173097133636475, -0.000303119421005249, -0.0002845078706741333, -0.0002658963203430176, -0.00024728477001190186, -0.00022867321968078613, -0.0002100616693496704, -0.0001914501190185547, -0.00017283856868743896, -0.00015422701835632324, -0.00013561546802520752, -0.0001170039176940918, -9.839236736297607e-05, -7.978081703186035e-05, -6.116926670074463e-05, -4.2557716369628906e-05, -2.3946166038513184e-05, -5.334615707397461e-06, 1.3276934623718262e-05, 3.1888484954833984e-05, 5.050003528594971e-05, 6.911158561706543e-05, 8.772313594818115e-05, 0.00010633468627929688, 0.0001249462366104126, 0.00014355778694152832, 0.00016216933727264404, 0.00018078088760375977, 0.0001993924379348755, 0.0002180039882659912, 0.00023661553859710693, 0.00025522708892822266, 0.0002738386392593384, 0.0002924501895904541, 0.0003110617399215698, 0.00032967329025268555, 0.00034828484058380127, 0.000366896390914917, 0.0003855079412460327, 0.00040411949157714844, 0.00042273104190826416, 0.0004413425922393799, 0.0004599541425704956, 0.00047856569290161133, 0.000497177243232727, 0.0005157887935638428, 0.0005344003438949585, 0.0005530118942260742, 0.0005716234445571899, 0.0005902349948883057, 0.0006088465452194214, 0.0006274580955505371, 0.0006460696458816528, 0.0006646811962127686, 0.0006832927465438843, 0.000701904296875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 2.0, 10.0, 8.0, 18.0, 16.0, 16.0, 21.0, 23.0, 61.0, 51.0, 79.0, 98.0, 107.0, 175.0, 289.0, 534.0, 1547.0, 982296.0, 61093.0, 845.0, 421.0, 245.0, 125.0, 118.0, 55.0, 69.0, 46.0, 28.0, 19.0, 24.0, 31.0, 16.0, 10.0, 15.0, 9.0, 6.0, 2.0, 5.0, 5.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.01442718505859375, -0.014024138450622559, -0.013621091842651367, -0.013218045234680176, -0.012814998626708984, -0.012411952018737793, -0.012008905410766602, -0.01160585880279541, -0.011202812194824219, -0.010799765586853027, -0.010396718978881836, -0.009993672370910645, -0.009590625762939453, -0.009187579154968262, -0.00878453254699707, -0.008381485939025879, -0.007978439331054688, -0.007575392723083496, -0.007172346115112305, -0.006769299507141113, -0.006366252899169922, -0.0059632062911987305, -0.005560159683227539, -0.005157113075256348, -0.004754066467285156, -0.004351019859313965, -0.0039479732513427734, -0.003544926643371582, -0.0031418800354003906, -0.0027388334274291992, -0.002335786819458008, -0.0019327402114868164, -0.001529693603515625, -0.0011266469955444336, -0.0007236003875732422, -0.0003205537796020508, 8.249282836914062e-05, 0.00048553943634033203, 0.0008885860443115234, 0.0012916326522827148, 0.0016946792602539062, 0.0020977258682250977, 0.002500772476196289, 0.0029038190841674805, 0.003306865692138672, 0.0037099123001098633, 0.004112958908081055, 0.004516005516052246, 0.0049190521240234375, 0.005322098731994629, 0.00572514533996582, 0.006128191947937012, 0.006531238555908203, 0.0069342851638793945, 0.007337331771850586, 0.007740378379821777, 0.008143424987792969, 0.00854647159576416, 0.008949518203735352, 0.009352564811706543, 0.009755611419677734, 0.010158658027648926, 0.010561704635620117, 0.010964751243591309, 0.0113677978515625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 19.0, 223.0, 586.0, 175.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001708584139123559, -0.001652475562877953, -0.001596366986632347, -0.0015402584103867412, -0.0014841498341411352, -0.0014280412578955293, -0.0013719326816499233, -0.0013158239889889956, -0.0012597155291587114, -0.0012036069529131055, -0.0011474983766674995, -0.0010913898004218936, -0.0010352812241762877, -0.0009791726479306817, -0.0009230640134774148, -0.0008669554372318089, -0.000810846802778542, -0.0007547382265329361, -0.0006986296502873302, -0.0006425210740417242, -0.0005864124977961183, -0.0005303039215505123, -0.00047419528709724545, -0.0004180867108516395, -0.00036197813460603356, -0.0003058695583604276, -0.00024976098211482167, -0.00019365237676538527, -0.00013754380051977932, -8.143522427417338e-05, -2.5326618924736977e-05, 3.078195732086897e-05, 8.689064998179674e-05, 0.0001429992262274027, 0.00019910781702492386, 0.00025521640782244503, 0.000311324984068051, 0.0003674335603136569, 0.00042354216566309333, 0.0004796507419086993, 0.0005357593181543052, 0.0005918678943999112, 0.0006479764706455171, 0.000704085105098784, 0.0007601936813443899, 0.0008163022575899959, 0.0008724108338356018, 0.0009285194100812078, 0.0009846279863268137, 0.0010407365625724196, 0.0010968451388180256, 0.0011529537150636315, 0.0012090622913092375, 0.0012651708675548434, 0.0013212794438004494, 0.0013773881364613771, 0.0014334965962916613, 0.0014896051725372672, 0.0015457137487828732, 0.001601822325028479, 0.001657930901274085, 0.001714039477519691, 0.001770148053765297, 0.0018262567464262247, 0.0018823653226718307]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 4.0, 4.0, 3.0, 7.0, 12.0, 11.0, 17.0, 14.0, 14.0, 16.0, 25.0, 19.0, 21.0, 27.0, 40.0, 39.0, 35.0, 35.0, 39.0, 50.0, 41.0, 54.0, 38.0, 40.0, 47.0, 36.0, 30.0, 45.0, 39.0, 31.0, 31.0, 21.0, 25.0, 13.0, 16.0, 12.0, 8.0, 10.0, 9.0, 6.0, 4.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003325939178466797, -0.0003217337653040886, -0.0003108736127614975, -0.0003000134602189064, -0.0002891533076763153, -0.0002782931551337242, -0.0002674330025911331, -0.000256572850048542, -0.00024571269750595093, -0.00023485254496335983, -0.00022399239242076874, -0.00021313223987817764, -0.00020227208733558655, -0.00019141193479299545, -0.00018055178225040436, -0.00016969162970781326, -0.00015883147716522217, -0.00014797132462263107, -0.00013711117208003998, -0.00012625101953744888, -0.00011539086699485779, -0.00010453071445226669, -9.36705619096756e-05, -8.28104093670845e-05, -7.195025682449341e-05, -6.109010428190231e-05, -5.022995173931122e-05, -3.936979919672012e-05, -2.850964665412903e-05, -1.7649494111537933e-05, -6.789341568946838e-06, 4.070810973644257e-06, 1.4930963516235352e-05, 2.5791116058826447e-05, 3.665126860141754e-05, 4.7511421144008636e-05, 5.837157368659973e-05, 6.923172622919083e-05, 8.009187877178192e-05, 9.095203131437302e-05, 0.00010181218385696411, 0.0001126723363995552, 0.0001235324889421463, 0.0001343926414847374, 0.0001452527940273285, 0.00015611294656991959, 0.00016697309911251068, 0.00017783325165510178, 0.00018869340419769287, 0.00019955355674028397, 0.00021041370928287506, 0.00022127386182546616, 0.00023213401436805725, 0.00024299416691064835, 0.00025385431945323944, 0.00026471447199583054, 0.00027557462453842163, 0.0002864347770810127, 0.0002972949296236038, 0.0003081550821661949, 0.000319015234708786, 0.0003298753872513771, 0.0003407355397939682, 0.0003515956923365593, 0.0003624558448791504]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 7.0, 10.0, 13.0, 16.0, 17.0, 14.0, 18.0, 33.0, 18.0, 20.0, 31.0, 29.0, 22.0, 35.0, 45.0, 50.0, 40.0, 45.0, 42.0, 36.0, 41.0, 24.0, 34.0, 23.0, 35.0, 28.0, 36.0, 29.0, 32.0, 22.0, 15.0, 24.0, 12.0, 13.0, 9.0, 12.0, 9.0, 10.0, 7.0, 5.0, 3.0, 0.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.115234375, -3.020172119140625, -2.92510986328125, -2.830047607421875, -2.7349853515625, -2.639923095703125, -2.54486083984375, -2.449798583984375, -2.354736328125, -2.259674072265625, -2.16461181640625, -2.069549560546875, -1.9744873046875, -1.879425048828125, -1.78436279296875, -1.689300537109375, -1.59423828125, -1.499176025390625, -1.40411376953125, -1.309051513671875, -1.2139892578125, -1.118927001953125, -1.02386474609375, -0.928802490234375, -0.833740234375, -0.738677978515625, -0.64361572265625, -0.548553466796875, -0.4534912109375, -0.358428955078125, -0.26336669921875, -0.168304443359375, -0.0732421875, 0.021820068359375, 0.11688232421875, 0.211944580078125, 0.3070068359375, 0.402069091796875, 0.49713134765625, 0.592193603515625, 0.687255859375, 0.782318115234375, 0.87738037109375, 0.972442626953125, 1.0675048828125, 1.162567138671875, 1.25762939453125, 1.352691650390625, 1.44775390625, 1.542816162109375, 1.63787841796875, 1.732940673828125, 1.8280029296875, 1.923065185546875, 2.01812744140625, 2.113189697265625, 2.208251953125, 2.303314208984375, 2.39837646484375, 2.493438720703125, 2.5885009765625, 2.683563232421875, 2.77862548828125, 2.873687744140625, 2.96875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 10.0, 6.0, 20.0, 16.0, 22.0, 28.0, 48.0, 74.0, 85.0, 128.0, 157.0, 251.0, 379.0, 579.0, 961.0, 1875.0, 3658.0, 7435.0, 17442.0, 42929.0, 110882.0, 245322.0, 312772.0, 178958.0, 72906.0, 28247.0, 11685.0, 5381.0, 2575.0, 1360.0, 794.0, 488.0, 332.0, 221.0, 147.0, 109.0, 72.0, 52.0, 41.0, 39.0, 21.0, 13.0, 6.0, 8.0, 9.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.1328125, -4.012237548828125, -3.89166259765625, -3.771087646484375, -3.6505126953125, -3.529937744140625, -3.40936279296875, -3.288787841796875, -3.168212890625, -3.047637939453125, -2.92706298828125, -2.806488037109375, -2.6859130859375, -2.565338134765625, -2.44476318359375, -2.324188232421875, -2.20361328125, -2.083038330078125, -1.96246337890625, -1.841888427734375, -1.7213134765625, -1.600738525390625, -1.48016357421875, -1.359588623046875, -1.239013671875, -1.118438720703125, -0.99786376953125, -0.877288818359375, -0.7567138671875, -0.636138916015625, -0.51556396484375, -0.394989013671875, -0.2744140625, -0.153839111328125, -0.03326416015625, 0.087310791015625, 0.2078857421875, 0.328460693359375, 0.44903564453125, 0.569610595703125, 0.690185546875, 0.810760498046875, 0.93133544921875, 1.051910400390625, 1.1724853515625, 1.293060302734375, 1.41363525390625, 1.534210205078125, 1.65478515625, 1.775360107421875, 1.89593505859375, 2.016510009765625, 2.1370849609375, 2.257659912109375, 2.37823486328125, 2.498809814453125, 2.619384765625, 2.739959716796875, 2.86053466796875, 2.981109619140625, 3.1016845703125, 3.222259521484375, 3.34283447265625, 3.463409423828125, 3.583984375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 13.0, 10.0, 6.0, 6.0, 16.0, 14.0, 18.0, 18.0, 19.0, 32.0, 26.0, 23.0, 45.0, 40.0, 35.0, 52.0, 75.0, 159.0, 304.0, 1391.0, 205.0, 102.0, 66.0, 41.0, 52.0, 45.0, 34.0, 30.0, 27.0, 26.0, 17.0, 14.0, 16.0, 10.0, 16.0, 9.0, 7.0, 6.0, 8.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.046875, -11.68359375, -11.3203125, -10.95703125, -10.59375, -10.23046875, -9.8671875, -9.50390625, -9.140625, -8.77734375, -8.4140625, -8.05078125, -7.6875, -7.32421875, -6.9609375, -6.59765625, -6.234375, -5.87109375, -5.5078125, -5.14453125, -4.78125, -4.41796875, -4.0546875, -3.69140625, -3.328125, -2.96484375, -2.6015625, -2.23828125, -1.875, -1.51171875, -1.1484375, -0.78515625, -0.421875, -0.05859375, 0.3046875, 0.66796875, 1.03125, 1.39453125, 1.7578125, 2.12109375, 2.484375, 2.84765625, 3.2109375, 3.57421875, 3.9375, 4.30078125, 4.6640625, 5.02734375, 5.390625, 5.75390625, 6.1171875, 6.48046875, 6.84375, 7.20703125, 7.5703125, 7.93359375, 8.296875, 8.66015625, 9.0234375, 9.38671875, 9.75, 10.11328125, 10.4765625, 10.83984375, 11.203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 7.0, 6.0, 8.0, 10.0, 7.0, 12.0, 16.0, 16.0, 23.0, 30.0, 36.0, 44.0, 53.0, 84.0, 131.0, 205.0, 425.0, 1163.0, 10357.0, 2282929.0, 842446.0, 5776.0, 949.0, 339.0, 184.0, 129.0, 56.0, 39.0, 39.0, 39.0, 25.0, 17.0, 17.0, 17.0, 12.0, 17.0, 6.0, 7.0, 11.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.921875, -22.155517578125, -21.38916015625, -20.622802734375, -19.8564453125, -19.090087890625, -18.32373046875, -17.557373046875, -16.791015625, -16.024658203125, -15.25830078125, -14.491943359375, -13.7255859375, -12.959228515625, -12.19287109375, -11.426513671875, -10.66015625, -9.893798828125, -9.12744140625, -8.361083984375, -7.5947265625, -6.828369140625, -6.06201171875, -5.295654296875, -4.529296875, -3.762939453125, -2.99658203125, -2.230224609375, -1.4638671875, -0.697509765625, 0.06884765625, 0.835205078125, 1.6015625, 2.367919921875, 3.13427734375, 3.900634765625, 4.6669921875, 5.433349609375, 6.19970703125, 6.966064453125, 7.732421875, 8.498779296875, 9.26513671875, 10.031494140625, 10.7978515625, 11.564208984375, 12.33056640625, 13.096923828125, 13.86328125, 14.629638671875, 15.39599609375, 16.162353515625, 16.9287109375, 17.695068359375, 18.46142578125, 19.227783203125, 19.994140625, 20.760498046875, 21.52685546875, 22.293212890625, 23.0595703125, 23.825927734375, 24.59228515625, 25.358642578125, 26.125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 186.0, 782.0, 43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-208.3084716796875, -204.4712677001953, -200.6340789794922, -196.796875, -192.95968627929688, -189.1224822998047, -185.2852783203125, -181.44808959960938, -177.6108856201172, -173.773681640625, -169.93649291992188, -166.0992889404297, -162.2620849609375, -158.42489624023438, -154.5876922607422, -150.75050354003906, -146.91329956054688, -143.0760955810547, -139.23890686035156, -135.40170288085938, -131.56451416015625, -127.72731018066406, -123.89010620117188, -120.05290985107422, -116.21571350097656, -112.3785171508789, -108.54132080078125, -104.70411682128906, -100.8669204711914, -97.02972412109375, -93.19252014160156, -89.3553237915039, -85.51812744140625, -81.6809310913086, -77.84373474121094, -74.00653076171875, -70.1693344116211, -66.33213806152344, -62.494937896728516, -58.657737731933594, -54.82053756713867, -50.98333740234375, -47.146141052246094, -43.30894470214844, -39.471744537353516, -35.634544372558594, -31.797348022460938, -27.96014976501465, -24.12295150756836, -20.28575325012207, -16.44855499267578, -12.611356735229492, -8.774158477783203, -4.936960220336914, -1.099761962890625, 2.737436294555664, 6.574634552001953, 10.411832809448242, 14.249031066894531, 18.08622932434082, 21.92342758178711, 25.7606258392334, 29.597824096679688, 33.435020446777344, 37.272220611572266]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 1.0, 4.0, 6.0, 13.0, 10.0, 11.0, 17.0, 11.0, 15.0, 22.0, 19.0, 35.0, 17.0, 30.0, 21.0, 39.0, 48.0, 42.0, 48.0, 39.0, 39.0, 40.0, 28.0, 35.0, 38.0, 29.0, 45.0, 44.0, 31.0, 20.0, 28.0, 25.0, 30.0, 12.0, 15.0, 14.0, 15.0, 17.0, 7.0, 6.0, 7.0, 6.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.04179382324219, -32.95559310913086, -31.86939239501953, -30.783191680908203, -29.696990966796875, -28.610790252685547, -27.524587631225586, -26.438386917114258, -25.35218620300293, -24.2659854888916, -23.179784774780273, -22.093584060668945, -21.007381439208984, -19.921180725097656, -18.834980010986328, -17.748779296875, -16.662578582763672, -15.576377868652344, -14.490177154541016, -13.403975486755371, -12.317774772644043, -11.231574058532715, -10.14537239074707, -9.059171676635742, -7.972970962524414, -6.886770248413086, -5.8005690574646, -4.714367866516113, -3.628167152404785, -2.541966438293457, -1.4557652473449707, -0.3695640563964844, 0.7166366577148438, 1.802837610244751, 2.889038562774658, 3.9752395153045654, 5.061440467834473, 6.147641181945801, 7.233842372894287, 8.320043563842773, 9.406244277954102, 10.49244499206543, 11.578645706176758, 12.664847373962402, 13.75104808807373, 14.837248802185059, 15.923450469970703, 17.00965118408203, 18.09585189819336, 19.182052612304688, 20.268253326416016, 21.354454040527344, 22.440654754638672, 23.52685546875, 24.61305809020996, 25.69925880432129, 26.785459518432617, 27.871660232543945, 28.957860946655273, 30.0440616607666, 31.130264282226562, 32.21646499633789, 33.30266571044922, 34.38886642456055, 35.475067138671875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 13.0, 4.0, 11.0, 13.0, 18.0, 16.0, 17.0, 16.0, 20.0, 27.0, 19.0, 22.0, 40.0, 27.0, 32.0, 36.0, 44.0, 34.0, 44.0, 37.0, 30.0, 48.0, 44.0, 24.0, 35.0, 33.0, 33.0, 29.0, 26.0, 34.0, 17.0, 19.0, 25.0, 15.0, 12.0, 12.0, 11.0, 8.0, 10.0, 3.0, 6.0, 6.0, 3.0, 5.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-3.234375, -3.136474609375, -3.03857421875, -2.940673828125, -2.8427734375, -2.744873046875, -2.64697265625, -2.549072265625, -2.451171875, -2.353271484375, -2.25537109375, -2.157470703125, -2.0595703125, -1.961669921875, -1.86376953125, -1.765869140625, -1.66796875, -1.570068359375, -1.47216796875, -1.374267578125, -1.2763671875, -1.178466796875, -1.08056640625, -0.982666015625, -0.884765625, -0.786865234375, -0.68896484375, -0.591064453125, -0.4931640625, -0.395263671875, -0.29736328125, -0.199462890625, -0.1015625, -0.003662109375, 0.09423828125, 0.192138671875, 0.2900390625, 0.387939453125, 0.48583984375, 0.583740234375, 0.681640625, 0.779541015625, 0.87744140625, 0.975341796875, 1.0732421875, 1.171142578125, 1.26904296875, 1.366943359375, 1.46484375, 1.562744140625, 1.66064453125, 1.758544921875, 1.8564453125, 1.954345703125, 2.05224609375, 2.150146484375, 2.248046875, 2.345947265625, 2.44384765625, 2.541748046875, 2.6396484375, 2.737548828125, 2.83544921875, 2.933349609375, 3.03125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 9.0, 7.0, 16.0, 19.0, 17.0, 31.0, 22.0, 35.0, 48.0, 51.0, 81.0, 127.0, 264.0, 516.0, 1364.0, 5472.0, 39460.0, 615001.0, 3007817.0, 483944.0, 32840.0, 4686.0, 1257.0, 477.0, 220.0, 105.0, 79.0, 58.0, 47.0, 52.0, 29.0, 22.0, 20.0, 20.0, 10.0, 10.0, 13.0, 9.0, 3.0, 2.0, 5.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-12.7109375, -12.3310546875, -11.951171875, -11.5712890625, -11.19140625, -10.8115234375, -10.431640625, -10.0517578125, -9.671875, -9.2919921875, -8.912109375, -8.5322265625, -8.15234375, -7.7724609375, -7.392578125, -7.0126953125, -6.6328125, -6.2529296875, -5.873046875, -5.4931640625, -5.11328125, -4.7333984375, -4.353515625, -3.9736328125, -3.59375, -3.2138671875, -2.833984375, -2.4541015625, -2.07421875, -1.6943359375, -1.314453125, -0.9345703125, -0.5546875, -0.1748046875, 0.205078125, 0.5849609375, 0.96484375, 1.3447265625, 1.724609375, 2.1044921875, 2.484375, 2.8642578125, 3.244140625, 3.6240234375, 4.00390625, 4.3837890625, 4.763671875, 5.1435546875, 5.5234375, 5.9033203125, 6.283203125, 6.6630859375, 7.04296875, 7.4228515625, 7.802734375, 8.1826171875, 8.5625, 8.9423828125, 9.322265625, 9.7021484375, 10.08203125, 10.4619140625, 10.841796875, 11.2216796875, 11.6015625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 10.0, 7.0, 21.0, 31.0, 36.0, 52.0, 83.0, 125.0, 142.0, 216.0, 281.0, 379.0, 484.0, 496.0, 472.0, 354.0, 240.0, 195.0, 128.0, 93.0, 69.0, 48.0, 33.0, 21.0, 24.0, 8.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1328125, -12.72607421875, -12.3193359375, -11.91259765625, -11.505859375, -11.09912109375, -10.6923828125, -10.28564453125, -9.87890625, -9.47216796875, -9.0654296875, -8.65869140625, -8.251953125, -7.84521484375, -7.4384765625, -7.03173828125, -6.625, -6.21826171875, -5.8115234375, -5.40478515625, -4.998046875, -4.59130859375, -4.1845703125, -3.77783203125, -3.37109375, -2.96435546875, -2.5576171875, -2.15087890625, -1.744140625, -1.33740234375, -0.9306640625, -0.52392578125, -0.1171875, 0.28955078125, 0.6962890625, 1.10302734375, 1.509765625, 1.91650390625, 2.3232421875, 2.72998046875, 3.13671875, 3.54345703125, 3.9501953125, 4.35693359375, 4.763671875, 5.17041015625, 5.5771484375, 5.98388671875, 6.390625, 6.79736328125, 7.2041015625, 7.61083984375, 8.017578125, 8.42431640625, 8.8310546875, 9.23779296875, 9.64453125, 10.05126953125, 10.4580078125, 10.86474609375, 11.271484375, 11.67822265625, 12.0849609375, 12.49169921875, 12.8984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 9.0, 12.0, 21.0, 26.0, 45.0, 63.0, 113.0, 177.0, 331.0, 816.0, 2709.0, 41766.0, 3241195.0, 891954.0, 12133.0, 1623.0, 592.0, 270.0, 144.0, 88.0, 61.0, 41.0, 23.0, 22.0, 11.0, 10.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.03125, -22.87744140625, -21.7236328125, -20.56982421875, -19.416015625, -18.26220703125, -17.1083984375, -15.95458984375, -14.80078125, -13.64697265625, -12.4931640625, -11.33935546875, -10.185546875, -9.03173828125, -7.8779296875, -6.72412109375, -5.5703125, -4.41650390625, -3.2626953125, -2.10888671875, -0.955078125, 0.19873046875, 1.3525390625, 2.50634765625, 3.66015625, 4.81396484375, 5.9677734375, 7.12158203125, 8.275390625, 9.42919921875, 10.5830078125, 11.73681640625, 12.890625, 14.04443359375, 15.1982421875, 16.35205078125, 17.505859375, 18.65966796875, 19.8134765625, 20.96728515625, 22.12109375, 23.27490234375, 24.4287109375, 25.58251953125, 26.736328125, 27.89013671875, 29.0439453125, 30.19775390625, 31.3515625, 32.50537109375, 33.6591796875, 34.81298828125, 35.966796875, 37.12060546875, 38.2744140625, 39.42822265625, 40.58203125, 41.73583984375, 42.8896484375, 44.04345703125, 45.197265625, 46.35107421875, 47.5048828125, 48.65869140625, 49.8125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 12.0, 16.0, 19.0, 27.0, 47.0, 56.0, 79.0, 87.0, 80.0, 103.0, 81.0, 80.0, 85.0, 77.0, 44.0, 40.0, 29.0, 13.0, 10.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.093761444091797, -29.010303497314453, -27.926847457885742, -26.84339141845703, -25.759933471679688, -24.676475524902344, -23.593019485473633, -22.509563446044922, -21.426105499267578, -20.342647552490234, -19.259191513061523, -18.175735473632812, -17.09227752685547, -16.008819580078125, -14.925363540649414, -13.841906547546387, -12.75844955444336, -11.674992561340332, -10.591535568237305, -9.508078575134277, -8.42462158203125, -7.341164588928223, -6.257707595825195, -5.174250602722168, -4.090793609619141, -3.0073366165161133, -1.923879623413086, -0.8404226303100586, 0.24303436279296875, 1.326491355895996, 2.4099483489990234, 3.493405342102051, 4.5768585205078125, 5.66031551361084, 6.743772506713867, 7.8272294998168945, 8.910686492919922, 9.99414348602295, 11.077600479125977, 12.161057472229004, 13.244514465332031, 14.327971458435059, 15.411428451538086, 16.494884490966797, 17.57834243774414, 18.661800384521484, 19.745256423950195, 20.828712463378906, 21.91217041015625, 22.995628356933594, 24.079084396362305, 25.162540435791016, 26.24599838256836, 27.329456329345703, 28.412912368774414, 29.496368408203125, 30.57982635498047, 31.663284301757812, 32.746742248535156, 33.830196380615234, 34.91365432739258, 35.99711227416992, 37.08056640625, 38.164024353027344, 39.24748229980469]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 6.0, 17.0, 12.0, 30.0, 23.0, 19.0, 14.0, 34.0, 31.0, 24.0, 41.0, 41.0, 32.0, 53.0, 46.0, 44.0, 43.0, 36.0, 35.0, 50.0, 33.0, 44.0, 47.0, 42.0, 28.0, 25.0, 21.0, 23.0, 20.0, 11.0, 13.0, 10.0, 10.0, 6.0, 8.0, 5.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.70399856567383, -38.40064239501953, -37.0972900390625, -35.79393768310547, -34.49058151245117, -33.187225341796875, -31.883872985839844, -30.58051872253418, -29.277164459228516, -27.97381019592285, -26.670455932617188, -25.367101669311523, -24.06374740600586, -22.760393142700195, -21.45703887939453, -20.153684616088867, -18.850330352783203, -17.54697608947754, -16.243621826171875, -14.940267562866211, -13.636913299560547, -12.333559036254883, -11.030204772949219, -9.726850509643555, -8.42349624633789, -7.120141983032227, -5.8167877197265625, -4.513433456420898, -3.2100791931152344, -1.9067249298095703, -0.6033706665039062, 0.6999835968017578, 2.0033416748046875, 3.3066959381103516, 4.610050201416016, 5.91340446472168, 7.216758728027344, 8.520112991333008, 9.823467254638672, 11.126821517944336, 12.43017578125, 13.733530044555664, 15.036884307861328, 16.340238571166992, 17.643592834472656, 18.94694709777832, 20.250301361083984, 21.55365562438965, 22.857009887695312, 24.160364151000977, 25.46371841430664, 26.767072677612305, 28.07042694091797, 29.373781204223633, 30.677135467529297, 31.98048973083496, 33.283843994140625, 34.587196350097656, 35.89055252075195, 37.19390869140625, 38.49726104736328, 39.80061340332031, 41.10396957397461, 42.407325744628906, 43.71067810058594]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 14.0, 9.0, 11.0, 6.0, 13.0, 17.0, 9.0, 21.0, 16.0, 26.0, 34.0, 35.0, 28.0, 30.0, 38.0, 49.0, 35.0, 46.0, 35.0, 57.0, 40.0, 39.0, 35.0, 31.0, 38.0, 33.0, 25.0, 40.0, 22.0, 23.0, 22.0, 14.0, 17.0, 18.0, 9.0, 12.0, 14.0, 7.0, 5.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.63671875, -3.527374267578125, -3.41802978515625, -3.308685302734375, -3.1993408203125, -3.089996337890625, -2.98065185546875, -2.871307373046875, -2.761962890625, -2.652618408203125, -2.54327392578125, -2.433929443359375, -2.3245849609375, -2.215240478515625, -2.10589599609375, -1.996551513671875, -1.88720703125, -1.777862548828125, -1.66851806640625, -1.559173583984375, -1.4498291015625, -1.340484619140625, -1.23114013671875, -1.121795654296875, -1.012451171875, -0.903106689453125, -0.79376220703125, -0.684417724609375, -0.5750732421875, -0.465728759765625, -0.35638427734375, -0.247039794921875, -0.1376953125, -0.028350830078125, 0.08099365234375, 0.190338134765625, 0.2996826171875, 0.409027099609375, 0.51837158203125, 0.627716064453125, 0.737060546875, 0.846405029296875, 0.95574951171875, 1.065093994140625, 1.1744384765625, 1.283782958984375, 1.39312744140625, 1.502471923828125, 1.61181640625, 1.721160888671875, 1.83050537109375, 1.939849853515625, 2.0491943359375, 2.158538818359375, 2.26788330078125, 2.377227783203125, 2.486572265625, 2.595916748046875, 2.70526123046875, 2.814605712890625, 2.9239501953125, 3.033294677734375, 3.14263916015625, 3.251983642578125, 3.361328125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 2.0, 6.0, 12.0, 21.0, 22.0, 36.0, 49.0, 90.0, 100.0, 177.0, 259.0, 374.0, 536.0, 894.0, 1226.0, 1856.0, 2699.0, 4196.0, 6244.0, 9652.0, 15100.0, 23787.0, 39069.0, 64498.0, 112860.0, 229184.0, 241661.0, 117787.0, 66710.0, 39930.0, 24642.0, 15441.0, 9920.0, 6585.0, 4295.0, 2818.0, 1891.0, 1304.0, 863.0, 595.0, 380.0, 264.0, 188.0, 106.0, 73.0, 54.0, 32.0, 22.0, 21.0, 12.0, 11.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.64794921875, -0.6283340454101562, -0.6087188720703125, -0.5891036987304688, -0.569488525390625, -0.5498733520507812, -0.5302581787109375, -0.5106430053710938, -0.49102783203125, -0.47141265869140625, -0.4517974853515625, -0.43218231201171875, -0.412567138671875, -0.39295196533203125, -0.3733367919921875, -0.35372161865234375, -0.3341064453125, -0.31449127197265625, -0.2948760986328125, -0.27526092529296875, -0.255645751953125, -0.23603057861328125, -0.2164154052734375, -0.19680023193359375, -0.17718505859375, -0.15756988525390625, -0.1379547119140625, -0.11833953857421875, -0.098724365234375, -0.07910919189453125, -0.0594940185546875, -0.03987884521484375, -0.020263671875, -0.00064849853515625, 0.0189666748046875, 0.03858184814453125, 0.058197021484375, 0.07781219482421875, 0.0974273681640625, 0.11704254150390625, 0.13665771484375, 0.15627288818359375, 0.1758880615234375, 0.19550323486328125, 0.215118408203125, 0.23473358154296875, 0.2543487548828125, 0.27396392822265625, 0.2935791015625, 0.31319427490234375, 0.3328094482421875, 0.35242462158203125, 0.372039794921875, 0.39165496826171875, 0.4112701416015625, 0.43088531494140625, 0.45050048828125, 0.47011566162109375, 0.4897308349609375, 0.5093460083007812, 0.528961181640625, 0.5485763549804688, 0.5681915283203125, 0.5878067016601562, 0.607421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 8.0, 11.0, 14.0, 24.0, 19.0, 19.0, 25.0, 26.0, 26.0, 37.0, 33.0, 39.0, 31.0, 42.0, 29.0, 35.0, 37.0, 1070.0, 42.0, 36.0, 39.0, 39.0, 36.0, 36.0, 33.0, 30.0, 19.0, 22.0, 23.0, 24.0, 10.0, 22.0, 12.0, 13.0, 12.0, 6.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9853515625, -1.9157257080078125, -1.846099853515625, -1.7764739990234375, -1.70684814453125, -1.6372222900390625, -1.567596435546875, -1.4979705810546875, -1.4283447265625, -1.3587188720703125, -1.289093017578125, -1.2194671630859375, -1.14984130859375, -1.0802154541015625, -1.010589599609375, -0.9409637451171875, -0.871337890625, -0.8017120361328125, -0.732086181640625, -0.6624603271484375, -0.59283447265625, -0.5232086181640625, -0.453582763671875, -0.3839569091796875, -0.3143310546875, -0.2447052001953125, -0.175079345703125, -0.1054534912109375, -0.03582763671875, 0.0337982177734375, 0.103424072265625, 0.1730499267578125, 0.24267578125, 0.3123016357421875, 0.381927490234375, 0.4515533447265625, 0.52117919921875, 0.5908050537109375, 0.660430908203125, 0.7300567626953125, 0.7996826171875, 0.8693084716796875, 0.938934326171875, 1.0085601806640625, 1.07818603515625, 1.1478118896484375, 1.217437744140625, 1.2870635986328125, 1.356689453125, 1.4263153076171875, 1.495941162109375, 1.5655670166015625, 1.63519287109375, 1.7048187255859375, 1.774444580078125, 1.8440704345703125, 1.9136962890625, 1.9833221435546875, 2.052947998046875, 2.1225738525390625, 2.19219970703125, 2.2618255615234375, 2.331451416015625, 2.4010772705078125, 2.470703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 13.0, 18.0, 20.0, 37.0, 53.0, 75.0, 93.0, 143.0, 227.0, 273.0, 382.0, 589.0, 843.0, 1326.0, 1922.0, 3134.0, 4580.0, 7405.0, 11706.0, 18316.0, 29523.0, 48210.0, 82799.0, 154961.0, 1326831.0, 173230.0, 90536.0, 52598.0, 32044.0, 19851.0, 12383.0, 8040.0, 5119.0, 3244.0, 2130.0, 1384.0, 949.0, 694.0, 476.0, 323.0, 191.0, 134.0, 89.0, 68.0, 37.0, 32.0, 27.0, 22.0, 9.0, 14.0, 11.0, 4.0, 3.0, 2.0, 5.0], "bins": [-0.6376953125, -0.6187057495117188, -0.5997161865234375, -0.5807266235351562, -0.561737060546875, -0.5427474975585938, -0.5237579345703125, -0.5047683715820312, -0.48577880859375, -0.46678924560546875, -0.4477996826171875, -0.42881011962890625, -0.409820556640625, -0.39083099365234375, -0.3718414306640625, -0.35285186767578125, -0.3338623046875, -0.31487274169921875, -0.2958831787109375, -0.27689361572265625, -0.257904052734375, -0.23891448974609375, -0.2199249267578125, -0.20093536376953125, -0.18194580078125, -0.16295623779296875, -0.1439666748046875, -0.12497711181640625, -0.105987548828125, -0.08699798583984375, -0.0680084228515625, -0.04901885986328125, -0.030029296875, -0.01103973388671875, 0.0079498291015625, 0.02693939208984375, 0.045928955078125, 0.06491851806640625, 0.0839080810546875, 0.10289764404296875, 0.12188720703125, 0.14087677001953125, 0.1598663330078125, 0.17885589599609375, 0.197845458984375, 0.21683502197265625, 0.2358245849609375, 0.25481414794921875, 0.2738037109375, 0.29279327392578125, 0.3117828369140625, 0.33077239990234375, 0.349761962890625, 0.36875152587890625, 0.3877410888671875, 0.40673065185546875, 0.42572021484375, 0.44470977783203125, 0.4636993408203125, 0.48268890380859375, 0.501678466796875, 0.5206680297851562, 0.5396575927734375, 0.5586471557617188, 0.57763671875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 2.0, 8.0, 7.0, 8.0, 10.0, 9.0, 9.0, 19.0, 25.0, 14.0, 20.0, 16.0, 28.0, 34.0, 43.0, 43.0, 46.0, 56.0, 53.0, 57.0, 59.0, 50.0, 46.0, 48.0, 34.0, 41.0, 50.0, 33.0, 17.0, 23.0, 20.0, 17.0, 8.0, 14.0, 8.0, 7.0, 4.0, 3.0, 4.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00048160552978515625, -0.00046490877866744995, -0.00044821202754974365, -0.00043151527643203735, -0.00041481852531433105, -0.00039812177419662476, -0.00038142502307891846, -0.00036472827196121216, -0.00034803152084350586, -0.00033133476972579956, -0.00031463801860809326, -0.00029794126749038696, -0.00028124451637268066, -0.00026454776525497437, -0.00024785101413726807, -0.00023115426301956177, -0.00021445751190185547, -0.00019776076078414917, -0.00018106400966644287, -0.00016436725854873657, -0.00014767050743103027, -0.00013097375631332397, -0.00011427700519561768, -9.758025407791138e-05, -8.088350296020508e-05, -6.418675184249878e-05, -4.749000072479248e-05, -3.079324960708618e-05, -1.4096498489379883e-05, 2.600252628326416e-06, 1.9297003746032715e-05, 3.5993754863739014e-05, 5.269050598144531e-05, 6.938725709915161e-05, 8.608400821685791e-05, 0.00010278075933456421, 0.00011947751045227051, 0.0001361742615699768, 0.0001528710126876831, 0.0001695677638053894, 0.0001862645149230957, 0.000202961266040802, 0.0002196580171585083, 0.0002363547682762146, 0.0002530515193939209, 0.0002697482705116272, 0.0002864450216293335, 0.0003031417727470398, 0.0003198385238647461, 0.0003365352749824524, 0.0003532320261001587, 0.000369928777217865, 0.0003866255283355713, 0.0004033222794532776, 0.0004200190305709839, 0.0004367157816886902, 0.0004534125328063965, 0.0004701092839241028, 0.0004868060350418091, 0.0005035027861595154, 0.0005201995372772217, 0.000536896288394928, 0.0005535930395126343, 0.0005702897906303406, 0.0005869865417480469]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 9.0, 5.0, 9.0, 10.0, 19.0, 21.0, 29.0, 57.0, 59.0, 62.0, 98.0, 120.0, 170.0, 222.0, 324.0, 628.0, 10185.0, 1016701.0, 17866.0, 709.0, 322.0, 252.0, 174.0, 134.0, 82.0, 68.0, 48.0, 46.0, 23.0, 32.0, 15.0, 20.0, 8.0, 11.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01288604736328125, -0.012533426284790039, -0.012180805206298828, -0.011828184127807617, -0.011475563049316406, -0.011122941970825195, -0.010770320892333984, -0.010417699813842773, -0.010065078735351562, -0.009712457656860352, -0.00935983657836914, -0.00900721549987793, -0.008654594421386719, -0.008301973342895508, -0.007949352264404297, -0.007596731185913086, -0.007244110107421875, -0.006891489028930664, -0.006538867950439453, -0.006186246871948242, -0.005833625793457031, -0.00548100471496582, -0.005128383636474609, -0.0047757625579833984, -0.0044231414794921875, -0.0040705204010009766, -0.0037178993225097656, -0.0033652782440185547, -0.0030126571655273438, -0.002660036087036133, -0.002307415008544922, -0.001954793930053711, -0.0016021728515625, -0.001249551773071289, -0.0008969306945800781, -0.0005443096160888672, -0.00019168853759765625, 0.0001609325408935547, 0.0005135536193847656, 0.0008661746978759766, 0.0012187957763671875, 0.0015714168548583984, 0.0019240379333496094, 0.0022766590118408203, 0.0026292800903320312, 0.002981901168823242, 0.003334522247314453, 0.003687143325805664, 0.004039764404296875, 0.004392385482788086, 0.004745006561279297, 0.005097627639770508, 0.005450248718261719, 0.00580286979675293, 0.006155490875244141, 0.0065081119537353516, 0.0068607330322265625, 0.0072133541107177734, 0.007565975189208984, 0.007918596267700195, 0.008271217346191406, 0.008623838424682617, 0.008976459503173828, 0.009329080581665039, 0.00968170166015625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 26.0, 180.0, 363.0, 333.0, 93.0, 18.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008653370314277709, -0.0008216529386118054, -0.0007779689040035009, -0.0007342848111875355, -0.0006906007183715701, -0.0006469166837632656, -0.0006032325909473002, -0.0005595484981313348, -0.0005158644635230303, -0.0004721803998108953, -0.0004284963069949299, -0.00038481224328279495, -0.00034112815046682954, -0.0002974440867546946, -0.0002537600230425596, -0.0002100759302265942, -0.0001663918374106288, -0.0001227077591465786, -7.902368815848604e-05, -3.533961717039347e-05, 8.344461093656719e-06, 5.2028539357706904e-05, 9.571260306984186e-05, 0.00013939669588580728, 0.00018308075959794223, 0.00022676483786199242, 0.0002704489161260426, 0.00031413297983817756, 0.0003578170435503125, 0.00040150113636627793, 0.0004451852000784129, 0.0004888692637905478, 0.0005325532983988523, 0.0005762373912148178, 0.0006199214258231223, 0.0006636055186390877, 0.0007072896114550531, 0.0007509737042710185, 0.000794657738879323, 0.0008383418316952884, 0.0008820259245112538, 0.0009257100173272192, 0.0009693940519355237, 0.0010130781447514892, 0.0010567621793597937, 0.00110044633038342, 0.0011441303649917245, 0.001187814399600029, 0.0012314985506236553, 0.0012751825852319598, 0.0013188667362555861, 0.0013625507708638906, 0.0014062348054721951, 0.0014499189564958215, 0.001493602991104126, 0.0015372871421277523, 0.001580971060320735, 0.0016246550949290395, 0.0016683392459526658, 0.0017120232805609703, 0.0017557073151692748, 0.0017993914661929011, 0.0018430755008012056, 0.001886759651824832, 0.0019304436864331365]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 7.0, 15.0, 17.0, 18.0, 16.0, 8.0, 13.0, 23.0, 23.0, 22.0, 27.0, 33.0, 40.0, 34.0, 33.0, 30.0, 31.0, 41.0, 38.0, 43.0, 51.0, 35.0, 36.0, 32.0, 35.0, 32.0, 41.0, 23.0, 18.0, 23.0, 27.0, 25.0, 15.0, 14.0, 8.0, 8.0, 9.0, 10.0, 9.0, 3.0, 10.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025898218154907227, -0.00025032833218574524, -0.0002416744828224182, -0.0002330206334590912, -0.00022436678409576416, -0.00021571293473243713, -0.0002070590853691101, -0.00019840523600578308, -0.00018975138664245605, -0.00018109753727912903, -0.000172443687915802, -0.00016378983855247498, -0.00015513598918914795, -0.00014648213982582092, -0.0001378282904624939, -0.00012917444109916687, -0.00012052059173583984, -0.00011186674237251282, -0.00010321289300918579, -9.455904364585876e-05, -8.590519428253174e-05, -7.725134491920471e-05, -6.859749555587769e-05, -5.994364619255066e-05, -5.128979682922363e-05, -4.2635947465896606e-05, -3.398209810256958e-05, -2.5328248739242554e-05, -1.6674399375915527e-05, -8.020550012588501e-06, 6.332993507385254e-07, 9.287148714065552e-06, 1.7940998077392578e-05, 2.6594847440719604e-05, 3.524869680404663e-05, 4.390254616737366e-05, 5.2556395530700684e-05, 6.121024489402771e-05, 6.986409425735474e-05, 7.851794362068176e-05, 8.717179298400879e-05, 9.582564234733582e-05, 0.00010447949171066284, 0.00011313334107398987, 0.0001217871904373169, 0.00013044103980064392, 0.00013909488916397095, 0.00014774873852729797, 0.000156402587890625, 0.00016505643725395203, 0.00017371028661727905, 0.00018236413598060608, 0.0001910179853439331, 0.00019967183470726013, 0.00020832568407058716, 0.00021697953343391418, 0.0002256333827972412, 0.00023428723216056824, 0.00024294108152389526, 0.0002515949308872223, 0.0002602487802505493, 0.00026890262961387634, 0.00027755647897720337, 0.0002862103283405304, 0.0002948641777038574]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 14.0, 9.0, 11.0, 6.0, 13.0, 17.0, 9.0, 21.0, 16.0, 26.0, 34.0, 35.0, 28.0, 30.0, 38.0, 49.0, 35.0, 46.0, 35.0, 57.0, 40.0, 39.0, 35.0, 31.0, 38.0, 33.0, 25.0, 40.0, 22.0, 23.0, 22.0, 14.0, 17.0, 18.0, 9.0, 12.0, 14.0, 7.0, 5.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.63671875, -3.527374267578125, -3.41802978515625, -3.308685302734375, -3.1993408203125, -3.089996337890625, -2.98065185546875, -2.871307373046875, -2.761962890625, -2.652618408203125, -2.54327392578125, -2.433929443359375, -2.3245849609375, -2.215240478515625, -2.10589599609375, -1.996551513671875, -1.88720703125, -1.777862548828125, -1.66851806640625, -1.559173583984375, -1.4498291015625, -1.340484619140625, -1.23114013671875, -1.121795654296875, -1.012451171875, -0.903106689453125, -0.79376220703125, -0.684417724609375, -0.5750732421875, -0.465728759765625, -0.35638427734375, -0.247039794921875, -0.1376953125, -0.028350830078125, 0.08099365234375, 0.190338134765625, 0.2996826171875, 0.409027099609375, 0.51837158203125, 0.627716064453125, 0.737060546875, 0.846405029296875, 0.95574951171875, 1.065093994140625, 1.1744384765625, 1.283782958984375, 1.39312744140625, 1.502471923828125, 1.61181640625, 1.721160888671875, 1.83050537109375, 1.939849853515625, 2.0491943359375, 2.158538818359375, 2.26788330078125, 2.377227783203125, 2.486572265625, 2.595916748046875, 2.70526123046875, 2.814605712890625, 2.9239501953125, 3.033294677734375, 3.14263916015625, 3.251983642578125, 3.361328125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 8.0, 16.0, 11.0, 19.0, 18.0, 28.0, 52.0, 76.0, 103.0, 147.0, 205.0, 277.0, 405.0, 671.0, 1104.0, 1987.0, 3438.0, 6572.0, 12804.0, 28685.0, 72579.0, 210682.0, 403633.0, 187600.0, 65042.0, 26127.0, 12116.0, 6104.0, 3194.0, 1865.0, 1028.0, 661.0, 375.0, 259.0, 179.0, 140.0, 101.0, 68.0, 53.0, 40.0, 31.0, 14.0, 16.0, 14.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.9765625, -3.857666015625, -3.73876953125, -3.619873046875, -3.5009765625, -3.382080078125, -3.26318359375, -3.144287109375, -3.025390625, -2.906494140625, -2.78759765625, -2.668701171875, -2.5498046875, -2.430908203125, -2.31201171875, -2.193115234375, -2.07421875, -1.955322265625, -1.83642578125, -1.717529296875, -1.5986328125, -1.479736328125, -1.36083984375, -1.241943359375, -1.123046875, -1.004150390625, -0.88525390625, -0.766357421875, -0.6474609375, -0.528564453125, -0.40966796875, -0.290771484375, -0.171875, -0.052978515625, 0.06591796875, 0.184814453125, 0.3037109375, 0.422607421875, 0.54150390625, 0.660400390625, 0.779296875, 0.898193359375, 1.01708984375, 1.135986328125, 1.2548828125, 1.373779296875, 1.49267578125, 1.611572265625, 1.73046875, 1.849365234375, 1.96826171875, 2.087158203125, 2.2060546875, 2.324951171875, 2.44384765625, 2.562744140625, 2.681640625, 2.800537109375, 2.91943359375, 3.038330078125, 3.1572265625, 3.276123046875, 3.39501953125, 3.513916015625, 3.6328125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 6.0, 11.0, 9.0, 3.0, 4.0, 16.0, 17.0, 23.0, 24.0, 24.0, 38.0, 34.0, 35.0, 32.0, 34.0, 57.0, 75.0, 160.0, 1545.0, 375.0, 106.0, 55.0, 47.0, 30.0, 48.0, 38.0, 38.0, 32.0, 24.0, 18.0, 14.0, 11.0, 19.0, 11.0, 11.0, 10.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.511962890625, -12.07861328125, -11.645263671875, -11.2119140625, -10.778564453125, -10.34521484375, -9.911865234375, -9.478515625, -9.045166015625, -8.61181640625, -8.178466796875, -7.7451171875, -7.311767578125, -6.87841796875, -6.445068359375, -6.01171875, -5.578369140625, -5.14501953125, -4.711669921875, -4.2783203125, -3.844970703125, -3.41162109375, -2.978271484375, -2.544921875, -2.111572265625, -1.67822265625, -1.244873046875, -0.8115234375, -0.378173828125, 0.05517578125, 0.488525390625, 0.921875, 1.355224609375, 1.78857421875, 2.221923828125, 2.6552734375, 3.088623046875, 3.52197265625, 3.955322265625, 4.388671875, 4.822021484375, 5.25537109375, 5.688720703125, 6.1220703125, 6.555419921875, 6.98876953125, 7.422119140625, 7.85546875, 8.288818359375, 8.72216796875, 9.155517578125, 9.5888671875, 10.022216796875, 10.45556640625, 10.888916015625, 11.322265625, 11.755615234375, 12.18896484375, 12.622314453125, 13.0556640625, 13.489013671875, 13.92236328125, 14.355712890625, 14.7890625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 10.0, 6.0, 13.0, 14.0, 20.0, 16.0, 22.0, 27.0, 28.0, 47.0, 59.0, 82.0, 111.0, 203.0, 366.0, 1046.0, 8161.0, 595224.0, 2522478.0, 15036.0, 1564.0, 470.0, 214.0, 136.0, 66.0, 63.0, 51.0, 41.0, 30.0, 19.0, 18.0, 14.0, 7.0, 8.0, 10.0, 17.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.765625, -24.017578125, -23.26953125, -22.521484375, -21.7734375, -21.025390625, -20.27734375, -19.529296875, -18.78125, -18.033203125, -17.28515625, -16.537109375, -15.7890625, -15.041015625, -14.29296875, -13.544921875, -12.796875, -12.048828125, -11.30078125, -10.552734375, -9.8046875, -9.056640625, -8.30859375, -7.560546875, -6.8125, -6.064453125, -5.31640625, -4.568359375, -3.8203125, -3.072265625, -2.32421875, -1.576171875, -0.828125, -0.080078125, 0.66796875, 1.416015625, 2.1640625, 2.912109375, 3.66015625, 4.408203125, 5.15625, 5.904296875, 6.65234375, 7.400390625, 8.1484375, 8.896484375, 9.64453125, 10.392578125, 11.140625, 11.888671875, 12.63671875, 13.384765625, 14.1328125, 14.880859375, 15.62890625, 16.376953125, 17.125, 17.873046875, 18.62109375, 19.369140625, 20.1171875, 20.865234375, 21.61328125, 22.361328125, 23.109375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 16.0, 22.0, 64.0, 141.0, 173.0, 204.0, 170.0, 118.0, 42.0, 29.0, 13.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0806245803833, -10.249979019165039, -9.419332504272461, -8.588685989379883, -7.758040428161621, -6.927394390106201, -6.096748352050781, -5.266102313995361, -4.435456275939941, -3.6048102378845215, -2.7741641998291016, -1.9435181617736816, -1.1128721237182617, -0.2822260856628418, 0.5484199523925781, 1.379065990447998, 2.209712028503418, 3.040358066558838, 3.871004104614258, 4.701650142669678, 5.532296180725098, 6.362942218780518, 7.1935882568359375, 8.024234771728516, 8.854880332946777, 9.685525894165039, 10.516172409057617, 11.346818923950195, 12.177464485168457, 13.008110046386719, 13.838756561279297, 14.669403076171875, 15.500049591064453, 16.33069610595703, 17.16134262084961, 17.991987228393555, 18.822633743286133, 19.65328025817871, 20.483924865722656, 21.314571380615234, 22.145217895507812, 22.97586441040039, 23.80651092529297, 24.637155532836914, 25.467802047729492, 26.29844856262207, 27.129093170166016, 27.959739685058594, 28.790386199951172, 29.62103271484375, 30.451679229736328, 31.282323837280273, 32.11296844482422, 32.9436149597168, 33.774261474609375, 34.60490798950195, 35.43555450439453, 36.26620101928711, 37.09684753417969, 37.927494049072266, 38.758140563964844, 39.588783264160156, 40.419429779052734, 41.25007629394531, 42.08072280883789]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 7.0, 6.0, 14.0, 9.0, 12.0, 12.0, 14.0, 11.0, 19.0, 29.0, 35.0, 32.0, 40.0, 32.0, 34.0, 32.0, 46.0, 41.0, 41.0, 26.0, 46.0, 35.0, 42.0, 36.0, 36.0, 41.0, 33.0, 30.0, 26.0, 30.0, 26.0, 24.0, 27.0, 9.0, 15.0, 11.0, 7.0, 5.0, 7.0, 3.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-41.49871063232422, -40.227928161621094, -38.957149505615234, -37.68636703491211, -36.415584564208984, -35.144805908203125, -33.8740234375, -32.603240966796875, -31.332460403442383, -30.06167984008789, -28.790897369384766, -27.520116806030273, -26.24933624267578, -24.978553771972656, -23.707773208618164, -22.436992645263672, -21.166210174560547, -19.895429611206055, -18.62464714050293, -17.353866577148438, -16.083084106445312, -14.81230354309082, -13.541522979736328, -12.27074146270752, -10.999959945678711, -9.729178428649902, -8.458396911621094, -7.187616348266602, -5.916834831237793, -4.646053314208984, -3.375272274017334, -2.1044912338256836, -0.833709716796875, 0.4370715618133545, 1.707852840423584, 2.9786341190338135, 4.249415397644043, 5.520196914672852, 6.790977954864502, 8.061758995056152, 9.332540512084961, 10.60332202911377, 11.874103546142578, 13.14488410949707, 14.415665626525879, 15.686447143554688, 16.95722770690918, 18.228008270263672, 19.498790740966797, 20.76957130432129, 22.040353775024414, 23.311134338378906, 24.58191680908203, 25.852697372436523, 27.123477935791016, 28.39426040649414, 29.665040969848633, 30.935821533203125, 32.20660400390625, 33.477386474609375, 34.748165130615234, 36.01894760131836, 37.289730072021484, 38.560508728027344, 39.83129119873047]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 8.0, 6.0, 9.0, 12.0, 13.0, 14.0, 11.0, 18.0, 22.0, 20.0, 35.0, 31.0, 34.0, 39.0, 31.0, 44.0, 50.0, 37.0, 55.0, 43.0, 40.0, 37.0, 45.0, 27.0, 34.0, 47.0, 31.0, 30.0, 21.0, 30.0, 24.0, 9.0, 16.0, 17.0, 11.0, 7.0, 9.0, 10.0, 2.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.917449951171875, -3.79583740234375, -3.674224853515625, -3.5526123046875, -3.430999755859375, -3.30938720703125, -3.187774658203125, -3.066162109375, -2.944549560546875, -2.82293701171875, -2.701324462890625, -2.5797119140625, -2.458099365234375, -2.33648681640625, -2.214874267578125, -2.09326171875, -1.971649169921875, -1.85003662109375, -1.728424072265625, -1.6068115234375, -1.485198974609375, -1.36358642578125, -1.241973876953125, -1.120361328125, -0.998748779296875, -0.87713623046875, -0.755523681640625, -0.6339111328125, -0.512298583984375, -0.39068603515625, -0.269073486328125, -0.1474609375, -0.025848388671875, 0.09576416015625, 0.217376708984375, 0.3389892578125, 0.460601806640625, 0.58221435546875, 0.703826904296875, 0.825439453125, 0.947052001953125, 1.06866455078125, 1.190277099609375, 1.3118896484375, 1.433502197265625, 1.55511474609375, 1.676727294921875, 1.79833984375, 1.919952392578125, 2.04156494140625, 2.163177490234375, 2.2847900390625, 2.406402587890625, 2.52801513671875, 2.649627685546875, 2.771240234375, 2.892852783203125, 3.01446533203125, 3.136077880859375, 3.2576904296875, 3.379302978515625, 3.50091552734375, 3.622528076171875, 3.744140625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 4.0, 14.0, 5.0, 10.0, 9.0, 13.0, 18.0, 21.0, 23.0, 26.0, 25.0, 42.0, 48.0, 60.0, 122.0, 374.0, 2239.0, 40712.0, 2666215.0, 1462002.0, 20156.0, 1442.0, 280.0, 94.0, 46.0, 40.0, 33.0, 34.0, 23.0, 20.0, 16.0, 22.0, 19.0, 10.0, 5.0, 9.0, 7.0, 6.0, 5.0, 6.0, 6.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.71875, -21.078125, -20.4375, -19.796875, -19.15625, -18.515625, -17.875, -17.234375, -16.59375, -15.953125, -15.3125, -14.671875, -14.03125, -13.390625, -12.75, -12.109375, -11.46875, -10.828125, -10.1875, -9.546875, -8.90625, -8.265625, -7.625, -6.984375, -6.34375, -5.703125, -5.0625, -4.421875, -3.78125, -3.140625, -2.5, -1.859375, -1.21875, -0.578125, 0.0625, 0.703125, 1.34375, 1.984375, 2.625, 3.265625, 3.90625, 4.546875, 5.1875, 5.828125, 6.46875, 7.109375, 7.75, 8.390625, 9.03125, 9.671875, 10.3125, 10.953125, 11.59375, 12.234375, 12.875, 13.515625, 14.15625, 14.796875, 15.4375, 16.078125, 16.71875, 17.359375, 18.0, 18.640625, 19.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 6.0, 9.0, 12.0, 19.0, 27.0, 34.0, 58.0, 84.0, 127.0, 152.0, 209.0, 330.0, 433.0, 488.0, 499.0, 384.0, 353.0, 271.0, 175.0, 109.0, 87.0, 61.0, 48.0, 32.0, 19.0, 14.0, 4.0, 8.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.5625, -15.173828125, -14.78515625, -14.396484375, -14.0078125, -13.619140625, -13.23046875, -12.841796875, -12.453125, -12.064453125, -11.67578125, -11.287109375, -10.8984375, -10.509765625, -10.12109375, -9.732421875, -9.34375, -8.955078125, -8.56640625, -8.177734375, -7.7890625, -7.400390625, -7.01171875, -6.623046875, -6.234375, -5.845703125, -5.45703125, -5.068359375, -4.6796875, -4.291015625, -3.90234375, -3.513671875, -3.125, -2.736328125, -2.34765625, -1.958984375, -1.5703125, -1.181640625, -0.79296875, -0.404296875, -0.015625, 0.373046875, 0.76171875, 1.150390625, 1.5390625, 1.927734375, 2.31640625, 2.705078125, 3.09375, 3.482421875, 3.87109375, 4.259765625, 4.6484375, 5.037109375, 5.42578125, 5.814453125, 6.203125, 6.591796875, 6.98046875, 7.369140625, 7.7578125, 8.146484375, 8.53515625, 8.923828125, 9.3125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 10.0, 14.0, 10.0, 21.0, 28.0, 53.0, 79.0, 138.0, 201.0, 392.0, 1303.0, 18019.0, 3197142.0, 968322.0, 6944.0, 790.0, 329.0, 182.0, 113.0, 73.0, 44.0, 30.0, 13.0, 5.0, 7.0, 6.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.3125, -33.892578125, -32.47265625, -31.052734375, -29.6328125, -28.212890625, -26.79296875, -25.373046875, -23.953125, -22.533203125, -21.11328125, -19.693359375, -18.2734375, -16.853515625, -15.43359375, -14.013671875, -12.59375, -11.173828125, -9.75390625, -8.333984375, -6.9140625, -5.494140625, -4.07421875, -2.654296875, -1.234375, 0.185546875, 1.60546875, 3.025390625, 4.4453125, 5.865234375, 7.28515625, 8.705078125, 10.125, 11.544921875, 12.96484375, 14.384765625, 15.8046875, 17.224609375, 18.64453125, 20.064453125, 21.484375, 22.904296875, 24.32421875, 25.744140625, 27.1640625, 28.583984375, 30.00390625, 31.423828125, 32.84375, 34.263671875, 35.68359375, 37.103515625, 38.5234375, 39.943359375, 41.36328125, 42.783203125, 44.203125, 45.623046875, 47.04296875, 48.462890625, 49.8828125, 51.302734375, 52.72265625, 54.142578125, 55.5625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 19.0, 97.0, 301.0, 376.0, 183.0, 33.0, 5.0, 2.0], "bins": [-292.83917236328125, -287.89251708984375, -282.9458312988281, -277.9991760253906, -273.0525207519531, -268.1058349609375, -263.1591796875, -258.2125244140625, -253.26583862304688, -248.3191680908203, -243.3725128173828, -238.42584228515625, -233.4791717529297, -228.53250122070312, -223.58584594726562, -218.63917541503906, -213.69252014160156, -208.745849609375, -203.7991943359375, -198.85252380371094, -193.90585327148438, -188.95919799804688, -184.0125274658203, -179.06585693359375, -174.11920166015625, -169.1725311279297, -164.2258758544922, -159.27920532226562, -154.33253479003906, -149.3858642578125, -144.439208984375, -139.49253845214844, -134.54586791992188, -129.5991973876953, -124.65253448486328, -119.70587158203125, -114.75920104980469, -109.81253814697266, -104.86587524414062, -99.91920471191406, -94.97254180908203, -90.02587890625, -85.07920837402344, -80.1325454711914, -75.18588256835938, -70.23921203613281, -65.29254913330078, -60.345882415771484, -55.39921569824219, -50.45254898071289, -45.505882263183594, -40.55921936035156, -35.612552642822266, -30.66588592529297, -25.719221115112305, -20.77255630493164, -15.825891494750977, -10.879225730895996, -5.932559967041016, -0.9858942031860352, 3.9607715606689453, 8.907438278198242, 13.854103088378906, 18.80076789855957, 23.747434616088867]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 9.0, 6.0, 13.0, 11.0, 17.0, 29.0, 16.0, 17.0, 19.0, 27.0, 30.0, 34.0, 36.0, 43.0, 45.0, 56.0, 42.0, 51.0, 34.0, 42.0, 48.0, 44.0, 38.0, 57.0, 39.0, 30.0, 34.0, 26.0, 18.0, 24.0, 18.0, 13.0, 9.0, 9.0, 3.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.424598693847656, -40.11902618408203, -38.81345748901367, -37.50788879394531, -36.20231628417969, -34.89674377441406, -33.5911750793457, -32.285606384277344, -30.98003387451172, -29.674463272094727, -28.368892669677734, -27.063322067260742, -25.75775146484375, -24.452180862426758, -23.146610260009766, -21.841039657592773, -20.53546905517578, -19.22989845275879, -17.924327850341797, -16.618757247924805, -15.313186645507812, -14.00761604309082, -12.702045440673828, -11.396474838256836, -10.090904235839844, -8.785333633422852, -7.479763031005859, -6.174192428588867, -4.868621826171875, -3.563051223754883, -2.2574806213378906, -0.9519100189208984, 0.3536567687988281, 1.6592273712158203, 2.9647979736328125, 4.270368576049805, 5.575939178466797, 6.881509780883789, 8.187080383300781, 9.492650985717773, 10.798221588134766, 12.103792190551758, 13.40936279296875, 14.714933395385742, 16.020503997802734, 17.326074600219727, 18.63164520263672, 19.93721580505371, 21.242786407470703, 22.548357009887695, 23.853927612304688, 25.15949821472168, 26.465068817138672, 27.770639419555664, 29.076210021972656, 30.38178062438965, 31.68735122680664, 32.992919921875, 34.298492431640625, 35.60406494140625, 36.90963363647461, 38.21520233154297, 39.520774841308594, 40.82634735107422, 42.13191604614258]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 5.0, 6.0, 13.0, 7.0, 14.0, 18.0, 17.0, 21.0, 21.0, 19.0, 34.0, 30.0, 26.0, 48.0, 39.0, 38.0, 51.0, 61.0, 39.0, 39.0, 58.0, 40.0, 44.0, 37.0, 41.0, 37.0, 30.0, 31.0, 18.0, 21.0, 22.0, 13.0, 10.0, 11.0, 11.0, 8.0, 5.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.260009765625, -4.12548828125, -3.990966796875, -3.8564453125, -3.721923828125, -3.58740234375, -3.452880859375, -3.318359375, -3.183837890625, -3.04931640625, -2.914794921875, -2.7802734375, -2.645751953125, -2.51123046875, -2.376708984375, -2.2421875, -2.107666015625, -1.97314453125, -1.838623046875, -1.7041015625, -1.569580078125, -1.43505859375, -1.300537109375, -1.166015625, -1.031494140625, -0.89697265625, -0.762451171875, -0.6279296875, -0.493408203125, -0.35888671875, -0.224365234375, -0.08984375, 0.044677734375, 0.17919921875, 0.313720703125, 0.4482421875, 0.582763671875, 0.71728515625, 0.851806640625, 0.986328125, 1.120849609375, 1.25537109375, 1.389892578125, 1.5244140625, 1.658935546875, 1.79345703125, 1.927978515625, 2.0625, 2.197021484375, 2.33154296875, 2.466064453125, 2.6005859375, 2.735107421875, 2.86962890625, 3.004150390625, 3.138671875, 3.273193359375, 3.40771484375, 3.542236328125, 3.6767578125, 3.811279296875, 3.94580078125, 4.080322265625, 4.21484375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 6.0, 12.0, 13.0, 11.0, 20.0, 30.0, 40.0, 53.0, 86.0, 140.0, 179.0, 239.0, 397.0, 528.0, 740.0, 1073.0, 1662.0, 2321.0, 3690.0, 5372.0, 8074.0, 12768.0, 20133.0, 31849.0, 51988.0, 87530.0, 159905.0, 267367.0, 161531.0, 88306.0, 52637.0, 32099.0, 20016.0, 12765.0, 8359.0, 5351.0, 3647.0, 2311.0, 1662.0, 1100.0, 795.0, 552.0, 352.0, 257.0, 168.0, 136.0, 83.0, 52.0, 55.0, 41.0, 24.0, 12.0, 15.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.65576171875, -0.63494873046875, -0.6141357421875, -0.59332275390625, -0.572509765625, -0.55169677734375, -0.5308837890625, -0.51007080078125, -0.4892578125, -0.46844482421875, -0.4476318359375, -0.42681884765625, -0.406005859375, -0.38519287109375, -0.3643798828125, -0.34356689453125, -0.32275390625, -0.30194091796875, -0.2811279296875, -0.26031494140625, -0.239501953125, -0.21868896484375, -0.1978759765625, -0.17706298828125, -0.15625, -0.13543701171875, -0.1146240234375, -0.09381103515625, -0.072998046875, -0.05218505859375, -0.0313720703125, -0.01055908203125, 0.01025390625, 0.03106689453125, 0.0518798828125, 0.07269287109375, 0.093505859375, 0.11431884765625, 0.1351318359375, 0.15594482421875, 0.1767578125, 0.19757080078125, 0.2183837890625, 0.23919677734375, 0.260009765625, 0.28082275390625, 0.3016357421875, 0.32244873046875, 0.34326171875, 0.36407470703125, 0.3848876953125, 0.40570068359375, 0.426513671875, 0.44732666015625, 0.4681396484375, 0.48895263671875, 0.509765625, 0.53057861328125, 0.5513916015625, 0.57220458984375, 0.593017578125, 0.61383056640625, 0.6346435546875, 0.65545654296875, 0.67626953125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 9.0, 2.0, 6.0, 8.0, 7.0, 10.0, 8.0, 13.0, 6.0, 21.0, 21.0, 24.0, 33.0, 22.0, 26.0, 35.0, 35.0, 39.0, 33.0, 39.0, 36.0, 42.0, 1065.0, 43.0, 35.0, 38.0, 31.0, 40.0, 27.0, 41.0, 32.0, 20.0, 27.0, 16.0, 21.0, 18.0, 19.0, 10.0, 6.0, 13.0, 9.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.310546875, -2.239654541015625, -2.16876220703125, -2.097869873046875, -2.0269775390625, -1.956085205078125, -1.88519287109375, -1.814300537109375, -1.743408203125, -1.672515869140625, -1.60162353515625, -1.530731201171875, -1.4598388671875, -1.388946533203125, -1.31805419921875, -1.247161865234375, -1.17626953125, -1.105377197265625, -1.03448486328125, -0.963592529296875, -0.8927001953125, -0.821807861328125, -0.75091552734375, -0.680023193359375, -0.609130859375, -0.538238525390625, -0.46734619140625, -0.396453857421875, -0.3255615234375, -0.254669189453125, -0.18377685546875, -0.112884521484375, -0.0419921875, 0.028900146484375, 0.09979248046875, 0.170684814453125, 0.2415771484375, 0.312469482421875, 0.38336181640625, 0.454254150390625, 0.525146484375, 0.596038818359375, 0.66693115234375, 0.737823486328125, 0.8087158203125, 0.879608154296875, 0.95050048828125, 1.021392822265625, 1.09228515625, 1.163177490234375, 1.23406982421875, 1.304962158203125, 1.3758544921875, 1.446746826171875, 1.51763916015625, 1.588531494140625, 1.659423828125, 1.730316162109375, 1.80120849609375, 1.872100830078125, 1.9429931640625, 2.013885498046875, 2.08477783203125, 2.155670166015625, 2.2265625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 12.0, 10.0, 6.0, 15.0, 26.0, 41.0, 53.0, 51.0, 77.0, 122.0, 141.0, 194.0, 252.0, 352.0, 548.0, 804.0, 1135.0, 1577.0, 2130.0, 3282.0, 4800.0, 7059.0, 10416.0, 15803.0, 24657.0, 39918.0, 66745.0, 121156.0, 1286974.0, 224085.0, 113427.0, 62937.0, 37638.0, 23513.0, 15081.0, 10039.0, 6728.0, 4596.0, 3159.0, 2217.0, 1575.0, 1092.0, 722.0, 543.0, 406.0, 267.0, 216.0, 152.0, 107.0, 82.0, 79.0, 41.0, 23.0, 27.0, 12.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0], "bins": [-0.61328125, -0.594085693359375, -0.57489013671875, -0.555694580078125, -0.5364990234375, -0.517303466796875, -0.49810791015625, -0.478912353515625, -0.459716796875, -0.440521240234375, -0.42132568359375, -0.402130126953125, -0.3829345703125, -0.363739013671875, -0.34454345703125, -0.325347900390625, -0.30615234375, -0.286956787109375, -0.26776123046875, -0.248565673828125, -0.2293701171875, -0.210174560546875, -0.19097900390625, -0.171783447265625, -0.152587890625, -0.133392333984375, -0.11419677734375, -0.095001220703125, -0.0758056640625, -0.056610107421875, -0.03741455078125, -0.018218994140625, 0.0009765625, 0.020172119140625, 0.03936767578125, 0.058563232421875, 0.0777587890625, 0.096954345703125, 0.11614990234375, 0.135345458984375, 0.154541015625, 0.173736572265625, 0.19293212890625, 0.212127685546875, 0.2313232421875, 0.250518798828125, 0.26971435546875, 0.288909912109375, 0.30810546875, 0.327301025390625, 0.34649658203125, 0.365692138671875, 0.3848876953125, 0.404083251953125, 0.42327880859375, 0.442474365234375, 0.461669921875, 0.480865478515625, 0.50006103515625, 0.519256591796875, 0.5384521484375, 0.557647705078125, 0.57684326171875, 0.596038818359375, 0.615234375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 6.0, 6.0, 5.0, 5.0, 17.0, 10.0, 16.0, 20.0, 26.0, 26.0, 42.0, 37.0, 48.0, 40.0, 47.0, 62.0, 63.0, 62.0, 52.0, 35.0, 49.0, 42.0, 36.0, 44.0, 30.0, 42.0, 18.0, 22.0, 17.0, 11.0, 8.0, 11.0, 3.0, 7.0, 2.0, 5.0, 8.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005731582641601562, -0.0005535483360290527, -0.0005339384078979492, -0.0005143284797668457, -0.0004947185516357422, -0.00047510862350463867, -0.00045549869537353516, -0.00043588876724243164, -0.0004162788391113281, -0.0003966689109802246, -0.0003770589828491211, -0.0003574490547180176, -0.00033783912658691406, -0.00031822919845581055, -0.00029861927032470703, -0.0002790093421936035, -0.0002593994140625, -0.00023978948593139648, -0.00022017955780029297, -0.00020056962966918945, -0.00018095970153808594, -0.00016134977340698242, -0.0001417398452758789, -0.0001221299171447754, -0.00010251998901367188, -8.291006088256836e-05, -6.330013275146484e-05, -4.369020462036133e-05, -2.4080276489257812e-05, -4.470348358154297e-06, 1.5139579772949219e-05, 3.4749507904052734e-05, 5.435943603515625e-05, 7.396936416625977e-05, 9.357929229736328e-05, 0.0001131892204284668, 0.0001327991485595703, 0.00015240907669067383, 0.00017201900482177734, 0.00019162893295288086, 0.00021123886108398438, 0.0002308487892150879, 0.0002504587173461914, 0.0002700686454772949, 0.00028967857360839844, 0.00030928850173950195, 0.00032889842987060547, 0.000348508358001709, 0.0003681182861328125, 0.000387728214263916, 0.00040733814239501953, 0.00042694807052612305, 0.00044655799865722656, 0.0004661679267883301, 0.0004857778549194336, 0.0005053877830505371, 0.0005249977111816406, 0.0005446076393127441, 0.0005642175674438477, 0.0005838274955749512, 0.0006034374237060547, 0.0006230473518371582, 0.0006426572799682617, 0.0006622672080993652, 0.0006818771362304688]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 5.0, 13.0, 8.0, 10.0, 26.0, 28.0, 42.0, 50.0, 68.0, 98.0, 141.0, 229.0, 322.0, 784.0, 48709.0, 993817.0, 2773.0, 505.0, 256.0, 195.0, 117.0, 90.0, 60.0, 46.0, 32.0, 25.0, 18.0, 14.0, 13.0, 15.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0171051025390625, -0.016646265983581543, -0.016187429428100586, -0.01572859287261963, -0.015269756317138672, -0.014810919761657715, -0.014352083206176758, -0.0138932466506958, -0.013434410095214844, -0.012975573539733887, -0.01251673698425293, -0.012057900428771973, -0.011599063873291016, -0.011140227317810059, -0.010681390762329102, -0.010222554206848145, -0.009763717651367188, -0.00930488109588623, -0.008846044540405273, -0.008387207984924316, -0.00792837142944336, -0.007469534873962402, -0.007010698318481445, -0.006551861763000488, -0.006093025207519531, -0.005634188652038574, -0.005175352096557617, -0.00471651554107666, -0.004257678985595703, -0.003798842430114746, -0.003340005874633789, -0.002881169319152832, -0.002422332763671875, -0.001963496208190918, -0.001504659652709961, -0.001045823097229004, -0.0005869865417480469, -0.00012814998626708984, 0.0003306865692138672, 0.0007895231246948242, 0.0012483596801757812, 0.0017071962356567383, 0.0021660327911376953, 0.0026248693466186523, 0.0030837059020996094, 0.0035425424575805664, 0.0040013790130615234, 0.0044602155685424805, 0.0049190521240234375, 0.0053778886795043945, 0.0058367252349853516, 0.006295561790466309, 0.006754398345947266, 0.007213234901428223, 0.00767207145690918, 0.008130908012390137, 0.008589744567871094, 0.00904858112335205, 0.009507417678833008, 0.009966254234313965, 0.010425090789794922, 0.010883927345275879, 0.011342763900756836, 0.011801600456237793, 0.01226043701171875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 45.0, 117.0, 264.0, 302.0, 180.0, 69.0, 14.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004487147962208837, -0.0004120715311728418, -0.0003754282952286303, -0.00033878503018058836, -0.0003021417651325464, -0.00026549852918833494, -0.000228855264140293, -0.00019221202819608152, -0.00015556876314803958, -0.00011892551265191287, -8.228225487982854e-05, -4.563899710774422e-05, -8.995746611617506e-06, 2.7647503884509206e-05, 6.429076893255115e-05, 0.00010093400487676263, 0.00013757726992480457, 0.00017422052042093128, 0.000210863770917058, 0.00024750703596509993, 0.00028415030101314187, 0.00032079353695735335, 0.0003574368020053953, 0.0003940800379496068, 0.0004307233029976487, 0.00046736656804569066, 0.0005040098330937326, 0.0005406530690379441, 0.0005772963049821556, 0.000613939599134028, 0.0006505828350782394, 0.0006872260710224509, 0.0007238693069666624, 0.0007605125429108739, 0.0007971558370627463, 0.0008337990730069578, 0.0008704423089511693, 0.0009070856031030416, 0.0009437288390472531, 0.0009803720749914646, 0.001017015310935676, 0.0010536585468798876, 0.001090301782824099, 0.0011269450187683105, 0.0011635883711278439, 0.0012002316070720553, 0.0012368748430162668, 0.0012735180789604783, 0.0013101613149046898, 0.0013468045508489013, 0.0013834477867931128, 0.001420091139152646, 0.0014567343750968575, 0.001493377611041069, 0.0015300208469852805, 0.001566664082929492, 0.0016033074352890253, 0.0016399506712332368, 0.0016765939071774483, 0.0017132372595369816, 0.001749880495481193, 0.0017865237314254045, 0.001823166967369616, 0.0018598102033138275, 0.001896453439258039]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 13.0, 7.0, 12.0, 10.0, 17.0, 21.0, 14.0, 24.0, 22.0, 18.0, 26.0, 28.0, 50.0, 43.0, 41.0, 32.0, 34.0, 33.0, 43.0, 53.0, 38.0, 35.0, 43.0, 33.0, 44.0, 37.0, 18.0, 29.0, 22.0, 26.0, 21.0, 15.0, 17.0, 15.0, 12.0, 9.0, 6.0, 8.0, 8.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00034630298614501953, -0.0003356989473104477, -0.00032509490847587585, -0.000314490869641304, -0.0003038868308067322, -0.00029328279197216034, -0.0002826787531375885, -0.00027207471430301666, -0.0002614706754684448, -0.000250866636633873, -0.00024026259779930115, -0.0002296585589647293, -0.00021905452013015747, -0.00020845048129558563, -0.0001978464424610138, -0.00018724240362644196, -0.00017663836479187012, -0.00016603432595729828, -0.00015543028712272644, -0.0001448262482881546, -0.00013422220945358276, -0.00012361817061901093, -0.00011301413178443909, -0.00010241009294986725, -9.180605411529541e-05, -8.120201528072357e-05, -7.059797644615173e-05, -5.9993937611579895e-05, -4.938989877700806e-05, -3.878585994243622e-05, -2.818182110786438e-05, -1.757778227329254e-05, -6.973743438720703e-06, 3.6302953958511353e-06, 1.4234334230422974e-05, 2.4838373064994812e-05, 3.544241189956665e-05, 4.604645073413849e-05, 5.665048956871033e-05, 6.725452840328217e-05, 7.7858567237854e-05, 8.846260607242584e-05, 9.906664490699768e-05, 0.00010967068374156952, 0.00012027472257614136, 0.0001308787614107132, 0.00014148280024528503, 0.00015208683907985687, 0.0001626908779144287, 0.00017329491674900055, 0.0001838989555835724, 0.00019450299441814423, 0.00020510703325271606, 0.0002157110720872879, 0.00022631511092185974, 0.00023691914975643158, 0.0002475231885910034, 0.00025812722742557526, 0.0002687312662601471, 0.00027933530509471893, 0.00028993934392929077, 0.0003005433827638626, 0.00031114742159843445, 0.0003217514604330063, 0.0003323554992675781]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 5.0, 6.0, 13.0, 7.0, 14.0, 18.0, 17.0, 21.0, 21.0, 19.0, 34.0, 30.0, 26.0, 48.0, 39.0, 38.0, 51.0, 61.0, 39.0, 39.0, 58.0, 40.0, 43.0, 38.0, 41.0, 37.0, 30.0, 31.0, 18.0, 21.0, 22.0, 13.0, 10.0, 11.0, 11.0, 8.0, 5.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.260009765625, -4.12548828125, -3.990966796875, -3.8564453125, -3.721923828125, -3.58740234375, -3.452880859375, -3.318359375, -3.183837890625, -3.04931640625, -2.914794921875, -2.7802734375, -2.645751953125, -2.51123046875, -2.376708984375, -2.2421875, -2.107666015625, -1.97314453125, -1.838623046875, -1.7041015625, -1.569580078125, -1.43505859375, -1.300537109375, -1.166015625, -1.031494140625, -0.89697265625, -0.762451171875, -0.6279296875, -0.493408203125, -0.35888671875, -0.224365234375, -0.08984375, 0.044677734375, 0.17919921875, 0.313720703125, 0.4482421875, 0.582763671875, 0.71728515625, 0.851806640625, 0.986328125, 1.120849609375, 1.25537109375, 1.389892578125, 1.5244140625, 1.658935546875, 1.79345703125, 1.927978515625, 2.0625, 2.197021484375, 2.33154296875, 2.466064453125, 2.6005859375, 2.735107421875, 2.86962890625, 3.004150390625, 3.138671875, 3.273193359375, 3.40771484375, 3.542236328125, 3.6767578125, 3.811279296875, 3.94580078125, 4.080322265625, 4.21484375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 7.0, 6.0, 14.0, 18.0, 18.0, 23.0, 37.0, 64.0, 85.0, 87.0, 148.0, 246.0, 330.0, 548.0, 916.0, 1572.0, 3210.0, 7417.0, 19190.0, 66203.0, 297208.0, 472643.0, 125747.0, 32002.0, 11133.0, 4562.0, 2022.0, 1099.0, 677.0, 408.0, 276.0, 198.0, 121.0, 86.0, 60.0, 44.0, 31.0, 17.0, 24.0, 18.0, 10.0, 7.0, 7.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.76531982421875, -4.6126708984375, -4.46002197265625, -4.307373046875, -4.15472412109375, -4.0020751953125, -3.84942626953125, -3.69677734375, -3.54412841796875, -3.3914794921875, -3.23883056640625, -3.086181640625, -2.93353271484375, -2.7808837890625, -2.62823486328125, -2.4755859375, -2.32293701171875, -2.1702880859375, -2.01763916015625, -1.864990234375, -1.71234130859375, -1.5596923828125, -1.40704345703125, -1.25439453125, -1.10174560546875, -0.9490966796875, -0.79644775390625, -0.643798828125, -0.49114990234375, -0.3385009765625, -0.18585205078125, -0.033203125, 0.11944580078125, 0.2720947265625, 0.42474365234375, 0.577392578125, 0.73004150390625, 0.8826904296875, 1.03533935546875, 1.18798828125, 1.34063720703125, 1.4932861328125, 1.64593505859375, 1.798583984375, 1.95123291015625, 2.1038818359375, 2.25653076171875, 2.4091796875, 2.56182861328125, 2.7144775390625, 2.86712646484375, 3.019775390625, 3.17242431640625, 3.3250732421875, 3.47772216796875, 3.63037109375, 3.78302001953125, 3.9356689453125, 4.08831787109375, 4.240966796875, 4.39361572265625, 4.5462646484375, 4.69891357421875, 4.8515625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 4.0, 12.0, 7.0, 15.0, 19.0, 20.0, 20.0, 28.0, 26.0, 34.0, 44.0, 51.0, 60.0, 84.0, 147.0, 1750.0, 255.0, 78.0, 57.0, 50.0, 53.0, 43.0, 28.0, 29.0, 23.0, 23.0, 23.0, 19.0, 13.0, 9.0, 10.0, 12.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.28125, -18.72509765625, -18.1689453125, -17.61279296875, -17.056640625, -16.50048828125, -15.9443359375, -15.38818359375, -14.83203125, -14.27587890625, -13.7197265625, -13.16357421875, -12.607421875, -12.05126953125, -11.4951171875, -10.93896484375, -10.3828125, -9.82666015625, -9.2705078125, -8.71435546875, -8.158203125, -7.60205078125, -7.0458984375, -6.48974609375, -5.93359375, -5.37744140625, -4.8212890625, -4.26513671875, -3.708984375, -3.15283203125, -2.5966796875, -2.04052734375, -1.484375, -0.92822265625, -0.3720703125, 0.18408203125, 0.740234375, 1.29638671875, 1.8525390625, 2.40869140625, 2.96484375, 3.52099609375, 4.0771484375, 4.63330078125, 5.189453125, 5.74560546875, 6.3017578125, 6.85791015625, 7.4140625, 7.97021484375, 8.5263671875, 9.08251953125, 9.638671875, 10.19482421875, 10.7509765625, 11.30712890625, 11.86328125, 12.41943359375, 12.9755859375, 13.53173828125, 14.087890625, 14.64404296875, 15.2001953125, 15.75634765625, 16.3125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 11.0, 10.0, 15.0, 12.0, 18.0, 30.0, 20.0, 38.0, 32.0, 63.0, 84.0, 112.0, 216.0, 508.0, 1619.0, 19757.0, 3011601.0, 106662.0, 3446.0, 680.0, 278.0, 144.0, 79.0, 68.0, 38.0, 34.0, 14.0, 30.0, 17.0, 17.0, 11.0, 12.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.984375, -22.154296875, -21.32421875, -20.494140625, -19.6640625, -18.833984375, -18.00390625, -17.173828125, -16.34375, -15.513671875, -14.68359375, -13.853515625, -13.0234375, -12.193359375, -11.36328125, -10.533203125, -9.703125, -8.873046875, -8.04296875, -7.212890625, -6.3828125, -5.552734375, -4.72265625, -3.892578125, -3.0625, -2.232421875, -1.40234375, -0.572265625, 0.2578125, 1.087890625, 1.91796875, 2.748046875, 3.578125, 4.408203125, 5.23828125, 6.068359375, 6.8984375, 7.728515625, 8.55859375, 9.388671875, 10.21875, 11.048828125, 11.87890625, 12.708984375, 13.5390625, 14.369140625, 15.19921875, 16.029296875, 16.859375, 17.689453125, 18.51953125, 19.349609375, 20.1796875, 21.009765625, 21.83984375, 22.669921875, 23.5, 24.330078125, 25.16015625, 25.990234375, 26.8203125, 27.650390625, 28.48046875, 29.310546875, 30.140625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 39.0, 667.0, 306.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.59774780273438, -166.70021057128906, -162.8026580810547, -158.90512084960938, -155.007568359375, -151.1100311279297, -147.21249389648438, -143.31494140625, -139.4174041748047, -135.51986694335938, -131.622314453125, -127.72477722167969, -123.82723236083984, -119.9296875, -116.03215026855469, -112.13460540771484, -108.237060546875, -104.33951568603516, -100.44197082519531, -96.54443359375, -92.64688873291016, -88.74934387207031, -84.851806640625, -80.95426177978516, -77.05671691894531, -73.15917205810547, -69.26162719726562, -65.36408996582031, -61.46654510498047, -57.569000244140625, -53.67145919799805, -49.77391815185547, -45.876365661621094, -41.97882080078125, -38.08127975463867, -34.183738708496094, -30.28619384765625, -26.38865089416504, -22.491107940673828, -18.593564987182617, -14.696022033691406, -10.798479080200195, -6.900936126708984, -3.0033931732177734, 0.8941497802734375, 4.791692733764648, 8.68923568725586, 12.58677864074707, 16.48432159423828, 20.381864547729492, 24.279407501220703, 28.176950454711914, 32.074493408203125, 35.97203826904297, 39.86957931518555, 43.767120361328125, 47.66466522216797, 51.56221008300781, 55.45975112915039, 59.35729217529297, 63.25483703613281, 67.15238189697266, 71.0499267578125, 74.94746398925781, 78.84500885009766]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 5.0, 11.0, 18.0, 14.0, 14.0, 27.0, 21.0, 16.0, 33.0, 30.0, 42.0, 40.0, 35.0, 27.0, 43.0, 50.0, 49.0, 45.0, 41.0, 40.0, 44.0, 41.0, 36.0, 32.0, 19.0, 34.0, 18.0, 31.0, 18.0, 18.0, 16.0, 12.0, 11.0, 10.0, 8.0, 6.0, 7.0, 10.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.91804504394531, -43.481300354003906, -42.0445556640625, -40.607810974121094, -39.17106628417969, -37.73432159423828, -36.297576904296875, -34.8608283996582, -33.4240837097168, -31.98733901977539, -30.550594329833984, -29.113849639892578, -27.67710304260254, -26.240358352661133, -24.803613662719727, -23.366867065429688, -21.930124282836914, -20.493379592895508, -19.0566349029541, -17.619888305664062, -16.183143615722656, -14.74639892578125, -13.309654235839844, -11.872908592224121, -10.436163902282715, -8.999419212341309, -7.562673568725586, -6.12592887878418, -4.689183712005615, -3.252438545227051, -1.8156938552856445, -0.3789482116699219, 1.0577964782714844, 2.494541645050049, 3.931286573410034, 5.3680315017700195, 6.804776668548584, 8.241521835327148, 9.678266525268555, 11.115012168884277, 12.551756858825684, 13.98850154876709, 15.425247192382812, 16.86199188232422, 18.298736572265625, 19.73548126220703, 21.172225952148438, 22.608972549438477, 24.045717239379883, 25.48246192932129, 26.919206619262695, 28.355953216552734, 29.79269790649414, 31.229442596435547, 32.66618728637695, 34.10293197631836, 35.539676666259766, 36.97642135620117, 38.41316604614258, 39.849910736083984, 41.28665542602539, 42.72340393066406, 44.16014862060547, 45.596893310546875, 47.03363800048828]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 8.0, 12.0, 9.0, 10.0, 23.0, 19.0, 14.0, 33.0, 26.0, 20.0, 34.0, 38.0, 52.0, 31.0, 55.0, 44.0, 51.0, 54.0, 50.0, 39.0, 44.0, 37.0, 34.0, 46.0, 32.0, 26.0, 25.0, 17.0, 23.0, 18.0, 6.0, 16.0, 7.0, 11.0, 6.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.2071533203125, -4.066650390625, -3.9261474609375, -3.78564453125, -3.6451416015625, -3.504638671875, -3.3641357421875, -3.2236328125, -3.0831298828125, -2.942626953125, -2.8021240234375, -2.66162109375, -2.5211181640625, -2.380615234375, -2.2401123046875, -2.099609375, -1.9591064453125, -1.818603515625, -1.6781005859375, -1.53759765625, -1.3970947265625, -1.256591796875, -1.1160888671875, -0.9755859375, -0.8350830078125, -0.694580078125, -0.5540771484375, -0.41357421875, -0.2730712890625, -0.132568359375, 0.0079345703125, 0.1484375, 0.2889404296875, 0.429443359375, 0.5699462890625, 0.71044921875, 0.8509521484375, 0.991455078125, 1.1319580078125, 1.2724609375, 1.4129638671875, 1.553466796875, 1.6939697265625, 1.83447265625, 1.9749755859375, 2.115478515625, 2.2559814453125, 2.396484375, 2.5369873046875, 2.677490234375, 2.8179931640625, 2.95849609375, 3.0989990234375, 3.239501953125, 3.3800048828125, 3.5205078125, 3.6610107421875, 3.801513671875, 3.9420166015625, 4.08251953125, 4.2230224609375, 4.363525390625, 4.5040283203125, 4.64453125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 3.0, 9.0, 11.0, 13.0, 13.0, 20.0, 11.0, 16.0, 26.0, 53.0, 64.0, 116.0, 157.0, 360.0, 816.0, 2204.0, 7053.0, 28023.0, 150380.0, 940200.0, 2169895.0, 746740.0, 116278.0, 22547.0, 5909.0, 1868.0, 735.0, 292.0, 140.0, 78.0, 49.0, 37.0, 39.0, 23.0, 24.0, 19.0, 9.0, 4.0, 9.0, 6.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9765625, -7.7227783203125, -7.468994140625, -7.2152099609375, -6.96142578125, -6.7076416015625, -6.453857421875, -6.2000732421875, -5.9462890625, -5.6925048828125, -5.438720703125, -5.1849365234375, -4.93115234375, -4.6773681640625, -4.423583984375, -4.1697998046875, -3.916015625, -3.6622314453125, -3.408447265625, -3.1546630859375, -2.90087890625, -2.6470947265625, -2.393310546875, -2.1395263671875, -1.8857421875, -1.6319580078125, -1.378173828125, -1.1243896484375, -0.87060546875, -0.6168212890625, -0.363037109375, -0.1092529296875, 0.14453125, 0.3983154296875, 0.652099609375, 0.9058837890625, 1.15966796875, 1.4134521484375, 1.667236328125, 1.9210205078125, 2.1748046875, 2.4285888671875, 2.682373046875, 2.9361572265625, 3.18994140625, 3.4437255859375, 3.697509765625, 3.9512939453125, 4.205078125, 4.4588623046875, 4.712646484375, 4.9664306640625, 5.22021484375, 5.4739990234375, 5.727783203125, 5.9815673828125, 6.2353515625, 6.4891357421875, 6.742919921875, 6.9967041015625, 7.25048828125, 7.5042724609375, 7.758056640625, 8.0118408203125, 8.265625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 8.0, 15.0, 13.0, 20.0, 51.0, 65.0, 120.0, 165.0, 266.0, 356.0, 526.0, 593.0, 567.0, 410.0, 336.0, 187.0, 144.0, 84.0, 59.0, 37.0, 15.0, 18.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.234375, -13.756103515625, -13.27783203125, -12.799560546875, -12.3212890625, -11.843017578125, -11.36474609375, -10.886474609375, -10.408203125, -9.929931640625, -9.45166015625, -8.973388671875, -8.4951171875, -8.016845703125, -7.53857421875, -7.060302734375, -6.58203125, -6.103759765625, -5.62548828125, -5.147216796875, -4.6689453125, -4.190673828125, -3.71240234375, -3.234130859375, -2.755859375, -2.277587890625, -1.79931640625, -1.321044921875, -0.8427734375, -0.364501953125, 0.11376953125, 0.592041015625, 1.0703125, 1.548583984375, 2.02685546875, 2.505126953125, 2.9833984375, 3.461669921875, 3.93994140625, 4.418212890625, 4.896484375, 5.374755859375, 5.85302734375, 6.331298828125, 6.8095703125, 7.287841796875, 7.76611328125, 8.244384765625, 8.72265625, 9.200927734375, 9.67919921875, 10.157470703125, 10.6357421875, 11.114013671875, 11.59228515625, 12.070556640625, 12.548828125, 13.027099609375, 13.50537109375, 13.983642578125, 14.4619140625, 14.940185546875, 15.41845703125, 15.896728515625, 16.375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 8.0, 10.0, 21.0, 26.0, 40.0, 59.0, 120.0, 212.0, 487.0, 2019.0, 72222.0, 3976119.0, 139182.0, 2608.0, 576.0, 259.0, 110.0, 72.0, 57.0, 25.0, 12.0, 19.0, 8.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.625, -52.158203125, -50.69140625, -49.224609375, -47.7578125, -46.291015625, -44.82421875, -43.357421875, -41.890625, -40.423828125, -38.95703125, -37.490234375, -36.0234375, -34.556640625, -33.08984375, -31.623046875, -30.15625, -28.689453125, -27.22265625, -25.755859375, -24.2890625, -22.822265625, -21.35546875, -19.888671875, -18.421875, -16.955078125, -15.48828125, -14.021484375, -12.5546875, -11.087890625, -9.62109375, -8.154296875, -6.6875, -5.220703125, -3.75390625, -2.287109375, -0.8203125, 0.646484375, 2.11328125, 3.580078125, 5.046875, 6.513671875, 7.98046875, 9.447265625, 10.9140625, 12.380859375, 13.84765625, 15.314453125, 16.78125, 18.248046875, 19.71484375, 21.181640625, 22.6484375, 24.115234375, 25.58203125, 27.048828125, 28.515625, 29.982421875, 31.44921875, 32.916015625, 34.3828125, 35.849609375, 37.31640625, 38.783203125, 40.25]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 25.0, 136.0, 276.0, 333.0, 190.0, 47.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.8176727294922, -194.96788024902344, -190.11810302734375, -185.268310546875, -180.4185333251953, -175.56874084472656, -170.71896362304688, -165.86917114257812, -161.01937866210938, -156.16958618164062, -151.31980895996094, -146.4700164794922, -141.6202392578125, -136.77044677734375, -131.92066955566406, -127.07087707519531, -122.22109985351562, -117.3713150024414, -112.52153015136719, -107.67174530029297, -102.82196044921875, -97.97216796875, -93.12238311767578, -88.27259826660156, -83.42281341552734, -78.57302856445312, -73.7232437133789, -68.87345886230469, -64.02366638183594, -59.173885345458984, -54.3240966796875, -49.47431182861328, -44.62451934814453, -39.77473449707031, -34.924949645996094, -30.07516098022461, -25.22537612915039, -20.375591278076172, -15.52580451965332, -10.676017761230469, -5.82623291015625, -0.9764471054077148, 3.8733386993408203, 8.723124504089355, 13.57291030883789, 18.42269515991211, 23.27248191833496, 28.122268676757812, 32.97205352783203, 37.82183837890625, 42.67162322998047, 47.52141189575195, 52.37119674682617, 57.22098159790039, 62.070770263671875, 66.9205551147461, 71.77033996582031, 76.62012481689453, 81.46990966796875, 86.31969451904297, 91.16947937011719, 96.01927185058594, 100.86905670166016, 105.71884155273438, 110.5686264038086]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 1.0, 5.0, 6.0, 6.0, 14.0, 12.0, 12.0, 19.0, 17.0, 21.0, 19.0, 31.0, 36.0, 30.0, 48.0, 31.0, 34.0, 39.0, 50.0, 50.0, 41.0, 47.0, 42.0, 37.0, 27.0, 45.0, 34.0, 42.0, 33.0, 23.0, 25.0, 24.0, 13.0, 16.0, 11.0, 11.0, 13.0, 7.0, 7.0, 7.0, 3.0, 1.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.596866607666016, -37.36635208129883, -36.13583755493164, -34.90532302856445, -33.6748046875, -32.44429016113281, -31.213775634765625, -29.983261108398438, -28.75274658203125, -27.522232055664062, -26.291717529296875, -25.061201095581055, -23.830686569213867, -22.60017204284668, -21.36965560913086, -20.139141082763672, -18.908626556396484, -17.678112030029297, -16.44759750366211, -15.217081069946289, -13.986566543579102, -12.756052017211914, -11.52553653717041, -10.295021057128906, -9.064506530761719, -7.833991527557373, -6.603476524353027, -5.372961521148682, -4.142446517944336, -2.9119315147399902, -1.6814165115356445, -0.4509010314941406, 0.7796134948730469, 2.0101284980773926, 3.2406435012817383, 4.471158504486084, 5.70167350769043, 6.932188510894775, 8.162703514099121, 9.393218994140625, 10.623733520507812, 11.854248046875, 13.084763526916504, 14.315279006958008, 15.545793533325195, 16.776308059692383, 18.006824493408203, 19.23733901977539, 20.467853546142578, 21.698368072509766, 22.928882598876953, 24.159399032592773, 25.38991355895996, 26.62042808532715, 27.85094451904297, 29.081459045410156, 30.311973571777344, 31.54248809814453, 32.77300262451172, 34.003517150878906, 35.234031677246094, 36.46455001831055, 37.695064544677734, 38.92557907104492, 40.15609359741211]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 15.0, 11.0, 11.0, 12.0, 13.0, 19.0, 22.0, 31.0, 30.0, 27.0, 41.0, 31.0, 36.0, 48.0, 44.0, 56.0, 40.0, 43.0, 49.0, 48.0, 45.0, 36.0, 29.0, 40.0, 35.0, 21.0, 30.0, 20.0, 15.0, 16.0, 20.0, 9.0, 8.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.3885498046875, -4.249755859375, -4.1109619140625, -3.97216796875, -3.8333740234375, -3.694580078125, -3.5557861328125, -3.4169921875, -3.2781982421875, -3.139404296875, -3.0006103515625, -2.86181640625, -2.7230224609375, -2.584228515625, -2.4454345703125, -2.306640625, -2.1678466796875, -2.029052734375, -1.8902587890625, -1.75146484375, -1.6126708984375, -1.473876953125, -1.3350830078125, -1.1962890625, -1.0574951171875, -0.918701171875, -0.7799072265625, -0.64111328125, -0.5023193359375, -0.363525390625, -0.2247314453125, -0.0859375, 0.0528564453125, 0.191650390625, 0.3304443359375, 0.46923828125, 0.6080322265625, 0.746826171875, 0.8856201171875, 1.0244140625, 1.1632080078125, 1.302001953125, 1.4407958984375, 1.57958984375, 1.7183837890625, 1.857177734375, 1.9959716796875, 2.134765625, 2.2735595703125, 2.412353515625, 2.5511474609375, 2.68994140625, 2.8287353515625, 2.967529296875, 3.1063232421875, 3.2451171875, 3.3839111328125, 3.522705078125, 3.6614990234375, 3.80029296875, 3.9390869140625, 4.077880859375, 4.2166748046875, 4.35546875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 11.0, 15.0, 17.0, 25.0, 31.0, 55.0, 77.0, 101.0, 172.0, 222.0, 357.0, 449.0, 682.0, 966.0, 1342.0, 1944.0, 2771.0, 3979.0, 5896.0, 8884.0, 13148.0, 20479.0, 31892.0, 50750.0, 83655.0, 152756.0, 261514.0, 165777.0, 89258.0, 53420.0, 33345.0, 21375.0, 13971.0, 9249.0, 6161.0, 4180.0, 2898.0, 2069.0, 1461.0, 961.0, 674.0, 466.0, 344.0, 248.0, 153.0, 117.0, 75.0, 57.0, 35.0, 19.0, 24.0, 13.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0], "bins": [-0.68603515625, -0.6649627685546875, -0.643890380859375, -0.6228179931640625, -0.60174560546875, -0.5806732177734375, -0.559600830078125, -0.5385284423828125, -0.5174560546875, -0.4963836669921875, -0.475311279296875, -0.4542388916015625, -0.43316650390625, -0.4120941162109375, -0.391021728515625, -0.3699493408203125, -0.348876953125, -0.3278045654296875, -0.306732177734375, -0.2856597900390625, -0.26458740234375, -0.2435150146484375, -0.222442626953125, -0.2013702392578125, -0.1802978515625, -0.1592254638671875, -0.138153076171875, -0.1170806884765625, -0.09600830078125, -0.0749359130859375, -0.053863525390625, -0.0327911376953125, -0.01171875, 0.0093536376953125, 0.030426025390625, 0.0514984130859375, 0.07257080078125, 0.0936431884765625, 0.114715576171875, 0.1357879638671875, 0.1568603515625, 0.1779327392578125, 0.199005126953125, 0.2200775146484375, 0.24114990234375, 0.2622222900390625, 0.283294677734375, 0.3043670654296875, 0.325439453125, 0.3465118408203125, 0.367584228515625, 0.3886566162109375, 0.40972900390625, 0.4308013916015625, 0.451873779296875, 0.4729461669921875, 0.4940185546875, 0.5150909423828125, 0.536163330078125, 0.5572357177734375, 0.57830810546875, 0.5993804931640625, 0.620452880859375, 0.6415252685546875, 0.66259765625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 6.0, 1.0, 4.0, 7.0, 5.0, 4.0, 12.0, 12.0, 5.0, 12.0, 8.0, 22.0, 15.0, 17.0, 29.0, 20.0, 34.0, 33.0, 41.0, 34.0, 36.0, 42.0, 36.0, 36.0, 36.0, 1055.0, 43.0, 35.0, 32.0, 41.0, 38.0, 28.0, 33.0, 26.0, 29.0, 21.0, 10.0, 23.0, 12.0, 18.0, 19.0, 4.0, 9.0, 11.0, 12.0, 4.0, 7.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-2.4140625, -2.34368896484375, -2.2733154296875, -2.20294189453125, -2.132568359375, -2.06219482421875, -1.9918212890625, -1.92144775390625, -1.85107421875, -1.78070068359375, -1.7103271484375, -1.63995361328125, -1.569580078125, -1.49920654296875, -1.4288330078125, -1.35845947265625, -1.2880859375, -1.21771240234375, -1.1473388671875, -1.07696533203125, -1.006591796875, -0.93621826171875, -0.8658447265625, -0.79547119140625, -0.72509765625, -0.65472412109375, -0.5843505859375, -0.51397705078125, -0.443603515625, -0.37322998046875, -0.3028564453125, -0.23248291015625, -0.162109375, -0.09173583984375, -0.0213623046875, 0.04901123046875, 0.119384765625, 0.18975830078125, 0.2601318359375, 0.33050537109375, 0.40087890625, 0.47125244140625, 0.5416259765625, 0.61199951171875, 0.682373046875, 0.75274658203125, 0.8231201171875, 0.89349365234375, 0.9638671875, 1.03424072265625, 1.1046142578125, 1.17498779296875, 1.245361328125, 1.31573486328125, 1.3861083984375, 1.45648193359375, 1.52685546875, 1.59722900390625, 1.6676025390625, 1.73797607421875, 1.808349609375, 1.87872314453125, 1.9490966796875, 2.01947021484375, 2.08984375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 4.0, 8.0, 11.0, 15.0, 23.0, 42.0, 61.0, 76.0, 108.0, 135.0, 197.0, 312.0, 408.0, 627.0, 907.0, 1315.0, 2076.0, 3131.0, 4688.0, 7144.0, 11218.0, 17549.0, 27913.0, 47361.0, 84362.0, 159364.0, 1323471.0, 177516.0, 92408.0, 51186.0, 29930.0, 18976.0, 11729.0, 7625.0, 5211.0, 3297.0, 2192.0, 1418.0, 970.0, 673.0, 447.0, 333.0, 230.0, 154.0, 101.0, 74.0, 49.0, 25.0, 28.0, 7.0, 15.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.61767578125, -0.5967941284179688, -0.5759124755859375, -0.5550308227539062, -0.534149169921875, -0.5132675170898438, -0.4923858642578125, -0.47150421142578125, -0.45062255859375, -0.42974090576171875, -0.4088592529296875, -0.38797760009765625, -0.367095947265625, -0.34621429443359375, -0.3253326416015625, -0.30445098876953125, -0.2835693359375, -0.26268768310546875, -0.2418060302734375, -0.22092437744140625, -0.200042724609375, -0.17916107177734375, -0.1582794189453125, -0.13739776611328125, -0.11651611328125, -0.09563446044921875, -0.0747528076171875, -0.05387115478515625, -0.032989501953125, -0.01210784912109375, 0.0087738037109375, 0.02965545654296875, 0.050537109375, 0.07141876220703125, 0.0923004150390625, 0.11318206787109375, 0.134063720703125, 0.15494537353515625, 0.1758270263671875, 0.19670867919921875, 0.21759033203125, 0.23847198486328125, 0.2593536376953125, 0.28023529052734375, 0.301116943359375, 0.32199859619140625, 0.3428802490234375, 0.36376190185546875, 0.3846435546875, 0.40552520751953125, 0.4264068603515625, 0.44728851318359375, 0.468170166015625, 0.48905181884765625, 0.5099334716796875, 0.5308151245117188, 0.55169677734375, 0.5725784301757812, 0.5934600830078125, 0.6143417358398438, 0.635223388671875, 0.6561050415039062, 0.6769866943359375, 0.6978683471679688, 0.71875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 7.0, 4.0, 11.0, 18.0, 18.0, 18.0, 29.0, 22.0, 36.0, 26.0, 38.0, 38.0, 51.0, 54.0, 70.0, 57.0, 59.0, 57.0, 62.0, 61.0, 50.0, 33.0, 32.0, 25.0, 20.0, 15.0, 19.0, 11.0, 12.0, 10.0, 7.0, 4.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0], "bins": [-0.0009784698486328125, -0.0009520649909973145, -0.0009256601333618164, -0.0008992552757263184, -0.0008728504180908203, -0.0008464455604553223, -0.0008200407028198242, -0.0007936358451843262, -0.0007672309875488281, -0.0007408261299133301, -0.000714421272277832, -0.000688016414642334, -0.0006616115570068359, -0.0006352066993713379, -0.0006088018417358398, -0.0005823969841003418, -0.0005559921264648438, -0.0005295872688293457, -0.0005031824111938477, -0.0004767775535583496, -0.00045037269592285156, -0.0004239678382873535, -0.00039756298065185547, -0.0003711581230163574, -0.0003447532653808594, -0.00031834840774536133, -0.0002919435501098633, -0.00026553869247436523, -0.0002391338348388672, -0.00021272897720336914, -0.0001863241195678711, -0.00015991926193237305, -0.000133514404296875, -0.00010710954666137695, -8.07046890258789e-05, -5.429983139038086e-05, -2.7894973754882812e-05, -1.4901161193847656e-06, 2.491474151611328e-05, 5.131959915161133e-05, 7.772445678710938e-05, 0.00010412931442260742, 0.00013053417205810547, 0.00015693902969360352, 0.00018334388732910156, 0.0002097487449645996, 0.00023615360260009766, 0.0002625584602355957, 0.00028896331787109375, 0.0003153681755065918, 0.00034177303314208984, 0.0003681778907775879, 0.00039458274841308594, 0.000420987606048584, 0.00044739246368408203, 0.0004737973213195801, 0.0005002021789550781, 0.0005266070365905762, 0.0005530118942260742, 0.0005794167518615723, 0.0006058216094970703, 0.0006322264671325684, 0.0006586313247680664, 0.0006850361824035645, 0.0007114410400390625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 8.0, 5.0, 13.0, 12.0, 15.0, 20.0, 30.0, 40.0, 50.0, 67.0, 98.0, 155.0, 210.0, 339.0, 585.0, 6858.0, 1023200.0, 15065.0, 699.0, 337.0, 207.0, 124.0, 95.0, 78.0, 42.0, 45.0, 30.0, 29.0, 18.0, 21.0, 16.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015625, -0.015096426010131836, -0.014567852020263672, -0.014039278030395508, -0.013510704040527344, -0.01298213005065918, -0.012453556060791016, -0.011924982070922852, -0.011396408081054688, -0.010867834091186523, -0.01033926010131836, -0.009810686111450195, -0.009282112121582031, -0.008753538131713867, -0.008224964141845703, -0.007696390151977539, -0.007167816162109375, -0.006639242172241211, -0.006110668182373047, -0.005582094192504883, -0.005053520202636719, -0.004524946212768555, -0.003996372222900391, -0.0034677982330322266, -0.0029392242431640625, -0.0024106502532958984, -0.0018820762634277344, -0.0013535022735595703, -0.0008249282836914062, -0.0002963542938232422, 0.00023221969604492188, 0.0007607936859130859, 0.00128936767578125, 0.001817941665649414, 0.002346515655517578, 0.002875089645385742, 0.0034036636352539062, 0.00393223762512207, 0.004460811614990234, 0.0049893856048583984, 0.0055179595947265625, 0.0060465335845947266, 0.006575107574462891, 0.007103681564331055, 0.007632255554199219, 0.008160829544067383, 0.008689403533935547, 0.009217977523803711, 0.009746551513671875, 0.010275125503540039, 0.010803699493408203, 0.011332273483276367, 0.011860847473144531, 0.012389421463012695, 0.01291799545288086, 0.013446569442749023, 0.013975143432617188, 0.014503717422485352, 0.015032291412353516, 0.01556086540222168, 0.016089439392089844, 0.016618013381958008, 0.017146587371826172, 0.017675161361694336, 0.0182037353515625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 46.0, 427.0, 464.0, 72.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004102547187358141, -0.004011508077383041, -0.003920468967407942, -0.0038294296246021986, -0.003738390514627099, -0.0036473514046519995, -0.0035563122946769, -0.0034652729518711567, -0.003374233841896057, -0.0032831947319209576, -0.003192155621945858, -0.003101116279140115, -0.0030100771691650152, -0.0029190380591899157, -0.002827998949214816, -0.002736959606409073, -0.0026459204964339733, -0.0025548813864588737, -0.002463842276483774, -0.002372802933678031, -0.0022817638237029314, -0.002190724713727832, -0.0020996856037527323, -0.002008646260946989, -0.0019176073838025331, -0.0018265682738274336, -0.0017355290474370122, -0.0016444899374619126, -0.0015534507110714912, -0.0014624116010963917, -0.0013713724911212921, -0.0012803332647308707, -0.0011892941547557712, -0.0010982550447806716, -0.0010072158183902502, -0.0009161767084151506, -0.0008251374820247293, -0.0007340983720496297, -0.0006430592038668692, -0.0005520200356841087, -0.00046098086750134826, -0.0003699416993185878, -0.0002789025311358273, -0.00018786339205689728, -9.68242238741368e-05, -5.7850556913763285e-06, 8.525408338755369e-05, 0.00017629325157031417, 0.00026733241975307465, 0.0003583715879358351, 0.0004494107561185956, 0.0005404498660936952, 0.0006314890924841166, 0.0007225282024592161, 0.0008135673706419766, 0.0009046065388247371, 0.0009956457652151585, 0.001086684875190258, 0.0011777241015806794, 0.001268763211555779, 0.0013598024379462004, 0.0014508415479213, 0.0015418806578963995, 0.0016329198842868209, 0.0017239589942619205]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 7.0, 7.0, 5.0, 8.0, 12.0, 12.0, 17.0, 14.0, 16.0, 21.0, 23.0, 19.0, 24.0, 24.0, 29.0, 30.0, 28.0, 33.0, 34.0, 43.0, 34.0, 41.0, 42.0, 38.0, 43.0, 35.0, 34.0, 26.0, 31.0, 35.0, 25.0, 21.0, 20.0, 34.0, 18.0, 14.0, 16.0, 15.0, 10.0, 11.0, 8.0, 11.0, 7.0, 8.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0], "bins": [-0.00044333934783935547, -0.0004308093339204788, -0.00041827932000160217, -0.0004057493060827255, -0.0003932192921638489, -0.00038068927824497223, -0.0003681592643260956, -0.00035562925040721893, -0.0003430992364883423, -0.00033056922256946564, -0.000318039208650589, -0.00030550919473171234, -0.0002929791808128357, -0.00028044916689395905, -0.0002679191529750824, -0.00025538913905620575, -0.0002428591251373291, -0.00023032911121845245, -0.0002177990972995758, -0.00020526908338069916, -0.0001927390694618225, -0.00018020905554294586, -0.00016767904162406921, -0.00015514902770519257, -0.00014261901378631592, -0.00013008899986743927, -0.00011755898594856262, -0.00010502897202968597, -9.249895811080933e-05, -7.996894419193268e-05, -6.743893027305603e-05, -5.490891635417938e-05, -4.2378902435302734e-05, -2.9848888516426086e-05, -1.731887459754944e-05, -4.7888606786727905e-06, 7.741153240203857e-06, 2.0271167159080505e-05, 3.280118107795715e-05, 4.53311949968338e-05, 5.786120891571045e-05, 7.03912228345871e-05, 8.292123675346375e-05, 9.545125067234039e-05, 0.00010798126459121704, 0.00012051127851009369, 0.00013304129242897034, 0.00014557130634784698, 0.00015810132026672363, 0.00017063133418560028, 0.00018316134810447693, 0.00019569136202335358, 0.00020822137594223022, 0.00022075138986110687, 0.00023328140377998352, 0.00024581141769886017, 0.0002583414316177368, 0.00027087144553661346, 0.0002834014594554901, 0.00029593147337436676, 0.0003084614872932434, 0.00032099150121212006, 0.0003335215151309967, 0.00034605152904987335, 0.00035858154296875]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 15.0, 11.0, 11.0, 12.0, 13.0, 19.0, 22.0, 31.0, 30.0, 27.0, 41.0, 31.0, 36.0, 48.0, 44.0, 56.0, 40.0, 43.0, 49.0, 48.0, 45.0, 36.0, 29.0, 40.0, 35.0, 21.0, 30.0, 20.0, 15.0, 16.0, 20.0, 9.0, 8.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.3885498046875, -4.249755859375, -4.1109619140625, -3.97216796875, -3.8333740234375, -3.694580078125, -3.5557861328125, -3.4169921875, -3.2781982421875, -3.139404296875, -3.0006103515625, -2.86181640625, -2.7230224609375, -2.584228515625, -2.4454345703125, -2.306640625, -2.1678466796875, -2.029052734375, -1.8902587890625, -1.75146484375, -1.6126708984375, -1.473876953125, -1.3350830078125, -1.1962890625, -1.0574951171875, -0.918701171875, -0.7799072265625, -0.64111328125, -0.5023193359375, -0.363525390625, -0.2247314453125, -0.0859375, 0.0528564453125, 0.191650390625, 0.3304443359375, 0.46923828125, 0.6080322265625, 0.746826171875, 0.8856201171875, 1.0244140625, 1.1632080078125, 1.302001953125, 1.4407958984375, 1.57958984375, 1.7183837890625, 1.857177734375, 1.9959716796875, 2.134765625, 2.2735595703125, 2.412353515625, 2.5511474609375, 2.68994140625, 2.8287353515625, 2.967529296875, 3.1063232421875, 3.2451171875, 3.3839111328125, 3.522705078125, 3.6614990234375, 3.80029296875, 3.9390869140625, 4.077880859375, 4.2166748046875, 4.35546875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 13.0, 18.0, 17.0, 38.0, 50.0, 56.0, 87.0, 145.0, 228.0, 408.0, 713.0, 1306.0, 2415.0, 4483.0, 8833.0, 18108.0, 40124.0, 92758.0, 200576.0, 292924.0, 207771.0, 97064.0, 42126.0, 18870.0, 9072.0, 4581.0, 2476.0, 1363.0, 769.0, 439.0, 256.0, 149.0, 91.0, 65.0, 53.0, 38.0, 20.0, 14.0, 8.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.74114990234375, -2.6483154296875, -2.55548095703125, -2.462646484375, -2.36981201171875, -2.2769775390625, -2.18414306640625, -2.09130859375, -1.99847412109375, -1.9056396484375, -1.81280517578125, -1.719970703125, -1.62713623046875, -1.5343017578125, -1.44146728515625, -1.3486328125, -1.25579833984375, -1.1629638671875, -1.07012939453125, -0.977294921875, -0.88446044921875, -0.7916259765625, -0.69879150390625, -0.60595703125, -0.51312255859375, -0.4202880859375, -0.32745361328125, -0.234619140625, -0.14178466796875, -0.0489501953125, 0.04388427734375, 0.13671875, 0.22955322265625, 0.3223876953125, 0.41522216796875, 0.508056640625, 0.60089111328125, 0.6937255859375, 0.78656005859375, 0.87939453125, 0.97222900390625, 1.0650634765625, 1.15789794921875, 1.250732421875, 1.34356689453125, 1.4364013671875, 1.52923583984375, 1.6220703125, 1.71490478515625, 1.8077392578125, 1.90057373046875, 1.993408203125, 2.08624267578125, 2.1790771484375, 2.27191162109375, 2.36474609375, 2.45758056640625, 2.5504150390625, 2.64324951171875, 2.736083984375, 2.82891845703125, 2.9217529296875, 3.01458740234375, 3.107421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 4.0, 7.0, 5.0, 13.0, 12.0, 13.0, 12.0, 20.0, 15.0, 25.0, 24.0, 32.0, 26.0, 37.0, 26.0, 39.0, 47.0, 74.0, 162.0, 1556.0, 362.0, 109.0, 67.0, 39.0, 34.0, 31.0, 36.0, 21.0, 24.0, 21.0, 27.0, 22.0, 25.0, 17.0, 11.0, 11.0, 7.0, 7.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-16.84375, -16.3731689453125, -15.902587890625, -15.4320068359375, -14.96142578125, -14.4908447265625, -14.020263671875, -13.5496826171875, -13.0791015625, -12.6085205078125, -12.137939453125, -11.6673583984375, -11.19677734375, -10.7261962890625, -10.255615234375, -9.7850341796875, -9.314453125, -8.8438720703125, -8.373291015625, -7.9027099609375, -7.43212890625, -6.9615478515625, -6.490966796875, -6.0203857421875, -5.5498046875, -5.0792236328125, -4.608642578125, -4.1380615234375, -3.66748046875, -3.1968994140625, -2.726318359375, -2.2557373046875, -1.78515625, -1.3145751953125, -0.843994140625, -0.3734130859375, 0.09716796875, 0.5677490234375, 1.038330078125, 1.5089111328125, 1.9794921875, 2.4500732421875, 2.920654296875, 3.3912353515625, 3.86181640625, 4.3323974609375, 4.802978515625, 5.2735595703125, 5.744140625, 6.2147216796875, 6.685302734375, 7.1558837890625, 7.62646484375, 8.0970458984375, 8.567626953125, 9.0382080078125, 9.5087890625, 9.9793701171875, 10.449951171875, 10.9205322265625, 11.39111328125, 11.8616943359375, 12.332275390625, 12.8028564453125, 13.2734375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 5.0, 5.0, 8.0, 10.0, 6.0, 9.0, 18.0, 19.0, 29.0, 24.0, 28.0, 35.0, 45.0, 44.0, 66.0, 107.0, 164.0, 260.0, 550.0, 2204.0, 39632.0, 2971873.0, 125280.0, 3614.0, 674.0, 319.0, 172.0, 126.0, 87.0, 51.0, 46.0, 37.0, 26.0, 31.0, 20.0, 12.0, 6.0, 14.0, 15.0, 9.0, 5.0, 5.0, 6.0, 7.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.78125, -21.0458984375, -20.310546875, -19.5751953125, -18.83984375, -18.1044921875, -17.369140625, -16.6337890625, -15.8984375, -15.1630859375, -14.427734375, -13.6923828125, -12.95703125, -12.2216796875, -11.486328125, -10.7509765625, -10.015625, -9.2802734375, -8.544921875, -7.8095703125, -7.07421875, -6.3388671875, -5.603515625, -4.8681640625, -4.1328125, -3.3974609375, -2.662109375, -1.9267578125, -1.19140625, -0.4560546875, 0.279296875, 1.0146484375, 1.75, 2.4853515625, 3.220703125, 3.9560546875, 4.69140625, 5.4267578125, 6.162109375, 6.8974609375, 7.6328125, 8.3681640625, 9.103515625, 9.8388671875, 10.57421875, 11.3095703125, 12.044921875, 12.7802734375, 13.515625, 14.2509765625, 14.986328125, 15.7216796875, 16.45703125, 17.1923828125, 17.927734375, 18.6630859375, 19.3984375, 20.1337890625, 20.869140625, 21.6044921875, 22.33984375, 23.0751953125, 23.810546875, 24.5458984375, 25.28125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 6.0, 33.0, 75.0, 138.0, 183.0, 210.0, 185.0, 102.0, 52.0, 20.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6102876663208, -7.580400466918945, -6.55051326751709, -5.520625591278076, -4.490738391876221, -3.4608511924743652, -2.4309635162353516, -1.401076316833496, -0.3711891174316406, 0.6586982011795044, 1.6885855197906494, 2.718472957611084, 3.7483601570129395, 4.778247356414795, 5.808135032653809, 6.838022232055664, 7.8679094314575195, 8.897796630859375, 9.92768383026123, 10.957571029663086, 11.987459182739258, 13.017345428466797, 14.047233581542969, 15.077120780944824, 16.10700798034668, 17.13689613342285, 18.16678237915039, 19.196670532226562, 20.2265567779541, 21.256444931030273, 22.286331176757812, 23.316219329833984, 24.346107482910156, 25.375995635986328, 26.405881881713867, 27.43577003479004, 28.465656280517578, 29.49554443359375, 30.525432586669922, 31.55531883239746, 32.585205078125, 33.61509323120117, 34.644981384277344, 35.67486572265625, 36.70475387573242, 37.734642028808594, 38.764530181884766, 39.79441833496094, 40.824302673339844, 41.854190826416016, 42.88407897949219, 43.913963317871094, 44.943851470947266, 45.97373962402344, 47.00362777709961, 48.03351593017578, 49.06340408325195, 50.093292236328125, 51.1231803894043, 52.1530647277832, 53.182952880859375, 54.21284103393555, 55.24272918701172, 56.272613525390625, 57.3025016784668]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 7.0, 8.0, 5.0, 11.0, 15.0, 18.0, 24.0, 26.0, 23.0, 30.0, 41.0, 36.0, 48.0, 44.0, 41.0, 41.0, 56.0, 43.0, 56.0, 49.0, 41.0, 48.0, 33.0, 35.0, 30.0, 26.0, 20.0, 22.0, 19.0, 19.0, 21.0, 15.0, 6.0, 13.0, 10.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.10160827636719, -49.47425842285156, -47.84690475463867, -46.21955490112305, -44.592201232910156, -42.96485137939453, -41.337501525878906, -39.71015167236328, -38.08279800415039, -36.455448150634766, -34.828094482421875, -33.20074462890625, -31.573392868041992, -29.946041107177734, -28.31869125366211, -26.69133949279785, -25.063987731933594, -23.436635971069336, -21.809284210205078, -20.181934356689453, -18.554582595825195, -16.927230834960938, -15.299880027770996, -13.672529220581055, -12.045177459716797, -10.417825698852539, -8.790474891662598, -7.163123607635498, -5.535772323608398, -3.9084205627441406, -2.281069755554199, -0.6537189483642578, 0.9736366271972656, 2.6009879112243652, 4.228339195251465, 5.8556904792785645, 7.483041763305664, 9.110393524169922, 10.737744331359863, 12.365095138549805, 13.992446899414062, 15.61979866027832, 17.247150421142578, 18.874500274658203, 20.50185203552246, 22.12920379638672, 23.756553649902344, 25.3839054107666, 27.01125717163086, 28.638608932495117, 30.265960693359375, 31.893310546875, 33.520660400390625, 35.148014068603516, 36.77536392211914, 38.40271759033203, 40.030067443847656, 41.65741729736328, 43.28477096557617, 44.9121208190918, 46.53947448730469, 48.16682434082031, 49.79417419433594, 51.42152404785156, 53.04887771606445]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 9.0, 10.0, 6.0, 8.0, 8.0, 10.0, 12.0, 17.0, 19.0, 12.0, 23.0, 25.0, 24.0, 33.0, 34.0, 32.0, 38.0, 45.0, 41.0, 42.0, 63.0, 33.0, 40.0, 37.0, 44.0, 43.0, 45.0, 36.0, 30.0, 32.0, 26.0, 14.0, 23.0, 23.0, 10.0, 11.0, 11.0, 7.0, 9.0, 9.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.3291015625, -4.189453125, -4.0498046875, -3.91015625, -3.7705078125, -3.630859375, -3.4912109375, -3.3515625, -3.2119140625, -3.072265625, -2.9326171875, -2.79296875, -2.6533203125, -2.513671875, -2.3740234375, -2.234375, -2.0947265625, -1.955078125, -1.8154296875, -1.67578125, -1.5361328125, -1.396484375, -1.2568359375, -1.1171875, -0.9775390625, -0.837890625, -0.6982421875, -0.55859375, -0.4189453125, -0.279296875, -0.1396484375, 0.0, 0.1396484375, 0.279296875, 0.4189453125, 0.55859375, 0.6982421875, 0.837890625, 0.9775390625, 1.1171875, 1.2568359375, 1.396484375, 1.5361328125, 1.67578125, 1.8154296875, 1.955078125, 2.0947265625, 2.234375, 2.3740234375, 2.513671875, 2.6533203125, 2.79296875, 2.9326171875, 3.072265625, 3.2119140625, 3.3515625, 3.4912109375, 3.630859375, 3.7705078125, 3.91015625, 4.0498046875, 4.189453125, 4.3291015625, 4.46875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 6.0, 9.0, 9.0, 6.0, 6.0, 9.0, 14.0, 16.0, 21.0, 17.0, 30.0, 33.0, 37.0, 46.0, 67.0, 118.0, 200.0, 442.0, 1239.0, 5177.0, 29756.0, 263242.0, 2004466.0, 1666313.0, 193830.0, 23032.0, 4175.0, 1010.0, 358.0, 192.0, 98.0, 58.0, 49.0, 38.0, 30.0, 25.0, 20.0, 12.0, 16.0, 12.0, 3.0, 7.0, 13.0, 5.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.0234375, -10.688720703125, -10.35400390625, -10.019287109375, -9.6845703125, -9.349853515625, -9.01513671875, -8.680419921875, -8.345703125, -8.010986328125, -7.67626953125, -7.341552734375, -7.0068359375, -6.672119140625, -6.33740234375, -6.002685546875, -5.66796875, -5.333251953125, -4.99853515625, -4.663818359375, -4.3291015625, -3.994384765625, -3.65966796875, -3.324951171875, -2.990234375, -2.655517578125, -2.32080078125, -1.986083984375, -1.6513671875, -1.316650390625, -0.98193359375, -0.647216796875, -0.3125, 0.022216796875, 0.35693359375, 0.691650390625, 1.0263671875, 1.361083984375, 1.69580078125, 2.030517578125, 2.365234375, 2.699951171875, 3.03466796875, 3.369384765625, 3.7041015625, 4.038818359375, 4.37353515625, 4.708251953125, 5.04296875, 5.377685546875, 5.71240234375, 6.047119140625, 6.3818359375, 6.716552734375, 7.05126953125, 7.385986328125, 7.720703125, 8.055419921875, 8.39013671875, 8.724853515625, 9.0595703125, 9.394287109375, 9.72900390625, 10.063720703125, 10.3984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 5.0, 5.0, 7.0, 20.0, 18.0, 22.0, 39.0, 38.0, 39.0, 60.0, 86.0, 107.0, 148.0, 188.0, 195.0, 267.0, 346.0, 336.0, 341.0, 330.0, 320.0, 261.0, 201.0, 131.0, 139.0, 91.0, 81.0, 61.0, 43.0, 40.0, 29.0, 11.0, 17.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.1461181640625, -7.846923828125, -7.5477294921875, -7.24853515625, -6.9493408203125, -6.650146484375, -6.3509521484375, -6.0517578125, -5.7525634765625, -5.453369140625, -5.1541748046875, -4.85498046875, -4.5557861328125, -4.256591796875, -3.9573974609375, -3.658203125, -3.3590087890625, -3.059814453125, -2.7606201171875, -2.46142578125, -2.1622314453125, -1.863037109375, -1.5638427734375, -1.2646484375, -0.9654541015625, -0.666259765625, -0.3670654296875, -0.06787109375, 0.2313232421875, 0.530517578125, 0.8297119140625, 1.12890625, 1.4281005859375, 1.727294921875, 2.0264892578125, 2.32568359375, 2.6248779296875, 2.924072265625, 3.2232666015625, 3.5224609375, 3.8216552734375, 4.120849609375, 4.4200439453125, 4.71923828125, 5.0184326171875, 5.317626953125, 5.6168212890625, 5.916015625, 6.2152099609375, 6.514404296875, 6.8135986328125, 7.11279296875, 7.4119873046875, 7.711181640625, 8.0103759765625, 8.3095703125, 8.6087646484375, 8.907958984375, 9.2071533203125, 9.50634765625, 9.8055419921875, 10.104736328125, 10.4039306640625, 10.703125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 6.0, 10.0, 12.0, 24.0, 28.0, 42.0, 66.0, 86.0, 93.0, 149.0, 260.0, 465.0, 1660.0, 18269.0, 721789.0, 3330652.0, 113799.0, 5001.0, 849.0, 309.0, 206.0, 142.0, 83.0, 73.0, 62.0, 28.0, 32.0, 19.0, 18.0, 14.0, 11.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.28125, -32.31005859375, -31.3388671875, -30.36767578125, -29.396484375, -28.42529296875, -27.4541015625, -26.48291015625, -25.51171875, -24.54052734375, -23.5693359375, -22.59814453125, -21.626953125, -20.65576171875, -19.6845703125, -18.71337890625, -17.7421875, -16.77099609375, -15.7998046875, -14.82861328125, -13.857421875, -12.88623046875, -11.9150390625, -10.94384765625, -9.97265625, -9.00146484375, -8.0302734375, -7.05908203125, -6.087890625, -5.11669921875, -4.1455078125, -3.17431640625, -2.203125, -1.23193359375, -0.2607421875, 0.71044921875, 1.681640625, 2.65283203125, 3.6240234375, 4.59521484375, 5.56640625, 6.53759765625, 7.5087890625, 8.47998046875, 9.451171875, 10.42236328125, 11.3935546875, 12.36474609375, 13.3359375, 14.30712890625, 15.2783203125, 16.24951171875, 17.220703125, 18.19189453125, 19.1630859375, 20.13427734375, 21.10546875, 22.07666015625, 23.0478515625, 24.01904296875, 24.990234375, 25.96142578125, 26.9326171875, 27.90380859375, 28.875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 19.0, 15.0, 36.0, 38.0, 60.0, 69.0, 103.0, 98.0, 88.0, 94.0, 82.0, 89.0, 66.0, 63.0, 27.0, 27.0, 9.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.548952102661133, -21.101688385009766, -19.654422760009766, -18.207157135009766, -16.7598934173584, -15.312628746032715, -13.865364074707031, -12.418099403381348, -10.970834732055664, -9.52357006072998, -8.076305389404297, -6.629040718078613, -5.18177604675293, -3.734511375427246, -2.2872467041015625, -0.8399820327758789, 0.6072826385498047, 2.0545473098754883, 3.501811981201172, 4.9490766525268555, 6.396341323852539, 7.843605995178223, 9.290870666503906, 10.73813533782959, 12.185400009155273, 13.632664680480957, 15.07992935180664, 16.52719497680664, 17.974458694458008, 19.421722412109375, 20.868988037109375, 22.316253662109375, 23.763519287109375, 25.210784912109375, 26.658048629760742, 28.10531234741211, 29.55257797241211, 30.99984359741211, 32.447105407714844, 33.894371032714844, 35.341636657714844, 36.788902282714844, 38.236167907714844, 39.68342971801758, 41.13069534301758, 42.57796096801758, 44.02522277832031, 45.47248840332031, 46.91975402832031, 48.36701965332031, 49.81428527832031, 51.26154708862305, 52.70881271362305, 54.15607833862305, 55.60334014892578, 57.05060577392578, 58.49787139892578, 59.94513702392578, 61.39240264892578, 62.839664459228516, 64.28692626953125, 65.73419189453125, 67.18145751953125, 68.62872314453125, 70.07598876953125]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 10.0, 5.0, 11.0, 6.0, 13.0, 13.0, 20.0, 19.0, 19.0, 19.0, 25.0, 23.0, 20.0, 33.0, 24.0, 28.0, 26.0, 34.0, 30.0, 50.0, 48.0, 43.0, 32.0, 34.0, 29.0, 34.0, 39.0, 28.0, 33.0, 29.0, 26.0, 15.0, 22.0, 20.0, 20.0, 20.0, 12.0, 15.0, 12.0, 10.0, 7.0, 8.0, 5.0, 6.0, 3.0, 5.0, 4.0, 2.0, 3.0, 5.0, 0.0, 0.0, 3.0, 2.0], "bins": [-33.534393310546875, -32.471500396728516, -31.40860939025879, -30.345718383789062, -29.282825469970703, -28.219934463500977, -27.15704345703125, -26.09415054321289, -25.031259536743164, -23.968368530273438, -22.905475616455078, -21.84258460998535, -20.779693603515625, -19.716800689697266, -18.65390968322754, -17.591018676757812, -16.528125762939453, -15.46523380279541, -14.402341842651367, -13.33945083618164, -12.276558876037598, -11.213666915893555, -10.150775909423828, -9.087883949279785, -8.024991989135742, -6.962100028991699, -5.8992085456848145, -4.83631706237793, -3.7734251022338867, -2.7105331420898438, -1.647641658782959, -0.5847501754760742, 0.47814178466796875, 1.5410335063934326, 2.6039252281188965, 3.6668169498443604, 4.729708671569824, 5.792600631713867, 6.855492115020752, 7.918383598327637, 8.98127555847168, 10.044167518615723, 11.107059478759766, 12.169950485229492, 13.232842445373535, 14.295734405517578, 15.358625411987305, 16.42151641845703, 17.48440933227539, 18.547300338745117, 19.610193252563477, 20.673084259033203, 21.735977172851562, 22.79886817932129, 23.861759185791016, 24.924652099609375, 25.9875431060791, 27.050434112548828, 28.113327026367188, 29.176218032836914, 30.23910903930664, 31.302001953125, 32.36489486694336, 33.42778396606445, 34.49067687988281]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 7.0, 6.0, 15.0, 15.0, 22.0, 22.0, 19.0, 13.0, 32.0, 38.0, 40.0, 36.0, 38.0, 38.0, 42.0, 44.0, 53.0, 45.0, 35.0, 53.0, 48.0, 36.0, 31.0, 28.0, 30.0, 28.0, 32.0, 26.0, 14.0, 17.0, 17.0, 14.0, 13.0, 7.0, 3.0, 11.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.9296875, -4.78497314453125, -4.6402587890625, -4.49554443359375, -4.350830078125, -4.20611572265625, -4.0614013671875, -3.91668701171875, -3.77197265625, -3.62725830078125, -3.4825439453125, -3.33782958984375, -3.193115234375, -3.04840087890625, -2.9036865234375, -2.75897216796875, -2.6142578125, -2.46954345703125, -2.3248291015625, -2.18011474609375, -2.035400390625, -1.89068603515625, -1.7459716796875, -1.60125732421875, -1.45654296875, -1.31182861328125, -1.1671142578125, -1.02239990234375, -0.877685546875, -0.73297119140625, -0.5882568359375, -0.44354248046875, -0.298828125, -0.15411376953125, -0.0093994140625, 0.13531494140625, 0.280029296875, 0.42474365234375, 0.5694580078125, 0.71417236328125, 0.85888671875, 1.00360107421875, 1.1483154296875, 1.29302978515625, 1.437744140625, 1.58245849609375, 1.7271728515625, 1.87188720703125, 2.0166015625, 2.16131591796875, 2.3060302734375, 2.45074462890625, 2.595458984375, 2.74017333984375, 2.8848876953125, 3.02960205078125, 3.17431640625, 3.31903076171875, 3.4637451171875, 3.60845947265625, 3.753173828125, 3.89788818359375, 4.0426025390625, 4.18731689453125, 4.33203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 8.0, 8.0, 22.0, 27.0, 37.0, 55.0, 86.0, 115.0, 151.0, 228.0, 310.0, 479.0, 641.0, 990.0, 1339.0, 1928.0, 2713.0, 3904.0, 5567.0, 8227.0, 12167.0, 18231.0, 28353.0, 44716.0, 75589.0, 136510.0, 270359.0, 183578.0, 95379.0, 55463.0, 33776.0, 21840.0, 14287.0, 9587.0, 6527.0, 4614.0, 3235.0, 2231.0, 1600.0, 1111.0, 747.0, 533.0, 365.0, 295.0, 189.0, 141.0, 94.0, 59.0, 47.0, 33.0, 24.0, 14.0, 12.0, 10.0, 7.0, 3.0, 1.0, 2.0], "bins": [-0.75439453125, -0.7313308715820312, -0.7082672119140625, -0.6852035522460938, -0.662139892578125, -0.6390762329101562, -0.6160125732421875, -0.5929489135742188, -0.56988525390625, -0.5468215942382812, -0.5237579345703125, -0.5006942749023438, -0.477630615234375, -0.45456695556640625, -0.4315032958984375, -0.40843963623046875, -0.3853759765625, -0.36231231689453125, -0.3392486572265625, -0.31618499755859375, -0.293121337890625, -0.27005767822265625, -0.2469940185546875, -0.22393035888671875, -0.20086669921875, -0.17780303955078125, -0.1547393798828125, -0.13167572021484375, -0.108612060546875, -0.08554840087890625, -0.0624847412109375, -0.03942108154296875, -0.016357421875, 0.00670623779296875, 0.0297698974609375, 0.05283355712890625, 0.075897216796875, 0.09896087646484375, 0.1220245361328125, 0.14508819580078125, 0.16815185546875, 0.19121551513671875, 0.2142791748046875, 0.23734283447265625, 0.260406494140625, 0.28347015380859375, 0.3065338134765625, 0.32959747314453125, 0.3526611328125, 0.37572479248046875, 0.3987884521484375, 0.42185211181640625, 0.444915771484375, 0.46797943115234375, 0.4910430908203125, 0.5141067504882812, 0.53717041015625, 0.5602340698242188, 0.5832977294921875, 0.6063613891601562, 0.629425048828125, 0.6524887084960938, 0.6755523681640625, 0.6986160278320312, 0.7216796875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 2.0, 8.0, 5.0, 8.0, 11.0, 12.0, 10.0, 17.0, 14.0, 28.0, 20.0, 32.0, 43.0, 37.0, 45.0, 37.0, 52.0, 24.0, 35.0, 1068.0, 38.0, 37.0, 36.0, 57.0, 48.0, 39.0, 33.0, 34.0, 32.0, 34.0, 29.0, 18.0, 11.0, 19.0, 14.0, 2.0, 2.0, 11.0, 4.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9140625, -2.819610595703125, -2.72515869140625, -2.630706787109375, -2.5362548828125, -2.441802978515625, -2.34735107421875, -2.252899169921875, -2.158447265625, -2.063995361328125, -1.96954345703125, -1.875091552734375, -1.7806396484375, -1.686187744140625, -1.59173583984375, -1.497283935546875, -1.40283203125, -1.308380126953125, -1.21392822265625, -1.119476318359375, -1.0250244140625, -0.930572509765625, -0.83612060546875, -0.741668701171875, -0.647216796875, -0.552764892578125, -0.45831298828125, -0.363861083984375, -0.2694091796875, -0.174957275390625, -0.08050537109375, 0.013946533203125, 0.1083984375, 0.202850341796875, 0.29730224609375, 0.391754150390625, 0.4862060546875, 0.580657958984375, 0.67510986328125, 0.769561767578125, 0.864013671875, 0.958465576171875, 1.05291748046875, 1.147369384765625, 1.2418212890625, 1.336273193359375, 1.43072509765625, 1.525177001953125, 1.61962890625, 1.714080810546875, 1.80853271484375, 1.902984619140625, 1.9974365234375, 2.091888427734375, 2.18634033203125, 2.280792236328125, 2.375244140625, 2.469696044921875, 2.56414794921875, 2.658599853515625, 2.7530517578125, 2.847503662109375, 2.94195556640625, 3.036407470703125, 3.130859375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 16.0, 21.0, 21.0, 40.0, 64.0, 75.0, 133.0, 196.0, 266.0, 411.0, 584.0, 839.0, 1442.0, 2208.0, 3352.0, 5316.0, 8984.0, 15284.0, 26018.0, 46289.0, 85251.0, 172469.0, 1364812.0, 168828.0, 83977.0, 45552.0, 25534.0, 14984.0, 8950.0, 5515.0, 3392.0, 2250.0, 1299.0, 938.0, 552.0, 389.0, 269.0, 183.0, 124.0, 100.0, 53.0, 43.0, 32.0, 16.0, 19.0, 14.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.86865234375, -0.8419113159179688, -0.8151702880859375, -0.7884292602539062, -0.761688232421875, -0.7349472045898438, -0.7082061767578125, -0.6814651489257812, -0.65472412109375, -0.6279830932617188, -0.6012420654296875, -0.5745010375976562, -0.547760009765625, -0.5210189819335938, -0.4942779541015625, -0.46753692626953125, -0.4407958984375, -0.41405487060546875, -0.3873138427734375, -0.36057281494140625, -0.333831787109375, -0.30709075927734375, -0.2803497314453125, -0.25360870361328125, -0.22686767578125, -0.20012664794921875, -0.1733856201171875, -0.14664459228515625, -0.119903564453125, -0.09316253662109375, -0.0664215087890625, -0.03968048095703125, -0.012939453125, 0.01380157470703125, 0.0405426025390625, 0.06728363037109375, 0.094024658203125, 0.12076568603515625, 0.1475067138671875, 0.17424774169921875, 0.20098876953125, 0.22772979736328125, 0.2544708251953125, 0.28121185302734375, 0.307952880859375, 0.33469390869140625, 0.3614349365234375, 0.38817596435546875, 0.4149169921875, 0.44165802001953125, 0.4683990478515625, 0.49514007568359375, 0.521881103515625, 0.5486221313476562, 0.5753631591796875, 0.6021041870117188, 0.62884521484375, 0.6555862426757812, 0.6823272705078125, 0.7090682983398438, 0.735809326171875, 0.7625503540039062, 0.7892913818359375, 0.8160324096679688, 0.8427734375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 11.0, 6.0, 5.0, 12.0, 15.0, 17.0, 17.0, 18.0, 15.0, 34.0, 34.0, 44.0, 57.0, 67.0, 77.0, 77.0, 69.0, 74.0, 73.0, 70.0, 57.0, 23.0, 36.0, 29.0, 15.0, 11.0, 8.0, 5.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008678436279296875, -0.0008385926485061646, -0.0008093416690826416, -0.0007800906896591187, -0.0007508397102355957, -0.0007215887308120728, -0.0006923377513885498, -0.0006630867719650269, -0.0006338357925415039, -0.000604584813117981, -0.000575333833694458, -0.0005460828542709351, -0.0005168318748474121, -0.00048758089542388916, -0.0004583299160003662, -0.00042907893657684326, -0.0003998279571533203, -0.00037057697772979736, -0.0003413259983062744, -0.00031207501888275146, -0.0002828240394592285, -0.00025357306003570557, -0.00022432208061218262, -0.00019507110118865967, -0.00016582012176513672, -0.00013656914234161377, -0.00010731816291809082, -7.806718349456787e-05, -4.881620407104492e-05, -1.9565224647521973e-05, 9.685754776000977e-06, 3.8936734199523926e-05, 6.818771362304688e-05, 9.743869304656982e-05, 0.00012668967247009277, 0.00015594065189361572, 0.00018519163131713867, 0.00021444261074066162, 0.00024369359016418457, 0.0002729445695877075, 0.00030219554901123047, 0.0003314465284347534, 0.00036069750785827637, 0.0003899484872817993, 0.00041919946670532227, 0.0004484504461288452, 0.00047770142555236816, 0.0005069524049758911, 0.0005362033843994141, 0.000565454363822937, 0.00059470534324646, 0.0006239563226699829, 0.0006532073020935059, 0.0006824582815170288, 0.0007117092609405518, 0.0007409602403640747, 0.0007702112197875977, 0.0007994621992111206, 0.0008287131786346436, 0.0008579641580581665, 0.0008872151374816895, 0.0009164661169052124, 0.0009457170963287354, 0.0009749680757522583, 0.0010042190551757812]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 11.0, 8.0, 12.0, 18.0, 20.0, 41.0, 50.0, 80.0, 109.0, 190.0, 351.0, 698.0, 8879.0, 1028275.0, 8203.0, 729.0, 341.0, 191.0, 89.0, 65.0, 39.0, 33.0, 25.0, 20.0, 15.0, 13.0, 11.0, 8.0, 8.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018524169921875, -0.017935991287231445, -0.01734781265258789, -0.016759634017944336, -0.01617145538330078, -0.015583276748657227, -0.014995098114013672, -0.014406919479370117, -0.013818740844726562, -0.013230562210083008, -0.012642383575439453, -0.012054204940795898, -0.011466026306152344, -0.010877847671508789, -0.010289669036865234, -0.00970149040222168, -0.009113311767578125, -0.00852513313293457, -0.007936954498291016, -0.007348775863647461, -0.006760597229003906, -0.0061724185943603516, -0.005584239959716797, -0.004996061325073242, -0.0044078826904296875, -0.003819704055786133, -0.003231525421142578, -0.0026433467864990234, -0.0020551681518554688, -0.001466989517211914, -0.0008788108825683594, -0.0002906322479248047, 0.00029754638671875, 0.0008857250213623047, 0.0014739036560058594, 0.002062082290649414, 0.0026502609252929688, 0.0032384395599365234, 0.003826618194580078, 0.004414796829223633, 0.0050029754638671875, 0.005591154098510742, 0.006179332733154297, 0.0067675113677978516, 0.007355690002441406, 0.007943868637084961, 0.008532047271728516, 0.00912022590637207, 0.009708404541015625, 0.01029658317565918, 0.010884761810302734, 0.011472940444946289, 0.012061119079589844, 0.012649297714233398, 0.013237476348876953, 0.013825654983520508, 0.014413833618164062, 0.015002012252807617, 0.015590190887451172, 0.016178369522094727, 0.01676654815673828, 0.017354726791381836, 0.01794290542602539, 0.018531084060668945, 0.0191192626953125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 33.0, 146.0, 376.0, 333.0, 104.0, 18.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007817293517291546, -0.0007210138137452304, -0.0006602983339689672, -0.000599582795985043, -0.0005388672580011189, -0.0004781517491210252, -0.0004174362402409315, -0.00035672070225700736, -0.00029600519337691367, -0.00023528966994490474, -0.00017457414651289582, -0.00011385863763280213, -5.314311420079321e-05, 7.572409231215715e-06, 6.828791811130941e-05, 0.00012900345609523356, 0.00018971896497532725, 0.00025043447385542095, 0.0003111500118393451, 0.0003718655207194388, 0.00043258105870336294, 0.0004932965384796262, 0.0005540120764635503, 0.0006147276144474745, 0.0006754430942237377, 0.0007361586322076619, 0.0007968741119839251, 0.0008575896499678493, 0.0009183051879517734, 0.0009790207259356976, 0.0010397362057119608, 0.001100451685488224, 0.001161167281679809, 0.0012218827614560723, 0.0012825983576476574, 0.0013433138374239206, 0.0014040293172001839, 0.001464744913391769, 0.0015254603931680322, 0.0015861759893596172, 0.0016468914691358805, 0.0017076069489121437, 0.0017683225451037288, 0.001829038024879992, 0.0018897535046562552, 0.0019504691008478403, 0.0020111845806241035, 0.0020719000604003668, 0.00213261554017663, 0.0021933310199528933, 0.0022540464997291565, 0.0023147622123360634, 0.0023754776921123266, 0.00243619317188859, 0.002496908651664853, 0.0025576241314411163, 0.0026183398440480232, 0.0026790553238242865, 0.0027397708036005497, 0.0028004865162074566, 0.00286120199598372, 0.002921917475759983, 0.0029826329555362463, 0.0030433484353125095, 0.0031040639150887728]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 8.0, 7.0, 9.0, 13.0, 15.0, 12.0, 23.0, 24.0, 28.0, 19.0, 28.0, 23.0, 27.0, 29.0, 47.0, 27.0, 38.0, 34.0, 43.0, 40.0, 33.0, 36.0, 27.0, 24.0, 41.0, 27.0, 33.0, 30.0, 24.0, 30.0, 29.0, 27.0, 13.0, 15.0, 11.0, 10.0, 15.0, 11.0, 10.0, 15.0, 7.0, 4.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.00034350156784057617, -0.0003326665610074997, -0.0003218315541744232, -0.00031099654734134674, -0.00030016154050827026, -0.0002893265336751938, -0.0002784915268421173, -0.00026765652000904083, -0.00025682151317596436, -0.0002459865063428879, -0.0002351514995098114, -0.00022431649267673492, -0.00021348148584365845, -0.00020264647901058197, -0.0001918114721775055, -0.00018097646534442902, -0.00017014145851135254, -0.00015930645167827606, -0.00014847144484519958, -0.0001376364380121231, -0.00012680143117904663, -0.00011596642434597015, -0.00010513141751289368, -9.42964106798172e-05, -8.346140384674072e-05, -7.262639701366425e-05, -6.179139018058777e-05, -5.095638334751129e-05, -4.0121376514434814e-05, -2.9286369681358337e-05, -1.845136284828186e-05, -7.616356015205383e-06, 3.2186508178710938e-06, 1.405365765094757e-05, 2.4888664484024048e-05, 3.5723671317100525e-05, 4.6558678150177e-05, 5.739368498325348e-05, 6.822869181632996e-05, 7.906369864940643e-05, 8.989870548248291e-05, 0.00010073371231555939, 0.00011156871914863586, 0.00012240372598171234, 0.00013323873281478882, 0.0001440737396478653, 0.00015490874648094177, 0.00016574375331401825, 0.00017657876014709473, 0.0001874137669801712, 0.00019824877381324768, 0.00020908378064632416, 0.00021991878747940063, 0.0002307537943124771, 0.0002415888011455536, 0.00025242380797863007, 0.00026325881481170654, 0.000274093821644783, 0.0002849288284778595, 0.000295763835310936, 0.00030659884214401245, 0.00031743384897708893, 0.0003282688558101654, 0.0003391038626432419, 0.00034993886947631836]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 7.0, 6.0, 15.0, 15.0, 22.0, 22.0, 19.0, 13.0, 32.0, 38.0, 40.0, 36.0, 38.0, 38.0, 42.0, 44.0, 53.0, 45.0, 35.0, 53.0, 48.0, 36.0, 31.0, 28.0, 30.0, 28.0, 32.0, 26.0, 14.0, 17.0, 17.0, 14.0, 13.0, 7.0, 3.0, 11.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.9296875, -4.78497314453125, -4.6402587890625, -4.49554443359375, -4.350830078125, -4.20611572265625, -4.0614013671875, -3.91668701171875, -3.77197265625, -3.62725830078125, -3.4825439453125, -3.33782958984375, -3.193115234375, -3.04840087890625, -2.9036865234375, -2.75897216796875, -2.6142578125, -2.46954345703125, -2.3248291015625, -2.18011474609375, -2.035400390625, -1.89068603515625, -1.7459716796875, -1.60125732421875, -1.45654296875, -1.31182861328125, -1.1671142578125, -1.02239990234375, -0.877685546875, -0.73297119140625, -0.5882568359375, -0.44354248046875, -0.298828125, -0.15411376953125, -0.0093994140625, 0.13531494140625, 0.280029296875, 0.42474365234375, 0.5694580078125, 0.71417236328125, 0.85888671875, 1.00360107421875, 1.1483154296875, 1.29302978515625, 1.437744140625, 1.58245849609375, 1.7271728515625, 1.87188720703125, 2.0166015625, 2.16131591796875, 2.3060302734375, 2.45074462890625, 2.595458984375, 2.74017333984375, 2.8848876953125, 3.02960205078125, 3.17431640625, 3.31903076171875, 3.4637451171875, 3.60845947265625, 3.753173828125, 3.89788818359375, 4.0426025390625, 4.18731689453125, 4.33203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 9.0, 16.0, 16.0, 20.0, 36.0, 51.0, 64.0, 92.0, 114.0, 174.0, 275.0, 336.0, 559.0, 811.0, 1281.0, 1992.0, 3140.0, 4857.0, 8258.0, 15233.0, 33343.0, 90536.0, 289245.0, 385545.0, 125069.0, 43319.0, 18596.0, 9708.0, 5695.0, 3536.0, 2219.0, 1395.0, 977.0, 658.0, 401.0, 273.0, 193.0, 146.0, 108.0, 72.0, 45.0, 34.0, 24.0, 26.0, 20.0, 11.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.67578125, -4.525634765625, -4.37548828125, -4.225341796875, -4.0751953125, -3.925048828125, -3.77490234375, -3.624755859375, -3.474609375, -3.324462890625, -3.17431640625, -3.024169921875, -2.8740234375, -2.723876953125, -2.57373046875, -2.423583984375, -2.2734375, -2.123291015625, -1.97314453125, -1.822998046875, -1.6728515625, -1.522705078125, -1.37255859375, -1.222412109375, -1.072265625, -0.922119140625, -0.77197265625, -0.621826171875, -0.4716796875, -0.321533203125, -0.17138671875, -0.021240234375, 0.12890625, 0.279052734375, 0.42919921875, 0.579345703125, 0.7294921875, 0.879638671875, 1.02978515625, 1.179931640625, 1.330078125, 1.480224609375, 1.63037109375, 1.780517578125, 1.9306640625, 2.080810546875, 2.23095703125, 2.381103515625, 2.53125, 2.681396484375, 2.83154296875, 2.981689453125, 3.1318359375, 3.281982421875, 3.43212890625, 3.582275390625, 3.732421875, 3.882568359375, 4.03271484375, 4.182861328125, 4.3330078125, 4.483154296875, 4.63330078125, 4.783447265625, 4.93359375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 7.0, 10.0, 9.0, 9.0, 16.0, 17.0, 24.0, 26.0, 25.0, 40.0, 36.0, 38.0, 34.0, 32.0, 42.0, 60.0, 138.0, 281.0, 1509.0, 189.0, 88.0, 52.0, 44.0, 37.0, 40.0, 38.0, 25.0, 16.0, 22.0, 16.0, 17.0, 18.0, 9.0, 11.0, 15.0, 4.0, 14.0, 4.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4765625, -15.01171875, -14.546875, -14.08203125, -13.6171875, -13.15234375, -12.6875, -12.22265625, -11.7578125, -11.29296875, -10.828125, -10.36328125, -9.8984375, -9.43359375, -8.96875, -8.50390625, -8.0390625, -7.57421875, -7.109375, -6.64453125, -6.1796875, -5.71484375, -5.25, -4.78515625, -4.3203125, -3.85546875, -3.390625, -2.92578125, -2.4609375, -1.99609375, -1.53125, -1.06640625, -0.6015625, -0.13671875, 0.328125, 0.79296875, 1.2578125, 1.72265625, 2.1875, 2.65234375, 3.1171875, 3.58203125, 4.046875, 4.51171875, 4.9765625, 5.44140625, 5.90625, 6.37109375, 6.8359375, 7.30078125, 7.765625, 8.23046875, 8.6953125, 9.16015625, 9.625, 10.08984375, 10.5546875, 11.01953125, 11.484375, 11.94921875, 12.4140625, 12.87890625, 13.34375, 13.80859375, 14.2734375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 6.0, 6.0, 7.0, 17.0, 6.0, 26.0, 33.0, 41.0, 48.0, 78.0, 148.0, 314.0, 653.0, 4713.0, 2502689.0, 632328.0, 3297.0, 548.0, 270.0, 164.0, 95.0, 62.0, 46.0, 28.0, 20.0, 19.0, 15.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.1875, -48.70849609375, -47.2294921875, -45.75048828125, -44.271484375, -42.79248046875, -41.3134765625, -39.83447265625, -38.35546875, -36.87646484375, -35.3974609375, -33.91845703125, -32.439453125, -30.96044921875, -29.4814453125, -28.00244140625, -26.5234375, -25.04443359375, -23.5654296875, -22.08642578125, -20.607421875, -19.12841796875, -17.6494140625, -16.17041015625, -14.69140625, -13.21240234375, -11.7333984375, -10.25439453125, -8.775390625, -7.29638671875, -5.8173828125, -4.33837890625, -2.859375, -1.38037109375, 0.0986328125, 1.57763671875, 3.056640625, 4.53564453125, 6.0146484375, 7.49365234375, 8.97265625, 10.45166015625, 11.9306640625, 13.40966796875, 14.888671875, 16.36767578125, 17.8466796875, 19.32568359375, 20.8046875, 22.28369140625, 23.7626953125, 25.24169921875, 26.720703125, 28.19970703125, 29.6787109375, 31.15771484375, 32.63671875, 34.11572265625, 35.5947265625, 37.07373046875, 38.552734375, 40.03173828125, 41.5107421875, 42.98974609375, 44.46875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 6.0, 138.0, 670.0, 191.0, 10.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.539440155029297, -24.20182228088379, -19.86420440673828, -15.526588439941406, -11.188970565795898, -6.851352691650391, -2.5137367248535156, 1.8238811492919922, 6.1614990234375, 10.499116897583008, 14.8367338180542, 19.17435073852539, 23.5119686126709, 27.849586486816406, 32.18720245361328, 36.524818420410156, 40.8624382019043, 45.20005416870117, 49.53767395019531, 53.87528991699219, 58.21290588378906, 62.5505256652832, 66.88813781738281, 71.22576141357422, 75.5633773803711, 79.90099334716797, 84.23860931396484, 88.57623291015625, 92.91384887695312, 97.25146484375, 101.58908081054688, 105.92669677734375, 110.26431274414062, 114.6019287109375, 118.93954467773438, 123.27716064453125, 127.61478424072266, 131.952392578125, 136.29000854492188, 140.6276397705078, 144.9652557373047, 149.30287170410156, 153.64048767089844, 157.9781036376953, 162.3157196044922, 166.65335083007812, 170.990966796875, 175.32858276367188, 179.66619873046875, 184.00381469726562, 188.3414306640625, 192.67904663085938, 197.01666259765625, 201.35427856445312, 205.69189453125, 210.02952575683594, 214.36712646484375, 218.70474243164062, 223.0423583984375, 227.37997436523438, 231.71759033203125, 236.05520629882812, 240.392822265625, 244.73045349121094, 249.0680694580078]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 7.0, 2.0, 10.0, 11.0, 9.0, 17.0, 16.0, 19.0, 23.0, 33.0, 28.0, 21.0, 40.0, 42.0, 40.0, 32.0, 40.0, 32.0, 52.0, 45.0, 42.0, 44.0, 47.0, 25.0, 34.0, 38.0, 37.0, 24.0, 25.0, 23.0, 27.0, 20.0, 19.0, 10.0, 19.0, 5.0, 10.0, 6.0, 7.0, 8.0, 6.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.48308563232422, -49.94945526123047, -48.41582489013672, -46.88219451904297, -45.34856033325195, -43.8149299621582, -42.28129959106445, -40.7476692199707, -39.21403884887695, -37.6804084777832, -36.14677810668945, -34.61314392089844, -33.07951354980469, -31.545883178710938, -30.012252807617188, -28.478622436523438, -26.944990158081055, -25.411359786987305, -23.877727508544922, -22.344097137451172, -20.810466766357422, -19.276836395263672, -17.74320411682129, -16.20957374572754, -14.675942420959473, -13.142311096191406, -11.608680725097656, -10.07504940032959, -8.541418075561523, -7.007787704467773, -5.474156379699707, -3.940526008605957, -2.4068946838378906, -0.8732637166976929, 0.6603672504425049, 2.193998336791992, 3.7276291847229004, 5.261260032653809, 6.794891357421875, 8.328521728515625, 9.862153053283691, 11.395784378051758, 12.929414749145508, 14.463046073913574, 15.99667739868164, 17.53030776977539, 19.06393814086914, 20.59756851196289, 22.131200790405273, 23.664831161499023, 25.198463439941406, 26.732093811035156, 28.265724182128906, 29.799354553222656, 31.33298683166504, 32.866615295410156, 34.40024948120117, 35.93387985229492, 37.46751022338867, 39.00114440917969, 40.53477478027344, 42.06840515136719, 43.60203552246094, 45.13566589355469, 46.66929626464844]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 5.0, 4.0, 9.0, 9.0, 9.0, 7.0, 11.0, 10.0, 16.0, 20.0, 26.0, 16.0, 33.0, 34.0, 39.0, 30.0, 47.0, 35.0, 49.0, 43.0, 49.0, 44.0, 49.0, 44.0, 44.0, 38.0, 26.0, 41.0, 32.0, 30.0, 21.0, 19.0, 18.0, 19.0, 10.0, 14.0, 18.0, 8.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.12890625, -4.9786376953125, -4.828369140625, -4.6781005859375, -4.52783203125, -4.3775634765625, -4.227294921875, -4.0770263671875, -3.9267578125, -3.7764892578125, -3.626220703125, -3.4759521484375, -3.32568359375, -3.1754150390625, -3.025146484375, -2.8748779296875, -2.724609375, -2.5743408203125, -2.424072265625, -2.2738037109375, -2.12353515625, -1.9732666015625, -1.822998046875, -1.6727294921875, -1.5224609375, -1.3721923828125, -1.221923828125, -1.0716552734375, -0.92138671875, -0.7711181640625, -0.620849609375, -0.4705810546875, -0.3203125, -0.1700439453125, -0.019775390625, 0.1304931640625, 0.28076171875, 0.4310302734375, 0.581298828125, 0.7315673828125, 0.8818359375, 1.0321044921875, 1.182373046875, 1.3326416015625, 1.48291015625, 1.6331787109375, 1.783447265625, 1.9337158203125, 2.083984375, 2.2342529296875, 2.384521484375, 2.5347900390625, 2.68505859375, 2.8353271484375, 2.985595703125, 3.1358642578125, 3.2861328125, 3.4364013671875, 3.586669921875, 3.7369384765625, 3.88720703125, 4.0374755859375, 4.187744140625, 4.3380126953125, 4.48828125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 2.0, 8.0, 6.0, 9.0, 10.0, 12.0, 15.0, 24.0, 37.0, 34.0, 65.0, 90.0, 183.0, 266.0, 430.0, 778.0, 1514.0, 3280.0, 7310.0, 18340.0, 51541.0, 161187.0, 496545.0, 1150374.0, 1316106.0, 653527.0, 221105.0, 70133.0, 24081.0, 9340.0, 3889.0, 1819.0, 897.0, 473.0, 288.0, 175.0, 129.0, 69.0, 49.0, 43.0, 32.0, 17.0, 19.0, 10.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.4097900390625, -5.241455078125, -5.0731201171875, -4.90478515625, -4.7364501953125, -4.568115234375, -4.3997802734375, -4.2314453125, -4.0631103515625, -3.894775390625, -3.7264404296875, -3.55810546875, -3.3897705078125, -3.221435546875, -3.0531005859375, -2.884765625, -2.7164306640625, -2.548095703125, -2.3797607421875, -2.21142578125, -2.0430908203125, -1.874755859375, -1.7064208984375, -1.5380859375, -1.3697509765625, -1.201416015625, -1.0330810546875, -0.86474609375, -0.6964111328125, -0.528076171875, -0.3597412109375, -0.19140625, -0.0230712890625, 0.145263671875, 0.3135986328125, 0.48193359375, 0.6502685546875, 0.818603515625, 0.9869384765625, 1.1552734375, 1.3236083984375, 1.491943359375, 1.6602783203125, 1.82861328125, 1.9969482421875, 2.165283203125, 2.3336181640625, 2.501953125, 2.6702880859375, 2.838623046875, 3.0069580078125, 3.17529296875, 3.3436279296875, 3.511962890625, 3.6802978515625, 3.8486328125, 4.0169677734375, 4.185302734375, 4.3536376953125, 4.52197265625, 4.6903076171875, 4.858642578125, 5.0269775390625, 5.1953125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 5.0, 9.0, 17.0, 13.0, 18.0, 27.0, 50.0, 66.0, 92.0, 118.0, 225.0, 247.0, 340.0, 429.0, 453.0, 459.0, 381.0, 308.0, 253.0, 162.0, 119.0, 79.0, 62.0, 49.0, 39.0, 19.0, 13.0, 9.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.609375, -14.2015380859375, -13.793701171875, -13.3858642578125, -12.97802734375, -12.5701904296875, -12.162353515625, -11.7545166015625, -11.3466796875, -10.9388427734375, -10.531005859375, -10.1231689453125, -9.71533203125, -9.3074951171875, -8.899658203125, -8.4918212890625, -8.083984375, -7.6761474609375, -7.268310546875, -6.8604736328125, -6.45263671875, -6.0447998046875, -5.636962890625, -5.2291259765625, -4.8212890625, -4.4134521484375, -4.005615234375, -3.5977783203125, -3.18994140625, -2.7821044921875, -2.374267578125, -1.9664306640625, -1.55859375, -1.1507568359375, -0.742919921875, -0.3350830078125, 0.07275390625, 0.4805908203125, 0.888427734375, 1.2962646484375, 1.7041015625, 2.1119384765625, 2.519775390625, 2.9276123046875, 3.33544921875, 3.7432861328125, 4.151123046875, 4.5589599609375, 4.966796875, 5.3746337890625, 5.782470703125, 6.1903076171875, 6.59814453125, 7.0059814453125, 7.413818359375, 7.8216552734375, 8.2294921875, 8.6373291015625, 9.045166015625, 9.4530029296875, 9.86083984375, 10.2686767578125, 10.676513671875, 11.0843505859375, 11.4921875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 4.0, 12.0, 10.0, 20.0, 12.0, 29.0, 35.0, 56.0, 80.0, 92.0, 168.0, 314.0, 967.0, 5776.0, 161545.0, 3587198.0, 425164.0, 10489.0, 1227.0, 406.0, 226.0, 133.0, 71.0, 57.0, 55.0, 39.0, 30.0, 16.0, 18.0, 5.0, 6.0, 8.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.22314453125, -22.1962890625, -21.16943359375, -20.142578125, -19.11572265625, -18.0888671875, -17.06201171875, -16.03515625, -15.00830078125, -13.9814453125, -12.95458984375, -11.927734375, -10.90087890625, -9.8740234375, -8.84716796875, -7.8203125, -6.79345703125, -5.7666015625, -4.73974609375, -3.712890625, -2.68603515625, -1.6591796875, -0.63232421875, 0.39453125, 1.42138671875, 2.4482421875, 3.47509765625, 4.501953125, 5.52880859375, 6.5556640625, 7.58251953125, 8.609375, 9.63623046875, 10.6630859375, 11.68994140625, 12.716796875, 13.74365234375, 14.7705078125, 15.79736328125, 16.82421875, 17.85107421875, 18.8779296875, 19.90478515625, 20.931640625, 21.95849609375, 22.9853515625, 24.01220703125, 25.0390625, 26.06591796875, 27.0927734375, 28.11962890625, 29.146484375, 30.17333984375, 31.2001953125, 32.22705078125, 33.25390625, 34.28076171875, 35.3076171875, 36.33447265625, 37.361328125, 38.38818359375, 39.4150390625, 40.44189453125, 41.46875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 22.0, 35.0, 97.0, 157.0, 214.0, 210.0, 129.0, 78.0, 51.0, 12.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.29010009765625, -139.1205596923828, -135.95101928710938, -132.78147888183594, -129.6119384765625, -126.4424057006836, -123.27286529541016, -120.10332489013672, -116.93378448486328, -113.76424407958984, -110.5947036743164, -107.42516326904297, -104.25563049316406, -101.08609008789062, -97.91654968261719, -94.74700927734375, -91.57746887207031, -88.40792846679688, -85.23838806152344, -82.06884765625, -78.89930725097656, -75.72977447509766, -72.56023406982422, -69.39069366455078, -66.22115325927734, -63.051612854003906, -59.88207244873047, -56.7125358581543, -53.54299545288086, -50.37345504760742, -47.20391845703125, -44.03437805175781, -40.864837646484375, -37.69529724121094, -34.5257568359375, -31.356220245361328, -28.18667984008789, -25.017139434814453, -21.84760093688965, -18.678062438964844, -15.508522033691406, -12.338982582092285, -9.169443130493164, -5.999903678894043, -2.830364227294922, 0.3391752243041992, 3.5087146759033203, 6.678253173828125, 9.847793579101562, 13.017333030700684, 16.186872482299805, 19.35641098022461, 22.525951385498047, 25.695491790771484, 28.86503028869629, 32.034568786621094, 35.20410919189453, 38.37364959716797, 41.543190002441406, 44.71272659301758, 47.882266998291016, 51.05180740356445, 54.221343994140625, 57.39088439941406, 60.5604248046875]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 11.0, 6.0, 8.0, 11.0, 14.0, 14.0, 15.0, 24.0, 26.0, 20.0, 24.0, 26.0, 34.0, 34.0, 35.0, 50.0, 23.0, 55.0, 44.0, 32.0, 28.0, 45.0, 37.0, 41.0, 33.0, 32.0, 21.0, 28.0, 29.0, 23.0, 19.0, 27.0, 17.0, 17.0, 16.0, 12.0, 13.0, 9.0, 12.0, 6.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-38.20566177368164, -37.06896209716797, -35.93226623535156, -34.79556655883789, -33.65886688232422, -32.52217102050781, -31.38547134399414, -30.2487735748291, -29.112075805664062, -27.975378036499023, -26.83867835998535, -25.701980590820312, -24.565282821655273, -23.428585052490234, -22.291885375976562, -21.155187606811523, -20.01848793029785, -18.881790161132812, -17.74509048461914, -16.6083927154541, -15.471694946289062, -14.334996223449707, -13.198297500610352, -12.061599731445312, -10.924901008605957, -9.788202285766602, -8.651504516601562, -7.514805793762207, -6.37810754776001, -5.2414093017578125, -4.104710578918457, -2.9680123329162598, -1.8313140869140625, -0.6946157217025757, 0.44208264350891113, 1.5787811279296875, 2.7154793739318848, 3.852177619934082, 4.9888763427734375, 6.125574588775635, 7.262272834777832, 8.398971557617188, 9.535669326782227, 10.672368049621582, 11.809066772460938, 12.945764541625977, 14.082463264465332, 15.219161987304688, 16.355859756469727, 17.492557525634766, 18.629257202148438, 19.765954971313477, 20.902652740478516, 22.039352416992188, 23.176050186157227, 24.312747955322266, 25.449447631835938, 26.586145401000977, 27.72284507751465, 28.859542846679688, 29.996240615844727, 31.132938385009766, 32.26963806152344, 33.40633773803711, 34.543033599853516]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 3.0, 9.0, 7.0, 11.0, 19.0, 15.0, 18.0, 23.0, 18.0, 26.0, 20.0, 42.0, 39.0, 44.0, 54.0, 47.0, 45.0, 41.0, 47.0, 40.0, 41.0, 48.0, 36.0, 33.0, 33.0, 31.0, 30.0, 26.0, 21.0, 18.0, 24.0, 16.0, 14.0, 15.0, 8.0, 8.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.03515625, -4.87908935546875, -4.7230224609375, -4.56695556640625, -4.410888671875, -4.25482177734375, -4.0987548828125, -3.94268798828125, -3.78662109375, -3.63055419921875, -3.4744873046875, -3.31842041015625, -3.162353515625, -3.00628662109375, -2.8502197265625, -2.69415283203125, -2.5380859375, -2.38201904296875, -2.2259521484375, -2.06988525390625, -1.913818359375, -1.75775146484375, -1.6016845703125, -1.44561767578125, -1.28955078125, -1.13348388671875, -0.9774169921875, -0.82135009765625, -0.665283203125, -0.50921630859375, -0.3531494140625, -0.19708251953125, -0.041015625, 0.11505126953125, 0.2711181640625, 0.42718505859375, 0.583251953125, 0.73931884765625, 0.8953857421875, 1.05145263671875, 1.20751953125, 1.36358642578125, 1.5196533203125, 1.67572021484375, 1.831787109375, 1.98785400390625, 2.1439208984375, 2.29998779296875, 2.4560546875, 2.61212158203125, 2.7681884765625, 2.92425537109375, 3.080322265625, 3.23638916015625, 3.3924560546875, 3.54852294921875, 3.70458984375, 3.86065673828125, 4.0167236328125, 4.17279052734375, 4.328857421875, 4.48492431640625, 4.6409912109375, 4.79705810546875, 4.953125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 8.0, 17.0, 24.0, 30.0, 41.0, 74.0, 79.0, 152.0, 188.0, 321.0, 513.0, 720.0, 1133.0, 1685.0, 2546.0, 4023.0, 5982.0, 9394.0, 14316.0, 23056.0, 37659.0, 64805.0, 120692.0, 242815.0, 236673.0, 117758.0, 63420.0, 37107.0, 22471.0, 14272.0, 9229.0, 6102.0, 3851.0, 2573.0, 1623.0, 1056.0, 728.0, 489.0, 315.0, 202.0, 142.0, 95.0, 59.0, 45.0, 23.0, 16.0, 14.0, 13.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.83984375, -0.8127365112304688, -0.7856292724609375, -0.7585220336914062, -0.731414794921875, -0.7043075561523438, -0.6772003173828125, -0.6500930786132812, -0.62298583984375, -0.5958786010742188, -0.5687713623046875, -0.5416641235351562, -0.514556884765625, -0.48744964599609375, -0.4603424072265625, -0.43323516845703125, -0.4061279296875, -0.37902069091796875, -0.3519134521484375, -0.32480621337890625, -0.297698974609375, -0.27059173583984375, -0.2434844970703125, -0.21637725830078125, -0.18927001953125, -0.16216278076171875, -0.1350555419921875, -0.10794830322265625, -0.080841064453125, -0.05373382568359375, -0.0266265869140625, 0.00048065185546875, 0.027587890625, 0.05469512939453125, 0.0818023681640625, 0.10890960693359375, 0.136016845703125, 0.16312408447265625, 0.1902313232421875, 0.21733856201171875, 0.24444580078125, 0.27155303955078125, 0.2986602783203125, 0.32576751708984375, 0.352874755859375, 0.37998199462890625, 0.4070892333984375, 0.43419647216796875, 0.4613037109375, 0.48841094970703125, 0.5155181884765625, 0.5426254272460938, 0.569732666015625, 0.5968399047851562, 0.6239471435546875, 0.6510543823242188, 0.67816162109375, 0.7052688598632812, 0.7323760986328125, 0.7594833374023438, 0.786590576171875, 0.8136978149414062, 0.8408050537109375, 0.8679122924804688, 0.89501953125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 4.0, 6.0, 6.0, 8.0, 14.0, 12.0, 10.0, 15.0, 17.0, 28.0, 28.0, 28.0, 30.0, 28.0, 29.0, 46.0, 29.0, 30.0, 46.0, 53.0, 1062.0, 42.0, 46.0, 31.0, 29.0, 41.0, 39.0, 34.0, 35.0, 31.0, 38.0, 20.0, 19.0, 18.0, 17.0, 11.0, 14.0, 10.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-3.59765625, -3.50146484375, -3.4052734375, -3.30908203125, -3.212890625, -3.11669921875, -3.0205078125, -2.92431640625, -2.828125, -2.73193359375, -2.6357421875, -2.53955078125, -2.443359375, -2.34716796875, -2.2509765625, -2.15478515625, -2.05859375, -1.96240234375, -1.8662109375, -1.77001953125, -1.673828125, -1.57763671875, -1.4814453125, -1.38525390625, -1.2890625, -1.19287109375, -1.0966796875, -1.00048828125, -0.904296875, -0.80810546875, -0.7119140625, -0.61572265625, -0.51953125, -0.42333984375, -0.3271484375, -0.23095703125, -0.134765625, -0.03857421875, 0.0576171875, 0.15380859375, 0.25, 0.34619140625, 0.4423828125, 0.53857421875, 0.634765625, 0.73095703125, 0.8271484375, 0.92333984375, 1.01953125, 1.11572265625, 1.2119140625, 1.30810546875, 1.404296875, 1.50048828125, 1.5966796875, 1.69287109375, 1.7890625, 1.88525390625, 1.9814453125, 2.07763671875, 2.173828125, 2.27001953125, 2.3662109375, 2.46240234375, 2.55859375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 12.0, 10.0, 23.0, 40.0, 40.0, 52.0, 97.0, 143.0, 201.0, 312.0, 464.0, 672.0, 1104.0, 1578.0, 2585.0, 4238.0, 6969.0, 11672.0, 19719.0, 34247.0, 60261.0, 114912.0, 249843.0, 1313982.0, 121514.0, 64341.0, 36027.0, 20753.0, 12049.0, 7383.0, 4429.0, 2678.0, 1733.0, 1045.0, 692.0, 428.0, 300.0, 172.0, 148.0, 85.0, 48.0, 48.0, 21.0, 16.0, 15.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.87158203125, -0.8425674438476562, -0.8135528564453125, -0.7845382690429688, -0.755523681640625, -0.7265090942382812, -0.6974945068359375, -0.6684799194335938, -0.63946533203125, -0.6104507446289062, -0.5814361572265625, -0.5524215698242188, -0.523406982421875, -0.49439239501953125, -0.4653778076171875, -0.43636322021484375, -0.4073486328125, -0.37833404541015625, -0.3493194580078125, -0.32030487060546875, -0.291290283203125, -0.26227569580078125, -0.2332611083984375, -0.20424652099609375, -0.17523193359375, -0.14621734619140625, -0.1172027587890625, -0.08818817138671875, -0.059173583984375, -0.03015899658203125, -0.0011444091796875, 0.02787017822265625, 0.056884765625, 0.08589935302734375, 0.1149139404296875, 0.14392852783203125, 0.172943115234375, 0.20195770263671875, 0.2309722900390625, 0.25998687744140625, 0.28900146484375, 0.31801605224609375, 0.3470306396484375, 0.37604522705078125, 0.405059814453125, 0.43407440185546875, 0.4630889892578125, 0.49210357666015625, 0.5211181640625, 0.5501327514648438, 0.5791473388671875, 0.6081619262695312, 0.637176513671875, 0.6661911010742188, 0.6952056884765625, 0.7242202758789062, 0.75323486328125, 0.7822494506835938, 0.8112640380859375, 0.8402786254882812, 0.869293212890625, 0.8983078002929688, 0.9273223876953125, 0.9563369750976562, 0.9853515625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 5.0, 4.0, 6.0, 13.0, 7.0, 8.0, 9.0, 18.0, 13.0, 21.0, 27.0, 33.0, 23.0, 43.0, 35.0, 45.0, 39.0, 51.0, 36.0, 48.0, 53.0, 41.0, 50.0, 38.0, 32.0, 33.0, 34.0, 33.0, 30.0, 23.0, 27.0, 20.0, 21.0, 10.0, 12.0, 13.0, 7.0, 9.0, 4.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0005354881286621094, -0.0005178079009056091, -0.0005001276731491089, -0.00048244744539260864, -0.0004647672176361084, -0.00044708698987960815, -0.0004294067621231079, -0.00041172653436660767, -0.0003940463066101074, -0.0003763660788536072, -0.00035868585109710693, -0.0003410056233406067, -0.00032332539558410645, -0.0003056451678276062, -0.00028796494007110596, -0.0002702847123146057, -0.00025260448455810547, -0.00023492425680160522, -0.00021724402904510498, -0.00019956380128860474, -0.0001818835735321045, -0.00016420334577560425, -0.000146523118019104, -0.00012884289026260376, -0.00011116266250610352, -9.348243474960327e-05, -7.580220699310303e-05, -5.812197923660278e-05, -4.044175148010254e-05, -2.2761523723602295e-05, -5.081295967102051e-06, 1.2598931789398193e-05, 3.0279159545898438e-05, 4.795938730239868e-05, 6.563961505889893e-05, 8.331984281539917e-05, 0.00010100007057189941, 0.00011868029832839966, 0.0001363605260848999, 0.00015404075384140015, 0.0001717209815979004, 0.00018940120935440063, 0.00020708143711090088, 0.00022476166486740112, 0.00024244189262390137, 0.0002601221203804016, 0.00027780234813690186, 0.0002954825758934021, 0.00031316280364990234, 0.0003308430314064026, 0.00034852325916290283, 0.0003662034869194031, 0.0003838837146759033, 0.00040156394243240356, 0.0004192441701889038, 0.00043692439794540405, 0.0004546046257019043, 0.00047228485345840454, 0.0004899650812149048, 0.000507645308971405, 0.0005253255367279053, 0.0005430057644844055, 0.0005606859922409058, 0.000578366219997406, 0.0005960464477539062]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 3.0, 5.0, 10.0, 14.0, 11.0, 19.0, 18.0, 29.0, 26.0, 39.0, 65.0, 88.0, 102.0, 159.0, 214.0, 328.0, 623.0, 2474.0, 176678.0, 854008.0, 11435.0, 839.0, 435.0, 240.0, 156.0, 150.0, 108.0, 65.0, 57.0, 39.0, 26.0, 17.0, 15.0, 9.0, 10.0, 9.0, 7.0, 5.0, 3.0, 6.0, 0.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01177978515625, -0.011389970779418945, -0.01100015640258789, -0.010610342025756836, -0.010220527648925781, -0.009830713272094727, -0.009440898895263672, -0.009051084518432617, -0.008661270141601562, -0.008271455764770508, -0.007881641387939453, -0.0074918270111083984, -0.007102012634277344, -0.006712198257446289, -0.006322383880615234, -0.00593256950378418, -0.005542755126953125, -0.00515294075012207, -0.004763126373291016, -0.004373311996459961, -0.003983497619628906, -0.0035936832427978516, -0.003203868865966797, -0.002814054489135742, -0.0024242401123046875, -0.002034425735473633, -0.0016446113586425781, -0.0012547969818115234, -0.0008649826049804688, -0.00047516822814941406, -8.535385131835938e-05, 0.0003044605255126953, 0.00069427490234375, 0.0010840892791748047, 0.0014739036560058594, 0.001863718032836914, 0.0022535324096679688, 0.0026433467864990234, 0.003033161163330078, 0.003422975540161133, 0.0038127899169921875, 0.004202604293823242, 0.004592418670654297, 0.0049822330474853516, 0.005372047424316406, 0.005761861801147461, 0.006151676177978516, 0.00654149055480957, 0.006931304931640625, 0.00732111930847168, 0.007710933685302734, 0.008100748062133789, 0.008490562438964844, 0.008880376815795898, 0.009270191192626953, 0.009660005569458008, 0.010049819946289062, 0.010439634323120117, 0.010829448699951172, 0.011219263076782227, 0.011609077453613281, 0.011998891830444336, 0.01238870620727539, 0.012778520584106445, 0.0131683349609375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 44.0, 158.0, 303.0, 340.0, 134.0, 28.0, 5.0], "bins": [-0.0038258617278188467, -0.003762006526812911, -0.003698151558637619, -0.0036342963576316833, -0.0035704411566257477, -0.003506585955619812, -0.00344273098744452, -0.0033788757864385843, -0.0033150205854326487, -0.003251165384426713, -0.003187310416251421, -0.0031234552152454853, -0.0030596000142395496, -0.002995744813233614, -0.002931889845058322, -0.0028680346440523863, -0.0028041796758770943, -0.0027403244748711586, -0.0026764695066958666, -0.002612614305689931, -0.0025487591046839952, -0.0024849039036780596, -0.0024210489355027676, -0.002357193734496832, -0.0022933385334908962, -0.0022294833324849606, -0.0021656283643096685, -0.002101773163303733, -0.002037917962297797, -0.0019740627612918615, -0.0019102077931165695, -0.0018463525921106339, -0.0017824972746893764, -0.0017186421900987625, -0.0016547869890928268, -0.001590931904502213, -0.0015270767034962773, -0.0014632216189056635, -0.0013993664178997278, -0.001335511333309114, -0.0012716562487185001, -0.0012078011641278863, -0.0011439459631219506, -0.0010800908785313368, -0.0010162356775254011, -0.0009523805929347873, -0.0008885254501365125, -0.0008246703073382378, -0.0007608151063323021, -0.0006969599635340273, -0.0006331048207357526, -0.0005692497361451387, -0.0005053945351392031, -0.00044153942144475877, -0.0003776843077503145, -0.0003138291649520397, -0.00024997402215376496, -0.0001861188793554902, -0.00012226375110913068, -5.8408622862771153e-05, 5.446519935503602e-06, 6.930166273377836e-05, 0.00013315677642822266, 0.0001970119192264974, 0.00026086706202477217]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 4.0, 5.0, 10.0, 8.0, 16.0, 18.0, 14.0, 22.0, 20.0, 20.0, 23.0, 30.0, 40.0, 33.0, 25.0, 37.0, 44.0, 34.0, 47.0, 33.0, 39.0, 44.0, 40.0, 19.0, 34.0, 33.0, 31.0, 27.0, 20.0, 34.0, 19.0, 18.0, 23.0, 16.0, 29.0, 16.0, 17.0, 5.0, 13.0, 3.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00032132863998413086, -0.0003111995756626129, -0.00030107051134109497, -0.000290941447019577, -0.0002808123826980591, -0.00027068331837654114, -0.0002605542540550232, -0.00025042518973350525, -0.0002402961254119873, -0.00023016706109046936, -0.00022003799676895142, -0.00020990893244743347, -0.00019977986812591553, -0.00018965080380439758, -0.00017952173948287964, -0.0001693926751613617, -0.00015926361083984375, -0.0001491345465183258, -0.00013900548219680786, -0.00012887641787528992, -0.00011874735355377197, -0.00010861828923225403, -9.848922491073608e-05, -8.836016058921814e-05, -7.82310962677002e-05, -6.810203194618225e-05, -5.797296762466431e-05, -4.784390330314636e-05, -3.771483898162842e-05, -2.7585774660110474e-05, -1.745671033859253e-05, -7.327646017074585e-06, 2.8014183044433594e-06, 1.2930482625961304e-05, 2.3059546947479248e-05, 3.318861126899719e-05, 4.331767559051514e-05, 5.344673991203308e-05, 6.357580423355103e-05, 7.370486855506897e-05, 8.383393287658691e-05, 9.396299719810486e-05, 0.0001040920615196228, 0.00011422112584114075, 0.0001243501901626587, 0.00013447925448417664, 0.00014460831880569458, 0.00015473738312721252, 0.00016486644744873047, 0.0001749955117702484, 0.00018512457609176636, 0.0001952536404132843, 0.00020538270473480225, 0.0002155117690563202, 0.00022564083337783813, 0.00023576989769935608, 0.000245898962020874, 0.00025602802634239197, 0.0002661570906639099, 0.00027628615498542786, 0.0002864152193069458, 0.00029654428362846375, 0.0003066733479499817, 0.00031680241227149963, 0.0003269314765930176]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 3.0, 9.0, 7.0, 11.0, 19.0, 15.0, 18.0, 23.0, 18.0, 26.0, 20.0, 42.0, 39.0, 44.0, 54.0, 47.0, 45.0, 41.0, 47.0, 40.0, 41.0, 48.0, 36.0, 33.0, 33.0, 31.0, 30.0, 26.0, 21.0, 18.0, 24.0, 16.0, 14.0, 15.0, 8.0, 8.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.03515625, -4.87908935546875, -4.7230224609375, -4.56695556640625, -4.410888671875, -4.25482177734375, -4.0987548828125, -3.94268798828125, -3.78662109375, -3.63055419921875, -3.4744873046875, -3.31842041015625, -3.162353515625, -3.00628662109375, -2.8502197265625, -2.69415283203125, -2.5380859375, -2.38201904296875, -2.2259521484375, -2.06988525390625, -1.913818359375, -1.75775146484375, -1.6016845703125, -1.44561767578125, -1.28955078125, -1.13348388671875, -0.9774169921875, -0.82135009765625, -0.665283203125, -0.50921630859375, -0.3531494140625, -0.19708251953125, -0.041015625, 0.11505126953125, 0.2711181640625, 0.42718505859375, 0.583251953125, 0.73931884765625, 0.8953857421875, 1.05145263671875, 1.20751953125, 1.36358642578125, 1.5196533203125, 1.67572021484375, 1.831787109375, 1.98785400390625, 2.1439208984375, 2.29998779296875, 2.4560546875, 2.61212158203125, 2.7681884765625, 2.92425537109375, 3.080322265625, 3.23638916015625, 3.3924560546875, 3.54852294921875, 3.70458984375, 3.86065673828125, 4.0167236328125, 4.17279052734375, 4.328857421875, 4.48492431640625, 4.6409912109375, 4.79705810546875, 4.953125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 7.0, 12.0, 14.0, 11.0, 23.0, 32.0, 37.0, 44.0, 84.0, 122.0, 178.0, 371.0, 682.0, 1398.0, 2739.0, 5711.0, 11811.0, 27437.0, 72034.0, 239917.0, 418224.0, 172983.0, 53999.0, 21579.0, 9778.0, 4613.0, 2151.0, 1074.0, 636.0, 325.0, 187.0, 97.0, 66.0, 45.0, 34.0, 24.0, 19.0, 15.0, 10.0, 8.0, 10.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.58203125, -5.404052734375, -5.22607421875, -5.048095703125, -4.8701171875, -4.692138671875, -4.51416015625, -4.336181640625, -4.158203125, -3.980224609375, -3.80224609375, -3.624267578125, -3.4462890625, -3.268310546875, -3.09033203125, -2.912353515625, -2.734375, -2.556396484375, -2.37841796875, -2.200439453125, -2.0224609375, -1.844482421875, -1.66650390625, -1.488525390625, -1.310546875, -1.132568359375, -0.95458984375, -0.776611328125, -0.5986328125, -0.420654296875, -0.24267578125, -0.064697265625, 0.11328125, 0.291259765625, 0.46923828125, 0.647216796875, 0.8251953125, 1.003173828125, 1.18115234375, 1.359130859375, 1.537109375, 1.715087890625, 1.89306640625, 2.071044921875, 2.2490234375, 2.427001953125, 2.60498046875, 2.782958984375, 2.9609375, 3.138916015625, 3.31689453125, 3.494873046875, 3.6728515625, 3.850830078125, 4.02880859375, 4.206787109375, 4.384765625, 4.562744140625, 4.74072265625, 4.918701171875, 5.0966796875, 5.274658203125, 5.45263671875, 5.630615234375, 5.80859375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 2.0, 9.0, 7.0, 11.0, 9.0, 10.0, 16.0, 13.0, 30.0, 22.0, 24.0, 27.0, 30.0, 44.0, 53.0, 52.0, 103.0, 165.0, 1413.0, 364.0, 164.0, 76.0, 59.0, 45.0, 42.0, 34.0, 27.0, 26.0, 31.0, 27.0, 12.0, 12.0, 16.0, 11.0, 12.0, 10.0, 5.0, 8.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-19.109375, -18.57763671875, -18.0458984375, -17.51416015625, -16.982421875, -16.45068359375, -15.9189453125, -15.38720703125, -14.85546875, -14.32373046875, -13.7919921875, -13.26025390625, -12.728515625, -12.19677734375, -11.6650390625, -11.13330078125, -10.6015625, -10.06982421875, -9.5380859375, -9.00634765625, -8.474609375, -7.94287109375, -7.4111328125, -6.87939453125, -6.34765625, -5.81591796875, -5.2841796875, -4.75244140625, -4.220703125, -3.68896484375, -3.1572265625, -2.62548828125, -2.09375, -1.56201171875, -1.0302734375, -0.49853515625, 0.033203125, 0.56494140625, 1.0966796875, 1.62841796875, 2.16015625, 2.69189453125, 3.2236328125, 3.75537109375, 4.287109375, 4.81884765625, 5.3505859375, 5.88232421875, 6.4140625, 6.94580078125, 7.4775390625, 8.00927734375, 8.541015625, 9.07275390625, 9.6044921875, 10.13623046875, 10.66796875, 11.19970703125, 11.7314453125, 12.26318359375, 12.794921875, 13.32666015625, 13.8583984375, 14.39013671875, 14.921875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 8.0, 13.0, 14.0, 8.0, 26.0, 41.0, 41.0, 61.0, 75.0, 123.0, 188.0, 405.0, 836.0, 9669.0, 3045399.0, 85995.0, 1619.0, 453.0, 239.0, 152.0, 90.0, 66.0, 41.0, 28.0, 32.0, 23.0, 9.0, 11.0, 6.0, 5.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.09375, -46.52734375, -44.9609375, -43.39453125, -41.828125, -40.26171875, -38.6953125, -37.12890625, -35.5625, -33.99609375, -32.4296875, -30.86328125, -29.296875, -27.73046875, -26.1640625, -24.59765625, -23.03125, -21.46484375, -19.8984375, -18.33203125, -16.765625, -15.19921875, -13.6328125, -12.06640625, -10.5, -8.93359375, -7.3671875, -5.80078125, -4.234375, -2.66796875, -1.1015625, 0.46484375, 2.03125, 3.59765625, 5.1640625, 6.73046875, 8.296875, 9.86328125, 11.4296875, 12.99609375, 14.5625, 16.12890625, 17.6953125, 19.26171875, 20.828125, 22.39453125, 23.9609375, 25.52734375, 27.09375, 28.66015625, 30.2265625, 31.79296875, 33.359375, 34.92578125, 36.4921875, 38.05859375, 39.625, 41.19140625, 42.7578125, 44.32421875, 45.890625, 47.45703125, 49.0234375, 50.58984375, 52.15625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 13.0, 38.0, 110.0, 216.0, 274.0, 216.0, 96.0, 37.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.981849670410156, -31.286474227905273, -29.59109878540039, -27.895723342895508, -26.200347900390625, -24.50497055053711, -22.80959701538086, -21.114219665527344, -19.418846130371094, -17.72347068786621, -16.028095245361328, -14.332719802856445, -12.637344360351562, -10.941967964172363, -9.24659252166748, -7.551217079162598, -5.855840682983398, -4.160465240478516, -2.4650895595550537, -0.7697138786315918, 0.925661563873291, 2.621037483215332, 4.316412925720215, 6.011788368225098, 7.7071638107299805, 9.402539253234863, 11.097914695739746, 12.793291091918945, 14.488666534423828, 16.18404197692871, 17.879417419433594, 19.574792861938477, 21.27016830444336, 22.965543746948242, 24.660919189453125, 26.356294631958008, 28.05167007446289, 29.747047424316406, 31.442420959472656, 33.13779830932617, 34.83317184448242, 36.52854919433594, 38.22392272949219, 39.9193000793457, 41.61467361450195, 43.31005096435547, 45.00542449951172, 46.700801849365234, 48.39617919921875, 50.091556549072266, 51.786930084228516, 53.48230743408203, 55.17768096923828, 56.8730583190918, 58.56843185424805, 60.26380920410156, 61.95918273925781, 63.65456008911133, 65.34993743896484, 67.0453109741211, 68.74068450927734, 70.4360580444336, 72.13143920898438, 73.82681274414062, 75.52218627929688]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 10.0, 6.0, 8.0, 9.0, 8.0, 19.0, 12.0, 15.0, 21.0, 30.0, 29.0, 37.0, 32.0, 28.0, 33.0, 36.0, 49.0, 37.0, 49.0, 53.0, 36.0, 45.0, 34.0, 30.0, 41.0, 30.0, 47.0, 37.0, 22.0, 18.0, 17.0, 20.0, 19.0, 22.0, 15.0, 12.0, 6.0, 9.0, 3.0, 9.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-47.60844421386719, -46.23941421508789, -44.870384216308594, -43.5013542175293, -42.13232421875, -40.7632942199707, -39.394264221191406, -38.025230407714844, -36.65620422363281, -35.287174224853516, -33.91814422607422, -32.54911422729492, -31.180084228515625, -29.811054229736328, -28.4420223236084, -27.0729923248291, -25.703960418701172, -24.334930419921875, -22.965900421142578, -21.59687042236328, -20.227840423583984, -18.858810424804688, -17.489778518676758, -16.12074851989746, -14.751718521118164, -13.382688522338867, -12.01365852355957, -10.644627571105957, -9.27559757232666, -7.906567573547363, -6.53753662109375, -5.168506622314453, -3.7994728088378906, -2.4304425716400146, -1.0614123344421387, 0.3076181411743164, 1.6766481399536133, 3.04567813873291, 4.414709091186523, 5.78373908996582, 7.152769088745117, 8.521799087524414, 9.890829086303711, 11.259860038757324, 12.628890037536621, 13.997920036315918, 15.366950988769531, 16.735980987548828, 18.105010986328125, 19.474040985107422, 20.84307098388672, 22.212100982666016, 23.581130981445312, 24.95016098022461, 26.31919288635254, 27.688222885131836, 29.057252883911133, 30.42628288269043, 31.795312881469727, 33.164344787597656, 34.53337478637695, 35.90240478515625, 37.27143478393555, 38.640464782714844, 40.00949478149414]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 4.0, 5.0, 13.0, 12.0, 11.0, 18.0, 20.0, 17.0, 20.0, 27.0, 32.0, 38.0, 40.0, 44.0, 41.0, 46.0, 46.0, 34.0, 52.0, 49.0, 46.0, 42.0, 36.0, 29.0, 35.0, 33.0, 29.0, 24.0, 23.0, 16.0, 28.0, 15.0, 15.0, 10.0, 14.0, 7.0, 10.0, 0.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1875, -5.0220947265625, -4.856689453125, -4.6912841796875, -4.52587890625, -4.3604736328125, -4.195068359375, -4.0296630859375, -3.8642578125, -3.6988525390625, -3.533447265625, -3.3680419921875, -3.20263671875, -3.0372314453125, -2.871826171875, -2.7064208984375, -2.541015625, -2.3756103515625, -2.210205078125, -2.0447998046875, -1.87939453125, -1.7139892578125, -1.548583984375, -1.3831787109375, -1.2177734375, -1.0523681640625, -0.886962890625, -0.7215576171875, -0.55615234375, -0.3907470703125, -0.225341796875, -0.0599365234375, 0.10546875, 0.2708740234375, 0.436279296875, 0.6016845703125, 0.76708984375, 0.9324951171875, 1.097900390625, 1.2633056640625, 1.4287109375, 1.5941162109375, 1.759521484375, 1.9249267578125, 2.09033203125, 2.2557373046875, 2.421142578125, 2.5865478515625, 2.751953125, 2.9173583984375, 3.082763671875, 3.2481689453125, 3.41357421875, 3.5789794921875, 3.744384765625, 3.9097900390625, 4.0751953125, 4.2406005859375, 4.406005859375, 4.5714111328125, 4.73681640625, 4.9022216796875, 5.067626953125, 5.2330322265625, 5.3984375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 10.0, 6.0, 9.0, 6.0, 11.0, 7.0, 13.0, 21.0, 20.0, 23.0, 32.0, 40.0, 37.0, 63.0, 63.0, 109.0, 168.0, 351.0, 1070.0, 14172.0, 1299243.0, 2834428.0, 41576.0, 1712.0, 408.0, 180.0, 119.0, 78.0, 66.0, 45.0, 41.0, 31.0, 31.0, 17.0, 15.0, 13.0, 13.0, 14.0, 6.0, 10.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.890625, -23.123291015625, -22.35595703125, -21.588623046875, -20.8212890625, -20.053955078125, -19.28662109375, -18.519287109375, -17.751953125, -16.984619140625, -16.21728515625, -15.449951171875, -14.6826171875, -13.915283203125, -13.14794921875, -12.380615234375, -11.61328125, -10.845947265625, -10.07861328125, -9.311279296875, -8.5439453125, -7.776611328125, -7.00927734375, -6.241943359375, -5.474609375, -4.707275390625, -3.93994140625, -3.172607421875, -2.4052734375, -1.637939453125, -0.87060546875, -0.103271484375, 0.6640625, 1.431396484375, 2.19873046875, 2.966064453125, 3.7333984375, 4.500732421875, 5.26806640625, 6.035400390625, 6.802734375, 7.570068359375, 8.33740234375, 9.104736328125, 9.8720703125, 10.639404296875, 11.40673828125, 12.174072265625, 12.94140625, 13.708740234375, 14.47607421875, 15.243408203125, 16.0107421875, 16.778076171875, 17.54541015625, 18.312744140625, 19.080078125, 19.847412109375, 20.61474609375, 21.382080078125, 22.1494140625, 22.916748046875, 23.68408203125, 24.451416015625, 25.21875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 15.0, 27.0, 27.0, 43.0, 91.0, 98.0, 177.0, 277.0, 406.0, 516.0, 611.0, 605.0, 408.0, 249.0, 200.0, 105.0, 89.0, 44.0, 31.0, 12.0, 13.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.625, -13.091552734375, -12.55810546875, -12.024658203125, -11.4912109375, -10.957763671875, -10.42431640625, -9.890869140625, -9.357421875, -8.823974609375, -8.29052734375, -7.757080078125, -7.2236328125, -6.690185546875, -6.15673828125, -5.623291015625, -5.08984375, -4.556396484375, -4.02294921875, -3.489501953125, -2.9560546875, -2.422607421875, -1.88916015625, -1.355712890625, -0.822265625, -0.288818359375, 0.24462890625, 0.778076171875, 1.3115234375, 1.844970703125, 2.37841796875, 2.911865234375, 3.4453125, 3.978759765625, 4.51220703125, 5.045654296875, 5.5791015625, 6.112548828125, 6.64599609375, 7.179443359375, 7.712890625, 8.246337890625, 8.77978515625, 9.313232421875, 9.8466796875, 10.380126953125, 10.91357421875, 11.447021484375, 11.98046875, 12.513916015625, 13.04736328125, 13.580810546875, 14.1142578125, 14.647705078125, 15.18115234375, 15.714599609375, 16.248046875, 16.781494140625, 17.31494140625, 17.848388671875, 18.3818359375, 18.915283203125, 19.44873046875, 19.982177734375, 20.515625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 5.0, 15.0, 18.0, 23.0, 45.0, 70.0, 119.0, 178.0, 250.0, 450.0, 970.0, 8430.0, 1497427.0, 2670153.0, 13627.0, 1191.0, 507.0, 247.0, 185.0, 118.0, 77.0, 39.0, 56.0, 21.0, 20.0, 15.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.28125, -55.81494140625, -54.3486328125, -52.88232421875, -51.416015625, -49.94970703125, -48.4833984375, -47.01708984375, -45.55078125, -44.08447265625, -42.6181640625, -41.15185546875, -39.685546875, -38.21923828125, -36.7529296875, -35.28662109375, -33.8203125, -32.35400390625, -30.8876953125, -29.42138671875, -27.955078125, -26.48876953125, -25.0224609375, -23.55615234375, -22.08984375, -20.62353515625, -19.1572265625, -17.69091796875, -16.224609375, -14.75830078125, -13.2919921875, -11.82568359375, -10.359375, -8.89306640625, -7.4267578125, -5.96044921875, -4.494140625, -3.02783203125, -1.5615234375, -0.09521484375, 1.37109375, 2.83740234375, 4.3037109375, 5.77001953125, 7.236328125, 8.70263671875, 10.1689453125, 11.63525390625, 13.1015625, 14.56787109375, 16.0341796875, 17.50048828125, 18.966796875, 20.43310546875, 21.8994140625, 23.36572265625, 24.83203125, 26.29833984375, 27.7646484375, 29.23095703125, 30.697265625, 32.16357421875, 33.6298828125, 35.09619140625, 36.5625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 15.0, 26.0, 46.0, 51.0, 87.0, 112.0, 109.0, 88.0, 97.0, 106.0, 78.0, 59.0, 47.0, 30.0, 13.0, 15.0, 10.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.70492172241211, -33.90251922607422, -32.100120544433594, -30.297718048095703, -28.495315551757812, -26.692914962768555, -24.890514373779297, -23.088111877441406, -21.28571128845215, -19.48331069946289, -17.680908203125, -15.878507614135742, -14.076106071472168, -12.273704528808594, -10.471303939819336, -8.668902397155762, -6.8665008544921875, -5.064099311828613, -3.2616982460021973, -1.4592971801757812, 0.34310436248779297, 2.145505905151367, 3.947906494140625, 5.750308036804199, 7.552709579467773, 9.355111122131348, 11.157512664794922, 12.95991325378418, 14.762314796447754, 16.564716339111328, 18.367116928100586, 20.169517517089844, 21.971923828125, 23.774324417114258, 25.57672691345215, 27.379127502441406, 29.181529998779297, 30.983930587768555, 32.78633117675781, 34.5887336730957, 36.391136169433594, 38.193538665771484, 39.99593734741211, 41.79833984375, 43.60074234008789, 45.40314483642578, 47.205543518066406, 49.0079460144043, 50.81034469604492, 52.61274719238281, 54.41514587402344, 56.21754837036133, 58.01995086669922, 59.822349548339844, 61.624752044677734, 63.427154541015625, 65.22955322265625, 67.03195190429688, 68.83435821533203, 70.63675689697266, 72.43915557861328, 74.24156188964844, 76.04396057128906, 77.84635925292969, 79.64876556396484]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 8.0, 8.0, 9.0, 7.0, 9.0, 18.0, 15.0, 12.0, 13.0, 21.0, 28.0, 26.0, 21.0, 28.0, 34.0, 30.0, 38.0, 40.0, 36.0, 41.0, 43.0, 46.0, 42.0, 47.0, 47.0, 33.0, 31.0, 33.0, 31.0, 25.0, 35.0, 25.0, 18.0, 24.0, 13.0, 15.0, 9.0, 16.0, 9.0, 9.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.850093841552734, -41.62049102783203, -40.39088821411133, -39.16128921508789, -37.93168640136719, -36.702083587646484, -35.47248077392578, -34.24287796020508, -33.013275146484375, -31.783672332763672, -30.5540714263916, -29.3244686126709, -28.094867706298828, -26.865264892578125, -25.635662078857422, -24.40605926513672, -23.17646026611328, -21.946857452392578, -20.717256546020508, -19.487653732299805, -18.258052825927734, -17.02845001220703, -15.798847198486328, -14.569245338439941, -13.339643478393555, -12.110041618347168, -10.880439758300781, -9.650836944580078, -8.421235084533691, -7.191633224487305, -5.96203088760376, -4.732428550720215, -3.5028228759765625, -2.2732207775115967, -1.0436186790466309, 0.18598341941833496, 1.4155855178833008, 2.6451873779296875, 3.8747897148132324, 5.104392051696777, 6.333993911743164, 7.563595771789551, 8.793197631835938, 10.02280044555664, 11.252402305603027, 12.482004165649414, 13.711606979370117, 14.941208839416504, 16.17081069946289, 17.400413513183594, 18.630014419555664, 19.859617233276367, 21.089218139648438, 22.31882095336914, 23.548423767089844, 24.778026580810547, 26.007627487182617, 27.23723030090332, 28.46683120727539, 29.696434020996094, 30.926036834716797, 32.1556396484375, 33.38523864746094, 34.61484146118164, 35.844444274902344]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 1.0, 9.0, 6.0, 9.0, 10.0, 10.0, 7.0, 22.0, 23.0, 21.0, 18.0, 37.0, 30.0, 33.0, 53.0, 41.0, 43.0, 40.0, 47.0, 47.0, 39.0, 37.0, 34.0, 41.0, 35.0, 44.0, 26.0, 31.0, 30.0, 40.0, 21.0, 21.0, 16.0, 17.0, 10.0, 11.0, 8.0, 11.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3359375, -5.16973876953125, -5.0035400390625, -4.83734130859375, -4.671142578125, -4.50494384765625, -4.3387451171875, -4.17254638671875, -4.00634765625, -3.84014892578125, -3.6739501953125, -3.50775146484375, -3.341552734375, -3.17535400390625, -3.0091552734375, -2.84295654296875, -2.6767578125, -2.51055908203125, -2.3443603515625, -2.17816162109375, -2.011962890625, -1.84576416015625, -1.6795654296875, -1.51336669921875, -1.34716796875, -1.18096923828125, -1.0147705078125, -0.84857177734375, -0.682373046875, -0.51617431640625, -0.3499755859375, -0.18377685546875, -0.017578125, 0.14862060546875, 0.3148193359375, 0.48101806640625, 0.647216796875, 0.81341552734375, 0.9796142578125, 1.14581298828125, 1.31201171875, 1.47821044921875, 1.6444091796875, 1.81060791015625, 1.976806640625, 2.14300537109375, 2.3092041015625, 2.47540283203125, 2.6416015625, 2.80780029296875, 2.9739990234375, 3.14019775390625, 3.306396484375, 3.47259521484375, 3.6387939453125, 3.80499267578125, 3.97119140625, 4.13739013671875, 4.3035888671875, 4.46978759765625, 4.635986328125, 4.80218505859375, 4.9683837890625, 5.13458251953125, 5.30078125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 13.0, 20.0, 10.0, 28.0, 40.0, 57.0, 94.0, 142.0, 194.0, 283.0, 395.0, 609.0, 937.0, 1342.0, 1940.0, 3015.0, 4515.0, 7028.0, 10595.0, 16288.0, 26074.0, 41232.0, 69284.0, 118106.0, 219285.0, 221203.0, 120018.0, 69486.0, 42070.0, 26058.0, 16616.0, 10645.0, 6982.0, 4630.0, 3063.0, 2040.0, 1331.0, 903.0, 631.0, 447.0, 279.0, 177.0, 148.0, 94.0, 64.0, 39.0, 38.0, 25.0, 14.0, 7.0, 8.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80419921875, -0.7782669067382812, -0.7523345947265625, -0.7264022827148438, -0.700469970703125, -0.6745376586914062, -0.6486053466796875, -0.6226730346679688, -0.59674072265625, -0.5708084106445312, -0.5448760986328125, -0.5189437866210938, -0.493011474609375, -0.46707916259765625, -0.4411468505859375, -0.41521453857421875, -0.3892822265625, -0.36334991455078125, -0.3374176025390625, -0.31148529052734375, -0.285552978515625, -0.25962066650390625, -0.2336883544921875, -0.20775604248046875, -0.18182373046875, -0.15589141845703125, -0.1299591064453125, -0.10402679443359375, -0.078094482421875, -0.05216217041015625, -0.0262298583984375, -0.00029754638671875, 0.025634765625, 0.05156707763671875, 0.0774993896484375, 0.10343170166015625, 0.129364013671875, 0.15529632568359375, 0.1812286376953125, 0.20716094970703125, 0.23309326171875, 0.25902557373046875, 0.2849578857421875, 0.31089019775390625, 0.336822509765625, 0.36275482177734375, 0.3886871337890625, 0.41461944580078125, 0.4405517578125, 0.46648406982421875, 0.4924163818359375, 0.5183486938476562, 0.544281005859375, 0.5702133178710938, 0.5961456298828125, 0.6220779418945312, 0.64801025390625, 0.6739425659179688, 0.6998748779296875, 0.7258071899414062, 0.751739501953125, 0.7776718139648438, 0.8036041259765625, 0.8295364379882812, 0.85546875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 12.0, 2.0, 16.0, 14.0, 18.0, 22.0, 19.0, 16.0, 22.0, 34.0, 26.0, 42.0, 31.0, 33.0, 29.0, 37.0, 49.0, 34.0, 39.0, 1072.0, 44.0, 41.0, 41.0, 34.0, 41.0, 27.0, 28.0, 25.0, 25.0, 18.0, 25.0, 16.0, 11.0, 16.0, 18.0, 11.0, 13.0, 2.0, 12.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.909881591796875, -2.80999755859375, -2.710113525390625, -2.6102294921875, -2.510345458984375, -2.41046142578125, -2.310577392578125, -2.210693359375, -2.110809326171875, -2.01092529296875, -1.911041259765625, -1.8111572265625, -1.711273193359375, -1.61138916015625, -1.511505126953125, -1.41162109375, -1.311737060546875, -1.21185302734375, -1.111968994140625, -1.0120849609375, -0.912200927734375, -0.81231689453125, -0.712432861328125, -0.612548828125, -0.512664794921875, -0.41278076171875, -0.312896728515625, -0.2130126953125, -0.113128662109375, -0.01324462890625, 0.086639404296875, 0.1865234375, 0.286407470703125, 0.38629150390625, 0.486175537109375, 0.5860595703125, 0.685943603515625, 0.78582763671875, 0.885711669921875, 0.985595703125, 1.085479736328125, 1.18536376953125, 1.285247802734375, 1.3851318359375, 1.485015869140625, 1.58489990234375, 1.684783935546875, 1.78466796875, 1.884552001953125, 1.98443603515625, 2.084320068359375, 2.1842041015625, 2.284088134765625, 2.38397216796875, 2.483856201171875, 2.583740234375, 2.683624267578125, 2.78350830078125, 2.883392333984375, 2.9832763671875, 3.083160400390625, 3.18304443359375, 3.282928466796875, 3.3828125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 12.0, 14.0, 30.0, 37.0, 48.0, 72.0, 79.0, 126.0, 177.0, 270.0, 392.0, 553.0, 902.0, 1310.0, 2096.0, 3181.0, 5030.0, 8108.0, 12770.0, 20854.0, 33885.0, 57388.0, 104002.0, 213222.0, 1322719.0, 133329.0, 69633.0, 41021.0, 24454.0, 15056.0, 9353.0, 5923.0, 3796.0, 2432.0, 1559.0, 1053.0, 704.0, 483.0, 347.0, 232.0, 170.0, 99.0, 69.0, 38.0, 29.0, 24.0, 8.0, 14.0, 8.0, 4.0, 1.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.875, -0.8469390869140625, -0.818878173828125, -0.7908172607421875, -0.76275634765625, -0.7346954345703125, -0.706634521484375, -0.6785736083984375, -0.6505126953125, -0.6224517822265625, -0.594390869140625, -0.5663299560546875, -0.53826904296875, -0.5102081298828125, -0.482147216796875, -0.4540863037109375, -0.426025390625, -0.3979644775390625, -0.369903564453125, -0.3418426513671875, -0.31378173828125, -0.2857208251953125, -0.257659912109375, -0.2295989990234375, -0.2015380859375, -0.1734771728515625, -0.145416259765625, -0.1173553466796875, -0.08929443359375, -0.0612335205078125, -0.033172607421875, -0.0051116943359375, 0.02294921875, 0.0510101318359375, 0.079071044921875, 0.1071319580078125, 0.13519287109375, 0.1632537841796875, 0.191314697265625, 0.2193756103515625, 0.2474365234375, 0.2754974365234375, 0.303558349609375, 0.3316192626953125, 0.35968017578125, 0.3877410888671875, 0.415802001953125, 0.4438629150390625, 0.471923828125, 0.4999847412109375, 0.528045654296875, 0.5561065673828125, 0.58416748046875, 0.6122283935546875, 0.640289306640625, 0.6683502197265625, 0.6964111328125, 0.7244720458984375, 0.752532958984375, 0.7805938720703125, 0.80865478515625, 0.8367156982421875, 0.864776611328125, 0.8928375244140625, 0.9208984375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 12.0, 10.0, 14.0, 7.0, 10.0, 10.0, 17.0, 17.0, 42.0, 48.0, 55.0, 64.0, 63.0, 85.0, 82.0, 74.0, 71.0, 61.0, 37.0, 31.0, 26.0, 28.0, 19.0, 10.0, 15.0, 7.0, 6.0, 12.0, 9.0, 8.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0008192062377929688, -0.0007879436016082764, -0.000756680965423584, -0.0007254183292388916, -0.0006941556930541992, -0.0006628930568695068, -0.0006316304206848145, -0.0006003677845001221, -0.0005691051483154297, -0.0005378425121307373, -0.0005065798759460449, -0.00047531723976135254, -0.00044405460357666016, -0.0004127919673919678, -0.0003815293312072754, -0.000350266695022583, -0.0003190040588378906, -0.00028774142265319824, -0.00025647878646850586, -0.00022521615028381348, -0.0001939535140991211, -0.0001626908779144287, -0.00013142824172973633, -0.00010016560554504395, -6.890296936035156e-05, -3.764033317565918e-05, -6.377696990966797e-06, 2.4884939193725586e-05, 5.614757537841797e-05, 8.741021156311035e-05, 0.00011867284774780273, 0.00014993548393249512, 0.0001811981201171875, 0.00021246075630187988, 0.00024372339248657227, 0.00027498602867126465, 0.00030624866485595703, 0.0003375113010406494, 0.0003687739372253418, 0.0004000365734100342, 0.00043129920959472656, 0.00046256184577941895, 0.0004938244819641113, 0.0005250871181488037, 0.0005563497543334961, 0.0005876123905181885, 0.0006188750267028809, 0.0006501376628875732, 0.0006814002990722656, 0.000712662935256958, 0.0007439255714416504, 0.0007751882076263428, 0.0008064508438110352, 0.0008377134799957275, 0.0008689761161804199, 0.0009002387523651123, 0.0009315013885498047, 0.0009627640247344971, 0.0009940266609191895, 0.0010252892971038818, 0.0010565519332885742, 0.0010878145694732666, 0.001119077205657959, 0.0011503398418426514, 0.0011816024780273438]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 14.0, 10.0, 21.0, 12.0, 22.0, 29.0, 55.0, 72.0, 143.0, 144.0, 245.0, 439.0, 1073.0, 63207.0, 975877.0, 5471.0, 672.0, 333.0, 202.0, 135.0, 95.0, 65.0, 58.0, 27.0, 23.0, 21.0, 15.0, 15.0, 10.0, 9.0, 1.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.023406982421875, -0.022795677185058594, -0.022184371948242188, -0.02157306671142578, -0.020961761474609375, -0.02035045623779297, -0.019739151000976562, -0.019127845764160156, -0.01851654052734375, -0.017905235290527344, -0.017293930053710938, -0.01668262481689453, -0.016071319580078125, -0.015460014343261719, -0.014848709106445312, -0.014237403869628906, -0.0136260986328125, -0.013014793395996094, -0.012403488159179688, -0.011792182922363281, -0.011180877685546875, -0.010569572448730469, -0.009958267211914062, -0.009346961975097656, -0.00873565673828125, -0.008124351501464844, -0.0075130462646484375, -0.006901741027832031, -0.006290435791015625, -0.005679130554199219, -0.0050678253173828125, -0.004456520080566406, -0.00384521484375, -0.0032339096069335938, -0.0026226043701171875, -0.0020112991333007812, -0.001399993896484375, -0.0007886886596679688, -0.0001773834228515625, 0.00043392181396484375, 0.00104522705078125, 0.0016565322875976562, 0.0022678375244140625, 0.0028791427612304688, 0.003490447998046875, 0.004101753234863281, 0.0047130584716796875, 0.005324363708496094, 0.0059356689453125, 0.006546974182128906, 0.0071582794189453125, 0.007769584655761719, 0.008380889892578125, 0.008992195129394531, 0.009603500366210938, 0.010214805603027344, 0.01082611083984375, 0.011437416076660156, 0.012048721313476562, 0.012660026550292969, 0.013271331787109375, 0.013882637023925781, 0.014493942260742188, 0.015105247497558594, 0.015716552734375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 14.0, 86.0, 302.0, 398.0, 172.0, 34.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022419746965169907, -0.002165189478546381, -0.0020884042605757713, -0.0020116190426051617, -0.001934833824634552, -0.0018580486066639423, -0.0017812633886933327, -0.001704478170722723, -0.0016276929527521133, -0.0015509077347815037, -0.001474122516810894, -0.0013973372988402843, -0.0013205520808696747, -0.001243766862899065, -0.0011669816449284554, -0.0010901964269578457, -0.001013411208987236, -0.0009366259910166264, -0.0008598407730460167, -0.000783055555075407, -0.0007062703371047974, -0.0006294851191341877, -0.000552699901163578, -0.00047591468319296837, -0.0003991294652223587, -0.00032234424725174904, -0.0002455590292811394, -0.0001687738113105297, -9.198859333992004e-05, -1.5203375369310379e-05, 6.158184260129929e-05, 0.00013836706057190895, 0.00021515251137316227, 0.00029193772934377193, 0.0003687229473143816, 0.00044550816528499126, 0.0005222933832556009, 0.0005990786012262106, 0.0006758638191968203, 0.0007526490371674299, 0.0008294342551380396, 0.0009062194731086493, 0.000983004691079259, 0.0010597899090498686, 0.0011365751270204782, 0.001213360344991088, 0.0012901455629616976, 0.0013669307809323072, 0.001443715998902917, 0.0015205012168735266, 0.0015972864348441362, 0.001674071652814746, 0.0017508568707853556, 0.0018276420887559652, 0.001904427306726575, 0.0019812125246971846, 0.0020579977426677942, 0.002134782960638404, 0.0022115681786090136, 0.0022883533965796232, 0.002365138614550233, 0.0024419238325208426, 0.0025187090504914522, 0.002595494268462062, 0.0026722794864326715]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 11.0, 11.0, 11.0, 10.0, 17.0, 6.0, 25.0, 26.0, 30.0, 31.0, 22.0, 37.0, 44.0, 40.0, 37.0, 42.0, 44.0, 39.0, 53.0, 47.0, 41.0, 38.0, 38.0, 52.0, 32.0, 38.0, 23.0, 22.0, 22.0, 18.0, 21.0, 11.0, 9.0, 7.0, 12.0, 6.0, 8.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.000596165657043457, -0.0005794772878289223, -0.0005627889186143875, -0.0005461005493998528, -0.000529412180185318, -0.0005127238109707832, -0.0004960354417562485, -0.0004793470725417137, -0.00046265870332717896, -0.0004459703341126442, -0.00042928196489810944, -0.0004125935956835747, -0.0003959052264690399, -0.00037921685725450516, -0.0003625284880399704, -0.00034584011882543564, -0.0003291517496109009, -0.0003124633803963661, -0.00029577501118183136, -0.0002790866419672966, -0.00026239827275276184, -0.0002457099035382271, -0.00022902153432369232, -0.00021233316510915756, -0.0001956447958946228, -0.00017895642668008804, -0.00016226805746555328, -0.00014557968825101852, -0.00012889131903648376, -0.000112202949821949, -9.551458060741425e-05, -7.882621139287949e-05, -6.213784217834473e-05, -4.544947296380997e-05, -2.8761103749275208e-05, -1.2072734534740448e-05, 4.6156346797943115e-06, 2.130400389432907e-05, 3.799237310886383e-05, 5.468074232339859e-05, 7.136911153793335e-05, 8.805748075246811e-05, 0.00010474584996700287, 0.00012143421918153763, 0.0001381225883960724, 0.00015481095761060715, 0.0001714993268251419, 0.00018818769603967667, 0.00020487606525421143, 0.00022156443446874619, 0.00023825280368328094, 0.0002549411728978157, 0.00027162954211235046, 0.0002883179113268852, 0.00030500628054142, 0.00032169464975595474, 0.0003383830189704895, 0.00035507138818502426, 0.000371759757399559, 0.0003884481266140938, 0.00040513649582862854, 0.0004218248650431633, 0.00043851323425769806, 0.0004552016034722328, 0.0004718899726867676]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 1.0, 9.0, 6.0, 9.0, 10.0, 10.0, 7.0, 22.0, 23.0, 21.0, 19.0, 36.0, 30.0, 33.0, 53.0, 41.0, 43.0, 40.0, 47.0, 47.0, 39.0, 37.0, 34.0, 41.0, 35.0, 44.0, 26.0, 31.0, 30.0, 40.0, 21.0, 21.0, 16.0, 17.0, 10.0, 11.0, 8.0, 11.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3359375, -5.16973876953125, -5.0035400390625, -4.83734130859375, -4.671142578125, -4.50494384765625, -4.3387451171875, -4.17254638671875, -4.00634765625, -3.84014892578125, -3.6739501953125, -3.50775146484375, -3.341552734375, -3.17535400390625, -3.0091552734375, -2.84295654296875, -2.6767578125, -2.51055908203125, -2.3443603515625, -2.17816162109375, -2.011962890625, -1.84576416015625, -1.6795654296875, -1.51336669921875, -1.34716796875, -1.18096923828125, -1.0147705078125, -0.84857177734375, -0.682373046875, -0.51617431640625, -0.3499755859375, -0.18377685546875, -0.017578125, 0.14862060546875, 0.3148193359375, 0.48101806640625, 0.647216796875, 0.81341552734375, 0.9796142578125, 1.14581298828125, 1.31201171875, 1.47821044921875, 1.6444091796875, 1.81060791015625, 1.976806640625, 2.14300537109375, 2.3092041015625, 2.47540283203125, 2.6416015625, 2.80780029296875, 2.9739990234375, 3.14019775390625, 3.306396484375, 3.47259521484375, 3.6387939453125, 3.80499267578125, 3.97119140625, 4.13739013671875, 4.3035888671875, 4.46978759765625, 4.635986328125, 4.80218505859375, 4.9683837890625, 5.13458251953125, 5.30078125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 1.0, 10.0, 8.0, 15.0, 17.0, 31.0, 42.0, 71.0, 89.0, 173.0, 245.0, 403.0, 681.0, 1279.0, 2385.0, 4403.0, 8478.0, 16121.0, 30568.0, 60865.0, 140042.0, 317547.0, 256397.0, 106921.0, 48537.0, 24905.0, 13124.0, 7008.0, 3720.0, 1921.0, 1038.0, 585.0, 351.0, 210.0, 132.0, 65.0, 50.0, 25.0, 17.0, 24.0, 9.0, 8.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.375, -4.23760986328125, -4.1002197265625, -3.96282958984375, -3.825439453125, -3.68804931640625, -3.5506591796875, -3.41326904296875, -3.27587890625, -3.13848876953125, -3.0010986328125, -2.86370849609375, -2.726318359375, -2.58892822265625, -2.4515380859375, -2.31414794921875, -2.1767578125, -2.03936767578125, -1.9019775390625, -1.76458740234375, -1.627197265625, -1.48980712890625, -1.3524169921875, -1.21502685546875, -1.07763671875, -0.94024658203125, -0.8028564453125, -0.66546630859375, -0.528076171875, -0.39068603515625, -0.2532958984375, -0.11590576171875, 0.021484375, 0.15887451171875, 0.2962646484375, 0.43365478515625, 0.571044921875, 0.70843505859375, 0.8458251953125, 0.98321533203125, 1.12060546875, 1.25799560546875, 1.3953857421875, 1.53277587890625, 1.670166015625, 1.80755615234375, 1.9449462890625, 2.08233642578125, 2.2197265625, 2.35711669921875, 2.4945068359375, 2.63189697265625, 2.769287109375, 2.90667724609375, 3.0440673828125, 3.18145751953125, 3.31884765625, 3.45623779296875, 3.5936279296875, 3.73101806640625, 3.868408203125, 4.00579833984375, 4.1431884765625, 4.28057861328125, 4.41796875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 7.0, 5.0, 4.0, 9.0, 13.0, 14.0, 19.0, 16.0, 23.0, 25.0, 40.0, 33.0, 36.0, 41.0, 45.0, 54.0, 58.0, 86.0, 179.0, 1500.0, 248.0, 123.0, 58.0, 48.0, 44.0, 40.0, 46.0, 19.0, 28.0, 41.0, 26.0, 21.0, 15.0, 17.0, 16.0, 8.0, 7.0, 13.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.75, -18.158203125, -17.56640625, -16.974609375, -16.3828125, -15.791015625, -15.19921875, -14.607421875, -14.015625, -13.423828125, -12.83203125, -12.240234375, -11.6484375, -11.056640625, -10.46484375, -9.873046875, -9.28125, -8.689453125, -8.09765625, -7.505859375, -6.9140625, -6.322265625, -5.73046875, -5.138671875, -4.546875, -3.955078125, -3.36328125, -2.771484375, -2.1796875, -1.587890625, -0.99609375, -0.404296875, 0.1875, 0.779296875, 1.37109375, 1.962890625, 2.5546875, 3.146484375, 3.73828125, 4.330078125, 4.921875, 5.513671875, 6.10546875, 6.697265625, 7.2890625, 7.880859375, 8.47265625, 9.064453125, 9.65625, 10.248046875, 10.83984375, 11.431640625, 12.0234375, 12.615234375, 13.20703125, 13.798828125, 14.390625, 14.982421875, 15.57421875, 16.166015625, 16.7578125, 17.349609375, 17.94140625, 18.533203125, 19.125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 11.0, 19.0, 29.0, 53.0, 110.0, 198.0, 519.0, 4214.0, 3134557.0, 4937.0, 542.0, 198.0, 107.0, 70.0, 40.0, 30.0, 14.0, 9.0, 12.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.125, -132.908203125, -128.69140625, -124.474609375, -120.2578125, -116.041015625, -111.82421875, -107.607421875, -103.390625, -99.173828125, -94.95703125, -90.740234375, -86.5234375, -82.306640625, -78.08984375, -73.873046875, -69.65625, -65.439453125, -61.22265625, -57.005859375, -52.7890625, -48.572265625, -44.35546875, -40.138671875, -35.921875, -31.705078125, -27.48828125, -23.271484375, -19.0546875, -14.837890625, -10.62109375, -6.404296875, -2.1875, 2.029296875, 6.24609375, 10.462890625, 14.6796875, 18.896484375, 23.11328125, 27.330078125, 31.546875, 35.763671875, 39.98046875, 44.197265625, 48.4140625, 52.630859375, 56.84765625, 61.064453125, 65.28125, 69.498046875, 73.71484375, 77.931640625, 82.1484375, 86.365234375, 90.58203125, 94.798828125, 99.015625, 103.232421875, 107.44921875, 111.666015625, 115.8828125, 120.099609375, 124.31640625, 128.533203125, 132.75]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 273.0, 746.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.31407165527344, -66.75882720947266, -45.20357894897461, -23.648330688476562, -2.0930862426757812, 19.462158203125, 41.01741027832031, 62.57264709472656, 84.12789916992188, 105.68314361572266, 127.23838806152344, 148.79364013671875, 170.348876953125, 191.9041290283203, 213.45938110351562, 235.01461791992188, 256.56988525390625, 278.1251220703125, 299.6803894042969, 321.2356262207031, 342.7908630371094, 364.34613037109375, 385.9013671875, 407.45660400390625, 429.0118408203125, 450.56707763671875, 472.1223449707031, 493.6775817871094, 515.2328491210938, 536.7880859375, 558.3433227539062, 579.8985595703125, 601.4537963867188, 623.009033203125, 644.5642700195312, 666.1195068359375, 687.6748046875, 709.2300415039062, 730.7852783203125, 752.3405151367188, 773.895751953125, 795.4509887695312, 817.0062255859375, 838.5615234375, 860.1167602539062, 881.6719970703125, 903.2272338867188, 924.782470703125, 946.3377685546875, 967.8930053710938, 989.4482421875, 1011.0035400390625, 1032.5587158203125, 1054.114013671875, 1075.669189453125, 1097.2244873046875, 1118.7796630859375, 1140.3349609375, 1161.89013671875, 1183.4454345703125, 1205.0006103515625, 1226.555908203125, 1248.111083984375, 1269.6663818359375, 1291.2216796875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 7.0, 14.0, 18.0, 18.0, 16.0, 20.0, 14.0, 26.0, 22.0, 20.0, 44.0, 29.0, 34.0, 33.0, 34.0, 32.0, 49.0, 46.0, 37.0, 53.0, 39.0, 33.0, 49.0, 29.0, 46.0, 20.0, 23.0, 24.0, 26.0, 16.0, 13.0, 20.0, 11.0, 10.0, 11.0, 14.0, 6.0, 7.0, 4.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-47.685279846191406, -46.086273193359375, -44.48727035522461, -42.88826370239258, -41.28925704956055, -39.69025421142578, -38.09124755859375, -36.49224090576172, -34.89323425292969, -33.294227600097656, -31.695222854614258, -30.09621810913086, -28.497211456298828, -26.89820671081543, -25.29920196533203, -23.7001953125, -22.101192474365234, -20.502187728881836, -18.903181076049805, -17.304176330566406, -15.705170631408691, -14.106164932250977, -12.507160186767578, -10.908154487609863, -9.309148788452148, -7.710143089294434, -6.111137866973877, -4.51213264465332, -2.9131269454956055, -1.3141212463378906, 0.2848834991455078, 1.8838891983032227, 3.482898712158203, 5.081904411315918, 6.680909633636475, 8.279914855957031, 9.878920555114746, 11.477926254272461, 13.07693099975586, 14.675936698913574, 16.27494239807129, 17.873947143554688, 19.47295379638672, 21.071958541870117, 22.670963287353516, 24.269969940185547, 25.868974685668945, 27.467979431152344, 29.066986083984375, 30.665990829467773, 32.26499557495117, 33.8640022277832, 35.463008880615234, 37.06201171875, 38.66101837158203, 40.26002502441406, 41.859031677246094, 43.458038330078125, 45.05704116821289, 46.65604782104492, 48.25505447387695, 49.85405731201172, 51.45306396484375, 53.05207061767578, 54.65107345581055]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 9.0, 11.0, 17.0, 8.0, 16.0, 16.0, 18.0, 26.0, 34.0, 30.0, 35.0, 37.0, 41.0, 45.0, 41.0, 24.0, 47.0, 48.0, 42.0, 43.0, 33.0, 37.0, 37.0, 38.0, 35.0, 32.0, 27.0, 21.0, 20.0, 22.0, 16.0, 20.0, 13.0, 8.0, 11.0, 3.0, 12.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.29296875, -5.11492919921875, -4.9368896484375, -4.75885009765625, -4.580810546875, -4.40277099609375, -4.2247314453125, -4.04669189453125, -3.86865234375, -3.69061279296875, -3.5125732421875, -3.33453369140625, -3.156494140625, -2.97845458984375, -2.8004150390625, -2.62237548828125, -2.4443359375, -2.26629638671875, -2.0882568359375, -1.91021728515625, -1.732177734375, -1.55413818359375, -1.3760986328125, -1.19805908203125, -1.02001953125, -0.84197998046875, -0.6639404296875, -0.48590087890625, -0.307861328125, -0.12982177734375, 0.0482177734375, 0.22625732421875, 0.404296875, 0.58233642578125, 0.7603759765625, 0.93841552734375, 1.116455078125, 1.29449462890625, 1.4725341796875, 1.65057373046875, 1.82861328125, 2.00665283203125, 2.1846923828125, 2.36273193359375, 2.540771484375, 2.71881103515625, 2.8968505859375, 3.07489013671875, 3.2529296875, 3.43096923828125, 3.6090087890625, 3.78704833984375, 3.965087890625, 4.14312744140625, 4.3211669921875, 4.49920654296875, 4.67724609375, 4.85528564453125, 5.0333251953125, 5.21136474609375, 5.389404296875, 5.56744384765625, 5.7454833984375, 5.92352294921875, 6.1015625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 9.0, 7.0, 6.0, 23.0, 19.0, 11.0, 14.0, 35.0, 47.0, 65.0, 84.0, 147.0, 206.0, 392.0, 768.0, 1822.0, 5647.0, 22025.0, 109285.0, 540000.0, 1554336.0, 1418783.0, 431417.0, 83873.0, 17379.0, 4635.0, 1576.0, 627.0, 379.0, 208.0, 129.0, 80.0, 67.0, 47.0, 37.0, 22.0, 19.0, 7.0, 12.0, 8.0, 9.0, 6.0, 7.0, 3.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.80078125, -7.54010009765625, -7.2794189453125, -7.01873779296875, -6.758056640625, -6.49737548828125, -6.2366943359375, -5.97601318359375, -5.71533203125, -5.45465087890625, -5.1939697265625, -4.93328857421875, -4.672607421875, -4.41192626953125, -4.1512451171875, -3.89056396484375, -3.6298828125, -3.36920166015625, -3.1085205078125, -2.84783935546875, -2.587158203125, -2.32647705078125, -2.0657958984375, -1.80511474609375, -1.54443359375, -1.28375244140625, -1.0230712890625, -0.76239013671875, -0.501708984375, -0.24102783203125, 0.0196533203125, 0.28033447265625, 0.541015625, 0.80169677734375, 1.0623779296875, 1.32305908203125, 1.583740234375, 1.84442138671875, 2.1051025390625, 2.36578369140625, 2.62646484375, 2.88714599609375, 3.1478271484375, 3.40850830078125, 3.669189453125, 3.92987060546875, 4.1905517578125, 4.45123291015625, 4.7119140625, 4.97259521484375, 5.2332763671875, 5.49395751953125, 5.754638671875, 6.01531982421875, 6.2760009765625, 6.53668212890625, 6.79736328125, 7.05804443359375, 7.3187255859375, 7.57940673828125, 7.840087890625, 8.10076904296875, 8.3614501953125, 8.62213134765625, 8.8828125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 8.0, 10.0, 13.0, 16.0, 20.0, 36.0, 50.0, 70.0, 89.0, 123.0, 174.0, 252.0, 334.0, 426.0, 458.0, 427.0, 391.0, 309.0, 253.0, 166.0, 123.0, 96.0, 65.0, 51.0, 42.0, 14.0, 23.0, 13.0, 3.0, 4.0, 3.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.875, -16.4417724609375, -16.008544921875, -15.5753173828125, -15.14208984375, -14.7088623046875, -14.275634765625, -13.8424072265625, -13.4091796875, -12.9759521484375, -12.542724609375, -12.1094970703125, -11.67626953125, -11.2430419921875, -10.809814453125, -10.3765869140625, -9.943359375, -9.5101318359375, -9.076904296875, -8.6436767578125, -8.21044921875, -7.7772216796875, -7.343994140625, -6.9107666015625, -6.4775390625, -6.0443115234375, -5.611083984375, -5.1778564453125, -4.74462890625, -4.3114013671875, -3.878173828125, -3.4449462890625, -3.01171875, -2.5784912109375, -2.145263671875, -1.7120361328125, -1.27880859375, -0.8455810546875, -0.412353515625, 0.0208740234375, 0.4541015625, 0.8873291015625, 1.320556640625, 1.7537841796875, 2.18701171875, 2.6202392578125, 3.053466796875, 3.4866943359375, 3.919921875, 4.3531494140625, 4.786376953125, 5.2196044921875, 5.65283203125, 6.0860595703125, 6.519287109375, 6.9525146484375, 7.3857421875, 7.8189697265625, 8.252197265625, 8.6854248046875, 9.11865234375, 9.5518798828125, 9.985107421875, 10.4183349609375, 10.8515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 4.0, 9.0, 15.0, 8.0, 16.0, 23.0, 25.0, 24.0, 52.0, 69.0, 85.0, 145.0, 176.0, 346.0, 668.0, 2440.0, 33516.0, 1800487.0, 2306200.0, 45408.0, 2791.0, 706.0, 324.0, 199.0, 131.0, 97.0, 82.0, 58.0, 50.0, 30.0, 27.0, 24.0, 8.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.609375, -27.589111328125, -26.56884765625, -25.548583984375, -24.5283203125, -23.508056640625, -22.48779296875, -21.467529296875, -20.447265625, -19.427001953125, -18.40673828125, -17.386474609375, -16.3662109375, -15.345947265625, -14.32568359375, -13.305419921875, -12.28515625, -11.264892578125, -10.24462890625, -9.224365234375, -8.2041015625, -7.183837890625, -6.16357421875, -5.143310546875, -4.123046875, -3.102783203125, -2.08251953125, -1.062255859375, -0.0419921875, 0.978271484375, 1.99853515625, 3.018798828125, 4.0390625, 5.059326171875, 6.07958984375, 7.099853515625, 8.1201171875, 9.140380859375, 10.16064453125, 11.180908203125, 12.201171875, 13.221435546875, 14.24169921875, 15.261962890625, 16.2822265625, 17.302490234375, 18.32275390625, 19.343017578125, 20.36328125, 21.383544921875, 22.40380859375, 23.424072265625, 24.4443359375, 25.464599609375, 26.48486328125, 27.505126953125, 28.525390625, 29.545654296875, 30.56591796875, 31.586181640625, 32.6064453125, 33.626708984375, 34.64697265625, 35.667236328125, 36.6875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 8.0, 36.0, 54.0, 147.0, 191.0, 214.0, 183.0, 101.0, 39.0, 19.0, 9.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.20657348632812, -117.86116027832031, -114.51573944091797, -111.17032623291016, -107.82490539550781, -104.4794921875, -101.13407897949219, -97.78866577148438, -94.44324493408203, -91.09783172607422, -87.75241088867188, -84.40699768066406, -81.06158447265625, -77.7161636352539, -74.3707504272461, -71.02532958984375, -67.67991638183594, -64.33450317382812, -60.98908233642578, -57.64366912841797, -54.29825210571289, -50.95283508300781, -47.607421875, -44.26200485229492, -40.916587829589844, -37.571170806884766, -34.22575378417969, -30.880340576171875, -27.534923553466797, -24.18950653076172, -20.844091415405273, -17.498676300048828, -14.153251647949219, -10.807835578918457, -7.462419509887695, -4.117003440856934, -0.7715873718261719, 2.5738296508789062, 5.919244766235352, 9.264659881591797, 12.610076904296875, 15.955492973327637, 19.3009090423584, 22.646324157714844, 25.991741180419922, 29.337158203125, 32.68257141113281, 36.02798843383789, 39.37340545654297, 42.71882247924805, 46.064239501953125, 49.40965270996094, 52.755069732666016, 56.100486755371094, 59.445899963378906, 62.791316986083984, 66.13673400878906, 69.48214721679688, 72.82756805419922, 76.17298126220703, 79.51840209960938, 82.86381530761719, 86.209228515625, 89.55464172363281, 92.90006256103516]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 5.0, 4.0, 7.0, 3.0, 7.0, 20.0, 9.0, 26.0, 14.0, 18.0, 24.0, 30.0, 31.0, 44.0, 34.0, 44.0, 34.0, 26.0, 45.0, 48.0, 49.0, 41.0, 34.0, 51.0, 31.0, 41.0, 54.0, 29.0, 30.0, 19.0, 27.0, 13.0, 25.0, 21.0, 10.0, 12.0, 9.0, 4.0, 11.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.99734878540039, -37.622154235839844, -36.24695587158203, -34.871761322021484, -33.49656295776367, -32.121368408203125, -30.746171951293945, -29.370975494384766, -27.995779037475586, -26.620582580566406, -25.245386123657227, -23.870189666748047, -22.4949951171875, -21.119796752929688, -19.74460220336914, -18.36940574645996, -16.99420928955078, -15.619012832641602, -14.243816375732422, -12.868620872497559, -11.493424415588379, -10.1182279586792, -8.743032455444336, -7.367835998535156, -5.992639541625977, -4.617443084716797, -3.2422471046447754, -1.867051124572754, -0.4918546676635742, 0.8833417892456055, 2.2585372924804688, 3.6337337493896484, 5.008934020996094, 6.384130477905273, 7.759326457977295, 9.134522438049316, 10.509718894958496, 11.884915351867676, 13.260110855102539, 14.635307312011719, 16.0105037689209, 17.385700225830078, 18.760896682739258, 20.136093139648438, 21.511287689208984, 22.886486053466797, 24.261680603027344, 25.636877059936523, 27.012073516845703, 28.387269973754883, 29.762466430664062, 31.13766098022461, 32.51285934448242, 33.88805389404297, 35.26325225830078, 36.63844680786133, 38.013641357421875, 39.38883590698242, 40.764034271240234, 42.13922882080078, 43.514427185058594, 44.88962173461914, 46.26481628417969, 47.6400146484375, 49.01521301269531]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 12.0, 10.0, 7.0, 9.0, 21.0, 13.0, 15.0, 26.0, 43.0, 25.0, 40.0, 47.0, 37.0, 48.0, 49.0, 44.0, 52.0, 47.0, 42.0, 40.0, 47.0, 42.0, 40.0, 36.0, 39.0, 33.0, 29.0, 20.0, 16.0, 16.0, 8.0, 11.0, 7.0, 8.0, 3.0, 8.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.20965576171875, -5.0091552734375, -4.80865478515625, -4.608154296875, -4.40765380859375, -4.2071533203125, -4.00665283203125, -3.80615234375, -3.60565185546875, -3.4051513671875, -3.20465087890625, -3.004150390625, -2.80364990234375, -2.6031494140625, -2.40264892578125, -2.2021484375, -2.00164794921875, -1.8011474609375, -1.60064697265625, -1.400146484375, -1.19964599609375, -0.9991455078125, -0.79864501953125, -0.59814453125, -0.39764404296875, -0.1971435546875, 0.00335693359375, 0.203857421875, 0.40435791015625, 0.6048583984375, 0.80535888671875, 1.005859375, 1.20635986328125, 1.4068603515625, 1.60736083984375, 1.807861328125, 2.00836181640625, 2.2088623046875, 2.40936279296875, 2.60986328125, 2.81036376953125, 3.0108642578125, 3.21136474609375, 3.411865234375, 3.61236572265625, 3.8128662109375, 4.01336669921875, 4.2138671875, 4.41436767578125, 4.6148681640625, 4.81536865234375, 5.015869140625, 5.21636962890625, 5.4168701171875, 5.61737060546875, 5.81787109375, 6.01837158203125, 6.2188720703125, 6.41937255859375, 6.619873046875, 6.82037353515625, 7.0208740234375, 7.22137451171875, 7.421875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 9.0, 14.0, 8.0, 21.0, 29.0, 34.0, 76.0, 86.0, 138.0, 246.0, 314.0, 497.0, 705.0, 1025.0, 1494.0, 2247.0, 3484.0, 5002.0, 8028.0, 12289.0, 19034.0, 31170.0, 51385.0, 91868.0, 176921.0, 278862.0, 155974.0, 81813.0, 46431.0, 28669.0, 17856.0, 11140.0, 7216.0, 4818.0, 3081.0, 2117.0, 1432.0, 942.0, 708.0, 419.0, 307.0, 199.0, 144.0, 95.0, 78.0, 46.0, 28.0, 17.0, 6.0, 6.0, 9.0, 9.0, 5.0, 5.0, 3.0], "bins": [-1.04296875, -1.0126571655273438, -0.9823455810546875, -0.9520339965820312, -0.921722412109375, -0.8914108276367188, -0.8610992431640625, -0.8307876586914062, -0.80047607421875, -0.7701644897460938, -0.7398529052734375, -0.7095413208007812, -0.679229736328125, -0.6489181518554688, -0.6186065673828125, -0.5882949829101562, -0.5579833984375, -0.5276718139648438, -0.4973602294921875, -0.46704864501953125, -0.436737060546875, -0.40642547607421875, -0.3761138916015625, -0.34580230712890625, -0.31549072265625, -0.28517913818359375, -0.2548675537109375, -0.22455596923828125, -0.194244384765625, -0.16393280029296875, -0.1336212158203125, -0.10330963134765625, -0.072998046875, -0.04268646240234375, -0.0123748779296875, 0.01793670654296875, 0.048248291015625, 0.07855987548828125, 0.1088714599609375, 0.13918304443359375, 0.16949462890625, 0.19980621337890625, 0.2301177978515625, 0.26042938232421875, 0.290740966796875, 0.32105255126953125, 0.3513641357421875, 0.38167572021484375, 0.4119873046875, 0.44229888916015625, 0.4726104736328125, 0.5029220581054688, 0.533233642578125, 0.5635452270507812, 0.5938568115234375, 0.6241683959960938, 0.65447998046875, 0.6847915649414062, 0.7151031494140625, 0.7454147338867188, 0.775726318359375, 0.8060379028320312, 0.8363494873046875, 0.8666610717773438, 0.89697265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 2.0, 4.0, 12.0, 8.0, 16.0, 13.0, 16.0, 13.0, 20.0, 26.0, 29.0, 27.0, 22.0, 30.0, 20.0, 23.0, 26.0, 52.0, 42.0, 40.0, 1072.0, 43.0, 35.0, 40.0, 39.0, 45.0, 37.0, 28.0, 35.0, 26.0, 27.0, 15.0, 24.0, 17.0, 17.0, 12.0, 11.0, 10.0, 8.0, 6.0, 3.0, 5.0, 5.0, 3.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.197265625, -3.09295654296875, -2.9886474609375, -2.88433837890625, -2.780029296875, -2.67572021484375, -2.5714111328125, -2.46710205078125, -2.36279296875, -2.25848388671875, -2.1541748046875, -2.04986572265625, -1.945556640625, -1.84124755859375, -1.7369384765625, -1.63262939453125, -1.5283203125, -1.42401123046875, -1.3197021484375, -1.21539306640625, -1.111083984375, -1.00677490234375, -0.9024658203125, -0.79815673828125, -0.69384765625, -0.58953857421875, -0.4852294921875, -0.38092041015625, -0.276611328125, -0.17230224609375, -0.0679931640625, 0.03631591796875, 0.140625, 0.24493408203125, 0.3492431640625, 0.45355224609375, 0.557861328125, 0.66217041015625, 0.7664794921875, 0.87078857421875, 0.97509765625, 1.07940673828125, 1.1837158203125, 1.28802490234375, 1.392333984375, 1.49664306640625, 1.6009521484375, 1.70526123046875, 1.8095703125, 1.91387939453125, 2.0181884765625, 2.12249755859375, 2.226806640625, 2.33111572265625, 2.4354248046875, 2.53973388671875, 2.64404296875, 2.74835205078125, 2.8526611328125, 2.95697021484375, 3.061279296875, 3.16558837890625, 3.2698974609375, 3.37420654296875, 3.478515625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 9.0, 8.0, 16.0, 19.0, 38.0, 36.0, 46.0, 66.0, 84.0, 126.0, 171.0, 234.0, 367.0, 486.0, 760.0, 1077.0, 1520.0, 2290.0, 3374.0, 5177.0, 7599.0, 11506.0, 17856.0, 28056.0, 45471.0, 76140.0, 141571.0, 1316961.0, 186516.0, 96963.0, 55408.0, 34030.0, 21621.0, 13913.0, 8917.0, 5887.0, 3967.0, 2684.0, 1777.0, 1267.0, 886.0, 636.0, 459.0, 291.0, 243.0, 173.0, 126.0, 96.0, 64.0, 48.0, 34.0, 14.0, 20.0, 14.0, 4.0, 1.0, 2.0, 6.0], "bins": [-0.9443359375, -0.9163131713867188, -0.8882904052734375, -0.8602676391601562, -0.832244873046875, -0.8042221069335938, -0.7761993408203125, -0.7481765747070312, -0.72015380859375, -0.6921310424804688, -0.6641082763671875, -0.6360855102539062, -0.608062744140625, -0.5800399780273438, -0.5520172119140625, -0.5239944458007812, -0.4959716796875, -0.46794891357421875, -0.4399261474609375, -0.41190338134765625, -0.383880615234375, -0.35585784912109375, -0.3278350830078125, -0.29981231689453125, -0.27178955078125, -0.24376678466796875, -0.2157440185546875, -0.18772125244140625, -0.159698486328125, -0.13167572021484375, -0.1036529541015625, -0.07563018798828125, -0.047607421875, -0.01958465576171875, 0.0084381103515625, 0.03646087646484375, 0.064483642578125, 0.09250640869140625, 0.1205291748046875, 0.14855194091796875, 0.17657470703125, 0.20459747314453125, 0.2326202392578125, 0.26064300537109375, 0.288665771484375, 0.31668853759765625, 0.3447113037109375, 0.37273406982421875, 0.4007568359375, 0.42877960205078125, 0.4568023681640625, 0.48482513427734375, 0.512847900390625, 0.5408706665039062, 0.5688934326171875, 0.5969161987304688, 0.62493896484375, 0.6529617309570312, 0.6809844970703125, 0.7090072631835938, 0.737030029296875, 0.7650527954101562, 0.7930755615234375, 0.8210983276367188, 0.84912109375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 9.0, 6.0, 10.0, 18.0, 23.0, 25.0, 37.0, 58.0, 85.0, 93.0, 99.0, 108.0, 90.0, 92.0, 69.0, 42.0, 39.0, 27.0, 19.0, 12.0, 9.0, 11.0, 3.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0019073486328125, -0.001859813928604126, -0.001812279224395752, -0.001764744520187378, -0.001717209815979004, -0.0016696751117706299, -0.0016221404075622559, -0.0015746057033538818, -0.0015270709991455078, -0.0014795362949371338, -0.0014320015907287598, -0.0013844668865203857, -0.0013369321823120117, -0.0012893974781036377, -0.0012418627738952637, -0.0011943280696868896, -0.0011467933654785156, -0.0010992586612701416, -0.0010517239570617676, -0.0010041892528533936, -0.0009566545486450195, -0.0009091198444366455, -0.0008615851402282715, -0.0008140504360198975, -0.0007665157318115234, -0.0007189810276031494, -0.0006714463233947754, -0.0006239116191864014, -0.0005763769149780273, -0.0005288422107696533, -0.0004813075065612793, -0.0004337728023529053, -0.00038623809814453125, -0.0003387033939361572, -0.0002911686897277832, -0.00024363398551940918, -0.00019609928131103516, -0.00014856457710266113, -0.00010102987289428711, -5.3495168685913086e-05, -5.9604644775390625e-06, 4.157423973083496e-05, 8.910894393920898e-05, 0.000136643648147583, 0.00018417835235595703, 0.00023171305656433105, 0.0002792477607727051, 0.0003267824649810791, 0.0003743171691894531, 0.00042185187339782715, 0.00046938657760620117, 0.0005169212818145752, 0.0005644559860229492, 0.0006119906902313232, 0.0006595253944396973, 0.0007070600986480713, 0.0007545948028564453, 0.0008021295070648193, 0.0008496642112731934, 0.0008971989154815674, 0.0009447336196899414, 0.0009922683238983154, 0.0010398030281066895, 0.0010873377323150635, 0.0011348724365234375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 6.0, 12.0, 16.0, 14.0, 27.0, 30.0, 59.0, 66.0, 131.0, 248.0, 517.0, 2259.0, 1016097.0, 27506.0, 796.0, 310.0, 167.0, 101.0, 60.0, 41.0, 15.0, 18.0, 16.0, 11.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0206298828125, -0.019759654998779297, -0.018889427185058594, -0.01801919937133789, -0.017148971557617188, -0.016278743743896484, -0.015408515930175781, -0.014538288116455078, -0.013668060302734375, -0.012797832489013672, -0.011927604675292969, -0.011057376861572266, -0.010187149047851562, -0.00931692123413086, -0.008446693420410156, -0.007576465606689453, -0.00670623779296875, -0.005836009979248047, -0.004965782165527344, -0.004095554351806641, -0.0032253265380859375, -0.0023550987243652344, -0.0014848709106445312, -0.0006146430969238281, 0.000255584716796875, 0.0011258125305175781, 0.0019960403442382812, 0.0028662681579589844, 0.0037364959716796875, 0.004606723785400391, 0.005476951599121094, 0.006347179412841797, 0.0072174072265625, 0.008087635040283203, 0.008957862854003906, 0.00982809066772461, 0.010698318481445312, 0.011568546295166016, 0.012438774108886719, 0.013309001922607422, 0.014179229736328125, 0.015049457550048828, 0.01591968536376953, 0.016789913177490234, 0.017660140991210938, 0.01853036880493164, 0.019400596618652344, 0.020270824432373047, 0.02114105224609375, 0.022011280059814453, 0.022881507873535156, 0.02375173568725586, 0.024621963500976562, 0.025492191314697266, 0.02636241912841797, 0.027232646942138672, 0.028102874755859375, 0.028973102569580078, 0.02984333038330078, 0.030713558197021484, 0.03158378601074219, 0.03245401382446289, 0.033324241638183594, 0.0341944694519043, 0.035064697265625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 12.0, 42.0, 99.0, 204.0, 246.0, 170.0, 133.0, 64.0, 27.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012557676527649164, -0.0012119583552703261, -0.0011681490577757359, -0.0011243398766964674, -0.0010805305792018771, -0.0010367212817072868, -0.0009929121006280184, -0.0009491028031334281, -0.0009052935056388378, -0.0008614842081442475, -0.0008176749688573182, -0.0007738657295703888, -0.0007300564320757985, -0.0006862471345812082, -0.0006424378952942789, -0.0005986286560073495, -0.0005548193585127592, -0.0005110100610181689, -0.00046720082173123956, -0.00042339155334047973, -0.0003795822849497199, -0.0003357730165589601, -0.00029196374816820025, -0.00024815447977744043, -0.0002043452113866806, -0.00016053594299592078, -0.00011672667460516095, -7.291740621440113e-05, -2.91081378236413e-05, 1.4701130567118526e-05, 5.851039895787835e-05, 0.00010231966734863818, 0.00014612905215471983, 0.00018993832054547966, 0.00023374758893623948, 0.0002775568573269993, 0.00032136612571775913, 0.00036517539410851896, 0.0004089846624992788, 0.0004527939308900386, 0.0004966031992807984, 0.0005404124967753887, 0.0005842217360623181, 0.0006280309753492475, 0.0006718402728438377, 0.000715649570338428, 0.0007594588096253574, 0.0008032680489122868, 0.000847077346406877, 0.0008908866439014673, 0.0009346958831883967, 0.000978505122475326, 0.0010223144199699163, 0.0010661237174645066, 0.001109933014959097, 0.0011537421960383654, 0.0011975514935329556, 0.001241360791027546, 0.0012851699721068144, 0.0013289792696014047, 0.001372788567095995, 0.0014165978645905852, 0.0014604071620851755, 0.001504216343164444, 0.0015480256406590343]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 4.0, 11.0, 8.0, 18.0, 14.0, 17.0, 14.0, 27.0, 26.0, 31.0, 28.0, 30.0, 33.0, 33.0, 39.0, 35.0, 39.0, 34.0, 41.0, 37.0, 36.0, 41.0, 35.0, 38.0, 31.0, 41.0, 43.0, 35.0, 25.0, 26.0, 22.0, 16.0, 18.0, 11.0, 12.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005280375480651855, -0.0005120057612657547, -0.0004959739744663239, -0.000479942187666893, -0.00046391040086746216, -0.0004478786140680313, -0.00043184682726860046, -0.0004158150404691696, -0.00039978325366973877, -0.0003837514668703079, -0.0003677196800708771, -0.00035168789327144623, -0.0003356561064720154, -0.00031962431967258453, -0.0003035925328731537, -0.00028756074607372284, -0.000271528959274292, -0.00025549717247486115, -0.0002394653856754303, -0.00022343359887599945, -0.0002074018120765686, -0.00019137002527713776, -0.0001753382384777069, -0.00015930645167827606, -0.00014327466487884521, -0.00012724287807941437, -0.00011121109127998352, -9.517930448055267e-05, -7.914751768112183e-05, -6.311573088169098e-05, -4.708394408226013e-05, -3.1052157282829285e-05, -1.5020370483398438e-05, 1.0114163160324097e-06, 1.7043203115463257e-05, 3.3074989914894104e-05, 4.910677671432495e-05, 6.51385635137558e-05, 8.117035031318665e-05, 9.720213711261749e-05, 0.00011323392391204834, 0.0001292657107114792, 0.00014529749751091003, 0.00016132928431034088, 0.00017736107110977173, 0.00019339285790920258, 0.00020942464470863342, 0.00022545643150806427, 0.00024148821830749512, 0.00025752000510692596, 0.0002735517919063568, 0.00028958357870578766, 0.0003056153655052185, 0.00032164715230464935, 0.0003376789391040802, 0.00035371072590351105, 0.0003697425127029419, 0.00038577429950237274, 0.0004018060863018036, 0.00041783787310123444, 0.0004338696599006653, 0.00044990144670009613, 0.000465933233499527, 0.0004819650202989578, 0.0004979968070983887]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 12.0, 10.0, 7.0, 9.0, 21.0, 13.0, 15.0, 26.0, 43.0, 25.0, 40.0, 47.0, 37.0, 48.0, 49.0, 44.0, 52.0, 47.0, 42.0, 40.0, 47.0, 42.0, 40.0, 36.0, 39.0, 33.0, 29.0, 20.0, 16.0, 16.0, 8.0, 11.0, 7.0, 8.0, 3.0, 8.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.20965576171875, -5.0091552734375, -4.80865478515625, -4.608154296875, -4.40765380859375, -4.2071533203125, -4.00665283203125, -3.80615234375, -3.60565185546875, -3.4051513671875, -3.20465087890625, -3.004150390625, -2.80364990234375, -2.6031494140625, -2.40264892578125, -2.2021484375, -2.00164794921875, -1.8011474609375, -1.60064697265625, -1.400146484375, -1.19964599609375, -0.9991455078125, -0.79864501953125, -0.59814453125, -0.39764404296875, -0.1971435546875, 0.00335693359375, 0.203857421875, 0.40435791015625, 0.6048583984375, 0.80535888671875, 1.005859375, 1.20635986328125, 1.4068603515625, 1.60736083984375, 1.807861328125, 2.00836181640625, 2.2088623046875, 2.40936279296875, 2.60986328125, 2.81036376953125, 3.0108642578125, 3.21136474609375, 3.411865234375, 3.61236572265625, 3.8128662109375, 4.01336669921875, 4.2138671875, 4.41436767578125, 4.6148681640625, 4.81536865234375, 5.015869140625, 5.21636962890625, 5.4168701171875, 5.61737060546875, 5.81787109375, 6.01837158203125, 6.2188720703125, 6.41937255859375, 6.619873046875, 6.82037353515625, 7.0208740234375, 7.22137451171875, 7.421875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 7.0, 3.0, 8.0, 15.0, 21.0, 33.0, 37.0, 50.0, 78.0, 127.0, 191.0, 350.0, 597.0, 1014.0, 1880.0, 3701.0, 7450.0, 14931.0, 29453.0, 57472.0, 113019.0, 215760.0, 270129.0, 161521.0, 83256.0, 43127.0, 21944.0, 10928.0, 5381.0, 2749.0, 1370.0, 764.0, 449.0, 277.0, 145.0, 117.0, 76.0, 37.0, 31.0, 22.0, 19.0, 9.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.00390625, -4.85791015625, -4.7119140625, -4.56591796875, -4.419921875, -4.27392578125, -4.1279296875, -3.98193359375, -3.8359375, -3.68994140625, -3.5439453125, -3.39794921875, -3.251953125, -3.10595703125, -2.9599609375, -2.81396484375, -2.66796875, -2.52197265625, -2.3759765625, -2.22998046875, -2.083984375, -1.93798828125, -1.7919921875, -1.64599609375, -1.5, -1.35400390625, -1.2080078125, -1.06201171875, -0.916015625, -0.77001953125, -0.6240234375, -0.47802734375, -0.33203125, -0.18603515625, -0.0400390625, 0.10595703125, 0.251953125, 0.39794921875, 0.5439453125, 0.68994140625, 0.8359375, 0.98193359375, 1.1279296875, 1.27392578125, 1.419921875, 1.56591796875, 1.7119140625, 1.85791015625, 2.00390625, 2.14990234375, 2.2958984375, 2.44189453125, 2.587890625, 2.73388671875, 2.8798828125, 3.02587890625, 3.171875, 3.31787109375, 3.4638671875, 3.60986328125, 3.755859375, 3.90185546875, 4.0478515625, 4.19384765625, 4.33984375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 14.0, 12.0, 16.0, 15.0, 20.0, 26.0, 28.0, 40.0, 42.0, 43.0, 55.0, 65.0, 55.0, 101.0, 246.0, 1471.0, 244.0, 110.0, 76.0, 55.0, 28.0, 41.0, 30.0, 31.0, 25.0, 25.0, 18.0, 19.0, 15.0, 12.0, 4.0, 6.0, 12.0, 4.0, 4.0, 5.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-23.953125, -23.259033203125, -22.56494140625, -21.870849609375, -21.1767578125, -20.482666015625, -19.78857421875, -19.094482421875, -18.400390625, -17.706298828125, -17.01220703125, -16.318115234375, -15.6240234375, -14.929931640625, -14.23583984375, -13.541748046875, -12.84765625, -12.153564453125, -11.45947265625, -10.765380859375, -10.0712890625, -9.377197265625, -8.68310546875, -7.989013671875, -7.294921875, -6.600830078125, -5.90673828125, -5.212646484375, -4.5185546875, -3.824462890625, -3.13037109375, -2.436279296875, -1.7421875, -1.048095703125, -0.35400390625, 0.340087890625, 1.0341796875, 1.728271484375, 2.42236328125, 3.116455078125, 3.810546875, 4.504638671875, 5.19873046875, 5.892822265625, 6.5869140625, 7.281005859375, 7.97509765625, 8.669189453125, 9.36328125, 10.057373046875, 10.75146484375, 11.445556640625, 12.1396484375, 12.833740234375, 13.52783203125, 14.221923828125, 14.916015625, 15.610107421875, 16.30419921875, 16.998291015625, 17.6923828125, 18.386474609375, 19.08056640625, 19.774658203125, 20.46875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 9.0, 16.0, 21.0, 21.0, 31.0, 52.0, 72.0, 122.0, 169.0, 270.0, 580.0, 3066.0, 3036084.0, 102895.0, 1202.0, 432.0, 199.0, 141.0, 100.0, 65.0, 44.0, 43.0, 20.0, 14.0, 5.0, 11.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.0, -73.265625, -70.53125, -67.796875, -65.0625, -62.328125, -59.59375, -56.859375, -54.125, -51.390625, -48.65625, -45.921875, -43.1875, -40.453125, -37.71875, -34.984375, -32.25, -29.515625, -26.78125, -24.046875, -21.3125, -18.578125, -15.84375, -13.109375, -10.375, -7.640625, -4.90625, -2.171875, 0.5625, 3.296875, 6.03125, 8.765625, 11.5, 14.234375, 16.96875, 19.703125, 22.4375, 25.171875, 27.90625, 30.640625, 33.375, 36.109375, 38.84375, 41.578125, 44.3125, 47.046875, 49.78125, 52.515625, 55.25, 57.984375, 60.71875, 63.453125, 66.1875, 68.921875, 71.65625, 74.390625, 77.125, 79.859375, 82.59375, 85.328125, 88.0625, 90.796875, 93.53125, 96.265625, 99.0]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 28.0, 303.0, 548.0, 127.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-265.9557189941406, -261.1466979980469, -256.3376770019531, -251.52865600585938, -246.71963500976562, -241.91061401367188, -237.10159301757812, -232.29258728027344, -227.4835662841797, -222.67454528808594, -217.8655242919922, -213.05650329589844, -208.2474822998047, -203.4384765625, -198.62945556640625, -193.8204345703125, -189.01141357421875, -184.202392578125, -179.39337158203125, -174.5843505859375, -169.77532958984375, -164.96630859375, -160.15728759765625, -155.34828186035156, -150.53924560546875, -145.730224609375, -140.92120361328125, -136.1121826171875, -131.30316162109375, -126.49414825439453, -121.68512725830078, -116.87611389160156, -112.06709289550781, -107.25807189941406, -102.44905090332031, -97.64002990722656, -92.83101654052734, -88.0219955444336, -83.21297454833984, -78.40396118164062, -73.59494018554688, -68.78591918945312, -63.97690200805664, -59.16788101196289, -54.358863830566406, -49.549842834472656, -44.740821838378906, -39.93180465698242, -35.12278366088867, -30.313764572143555, -25.504745483398438, -20.695724487304688, -15.88670539855957, -11.077686309814453, -6.268665313720703, -1.4596481323242188, 3.3493728637695312, 8.158391952514648, 12.967411994934082, 17.776432037353516, 22.585451126098633, 27.39447021484375, 32.2034912109375, 37.012508392333984, 41.821529388427734]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 2.0, 6.0, 4.0, 7.0, 11.0, 20.0, 10.0, 20.0, 18.0, 15.0, 22.0, 23.0, 29.0, 24.0, 36.0, 39.0, 35.0, 28.0, 36.0, 35.0, 46.0, 40.0, 45.0, 35.0, 39.0, 39.0, 30.0, 47.0, 38.0, 23.0, 25.0, 27.0, 22.0, 18.0, 8.0, 13.0, 13.0, 7.0, 13.0, 10.0, 9.0, 6.0, 6.0, 4.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-44.75486373901367, -43.29269027709961, -41.83052062988281, -40.36834716796875, -38.90617370605469, -37.44400405883789, -35.98183059692383, -34.51966094970703, -33.05748748779297, -31.59531593322754, -30.13314437866211, -28.670970916748047, -27.208799362182617, -25.746627807617188, -24.284454345703125, -22.822282791137695, -21.360111236572266, -19.897939682006836, -18.435768127441406, -16.973594665527344, -15.511423110961914, -14.049251556396484, -12.587079048156738, -11.124906539916992, -9.662734985351562, -8.200563430786133, -6.738390922546387, -5.276218891143799, -3.814046859741211, -2.351874828338623, -0.8897027969360352, 0.5724697113037109, 2.0346450805664062, 3.496817111968994, 4.958989143371582, 6.42116117477417, 7.883333206176758, 9.345504760742188, 10.807677268981934, 12.26984977722168, 13.73202133178711, 15.194192886352539, 16.65636444091797, 18.11853790283203, 19.58070945739746, 21.04288101196289, 22.505054473876953, 23.967226028442383, 25.429397583007812, 26.891569137573242, 28.353740692138672, 29.815914154052734, 31.278085708618164, 32.740257263183594, 34.202430725097656, 35.66460418701172, 37.126773834228516, 38.58894729614258, 40.051116943359375, 41.51329040527344, 42.9754638671875, 44.4376335144043, 45.89980697631836, 47.361976623535156, 48.82415008544922]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 10.0, 7.0, 12.0, 12.0, 14.0, 9.0, 17.0, 25.0, 35.0, 30.0, 30.0, 29.0, 37.0, 41.0, 58.0, 48.0, 47.0, 32.0, 55.0, 30.0, 52.0, 48.0, 35.0, 35.0, 34.0, 32.0, 35.0, 30.0, 20.0, 22.0, 14.0, 11.0, 9.0, 15.0, 7.0, 4.0, 1.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265625, -5.0556640625, -4.845703125, -4.6357421875, -4.42578125, -4.2158203125, -4.005859375, -3.7958984375, -3.5859375, -3.3759765625, -3.166015625, -2.9560546875, -2.74609375, -2.5361328125, -2.326171875, -2.1162109375, -1.90625, -1.6962890625, -1.486328125, -1.2763671875, -1.06640625, -0.8564453125, -0.646484375, -0.4365234375, -0.2265625, -0.0166015625, 0.193359375, 0.4033203125, 0.61328125, 0.8232421875, 1.033203125, 1.2431640625, 1.453125, 1.6630859375, 1.873046875, 2.0830078125, 2.29296875, 2.5029296875, 2.712890625, 2.9228515625, 3.1328125, 3.3427734375, 3.552734375, 3.7626953125, 3.97265625, 4.1826171875, 4.392578125, 4.6025390625, 4.8125, 5.0224609375, 5.232421875, 5.4423828125, 5.65234375, 5.8623046875, 6.072265625, 6.2822265625, 6.4921875, 6.7021484375, 6.912109375, 7.1220703125, 7.33203125, 7.5419921875, 7.751953125, 7.9619140625, 8.171875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 8.0, 3.0, 4.0, 8.0, 8.0, 9.0, 12.0, 13.0, 17.0, 14.0, 25.0, 28.0, 33.0, 42.0, 67.0, 96.0, 165.0, 452.0, 2073.0, 44905.0, 2109549.0, 1996325.0, 37669.0, 1834.0, 382.0, 163.0, 81.0, 60.0, 52.0, 38.0, 32.0, 18.0, 19.0, 14.0, 13.0, 14.0, 12.0, 5.0, 8.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.474609375, -16.74609375, -16.017578125, -15.2890625, -14.560546875, -13.83203125, -13.103515625, -12.375, -11.646484375, -10.91796875, -10.189453125, -9.4609375, -8.732421875, -8.00390625, -7.275390625, -6.546875, -5.818359375, -5.08984375, -4.361328125, -3.6328125, -2.904296875, -2.17578125, -1.447265625, -0.71875, 0.009765625, 0.73828125, 1.466796875, 2.1953125, 2.923828125, 3.65234375, 4.380859375, 5.109375, 5.837890625, 6.56640625, 7.294921875, 8.0234375, 8.751953125, 9.48046875, 10.208984375, 10.9375, 11.666015625, 12.39453125, 13.123046875, 13.8515625, 14.580078125, 15.30859375, 16.037109375, 16.765625, 17.494140625, 18.22265625, 18.951171875, 19.6796875, 20.408203125, 21.13671875, 21.865234375, 22.59375, 23.322265625, 24.05078125, 24.779296875, 25.5078125, 26.236328125, 26.96484375, 27.693359375, 28.421875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 13.0, 12.0, 11.0, 18.0, 25.0, 38.0, 52.0, 86.0, 85.0, 120.0, 150.0, 213.0, 261.0, 363.0, 378.0, 456.0, 371.0, 336.0, 267.0, 216.0, 167.0, 97.0, 86.0, 44.0, 54.0, 30.0, 30.0, 21.0, 16.0, 15.0, 6.0, 4.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1328125, -11.74658203125, -11.3603515625, -10.97412109375, -10.587890625, -10.20166015625, -9.8154296875, -9.42919921875, -9.04296875, -8.65673828125, -8.2705078125, -7.88427734375, -7.498046875, -7.11181640625, -6.7255859375, -6.33935546875, -5.953125, -5.56689453125, -5.1806640625, -4.79443359375, -4.408203125, -4.02197265625, -3.6357421875, -3.24951171875, -2.86328125, -2.47705078125, -2.0908203125, -1.70458984375, -1.318359375, -0.93212890625, -0.5458984375, -0.15966796875, 0.2265625, 0.61279296875, 0.9990234375, 1.38525390625, 1.771484375, 2.15771484375, 2.5439453125, 2.93017578125, 3.31640625, 3.70263671875, 4.0888671875, 4.47509765625, 4.861328125, 5.24755859375, 5.6337890625, 6.02001953125, 6.40625, 6.79248046875, 7.1787109375, 7.56494140625, 7.951171875, 8.33740234375, 8.7236328125, 9.10986328125, 9.49609375, 9.88232421875, 10.2685546875, 10.65478515625, 11.041015625, 11.42724609375, 11.8134765625, 12.19970703125, 12.5859375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 10.0, 14.0, 15.0, 18.0, 30.0, 28.0, 45.0, 65.0, 87.0, 103.0, 182.0, 224.0, 482.0, 1565.0, 28068.0, 3178620.0, 974560.0, 8115.0, 911.0, 346.0, 228.0, 165.0, 120.0, 79.0, 56.0, 50.0, 28.0, 15.0, 16.0, 13.0, 8.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.65625, -27.34423828125, -26.0322265625, -24.72021484375, -23.408203125, -22.09619140625, -20.7841796875, -19.47216796875, -18.16015625, -16.84814453125, -15.5361328125, -14.22412109375, -12.912109375, -11.60009765625, -10.2880859375, -8.97607421875, -7.6640625, -6.35205078125, -5.0400390625, -3.72802734375, -2.416015625, -1.10400390625, 0.2080078125, 1.52001953125, 2.83203125, 4.14404296875, 5.4560546875, 6.76806640625, 8.080078125, 9.39208984375, 10.7041015625, 12.01611328125, 13.328125, 14.64013671875, 15.9521484375, 17.26416015625, 18.576171875, 19.88818359375, 21.2001953125, 22.51220703125, 23.82421875, 25.13623046875, 26.4482421875, 27.76025390625, 29.072265625, 30.38427734375, 31.6962890625, 33.00830078125, 34.3203125, 35.63232421875, 36.9443359375, 38.25634765625, 39.568359375, 40.88037109375, 42.1923828125, 43.50439453125, 44.81640625, 46.12841796875, 47.4404296875, 48.75244140625, 50.064453125, 51.37646484375, 52.6884765625, 54.00048828125, 55.3125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 9.0, 14.0, 37.0, 59.0, 117.0, 134.0, 154.0, 142.0, 139.0, 91.0, 55.0, 30.0, 12.0, 7.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.99246978759766, -82.63236999511719, -80.27227783203125, -77.91217803955078, -75.55208587646484, -73.19198608398438, -70.83189392089844, -68.47179412841797, -66.1116943359375, -63.7515983581543, -61.391502380371094, -59.03140640258789, -56.67131042480469, -54.31121063232422, -51.951114654541016, -49.59101867675781, -47.230926513671875, -44.87083053588867, -42.51073455810547, -40.150638580322266, -37.79054260253906, -35.430442810058594, -33.07034683227539, -30.710250854492188, -28.350154876708984, -25.99005889892578, -23.629962921142578, -21.269865036010742, -18.90976905822754, -16.549673080444336, -14.189576148986816, -11.829479217529297, -9.469375610351562, -7.109279155731201, -4.74918270111084, -2.3890862464904785, -0.028989791870117188, 2.331106185913086, 4.6912031173706055, 7.051300048828125, 9.411396026611328, 11.771492004394531, 14.13158893585205, 16.49168586730957, 18.851781845092773, 21.211877822875977, 23.571975708007812, 25.932071685791016, 28.29216766357422, 30.652263641357422, 33.012359619140625, 35.37245559692383, 37.73255157470703, 40.0926513671875, 42.4527473449707, 44.812843322753906, 47.17293930053711, 49.53303527832031, 51.893131256103516, 54.25322723388672, 56.61332702636719, 58.973419189453125, 61.333518981933594, 63.6936149597168, 66.0537109375]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 1.0, 4.0, 4.0, 10.0, 8.0, 5.0, 12.0, 13.0, 20.0, 11.0, 20.0, 23.0, 24.0, 25.0, 25.0, 26.0, 22.0, 25.0, 42.0, 40.0, 46.0, 31.0, 45.0, 35.0, 39.0, 40.0, 49.0, 39.0, 33.0, 21.0, 27.0, 26.0, 30.0, 25.0, 32.0, 15.0, 12.0, 19.0, 14.0, 16.0, 12.0, 8.0, 6.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.96825408935547, -32.69132614135742, -31.414400100708008, -30.13747215270996, -28.860546112060547, -27.5836181640625, -26.306690216064453, -25.02976417541504, -23.752838134765625, -22.475910186767578, -21.198984146118164, -19.922056198120117, -18.645130157470703, -17.368202209472656, -16.09127426147461, -14.814348220825195, -13.537420272827148, -12.260493278503418, -10.983566284179688, -9.70663833618164, -8.429712295532227, -7.152784824371338, -5.875857353210449, -4.598930358886719, -3.3220033645629883, -2.045076370239258, -0.7681491374969482, 0.5087780952453613, 1.7857050895690918, 3.0626320838928223, 4.339559555053711, 5.616486549377441, 6.893413543701172, 8.170340538024902, 9.447267532348633, 10.72419548034668, 12.001121520996094, 13.27804946899414, 14.554976463317871, 15.831903457641602, 17.108829498291016, 18.385757446289062, 19.662683486938477, 20.939611434936523, 22.216537475585938, 23.493465423583984, 24.77039337158203, 26.047319412231445, 27.324247360229492, 28.60117530822754, 29.878101348876953, 31.155029296875, 32.43195724487305, 33.70888137817383, 34.985809326171875, 36.26273727416992, 37.53966522216797, 38.816593170166016, 40.09352111816406, 41.370445251464844, 42.64737319946289, 43.92430114746094, 45.201229095458984, 46.47815704345703, 47.75508117675781]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 14.0, 12.0, 13.0, 19.0, 20.0, 24.0, 30.0, 39.0, 22.0, 42.0, 39.0, 47.0, 49.0, 40.0, 51.0, 53.0, 38.0, 51.0, 40.0, 43.0, 41.0, 38.0, 39.0, 39.0, 34.0, 15.0, 19.0, 13.0, 18.0, 11.0, 11.0, 3.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2401123046875, -5.027099609375, -4.8140869140625, -4.60107421875, -4.3880615234375, -4.175048828125, -3.9620361328125, -3.7490234375, -3.5360107421875, -3.322998046875, -3.1099853515625, -2.89697265625, -2.6839599609375, -2.470947265625, -2.2579345703125, -2.044921875, -1.8319091796875, -1.618896484375, -1.4058837890625, -1.19287109375, -0.9798583984375, -0.766845703125, -0.5538330078125, -0.3408203125, -0.1278076171875, 0.085205078125, 0.2982177734375, 0.51123046875, 0.7242431640625, 0.937255859375, 1.1502685546875, 1.36328125, 1.5762939453125, 1.789306640625, 2.0023193359375, 2.21533203125, 2.4283447265625, 2.641357421875, 2.8543701171875, 3.0673828125, 3.2803955078125, 3.493408203125, 3.7064208984375, 3.91943359375, 4.1324462890625, 4.345458984375, 4.5584716796875, 4.771484375, 4.9844970703125, 5.197509765625, 5.4105224609375, 5.62353515625, 5.8365478515625, 6.049560546875, 6.2625732421875, 6.4755859375, 6.6885986328125, 6.901611328125, 7.1146240234375, 7.32763671875, 7.5406494140625, 7.753662109375, 7.9666748046875, 8.1796875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 11.0, 11.0, 16.0, 25.0, 22.0, 53.0, 67.0, 96.0, 158.0, 257.0, 385.0, 694.0, 1148.0, 1896.0, 3134.0, 5266.0, 8681.0, 15126.0, 26502.0, 47954.0, 90157.0, 192009.0, 315622.0, 162130.0, 78544.0, 41774.0, 23442.0, 13702.0, 7969.0, 4663.0, 2816.0, 1725.0, 990.0, 595.0, 347.0, 213.0, 132.0, 77.0, 55.0, 39.0, 21.0, 12.0, 8.0, 9.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.275390625, -1.2371978759765625, -1.199005126953125, -1.1608123779296875, -1.12261962890625, -1.0844268798828125, -1.046234130859375, -1.0080413818359375, -0.9698486328125, -0.9316558837890625, -0.893463134765625, -0.8552703857421875, -0.81707763671875, -0.7788848876953125, -0.740692138671875, -0.7024993896484375, -0.664306640625, -0.6261138916015625, -0.587921142578125, -0.5497283935546875, -0.51153564453125, -0.4733428955078125, -0.435150146484375, -0.3969573974609375, -0.3587646484375, -0.3205718994140625, -0.282379150390625, -0.2441864013671875, -0.20599365234375, -0.1678009033203125, -0.129608154296875, -0.0914154052734375, -0.05322265625, -0.0150299072265625, 0.023162841796875, 0.0613555908203125, 0.09954833984375, 0.1377410888671875, 0.175933837890625, 0.2141265869140625, 0.2523193359375, 0.2905120849609375, 0.328704833984375, 0.3668975830078125, 0.40509033203125, 0.4432830810546875, 0.481475830078125, 0.5196685791015625, 0.557861328125, 0.5960540771484375, 0.634246826171875, 0.6724395751953125, 0.71063232421875, 0.7488250732421875, 0.787017822265625, 0.8252105712890625, 0.8634033203125, 0.9015960693359375, 0.939788818359375, 0.9779815673828125, 1.01617431640625, 1.0543670654296875, 1.092559814453125, 1.1307525634765625, 1.1689453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 2.0, 4.0, 11.0, 9.0, 14.0, 9.0, 11.0, 19.0, 21.0, 24.0, 21.0, 28.0, 40.0, 37.0, 36.0, 34.0, 39.0, 34.0, 50.0, 41.0, 1069.0, 45.0, 46.0, 34.0, 29.0, 41.0, 32.0, 31.0, 27.0, 25.0, 31.0, 24.0, 20.0, 17.0, 11.0, 8.0, 13.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.483673095703125, -3.36383056640625, -3.243988037109375, -3.1241455078125, -3.004302978515625, -2.88446044921875, -2.764617919921875, -2.644775390625, -2.524932861328125, -2.40509033203125, -2.285247802734375, -2.1654052734375, -2.045562744140625, -1.92572021484375, -1.805877685546875, -1.68603515625, -1.566192626953125, -1.44635009765625, -1.326507568359375, -1.2066650390625, -1.086822509765625, -0.96697998046875, -0.847137451171875, -0.727294921875, -0.607452392578125, -0.48760986328125, -0.367767333984375, -0.2479248046875, -0.128082275390625, -0.00823974609375, 0.111602783203125, 0.2314453125, 0.351287841796875, 0.47113037109375, 0.590972900390625, 0.7108154296875, 0.830657958984375, 0.95050048828125, 1.070343017578125, 1.190185546875, 1.310028076171875, 1.42987060546875, 1.549713134765625, 1.6695556640625, 1.789398193359375, 1.90924072265625, 2.029083251953125, 2.14892578125, 2.268768310546875, 2.38861083984375, 2.508453369140625, 2.6282958984375, 2.748138427734375, 2.86798095703125, 2.987823486328125, 3.107666015625, 3.227508544921875, 3.34735107421875, 3.467193603515625, 3.5870361328125, 3.706878662109375, 3.82672119140625, 3.946563720703125, 4.06640625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 9.0, 2.0, 6.0, 6.0, 14.0, 17.0, 7.0, 34.0, 41.0, 54.0, 86.0, 114.0, 143.0, 221.0, 331.0, 468.0, 701.0, 994.0, 1505.0, 2268.0, 3511.0, 5349.0, 8327.0, 13098.0, 20691.0, 33983.0, 56970.0, 102216.0, 206577.0, 1319439.0, 134982.0, 71573.0, 41760.0, 25711.0, 16149.0, 10275.0, 6636.0, 4275.0, 2733.0, 1849.0, 1241.0, 847.0, 583.0, 407.0, 272.0, 189.0, 147.0, 98.0, 71.0, 53.0, 30.0, 29.0, 18.0, 9.0, 11.0, 11.0, 2.0, 1.0, 3.0], "bins": [-1.0654296875, -1.0342864990234375, -1.003143310546875, -0.9720001220703125, -0.94085693359375, -0.9097137451171875, -0.878570556640625, -0.8474273681640625, -0.8162841796875, -0.7851409912109375, -0.753997802734375, -0.7228546142578125, -0.69171142578125, -0.6605682373046875, -0.629425048828125, -0.5982818603515625, -0.567138671875, -0.5359954833984375, -0.504852294921875, -0.4737091064453125, -0.44256591796875, -0.4114227294921875, -0.380279541015625, -0.3491363525390625, -0.3179931640625, -0.2868499755859375, -0.255706787109375, -0.2245635986328125, -0.19342041015625, -0.1622772216796875, -0.131134033203125, -0.0999908447265625, -0.06884765625, -0.0377044677734375, -0.006561279296875, 0.0245819091796875, 0.05572509765625, 0.0868682861328125, 0.118011474609375, 0.1491546630859375, 0.1802978515625, 0.2114410400390625, 0.242584228515625, 0.2737274169921875, 0.30487060546875, 0.3360137939453125, 0.367156982421875, 0.3983001708984375, 0.429443359375, 0.4605865478515625, 0.491729736328125, 0.5228729248046875, 0.55401611328125, 0.5851593017578125, 0.616302490234375, 0.6474456787109375, 0.6785888671875, 0.7097320556640625, 0.740875244140625, 0.7720184326171875, 0.80316162109375, 0.8343048095703125, 0.865447998046875, 0.8965911865234375, 0.927734375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 12.0, 17.0, 14.0, 30.0, 23.0, 46.0, 54.0, 52.0, 63.0, 80.0, 82.0, 96.0, 79.0, 68.0, 57.0, 41.0, 36.0, 28.0, 24.0, 14.0, 9.0, 8.0, 10.0, 4.0, 7.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0012731552124023438, -0.0012330114841461182, -0.0011928677558898926, -0.001152724027633667, -0.0011125802993774414, -0.0010724365711212158, -0.0010322928428649902, -0.0009921491146087646, -0.0009520053863525391, -0.0009118616580963135, -0.0008717179298400879, -0.0008315742015838623, -0.0007914304733276367, -0.0007512867450714111, -0.0007111430168151855, -0.00067099928855896, -0.0006308555603027344, -0.0005907118320465088, -0.0005505681037902832, -0.0005104243755340576, -0.00047028064727783203, -0.00043013691902160645, -0.00038999319076538086, -0.0003498494625091553, -0.0003097057342529297, -0.0002695620059967041, -0.00022941827774047852, -0.00018927454948425293, -0.00014913082122802734, -0.00010898709297180176, -6.884336471557617e-05, -2.8699636459350586e-05, 1.1444091796875e-05, 5.1587820053100586e-05, 9.173154830932617e-05, 0.00013187527656555176, 0.00017201900482177734, 0.00021216273307800293, 0.0002523064613342285, 0.0002924501895904541, 0.0003325939178466797, 0.0003727376461029053, 0.00041288137435913086, 0.00045302510261535645, 0.000493168830871582, 0.0005333125591278076, 0.0005734562873840332, 0.0006136000156402588, 0.0006537437438964844, 0.00069388747215271, 0.0007340312004089355, 0.0007741749286651611, 0.0008143186569213867, 0.0008544623851776123, 0.0008946061134338379, 0.0009347498416900635, 0.0009748935699462891, 0.0010150372982025146, 0.0010551810264587402, 0.0010953247547149658, 0.0011354684829711914, 0.001175612211227417, 0.0012157559394836426, 0.0012558996677398682, 0.0012960433959960938]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 6.0, 6.0, 15.0, 11.0, 13.0, 21.0, 42.0, 50.0, 64.0, 146.0, 235.0, 523.0, 2943.0, 1020774.0, 22204.0, 752.0, 262.0, 156.0, 92.0, 73.0, 45.0, 30.0, 21.0, 10.0, 12.0, 9.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02911376953125, -0.02822256088256836, -0.02733135223388672, -0.026440143585205078, -0.025548934936523438, -0.024657726287841797, -0.023766517639160156, -0.022875308990478516, -0.021984100341796875, -0.021092891693115234, -0.020201683044433594, -0.019310474395751953, -0.018419265747070312, -0.017528057098388672, -0.01663684844970703, -0.01574563980102539, -0.01485443115234375, -0.01396322250366211, -0.013072013854980469, -0.012180805206298828, -0.011289596557617188, -0.010398387908935547, -0.009507179260253906, -0.008615970611572266, -0.007724761962890625, -0.006833553314208984, -0.005942344665527344, -0.005051136016845703, -0.0041599273681640625, -0.003268718719482422, -0.0023775100708007812, -0.0014863014221191406, -0.0005950927734375, 0.0002961158752441406, 0.0011873245239257812, 0.002078533172607422, 0.0029697418212890625, 0.003860950469970703, 0.004752159118652344, 0.005643367767333984, 0.006534576416015625, 0.007425785064697266, 0.008316993713378906, 0.009208202362060547, 0.010099411010742188, 0.010990619659423828, 0.011881828308105469, 0.01277303695678711, 0.01366424560546875, 0.01455545425415039, 0.015446662902832031, 0.016337871551513672, 0.017229080200195312, 0.018120288848876953, 0.019011497497558594, 0.019902706146240234, 0.020793914794921875, 0.021685123443603516, 0.022576332092285156, 0.023467540740966797, 0.024358749389648438, 0.025249958038330078, 0.02614116668701172, 0.02703237533569336, 0.027923583984375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 10.0, 43.0, 55.0, 123.0, 203.0, 205.0, 169.0, 114.0, 56.0, 15.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012491774978116155, -0.001207944587804377, -0.0011667115613818169, -0.0011254786513745785, -0.00108424574136734, -0.0010430127149447799, -0.0010017798049375415, -0.0009605468367226422, -0.0009193138685077429, -0.0008780809002928436, -0.0008368479320779443, -0.0007956150220707059, -0.0007543820538558066, -0.0007131490856409073, -0.0006719161756336689, -0.0006306832074187696, -0.0005894502392038703, -0.000548217270988971, -0.0005069843027740717, -0.0004657513927668333, -0.000424518424551934, -0.0003832854563370347, -0.00034205251722596586, -0.000300819578114897, -0.0002595866098999977, -0.00021835365623701364, -0.00017712070257402956, -0.0001358877489110455, -9.465479524806142e-05, -5.3421841585077345e-05, -1.2188887922093272e-05, 2.9044051188975573e-05, 7.02771358191967e-05, 0.00011151008948218077, 0.00015274304314516485, 0.00019397599680814892, 0.000235208950471133, 0.0002764419186860323, 0.00031767485779710114, 0.00035890779690817, 0.0004001407651230693, 0.0004413737333379686, 0.00048260667244903743, 0.0005238396115601063, 0.0005650725797750056, 0.0006063055479899049, 0.0006475384579971433, 0.0006887714262120426, 0.0007300043944269419, 0.0007712373626418412, 0.0008124703308567405, 0.0008537032408639789, 0.0008949362090788782, 0.0009361691772937775, 0.0009774020873010159, 0.0010186349973082542, 0.0010598680237308145, 0.0011011009337380528, 0.001142333960160613, 0.0011835668701678514, 0.0012247997801750898, 0.00126603280659765, 0.0013072657166048884, 0.0013484987430274487, 0.001389731653034687]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 9.0, 9.0, 9.0, 9.0, 12.0, 14.0, 13.0, 20.0, 27.0, 19.0, 23.0, 27.0, 25.0, 27.0, 45.0, 38.0, 48.0, 49.0, 40.0, 50.0, 40.0, 34.0, 32.0, 45.0, 31.0, 32.0, 26.0, 42.0, 27.0, 22.0, 24.0, 19.0, 19.0, 21.0, 13.0, 9.0, 14.0, 11.0, 13.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0005900859832763672, -0.0005727093666791916, -0.000555332750082016, -0.0005379561334848404, -0.0005205795168876648, -0.0005032029002904892, -0.0004858262836933136, -0.000468449667096138, -0.0004510730504989624, -0.0004336964339017868, -0.0004163198173046112, -0.0003989432007074356, -0.00038156658411026, -0.0003641899675130844, -0.0003468133509159088, -0.0003294367343187332, -0.0003120601177215576, -0.000294683501124382, -0.0002773068845272064, -0.0002599302679300308, -0.00024255365133285522, -0.00022517703473567963, -0.00020780041813850403, -0.00019042380154132843, -0.00017304718494415283, -0.00015567056834697723, -0.00013829395174980164, -0.00012091733515262604, -0.00010354071855545044, -8.616410195827484e-05, -6.878748536109924e-05, -5.1410868763923645e-05, -3.403425216674805e-05, -1.665763556957245e-05, 7.189810276031494e-07, 1.8095597624778748e-05, 3.5472214221954346e-05, 5.2848830819129944e-05, 7.022544741630554e-05, 8.760206401348114e-05, 0.00010497868061065674, 0.00012235529720783234, 0.00013973191380500793, 0.00015710853040218353, 0.00017448514699935913, 0.00019186176359653473, 0.00020923838019371033, 0.00022661499679088593, 0.00024399161338806152, 0.0002613682299852371, 0.0002787448465824127, 0.0002961214631795883, 0.0003134980797767639, 0.0003308746963739395, 0.0003482513129711151, 0.0003656279295682907, 0.0003830045461654663, 0.0004003811627626419, 0.0004177577793598175, 0.0004351343959569931, 0.0004525110125541687, 0.0004698876291513443, 0.0004872642457485199, 0.0005046408623456955, 0.0005220174789428711]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 14.0, 12.0, 13.0, 19.0, 20.0, 24.0, 30.0, 39.0, 22.0, 42.0, 39.0, 47.0, 49.0, 40.0, 51.0, 53.0, 38.0, 51.0, 40.0, 43.0, 41.0, 38.0, 39.0, 39.0, 34.0, 15.0, 19.0, 13.0, 18.0, 11.0, 11.0, 3.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2401123046875, -5.027099609375, -4.8140869140625, -4.60107421875, -4.3880615234375, -4.175048828125, -3.9620361328125, -3.7490234375, -3.5360107421875, -3.322998046875, -3.1099853515625, -2.89697265625, -2.6839599609375, -2.470947265625, -2.2579345703125, -2.044921875, -1.8319091796875, -1.618896484375, -1.4058837890625, -1.19287109375, -0.9798583984375, -0.766845703125, -0.5538330078125, -0.3408203125, -0.1278076171875, 0.085205078125, 0.2982177734375, 0.51123046875, 0.7242431640625, 0.937255859375, 1.1502685546875, 1.36328125, 1.5762939453125, 1.789306640625, 2.0023193359375, 2.21533203125, 2.4283447265625, 2.641357421875, 2.8543701171875, 3.0673828125, 3.2803955078125, 3.493408203125, 3.7064208984375, 3.91943359375, 4.1324462890625, 4.345458984375, 4.5584716796875, 4.771484375, 4.9844970703125, 5.197509765625, 5.4105224609375, 5.62353515625, 5.8365478515625, 6.049560546875, 6.2625732421875, 6.4755859375, 6.6885986328125, 6.901611328125, 7.1146240234375, 7.32763671875, 7.5406494140625, 7.753662109375, 7.9666748046875, 8.1796875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 15.0, 18.0, 34.0, 43.0, 57.0, 70.0, 89.0, 124.0, 188.0, 266.0, 453.0, 728.0, 1463.0, 2925.0, 6385.0, 15090.0, 33148.0, 71629.0, 156882.0, 344330.0, 229445.0, 99638.0, 46248.0, 21179.0, 9302.0, 4209.0, 1923.0, 986.0, 558.0, 326.0, 202.0, 153.0, 108.0, 74.0, 58.0, 45.0, 29.0, 31.0, 11.0, 11.0, 19.0, 6.0, 3.0, 6.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.75, -5.56280517578125, -5.3756103515625, -5.18841552734375, -5.001220703125, -4.81402587890625, -4.6268310546875, -4.43963623046875, -4.25244140625, -4.06524658203125, -3.8780517578125, -3.69085693359375, -3.503662109375, -3.31646728515625, -3.1292724609375, -2.94207763671875, -2.7548828125, -2.56768798828125, -2.3804931640625, -2.19329833984375, -2.006103515625, -1.81890869140625, -1.6317138671875, -1.44451904296875, -1.25732421875, -1.07012939453125, -0.8829345703125, -0.69573974609375, -0.508544921875, -0.32135009765625, -0.1341552734375, 0.05303955078125, 0.240234375, 0.42742919921875, 0.6146240234375, 0.80181884765625, 0.989013671875, 1.17620849609375, 1.3634033203125, 1.55059814453125, 1.73779296875, 1.92498779296875, 2.1121826171875, 2.29937744140625, 2.486572265625, 2.67376708984375, 2.8609619140625, 3.04815673828125, 3.2353515625, 3.42254638671875, 3.6097412109375, 3.79693603515625, 3.984130859375, 4.17132568359375, 4.3585205078125, 4.54571533203125, 4.73291015625, 4.92010498046875, 5.1072998046875, 5.29449462890625, 5.481689453125, 5.66888427734375, 5.8560791015625, 6.04327392578125, 6.23046875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 10.0, 6.0, 17.0, 10.0, 11.0, 10.0, 15.0, 31.0, 29.0, 33.0, 28.0, 33.0, 38.0, 39.0, 63.0, 92.0, 143.0, 1406.0, 358.0, 152.0, 90.0, 51.0, 49.0, 30.0, 33.0, 29.0, 37.0, 29.0, 23.0, 25.0, 23.0, 17.0, 18.0, 11.0, 14.0, 11.0, 5.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.309814453125, -15.68212890625, -15.054443359375, -14.4267578125, -13.799072265625, -13.17138671875, -12.543701171875, -11.916015625, -11.288330078125, -10.66064453125, -10.032958984375, -9.4052734375, -8.777587890625, -8.14990234375, -7.522216796875, -6.89453125, -6.266845703125, -5.63916015625, -5.011474609375, -4.3837890625, -3.756103515625, -3.12841796875, -2.500732421875, -1.873046875, -1.245361328125, -0.61767578125, 0.010009765625, 0.6376953125, 1.265380859375, 1.89306640625, 2.520751953125, 3.1484375, 3.776123046875, 4.40380859375, 5.031494140625, 5.6591796875, 6.286865234375, 6.91455078125, 7.542236328125, 8.169921875, 8.797607421875, 9.42529296875, 10.052978515625, 10.6806640625, 11.308349609375, 11.93603515625, 12.563720703125, 13.19140625, 13.819091796875, 14.44677734375, 15.074462890625, 15.7021484375, 16.329833984375, 16.95751953125, 17.585205078125, 18.212890625, 18.840576171875, 19.46826171875, 20.095947265625, 20.7236328125, 21.351318359375, 21.97900390625, 22.606689453125, 23.234375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 5.0, 6.0, 10.0, 9.0, 9.0, 14.0, 12.0, 11.0, 17.0, 25.0, 27.0, 37.0, 42.0, 50.0, 61.0, 82.0, 93.0, 138.0, 175.0, 292.0, 484.0, 1161.0, 18106.0, 3044328.0, 77088.0, 1712.0, 596.0, 287.0, 202.0, 123.0, 99.0, 86.0, 59.0, 46.0, 30.0, 33.0, 32.0, 17.0, 16.0, 21.0, 11.0, 8.0, 5.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-52.625, -50.9609375, -49.296875, -47.6328125, -45.96875, -44.3046875, -42.640625, -40.9765625, -39.3125, -37.6484375, -35.984375, -34.3203125, -32.65625, -30.9921875, -29.328125, -27.6640625, -26.0, -24.3359375, -22.671875, -21.0078125, -19.34375, -17.6796875, -16.015625, -14.3515625, -12.6875, -11.0234375, -9.359375, -7.6953125, -6.03125, -4.3671875, -2.703125, -1.0390625, 0.625, 2.2890625, 3.953125, 5.6171875, 7.28125, 8.9453125, 10.609375, 12.2734375, 13.9375, 15.6015625, 17.265625, 18.9296875, 20.59375, 22.2578125, 23.921875, 25.5859375, 27.25, 28.9140625, 30.578125, 32.2421875, 33.90625, 35.5703125, 37.234375, 38.8984375, 40.5625, 42.2265625, 43.890625, 45.5546875, 47.21875, 48.8828125, 50.546875, 52.2109375, 53.875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 26.0, 115.0, 296.0, 375.0, 149.0, 37.0, 10.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.363853454589844, -35.44792938232422, -32.53200149536133, -29.61607551574707, -26.700149536132812, -23.784223556518555, -20.868297576904297, -17.95237159729004, -15.036445617675781, -12.120519638061523, -9.204593658447266, -6.288667678833008, -3.37274169921875, -0.4568157196044922, 2.4591102600097656, 5.375036239624023, 8.290962219238281, 11.206888198852539, 14.122814178466797, 17.038740158081055, 19.954666137695312, 22.87059211730957, 25.786518096923828, 28.702444076538086, 31.618370056152344, 34.53429412841797, 37.45022201538086, 40.36614990234375, 43.282073974609375, 46.197998046875, 49.11392593383789, 52.02985382080078, 54.94578552246094, 57.86170959472656, 60.77763748168945, 63.693565368652344, 66.60948944091797, 69.5254135131836, 72.44134521484375, 75.35726928710938, 78.273193359375, 81.18911743164062, 84.10504150390625, 87.0209732055664, 89.93689727783203, 92.85282135009766, 95.76875305175781, 98.68467712402344, 101.60060119628906, 104.51652526855469, 107.43244934082031, 110.34838104248047, 113.2643051147461, 116.18022918701172, 119.09616088867188, 122.0120849609375, 124.92800903320312, 127.84393310546875, 130.75985717773438, 133.67578125, 136.59170532226562, 139.5076446533203, 142.42356872558594, 145.33949279785156, 148.2554168701172]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 2.0, 3.0, 7.0, 10.0, 1.0, 10.0, 10.0, 7.0, 10.0, 13.0, 18.0, 18.0, 25.0, 25.0, 23.0, 19.0, 37.0, 37.0, 38.0, 38.0, 46.0, 41.0, 44.0, 44.0, 45.0, 44.0, 42.0, 58.0, 30.0, 30.0, 37.0, 26.0, 18.0, 29.0, 20.0, 16.0, 12.0, 10.0, 5.0, 13.0, 7.0, 9.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-59.63190841674805, -57.779335021972656, -55.9267578125, -54.07418441772461, -52.22161102294922, -50.36903762817383, -48.51646423339844, -46.66388702392578, -44.81131362915039, -42.958740234375, -41.106163024902344, -39.25358963012695, -37.40101623535156, -35.54844284057617, -33.69586944580078, -31.843292236328125, -29.990718841552734, -28.138145446777344, -26.28557014465332, -24.432994842529297, -22.580421447753906, -20.727848052978516, -18.875272750854492, -17.02269744873047, -15.170124053955078, -13.317549705505371, -11.464975357055664, -9.612401008605957, -7.75982666015625, -5.907252311706543, -4.054677963256836, -2.202103614807129, -0.3495292663574219, 1.5030450820922852, 3.355619430541992, 5.208193778991699, 7.060768127441406, 8.913342475891113, 10.76591682434082, 12.618491172790527, 14.471065521240234, 16.323638916015625, 18.17621421813965, 20.028789520263672, 21.881362915039062, 23.733936309814453, 25.586511611938477, 27.4390869140625, 29.29166030883789, 31.14423370361328, 32.99681091308594, 34.84938430786133, 36.70195770263672, 38.55453109741211, 40.4071044921875, 42.259681701660156, 44.11225509643555, 45.96482849121094, 47.817405700683594, 49.669979095458984, 51.522552490234375, 53.375125885009766, 55.227699279785156, 57.08027648925781, 58.9328498840332]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 12.0, 17.0, 11.0, 24.0, 21.0, 21.0, 25.0, 21.0, 22.0, 40.0, 33.0, 35.0, 40.0, 41.0, 48.0, 32.0, 47.0, 42.0, 37.0, 49.0, 54.0, 47.0, 37.0, 37.0, 40.0, 23.0, 23.0, 19.0, 20.0, 16.0, 14.0, 15.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.89453125, -5.66607666015625, -5.4376220703125, -5.20916748046875, -4.980712890625, -4.75225830078125, -4.5238037109375, -4.29534912109375, -4.06689453125, -3.83843994140625, -3.6099853515625, -3.38153076171875, -3.153076171875, -2.92462158203125, -2.6961669921875, -2.46771240234375, -2.2392578125, -2.01080322265625, -1.7823486328125, -1.55389404296875, -1.325439453125, -1.09698486328125, -0.8685302734375, -0.64007568359375, -0.41162109375, -0.18316650390625, 0.0452880859375, 0.27374267578125, 0.502197265625, 0.73065185546875, 0.9591064453125, 1.18756103515625, 1.416015625, 1.64447021484375, 1.8729248046875, 2.10137939453125, 2.329833984375, 2.55828857421875, 2.7867431640625, 3.01519775390625, 3.24365234375, 3.47210693359375, 3.7005615234375, 3.92901611328125, 4.157470703125, 4.38592529296875, 4.6143798828125, 4.84283447265625, 5.0712890625, 5.29974365234375, 5.5281982421875, 5.75665283203125, 5.985107421875, 6.21356201171875, 6.4420166015625, 6.67047119140625, 6.89892578125, 7.12738037109375, 7.3558349609375, 7.58428955078125, 7.812744140625, 8.04119873046875, 8.2696533203125, 8.49810791015625, 8.7265625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 7.0, 4.0, 6.0, 20.0, 13.0, 16.0, 18.0, 21.0, 22.0, 30.0, 34.0, 37.0, 54.0, 82.0, 200.0, 558.0, 2782.0, 73737.0, 2579087.0, 1509469.0, 25504.0, 1707.0, 407.0, 135.0, 81.0, 44.0, 37.0, 36.0, 23.0, 22.0, 11.0, 14.0, 13.0, 14.0, 13.0, 6.0, 9.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.75, -18.98681640625, -18.2236328125, -17.46044921875, -16.697265625, -15.93408203125, -15.1708984375, -14.40771484375, -13.64453125, -12.88134765625, -12.1181640625, -11.35498046875, -10.591796875, -9.82861328125, -9.0654296875, -8.30224609375, -7.5390625, -6.77587890625, -6.0126953125, -5.24951171875, -4.486328125, -3.72314453125, -2.9599609375, -2.19677734375, -1.43359375, -0.67041015625, 0.0927734375, 0.85595703125, 1.619140625, 2.38232421875, 3.1455078125, 3.90869140625, 4.671875, 5.43505859375, 6.1982421875, 6.96142578125, 7.724609375, 8.48779296875, 9.2509765625, 10.01416015625, 10.77734375, 11.54052734375, 12.3037109375, 13.06689453125, 13.830078125, 14.59326171875, 15.3564453125, 16.11962890625, 16.8828125, 17.64599609375, 18.4091796875, 19.17236328125, 19.935546875, 20.69873046875, 21.4619140625, 22.22509765625, 22.98828125, 23.75146484375, 24.5146484375, 25.27783203125, 26.041015625, 26.80419921875, 27.5673828125, 28.33056640625, 29.09375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 9.0, 9.0, 21.0, 25.0, 48.0, 68.0, 107.0, 152.0, 249.0, 375.0, 493.0, 567.0, 568.0, 441.0, 330.0, 206.0, 157.0, 90.0, 57.0, 41.0, 27.0, 13.0, 9.0, 9.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3203125, -13.7178955078125, -13.115478515625, -12.5130615234375, -11.91064453125, -11.3082275390625, -10.705810546875, -10.1033935546875, -9.5009765625, -8.8985595703125, -8.296142578125, -7.6937255859375, -7.09130859375, -6.4888916015625, -5.886474609375, -5.2840576171875, -4.681640625, -4.0792236328125, -3.476806640625, -2.8743896484375, -2.27197265625, -1.6695556640625, -1.067138671875, -0.4647216796875, 0.1376953125, 0.7401123046875, 1.342529296875, 1.9449462890625, 2.54736328125, 3.1497802734375, 3.752197265625, 4.3546142578125, 4.95703125, 5.5594482421875, 6.161865234375, 6.7642822265625, 7.36669921875, 7.9691162109375, 8.571533203125, 9.1739501953125, 9.7763671875, 10.3787841796875, 10.981201171875, 11.5836181640625, 12.18603515625, 12.7884521484375, 13.390869140625, 13.9932861328125, 14.595703125, 15.1981201171875, 15.800537109375, 16.4029541015625, 17.00537109375, 17.6077880859375, 18.210205078125, 18.8126220703125, 19.4150390625, 20.0174560546875, 20.619873046875, 21.2222900390625, 21.82470703125, 22.4271240234375, 23.029541015625, 23.6319580078125, 24.234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 14.0, 11.0, 18.0, 28.0, 48.0, 79.0, 102.0, 159.0, 226.0, 342.0, 595.0, 2935.0, 1787787.0, 2396693.0, 3585.0, 646.0, 375.0, 197.0, 166.0, 117.0, 55.0, 40.0, 33.0, 16.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.4375, -79.40283203125, -77.3681640625, -75.33349609375, -73.298828125, -71.26416015625, -69.2294921875, -67.19482421875, -65.16015625, -63.12548828125, -61.0908203125, -59.05615234375, -57.021484375, -54.98681640625, -52.9521484375, -50.91748046875, -48.8828125, -46.84814453125, -44.8134765625, -42.77880859375, -40.744140625, -38.70947265625, -36.6748046875, -34.64013671875, -32.60546875, -30.57080078125, -28.5361328125, -26.50146484375, -24.466796875, -22.43212890625, -20.3974609375, -18.36279296875, -16.328125, -14.29345703125, -12.2587890625, -10.22412109375, -8.189453125, -6.15478515625, -4.1201171875, -2.08544921875, -0.05078125, 1.98388671875, 4.0185546875, 6.05322265625, 8.087890625, 10.12255859375, 12.1572265625, 14.19189453125, 16.2265625, 18.26123046875, 20.2958984375, 22.33056640625, 24.365234375, 26.39990234375, 28.4345703125, 30.46923828125, 32.50390625, 34.53857421875, 36.5732421875, 38.60791015625, 40.642578125, 42.67724609375, 44.7119140625, 46.74658203125, 48.78125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 20.0, 49.0, 135.0, 203.0, 237.0, 183.0, 113.0, 36.0, 21.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.71265411376953, -58.11537170410156, -54.518089294433594, -50.920806884765625, -47.323524475097656, -43.72624206542969, -40.12895965576172, -36.53167724609375, -32.93439483642578, -29.337112426757812, -25.739830017089844, -22.142547607421875, -18.545265197753906, -14.947982788085938, -11.350700378417969, -7.75341796875, -4.156135559082031, -0.5588531494140625, 3.0384292602539062, 6.635711669921875, 10.232994079589844, 13.830276489257812, 17.42755889892578, 21.02484130859375, 24.62212371826172, 28.219406127929688, 31.816688537597656, 35.413970947265625, 39.011253356933594, 42.60853576660156, 46.20581817626953, 49.8031005859375, 53.400390625, 56.99767303466797, 60.59495544433594, 64.1922378540039, 67.78952026367188, 71.38680267333984, 74.98408508300781, 78.58136749267578, 82.17864990234375, 85.77593231201172, 89.37321472167969, 92.97049713134766, 96.56777954101562, 100.1650619506836, 103.76234436035156, 107.35962677001953, 110.9569091796875, 114.55419158935547, 118.15147399902344, 121.7487564086914, 125.34603881835938, 128.94332885742188, 132.5406036376953, 136.13787841796875, 139.73516845703125, 143.33245849609375, 146.9297332763672, 150.52700805664062, 154.12429809570312, 157.72158813476562, 161.31886291503906, 164.9161376953125, 168.513427734375]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 5.0, 5.0, 11.0, 13.0, 14.0, 23.0, 23.0, 20.0, 25.0, 40.0, 38.0, 46.0, 38.0, 43.0, 35.0, 42.0, 41.0, 36.0, 37.0, 45.0, 37.0, 29.0, 47.0, 39.0, 41.0, 23.0, 37.0, 31.0, 16.0, 18.0, 19.0, 13.0, 15.0, 5.0, 6.0, 6.0, 1.0, 8.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.798030853271484, -40.31563949584961, -38.83324432373047, -37.350852966308594, -35.86846160888672, -34.38606643676758, -32.9036750793457, -31.421281814575195, -29.938888549804688, -28.45649528503418, -26.974102020263672, -25.491710662841797, -24.00931739807129, -22.52692413330078, -21.044532775878906, -19.5621395111084, -18.07974624633789, -16.597352981567383, -15.114960670471191, -13.632568359375, -12.150175094604492, -10.667781829833984, -9.185389518737793, -7.702997207641602, -6.220603942871094, -4.738211154937744, -3.2558183670043945, -1.773425579071045, -0.2910327911376953, 1.1913599967956543, 2.673752784729004, 4.156145095825195, 5.6385345458984375, 7.120927333831787, 8.603320121765137, 10.085712432861328, 11.568105697631836, 13.050498962402344, 14.532891273498535, 16.015283584594727, 17.497676849365234, 18.980070114135742, 20.46246337890625, 21.944854736328125, 23.427248001098633, 24.90964126586914, 26.392032623291016, 27.874425888061523, 29.35681915283203, 30.83921241760254, 32.32160568237305, 33.80399703979492, 35.28639221191406, 36.76878356933594, 38.25117492675781, 39.73356628417969, 41.21596145629883, 42.6983528137207, 44.180747985839844, 45.66313934326172, 47.145530700683594, 48.627925872802734, 50.11031723022461, 51.59271240234375, 53.075103759765625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 9.0, 16.0, 16.0, 21.0, 29.0, 19.0, 32.0, 26.0, 30.0, 43.0, 40.0, 43.0, 55.0, 45.0, 51.0, 47.0, 40.0, 47.0, 48.0, 49.0, 49.0, 44.0, 41.0, 26.0, 21.0, 20.0, 18.0, 17.0, 9.0, 7.0, 6.0, 8.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23828125, -6.00091552734375, -5.7635498046875, -5.52618408203125, -5.288818359375, -5.05145263671875, -4.8140869140625, -4.57672119140625, -4.33935546875, -4.10198974609375, -3.8646240234375, -3.62725830078125, -3.389892578125, -3.15252685546875, -2.9151611328125, -2.67779541015625, -2.4404296875, -2.20306396484375, -1.9656982421875, -1.72833251953125, -1.490966796875, -1.25360107421875, -1.0162353515625, -0.77886962890625, -0.54150390625, -0.30413818359375, -0.0667724609375, 0.17059326171875, 0.407958984375, 0.64532470703125, 0.8826904296875, 1.12005615234375, 1.357421875, 1.59478759765625, 1.8321533203125, 2.06951904296875, 2.306884765625, 2.54425048828125, 2.7816162109375, 3.01898193359375, 3.25634765625, 3.49371337890625, 3.7310791015625, 3.96844482421875, 4.205810546875, 4.44317626953125, 4.6805419921875, 4.91790771484375, 5.1552734375, 5.39263916015625, 5.6300048828125, 5.86737060546875, 6.104736328125, 6.34210205078125, 6.5794677734375, 6.81683349609375, 7.05419921875, 7.29156494140625, 7.5289306640625, 7.76629638671875, 8.003662109375, 8.24102783203125, 8.4783935546875, 8.71575927734375, 8.953125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 11.0, 12.0, 14.0, 23.0, 27.0, 38.0, 69.0, 115.0, 151.0, 275.0, 405.0, 575.0, 915.0, 1386.0, 2194.0, 3567.0, 5657.0, 9291.0, 15690.0, 27599.0, 50153.0, 97708.0, 199116.0, 303194.0, 154760.0, 77853.0, 40840.0, 22822.0, 13064.0, 7895.0, 4761.0, 2991.0, 1853.0, 1250.0, 811.0, 506.0, 341.0, 198.0, 140.0, 97.0, 61.0, 44.0, 24.0, 15.0, 10.0, 8.0, 8.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.3564453125, -1.3157501220703125, -1.275054931640625, -1.2343597412109375, -1.19366455078125, -1.1529693603515625, -1.112274169921875, -1.0715789794921875, -1.0308837890625, -0.9901885986328125, -0.949493408203125, -0.9087982177734375, -0.86810302734375, -0.8274078369140625, -0.786712646484375, -0.7460174560546875, -0.705322265625, -0.6646270751953125, -0.623931884765625, -0.5832366943359375, -0.54254150390625, -0.5018463134765625, -0.461151123046875, -0.4204559326171875, -0.3797607421875, -0.3390655517578125, -0.298370361328125, -0.2576751708984375, -0.21697998046875, -0.1762847900390625, -0.135589599609375, -0.0948944091796875, -0.05419921875, -0.0135040283203125, 0.027191162109375, 0.0678863525390625, 0.10858154296875, 0.1492767333984375, 0.189971923828125, 0.2306671142578125, 0.2713623046875, 0.3120574951171875, 0.352752685546875, 0.3934478759765625, 0.43414306640625, 0.4748382568359375, 0.515533447265625, 0.5562286376953125, 0.596923828125, 0.6376190185546875, 0.678314208984375, 0.7190093994140625, 0.75970458984375, 0.8003997802734375, 0.841094970703125, 0.8817901611328125, 0.9224853515625, 0.9631805419921875, 1.003875732421875, 1.0445709228515625, 1.08526611328125, 1.1259613037109375, 1.166656494140625, 1.2073516845703125, 1.248046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 7.0, 7.0, 9.0, 8.0, 6.0, 6.0, 8.0, 13.0, 11.0, 17.0, 24.0, 21.0, 26.0, 37.0, 32.0, 30.0, 41.0, 39.0, 24.0, 42.0, 44.0, 1070.0, 47.0, 39.0, 44.0, 33.0, 23.0, 34.0, 24.0, 31.0, 32.0, 22.0, 21.0, 23.0, 19.0, 19.0, 18.0, 19.0, 7.0, 8.0, 3.0, 7.0, 5.0, 7.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.1484375, -4.02978515625, -3.9111328125, -3.79248046875, -3.673828125, -3.55517578125, -3.4365234375, -3.31787109375, -3.19921875, -3.08056640625, -2.9619140625, -2.84326171875, -2.724609375, -2.60595703125, -2.4873046875, -2.36865234375, -2.25, -2.13134765625, -2.0126953125, -1.89404296875, -1.775390625, -1.65673828125, -1.5380859375, -1.41943359375, -1.30078125, -1.18212890625, -1.0634765625, -0.94482421875, -0.826171875, -0.70751953125, -0.5888671875, -0.47021484375, -0.3515625, -0.23291015625, -0.1142578125, 0.00439453125, 0.123046875, 0.24169921875, 0.3603515625, 0.47900390625, 0.59765625, 0.71630859375, 0.8349609375, 0.95361328125, 1.072265625, 1.19091796875, 1.3095703125, 1.42822265625, 1.546875, 1.66552734375, 1.7841796875, 1.90283203125, 2.021484375, 2.14013671875, 2.2587890625, 2.37744140625, 2.49609375, 2.61474609375, 2.7333984375, 2.85205078125, 2.970703125, 3.08935546875, 3.2080078125, 3.32666015625, 3.4453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 10.0, 13.0, 22.0, 36.0, 55.0, 72.0, 94.0, 130.0, 254.0, 321.0, 441.0, 669.0, 996.0, 1595.0, 2389.0, 3790.0, 5969.0, 9544.0, 15855.0, 26487.0, 45610.0, 81842.0, 164397.0, 1359123.0, 173150.0, 85336.0, 47460.0, 27647.0, 16389.0, 10112.0, 6175.0, 3981.0, 2612.0, 1520.0, 946.0, 701.0, 420.0, 322.0, 201.0, 149.0, 97.0, 65.0, 45.0, 28.0, 17.0, 17.0, 8.0, 8.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0947265625, -1.0576629638671875, -1.020599365234375, -0.9835357666015625, -0.94647216796875, -0.9094085693359375, -0.872344970703125, -0.8352813720703125, -0.7982177734375, -0.7611541748046875, -0.724090576171875, -0.6870269775390625, -0.64996337890625, -0.6128997802734375, -0.575836181640625, -0.5387725830078125, -0.501708984375, -0.4646453857421875, -0.427581787109375, -0.3905181884765625, -0.35345458984375, -0.3163909912109375, -0.279327392578125, -0.2422637939453125, -0.2052001953125, -0.1681365966796875, -0.131072998046875, -0.0940093994140625, -0.05694580078125, -0.0198822021484375, 0.017181396484375, 0.0542449951171875, 0.09130859375, 0.1283721923828125, 0.165435791015625, 0.2024993896484375, 0.23956298828125, 0.2766265869140625, 0.313690185546875, 0.3507537841796875, 0.3878173828125, 0.4248809814453125, 0.461944580078125, 0.4990081787109375, 0.53607177734375, 0.5731353759765625, 0.610198974609375, 0.6472625732421875, 0.684326171875, 0.7213897705078125, 0.758453369140625, 0.7955169677734375, 0.83258056640625, 0.8696441650390625, 0.906707763671875, 0.9437713623046875, 0.9808349609375, 1.0178985595703125, 1.054962158203125, 1.0920257568359375, 1.12908935546875, 1.1661529541015625, 1.203216552734375, 1.2402801513671875, 1.27734375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 8.0, 5.0, 12.0, 4.0, 10.0, 4.0, 9.0, 21.0, 16.0, 23.0, 27.0, 40.0, 50.0, 58.0, 56.0, 78.0, 64.0, 71.0, 67.0, 64.0, 48.0, 48.0, 45.0, 32.0, 32.0, 29.0, 14.0, 14.0, 11.0, 13.0, 6.0, 6.0, 7.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0011653900146484375, -0.0011281222105026245, -0.0010908544063568115, -0.0010535866022109985, -0.0010163187980651855, -0.0009790509939193726, -0.0009417831897735596, -0.0009045153856277466, -0.0008672475814819336, -0.0008299797773361206, -0.0007927119731903076, -0.0007554441690444946, -0.0007181763648986816, -0.0006809085607528687, -0.0006436407566070557, -0.0006063729524612427, -0.0005691051483154297, -0.0005318373441696167, -0.0004945695400238037, -0.0004573017358779907, -0.00042003393173217773, -0.00038276612758636475, -0.00034549832344055176, -0.00030823051929473877, -0.0002709627151489258, -0.0002336949110031128, -0.0001964271068572998, -0.00015915930271148682, -0.00012189149856567383, -8.462369441986084e-05, -4.735589027404785e-05, -1.0088086128234863e-05, 2.7179718017578125e-05, 6.444752216339111e-05, 0.0001017153263092041, 0.0001389831304550171, 0.00017625093460083008, 0.00021351873874664307, 0.00025078654289245605, 0.00028805434703826904, 0.00032532215118408203, 0.000362589955329895, 0.000399857759475708, 0.000437125563621521, 0.000474393367767334, 0.000511661171913147, 0.00054892897605896, 0.000586196780204773, 0.0006234645843505859, 0.0006607323884963989, 0.0006980001926422119, 0.0007352679967880249, 0.0007725358009338379, 0.0008098036050796509, 0.0008470714092254639, 0.0008843392133712769, 0.0009216070175170898, 0.0009588748216629028, 0.0009961426258087158, 0.0010334104299545288, 0.0010706782341003418, 0.0011079460382461548, 0.0011452138423919678, 0.0011824816465377808, 0.0012197494506835938]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 6.0, 12.0, 9.0, 16.0, 19.0, 25.0, 23.0, 42.0, 49.0, 81.0, 121.0, 189.0, 315.0, 1012.0, 87977.0, 955133.0, 2323.0, 474.0, 251.0, 149.0, 98.0, 51.0, 30.0, 31.0, 28.0, 18.0, 10.0, 22.0, 5.0, 6.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0280303955078125, -0.02721095085144043, -0.02639150619506836, -0.02557206153869629, -0.02475261688232422, -0.02393317222595215, -0.023113727569580078, -0.022294282913208008, -0.021474838256835938, -0.020655393600463867, -0.019835948944091797, -0.019016504287719727, -0.018197059631347656, -0.017377614974975586, -0.016558170318603516, -0.015738725662231445, -0.014919281005859375, -0.014099836349487305, -0.013280391693115234, -0.012460947036743164, -0.011641502380371094, -0.010822057723999023, -0.010002613067626953, -0.009183168411254883, -0.008363723754882812, -0.007544279098510742, -0.006724834442138672, -0.0059053897857666016, -0.005085945129394531, -0.004266500473022461, -0.0034470558166503906, -0.0026276111602783203, -0.00180816650390625, -0.0009887218475341797, -0.00016927719116210938, 0.0006501674652099609, 0.0014696121215820312, 0.0022890567779541016, 0.003108501434326172, 0.003927946090698242, 0.0047473907470703125, 0.005566835403442383, 0.006386280059814453, 0.0072057247161865234, 0.008025169372558594, 0.008844614028930664, 0.009664058685302734, 0.010483503341674805, 0.011302947998046875, 0.012122392654418945, 0.012941837310791016, 0.013761281967163086, 0.014580726623535156, 0.015400171279907227, 0.016219615936279297, 0.017039060592651367, 0.017858505249023438, 0.018677949905395508, 0.019497394561767578, 0.02031683921813965, 0.02113628387451172, 0.02195572853088379, 0.02277517318725586, 0.02359461784362793, 0.0244140625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 23.0, 44.0, 106.0, 175.0, 204.0, 192.0, 121.0, 83.0, 33.0, 12.0, 9.0, 1.0, 1.0, 2.0], "bins": [-0.002360305516049266, -0.0023171992506831884, -0.002274092985317111, -0.0022309869527816772, -0.0021878806874156, -0.0021447744220495224, -0.002101668156683445, -0.0020585618913173676, -0.00201545562595129, -0.0019723493605852127, -0.0019292432116344571, -0.0018861369462683797, -0.0018430306809023023, -0.0017999245319515467, -0.0017568182665854692, -0.0017137120012193918, -0.0016706058522686362, -0.0016274995869025588, -0.0015843934379518032, -0.0015412871725857258, -0.0014981809072196484, -0.001455074641853571, -0.0014119684929028153, -0.001368862227536738, -0.0013257560785859823, -0.001282649813219905, -0.0012395436642691493, -0.0011964373989030719, -0.0011533311335369945, -0.0011102249845862389, -0.0010671187192201614, -0.001024012453854084, -0.0009809061884880066, -0.0009377999813295901, -0.0008946937159635127, -0.0008515875088050961, -0.0008084812434390187, -0.0007653750362806022, -0.0007222688291221857, -0.0006791625637561083, -0.0006360564148053527, -0.0005929502076469362, -0.0005498439422808588, -0.0005067377351224422, -0.0004636314988601953, -0.0004205252625979483, -0.0003774190554395318, -0.00033431281917728484, -0.0002912065538112074, -0.00024810031754896045, -0.0002049940958386287, -0.00016188787412829697, -0.00011878163786605, -7.567540160380304e-05, -3.256919444538653e-05, 1.0537041816860437e-05, 5.3643278079107404e-05, 9.674950706539676e-05, 0.0001398557360516861, 0.00018296195776201785, 0.0002260681940242648, 0.0002691744302865118, 0.0003122806374449283, 0.00035538687370717525, 0.0003984931099694222]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 8.0, 8.0, 18.0, 7.0, 16.0, 19.0, 29.0, 20.0, 26.0, 33.0, 21.0, 27.0, 31.0, 38.0, 44.0, 32.0, 49.0, 53.0, 44.0, 50.0, 49.0, 44.0, 39.0, 31.0, 41.0, 26.0, 38.0, 25.0, 29.0, 16.0, 15.0, 9.0, 7.0, 16.0, 13.0, 3.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006132721900939941, -0.0005948934704065323, -0.0005765147507190704, -0.0005581360310316086, -0.0005397573113441467, -0.0005213785916566849, -0.000502999871969223, -0.00048462115228176117, -0.0004662424325942993, -0.00044786371290683746, -0.0004294849932193756, -0.00041110627353191376, -0.0003927275538444519, -0.00037434883415699005, -0.0003559701144695282, -0.00033759139478206635, -0.0003192126750946045, -0.00030083395540714264, -0.0002824552357196808, -0.00026407651603221893, -0.0002456977963447571, -0.00022731907665729523, -0.00020894035696983337, -0.00019056163728237152, -0.00017218291759490967, -0.00015380419790744781, -0.00013542547821998596, -0.00011704675853252411, -9.866803884506226e-05, -8.02893191576004e-05, -6.191059947013855e-05, -4.35318797826767e-05, -2.5153160095214844e-05, -6.774440407752991e-06, 1.1604279279708862e-05, 2.9982998967170715e-05, 4.836171865463257e-05, 6.674043834209442e-05, 8.511915802955627e-05, 0.00010349787771701813, 0.00012187659740447998, 0.00014025531709194183, 0.0001586340367794037, 0.00017701275646686554, 0.0001953914761543274, 0.00021377019584178925, 0.0002321489155292511, 0.00025052763521671295, 0.0002689063549041748, 0.00028728507459163666, 0.0003056637942790985, 0.00032404251396656036, 0.0003424212336540222, 0.00036079995334148407, 0.0003791786730289459, 0.0003975573927164078, 0.00041593611240386963, 0.0004343148320913315, 0.00045269355177879333, 0.0004710722714662552, 0.000489450991153717, 0.0005078297108411789, 0.0005262084305286407, 0.0005445871502161026, 0.0005629658699035645]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 9.0, 16.0, 16.0, 21.0, 29.0, 19.0, 32.0, 26.0, 30.0, 43.0, 40.0, 43.0, 55.0, 45.0, 51.0, 47.0, 40.0, 47.0, 48.0, 49.0, 49.0, 44.0, 41.0, 26.0, 21.0, 20.0, 18.0, 17.0, 9.0, 7.0, 6.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23828125, -6.00091552734375, -5.7635498046875, -5.52618408203125, -5.288818359375, -5.05145263671875, -4.8140869140625, -4.57672119140625, -4.33935546875, -4.10198974609375, -3.8646240234375, -3.62725830078125, -3.389892578125, -3.15252685546875, -2.9151611328125, -2.67779541015625, -2.4404296875, -2.20306396484375, -1.9656982421875, -1.72833251953125, -1.490966796875, -1.25360107421875, -1.0162353515625, -0.77886962890625, -0.54150390625, -0.30413818359375, -0.0667724609375, 0.17059326171875, 0.407958984375, 0.64532470703125, 0.8826904296875, 1.12005615234375, 1.357421875, 1.59478759765625, 1.8321533203125, 2.06951904296875, 2.306884765625, 2.54425048828125, 2.7816162109375, 3.01898193359375, 3.25634765625, 3.49371337890625, 3.7310791015625, 3.96844482421875, 4.205810546875, 4.44317626953125, 4.6805419921875, 4.91790771484375, 5.1552734375, 5.39263916015625, 5.6300048828125, 5.86737060546875, 6.104736328125, 6.34210205078125, 6.5794677734375, 6.81683349609375, 7.05419921875, 7.29156494140625, 7.5289306640625, 7.76629638671875, 8.003662109375, 8.24102783203125, 8.4783935546875, 8.71575927734375, 8.953125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 10.0, 11.0, 23.0, 26.0, 29.0, 62.0, 95.0, 109.0, 203.0, 256.0, 408.0, 737.0, 1333.0, 2629.0, 5308.0, 11750.0, 28325.0, 71822.0, 178706.0, 358488.0, 230408.0, 92751.0, 36583.0, 14950.0, 6573.0, 3196.0, 1599.0, 819.0, 489.0, 261.0, 203.0, 127.0, 87.0, 48.0, 39.0, 11.0, 27.0, 15.0, 13.0, 13.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.84375, -5.63970947265625, -5.4356689453125, -5.23162841796875, -5.027587890625, -4.82354736328125, -4.6195068359375, -4.41546630859375, -4.21142578125, -4.00738525390625, -3.8033447265625, -3.59930419921875, -3.395263671875, -3.19122314453125, -2.9871826171875, -2.78314208984375, -2.5791015625, -2.37506103515625, -2.1710205078125, -1.96697998046875, -1.762939453125, -1.55889892578125, -1.3548583984375, -1.15081787109375, -0.94677734375, -0.74273681640625, -0.5386962890625, -0.33465576171875, -0.130615234375, 0.07342529296875, 0.2774658203125, 0.48150634765625, 0.685546875, 0.88958740234375, 1.0936279296875, 1.29766845703125, 1.501708984375, 1.70574951171875, 1.9097900390625, 2.11383056640625, 2.31787109375, 2.52191162109375, 2.7259521484375, 2.92999267578125, 3.134033203125, 3.33807373046875, 3.5421142578125, 3.74615478515625, 3.9501953125, 4.15423583984375, 4.3582763671875, 4.56231689453125, 4.766357421875, 4.97039794921875, 5.1744384765625, 5.37847900390625, 5.58251953125, 5.78656005859375, 5.9906005859375, 6.19464111328125, 6.398681640625, 6.60272216796875, 6.8067626953125, 7.01080322265625, 7.21484375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 6.0, 4.0, 15.0, 12.0, 18.0, 18.0, 30.0, 26.0, 27.0, 19.0, 33.0, 34.0, 30.0, 54.0, 49.0, 86.0, 162.0, 867.0, 912.0, 153.0, 82.0, 54.0, 51.0, 34.0, 53.0, 23.0, 28.0, 24.0, 22.0, 12.0, 16.0, 14.0, 17.0, 7.0, 9.0, 9.0, 11.0, 2.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.703125, -21.02490234375, -20.3466796875, -19.66845703125, -18.990234375, -18.31201171875, -17.6337890625, -16.95556640625, -16.27734375, -15.59912109375, -14.9208984375, -14.24267578125, -13.564453125, -12.88623046875, -12.2080078125, -11.52978515625, -10.8515625, -10.17333984375, -9.4951171875, -8.81689453125, -8.138671875, -7.46044921875, -6.7822265625, -6.10400390625, -5.42578125, -4.74755859375, -4.0693359375, -3.39111328125, -2.712890625, -2.03466796875, -1.3564453125, -0.67822265625, 0.0, 0.67822265625, 1.3564453125, 2.03466796875, 2.712890625, 3.39111328125, 4.0693359375, 4.74755859375, 5.42578125, 6.10400390625, 6.7822265625, 7.46044921875, 8.138671875, 8.81689453125, 9.4951171875, 10.17333984375, 10.8515625, 11.52978515625, 12.2080078125, 12.88623046875, 13.564453125, 14.24267578125, 14.9208984375, 15.59912109375, 16.27734375, 16.95556640625, 17.6337890625, 18.31201171875, 18.990234375, 19.66845703125, 20.3466796875, 21.02490234375, 21.703125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 6.0, 6.0, 12.0, 15.0, 5.0, 23.0, 43.0, 52.0, 74.0, 99.0, 184.0, 374.0, 809.0, 28834.0, 3111535.0, 2343.0, 519.0, 280.0, 169.0, 98.0, 71.0, 41.0, 28.0, 20.0, 11.0, 10.0, 6.0, 10.0, 7.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.9375, -116.33203125, -112.7265625, -109.12109375, -105.515625, -101.91015625, -98.3046875, -94.69921875, -91.09375, -87.48828125, -83.8828125, -80.27734375, -76.671875, -73.06640625, -69.4609375, -65.85546875, -62.25, -58.64453125, -55.0390625, -51.43359375, -47.828125, -44.22265625, -40.6171875, -37.01171875, -33.40625, -29.80078125, -26.1953125, -22.58984375, -18.984375, -15.37890625, -11.7734375, -8.16796875, -4.5625, -0.95703125, 2.6484375, 6.25390625, 9.859375, 13.46484375, 17.0703125, 20.67578125, 24.28125, 27.88671875, 31.4921875, 35.09765625, 38.703125, 42.30859375, 45.9140625, 49.51953125, 53.125, 56.73046875, 60.3359375, 63.94140625, 67.546875, 71.15234375, 74.7578125, 78.36328125, 81.96875, 85.57421875, 89.1796875, 92.78515625, 96.390625, 99.99609375, 103.6015625, 107.20703125, 110.8125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 9.0, 21.0, 32.0, 47.0, 77.0, 121.0, 136.0, 154.0, 125.0, 102.0, 83.0, 49.0, 24.0, 13.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.249046325683594, -46.18189239501953, -45.114742279052734, -44.04758834838867, -42.98043441772461, -41.91328048706055, -40.84613037109375, -39.77897644042969, -38.711822509765625, -37.64466857910156, -36.577518463134766, -35.5103645324707, -34.44321060180664, -33.37605667114258, -32.30890655517578, -31.24175262451172, -30.17460060119629, -29.10744857788086, -28.040294647216797, -26.973142623901367, -25.905988693237305, -24.838836669921875, -23.771682739257812, -22.704530715942383, -21.637378692626953, -20.570226669311523, -19.50307273864746, -18.43592071533203, -17.36876678466797, -16.30161476135254, -15.234461784362793, -14.167308807373047, -13.100154876708984, -12.033001899719238, -10.965848922729492, -9.898696899414062, -8.83154296875, -7.764390468597412, -6.697237968444824, -5.630084991455078, -4.562932014465332, -3.495779037475586, -2.428626298904419, -1.361473560333252, -0.29432058334350586, 0.7728323936462402, 1.8399848937988281, 2.907137870788574, 3.9742908477783203, 5.041443824768066, 6.1085968017578125, 7.1757493019104, 8.242902755737305, 9.310054779052734, 10.37720775604248, 11.444360733032227, 12.511513710021973, 13.578666687011719, 14.645819664001465, 15.712972640991211, 16.78012466430664, 17.847278594970703, 18.914430618286133, 19.981582641601562, 21.048736572265625]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 10.0, 8.0, 9.0, 14.0, 14.0, 17.0, 24.0, 13.0, 24.0, 15.0, 23.0, 34.0, 32.0, 29.0, 31.0, 35.0, 35.0, 30.0, 32.0, 30.0, 55.0, 50.0, 34.0, 37.0, 28.0, 30.0, 36.0, 28.0, 31.0, 27.0, 29.0, 17.0, 22.0, 9.0, 14.0, 13.0, 14.0, 7.0, 13.0, 5.0, 4.0, 8.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0], "bins": [-52.8168830871582, -51.34181213378906, -49.86674118041992, -48.39167022705078, -46.916595458984375, -45.441524505615234, -43.966453552246094, -42.49138259887695, -41.01631164550781, -39.54124069213867, -38.06616973876953, -36.591094970703125, -35.116024017333984, -33.640953063964844, -32.1658821105957, -30.690811157226562, -29.215736389160156, -27.740665435791016, -26.265592575073242, -24.7905216217041, -23.315448760986328, -21.840377807617188, -20.365306854248047, -18.890235900878906, -17.415163040161133, -15.940091133117676, -14.465019226074219, -12.989948272705078, -11.514876365661621, -10.039804458618164, -8.564733505249023, -7.089661598205566, -5.614585876464844, -4.139513969421387, -2.664442539215088, -1.189371109008789, 0.28570079803466797, 1.760772705078125, 3.2358436584472656, 4.710915565490723, 6.18598747253418, 7.661059379577637, 9.136131286621094, 10.611202239990234, 12.086274147033691, 13.561346054077148, 15.036417007446289, 16.511489868164062, 17.986560821533203, 19.461631774902344, 20.936704635620117, 22.411775588989258, 23.88684844970703, 25.361919403076172, 26.836990356445312, 28.312061309814453, 29.787134170532227, 31.262205123901367, 32.73727798461914, 34.21234893798828, 35.68741989135742, 37.16249084472656, 38.63756561279297, 40.11263656616211, 41.58770751953125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 5.0, 6.0, 12.0, 9.0, 17.0, 16.0, 21.0, 27.0, 27.0, 24.0, 28.0, 27.0, 36.0, 47.0, 45.0, 52.0, 43.0, 58.0, 40.0, 53.0, 47.0, 49.0, 39.0, 45.0, 40.0, 33.0, 26.0, 25.0, 16.0, 20.0, 23.0, 9.0, 6.0, 4.0, 8.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30859375, -6.05572509765625, -5.8028564453125, -5.54998779296875, -5.297119140625, -5.04425048828125, -4.7913818359375, -4.53851318359375, -4.28564453125, -4.03277587890625, -3.7799072265625, -3.52703857421875, -3.274169921875, -3.02130126953125, -2.7684326171875, -2.51556396484375, -2.2626953125, -2.00982666015625, -1.7569580078125, -1.50408935546875, -1.251220703125, -0.99835205078125, -0.7454833984375, -0.49261474609375, -0.23974609375, 0.01312255859375, 0.2659912109375, 0.51885986328125, 0.771728515625, 1.02459716796875, 1.2774658203125, 1.53033447265625, 1.783203125, 2.03607177734375, 2.2889404296875, 2.54180908203125, 2.794677734375, 3.04754638671875, 3.3004150390625, 3.55328369140625, 3.80615234375, 4.05902099609375, 4.3118896484375, 4.56475830078125, 4.817626953125, 5.07049560546875, 5.3233642578125, 5.57623291015625, 5.8291015625, 6.08197021484375, 6.3348388671875, 6.58770751953125, 6.840576171875, 7.09344482421875, 7.3463134765625, 7.59918212890625, 7.85205078125, 8.10491943359375, 8.3577880859375, 8.61065673828125, 8.863525390625, 9.11639404296875, 9.3692626953125, 9.62213134765625, 9.875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 2.0, 4.0, 5.0, 5.0, 9.0, 13.0, 12.0, 25.0, 32.0, 25.0, 36.0, 60.0, 84.0, 114.0, 205.0, 387.0, 1270.0, 9710.0, 210004.0, 2385536.0, 1500495.0, 79909.0, 4586.0, 871.0, 321.0, 202.0, 99.0, 63.0, 44.0, 37.0, 16.0, 17.0, 19.0, 19.0, 12.0, 9.0, 8.0, 5.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.53125, -14.952880859375, -14.37451171875, -13.796142578125, -13.2177734375, -12.639404296875, -12.06103515625, -11.482666015625, -10.904296875, -10.325927734375, -9.74755859375, -9.169189453125, -8.5908203125, -8.012451171875, -7.43408203125, -6.855712890625, -6.27734375, -5.698974609375, -5.12060546875, -4.542236328125, -3.9638671875, -3.385498046875, -2.80712890625, -2.228759765625, -1.650390625, -1.072021484375, -0.49365234375, 0.084716796875, 0.6630859375, 1.241455078125, 1.81982421875, 2.398193359375, 2.9765625, 3.554931640625, 4.13330078125, 4.711669921875, 5.2900390625, 5.868408203125, 6.44677734375, 7.025146484375, 7.603515625, 8.181884765625, 8.76025390625, 9.338623046875, 9.9169921875, 10.495361328125, 11.07373046875, 11.652099609375, 12.23046875, 12.808837890625, 13.38720703125, 13.965576171875, 14.5439453125, 15.122314453125, 15.70068359375, 16.279052734375, 16.857421875, 17.435791015625, 18.01416015625, 18.592529296875, 19.1708984375, 19.749267578125, 20.32763671875, 20.906005859375, 21.484375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 10.0, 9.0, 15.0, 20.0, 28.0, 43.0, 52.0, 95.0, 115.0, 157.0, 219.0, 240.0, 355.0, 392.0, 426.0, 447.0, 354.0, 288.0, 215.0, 154.0, 126.0, 81.0, 57.0, 41.0, 43.0, 26.0, 14.0, 10.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6796875, -14.2420654296875, -13.804443359375, -13.3668212890625, -12.92919921875, -12.4915771484375, -12.053955078125, -11.6163330078125, -11.1787109375, -10.7410888671875, -10.303466796875, -9.8658447265625, -9.42822265625, -8.9906005859375, -8.552978515625, -8.1153564453125, -7.677734375, -7.2401123046875, -6.802490234375, -6.3648681640625, -5.92724609375, -5.4896240234375, -5.052001953125, -4.6143798828125, -4.1767578125, -3.7391357421875, -3.301513671875, -2.8638916015625, -2.42626953125, -1.9886474609375, -1.551025390625, -1.1134033203125, -0.67578125, -0.2381591796875, 0.199462890625, 0.6370849609375, 1.07470703125, 1.5123291015625, 1.949951171875, 2.3875732421875, 2.8251953125, 3.2628173828125, 3.700439453125, 4.1380615234375, 4.57568359375, 5.0133056640625, 5.450927734375, 5.8885498046875, 6.326171875, 6.7637939453125, 7.201416015625, 7.6390380859375, 8.07666015625, 8.5142822265625, 8.951904296875, 9.3895263671875, 9.8271484375, 10.2647705078125, 10.702392578125, 11.1400146484375, 11.57763671875, 12.0152587890625, 12.452880859375, 12.8905029296875, 13.328125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 4.0, 11.0, 5.0, 15.0, 29.0, 46.0, 40.0, 74.0, 84.0, 125.0, 156.0, 201.0, 314.0, 482.0, 933.0, 21212.0, 3381175.0, 783170.0, 4114.0, 666.0, 371.0, 274.0, 201.0, 150.0, 115.0, 85.0, 66.0, 36.0, 30.0, 24.0, 13.0, 14.0, 13.0, 5.0, 9.0, 1.0, 5.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.03125, -44.53759765625, -43.0439453125, -41.55029296875, -40.056640625, -38.56298828125, -37.0693359375, -35.57568359375, -34.08203125, -32.58837890625, -31.0947265625, -29.60107421875, -28.107421875, -26.61376953125, -25.1201171875, -23.62646484375, -22.1328125, -20.63916015625, -19.1455078125, -17.65185546875, -16.158203125, -14.66455078125, -13.1708984375, -11.67724609375, -10.18359375, -8.68994140625, -7.1962890625, -5.70263671875, -4.208984375, -2.71533203125, -1.2216796875, 0.27197265625, 1.765625, 3.25927734375, 4.7529296875, 6.24658203125, 7.740234375, 9.23388671875, 10.7275390625, 12.22119140625, 13.71484375, 15.20849609375, 16.7021484375, 18.19580078125, 19.689453125, 21.18310546875, 22.6767578125, 24.17041015625, 25.6640625, 27.15771484375, 28.6513671875, 30.14501953125, 31.638671875, 33.13232421875, 34.6259765625, 36.11962890625, 37.61328125, 39.10693359375, 40.6005859375, 42.09423828125, 43.587890625, 45.08154296875, 46.5751953125, 48.06884765625, 49.5625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 12.0, 16.0, 38.0, 32.0, 42.0, 51.0, 62.0, 78.0, 99.0, 82.0, 101.0, 92.0, 80.0, 63.0, 55.0, 32.0, 23.0, 14.0, 12.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.646728515625, -47.197303771972656, -45.74788284301758, -44.298458099365234, -42.84903335571289, -41.39961242675781, -39.95018768310547, -38.500762939453125, -37.05133819580078, -35.60191345214844, -34.15249252319336, -32.703067779541016, -31.253643035888672, -29.80422019958496, -28.35479736328125, -26.905372619628906, -25.455951690673828, -24.006528854370117, -22.557104110717773, -21.107681274414062, -19.65825653076172, -18.208833694458008, -16.759410858154297, -15.30998706817627, -13.860563278198242, -12.411139488220215, -10.961715698242188, -9.512292861938477, -8.06286907196045, -6.613445281982422, -5.164022445678711, -3.7145986557006836, -2.265178680419922, -0.8157551288604736, 0.6336684226989746, 2.0830917358398438, 3.532515525817871, 4.981939315795898, 6.431362152099609, 7.880785942077637, 9.330209732055664, 10.779633522033691, 12.229057312011719, 13.67848014831543, 15.127903938293457, 16.577327728271484, 18.026750564575195, 19.476173400878906, 20.92559814453125, 22.37502098083496, 23.824445724487305, 25.273868560791016, 26.72329330444336, 28.17271614074707, 29.62213897705078, 31.071563720703125, 32.52098846435547, 33.97041320800781, 35.41983413696289, 36.869258880615234, 38.31868362426758, 39.768104553222656, 41.217529296875, 42.666954040527344, 44.11637496948242]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 10.0, 12.0, 11.0, 15.0, 11.0, 14.0, 13.0, 22.0, 16.0, 26.0, 12.0, 24.0, 30.0, 29.0, 21.0, 30.0, 26.0, 39.0, 39.0, 40.0, 39.0, 42.0, 26.0, 37.0, 36.0, 26.0, 33.0, 29.0, 29.0, 26.0, 24.0, 35.0, 23.0, 27.0, 19.0, 14.0, 17.0, 14.0, 9.0, 11.0, 11.0, 7.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.9444465637207, -36.71249008178711, -35.480533599853516, -34.24857711791992, -33.01662063598633, -31.784664154052734, -30.55270767211914, -29.320751190185547, -28.088794708251953, -26.85683822631836, -25.624881744384766, -24.392925262451172, -23.160968780517578, -21.929012298583984, -20.69705581665039, -19.465099334716797, -18.233142852783203, -17.00118637084961, -15.769229888916016, -14.537273406982422, -13.305316925048828, -12.073360443115234, -10.84140396118164, -9.609447479248047, -8.377490997314453, -7.145534515380859, -5.913578033447266, -4.681621551513672, -3.449665069580078, -2.2177085876464844, -0.9857521057128906, 0.24620437622070312, 1.4781570434570312, 2.710113525390625, 3.9420700073242188, 5.1740264892578125, 6.405982971191406, 7.637939453125, 8.869895935058594, 10.101852416992188, 11.333808898925781, 12.565765380859375, 13.797721862792969, 15.029678344726562, 16.261634826660156, 17.49359130859375, 18.725547790527344, 19.957504272460938, 21.18946075439453, 22.421417236328125, 23.65337371826172, 24.885330200195312, 26.117286682128906, 27.3492431640625, 28.581199645996094, 29.813156127929688, 31.04511260986328, 32.277069091796875, 33.50902557373047, 34.74098205566406, 35.972938537597656, 37.20489501953125, 38.436851501464844, 39.66880798339844, 40.90076446533203]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 10.0, 10.0, 11.0, 14.0, 26.0, 15.0, 25.0, 22.0, 24.0, 40.0, 38.0, 30.0, 49.0, 50.0, 42.0, 51.0, 47.0, 52.0, 52.0, 53.0, 37.0, 45.0, 41.0, 42.0, 33.0, 21.0, 19.0, 18.0, 14.0, 14.0, 12.0, 11.0, 11.0, 2.0, 3.0, 3.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.2928466796875, -6.046630859375, -5.8004150390625, -5.55419921875, -5.3079833984375, -5.061767578125, -4.8155517578125, -4.5693359375, -4.3231201171875, -4.076904296875, -3.8306884765625, -3.58447265625, -3.3382568359375, -3.092041015625, -2.8458251953125, -2.599609375, -2.3533935546875, -2.107177734375, -1.8609619140625, -1.61474609375, -1.3685302734375, -1.122314453125, -0.8760986328125, -0.6298828125, -0.3836669921875, -0.137451171875, 0.1087646484375, 0.35498046875, 0.6011962890625, 0.847412109375, 1.0936279296875, 1.33984375, 1.5860595703125, 1.832275390625, 2.0784912109375, 2.32470703125, 2.5709228515625, 2.817138671875, 3.0633544921875, 3.3095703125, 3.5557861328125, 3.802001953125, 4.0482177734375, 4.29443359375, 4.5406494140625, 4.786865234375, 5.0330810546875, 5.279296875, 5.5255126953125, 5.771728515625, 6.0179443359375, 6.26416015625, 6.5103759765625, 6.756591796875, 7.0028076171875, 7.2490234375, 7.4952392578125, 7.741455078125, 7.9876708984375, 8.23388671875, 8.4801025390625, 8.726318359375, 8.9725341796875, 9.21875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 2.0, 8.0, 8.0, 18.0, 19.0, 28.0, 43.0, 84.0, 124.0, 156.0, 299.0, 424.0, 729.0, 1225.0, 1961.0, 3308.0, 5432.0, 9359.0, 16096.0, 28996.0, 54620.0, 113206.0, 270705.0, 291088.0, 120895.0, 58043.0, 30713.0, 16877.0, 9617.0, 5716.0, 3362.0, 2048.0, 1273.0, 750.0, 494.0, 292.0, 194.0, 118.0, 75.0, 49.0, 29.0, 22.0, 16.0, 8.0, 9.0, 7.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.603515625, -1.5564117431640625, -1.509307861328125, -1.4622039794921875, -1.41510009765625, -1.3679962158203125, -1.320892333984375, -1.2737884521484375, -1.2266845703125, -1.1795806884765625, -1.132476806640625, -1.0853729248046875, -1.03826904296875, -0.9911651611328125, -0.944061279296875, -0.8969573974609375, -0.849853515625, -0.8027496337890625, -0.755645751953125, -0.7085418701171875, -0.66143798828125, -0.6143341064453125, -0.567230224609375, -0.5201263427734375, -0.4730224609375, -0.4259185791015625, -0.378814697265625, -0.3317108154296875, -0.28460693359375, -0.2375030517578125, -0.190399169921875, -0.1432952880859375, -0.09619140625, -0.0490875244140625, -0.001983642578125, 0.0451202392578125, 0.09222412109375, 0.1393280029296875, 0.186431884765625, 0.2335357666015625, 0.2806396484375, 0.3277435302734375, 0.374847412109375, 0.4219512939453125, 0.46905517578125, 0.5161590576171875, 0.563262939453125, 0.6103668212890625, 0.657470703125, 0.7045745849609375, 0.751678466796875, 0.7987823486328125, 0.84588623046875, 0.8929901123046875, 0.940093994140625, 0.9871978759765625, 1.0343017578125, 1.0814056396484375, 1.128509521484375, 1.1756134033203125, 1.22271728515625, 1.2698211669921875, 1.316925048828125, 1.3640289306640625, 1.4111328125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 2.0, 3.0, 7.0, 12.0, 8.0, 13.0, 14.0, 22.0, 15.0, 23.0, 23.0, 28.0, 29.0, 31.0, 38.0, 37.0, 36.0, 42.0, 43.0, 34.0, 35.0, 1052.0, 40.0, 43.0, 38.0, 33.0, 30.0, 42.0, 39.0, 26.0, 28.0, 28.0, 25.0, 19.0, 18.0, 12.0, 8.0, 10.0, 11.0, 8.0, 6.0, 8.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.140625, -4.00750732421875, -3.8743896484375, -3.74127197265625, -3.608154296875, -3.47503662109375, -3.3419189453125, -3.20880126953125, -3.07568359375, -2.94256591796875, -2.8094482421875, -2.67633056640625, -2.543212890625, -2.41009521484375, -2.2769775390625, -2.14385986328125, -2.0107421875, -1.87762451171875, -1.7445068359375, -1.61138916015625, -1.478271484375, -1.34515380859375, -1.2120361328125, -1.07891845703125, -0.94580078125, -0.81268310546875, -0.6795654296875, -0.54644775390625, -0.413330078125, -0.28021240234375, -0.1470947265625, -0.01397705078125, 0.119140625, 0.25225830078125, 0.3853759765625, 0.51849365234375, 0.651611328125, 0.78472900390625, 0.9178466796875, 1.05096435546875, 1.18408203125, 1.31719970703125, 1.4503173828125, 1.58343505859375, 1.716552734375, 1.84967041015625, 1.9827880859375, 2.11590576171875, 2.2490234375, 2.38214111328125, 2.5152587890625, 2.64837646484375, 2.781494140625, 2.91461181640625, 3.0477294921875, 3.18084716796875, 3.31396484375, 3.44708251953125, 3.5802001953125, 3.71331787109375, 3.846435546875, 3.97955322265625, 4.1126708984375, 4.24578857421875, 4.37890625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 7.0, 18.0, 16.0, 21.0, 34.0, 43.0, 60.0, 84.0, 128.0, 172.0, 264.0, 427.0, 609.0, 917.0, 1333.0, 2071.0, 3245.0, 5004.0, 7985.0, 12966.0, 20624.0, 33999.0, 57442.0, 102603.0, 200640.0, 1312789.0, 141778.0, 76024.0, 44303.0, 26684.0, 16497.0, 10143.0, 6448.0, 3945.0, 2572.0, 1673.0, 1138.0, 762.0, 527.0, 343.0, 266.0, 155.0, 113.0, 79.0, 51.0, 37.0, 32.0, 22.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-1.1943359375, -1.1573028564453125, -1.120269775390625, -1.0832366943359375, -1.04620361328125, -1.0091705322265625, -0.972137451171875, -0.9351043701171875, -0.8980712890625, -0.8610382080078125, -0.824005126953125, -0.7869720458984375, -0.74993896484375, -0.7129058837890625, -0.675872802734375, -0.6388397216796875, -0.601806640625, -0.5647735595703125, -0.527740478515625, -0.4907073974609375, -0.45367431640625, -0.4166412353515625, -0.379608154296875, -0.3425750732421875, -0.3055419921875, -0.2685089111328125, -0.231475830078125, -0.1944427490234375, -0.15740966796875, -0.1203765869140625, -0.083343505859375, -0.0463104248046875, -0.00927734375, 0.0277557373046875, 0.064788818359375, 0.1018218994140625, 0.13885498046875, 0.1758880615234375, 0.212921142578125, 0.2499542236328125, 0.2869873046875, 0.3240203857421875, 0.361053466796875, 0.3980865478515625, 0.43511962890625, 0.4721527099609375, 0.509185791015625, 0.5462188720703125, 0.583251953125, 0.6202850341796875, 0.657318115234375, 0.6943511962890625, 0.73138427734375, 0.7684173583984375, 0.805450439453125, 0.8424835205078125, 0.8795166015625, 0.9165496826171875, 0.953582763671875, 0.9906158447265625, 1.02764892578125, 1.0646820068359375, 1.101715087890625, 1.1387481689453125, 1.17578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 13.0, 20.0, 19.0, 26.0, 19.0, 33.0, 38.0, 41.0, 61.0, 75.0, 67.0, 67.0, 67.0, 63.0, 79.0, 61.0, 35.0, 53.0, 32.0, 38.0, 27.0, 22.0, 7.0, 8.0, 3.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00130462646484375, -0.0012714564800262451, -0.0012382864952087402, -0.0012051165103912354, -0.0011719465255737305, -0.0011387765407562256, -0.0011056065559387207, -0.0010724365711212158, -0.001039266586303711, -0.001006096601486206, -0.0009729266166687012, -0.0009397566318511963, -0.0009065866470336914, -0.0008734166622161865, -0.0008402466773986816, -0.0008070766925811768, -0.0007739067077636719, -0.000740736722946167, -0.0007075667381286621, -0.0006743967533111572, -0.0006412267684936523, -0.0006080567836761475, -0.0005748867988586426, -0.0005417168140411377, -0.0005085468292236328, -0.00047537684440612793, -0.00044220685958862305, -0.00040903687477111816, -0.0003758668899536133, -0.0003426969051361084, -0.0003095269203186035, -0.00027635693550109863, -0.00024318695068359375, -0.00021001696586608887, -0.00017684698104858398, -0.0001436769962310791, -0.00011050701141357422, -7.733702659606934e-05, -4.416704177856445e-05, -1.099705696105957e-05, 2.2172927856445312e-05, 5.5342912673950195e-05, 8.851289749145508e-05, 0.00012168288230895996, 0.00015485286712646484, 0.00018802285194396973, 0.0002211928367614746, 0.0002543628215789795, 0.0002875328063964844, 0.00032070279121398926, 0.00035387277603149414, 0.000387042760848999, 0.0004202127456665039, 0.0004533827304840088, 0.00048655271530151367, 0.0005197227001190186, 0.0005528926849365234, 0.0005860626697540283, 0.0006192326545715332, 0.0006524026393890381, 0.000685572624206543, 0.0007187426090240479, 0.0007519125938415527, 0.0007850825786590576, 0.0008182525634765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 12.0, 6.0, 10.0, 23.0, 32.0, 33.0, 58.0, 57.0, 76.0, 127.0, 204.0, 389.0, 1346.0, 159966.0, 881610.0, 3248.0, 551.0, 249.0, 140.0, 98.0, 77.0, 55.0, 39.0, 28.0, 32.0, 20.0, 14.0, 17.0, 7.0, 5.0, 8.0, 5.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01529693603515625, -0.014664053916931152, -0.014031171798706055, -0.013398289680480957, -0.01276540756225586, -0.012132525444030762, -0.011499643325805664, -0.010866761207580566, -0.010233879089355469, -0.009600996971130371, -0.008968114852905273, -0.008335232734680176, -0.007702350616455078, -0.0070694684982299805, -0.006436586380004883, -0.005803704261779785, -0.0051708221435546875, -0.00453794002532959, -0.003905057907104492, -0.0032721757888793945, -0.002639293670654297, -0.0020064115524291992, -0.0013735294342041016, -0.0007406473159790039, -0.00010776519775390625, 0.0005251169204711914, 0.001157999038696289, 0.0017908811569213867, 0.0024237632751464844, 0.003056645393371582, 0.0036895275115966797, 0.004322409629821777, 0.004955291748046875, 0.005588173866271973, 0.00622105598449707, 0.006853938102722168, 0.007486820220947266, 0.008119702339172363, 0.008752584457397461, 0.009385466575622559, 0.010018348693847656, 0.010651230812072754, 0.011284112930297852, 0.01191699504852295, 0.012549877166748047, 0.013182759284973145, 0.013815641403198242, 0.01444852352142334, 0.015081405639648438, 0.015714287757873535, 0.016347169876098633, 0.01698005199432373, 0.017612934112548828, 0.018245816230773926, 0.018878698348999023, 0.01951158046722412, 0.02014446258544922, 0.020777344703674316, 0.021410226821899414, 0.02204310894012451, 0.02267599105834961, 0.023308873176574707, 0.023941755294799805, 0.024574637413024902, 0.02520751953125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 25.0, 78.0, 149.0, 204.0, 229.0, 163.0, 97.0, 35.0, 17.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00063685531495139, -0.0005918823298998177, -0.0005469093448482454, -0.0005019363597966731, -0.00045696337474510074, -0.0004119903896935284, -0.00036701743374578655, -0.0003220444486942142, -0.0002770714636426419, -0.00023209847859106958, -0.00018712549353949726, -0.00014215252303984016, -9.717953798826784e-05, -5.2206552936695516e-05, -7.233582437038422e-06, 3.77394026145339e-05, 8.271238766610622e-05, 0.00012768537271767855, 0.00017265835776925087, 0.00021763132826890796, 0.0002626043278723955, 0.00030757731292396784, 0.0003525502688717097, 0.00039752325392328203, 0.00044249623897485435, 0.0004874692240264267, 0.0005324421799741685, 0.0005774151650257409, 0.0006223881500773132, 0.0006673611351288855, 0.0007123341201804578, 0.0007573071052320302, 0.0008022800320759416, 0.0008472530171275139, 0.0008922260021790862, 0.0009371989872306585, 0.0009821719722822309, 0.0010271449573338032, 0.0010721179423853755, 0.0011170909274369478, 0.0011620639124885201, 0.0012070368975400925, 0.0012520098825916648, 0.0012969828676432371, 0.0013419558526948094, 0.0013869288377463818, 0.001431901822797954, 0.0014768748078495264, 0.001521847676485777, 0.0015668206615373492, 0.0016117936465889215, 0.0016567666316404939, 0.0017017396166920662, 0.0017467126017436385, 0.0017916855867952108, 0.0018366585718467832, 0.0018816315568983555, 0.0019266045419499278, 0.0019715775270015, 0.0020165503956377506, 0.0020615234971046448, 0.0021064963657408953, 0.0021514694672077894, 0.00219644233584404, 0.002241415437310934]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 5.0, 10.0, 8.0, 10.0, 13.0, 11.0, 11.0, 16.0, 18.0, 19.0, 21.0, 22.0, 32.0, 34.0, 30.0, 39.0, 27.0, 34.0, 37.0, 44.0, 27.0, 41.0, 40.0, 38.0, 41.0, 35.0, 29.0, 36.0, 32.0, 33.0, 32.0, 23.0, 22.0, 23.0, 19.0, 17.0, 14.0, 12.0, 6.0, 10.0, 4.0, 6.0, 5.0, 4.0, 1.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040668249130249023, -0.0003937156870961189, -0.0003807488828897476, -0.0003677820786833763, -0.000354815274477005, -0.0003418484702706337, -0.0003288816660642624, -0.0003159148618578911, -0.0003029480576515198, -0.00028998125344514847, -0.00027701444923877716, -0.00026404764503240585, -0.00025108084082603455, -0.00023811403661966324, -0.00022514723241329193, -0.00021218042820692062, -0.00019921362400054932, -0.000186246819794178, -0.0001732800155878067, -0.0001603132113814354, -0.0001473464071750641, -0.00013437960296869278, -0.00012141279876232147, -0.00010844599455595016, -9.547919034957886e-05, -8.251238614320755e-05, -6.954558193683624e-05, -5.6578777730464935e-05, -4.361197352409363e-05, -3.064516931772232e-05, -1.7678365111351013e-05, -4.711560904979706e-06, 8.255243301391602e-06, 2.122204750776291e-05, 3.4188851714134216e-05, 4.7155655920505524e-05, 6.012246012687683e-05, 7.308926433324814e-05, 8.605606853961945e-05, 9.902287274599075e-05, 0.00011198967695236206, 0.00012495648115873337, 0.00013792328536510468, 0.00015089008957147598, 0.0001638568937778473, 0.0001768236979842186, 0.0001897905021905899, 0.0002027573063969612, 0.00021572411060333252, 0.00022869091480970383, 0.00024165771901607513, 0.00025462452322244644, 0.00026759132742881775, 0.00028055813163518906, 0.00029352493584156036, 0.00030649174004793167, 0.000319458544254303, 0.0003324253484606743, 0.0003453921526670456, 0.0003583589568734169, 0.0003713257610797882, 0.0003842925652861595, 0.0003972593694925308, 0.00041022617369890213, 0.00042319297790527344]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 10.0, 10.0, 11.0, 14.0, 26.0, 15.0, 25.0, 22.0, 24.0, 40.0, 38.0, 30.0, 48.0, 51.0, 42.0, 51.0, 47.0, 52.0, 52.0, 53.0, 37.0, 45.0, 41.0, 42.0, 33.0, 21.0, 19.0, 18.0, 14.0, 14.0, 12.0, 11.0, 11.0, 2.0, 3.0, 3.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.2928466796875, -6.046630859375, -5.8004150390625, -5.55419921875, -5.3079833984375, -5.061767578125, -4.8155517578125, -4.5693359375, -4.3231201171875, -4.076904296875, -3.8306884765625, -3.58447265625, -3.3382568359375, -3.092041015625, -2.8458251953125, -2.599609375, -2.3533935546875, -2.107177734375, -1.8609619140625, -1.61474609375, -1.3685302734375, -1.122314453125, -0.8760986328125, -0.6298828125, -0.3836669921875, -0.137451171875, 0.1087646484375, 0.35498046875, 0.6011962890625, 0.847412109375, 1.0936279296875, 1.33984375, 1.5860595703125, 1.832275390625, 2.0784912109375, 2.32470703125, 2.5709228515625, 2.817138671875, 3.0633544921875, 3.3095703125, 3.5557861328125, 3.802001953125, 4.0482177734375, 4.29443359375, 4.5406494140625, 4.786865234375, 5.0330810546875, 5.279296875, 5.5255126953125, 5.771728515625, 6.0179443359375, 6.26416015625, 6.5103759765625, 6.756591796875, 7.0028076171875, 7.2490234375, 7.4952392578125, 7.741455078125, 7.9876708984375, 8.23388671875, 8.4801025390625, 8.726318359375, 8.9725341796875, 9.21875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 19.0, 26.0, 32.0, 49.0, 69.0, 109.0, 182.0, 304.0, 569.0, 1316.0, 3337.0, 9672.0, 29578.0, 98449.0, 330629.0, 397086.0, 121984.0, 36446.0, 11612.0, 3974.0, 1480.0, 681.0, 354.0, 201.0, 127.0, 85.0, 47.0, 35.0, 36.0, 15.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.65625, -8.3778076171875, -8.099365234375, -7.8209228515625, -7.54248046875, -7.2640380859375, -6.985595703125, -6.7071533203125, -6.4287109375, -6.1502685546875, -5.871826171875, -5.5933837890625, -5.31494140625, -5.0364990234375, -4.758056640625, -4.4796142578125, -4.201171875, -3.9227294921875, -3.644287109375, -3.3658447265625, -3.08740234375, -2.8089599609375, -2.530517578125, -2.2520751953125, -1.9736328125, -1.6951904296875, -1.416748046875, -1.1383056640625, -0.85986328125, -0.5814208984375, -0.302978515625, -0.0245361328125, 0.25390625, 0.5323486328125, 0.810791015625, 1.0892333984375, 1.36767578125, 1.6461181640625, 1.924560546875, 2.2030029296875, 2.4814453125, 2.7598876953125, 3.038330078125, 3.3167724609375, 3.59521484375, 3.8736572265625, 4.152099609375, 4.4305419921875, 4.708984375, 4.9874267578125, 5.265869140625, 5.5443115234375, 5.82275390625, 6.1011962890625, 6.379638671875, 6.6580810546875, 6.9365234375, 7.2149658203125, 7.493408203125, 7.7718505859375, 8.05029296875, 8.3287353515625, 8.607177734375, 8.8856201171875, 9.1640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 7.0, 10.0, 4.0, 16.0, 16.0, 15.0, 15.0, 21.0, 34.0, 28.0, 41.0, 44.0, 42.0, 50.0, 56.0, 82.0, 175.0, 1475.0, 324.0, 115.0, 64.0, 51.0, 37.0, 45.0, 40.0, 31.0, 32.0, 29.0, 25.0, 26.0, 17.0, 16.0, 16.0, 12.0, 6.0, 8.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.203125, -19.47705078125, -18.7509765625, -18.02490234375, -17.298828125, -16.57275390625, -15.8466796875, -15.12060546875, -14.39453125, -13.66845703125, -12.9423828125, -12.21630859375, -11.490234375, -10.76416015625, -10.0380859375, -9.31201171875, -8.5859375, -7.85986328125, -7.1337890625, -6.40771484375, -5.681640625, -4.95556640625, -4.2294921875, -3.50341796875, -2.77734375, -2.05126953125, -1.3251953125, -0.59912109375, 0.126953125, 0.85302734375, 1.5791015625, 2.30517578125, 3.03125, 3.75732421875, 4.4833984375, 5.20947265625, 5.935546875, 6.66162109375, 7.3876953125, 8.11376953125, 8.83984375, 9.56591796875, 10.2919921875, 11.01806640625, 11.744140625, 12.47021484375, 13.1962890625, 13.92236328125, 14.6484375, 15.37451171875, 16.1005859375, 16.82666015625, 17.552734375, 18.27880859375, 19.0048828125, 19.73095703125, 20.45703125, 21.18310546875, 21.9091796875, 22.63525390625, 23.361328125, 24.08740234375, 24.8134765625, 25.53955078125, 26.265625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 4.0, 2.0, 9.0, 8.0, 6.0, 8.0, 12.0, 26.0, 31.0, 48.0, 52.0, 96.0, 113.0, 199.0, 344.0, 878.0, 9000.0, 3126969.0, 6224.0, 784.0, 313.0, 187.0, 127.0, 77.0, 50.0, 42.0, 25.0, 19.0, 20.0, 9.0, 4.0, 4.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.75, -108.306640625, -104.86328125, -101.419921875, -97.9765625, -94.533203125, -91.08984375, -87.646484375, -84.203125, -80.759765625, -77.31640625, -73.873046875, -70.4296875, -66.986328125, -63.54296875, -60.099609375, -56.65625, -53.212890625, -49.76953125, -46.326171875, -42.8828125, -39.439453125, -35.99609375, -32.552734375, -29.109375, -25.666015625, -22.22265625, -18.779296875, -15.3359375, -11.892578125, -8.44921875, -5.005859375, -1.5625, 1.880859375, 5.32421875, 8.767578125, 12.2109375, 15.654296875, 19.09765625, 22.541015625, 25.984375, 29.427734375, 32.87109375, 36.314453125, 39.7578125, 43.201171875, 46.64453125, 50.087890625, 53.53125, 56.974609375, 60.41796875, 63.861328125, 67.3046875, 70.748046875, 74.19140625, 77.634765625, 81.078125, 84.521484375, 87.96484375, 91.408203125, 94.8515625, 98.294921875, 101.73828125, 105.181640625, 108.625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 12.0, 23.0, 58.0, 89.0, 123.0, 164.0, 192.0, 129.0, 93.0, 62.0, 28.0, 20.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.250093460083008, -30.055500030517578, -28.86090660095215, -27.66631317138672, -26.471721649169922, -25.277128219604492, -24.082534790039062, -22.887943267822266, -21.693347930908203, -20.498754501342773, -19.304161071777344, -18.109569549560547, -16.914976119995117, -15.720382690429688, -14.525789260864258, -13.331196784973145, -12.136604309082031, -10.942010879516602, -9.747418403625488, -8.552824974060059, -7.358232021331787, -6.163639068603516, -4.969045639038086, -3.7744531631469727, -2.579859733581543, -1.385266661643982, -0.1906735897064209, 1.0039196014404297, 2.198512554168701, 3.3931055068969727, 4.587698936462402, 5.782291412353516, 6.9768829345703125, 8.171476364135742, 9.366068840026855, 10.560662269592285, 11.755254745483398, 12.949848175048828, 14.144441604614258, 15.339034080505371, 16.533626556396484, 17.728219985961914, 18.922813415527344, 20.11740493774414, 21.31199836730957, 22.506591796875, 23.70118522644043, 24.89577865600586, 26.09037208557129, 27.28496551513672, 28.47955894470215, 29.674152374267578, 30.868743896484375, 32.06333923339844, 33.257930755615234, 34.45252227783203, 35.647117614746094, 36.84170913696289, 38.03630447387695, 39.23089599609375, 40.42549133300781, 41.62008285522461, 42.814674377441406, 44.00926971435547, 45.203861236572266]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 7.0, 14.0, 22.0, 14.0, 17.0, 19.0, 30.0, 21.0, 33.0, 45.0, 25.0, 43.0, 35.0, 44.0, 54.0, 57.0, 49.0, 37.0, 42.0, 31.0, 38.0, 35.0, 45.0, 50.0, 27.0, 21.0, 23.0, 24.0, 16.0, 17.0, 9.0, 10.0, 10.0, 6.0, 10.0, 5.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.87211227416992, -48.00289535522461, -46.1336784362793, -44.26445770263672, -42.395240783691406, -40.526023864746094, -38.65680694580078, -36.78759002685547, -34.918373107910156, -33.049156188964844, -31.1799373626709, -29.310720443725586, -27.44150161743164, -25.572284698486328, -23.703067779541016, -21.833850860595703, -19.964630126953125, -18.095413208007812, -16.226194381713867, -14.356977462768555, -12.487759590148926, -10.618541717529297, -8.749324798583984, -6.8801069259643555, -5.010889053344727, -3.1416714191436768, -1.272453784942627, 0.5967636108398438, 2.4659814834594727, 4.335199356079102, 6.204416275024414, 8.073634147644043, 9.942855834960938, 11.812073707580566, 13.681291580200195, 15.550508499145508, 17.419727325439453, 19.288944244384766, 21.158161163330078, 23.02737808227539, 24.896596908569336, 26.76581382751465, 28.635032653808594, 30.504249572753906, 32.37346649169922, 34.24268341064453, 36.111900329589844, 37.98112106323242, 39.850337982177734, 41.71955490112305, 43.58877182006836, 45.45799255371094, 47.32720947265625, 49.19642639160156, 51.065643310546875, 52.93486022949219, 54.8040771484375, 56.67329406738281, 58.542510986328125, 60.41172790527344, 62.280948638916016, 64.15016174316406, 66.01937866210938, 67.88860321044922, 69.75782012939453]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 11.0, 8.0, 19.0, 9.0, 11.0, 17.0, 21.0, 35.0, 29.0, 36.0, 34.0, 41.0, 42.0, 53.0, 47.0, 52.0, 48.0, 50.0, 61.0, 49.0, 44.0, 31.0, 50.0, 35.0, 33.0, 25.0, 19.0, 18.0, 15.0, 8.0, 17.0, 6.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2890625, -7.0142822265625, -6.739501953125, -6.4647216796875, -6.18994140625, -5.9151611328125, -5.640380859375, -5.3656005859375, -5.0908203125, -4.8160400390625, -4.541259765625, -4.2664794921875, -3.99169921875, -3.7169189453125, -3.442138671875, -3.1673583984375, -2.892578125, -2.6177978515625, -2.343017578125, -2.0682373046875, -1.79345703125, -1.5186767578125, -1.243896484375, -0.9691162109375, -0.6943359375, -0.4195556640625, -0.144775390625, 0.1300048828125, 0.40478515625, 0.6795654296875, 0.954345703125, 1.2291259765625, 1.50390625, 1.7786865234375, 2.053466796875, 2.3282470703125, 2.60302734375, 2.8778076171875, 3.152587890625, 3.4273681640625, 3.7021484375, 3.9769287109375, 4.251708984375, 4.5264892578125, 4.80126953125, 5.0760498046875, 5.350830078125, 5.6256103515625, 5.900390625, 6.1751708984375, 6.449951171875, 6.7247314453125, 6.99951171875, 7.2742919921875, 7.549072265625, 7.8238525390625, 8.0986328125, 8.3734130859375, 8.648193359375, 8.9229736328125, 9.19775390625, 9.4725341796875, 9.747314453125, 10.0220947265625, 10.296875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 11.0, 9.0, 7.0, 11.0, 20.0, 25.0, 29.0, 35.0, 47.0, 50.0, 62.0, 75.0, 112.0, 124.0, 265.0, 605.0, 2371.0, 25040.0, 573062.0, 2845302.0, 712421.0, 30512.0, 2532.0, 591.0, 284.0, 162.0, 121.0, 93.0, 59.0, 47.0, 35.0, 28.0, 31.0, 17.0, 17.0, 16.0, 21.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.79541015625, -15.2001953125, -14.60498046875, -14.009765625, -13.41455078125, -12.8193359375, -12.22412109375, -11.62890625, -11.03369140625, -10.4384765625, -9.84326171875, -9.248046875, -8.65283203125, -8.0576171875, -7.46240234375, -6.8671875, -6.27197265625, -5.6767578125, -5.08154296875, -4.486328125, -3.89111328125, -3.2958984375, -2.70068359375, -2.10546875, -1.51025390625, -0.9150390625, -0.31982421875, 0.275390625, 0.87060546875, 1.4658203125, 2.06103515625, 2.65625, 3.25146484375, 3.8466796875, 4.44189453125, 5.037109375, 5.63232421875, 6.2275390625, 6.82275390625, 7.41796875, 8.01318359375, 8.6083984375, 9.20361328125, 9.798828125, 10.39404296875, 10.9892578125, 11.58447265625, 12.1796875, 12.77490234375, 13.3701171875, 13.96533203125, 14.560546875, 15.15576171875, 15.7509765625, 16.34619140625, 16.94140625, 17.53662109375, 18.1318359375, 18.72705078125, 19.322265625, 19.91748046875, 20.5126953125, 21.10791015625, 21.703125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 11.0, 9.0, 17.0, 20.0, 23.0, 38.0, 69.0, 69.0, 115.0, 155.0, 222.0, 296.0, 419.0, 477.0, 488.0, 487.0, 331.0, 254.0, 177.0, 111.0, 76.0, 52.0, 40.0, 34.0, 22.0, 17.0, 14.0, 11.0, 10.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.3463134765625, -11.856689453125, -11.3670654296875, -10.87744140625, -10.3878173828125, -9.898193359375, -9.4085693359375, -8.9189453125, -8.4293212890625, -7.939697265625, -7.4500732421875, -6.96044921875, -6.4708251953125, -5.981201171875, -5.4915771484375, -5.001953125, -4.5123291015625, -4.022705078125, -3.5330810546875, -3.04345703125, -2.5538330078125, -2.064208984375, -1.5745849609375, -1.0849609375, -0.5953369140625, -0.105712890625, 0.3839111328125, 0.87353515625, 1.3631591796875, 1.852783203125, 2.3424072265625, 2.83203125, 3.3216552734375, 3.811279296875, 4.3009033203125, 4.79052734375, 5.2801513671875, 5.769775390625, 6.2593994140625, 6.7490234375, 7.2386474609375, 7.728271484375, 8.2178955078125, 8.70751953125, 9.1971435546875, 9.686767578125, 10.1763916015625, 10.666015625, 11.1556396484375, 11.645263671875, 12.1348876953125, 12.62451171875, 13.1141357421875, 13.603759765625, 14.0933837890625, 14.5830078125, 15.0726318359375, 15.562255859375, 16.0518798828125, 16.54150390625, 17.0311279296875, 17.520751953125, 18.0103759765625, 18.5]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 7.0, 11.0, 18.0, 18.0, 23.0, 44.0, 56.0, 76.0, 102.0, 156.0, 242.0, 355.0, 661.0, 7829.0, 4031848.0, 150448.0, 1000.0, 431.0, 311.0, 191.0, 138.0, 109.0, 73.0, 42.0, 25.0, 20.0, 18.0, 10.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-88.5, -86.212890625, -83.92578125, -81.638671875, -79.3515625, -77.064453125, -74.77734375, -72.490234375, -70.203125, -67.916015625, -65.62890625, -63.341796875, -61.0546875, -58.767578125, -56.48046875, -54.193359375, -51.90625, -49.619140625, -47.33203125, -45.044921875, -42.7578125, -40.470703125, -38.18359375, -35.896484375, -33.609375, -31.322265625, -29.03515625, -26.748046875, -24.4609375, -22.173828125, -19.88671875, -17.599609375, -15.3125, -13.025390625, -10.73828125, -8.451171875, -6.1640625, -3.876953125, -1.58984375, 0.697265625, 2.984375, 5.271484375, 7.55859375, 9.845703125, 12.1328125, 14.419921875, 16.70703125, 18.994140625, 21.28125, 23.568359375, 25.85546875, 28.142578125, 30.4296875, 32.716796875, 35.00390625, 37.291015625, 39.578125, 41.865234375, 44.15234375, 46.439453125, 48.7265625, 51.013671875, 53.30078125, 55.587890625, 57.875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 10.0, 110.0, 382.0, 403.0, 97.0, 14.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.3288688659668, -51.93135452270508, -44.53384017944336, -37.136322021484375, -29.73880958557129, -22.341293334960938, -14.943778991699219, -7.5462646484375, -0.14875030517578125, 7.248764514923096, 14.646279335021973, 22.043794631958008, 29.441308975219727, 36.83882522583008, 44.2363395690918, 51.633853912353516, 59.031368255615234, 66.42888641357422, 73.82640075683594, 81.22391510009766, 88.62142944335938, 96.0189437866211, 103.41645812988281, 110.81397247314453, 118.21148681640625, 125.60900115966797, 133.0065155029297, 140.40403747558594, 147.80154418945312, 155.19906616210938, 162.59657287597656, 169.9940948486328, 177.39161682128906, 184.7891387939453, 192.1866455078125, 199.58416748046875, 206.98167419433594, 214.3791961669922, 221.77670288085938, 229.17422485351562, 236.5717315673828, 243.96925354003906, 251.36676025390625, 258.7642822265625, 266.16180419921875, 273.5592956542969, 280.9568176269531, 288.3543395996094, 295.7518615722656, 303.1493835449219, 310.5469055175781, 317.94439697265625, 325.3419189453125, 332.73944091796875, 340.136962890625, 347.5344543457031, 354.9319763183594, 362.3294982910156, 369.7270202636719, 377.12451171875, 384.52203369140625, 391.9195556640625, 399.31707763671875, 406.7145690917969, 414.1120910644531]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 8.0, 9.0, 6.0, 8.0, 14.0, 19.0, 16.0, 21.0, 25.0, 19.0, 28.0, 43.0, 36.0, 40.0, 34.0, 26.0, 42.0, 39.0, 44.0, 45.0, 37.0, 42.0, 38.0, 47.0, 34.0, 28.0, 28.0, 32.0, 29.0, 26.0, 25.0, 25.0, 15.0, 8.0, 11.0, 10.0, 11.0, 8.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.607723236083984, -38.214412689208984, -36.82110595703125, -35.42779541015625, -34.034488677978516, -32.641178131103516, -31.24786949157715, -29.85456085205078, -28.46125030517578, -27.067941665649414, -25.674633026123047, -24.281322479248047, -22.88801383972168, -21.494705200195312, -20.101396560668945, -18.708087921142578, -17.31477928161621, -15.921470642089844, -14.52816104888916, -13.134852409362793, -11.74154281616211, -10.348234176635742, -8.954925537109375, -7.561615943908691, -6.168307304382324, -4.774998188018799, -3.3816893100738525, -1.9883804321289062, -0.5950713157653809, 0.7982378005981445, 2.1915464401245117, 3.5848560333251953, 4.9781646728515625, 6.371473789215088, 7.764782905578613, 9.15809154510498, 10.551401138305664, 11.944709777832031, 13.338018417358398, 14.731328010559082, 16.124637603759766, 17.517946243286133, 18.9112548828125, 20.3045654296875, 21.697874069213867, 23.091182708740234, 24.4844913482666, 25.87779998779297, 27.271108627319336, 28.664417266845703, 30.05772590637207, 31.451034545898438, 32.84434509277344, 34.23765563964844, 35.63096237182617, 37.02427291870117, 38.417579650878906, 39.810890197753906, 41.20419692993164, 42.59750747680664, 43.990814208984375, 45.384124755859375, 46.777435302734375, 48.17074203491211, 49.56405258178711]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 6.0, 13.0, 9.0, 11.0, 15.0, 20.0, 24.0, 32.0, 37.0, 23.0, 35.0, 39.0, 51.0, 42.0, 46.0, 53.0, 53.0, 45.0, 45.0, 45.0, 46.0, 34.0, 30.0, 34.0, 36.0, 30.0, 17.0, 27.0, 15.0, 18.0, 11.0, 12.0, 16.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.6131591796875, -6.366943359375, -6.1207275390625, -5.87451171875, -5.6282958984375, -5.382080078125, -5.1358642578125, -4.8896484375, -4.6434326171875, -4.397216796875, -4.1510009765625, -3.90478515625, -3.6585693359375, -3.412353515625, -3.1661376953125, -2.919921875, -2.6737060546875, -2.427490234375, -2.1812744140625, -1.93505859375, -1.6888427734375, -1.442626953125, -1.1964111328125, -0.9501953125, -0.7039794921875, -0.457763671875, -0.2115478515625, 0.03466796875, 0.2808837890625, 0.527099609375, 0.7733154296875, 1.01953125, 1.2657470703125, 1.511962890625, 1.7581787109375, 2.00439453125, 2.2506103515625, 2.496826171875, 2.7430419921875, 2.9892578125, 3.2354736328125, 3.481689453125, 3.7279052734375, 3.97412109375, 4.2203369140625, 4.466552734375, 4.7127685546875, 4.958984375, 5.2052001953125, 5.451416015625, 5.6976318359375, 5.94384765625, 6.1900634765625, 6.436279296875, 6.6824951171875, 6.9287109375, 7.1749267578125, 7.421142578125, 7.6673583984375, 7.91357421875, 8.1597900390625, 8.406005859375, 8.6522216796875, 8.8984375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 10.0, 11.0, 9.0, 13.0, 19.0, 23.0, 33.0, 55.0, 77.0, 126.0, 201.0, 292.0, 453.0, 669.0, 1036.0, 1593.0, 2445.0, 3543.0, 5652.0, 8472.0, 13096.0, 20628.0, 33195.0, 55801.0, 100739.0, 209475.0, 277649.0, 132524.0, 70196.0, 40545.0, 24851.0, 15811.0, 10017.0, 6607.0, 4341.0, 2801.0, 1869.0, 1208.0, 872.0, 544.0, 356.0, 255.0, 146.0, 102.0, 67.0, 36.0, 38.0, 22.0, 12.0, 10.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.1826171875, -1.14471435546875, -1.1068115234375, -1.06890869140625, -1.031005859375, -0.99310302734375, -0.9552001953125, -0.91729736328125, -0.87939453125, -0.84149169921875, -0.8035888671875, -0.76568603515625, -0.727783203125, -0.68988037109375, -0.6519775390625, -0.61407470703125, -0.576171875, -0.53826904296875, -0.5003662109375, -0.46246337890625, -0.424560546875, -0.38665771484375, -0.3487548828125, -0.31085205078125, -0.27294921875, -0.23504638671875, -0.1971435546875, -0.15924072265625, -0.121337890625, -0.08343505859375, -0.0455322265625, -0.00762939453125, 0.0302734375, 0.06817626953125, 0.1060791015625, 0.14398193359375, 0.181884765625, 0.21978759765625, 0.2576904296875, 0.29559326171875, 0.33349609375, 0.37139892578125, 0.4093017578125, 0.44720458984375, 0.485107421875, 0.52301025390625, 0.5609130859375, 0.59881591796875, 0.63671875, 0.67462158203125, 0.7125244140625, 0.75042724609375, 0.788330078125, 0.82623291015625, 0.8641357421875, 0.90203857421875, 0.93994140625, 0.97784423828125, 1.0157470703125, 1.05364990234375, 1.091552734375, 1.12945556640625, 1.1673583984375, 1.20526123046875, 1.2431640625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 7.0, 2.0, 7.0, 6.0, 17.0, 12.0, 10.0, 19.0, 20.0, 26.0, 23.0, 22.0, 27.0, 34.0, 35.0, 31.0, 40.0, 36.0, 43.0, 36.0, 1063.0, 34.0, 42.0, 36.0, 49.0, 41.0, 27.0, 36.0, 29.0, 33.0, 34.0, 18.0, 22.0, 17.0, 13.0, 14.0, 14.0, 13.0, 8.0, 6.0, 7.0, 8.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.49609375, -4.35980224609375, -4.2235107421875, -4.08721923828125, -3.950927734375, -3.81463623046875, -3.6783447265625, -3.54205322265625, -3.40576171875, -3.26947021484375, -3.1331787109375, -2.99688720703125, -2.860595703125, -2.72430419921875, -2.5880126953125, -2.45172119140625, -2.3154296875, -2.17913818359375, -2.0428466796875, -1.90655517578125, -1.770263671875, -1.63397216796875, -1.4976806640625, -1.36138916015625, -1.22509765625, -1.08880615234375, -0.9525146484375, -0.81622314453125, -0.679931640625, -0.54364013671875, -0.4073486328125, -0.27105712890625, -0.134765625, 0.00152587890625, 0.1378173828125, 0.27410888671875, 0.410400390625, 0.54669189453125, 0.6829833984375, 0.81927490234375, 0.95556640625, 1.09185791015625, 1.2281494140625, 1.36444091796875, 1.500732421875, 1.63702392578125, 1.7733154296875, 1.90960693359375, 2.0458984375, 2.18218994140625, 2.3184814453125, 2.45477294921875, 2.591064453125, 2.72735595703125, 2.8636474609375, 2.99993896484375, 3.13623046875, 3.27252197265625, 3.4088134765625, 3.54510498046875, 3.681396484375, 3.81768798828125, 3.9539794921875, 4.09027099609375, 4.2265625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 5.0, 11.0, 16.0, 24.0, 33.0, 36.0, 56.0, 93.0, 123.0, 151.0, 220.0, 313.0, 474.0, 689.0, 942.0, 1458.0, 2091.0, 3313.0, 4860.0, 7699.0, 11720.0, 18337.0, 29486.0, 48973.0, 84412.0, 156890.0, 1320401.0, 172041.0, 91869.0, 52141.0, 31410.0, 19760.0, 12505.0, 8272.0, 5422.0, 3528.0, 2320.0, 1602.0, 1062.0, 714.0, 510.0, 394.0, 200.0, 180.0, 118.0, 90.0, 50.0, 31.0, 31.0, 27.0, 9.0, 9.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.0966796875, -1.0608062744140625, -1.024932861328125, -0.9890594482421875, -0.95318603515625, -0.9173126220703125, -0.881439208984375, -0.8455657958984375, -0.8096923828125, -0.7738189697265625, -0.737945556640625, -0.7020721435546875, -0.66619873046875, -0.6303253173828125, -0.594451904296875, -0.5585784912109375, -0.522705078125, -0.4868316650390625, -0.450958251953125, -0.4150848388671875, -0.37921142578125, -0.3433380126953125, -0.307464599609375, -0.2715911865234375, -0.2357177734375, -0.1998443603515625, -0.163970947265625, -0.1280975341796875, -0.09222412109375, -0.0563507080078125, -0.020477294921875, 0.0153961181640625, 0.05126953125, 0.0871429443359375, 0.123016357421875, 0.1588897705078125, 0.19476318359375, 0.2306365966796875, 0.266510009765625, 0.3023834228515625, 0.3382568359375, 0.3741302490234375, 0.410003662109375, 0.4458770751953125, 0.48175048828125, 0.5176239013671875, 0.553497314453125, 0.5893707275390625, 0.625244140625, 0.6611175537109375, 0.696990966796875, 0.7328643798828125, 0.76873779296875, 0.8046112060546875, 0.840484619140625, 0.8763580322265625, 0.9122314453125, 0.9481048583984375, 0.983978271484375, 1.0198516845703125, 1.05572509765625, 1.0915985107421875, 1.127471923828125, 1.1633453369140625, 1.19921875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 4.0, 9.0, 9.0, 8.0, 9.0, 11.0, 18.0, 15.0, 31.0, 39.0, 43.0, 35.0, 48.0, 52.0, 48.0, 47.0, 50.0, 56.0, 67.0, 51.0, 53.0, 42.0, 32.0, 30.0, 28.0, 20.0, 26.0, 16.0, 17.0, 12.0, 8.0, 6.0, 8.0, 5.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008759498596191406, -0.0008440092206001282, -0.0008120685815811157, -0.0007801279425621033, -0.0007481873035430908, -0.0007162466645240784, -0.0006843060255050659, -0.0006523653864860535, -0.000620424747467041, -0.0005884841084480286, -0.0005565434694290161, -0.0005246028304100037, -0.0004926621913909912, -0.00046072155237197876, -0.0004287809133529663, -0.00039684027433395386, -0.0003648996353149414, -0.00033295899629592896, -0.0003010183572769165, -0.00026907771825790405, -0.0002371370792388916, -0.00020519644021987915, -0.0001732558012008667, -0.00014131516218185425, -0.0001093745231628418, -7.743388414382935e-05, -4.5493245124816895e-05, -1.3552606105804443e-05, 1.8388032913208008e-05, 5.032867193222046e-05, 8.226931095123291e-05, 0.00011420994997024536, 0.0001461505889892578, 0.00017809122800827026, 0.00021003186702728271, 0.00024197250604629517, 0.0002739131450653076, 0.00030585378408432007, 0.0003377944231033325, 0.00036973506212234497, 0.0004016757011413574, 0.0004336163401603699, 0.0004655569791793823, 0.0004974976181983948, 0.0005294382572174072, 0.0005613788962364197, 0.0005933195352554321, 0.0006252601742744446, 0.000657200813293457, 0.0006891414523124695, 0.0007210820913314819, 0.0007530227303504944, 0.0007849633693695068, 0.0008169040083885193, 0.0008488446474075317, 0.0008807852864265442, 0.0009127259254455566, 0.0009446665644645691, 0.0009766072034835815, 0.001008547842502594, 0.0010404884815216064, 0.001072429120540619, 0.0011043697595596313, 0.0011363103985786438, 0.0011682510375976562]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 4.0, 5.0, 9.0, 13.0, 10.0, 10.0, 11.0, 20.0, 24.0, 25.0, 35.0, 38.0, 43.0, 73.0, 91.0, 146.0, 283.0, 546.0, 2741.0, 907796.0, 134160.0, 1220.0, 424.0, 218.0, 156.0, 95.0, 87.0, 51.0, 51.0, 30.0, 30.0, 11.0, 21.0, 12.0, 12.0, 14.0, 4.0, 7.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.0248260498046875, -0.024132966995239258, -0.023439884185791016, -0.022746801376342773, -0.02205371856689453, -0.02136063575744629, -0.020667552947998047, -0.019974470138549805, -0.019281387329101562, -0.01858830451965332, -0.017895221710205078, -0.017202138900756836, -0.016509056091308594, -0.01581597328186035, -0.01512289047241211, -0.014429807662963867, -0.013736724853515625, -0.013043642044067383, -0.01235055923461914, -0.011657476425170898, -0.010964393615722656, -0.010271310806274414, -0.009578227996826172, -0.00888514518737793, -0.008192062377929688, -0.007498979568481445, -0.006805896759033203, -0.006112813949584961, -0.005419731140136719, -0.0047266483306884766, -0.004033565521240234, -0.003340482711791992, -0.00264739990234375, -0.001954317092895508, -0.0012612342834472656, -0.0005681514739990234, 0.00012493133544921875, 0.0008180141448974609, 0.0015110969543457031, 0.0022041797637939453, 0.0028972625732421875, 0.0035903453826904297, 0.004283428192138672, 0.004976511001586914, 0.005669593811035156, 0.0063626766204833984, 0.007055759429931641, 0.007748842239379883, 0.008441925048828125, 0.009135007858276367, 0.00982809066772461, 0.010521173477172852, 0.011214256286621094, 0.011907339096069336, 0.012600421905517578, 0.01329350471496582, 0.013986587524414062, 0.014679670333862305, 0.015372753143310547, 0.01606583595275879, 0.01675891876220703, 0.017452001571655273, 0.018145084381103516, 0.018838167190551758, 0.01953125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 26.0, 77.0, 192.0, 305.0, 251.0, 121.0, 32.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021674383897334337, -0.0021050528157502413, -0.002042667241767049, -0.0019802816677838564, -0.0019178962102159858, -0.0018555106362327933, -0.0017931251786649227, -0.0017307396046817303, -0.0016683540306985378, -0.0016059684567153454, -0.001543582882732153, -0.0014811974251642823, -0.0014188118511810899, -0.0013564262771978974, -0.0012940408196300268, -0.0012316552456468344, -0.001169269671663642, -0.0011068840976804495, -0.001044498523697257, -0.0009821130661293864, -0.000919727492146194, -0.0008573419181630015, -0.00079495640238747, -0.0007325708866119385, -0.000670185312628746, -0.0006077997386455536, -0.0005454142228700221, -0.00048302867799066007, -0.0004206431331112981, -0.0003582575882319361, -0.0002958720433525741, -0.00023348649847321212, -0.00017110072076320648, -0.0001087151758838445, -4.632963100448251e-05, 1.605591387487948e-05, 7.844145875424147e-05, 0.00014082700363360345, 0.00020321254851296544, 0.00026559809339232743, 0.0003279836382716894, 0.0003903691831510514, 0.0004527547280304134, 0.0005151402438059449, 0.0005775258177891374, 0.0006399113917723298, 0.0007022969075478613, 0.0007646824233233929, 0.0008270679973065853, 0.0008894535712897778, 0.0009518390870653093, 0.0010142246028408408, 0.0010766101768240333, 0.0011389957508072257, 0.0012013812083750963, 0.0012637667823582888, 0.0013261523563414812, 0.0013885379303246737, 0.001450923504307866, 0.0015133089618757367, 0.0015756945358589292, 0.0016380801098421216, 0.0017004655674099922, 0.0017628511413931847, 0.001825236715376377]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 9.0, 7.0, 11.0, 13.0, 18.0, 13.0, 14.0, 12.0, 32.0, 28.0, 24.0, 31.0, 39.0, 35.0, 23.0, 37.0, 30.0, 33.0, 42.0, 45.0, 48.0, 40.0, 49.0, 43.0, 31.0, 47.0, 29.0, 38.0, 15.0, 25.0, 22.0, 20.0, 21.0, 13.0, 11.0, 11.0, 7.0, 6.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005617737770080566, -0.000544319860637188, -0.0005268659442663193, -0.0005094120278954506, -0.0004919581115245819, -0.0004745041951537132, -0.00045705027878284454, -0.00043959636241197586, -0.0004221424460411072, -0.0004046885296702385, -0.0003872346132993698, -0.00036978069692850113, -0.00035232678055763245, -0.00033487286418676376, -0.0003174189478158951, -0.0002999650314450264, -0.0002825111150741577, -0.00026505719870328903, -0.00024760328233242035, -0.00023014936596155167, -0.00021269544959068298, -0.0001952415332198143, -0.00017778761684894562, -0.00016033370047807693, -0.00014287978410720825, -0.00012542586773633957, -0.00010797195136547089, -9.05180349946022e-05, -7.306411862373352e-05, -5.561020225286484e-05, -3.8156285881996155e-05, -2.0702369511127472e-05, -3.248453140258789e-06, 1.4205463230609894e-05, 3.165937960147858e-05, 4.911329597234726e-05, 6.656721234321594e-05, 8.402112871408463e-05, 0.00010147504508495331, 0.00011892896145582199, 0.00013638287782669067, 0.00015383679419755936, 0.00017129071056842804, 0.00018874462693929672, 0.0002061985433101654, 0.0002236524596810341, 0.00024110637605190277, 0.00025856029242277145, 0.00027601420879364014, 0.0002934681251645088, 0.0003109220415353775, 0.0003283759579062462, 0.00034582987427711487, 0.00036328379064798355, 0.00038073770701885223, 0.0003981916233897209, 0.0004156455397605896, 0.0004330994561314583, 0.00045055337250232697, 0.00046800728887319565, 0.00048546120524406433, 0.000502915121614933, 0.0005203690379858017, 0.0005378229543566704, 0.0005552768707275391]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 6.0, 13.0, 9.0, 11.0, 15.0, 20.0, 24.0, 32.0, 37.0, 23.0, 35.0, 39.0, 51.0, 42.0, 46.0, 53.0, 53.0, 45.0, 45.0, 45.0, 46.0, 34.0, 30.0, 34.0, 36.0, 30.0, 17.0, 27.0, 15.0, 18.0, 11.0, 12.0, 16.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.6131591796875, -6.366943359375, -6.1207275390625, -5.87451171875, -5.6282958984375, -5.382080078125, -5.1358642578125, -4.8896484375, -4.6434326171875, -4.397216796875, -4.1510009765625, -3.90478515625, -3.6585693359375, -3.412353515625, -3.1661376953125, -2.919921875, -2.6737060546875, -2.427490234375, -2.1812744140625, -1.93505859375, -1.6888427734375, -1.442626953125, -1.1964111328125, -0.9501953125, -0.7039794921875, -0.457763671875, -0.2115478515625, 0.03466796875, 0.2808837890625, 0.527099609375, 0.7733154296875, 1.01953125, 1.2657470703125, 1.511962890625, 1.7581787109375, 2.00439453125, 2.2506103515625, 2.496826171875, 2.7430419921875, 2.9892578125, 3.2354736328125, 3.481689453125, 3.7279052734375, 3.97412109375, 4.2203369140625, 4.466552734375, 4.7127685546875, 4.958984375, 5.2052001953125, 5.451416015625, 5.6976318359375, 5.94384765625, 6.1900634765625, 6.436279296875, 6.6824951171875, 6.9287109375, 7.1749267578125, 7.421142578125, 7.6673583984375, 7.91357421875, 8.1597900390625, 8.406005859375, 8.6522216796875, 8.8984375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 5.0, 13.0, 8.0, 15.0, 21.0, 30.0, 65.0, 64.0, 84.0, 152.0, 304.0, 627.0, 1248.0, 2702.0, 5712.0, 12253.0, 27290.0, 64533.0, 172098.0, 365619.0, 240026.0, 89427.0, 35821.0, 16158.0, 7377.0, 3515.0, 1630.0, 808.0, 376.0, 197.0, 119.0, 83.0, 50.0, 29.0, 25.0, 20.0, 13.0, 14.0, 5.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8515625, -6.628173828125, -6.40478515625, -6.181396484375, -5.9580078125, -5.734619140625, -5.51123046875, -5.287841796875, -5.064453125, -4.841064453125, -4.61767578125, -4.394287109375, -4.1708984375, -3.947509765625, -3.72412109375, -3.500732421875, -3.27734375, -3.053955078125, -2.83056640625, -2.607177734375, -2.3837890625, -2.160400390625, -1.93701171875, -1.713623046875, -1.490234375, -1.266845703125, -1.04345703125, -0.820068359375, -0.5966796875, -0.373291015625, -0.14990234375, 0.073486328125, 0.296875, 0.520263671875, 0.74365234375, 0.967041015625, 1.1904296875, 1.413818359375, 1.63720703125, 1.860595703125, 2.083984375, 2.307373046875, 2.53076171875, 2.754150390625, 2.9775390625, 3.200927734375, 3.42431640625, 3.647705078125, 3.87109375, 4.094482421875, 4.31787109375, 4.541259765625, 4.7646484375, 4.988037109375, 5.21142578125, 5.434814453125, 5.658203125, 5.881591796875, 6.10498046875, 6.328369140625, 6.5517578125, 6.775146484375, 6.99853515625, 7.221923828125, 7.4453125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 4.0, 9.0, 11.0, 9.0, 14.0, 13.0, 16.0, 11.0, 11.0, 30.0, 28.0, 24.0, 20.0, 49.0, 44.0, 67.0, 80.0, 149.0, 390.0, 1438.0, 179.0, 80.0, 56.0, 39.0, 51.0, 32.0, 27.0, 24.0, 27.0, 18.0, 15.0, 13.0, 12.0, 16.0, 12.0, 7.0, 5.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.46875, -28.6044921875, -27.740234375, -26.8759765625, -26.01171875, -25.1474609375, -24.283203125, -23.4189453125, -22.5546875, -21.6904296875, -20.826171875, -19.9619140625, -19.09765625, -18.2333984375, -17.369140625, -16.5048828125, -15.640625, -14.7763671875, -13.912109375, -13.0478515625, -12.18359375, -11.3193359375, -10.455078125, -9.5908203125, -8.7265625, -7.8623046875, -6.998046875, -6.1337890625, -5.26953125, -4.4052734375, -3.541015625, -2.6767578125, -1.8125, -0.9482421875, -0.083984375, 0.7802734375, 1.64453125, 2.5087890625, 3.373046875, 4.2373046875, 5.1015625, 5.9658203125, 6.830078125, 7.6943359375, 8.55859375, 9.4228515625, 10.287109375, 11.1513671875, 12.015625, 12.8798828125, 13.744140625, 14.6083984375, 15.47265625, 16.3369140625, 17.201171875, 18.0654296875, 18.9296875, 19.7939453125, 20.658203125, 21.5224609375, 22.38671875, 23.2509765625, 24.115234375, 24.9794921875, 25.84375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 9.0, 8.0, 13.0, 21.0, 17.0, 29.0, 46.0, 53.0, 55.0, 109.0, 145.0, 284.0, 511.0, 1803.0, 2963986.0, 176455.0, 1026.0, 431.0, 228.0, 147.0, 95.0, 57.0, 41.0, 35.0, 31.0, 29.0, 11.0, 8.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-100.0, -96.861328125, -93.72265625, -90.583984375, -87.4453125, -84.306640625, -81.16796875, -78.029296875, -74.890625, -71.751953125, -68.61328125, -65.474609375, -62.3359375, -59.197265625, -56.05859375, -52.919921875, -49.78125, -46.642578125, -43.50390625, -40.365234375, -37.2265625, -34.087890625, -30.94921875, -27.810546875, -24.671875, -21.533203125, -18.39453125, -15.255859375, -12.1171875, -8.978515625, -5.83984375, -2.701171875, 0.4375, 3.576171875, 6.71484375, 9.853515625, 12.9921875, 16.130859375, 19.26953125, 22.408203125, 25.546875, 28.685546875, 31.82421875, 34.962890625, 38.1015625, 41.240234375, 44.37890625, 47.517578125, 50.65625, 53.794921875, 56.93359375, 60.072265625, 63.2109375, 66.349609375, 69.48828125, 72.626953125, 75.765625, 78.904296875, 82.04296875, 85.181640625, 88.3203125, 91.458984375, 94.59765625, 97.736328125, 100.875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [11.0, 501.0, 499.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.462803840637207, -7.869811534881592, -0.27681922912597656, 7.3161725997924805, 14.909165382385254, 22.502159118652344, 30.095149993896484, 37.68814468383789, 45.28113555908203, 52.87412643432617, 60.46712112426758, 68.06011199951172, 75.65310668945312, 83.24609375, 90.8390884399414, 98.43208312988281, 106.02507019042969, 113.6180648803711, 121.21105194091797, 128.80404663085938, 136.39703369140625, 143.9900360107422, 151.58302307128906, 159.176025390625, 166.76901245117188, 174.36199951171875, 181.9550018310547, 189.54798889160156, 197.14097595214844, 204.73397827148438, 212.32696533203125, 219.91995239257812, 227.51295471191406, 235.10594177246094, 242.69894409179688, 250.29193115234375, 257.8849182128906, 265.4779052734375, 273.0709228515625, 280.6639099121094, 288.25689697265625, 295.8498840332031, 303.44287109375, 311.035888671875, 318.6288757324219, 326.22186279296875, 333.8148498535156, 341.4078369140625, 349.0008239746094, 356.59381103515625, 364.1867980957031, 371.77978515625, 379.372802734375, 386.9657897949219, 394.55877685546875, 402.1517639160156, 409.7447814941406, 417.3377685546875, 424.9307556152344, 432.52374267578125, 440.11676025390625, 447.7097473144531, 455.302734375, 462.8957214355469, 470.48870849609375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 10.0, 8.0, 10.0, 20.0, 14.0, 15.0, 15.0, 17.0, 12.0, 21.0, 19.0, 23.0, 30.0, 24.0, 29.0, 30.0, 45.0, 41.0, 32.0, 40.0, 33.0, 27.0, 29.0, 35.0, 34.0, 26.0, 36.0, 28.0, 32.0, 23.0, 36.0, 24.0, 20.0, 22.0, 30.0, 15.0, 19.0, 13.0, 12.0, 6.0, 8.0, 7.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0], "bins": [-53.91154098510742, -52.26323318481445, -50.614925384521484, -48.966617584228516, -47.31830978393555, -45.67000198364258, -44.021690368652344, -42.373382568359375, -40.725074768066406, -39.07676696777344, -37.42845916748047, -35.7801513671875, -34.13184356689453, -32.48353576660156, -30.83522605895996, -29.186918258666992, -27.538612365722656, -25.890304565429688, -24.24199676513672, -22.59368896484375, -20.94538116455078, -19.297073364257812, -17.64876365661621, -16.000455856323242, -14.352148056030273, -12.703840255737305, -11.055532455444336, -9.40722370147705, -7.758915901184082, -6.110608100891113, -4.462299346923828, -2.8139915466308594, -1.1656837463378906, 0.4826242923736572, 2.130932331085205, 3.779240608215332, 5.427548408508301, 7.0758562088012695, 8.724164962768555, 10.372472763061523, 12.020780563354492, 13.669088363647461, 15.31739616394043, 16.96570587158203, 18.614013671875, 20.26232147216797, 21.910629272460938, 23.558937072753906, 25.207244873046875, 26.855552673339844, 28.503860473632812, 30.15216827392578, 31.80047607421875, 33.44878387451172, 35.09709167480469, 36.745399475097656, 38.393707275390625, 40.042015075683594, 41.69032287597656, 43.33863067626953, 44.9869384765625, 46.63524627685547, 48.28355407714844, 49.931861877441406, 51.58017349243164]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 6.0, 2.0, 15.0, 15.0, 11.0, 14.0, 14.0, 30.0, 28.0, 18.0, 36.0, 27.0, 45.0, 51.0, 52.0, 43.0, 52.0, 47.0, 53.0, 50.0, 35.0, 40.0, 38.0, 23.0, 31.0, 32.0, 31.0, 25.0, 22.0, 15.0, 21.0, 18.0, 11.0, 11.0, 10.0, 3.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.26953125, -7.00006103515625, -6.7305908203125, -6.46112060546875, -6.191650390625, -5.92218017578125, -5.6527099609375, -5.38323974609375, -5.11376953125, -4.84429931640625, -4.5748291015625, -4.30535888671875, -4.035888671875, -3.76641845703125, -3.4969482421875, -3.22747802734375, -2.9580078125, -2.68853759765625, -2.4190673828125, -2.14959716796875, -1.880126953125, -1.61065673828125, -1.3411865234375, -1.07171630859375, -0.80224609375, -0.53277587890625, -0.2633056640625, 0.00616455078125, 0.275634765625, 0.54510498046875, 0.8145751953125, 1.08404541015625, 1.353515625, 1.62298583984375, 1.8924560546875, 2.16192626953125, 2.431396484375, 2.70086669921875, 2.9703369140625, 3.23980712890625, 3.50927734375, 3.77874755859375, 4.0482177734375, 4.31768798828125, 4.587158203125, 4.85662841796875, 5.1260986328125, 5.39556884765625, 5.6650390625, 5.93450927734375, 6.2039794921875, 6.47344970703125, 6.742919921875, 7.01239013671875, 7.2818603515625, 7.55133056640625, 7.82080078125, 8.09027099609375, 8.3597412109375, 8.62921142578125, 8.898681640625, 9.16815185546875, 9.4376220703125, 9.70709228515625, 9.9765625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 16.0, 13.0, 19.0, 19.0, 18.0, 35.0, 47.0, 60.0, 75.0, 116.0, 181.0, 375.0, 872.0, 4493.0, 184921.0, 3232023.0, 756109.0, 12380.0, 1348.0, 424.0, 207.0, 132.0, 83.0, 67.0, 48.0, 42.0, 37.0, 23.0, 15.0, 15.0, 8.0, 13.0, 9.0, 7.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.15625, -23.313720703125, -22.47119140625, -21.628662109375, -20.7861328125, -19.943603515625, -19.10107421875, -18.258544921875, -17.416015625, -16.573486328125, -15.73095703125, -14.888427734375, -14.0458984375, -13.203369140625, -12.36083984375, -11.518310546875, -10.67578125, -9.833251953125, -8.99072265625, -8.148193359375, -7.3056640625, -6.463134765625, -5.62060546875, -4.778076171875, -3.935546875, -3.093017578125, -2.25048828125, -1.407958984375, -0.5654296875, 0.277099609375, 1.11962890625, 1.962158203125, 2.8046875, 3.647216796875, 4.48974609375, 5.332275390625, 6.1748046875, 7.017333984375, 7.85986328125, 8.702392578125, 9.544921875, 10.387451171875, 11.22998046875, 12.072509765625, 12.9150390625, 13.757568359375, 14.60009765625, 15.442626953125, 16.28515625, 17.127685546875, 17.97021484375, 18.812744140625, 19.6552734375, 20.497802734375, 21.34033203125, 22.182861328125, 23.025390625, 23.867919921875, 24.71044921875, 25.552978515625, 26.3955078125, 27.238037109375, 28.08056640625, 28.923095703125, 29.765625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 6.0, 9.0, 16.0, 23.0, 34.0, 54.0, 60.0, 80.0, 98.0, 183.0, 212.0, 345.0, 408.0, 446.0, 455.0, 403.0, 337.0, 246.0, 184.0, 118.0, 94.0, 73.0, 55.0, 42.0, 23.0, 21.0, 14.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.203125, -14.69775390625, -14.1923828125, -13.68701171875, -13.181640625, -12.67626953125, -12.1708984375, -11.66552734375, -11.16015625, -10.65478515625, -10.1494140625, -9.64404296875, -9.138671875, -8.63330078125, -8.1279296875, -7.62255859375, -7.1171875, -6.61181640625, -6.1064453125, -5.60107421875, -5.095703125, -4.59033203125, -4.0849609375, -3.57958984375, -3.07421875, -2.56884765625, -2.0634765625, -1.55810546875, -1.052734375, -0.54736328125, -0.0419921875, 0.46337890625, 0.96875, 1.47412109375, 1.9794921875, 2.48486328125, 2.990234375, 3.49560546875, 4.0009765625, 4.50634765625, 5.01171875, 5.51708984375, 6.0224609375, 6.52783203125, 7.033203125, 7.53857421875, 8.0439453125, 8.54931640625, 9.0546875, 9.56005859375, 10.0654296875, 10.57080078125, 11.076171875, 11.58154296875, 12.0869140625, 12.59228515625, 13.09765625, 13.60302734375, 14.1083984375, 14.61376953125, 15.119140625, 15.62451171875, 16.1298828125, 16.63525390625, 17.140625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 8.0, 7.0, 19.0, 23.0, 29.0, 58.0, 67.0, 95.0, 127.0, 175.0, 259.0, 383.0, 625.0, 5457.0, 3675610.0, 508120.0, 1579.0, 539.0, 319.0, 247.0, 152.0, 104.0, 86.0, 57.0, 45.0, 25.0, 17.0, 12.0, 9.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.5, -74.23828125, -71.9765625, -69.71484375, -67.453125, -65.19140625, -62.9296875, -60.66796875, -58.40625, -56.14453125, -53.8828125, -51.62109375, -49.359375, -47.09765625, -44.8359375, -42.57421875, -40.3125, -38.05078125, -35.7890625, -33.52734375, -31.265625, -29.00390625, -26.7421875, -24.48046875, -22.21875, -19.95703125, -17.6953125, -15.43359375, -13.171875, -10.91015625, -8.6484375, -6.38671875, -4.125, -1.86328125, 0.3984375, 2.66015625, 4.921875, 7.18359375, 9.4453125, 11.70703125, 13.96875, 16.23046875, 18.4921875, 20.75390625, 23.015625, 25.27734375, 27.5390625, 29.80078125, 32.0625, 34.32421875, 36.5859375, 38.84765625, 41.109375, 43.37109375, 45.6328125, 47.89453125, 50.15625, 52.41796875, 54.6796875, 56.94140625, 59.203125, 61.46484375, 63.7265625, 65.98828125, 68.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 16.0, 228.0, 582.0, 180.0, 10.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.25180053710938, -59.91868209838867, -50.58556365966797, -41.252445220947266, -31.919326782226562, -22.58620834350586, -13.253089904785156, -3.9199676513671875, 5.41314697265625, 14.746265411376953, 24.079383850097656, 33.41250228881836, 42.74562072753906, 52.078739166259766, 61.41185760498047, 70.74497985839844, 80.07809448242188, 89.41120910644531, 98.74433135986328, 108.07745361328125, 117.41056823730469, 126.74368286132812, 136.07681274414062, 145.40992736816406, 154.7430419921875, 164.07615661621094, 173.40927124023438, 182.74240112304688, 192.0755157470703, 201.40863037109375, 210.74176025390625, 220.0748748779297, 229.40802001953125, 238.7411346435547, 248.07424926757812, 257.4073791503906, 266.740478515625, 276.0736083984375, 285.40673828125, 294.7398681640625, 304.0729675292969, 313.4060974121094, 322.73919677734375, 332.07232666015625, 341.40545654296875, 350.7385559082031, 360.0716857910156, 369.40478515625, 378.7379150390625, 388.071044921875, 397.4041442871094, 406.7372741699219, 416.07037353515625, 425.40350341796875, 434.73663330078125, 444.06976318359375, 453.4028625488281, 462.7359924316406, 472.069091796875, 481.4022216796875, 490.7353515625, 500.0684509277344, 509.4015808105469, 518.7346801757812, 528.0678100585938]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 8.0, 4.0, 5.0, 11.0, 9.0, 19.0, 15.0, 24.0, 25.0, 27.0, 31.0, 27.0, 42.0, 31.0, 43.0, 33.0, 36.0, 43.0, 35.0, 52.0, 48.0, 37.0, 34.0, 35.0, 44.0, 40.0, 40.0, 33.0, 22.0, 21.0, 22.0, 14.0, 14.0, 10.0, 12.0, 14.0, 6.0, 7.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.38121795654297, -51.78391647338867, -50.18661117553711, -48.58930969238281, -46.99200439453125, -45.39470291137695, -43.797401428222656, -42.200096130371094, -40.6027946472168, -39.0054931640625, -37.40818786621094, -35.81088638305664, -34.213584899902344, -32.61627960205078, -31.018978118896484, -29.421674728393555, -27.824371337890625, -26.227067947387695, -24.629764556884766, -23.03246307373047, -21.43515968322754, -19.83785629272461, -18.240554809570312, -16.643251419067383, -15.045948028564453, -13.448644638061523, -11.85134220123291, -10.254039764404297, -8.656736373901367, -7.059433460235596, -5.462130546569824, -3.864828109741211, -2.2675209045410156, -0.6702179908752441, 0.9270849227905273, 2.524387836456299, 4.12169075012207, 5.718993663787842, 7.316296577453613, 8.913599014282227, 10.510902404785156, 12.108205795288086, 13.7055082321167, 15.302810668945312, 16.900114059448242, 18.497417449951172, 20.09471893310547, 21.6920223236084, 23.289325714111328, 24.886629104614258, 26.483932495117188, 28.081233978271484, 29.678537368774414, 31.275840759277344, 32.87314224243164, 34.47044372558594, 36.0677490234375, 37.6650505065918, 39.26235580444336, 40.859657287597656, 42.45696258544922, 44.054264068603516, 45.65156555175781, 47.248870849609375, 48.84617233276367]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 8.0, 11.0, 28.0, 19.0, 20.0, 20.0, 26.0, 25.0, 24.0, 27.0, 47.0, 45.0, 38.0, 41.0, 53.0, 51.0, 45.0, 50.0, 50.0, 40.0, 38.0, 32.0, 39.0, 26.0, 24.0, 22.0, 24.0, 19.0, 19.0, 15.0, 12.0, 12.0, 11.0, 9.0, 9.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.91668701171875, -7.6693115234375, -7.42193603515625, -7.174560546875, -6.92718505859375, -6.6798095703125, -6.43243408203125, -6.18505859375, -5.93768310546875, -5.6903076171875, -5.44293212890625, -5.195556640625, -4.94818115234375, -4.7008056640625, -4.45343017578125, -4.2060546875, -3.95867919921875, -3.7113037109375, -3.46392822265625, -3.216552734375, -2.96917724609375, -2.7218017578125, -2.47442626953125, -2.22705078125, -1.97967529296875, -1.7322998046875, -1.48492431640625, -1.237548828125, -0.99017333984375, -0.7427978515625, -0.49542236328125, -0.248046875, -0.00067138671875, 0.2467041015625, 0.49407958984375, 0.741455078125, 0.98883056640625, 1.2362060546875, 1.48358154296875, 1.73095703125, 1.97833251953125, 2.2257080078125, 2.47308349609375, 2.720458984375, 2.96783447265625, 3.2152099609375, 3.46258544921875, 3.7099609375, 3.95733642578125, 4.2047119140625, 4.45208740234375, 4.699462890625, 4.94683837890625, 5.1942138671875, 5.44158935546875, 5.68896484375, 5.93634033203125, 6.1837158203125, 6.43109130859375, 6.678466796875, 6.92584228515625, 7.1732177734375, 7.42059326171875, 7.66796875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 14.0, 19.0, 36.0, 45.0, 80.0, 117.0, 155.0, 228.0, 394.0, 574.0, 894.0, 1485.0, 2153.0, 3373.0, 5291.0, 8311.0, 13126.0, 21404.0, 35959.0, 63905.0, 129168.0, 284219.0, 234248.0, 105649.0, 55294.0, 31489.0, 18654.0, 11749.0, 7357.0, 4755.0, 3036.0, 1850.0, 1158.0, 793.0, 510.0, 339.0, 234.0, 137.0, 108.0, 73.0, 47.0, 39.0, 25.0, 14.0, 9.0, 11.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.3828125, -1.3407440185546875, -1.298675537109375, -1.2566070556640625, -1.21453857421875, -1.1724700927734375, -1.130401611328125, -1.0883331298828125, -1.0462646484375, -1.0041961669921875, -0.962127685546875, -0.9200592041015625, -0.87799072265625, -0.8359222412109375, -0.793853759765625, -0.7517852783203125, -0.709716796875, -0.6676483154296875, -0.625579833984375, -0.5835113525390625, -0.54144287109375, -0.4993743896484375, -0.457305908203125, -0.4152374267578125, -0.3731689453125, -0.3311004638671875, -0.289031982421875, -0.2469635009765625, -0.20489501953125, -0.1628265380859375, -0.120758056640625, -0.0786895751953125, -0.03662109375, 0.0054473876953125, 0.047515869140625, 0.0895843505859375, 0.13165283203125, 0.1737213134765625, 0.215789794921875, 0.2578582763671875, 0.2999267578125, 0.3419952392578125, 0.384063720703125, 0.4261322021484375, 0.46820068359375, 0.5102691650390625, 0.552337646484375, 0.5944061279296875, 0.636474609375, 0.6785430908203125, 0.720611572265625, 0.7626800537109375, 0.80474853515625, 0.8468170166015625, 0.888885498046875, 0.9309539794921875, 0.9730224609375, 1.0150909423828125, 1.057159423828125, 1.0992279052734375, 1.14129638671875, 1.1833648681640625, 1.225433349609375, 1.2675018310546875, 1.3095703125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 8.0, 12.0, 12.0, 17.0, 20.0, 17.0, 26.0, 26.0, 28.0, 42.0, 39.0, 52.0, 41.0, 49.0, 57.0, 1079.0, 47.0, 56.0, 55.0, 52.0, 42.0, 33.0, 42.0, 33.0, 31.0, 20.0, 18.0, 20.0, 13.0, 10.0, 7.0, 5.0, 8.0, 4.0, 0.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55859375, -5.37628173828125, -5.1939697265625, -5.01165771484375, -4.829345703125, -4.64703369140625, -4.4647216796875, -4.28240966796875, -4.10009765625, -3.91778564453125, -3.7354736328125, -3.55316162109375, -3.370849609375, -3.18853759765625, -3.0062255859375, -2.82391357421875, -2.6416015625, -2.45928955078125, -2.2769775390625, -2.09466552734375, -1.912353515625, -1.73004150390625, -1.5477294921875, -1.36541748046875, -1.18310546875, -1.00079345703125, -0.8184814453125, -0.63616943359375, -0.453857421875, -0.27154541015625, -0.0892333984375, 0.09307861328125, 0.275390625, 0.45770263671875, 0.6400146484375, 0.82232666015625, 1.004638671875, 1.18695068359375, 1.3692626953125, 1.55157470703125, 1.73388671875, 1.91619873046875, 2.0985107421875, 2.28082275390625, 2.463134765625, 2.64544677734375, 2.8277587890625, 3.01007080078125, 3.1923828125, 3.37469482421875, 3.5570068359375, 3.73931884765625, 3.921630859375, 4.10394287109375, 4.2862548828125, 4.46856689453125, 4.65087890625, 4.83319091796875, 5.0155029296875, 5.19781494140625, 5.380126953125, 5.56243896484375, 5.7447509765625, 5.92706298828125, 6.109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 12.0, 4.0, 16.0, 22.0, 28.0, 35.0, 49.0, 64.0, 110.0, 173.0, 250.0, 376.0, 593.0, 969.0, 1508.0, 2379.0, 4037.0, 6835.0, 11490.0, 20514.0, 36601.0, 69756.0, 148392.0, 1373697.0, 212732.0, 94673.0, 48279.0, 26180.0, 15050.0, 8637.0, 5152.0, 3080.0, 2078.0, 1121.0, 736.0, 492.0, 330.0, 241.0, 139.0, 117.0, 58.0, 55.0, 34.0, 10.0, 9.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.548828125, -1.5014801025390625, -1.454132080078125, -1.4067840576171875, -1.35943603515625, -1.3120880126953125, -1.264739990234375, -1.2173919677734375, -1.1700439453125, -1.1226959228515625, -1.075347900390625, -1.0279998779296875, -0.98065185546875, -0.9333038330078125, -0.885955810546875, -0.8386077880859375, -0.791259765625, -0.7439117431640625, -0.696563720703125, -0.6492156982421875, -0.60186767578125, -0.5545196533203125, -0.507171630859375, -0.4598236083984375, -0.4124755859375, -0.3651275634765625, -0.317779541015625, -0.2704315185546875, -0.22308349609375, -0.1757354736328125, -0.128387451171875, -0.0810394287109375, -0.03369140625, 0.0136566162109375, 0.061004638671875, 0.1083526611328125, 0.15570068359375, 0.2030487060546875, 0.250396728515625, 0.2977447509765625, 0.3450927734375, 0.3924407958984375, 0.439788818359375, 0.4871368408203125, 0.53448486328125, 0.5818328857421875, 0.629180908203125, 0.6765289306640625, 0.723876953125, 0.7712249755859375, 0.818572998046875, 0.8659210205078125, 0.91326904296875, 0.9606170654296875, 1.007965087890625, 1.0553131103515625, 1.1026611328125, 1.1500091552734375, 1.197357177734375, 1.2447052001953125, 1.29205322265625, 1.3394012451171875, 1.386749267578125, 1.4340972900390625, 1.4814453125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 9.0, 7.0, 5.0, 7.0, 9.0, 19.0, 25.0, 24.0, 29.0, 26.0, 45.0, 52.0, 61.0, 69.0, 88.0, 63.0, 69.0, 56.0, 56.0, 54.0, 37.0, 33.0, 28.0, 22.0, 19.0, 19.0, 11.0, 7.0, 5.0, 10.0, 6.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009107589721679688, -0.0008774846792221069, -0.0008442103862762451, -0.0008109360933303833, -0.0007776618003845215, -0.0007443875074386597, -0.0007111132144927979, -0.000677838921546936, -0.0006445646286010742, -0.0006112903356552124, -0.0005780160427093506, -0.0005447417497634888, -0.000511467456817627, -0.00047819316387176514, -0.0004449188709259033, -0.0004116445779800415, -0.0003783702850341797, -0.00034509599208831787, -0.00031182169914245605, -0.00027854740619659424, -0.0002452731132507324, -0.0002119988203048706, -0.0001787245273590088, -0.00014545023441314697, -0.00011217594146728516, -7.890164852142334e-05, -4.5627355575561523e-05, -1.2353062629699707e-05, 2.092123031616211e-05, 5.4195523262023926e-05, 8.746981620788574e-05, 0.00012074410915374756, 0.00015401840209960938, 0.0001872926950454712, 0.000220566987991333, 0.0002538412809371948, 0.00028711557388305664, 0.00032038986682891846, 0.0003536641597747803, 0.0003869384527206421, 0.0004202127456665039, 0.0004534870386123657, 0.00048676133155822754, 0.0005200356245040894, 0.0005533099174499512, 0.000586584210395813, 0.0006198585033416748, 0.0006531327962875366, 0.0006864070892333984, 0.0007196813821792603, 0.0007529556751251221, 0.0007862299680709839, 0.0008195042610168457, 0.0008527785539627075, 0.0008860528469085693, 0.0009193271398544312, 0.000952601432800293, 0.0009858757257461548, 0.0010191500186920166, 0.0010524243116378784, 0.0010856986045837402, 0.001118972897529602, 0.0011522471904754639, 0.0011855214834213257, 0.0012187957763671875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 10.0, 13.0, 8.0, 9.0, 13.0, 16.0, 23.0, 28.0, 24.0, 55.0, 61.0, 94.0, 150.0, 217.0, 499.0, 4221.0, 1005664.0, 35885.0, 761.0, 259.0, 152.0, 120.0, 59.0, 50.0, 35.0, 30.0, 28.0, 7.0, 15.0, 11.0, 6.0, 6.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.02899169921875, -0.028241872787475586, -0.027492046356201172, -0.026742219924926758, -0.025992393493652344, -0.02524256706237793, -0.024492740631103516, -0.0237429141998291, -0.022993087768554688, -0.022243261337280273, -0.02149343490600586, -0.020743608474731445, -0.01999378204345703, -0.019243955612182617, -0.018494129180908203, -0.01774430274963379, -0.016994476318359375, -0.01624464988708496, -0.015494823455810547, -0.014744997024536133, -0.013995170593261719, -0.013245344161987305, -0.01249551773071289, -0.011745691299438477, -0.010995864868164062, -0.010246038436889648, -0.009496212005615234, -0.00874638557434082, -0.007996559143066406, -0.007246732711791992, -0.006496906280517578, -0.005747079849243164, -0.00499725341796875, -0.004247426986694336, -0.003497600555419922, -0.002747774124145508, -0.0019979476928710938, -0.0012481212615966797, -0.0004982948303222656, 0.00025153160095214844, 0.0010013580322265625, 0.0017511844635009766, 0.0025010108947753906, 0.0032508373260498047, 0.004000663757324219, 0.004750490188598633, 0.005500316619873047, 0.006250143051147461, 0.006999969482421875, 0.007749795913696289, 0.008499622344970703, 0.009249448776245117, 0.009999275207519531, 0.010749101638793945, 0.01149892807006836, 0.012248754501342773, 0.012998580932617188, 0.013748407363891602, 0.014498233795166016, 0.01524806022644043, 0.015997886657714844, 0.016747713088989258, 0.017497539520263672, 0.018247365951538086, 0.0189971923828125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 75.0, 382.0, 413.0, 124.0, 15.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005713447462767363, -0.005609740503132343, -0.005506033543497324, -0.005402327049523592, -0.005298620089888573, -0.005194913130253553, -0.005091206170618534, -0.004987499210983515, -0.004883792717009783, -0.0047800857573747635, -0.004676378797739744, -0.004572672303766012, -0.004468965344130993, -0.004365258384495974, -0.004261551424860954, -0.004157844465225935, -0.004054137505590916, -0.003950430545955896, -0.0038467238191515207, -0.0037430168595165014, -0.0036393101327121258, -0.0035356031730771065, -0.003431896213442087, -0.0033281894866377115, -0.003224482759833336, -0.0031207758001983166, -0.003017069073393941, -0.0029133621137589216, -0.002809655386954546, -0.0027059484273195267, -0.0026022414676845074, -0.0024985347408801317, -0.002394828014075756, -0.0022911210544407368, -0.002187414327636361, -0.002083707368001342, -0.001980000641196966, -0.0018762936815619469, -0.0017725868383422494, -0.001668879995122552, -0.0015651730354875326, -0.0014614661922678351, -0.0013577593490481377, -0.0012540523894131184, -0.0011503455461934209, -0.0010466387029737234, -0.0009429318597540259, -0.0008392249583266675, -0.0007355181151069701, -0.0006318112718872726, -0.0005281043704599142, -0.00042439752724021673, -0.0003206906549166888, -0.00021698378259316087, -0.00011327693937346339, -9.570037946105003e-06, 9.413680527359247e-05, 0.0001978436775971204, 0.00030155054992064834, 0.0004052573931403458, 0.0005089642945677042, 0.0006126711377874017, 0.0007163779810070992, 0.0008200848824344575, 0.000923791725654155]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 8.0, 9.0, 20.0, 14.0, 20.0, 19.0, 26.0, 20.0, 36.0, 34.0, 38.0, 29.0, 50.0, 34.0, 49.0, 42.0, 54.0, 38.0, 53.0, 48.0, 54.0, 52.0, 46.0, 31.0, 36.0, 19.0, 26.0, 20.0, 22.0, 12.0, 14.0, 7.0, 5.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005475878715515137, -0.0005288589745759964, -0.0005101300776004791, -0.0004914011806249619, -0.0004726722836494446, -0.0004539433866739273, -0.00043521448969841003, -0.00041648559272289276, -0.0003977566957473755, -0.0003790277987718582, -0.00036029890179634094, -0.00034157000482082367, -0.0003228411078453064, -0.0003041122108697891, -0.00028538331389427185, -0.0002666544169187546, -0.0002479255199432373, -0.00022919662296772003, -0.00021046772599220276, -0.00019173882901668549, -0.0001730099320411682, -0.00015428103506565094, -0.00013555213809013367, -0.0001168232411146164, -9.809434413909912e-05, -7.936544716358185e-05, -6.0636550188064575e-05, -4.19076532125473e-05, -2.317875623703003e-05, -4.449859261512756e-06, 1.4279037714004517e-05, 3.300793468952179e-05, 5.173683166503906e-05, 7.046572864055634e-05, 8.919462561607361e-05, 0.00010792352259159088, 0.00012665241956710815, 0.00014538131654262543, 0.0001641102135181427, 0.00018283911049365997, 0.00020156800746917725, 0.00022029690444469452, 0.0002390258014202118, 0.00025775469839572906, 0.00027648359537124634, 0.0002952124923467636, 0.0003139413893222809, 0.00033267028629779816, 0.00035139918327331543, 0.0003701280802488327, 0.00038885697722435, 0.00040758587419986725, 0.0004263147711753845, 0.0004450436681509018, 0.00046377256512641907, 0.00048250146210193634, 0.0005012303590774536, 0.0005199592560529709, 0.0005386881530284882, 0.0005574170500040054, 0.0005761459469795227, 0.00059487484395504, 0.0006136037409305573, 0.0006323326379060745, 0.0006510615348815918]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 8.0, 11.0, 28.0, 19.0, 20.0, 20.0, 26.0, 25.0, 24.0, 27.0, 47.0, 45.0, 38.0, 41.0, 53.0, 51.0, 45.0, 50.0, 50.0, 40.0, 38.0, 32.0, 39.0, 26.0, 24.0, 22.0, 24.0, 19.0, 19.0, 15.0, 12.0, 12.0, 11.0, 9.0, 9.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.91668701171875, -7.6693115234375, -7.42193603515625, -7.174560546875, -6.92718505859375, -6.6798095703125, -6.43243408203125, -6.18505859375, -5.93768310546875, -5.6903076171875, -5.44293212890625, -5.195556640625, -4.94818115234375, -4.7008056640625, -4.45343017578125, -4.2060546875, -3.95867919921875, -3.7113037109375, -3.46392822265625, -3.216552734375, -2.96917724609375, -2.7218017578125, -2.47442626953125, -2.22705078125, -1.97967529296875, -1.7322998046875, -1.48492431640625, -1.237548828125, -0.99017333984375, -0.7427978515625, -0.49542236328125, -0.248046875, -0.00067138671875, 0.2467041015625, 0.49407958984375, 0.741455078125, 0.98883056640625, 1.2362060546875, 1.48358154296875, 1.73095703125, 1.97833251953125, 2.2257080078125, 2.47308349609375, 2.720458984375, 2.96783447265625, 3.2152099609375, 3.46258544921875, 3.7099609375, 3.95733642578125, 4.2047119140625, 4.45208740234375, 4.699462890625, 4.94683837890625, 5.1942138671875, 5.44158935546875, 5.68896484375, 5.93634033203125, 6.1837158203125, 6.43109130859375, 6.678466796875, 6.92584228515625, 7.1732177734375, 7.42059326171875, 7.66796875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 6.0, 9.0, 16.0, 21.0, 29.0, 29.0, 50.0, 60.0, 81.0, 124.0, 182.0, 252.0, 514.0, 1166.0, 2692.0, 7204.0, 18658.0, 49658.0, 127337.0, 307680.0, 317178.0, 131817.0, 51451.0, 19365.0, 7593.0, 2815.0, 1136.0, 512.0, 285.0, 163.0, 87.0, 95.0, 68.0, 48.0, 40.0, 29.0, 24.0, 17.0, 17.0, 12.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1640625, -7.91680908203125, -7.6695556640625, -7.42230224609375, -7.175048828125, -6.92779541015625, -6.6805419921875, -6.43328857421875, -6.18603515625, -5.93878173828125, -5.6915283203125, -5.44427490234375, -5.197021484375, -4.94976806640625, -4.7025146484375, -4.45526123046875, -4.2080078125, -3.96075439453125, -3.7135009765625, -3.46624755859375, -3.218994140625, -2.97174072265625, -2.7244873046875, -2.47723388671875, -2.22998046875, -1.98272705078125, -1.7354736328125, -1.48822021484375, -1.240966796875, -0.99371337890625, -0.7464599609375, -0.49920654296875, -0.251953125, -0.00469970703125, 0.2425537109375, 0.48980712890625, 0.737060546875, 0.98431396484375, 1.2315673828125, 1.47882080078125, 1.72607421875, 1.97332763671875, 2.2205810546875, 2.46783447265625, 2.715087890625, 2.96234130859375, 3.2095947265625, 3.45684814453125, 3.7041015625, 3.95135498046875, 4.1986083984375, 4.44586181640625, 4.693115234375, 4.94036865234375, 5.1876220703125, 5.43487548828125, 5.68212890625, 5.92938232421875, 6.1766357421875, 6.42388916015625, 6.671142578125, 6.91839599609375, 7.1656494140625, 7.41290283203125, 7.66015625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 8.0, 9.0, 11.0, 11.0, 8.0, 16.0, 19.0, 15.0, 19.0, 26.0, 25.0, 27.0, 32.0, 33.0, 43.0, 41.0, 51.0, 89.0, 190.0, 1519.0, 306.0, 118.0, 55.0, 48.0, 37.0, 37.0, 32.0, 35.0, 33.0, 26.0, 20.0, 23.0, 15.0, 11.0, 19.0, 9.0, 4.0, 10.0, 2.0, 4.0, 0.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-26.5, -25.73583984375, -24.9716796875, -24.20751953125, -23.443359375, -22.67919921875, -21.9150390625, -21.15087890625, -20.38671875, -19.62255859375, -18.8583984375, -18.09423828125, -17.330078125, -16.56591796875, -15.8017578125, -15.03759765625, -14.2734375, -13.50927734375, -12.7451171875, -11.98095703125, -11.216796875, -10.45263671875, -9.6884765625, -8.92431640625, -8.16015625, -7.39599609375, -6.6318359375, -5.86767578125, -5.103515625, -4.33935546875, -3.5751953125, -2.81103515625, -2.046875, -1.28271484375, -0.5185546875, 0.24560546875, 1.009765625, 1.77392578125, 2.5380859375, 3.30224609375, 4.06640625, 4.83056640625, 5.5947265625, 6.35888671875, 7.123046875, 7.88720703125, 8.6513671875, 9.41552734375, 10.1796875, 10.94384765625, 11.7080078125, 12.47216796875, 13.236328125, 14.00048828125, 14.7646484375, 15.52880859375, 16.29296875, 17.05712890625, 17.8212890625, 18.58544921875, 19.349609375, 20.11376953125, 20.8779296875, 21.64208984375, 22.40625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 1.0, 5.0, 4.0, 7.0, 6.0, 10.0, 11.0, 15.0, 18.0, 24.0, 33.0, 50.0, 75.0, 105.0, 170.0, 344.0, 819.0, 4888.0, 3126805.0, 10299.0, 1036.0, 374.0, 198.0, 125.0, 74.0, 55.0, 33.0, 31.0, 24.0, 14.0, 13.0, 7.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-136.75, -133.01171875, -129.2734375, -125.53515625, -121.796875, -118.05859375, -114.3203125, -110.58203125, -106.84375, -103.10546875, -99.3671875, -95.62890625, -91.890625, -88.15234375, -84.4140625, -80.67578125, -76.9375, -73.19921875, -69.4609375, -65.72265625, -61.984375, -58.24609375, -54.5078125, -50.76953125, -47.03125, -43.29296875, -39.5546875, -35.81640625, -32.078125, -28.33984375, -24.6015625, -20.86328125, -17.125, -13.38671875, -9.6484375, -5.91015625, -2.171875, 1.56640625, 5.3046875, 9.04296875, 12.78125, 16.51953125, 20.2578125, 23.99609375, 27.734375, 31.47265625, 35.2109375, 38.94921875, 42.6875, 46.42578125, 50.1640625, 53.90234375, 57.640625, 61.37890625, 65.1171875, 68.85546875, 72.59375, 76.33203125, 80.0703125, 83.80859375, 87.546875, 91.28515625, 95.0234375, 98.76171875, 102.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 64.0, 373.0, 462.0, 102.0, 8.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-237.55494689941406, -233.31671142578125, -229.0784912109375, -224.8402557373047, -220.60203552246094, -216.36380004882812, -212.12557983398438, -207.88734436035156, -203.6491241455078, -199.410888671875, -195.17266845703125, -190.93443298339844, -186.6962127685547, -182.45797729492188, -178.21975708007812, -173.9815216064453, -169.7432861328125, -165.5050506591797, -161.26683044433594, -157.02859497070312, -152.79037475585938, -148.55213928222656, -144.3139190673828, -140.07568359375, -135.83746337890625, -131.59922790527344, -127.36100769042969, -123.1227798461914, -118.88455200195312, -114.64632415771484, -110.40809631347656, -106.16986083984375, -101.93163299560547, -97.69340515136719, -93.4551773071289, -89.21694946289062, -84.97872161865234, -80.74049377441406, -76.50225830078125, -72.2640380859375, -68.02580261230469, -63.787574768066406, -59.549346923828125, -55.311119079589844, -51.07289123535156, -46.83466339111328, -42.596431732177734, -38.35820388793945, -34.11997985839844, -29.881752014160156, -25.643524169921875, -21.40529441833496, -17.16706657409668, -12.928838729858398, -8.690608978271484, -4.452381134033203, -0.21415328979492188, 4.024075031280518, 8.262303352355957, 12.500532150268555, 16.738759994506836, 20.976987838745117, 25.21521759033203, 29.453445434570312, 33.691673278808594]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 10.0, 13.0, 10.0, 23.0, 13.0, 13.0, 16.0, 24.0, 31.0, 20.0, 37.0, 33.0, 21.0, 27.0, 32.0, 37.0, 39.0, 46.0, 53.0, 41.0, 54.0, 41.0, 35.0, 26.0, 42.0, 34.0, 29.0, 28.0, 21.0, 22.0, 17.0, 13.0, 14.0, 17.0, 14.0, 10.0, 12.0, 8.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.984249114990234, -49.09490203857422, -47.2055549621582, -45.31620788574219, -43.426856994628906, -41.537513732910156, -39.648162841796875, -37.75881576538086, -35.869468688964844, -33.98012161254883, -32.09077453613281, -30.201425552368164, -28.31207847595215, -26.422731399536133, -24.533382415771484, -22.64403533935547, -20.754688262939453, -18.865341186523438, -16.975994110107422, -15.086645126342773, -13.197298049926758, -11.307950973510742, -9.41860294342041, -7.529254913330078, -5.6399078369140625, -3.7505602836608887, -1.8612127304077148, 0.028134822845458984, 1.9174823760986328, 3.8068294525146484, 5.6961774826049805, 7.5855255126953125, 9.474868774414062, 11.364215850830078, 13.25356388092041, 15.142911911010742, 17.032258987426758, 18.921606063842773, 20.810955047607422, 22.700302124023438, 24.589649200439453, 26.47899627685547, 28.368343353271484, 30.257692337036133, 32.14704132080078, 34.03638458251953, 35.92573547363281, 37.81508255004883, 39.704429626464844, 41.59377670288086, 43.483123779296875, 45.37247085571289, 47.261817932128906, 49.15116882324219, 51.0405158996582, 52.92986297607422, 54.819210052490234, 56.70855712890625, 58.597904205322266, 60.48725128173828, 62.37660217285156, 64.26594543457031, 66.1552963256836, 68.04464721679688, 69.93399047851562]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 6.0, 9.0, 9.0, 10.0, 23.0, 14.0, 18.0, 22.0, 24.0, 31.0, 46.0, 34.0, 31.0, 33.0, 31.0, 35.0, 60.0, 58.0, 40.0, 53.0, 52.0, 43.0, 29.0, 36.0, 26.0, 31.0, 33.0, 23.0, 25.0, 19.0, 15.0, 11.0, 18.0, 12.0, 11.0, 9.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.08837890625, -7.8095703125, -7.53076171875, -7.251953125, -6.97314453125, -6.6943359375, -6.41552734375, -6.13671875, -5.85791015625, -5.5791015625, -5.30029296875, -5.021484375, -4.74267578125, -4.4638671875, -4.18505859375, -3.90625, -3.62744140625, -3.3486328125, -3.06982421875, -2.791015625, -2.51220703125, -2.2333984375, -1.95458984375, -1.67578125, -1.39697265625, -1.1181640625, -0.83935546875, -0.560546875, -0.28173828125, -0.0029296875, 0.27587890625, 0.5546875, 0.83349609375, 1.1123046875, 1.39111328125, 1.669921875, 1.94873046875, 2.2275390625, 2.50634765625, 2.78515625, 3.06396484375, 3.3427734375, 3.62158203125, 3.900390625, 4.17919921875, 4.4580078125, 4.73681640625, 5.015625, 5.29443359375, 5.5732421875, 5.85205078125, 6.130859375, 6.40966796875, 6.6884765625, 6.96728515625, 7.24609375, 7.52490234375, 7.8037109375, 8.08251953125, 8.361328125, 8.64013671875, 8.9189453125, 9.19775390625, 9.4765625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 5.0, 4.0, 7.0, 9.0, 8.0, 19.0, 14.0, 27.0, 28.0, 39.0, 49.0, 59.0, 76.0, 99.0, 120.0, 178.0, 347.0, 1167.0, 17175.0, 1321643.0, 2781943.0, 67871.0, 2170.0, 415.0, 207.0, 135.0, 100.0, 78.0, 52.0, 44.0, 44.0, 37.0, 28.0, 21.0, 15.0, 20.0, 11.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.28125, -28.37060546875, -27.4599609375, -26.54931640625, -25.638671875, -24.72802734375, -23.8173828125, -22.90673828125, -21.99609375, -21.08544921875, -20.1748046875, -19.26416015625, -18.353515625, -17.44287109375, -16.5322265625, -15.62158203125, -14.7109375, -13.80029296875, -12.8896484375, -11.97900390625, -11.068359375, -10.15771484375, -9.2470703125, -8.33642578125, -7.42578125, -6.51513671875, -5.6044921875, -4.69384765625, -3.783203125, -2.87255859375, -1.9619140625, -1.05126953125, -0.140625, 0.77001953125, 1.6806640625, 2.59130859375, 3.501953125, 4.41259765625, 5.3232421875, 6.23388671875, 7.14453125, 8.05517578125, 8.9658203125, 9.87646484375, 10.787109375, 11.69775390625, 12.6083984375, 13.51904296875, 14.4296875, 15.34033203125, 16.2509765625, 17.16162109375, 18.072265625, 18.98291015625, 19.8935546875, 20.80419921875, 21.71484375, 22.62548828125, 23.5361328125, 24.44677734375, 25.357421875, 26.26806640625, 27.1787109375, 28.08935546875, 29.0]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 9.0, 12.0, 17.0, 31.0, 23.0, 40.0, 64.0, 95.0, 151.0, 182.0, 272.0, 396.0, 515.0, 477.0, 466.0, 355.0, 294.0, 201.0, 122.0, 89.0, 73.0, 50.0, 30.0, 29.0, 19.0, 18.0, 11.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0625, -16.537109375, -16.01171875, -15.486328125, -14.9609375, -14.435546875, -13.91015625, -13.384765625, -12.859375, -12.333984375, -11.80859375, -11.283203125, -10.7578125, -10.232421875, -9.70703125, -9.181640625, -8.65625, -8.130859375, -7.60546875, -7.080078125, -6.5546875, -6.029296875, -5.50390625, -4.978515625, -4.453125, -3.927734375, -3.40234375, -2.876953125, -2.3515625, -1.826171875, -1.30078125, -0.775390625, -0.25, 0.275390625, 0.80078125, 1.326171875, 1.8515625, 2.376953125, 2.90234375, 3.427734375, 3.953125, 4.478515625, 5.00390625, 5.529296875, 6.0546875, 6.580078125, 7.10546875, 7.630859375, 8.15625, 8.681640625, 9.20703125, 9.732421875, 10.2578125, 10.783203125, 11.30859375, 11.833984375, 12.359375, 12.884765625, 13.41015625, 13.935546875, 14.4609375, 14.986328125, 15.51171875, 16.037109375, 16.5625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 16.0, 14.0, 16.0, 30.0, 32.0, 44.0, 91.0, 113.0, 155.0, 257.0, 378.0, 644.0, 5624.0, 4026237.0, 158207.0, 1081.0, 450.0, 279.0, 193.0, 150.0, 76.0, 54.0, 26.0, 34.0, 23.0, 16.0, 6.0, 5.0, 7.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-87.1875, -84.439453125, -81.69140625, -78.943359375, -76.1953125, -73.447265625, -70.69921875, -67.951171875, -65.203125, -62.455078125, -59.70703125, -56.958984375, -54.2109375, -51.462890625, -48.71484375, -45.966796875, -43.21875, -40.470703125, -37.72265625, -34.974609375, -32.2265625, -29.478515625, -26.73046875, -23.982421875, -21.234375, -18.486328125, -15.73828125, -12.990234375, -10.2421875, -7.494140625, -4.74609375, -1.998046875, 0.75, 3.498046875, 6.24609375, 8.994140625, 11.7421875, 14.490234375, 17.23828125, 19.986328125, 22.734375, 25.482421875, 28.23046875, 30.978515625, 33.7265625, 36.474609375, 39.22265625, 41.970703125, 44.71875, 47.466796875, 50.21484375, 52.962890625, 55.7109375, 58.458984375, 61.20703125, 63.955078125, 66.703125, 69.451171875, 72.19921875, 74.947265625, 77.6953125, 80.443359375, 83.19140625, 85.939453125, 88.6875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 26.0, 157.0, 334.0, 320.0, 139.0, 32.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.1746368408203, -127.83661651611328, -122.49859619140625, -117.16058349609375, -111.82255554199219, -106.48454284667969, -101.14652252197266, -95.80850219726562, -90.4704818725586, -85.13246154785156, -79.79444122314453, -74.4564208984375, -69.118408203125, -63.7803840637207, -58.44236755371094, -53.104347229003906, -47.766326904296875, -42.428306579589844, -37.09028625488281, -31.752269744873047, -26.414249420166016, -21.076229095458984, -15.738212585449219, -10.400192260742188, -5.062171936035156, 0.2758474349975586, 5.613866806030273, 10.951885223388672, 16.289905548095703, 21.627925872802734, 26.9659423828125, 32.30396270751953, 37.641998291015625, 42.980018615722656, 48.31803894042969, 53.65605545043945, 58.994075775146484, 64.33209228515625, 69.67011260986328, 75.00813293457031, 80.34615325927734, 85.68417358398438, 91.0221939086914, 96.36021423339844, 101.69822692871094, 107.0362548828125, 112.374267578125, 117.71228790283203, 123.05030822753906, 128.38832092285156, 133.72634887695312, 139.06436157226562, 144.4023895263672, 149.7404022216797, 155.07843017578125, 160.41644287109375, 165.75445556640625, 171.09246826171875, 176.4304962158203, 181.7685089111328, 187.10653686523438, 192.44454956054688, 197.78256225585938, 203.12059020996094, 208.4586181640625]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 8.0, 10.0, 12.0, 8.0, 19.0, 16.0, 14.0, 19.0, 25.0, 31.0, 26.0, 34.0, 29.0, 36.0, 37.0, 41.0, 35.0, 35.0, 48.0, 35.0, 31.0, 49.0, 31.0, 26.0, 29.0, 38.0, 25.0, 31.0, 17.0, 23.0, 29.0, 16.0, 20.0, 11.0, 12.0, 15.0, 13.0, 5.0, 10.0, 8.0, 9.0, 4.0, 5.0, 5.0, 2.0, 0.0, 4.0, 0.0, 3.0], "bins": [-45.06654739379883, -43.75147247314453, -42.436397552490234, -41.12132263183594, -39.806251525878906, -38.49117660522461, -37.17610168457031, -35.861026763916016, -34.54595184326172, -33.23087692260742, -31.915802001953125, -30.60072898864746, -29.285654067993164, -27.970579147338867, -26.655506134033203, -25.340431213378906, -24.02535629272461, -22.710281372070312, -21.395206451416016, -20.08013343811035, -18.765058517456055, -17.449983596801758, -16.134910583496094, -14.819835662841797, -13.5047607421875, -12.189685821533203, -10.874611854553223, -9.559537887573242, -8.244462966918945, -6.929388523101807, -5.614314079284668, -4.2992401123046875, -2.9841690063476562, -1.6690945625305176, -0.3540201187133789, 0.9610543251037598, 2.2761287689208984, 3.591203212738037, 4.906277656555176, 6.221351623535156, 7.536426544189453, 8.85150146484375, 10.16657543182373, 11.481649398803711, 12.796724319458008, 14.111799240112305, 15.426873207092285, 16.741947174072266, 18.057022094726562, 19.37209701538086, 20.687171936035156, 22.00224494934082, 23.317319869995117, 24.632394790649414, 25.947467803955078, 27.262542724609375, 28.577617645263672, 29.89269256591797, 31.207767486572266, 32.52284240722656, 33.837913513183594, 35.15298843383789, 36.46806335449219, 37.783138275146484, 39.09821319580078]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 5.0, 5.0, 11.0, 12.0, 6.0, 15.0, 10.0, 16.0, 19.0, 24.0, 19.0, 34.0, 28.0, 35.0, 28.0, 39.0, 38.0, 54.0, 38.0, 31.0, 65.0, 51.0, 37.0, 33.0, 53.0, 33.0, 35.0, 38.0, 31.0, 25.0, 24.0, 16.0, 20.0, 18.0, 13.0, 9.0, 12.0, 13.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.6456298828125, -7.385009765625, -7.1243896484375, -6.86376953125, -6.6031494140625, -6.342529296875, -6.0819091796875, -5.8212890625, -5.5606689453125, -5.300048828125, -5.0394287109375, -4.77880859375, -4.5181884765625, -4.257568359375, -3.9969482421875, -3.736328125, -3.4757080078125, -3.215087890625, -2.9544677734375, -2.69384765625, -2.4332275390625, -2.172607421875, -1.9119873046875, -1.6513671875, -1.3907470703125, -1.130126953125, -0.8695068359375, -0.60888671875, -0.3482666015625, -0.087646484375, 0.1729736328125, 0.43359375, 0.6942138671875, 0.954833984375, 1.2154541015625, 1.47607421875, 1.7366943359375, 1.997314453125, 2.2579345703125, 2.5185546875, 2.7791748046875, 3.039794921875, 3.3004150390625, 3.56103515625, 3.8216552734375, 4.082275390625, 4.3428955078125, 4.603515625, 4.8641357421875, 5.124755859375, 5.3853759765625, 5.64599609375, 5.9066162109375, 6.167236328125, 6.4278564453125, 6.6884765625, 6.9490966796875, 7.209716796875, 7.4703369140625, 7.73095703125, 7.9915771484375, 8.252197265625, 8.5128173828125, 8.7734375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 6.0, 11.0, 15.0, 16.0, 28.0, 43.0, 52.0, 86.0, 148.0, 173.0, 304.0, 401.0, 597.0, 876.0, 1318.0, 1835.0, 2772.0, 4167.0, 6413.0, 10055.0, 15560.0, 24849.0, 41402.0, 72425.0, 140203.0, 294761.0, 197092.0, 95392.0, 52125.0, 31290.0, 19268.0, 11696.0, 7728.0, 5062.0, 3428.0, 2265.0, 1518.0, 984.0, 707.0, 422.0, 318.0, 215.0, 150.0, 118.0, 77.0, 70.0, 39.0, 25.0, 18.0, 12.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-1.427734375, -1.3853912353515625, -1.343048095703125, -1.3007049560546875, -1.25836181640625, -1.2160186767578125, -1.173675537109375, -1.1313323974609375, -1.0889892578125, -1.0466461181640625, -1.004302978515625, -0.9619598388671875, -0.91961669921875, -0.8772735595703125, -0.834930419921875, -0.7925872802734375, -0.750244140625, -0.7079010009765625, -0.665557861328125, -0.6232147216796875, -0.58087158203125, -0.5385284423828125, -0.496185302734375, -0.4538421630859375, -0.4114990234375, -0.3691558837890625, -0.326812744140625, -0.2844696044921875, -0.24212646484375, -0.1997833251953125, -0.157440185546875, -0.1150970458984375, -0.07275390625, -0.0304107666015625, 0.011932373046875, 0.0542755126953125, 0.09661865234375, 0.1389617919921875, 0.181304931640625, 0.2236480712890625, 0.2659912109375, 0.3083343505859375, 0.350677490234375, 0.3930206298828125, 0.43536376953125, 0.4777069091796875, 0.520050048828125, 0.5623931884765625, 0.604736328125, 0.6470794677734375, 0.689422607421875, 0.7317657470703125, 0.77410888671875, 0.8164520263671875, 0.858795166015625, 0.9011383056640625, 0.9434814453125, 0.9858245849609375, 1.028167724609375, 1.0705108642578125, 1.11285400390625, 1.1551971435546875, 1.197540283203125, 1.2398834228515625, 1.2822265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 10.0, 13.0, 16.0, 12.0, 13.0, 24.0, 23.0, 31.0, 38.0, 34.0, 43.0, 58.0, 45.0, 51.0, 64.0, 1070.0, 47.0, 48.0, 39.0, 42.0, 43.0, 40.0, 32.0, 24.0, 21.0, 28.0, 23.0, 12.0, 15.0, 12.0, 10.0, 8.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2578125, -6.068115234375, -5.87841796875, -5.688720703125, -5.4990234375, -5.309326171875, -5.11962890625, -4.929931640625, -4.740234375, -4.550537109375, -4.36083984375, -4.171142578125, -3.9814453125, -3.791748046875, -3.60205078125, -3.412353515625, -3.22265625, -3.032958984375, -2.84326171875, -2.653564453125, -2.4638671875, -2.274169921875, -2.08447265625, -1.894775390625, -1.705078125, -1.515380859375, -1.32568359375, -1.135986328125, -0.9462890625, -0.756591796875, -0.56689453125, -0.377197265625, -0.1875, 0.002197265625, 0.19189453125, 0.381591796875, 0.5712890625, 0.760986328125, 0.95068359375, 1.140380859375, 1.330078125, 1.519775390625, 1.70947265625, 1.899169921875, 2.0888671875, 2.278564453125, 2.46826171875, 2.657958984375, 2.84765625, 3.037353515625, 3.22705078125, 3.416748046875, 3.6064453125, 3.796142578125, 3.98583984375, 4.175537109375, 4.365234375, 4.554931640625, 4.74462890625, 4.934326171875, 5.1240234375, 5.313720703125, 5.50341796875, 5.693115234375, 5.8828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 14.0, 13.0, 28.0, 48.0, 51.0, 87.0, 143.0, 199.0, 323.0, 443.0, 631.0, 993.0, 1545.0, 2428.0, 3757.0, 6184.0, 9775.0, 16034.0, 27539.0, 47943.0, 92159.0, 202189.0, 1364343.0, 151787.0, 72142.0, 38473.0, 22278.0, 13460.0, 8182.0, 4976.0, 3195.0, 1984.0, 1280.0, 828.0, 533.0, 348.0, 223.0, 177.0, 110.0, 93.0, 61.0, 31.0, 25.0, 23.0, 11.0, 16.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5244140625, -1.4757537841796875, -1.427093505859375, -1.3784332275390625, -1.32977294921875, -1.2811126708984375, -1.232452392578125, -1.1837921142578125, -1.1351318359375, -1.0864715576171875, -1.037811279296875, -0.9891510009765625, -0.94049072265625, -0.8918304443359375, -0.843170166015625, -0.7945098876953125, -0.745849609375, -0.6971893310546875, -0.648529052734375, -0.5998687744140625, -0.55120849609375, -0.5025482177734375, -0.453887939453125, -0.4052276611328125, -0.3565673828125, -0.3079071044921875, -0.259246826171875, -0.2105865478515625, -0.16192626953125, -0.1132659912109375, -0.064605712890625, -0.0159454345703125, 0.03271484375, 0.0813751220703125, 0.130035400390625, 0.1786956787109375, 0.22735595703125, 0.2760162353515625, 0.324676513671875, 0.3733367919921875, 0.4219970703125, 0.4706573486328125, 0.519317626953125, 0.5679779052734375, 0.61663818359375, 0.6652984619140625, 0.713958740234375, 0.7626190185546875, 0.811279296875, 0.8599395751953125, 0.908599853515625, 0.9572601318359375, 1.00592041015625, 1.0545806884765625, 1.103240966796875, 1.1519012451171875, 1.2005615234375, 1.2492218017578125, 1.297882080078125, 1.3465423583984375, 1.39520263671875, 1.4438629150390625, 1.492523193359375, 1.5411834716796875, 1.58984375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 11.0, 14.0, 14.0, 26.0, 18.0, 23.0, 28.0, 53.0, 56.0, 63.0, 86.0, 72.0, 73.0, 79.0, 81.0, 68.0, 42.0, 32.0, 33.0, 20.0, 14.0, 25.0, 9.0, 13.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00217437744140625, -0.0021089017391204834, -0.002043426036834717, -0.00197795033454895, -0.0019124746322631836, -0.001846998929977417, -0.0017815232276916504, -0.0017160475254058838, -0.0016505718231201172, -0.0015850961208343506, -0.001519620418548584, -0.0014541447162628174, -0.0013886690139770508, -0.0013231933116912842, -0.0012577176094055176, -0.001192241907119751, -0.0011267662048339844, -0.0010612905025482178, -0.0009958148002624512, -0.0009303390979766846, -0.000864863395690918, -0.0007993876934051514, -0.0007339119911193848, -0.0006684362888336182, -0.0006029605865478516, -0.000537484884262085, -0.00047200918197631836, -0.00040653347969055176, -0.00034105777740478516, -0.00027558207511901855, -0.00021010637283325195, -0.00014463067054748535, -7.915496826171875e-05, -1.3679265975952148e-05, 5.179643630981445e-05, 0.00011727213859558105, 0.00018274784088134766, 0.00024822354316711426, 0.00031369924545288086, 0.00037917494773864746, 0.00044465065002441406, 0.0005101263523101807, 0.0005756020545959473, 0.0006410777568817139, 0.0007065534591674805, 0.0007720291614532471, 0.0008375048637390137, 0.0009029805660247803, 0.0009684562683105469, 0.0010339319705963135, 0.00109940767288208, 0.0011648833751678467, 0.0012303590774536133, 0.0012958347797393799, 0.0013613104820251465, 0.001426786184310913, 0.0014922618865966797, 0.0015577375888824463, 0.0016232132911682129, 0.0016886889934539795, 0.001754164695739746, 0.0018196403980255127, 0.0018851161003112793, 0.001950591802597046, 0.0020160675048828125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 4.0, 12.0, 9.0, 9.0, 12.0, 26.0, 29.0, 36.0, 51.0, 64.0, 77.0, 160.0, 299.0, 598.0, 4036.0, 1038127.0, 3578.0, 633.0, 262.0, 154.0, 99.0, 70.0, 39.0, 40.0, 31.0, 27.0, 13.0, 15.0, 10.0, 8.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.045654296875, -0.044291019439697266, -0.04292774200439453, -0.0415644645690918, -0.04020118713378906, -0.03883790969848633, -0.037474632263183594, -0.03611135482788086, -0.034748077392578125, -0.03338479995727539, -0.032021522521972656, -0.030658245086669922, -0.029294967651367188, -0.027931690216064453, -0.02656841278076172, -0.025205135345458984, -0.02384185791015625, -0.022478580474853516, -0.02111530303955078, -0.019752025604248047, -0.018388748168945312, -0.017025470733642578, -0.015662193298339844, -0.01429891586303711, -0.012935638427734375, -0.01157236099243164, -0.010209083557128906, -0.008845806121826172, -0.0074825286865234375, -0.006119251251220703, -0.004755973815917969, -0.0033926963806152344, -0.0020294189453125, -0.0006661415100097656, 0.0006971359252929688, 0.002060413360595703, 0.0034236907958984375, 0.004786968231201172, 0.006150245666503906, 0.007513523101806641, 0.008876800537109375, 0.01024007797241211, 0.011603355407714844, 0.012966632843017578, 0.014329910278320312, 0.015693187713623047, 0.01705646514892578, 0.018419742584228516, 0.01978302001953125, 0.021146297454833984, 0.02250957489013672, 0.023872852325439453, 0.025236129760742188, 0.026599407196044922, 0.027962684631347656, 0.02932596206665039, 0.030689239501953125, 0.03205251693725586, 0.033415794372558594, 0.03477907180786133, 0.03614234924316406, 0.0375056266784668, 0.03886890411376953, 0.040232181549072266, 0.041595458984375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 7.0, 469.0, 531.0, 11.0], "bins": [-0.015552587807178497, -0.015301905572414398, -0.015051223337650299, -0.0148005411028862, -0.0145498588681221, -0.014299176633358002, -0.014048494398593903, -0.013797812163829803, -0.013547129929065704, -0.013296447694301605, -0.013045765459537506, -0.012795083224773407, -0.012544400990009308, -0.012293718755245209, -0.01204303652048111, -0.01179235428571701, -0.011541672050952911, -0.011290989816188812, -0.011040307581424713, -0.010789625346660614, -0.010538943111896515, -0.010288260877132416, -0.010037578642368317, -0.009786896407604218, -0.009536214172840118, -0.00928553193807602, -0.00903484970331192, -0.008784167468547821, -0.008533485233783722, -0.008282802999019623, -0.008032120764255524, -0.0077814385294914246, -0.0075307562947273254, -0.007280074059963226, -0.007029391825199127, -0.006778709590435028, -0.006528027355670929, -0.00627734512090683, -0.006026662886142731, -0.005775980651378632, -0.0055252984166145325, -0.005274616181850433, -0.005023933947086334, -0.004773251712322235, -0.004522569477558136, -0.004271887242794037, -0.004021205008029938, -0.0037705227732658386, -0.0035198405385017395, -0.0032691583037376404, -0.0030184760689735413, -0.002767793834209442, -0.002517111599445343, -0.002266429364681244, -0.0020157471299171448, -0.0017650648951530457, -0.0015143826603889465, -0.0012637004256248474, -0.0010130181908607483, -0.0007623359560966492, -0.00051165372133255, -0.00026097148656845093, -1.0289251804351807e-05, 0.00024039298295974731, 0.0004910752759315073]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 9.0, 6.0, 7.0, 5.0, 14.0, 11.0, 14.0, 24.0, 19.0, 22.0, 26.0, 18.0, 23.0, 34.0, 39.0, 46.0, 37.0, 30.0, 41.0, 45.0, 50.0, 43.0, 46.0, 33.0, 44.0, 35.0, 34.0, 25.0, 35.0, 32.0, 23.0, 21.0, 21.0, 14.0, 17.0, 8.0, 8.0, 6.0, 8.0, 7.0, 2.0, 3.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0009357929229736328, -0.00090755894780159, -0.0008793249726295471, -0.0008510909974575043, -0.0008228570222854614, -0.0007946230471134186, -0.0007663890719413757, -0.0007381550967693329, -0.00070992112159729, -0.0006816871464252472, -0.0006534531712532043, -0.0006252191960811615, -0.0005969852209091187, -0.0005687512457370758, -0.000540517270565033, -0.0005122832953929901, -0.00048404932022094727, -0.0004558153450489044, -0.00042758136987686157, -0.0003993473947048187, -0.0003711134195327759, -0.00034287944436073303, -0.0003146454691886902, -0.00028641149401664734, -0.0002581775188446045, -0.00022994354367256165, -0.0002017095685005188, -0.00017347559332847595, -0.0001452416181564331, -0.00011700764298439026, -8.877366781234741e-05, -6.0539692640304565e-05, -3.230571746826172e-05, -4.071742296218872e-06, 2.4162232875823975e-05, 5.239620804786682e-05, 8.063018321990967e-05, 0.00010886415839195251, 0.00013709813356399536, 0.0001653321087360382, 0.00019356608390808105, 0.0002218000590801239, 0.00025003403425216675, 0.0002782680094242096, 0.00030650198459625244, 0.0003347359597682953, 0.00036296993494033813, 0.000391203910112381, 0.00041943788528442383, 0.0004476718604564667, 0.0004759058356285095, 0.0005041398108005524, 0.0005323737859725952, 0.0005606077611446381, 0.0005888417363166809, 0.0006170757114887238, 0.0006453096866607666, 0.0006735436618328094, 0.0007017776370048523, 0.0007300116121768951, 0.000758245587348938, 0.0007864795625209808, 0.0008147135376930237, 0.0008429475128650665, 0.0008711814880371094]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 5.0, 5.0, 11.0, 12.0, 6.0, 15.0, 10.0, 16.0, 19.0, 24.0, 19.0, 34.0, 28.0, 35.0, 28.0, 39.0, 38.0, 54.0, 38.0, 31.0, 65.0, 51.0, 37.0, 33.0, 53.0, 33.0, 35.0, 38.0, 31.0, 25.0, 24.0, 16.0, 20.0, 18.0, 13.0, 9.0, 12.0, 13.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.6456298828125, -7.385009765625, -7.1243896484375, -6.86376953125, -6.6031494140625, -6.342529296875, -6.0819091796875, -5.8212890625, -5.5606689453125, -5.300048828125, -5.0394287109375, -4.77880859375, -4.5181884765625, -4.257568359375, -3.9969482421875, -3.736328125, -3.4757080078125, -3.215087890625, -2.9544677734375, -2.69384765625, -2.4332275390625, -2.172607421875, -1.9119873046875, -1.6513671875, -1.3907470703125, -1.130126953125, -0.8695068359375, -0.60888671875, -0.3482666015625, -0.087646484375, 0.1729736328125, 0.43359375, 0.6942138671875, 0.954833984375, 1.2154541015625, 1.47607421875, 1.7366943359375, 1.997314453125, 2.2579345703125, 2.5185546875, 2.7791748046875, 3.039794921875, 3.3004150390625, 3.56103515625, 3.8216552734375, 4.082275390625, 4.3428955078125, 4.603515625, 4.8641357421875, 5.124755859375, 5.3853759765625, 5.64599609375, 5.9066162109375, 6.167236328125, 6.4278564453125, 6.6884765625, 6.9490966796875, 7.209716796875, 7.4703369140625, 7.73095703125, 7.9915771484375, 8.252197265625, 8.5128173828125, 8.7734375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 10.0, 15.0, 10.0, 21.0, 16.0, 29.0, 42.0, 60.0, 79.0, 88.0, 120.0, 201.0, 327.0, 622.0, 1578.0, 8888.0, 68964.0, 562632.0, 353724.0, 42604.0, 5711.0, 1297.0, 517.0, 290.0, 196.0, 121.0, 97.0, 57.0, 61.0, 40.0, 23.0, 19.0, 15.0, 16.0, 11.0, 13.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.0946044921875, -14.572021484375, -14.0494384765625, -13.52685546875, -13.0042724609375, -12.481689453125, -11.9591064453125, -11.4365234375, -10.9139404296875, -10.391357421875, -9.8687744140625, -9.34619140625, -8.8236083984375, -8.301025390625, -7.7784423828125, -7.255859375, -6.7332763671875, -6.210693359375, -5.6881103515625, -5.16552734375, -4.6429443359375, -4.120361328125, -3.5977783203125, -3.0751953125, -2.5526123046875, -2.030029296875, -1.5074462890625, -0.98486328125, -0.4622802734375, 0.060302734375, 0.5828857421875, 1.10546875, 1.6280517578125, 2.150634765625, 2.6732177734375, 3.19580078125, 3.7183837890625, 4.240966796875, 4.7635498046875, 5.2861328125, 5.8087158203125, 6.331298828125, 6.8538818359375, 7.37646484375, 7.8990478515625, 8.421630859375, 8.9442138671875, 9.466796875, 9.9893798828125, 10.511962890625, 11.0345458984375, 11.55712890625, 12.0797119140625, 12.602294921875, 13.1248779296875, 13.6474609375, 14.1700439453125, 14.692626953125, 15.2152099609375, 15.73779296875, 16.2603759765625, 16.782958984375, 17.3055419921875, 17.828125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 5.0, 6.0, 10.0, 9.0, 8.0, 13.0, 14.0, 20.0, 21.0, 22.0, 30.0, 33.0, 35.0, 41.0, 44.0, 47.0, 76.0, 145.0, 343.0, 1470.0, 150.0, 85.0, 48.0, 50.0, 38.0, 46.0, 47.0, 39.0, 27.0, 19.0, 23.0, 23.0, 10.0, 12.0, 15.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.171875, -29.261474609375, -28.35107421875, -27.440673828125, -26.5302734375, -25.619873046875, -24.70947265625, -23.799072265625, -22.888671875, -21.978271484375, -21.06787109375, -20.157470703125, -19.2470703125, -18.336669921875, -17.42626953125, -16.515869140625, -15.60546875, -14.695068359375, -13.78466796875, -12.874267578125, -11.9638671875, -11.053466796875, -10.14306640625, -9.232666015625, -8.322265625, -7.411865234375, -6.50146484375, -5.591064453125, -4.6806640625, -3.770263671875, -2.85986328125, -1.949462890625, -1.0390625, -0.128662109375, 0.78173828125, 1.692138671875, 2.6025390625, 3.512939453125, 4.42333984375, 5.333740234375, 6.244140625, 7.154541015625, 8.06494140625, 8.975341796875, 9.8857421875, 10.796142578125, 11.70654296875, 12.616943359375, 13.52734375, 14.437744140625, 15.34814453125, 16.258544921875, 17.1689453125, 18.079345703125, 18.98974609375, 19.900146484375, 20.810546875, 21.720947265625, 22.63134765625, 23.541748046875, 24.4521484375, 25.362548828125, 26.27294921875, 27.183349609375, 28.09375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 8.0, 4.0, 5.0, 14.0, 27.0, 22.0, 41.0, 52.0, 67.0, 60.0, 121.0, 145.0, 273.0, 514.0, 1740.0, 998777.0, 2140545.0, 1937.0, 545.0, 239.0, 153.0, 114.0, 76.0, 53.0, 54.0, 26.0, 24.0, 19.0, 14.0, 15.0, 10.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-123.125, -119.609375, -116.09375, -112.578125, -109.0625, -105.546875, -102.03125, -98.515625, -95.0, -91.484375, -87.96875, -84.453125, -80.9375, -77.421875, -73.90625, -70.390625, -66.875, -63.359375, -59.84375, -56.328125, -52.8125, -49.296875, -45.78125, -42.265625, -38.75, -35.234375, -31.71875, -28.203125, -24.6875, -21.171875, -17.65625, -14.140625, -10.625, -7.109375, -3.59375, -0.078125, 3.4375, 6.953125, 10.46875, 13.984375, 17.5, 21.015625, 24.53125, 28.046875, 31.5625, 35.078125, 38.59375, 42.109375, 45.625, 49.140625, 52.65625, 56.171875, 59.6875, 63.203125, 66.71875, 70.234375, 73.75, 77.265625, 80.78125, 84.296875, 87.8125, 91.328125, 94.84375, 98.359375, 101.875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 11.0, 38.0, 87.0, 99.0, 133.0, 186.0, 158.0, 125.0, 89.0, 35.0, 26.0, 10.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.83781433105469, -48.67265319824219, -47.50749588012695, -46.34233474731445, -45.17717742919922, -44.01201629638672, -42.846858978271484, -41.681697845458984, -40.51654052734375, -39.35137939453125, -38.186222076416016, -37.021060943603516, -35.85590362548828, -34.69074249267578, -33.52558517456055, -32.36042404174805, -31.195262908935547, -30.03010368347168, -28.864944458007812, -27.699785232543945, -26.534626007080078, -25.369464874267578, -24.20430564880371, -23.039146423339844, -21.873987197875977, -20.70882797241211, -19.543668746948242, -18.378509521484375, -17.213348388671875, -16.04819107055664, -14.88302993774414, -13.717870712280273, -12.55270767211914, -11.387548446655273, -10.222389221191406, -9.057229042053223, -7.8920698165893555, -6.726910591125488, -5.561750888824463, -4.3965911865234375, -3.2314319610595703, -2.066272497177124, -0.9011130332946777, 0.26404643058776855, 1.4292058944702148, 2.594365119934082, 3.7595248222351074, 4.924684524536133, 6.08984375, 7.255002975463867, 8.420162200927734, 9.585322380065918, 10.750481605529785, 11.915640830993652, 13.080801010131836, 14.245960235595703, 15.41111946105957, 16.576278686523438, 17.741437911987305, 18.906597137451172, 20.071758270263672, 21.236915588378906, 22.402076721191406, 23.567235946655273, 24.73239517211914]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 4.0, 2.0, 5.0, 14.0, 15.0, 12.0, 12.0, 18.0, 20.0, 15.0, 23.0, 25.0, 30.0, 42.0, 38.0, 40.0, 41.0, 34.0, 49.0, 46.0, 36.0, 51.0, 47.0, 32.0, 34.0, 30.0, 25.0, 40.0, 31.0, 27.0, 16.0, 18.0, 18.0, 13.0, 8.0, 13.0, 10.0, 8.0, 11.0, 10.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.28593826293945, -60.176822662353516, -58.06770706176758, -55.95859146118164, -53.84947967529297, -51.74036407470703, -49.631248474121094, -47.522132873535156, -45.41301727294922, -43.30390167236328, -41.194786071777344, -39.085670471191406, -36.97655487060547, -34.86743927001953, -32.75832748413086, -30.649211883544922, -28.540096282958984, -26.430980682373047, -24.32186508178711, -22.212751388549805, -20.103635787963867, -17.99452018737793, -15.885405540466309, -13.776290893554688, -11.66717529296875, -9.558059692382812, -7.448945045471191, -5.339829921722412, -3.230714797973633, -1.1215991973876953, 0.9875154495239258, 3.096630096435547, 5.205741882324219, 7.314857006072998, 9.423972129821777, 11.533086776733398, 13.642202377319336, 15.751317977905273, 17.860431671142578, 19.969547271728516, 22.078662872314453, 24.18777847290039, 26.296894073486328, 28.406007766723633, 30.51512336730957, 32.624237060546875, 34.73335266113281, 36.84246826171875, 38.95158386230469, 41.060699462890625, 43.16981506347656, 45.2789306640625, 47.38804626464844, 49.497161865234375, 51.60627365112305, 53.715389251708984, 55.82450485229492, 57.93362045288086, 60.0427360534668, 62.151851654052734, 64.2609634399414, 66.37007904052734, 68.47919464111328, 70.58831024169922, 72.69742584228516]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 3.0, 6.0, 11.0, 9.0, 7.0, 14.0, 11.0, 20.0, 15.0, 31.0, 39.0, 29.0, 33.0, 32.0, 41.0, 51.0, 44.0, 55.0, 41.0, 46.0, 45.0, 39.0, 49.0, 45.0, 30.0, 36.0, 31.0, 32.0, 32.0, 20.0, 15.0, 16.0, 13.0, 13.0, 11.0, 16.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.883056640625, -8.57861328125, -8.274169921875, -7.9697265625, -7.665283203125, -7.36083984375, -7.056396484375, -6.751953125, -6.447509765625, -6.14306640625, -5.838623046875, -5.5341796875, -5.229736328125, -4.92529296875, -4.620849609375, -4.31640625, -4.011962890625, -3.70751953125, -3.403076171875, -3.0986328125, -2.794189453125, -2.48974609375, -2.185302734375, -1.880859375, -1.576416015625, -1.27197265625, -0.967529296875, -0.6630859375, -0.358642578125, -0.05419921875, 0.250244140625, 0.5546875, 0.859130859375, 1.16357421875, 1.468017578125, 1.7724609375, 2.076904296875, 2.38134765625, 2.685791015625, 2.990234375, 3.294677734375, 3.59912109375, 3.903564453125, 4.2080078125, 4.512451171875, 4.81689453125, 5.121337890625, 5.42578125, 5.730224609375, 6.03466796875, 6.339111328125, 6.6435546875, 6.947998046875, 7.25244140625, 7.556884765625, 7.861328125, 8.165771484375, 8.47021484375, 8.774658203125, 9.0791015625, 9.383544921875, 9.68798828125, 9.992431640625, 10.296875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 11.0, 11.0, 12.0, 26.0, 31.0, 37.0, 36.0, 66.0, 95.0, 192.0, 278.0, 555.0, 1290.0, 4653.0, 22428.0, 143420.0, 753887.0, 1770962.0, 1160574.0, 280041.0, 44218.0, 7836.0, 1992.0, 681.0, 360.0, 181.0, 118.0, 70.0, 57.0, 36.0, 28.0, 19.0, 22.0, 13.0, 10.0, 6.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4140625, -11.01611328125, -10.6181640625, -10.22021484375, -9.822265625, -9.42431640625, -9.0263671875, -8.62841796875, -8.23046875, -7.83251953125, -7.4345703125, -7.03662109375, -6.638671875, -6.24072265625, -5.8427734375, -5.44482421875, -5.046875, -4.64892578125, -4.2509765625, -3.85302734375, -3.455078125, -3.05712890625, -2.6591796875, -2.26123046875, -1.86328125, -1.46533203125, -1.0673828125, -0.66943359375, -0.271484375, 0.12646484375, 0.5244140625, 0.92236328125, 1.3203125, 1.71826171875, 2.1162109375, 2.51416015625, 2.912109375, 3.31005859375, 3.7080078125, 4.10595703125, 4.50390625, 4.90185546875, 5.2998046875, 5.69775390625, 6.095703125, 6.49365234375, 6.8916015625, 7.28955078125, 7.6875, 8.08544921875, 8.4833984375, 8.88134765625, 9.279296875, 9.67724609375, 10.0751953125, 10.47314453125, 10.87109375, 11.26904296875, 11.6669921875, 12.06494140625, 12.462890625, 12.86083984375, 13.2587890625, 13.65673828125, 14.0546875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 13.0, 14.0, 31.0, 39.0, 65.0, 67.0, 96.0, 166.0, 216.0, 304.0, 411.0, 498.0, 509.0, 457.0, 331.0, 243.0, 193.0, 115.0, 90.0, 66.0, 37.0, 32.0, 23.0, 21.0, 13.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.7080078125, -20.119140625, -19.5302734375, -18.94140625, -18.3525390625, -17.763671875, -17.1748046875, -16.5859375, -15.9970703125, -15.408203125, -14.8193359375, -14.23046875, -13.6416015625, -13.052734375, -12.4638671875, -11.875, -11.2861328125, -10.697265625, -10.1083984375, -9.51953125, -8.9306640625, -8.341796875, -7.7529296875, -7.1640625, -6.5751953125, -5.986328125, -5.3974609375, -4.80859375, -4.2197265625, -3.630859375, -3.0419921875, -2.453125, -1.8642578125, -1.275390625, -0.6865234375, -0.09765625, 0.4912109375, 1.080078125, 1.6689453125, 2.2578125, 2.8466796875, 3.435546875, 4.0244140625, 4.61328125, 5.2021484375, 5.791015625, 6.3798828125, 6.96875, 7.5576171875, 8.146484375, 8.7353515625, 9.32421875, 9.9130859375, 10.501953125, 11.0908203125, 11.6796875, 12.2685546875, 12.857421875, 13.4462890625, 14.03515625, 14.6240234375, 15.212890625, 15.8017578125, 16.390625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 16.0, 16.0, 31.0, 37.0, 57.0, 100.0, 169.0, 225.0, 382.0, 703.0, 1456.0, 8915.0, 3078949.0, 1095535.0, 4949.0, 1168.0, 618.0, 358.0, 204.0, 119.0, 104.0, 59.0, 38.0, 18.0, 20.0, 12.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.96875, -55.89111328125, -53.8134765625, -51.73583984375, -49.658203125, -47.58056640625, -45.5029296875, -43.42529296875, -41.34765625, -39.27001953125, -37.1923828125, -35.11474609375, -33.037109375, -30.95947265625, -28.8818359375, -26.80419921875, -24.7265625, -22.64892578125, -20.5712890625, -18.49365234375, -16.416015625, -14.33837890625, -12.2607421875, -10.18310546875, -8.10546875, -6.02783203125, -3.9501953125, -1.87255859375, 0.205078125, 2.28271484375, 4.3603515625, 6.43798828125, 8.515625, 10.59326171875, 12.6708984375, 14.74853515625, 16.826171875, 18.90380859375, 20.9814453125, 23.05908203125, 25.13671875, 27.21435546875, 29.2919921875, 31.36962890625, 33.447265625, 35.52490234375, 37.6025390625, 39.68017578125, 41.7578125, 43.83544921875, 45.9130859375, 47.99072265625, 50.068359375, 52.14599609375, 54.2236328125, 56.30126953125, 58.37890625, 60.45654296875, 62.5341796875, 64.61181640625, 66.689453125, 68.76708984375, 70.8447265625, 72.92236328125, 75.0]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 74.0, 455.0, 423.0, 56.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-369.5962219238281, -359.85150146484375, -350.1067810058594, -340.362060546875, -330.6173400878906, -320.87261962890625, -311.1278991699219, -301.3831787109375, -291.638427734375, -281.8937072753906, -272.14898681640625, -262.4042663574219, -252.6595458984375, -242.91482543945312, -233.1700897216797, -223.4253692626953, -213.6806640625, -203.93594360351562, -194.19122314453125, -184.44650268554688, -174.7017822265625, -164.95706176757812, -155.2123260498047, -145.4676055908203, -135.72288513183594, -125.97816467285156, -116.23344421386719, -106.48871612548828, -96.7439956665039, -86.99927520751953, -77.25454711914062, -67.50982666015625, -57.76509094238281, -48.02037048339844, -38.2756462097168, -28.53092384338379, -18.78620147705078, -9.041481018066406, 0.7032432556152344, 10.447967529296875, 20.19268798828125, 29.937410354614258, 39.682132720947266, 49.426856994628906, 59.17157745361328, 68.91629791259766, 78.66102600097656, 88.40574645996094, 98.15046691894531, 107.89518737792969, 117.63990783691406, 127.38463592529297, 137.12936401367188, 146.87408447265625, 156.61880493164062, 166.363525390625, 176.10824584960938, 185.85296630859375, 195.59768676757812, 205.3424072265625, 215.08712768554688, 224.83184814453125, 234.5765838623047, 244.32130432128906, 254.06602478027344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 3.0, 10.0, 4.0, 12.0, 9.0, 17.0, 14.0, 28.0, 21.0, 27.0, 22.0, 28.0, 33.0, 37.0, 41.0, 42.0, 42.0, 55.0, 44.0, 52.0, 45.0, 37.0, 38.0, 49.0, 46.0, 39.0, 39.0, 28.0, 26.0, 15.0, 22.0, 20.0, 13.0, 14.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.217674255371094, -54.34430694580078, -52.47093963623047, -50.59757614135742, -48.72420883178711, -46.8508415222168, -44.977474212646484, -43.10411071777344, -41.230743408203125, -39.35737609863281, -37.4840087890625, -35.61064529418945, -33.73727798461914, -31.863910675048828, -29.990543365478516, -28.117177963256836, -26.243810653686523, -24.37044334411621, -22.49707794189453, -20.62371063232422, -18.75034523010254, -16.876977920532227, -15.00361156463623, -13.130245208740234, -11.256878852844238, -9.383512496948242, -7.510146141052246, -5.636779308319092, -3.7634129524230957, -1.8900461196899414, -0.016679763793945312, 1.8566865921020508, 3.730052947998047, 5.603419303894043, 7.476785659790039, 9.350152969360352, 11.223518371582031, 13.096885681152344, 14.97025203704834, 16.843618392944336, 18.716983795166016, 20.590351104736328, 22.463716506958008, 24.33708381652832, 26.21044921875, 28.083816528320312, 29.957183837890625, 31.830549240112305, 33.70391845703125, 35.57728576660156, 37.450653076171875, 39.32401657104492, 41.197383880615234, 43.07075119018555, 44.94411849975586, 46.817481994628906, 48.69084930419922, 50.56421661376953, 52.437583923339844, 54.31094741821289, 56.1843147277832, 58.057682037353516, 59.93104934692383, 61.804412841796875, 63.67778015136719]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 10.0, 7.0, 7.0, 4.0, 7.0, 4.0, 12.0, 16.0, 10.0, 20.0, 12.0, 26.0, 19.0, 31.0, 25.0, 20.0, 30.0, 35.0, 26.0, 37.0, 39.0, 45.0, 38.0, 37.0, 39.0, 37.0, 32.0, 34.0, 34.0, 28.0, 25.0, 24.0, 25.0, 25.0, 23.0, 22.0, 25.0, 14.0, 15.0, 8.0, 10.0, 8.0, 13.0, 12.0, 5.0, 9.0, 3.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.13671875, -6.9102783203125, -6.683837890625, -6.4573974609375, -6.23095703125, -6.0045166015625, -5.778076171875, -5.5516357421875, -5.3251953125, -5.0987548828125, -4.872314453125, -4.6458740234375, -4.41943359375, -4.1929931640625, -3.966552734375, -3.7401123046875, -3.513671875, -3.2872314453125, -3.060791015625, -2.8343505859375, -2.60791015625, -2.3814697265625, -2.155029296875, -1.9285888671875, -1.7021484375, -1.4757080078125, -1.249267578125, -1.0228271484375, -0.79638671875, -0.5699462890625, -0.343505859375, -0.1170654296875, 0.109375, 0.3358154296875, 0.562255859375, 0.7886962890625, 1.01513671875, 1.2415771484375, 1.468017578125, 1.6944580078125, 1.9208984375, 2.1473388671875, 2.373779296875, 2.6002197265625, 2.82666015625, 3.0531005859375, 3.279541015625, 3.5059814453125, 3.732421875, 3.9588623046875, 4.185302734375, 4.4117431640625, 4.63818359375, 4.8646240234375, 5.091064453125, 5.3175048828125, 5.5439453125, 5.7703857421875, 5.996826171875, 6.2232666015625, 6.44970703125, 6.6761474609375, 6.902587890625, 7.1290283203125, 7.35546875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 8.0, 4.0, 6.0, 15.0, 16.0, 23.0, 34.0, 54.0, 93.0, 107.0, 151.0, 194.0, 317.0, 428.0, 652.0, 822.0, 1169.0, 1755.0, 2350.0, 3525.0, 5006.0, 7512.0, 10763.0, 16012.0, 24039.0, 37561.0, 60232.0, 102212.0, 189615.0, 244853.0, 130119.0, 74575.0, 45331.0, 29346.0, 18939.0, 12611.0, 8657.0, 5933.0, 3986.0, 2804.0, 2028.0, 1378.0, 954.0, 703.0, 526.0, 332.0, 223.0, 171.0, 124.0, 83.0, 76.0, 44.0, 33.0, 23.0, 12.0, 12.0, 8.0, 7.0, 3.0, 2.0, 1.0], "bins": [-1.2822265625, -1.2424163818359375, -1.202606201171875, -1.1627960205078125, -1.12298583984375, -1.0831756591796875, -1.043365478515625, -1.0035552978515625, -0.9637451171875, -0.9239349365234375, -0.884124755859375, -0.8443145751953125, -0.80450439453125, -0.7646942138671875, -0.724884033203125, -0.6850738525390625, -0.645263671875, -0.6054534912109375, -0.565643310546875, -0.5258331298828125, -0.48602294921875, -0.4462127685546875, -0.406402587890625, -0.3665924072265625, -0.3267822265625, -0.2869720458984375, -0.247161865234375, -0.2073516845703125, -0.16754150390625, -0.1277313232421875, -0.087921142578125, -0.0481109619140625, -0.00830078125, 0.0315093994140625, 0.071319580078125, 0.1111297607421875, 0.15093994140625, 0.1907501220703125, 0.230560302734375, 0.2703704833984375, 0.3101806640625, 0.3499908447265625, 0.389801025390625, 0.4296112060546875, 0.46942138671875, 0.5092315673828125, 0.549041748046875, 0.5888519287109375, 0.628662109375, 0.6684722900390625, 0.708282470703125, 0.7480926513671875, 0.78790283203125, 0.8277130126953125, 0.867523193359375, 0.9073333740234375, 0.9471435546875, 0.9869537353515625, 1.026763916015625, 1.0665740966796875, 1.10638427734375, 1.1461944580078125, 1.186004638671875, 1.2258148193359375, 1.265625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 3.0, 6.0, 5.0, 9.0, 8.0, 15.0, 12.0, 19.0, 15.0, 16.0, 31.0, 27.0, 35.0, 27.0, 45.0, 41.0, 39.0, 42.0, 32.0, 44.0, 1070.0, 29.0, 41.0, 26.0, 39.0, 56.0, 46.0, 31.0, 30.0, 19.0, 18.0, 24.0, 17.0, 23.0, 6.0, 18.0, 14.0, 11.0, 13.0, 5.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.67578125, -5.51507568359375, -5.3543701171875, -5.19366455078125, -5.032958984375, -4.87225341796875, -4.7115478515625, -4.55084228515625, -4.39013671875, -4.22943115234375, -4.0687255859375, -3.90802001953125, -3.747314453125, -3.58660888671875, -3.4259033203125, -3.26519775390625, -3.1044921875, -2.94378662109375, -2.7830810546875, -2.62237548828125, -2.461669921875, -2.30096435546875, -2.1402587890625, -1.97955322265625, -1.81884765625, -1.65814208984375, -1.4974365234375, -1.33673095703125, -1.176025390625, -1.01531982421875, -0.8546142578125, -0.69390869140625, -0.533203125, -0.37249755859375, -0.2117919921875, -0.05108642578125, 0.109619140625, 0.27032470703125, 0.4310302734375, 0.59173583984375, 0.75244140625, 0.91314697265625, 1.0738525390625, 1.23455810546875, 1.395263671875, 1.55596923828125, 1.7166748046875, 1.87738037109375, 2.0380859375, 2.19879150390625, 2.3594970703125, 2.52020263671875, 2.680908203125, 2.84161376953125, 3.0023193359375, 3.16302490234375, 3.32373046875, 3.48443603515625, 3.6451416015625, 3.80584716796875, 3.966552734375, 4.12725830078125, 4.2879638671875, 4.44866943359375, 4.609375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 5.0, 4.0, 7.0, 15.0, 8.0, 18.0, 38.0, 52.0, 64.0, 95.0, 158.0, 248.0, 326.0, 519.0, 807.0, 1174.0, 1875.0, 2954.0, 5013.0, 7907.0, 13062.0, 22663.0, 38811.0, 73257.0, 150688.0, 1361665.0, 203402.0, 93561.0, 48634.0, 27950.0, 16112.0, 10028.0, 6060.0, 3607.0, 2248.0, 1460.0, 895.0, 616.0, 385.0, 243.0, 160.0, 106.0, 83.0, 58.0, 37.0, 25.0, 10.0, 8.0, 8.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.458984375, -1.4098358154296875, -1.360687255859375, -1.3115386962890625, -1.26239013671875, -1.2132415771484375, -1.164093017578125, -1.1149444580078125, -1.0657958984375, -1.0166473388671875, -0.967498779296875, -0.9183502197265625, -0.86920166015625, -0.8200531005859375, -0.770904541015625, -0.7217559814453125, -0.672607421875, -0.6234588623046875, -0.574310302734375, -0.5251617431640625, -0.47601318359375, -0.4268646240234375, -0.377716064453125, -0.3285675048828125, -0.2794189453125, -0.2302703857421875, -0.181121826171875, -0.1319732666015625, -0.08282470703125, -0.0336761474609375, 0.015472412109375, 0.0646209716796875, 0.11376953125, 0.1629180908203125, 0.212066650390625, 0.2612152099609375, 0.31036376953125, 0.3595123291015625, 0.408660888671875, 0.4578094482421875, 0.5069580078125, 0.5561065673828125, 0.605255126953125, 0.6544036865234375, 0.70355224609375, 0.7527008056640625, 0.801849365234375, 0.8509979248046875, 0.900146484375, 0.9492950439453125, 0.998443603515625, 1.0475921630859375, 1.09674072265625, 1.1458892822265625, 1.195037841796875, 1.2441864013671875, 1.2933349609375, 1.3424835205078125, 1.391632080078125, 1.4407806396484375, 1.48992919921875, 1.5390777587890625, 1.588226318359375, 1.6373748779296875, 1.6865234375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 3.0, 2.0, 5.0, 4.0, 12.0, 10.0, 17.0, 19.0, 20.0, 15.0, 29.0, 36.0, 30.0, 38.0, 47.0, 44.0, 51.0, 60.0, 58.0, 61.0, 53.0, 65.0, 40.0, 49.0, 33.0, 27.0, 35.0, 21.0, 32.0, 20.0, 13.0, 12.0, 16.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0018796920776367188, -0.0018223077058792114, -0.001764923334121704, -0.0017075389623641968, -0.0016501545906066895, -0.0015927702188491821, -0.0015353858470916748, -0.0014780014753341675, -0.0014206171035766602, -0.0013632327318191528, -0.0013058483600616455, -0.0012484639883041382, -0.0011910796165466309, -0.0011336952447891235, -0.0010763108730316162, -0.0010189265012741089, -0.0009615421295166016, -0.0009041577577590942, -0.0008467733860015869, -0.0007893890142440796, -0.0007320046424865723, -0.0006746202707290649, -0.0006172358989715576, -0.0005598515272140503, -0.000502467155456543, -0.00044508278369903564, -0.0003876984119415283, -0.000330314040184021, -0.00027292966842651367, -0.00021554529666900635, -0.00015816092491149902, -0.0001007765531539917, -4.3392181396484375e-05, 1.399219036102295e-05, 7.137656211853027e-05, 0.0001287609338760376, 0.00018614530563354492, 0.00024352967739105225, 0.00030091404914855957, 0.0003582984209060669, 0.0004156827926635742, 0.00047306716442108154, 0.0005304515361785889, 0.0005878359079360962, 0.0006452202796936035, 0.0007026046514511108, 0.0007599890232086182, 0.0008173733949661255, 0.0008747577667236328, 0.0009321421384811401, 0.0009895265102386475, 0.0010469108819961548, 0.0011042952537536621, 0.0011616796255111694, 0.0012190639972686768, 0.001276448369026184, 0.0013338327407836914, 0.0013912171125411987, 0.001448601484298706, 0.0015059858560562134, 0.0015633702278137207, 0.001620754599571228, 0.0016781389713287354, 0.0017355233430862427, 0.00179290771484375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 2.0, 1.0, 3.0, 5.0, 4.0, 20.0, 9.0, 18.0, 17.0, 19.0, 37.0, 58.0, 55.0, 51.0, 77.0, 99.0, 143.0, 236.0, 488.0, 1087.0, 66765.0, 975921.0, 1832.0, 602.0, 317.0, 159.0, 101.0, 96.0, 56.0, 61.0, 49.0, 32.0, 25.0, 30.0, 18.0, 14.0, 7.0, 8.0, 7.0, 8.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.03546142578125, -0.03432464599609375, -0.0331878662109375, -0.03205108642578125, -0.030914306640625, -0.02977752685546875, -0.0286407470703125, -0.02750396728515625, -0.0263671875, -0.02523040771484375, -0.0240936279296875, -0.02295684814453125, -0.021820068359375, -0.02068328857421875, -0.0195465087890625, -0.01840972900390625, -0.01727294921875, -0.01613616943359375, -0.0149993896484375, -0.01386260986328125, -0.012725830078125, -0.01158905029296875, -0.0104522705078125, -0.00931549072265625, -0.0081787109375, -0.00704193115234375, -0.0059051513671875, -0.00476837158203125, -0.003631591796875, -0.00249481201171875, -0.0013580322265625, -0.00022125244140625, 0.00091552734375, 0.00205230712890625, 0.0031890869140625, 0.00432586669921875, 0.005462646484375, 0.00659942626953125, 0.0077362060546875, 0.00887298583984375, 0.010009765625, 0.01114654541015625, 0.0122833251953125, 0.01342010498046875, 0.014556884765625, 0.01569366455078125, 0.0168304443359375, 0.01796722412109375, 0.01910400390625, 0.02024078369140625, 0.0213775634765625, 0.02251434326171875, 0.023651123046875, 0.02478790283203125, 0.0259246826171875, 0.02706146240234375, 0.0281982421875, 0.02933502197265625, 0.0304718017578125, 0.03160858154296875, 0.032745361328125, 0.03388214111328125, 0.0350189208984375, 0.03615570068359375, 0.03729248046875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 54.0, 887.0, 70.0, 5.0], "bins": [-0.017986489459872246, -0.0176940206438303, -0.017401551827788353, -0.017109083011746407, -0.01681661419570446, -0.016524145379662514, -0.016231676563620567, -0.01593920774757862, -0.015646738931536674, -0.015354270115494728, -0.015061801299452782, -0.014769332483410835, -0.014476863667368889, -0.014184394851326942, -0.013891926035284996, -0.01359945721924305, -0.013306989334523678, -0.013014520518481731, -0.012722051702439785, -0.012429582886397839, -0.012137114070355892, -0.011844645254313946, -0.011552176438272, -0.011259708553552628, -0.010967239737510681, -0.010674770921468735, -0.010382302105426788, -0.010089833289384842, -0.009797364473342896, -0.009504895657300949, -0.009212426841259003, -0.008919958025217056, -0.008627488277852535, -0.008335019461810589, -0.008042550645768642, -0.007750081829726696, -0.00745761301368475, -0.007165144197642803, -0.006872675847262144, -0.006580207031220198, -0.006287738680839539, -0.005995269864797592, -0.005702801048755646, -0.005410332232713699, -0.005117863416671753, -0.0048253946006298065, -0.004532926250249147, -0.004240457434207201, -0.003947988618165255, -0.003655519802123308, -0.0033630509860813618, -0.003070582402870059, -0.0027781135868281126, -0.002485644770786166, -0.0021931761875748634, -0.001900707371532917, -0.0016082384390756488, -0.0013157697394490242, -0.0010233009234070778, -0.0007308321655727923, -0.0004383634077385068, -0.00014589459169656038, 0.0001465741079300642, 0.0004390428075566888, 0.0007315116235986352]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 12.0, 9.0, 11.0, 8.0, 19.0, 31.0, 18.0, 24.0, 27.0, 29.0, 22.0, 40.0, 36.0, 40.0, 45.0, 45.0, 49.0, 36.0, 48.0, 36.0, 33.0, 41.0, 35.0, 30.0, 41.0, 32.0, 29.0, 28.0, 23.0, 14.0, 20.0, 17.0, 13.0, 6.0, 8.0, 7.0, 9.0, 6.0, 5.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000926971435546875, -0.0008967993780970573, -0.0008666273206472397, -0.000836455263197422, -0.0008062832057476044, -0.0007761111482977867, -0.0007459390908479691, -0.0007157670333981514, -0.0006855949759483337, -0.0006554229184985161, -0.0006252508610486984, -0.0005950788035988808, -0.0005649067461490631, -0.0005347346886992455, -0.0005045626312494278, -0.00047439057379961014, -0.0004442185163497925, -0.0004140464588999748, -0.00038387440145015717, -0.0003537023440003395, -0.00032353028655052185, -0.0002933582291007042, -0.00026318617165088654, -0.00023301411420106888, -0.00020284205675125122, -0.00017266999930143356, -0.0001424979418516159, -0.00011232588440179825, -8.215382695198059e-05, -5.198176950216293e-05, -2.1809712052345276e-05, 8.362345397472382e-06, 3.853440284729004e-05, 6.87064602971077e-05, 9.887851774692535e-05, 0.000129050575196743, 0.00015922263264656067, 0.00018939469009637833, 0.00021956674754619598, 0.00024973880499601364, 0.0002799108624458313, 0.00031008291989564896, 0.0003402549773454666, 0.00037042703479528427, 0.00040059909224510193, 0.0004307711496949196, 0.00046094320714473724, 0.0004911152645945549, 0.0005212873220443726, 0.0005514593794941902, 0.0005816314369440079, 0.0006118034943938255, 0.0006419755518436432, 0.0006721476092934608, 0.0007023196667432785, 0.0007324917241930962, 0.0007626637816429138, 0.0007928358390927315, 0.0008230078965425491, 0.0008531799539923668, 0.0008833520114421844, 0.0009135240688920021, 0.0009436961263418198, 0.0009738681837916374, 0.001004040241241455]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 10.0, 7.0, 7.0, 4.0, 7.0, 4.0, 12.0, 16.0, 10.0, 20.0, 12.0, 26.0, 19.0, 31.0, 25.0, 20.0, 30.0, 35.0, 26.0, 37.0, 39.0, 45.0, 38.0, 37.0, 39.0, 37.0, 32.0, 34.0, 34.0, 28.0, 25.0, 24.0, 25.0, 24.0, 24.0, 22.0, 25.0, 14.0, 15.0, 8.0, 10.0, 8.0, 13.0, 12.0, 5.0, 9.0, 3.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.13671875, -6.9102783203125, -6.683837890625, -6.4573974609375, -6.23095703125, -6.0045166015625, -5.778076171875, -5.5516357421875, -5.3251953125, -5.0987548828125, -4.872314453125, -4.6458740234375, -4.41943359375, -4.1929931640625, -3.966552734375, -3.7401123046875, -3.513671875, -3.2872314453125, -3.060791015625, -2.8343505859375, -2.60791015625, -2.3814697265625, -2.155029296875, -1.9285888671875, -1.7021484375, -1.4757080078125, -1.249267578125, -1.0228271484375, -0.79638671875, -0.5699462890625, -0.343505859375, -0.1170654296875, 0.109375, 0.3358154296875, 0.562255859375, 0.7886962890625, 1.01513671875, 1.2415771484375, 1.468017578125, 1.6944580078125, 1.9208984375, 2.1473388671875, 2.373779296875, 2.6002197265625, 2.82666015625, 3.0531005859375, 3.279541015625, 3.5059814453125, 3.732421875, 3.9588623046875, 4.185302734375, 4.4117431640625, 4.63818359375, 4.8646240234375, 5.091064453125, 5.3175048828125, 5.5439453125, 5.7703857421875, 5.996826171875, 6.2232666015625, 6.44970703125, 6.6761474609375, 6.902587890625, 7.1290283203125, 7.35546875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 13.0, 4.0, 17.0, 17.0, 19.0, 16.0, 23.0, 39.0, 66.0, 110.0, 206.0, 345.0, 658.0, 1420.0, 3083.0, 6724.0, 14680.0, 32918.0, 79324.0, 197523.0, 334297.0, 220455.0, 89283.0, 36809.0, 16214.0, 7574.0, 3422.0, 1520.0, 781.0, 367.0, 220.0, 118.0, 73.0, 47.0, 27.0, 28.0, 21.0, 16.0, 8.0, 12.0, 9.0, 4.0, 5.0, 8.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.3125, -8.0572509765625, -7.802001953125, -7.5467529296875, -7.29150390625, -7.0362548828125, -6.781005859375, -6.5257568359375, -6.2705078125, -6.0152587890625, -5.760009765625, -5.5047607421875, -5.24951171875, -4.9942626953125, -4.739013671875, -4.4837646484375, -4.228515625, -3.9732666015625, -3.718017578125, -3.4627685546875, -3.20751953125, -2.9522705078125, -2.697021484375, -2.4417724609375, -2.1865234375, -1.9312744140625, -1.676025390625, -1.4207763671875, -1.16552734375, -0.9102783203125, -0.655029296875, -0.3997802734375, -0.14453125, 0.1107177734375, 0.365966796875, 0.6212158203125, 0.87646484375, 1.1317138671875, 1.386962890625, 1.6422119140625, 1.8974609375, 2.1527099609375, 2.407958984375, 2.6632080078125, 2.91845703125, 3.1737060546875, 3.428955078125, 3.6842041015625, 3.939453125, 4.1947021484375, 4.449951171875, 4.7052001953125, 4.96044921875, 5.2156982421875, 5.470947265625, 5.7261962890625, 5.9814453125, 6.2366943359375, 6.491943359375, 6.7471923828125, 7.00244140625, 7.2576904296875, 7.512939453125, 7.7681884765625, 8.0234375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 8.0, 14.0, 16.0, 20.0, 20.0, 37.0, 29.0, 36.0, 40.0, 43.0, 57.0, 60.0, 85.0, 167.0, 1445.0, 373.0, 136.0, 79.0, 54.0, 50.0, 42.0, 38.0, 33.0, 27.0, 24.0, 19.0, 11.0, 16.0, 13.0, 8.0, 9.0, 8.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.421875, -25.404541015625, -24.38720703125, -23.369873046875, -22.3525390625, -21.335205078125, -20.31787109375, -19.300537109375, -18.283203125, -17.265869140625, -16.24853515625, -15.231201171875, -14.2138671875, -13.196533203125, -12.17919921875, -11.161865234375, -10.14453125, -9.127197265625, -8.10986328125, -7.092529296875, -6.0751953125, -5.057861328125, -4.04052734375, -3.023193359375, -2.005859375, -0.988525390625, 0.02880859375, 1.046142578125, 2.0634765625, 3.080810546875, 4.09814453125, 5.115478515625, 6.1328125, 7.150146484375, 8.16748046875, 9.184814453125, 10.2021484375, 11.219482421875, 12.23681640625, 13.254150390625, 14.271484375, 15.288818359375, 16.30615234375, 17.323486328125, 18.3408203125, 19.358154296875, 20.37548828125, 21.392822265625, 22.41015625, 23.427490234375, 24.44482421875, 25.462158203125, 26.4794921875, 27.496826171875, 28.51416015625, 29.531494140625, 30.548828125, 31.566162109375, 32.58349609375, 33.600830078125, 34.6181640625, 35.635498046875, 36.65283203125, 37.670166015625, 38.6875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 5.0, 3.0, 4.0, 11.0, 18.0, 19.0, 33.0, 31.0, 63.0, 69.0, 97.0, 154.0, 291.0, 525.0, 1303.0, 24360.0, 3089093.0, 26905.0, 1278.0, 567.0, 298.0, 181.0, 124.0, 68.0, 52.0, 37.0, 32.0, 16.0, 18.0, 10.0, 6.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.5625, -71.1513671875, -68.740234375, -66.3291015625, -63.91796875, -61.5068359375, -59.095703125, -56.6845703125, -54.2734375, -51.8623046875, -49.451171875, -47.0400390625, -44.62890625, -42.2177734375, -39.806640625, -37.3955078125, -34.984375, -32.5732421875, -30.162109375, -27.7509765625, -25.33984375, -22.9287109375, -20.517578125, -18.1064453125, -15.6953125, -13.2841796875, -10.873046875, -8.4619140625, -6.05078125, -3.6396484375, -1.228515625, 1.1826171875, 3.59375, 6.0048828125, 8.416015625, 10.8271484375, 13.23828125, 15.6494140625, 18.060546875, 20.4716796875, 22.8828125, 25.2939453125, 27.705078125, 30.1162109375, 32.52734375, 34.9384765625, 37.349609375, 39.7607421875, 42.171875, 44.5830078125, 46.994140625, 49.4052734375, 51.81640625, 54.2275390625, 56.638671875, 59.0498046875, 61.4609375, 63.8720703125, 66.283203125, 68.6943359375, 71.10546875, 73.5166015625, 75.927734375, 78.3388671875, 80.75]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 110.0, 344.0, 391.0, 138.0, 21.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-194.06666564941406, -190.47366333007812, -186.8806610107422, -183.28765869140625, -179.6946563720703, -176.10165405273438, -172.50865173339844, -168.9156494140625, -165.3226318359375, -161.72962951660156, -158.13662719726562, -154.5436248779297, -150.95062255859375, -147.3576202392578, -143.76461791992188, -140.17160034179688, -136.57861328125, -132.98561096191406, -129.39260864257812, -125.79960632324219, -122.20660400390625, -118.61360168457031, -115.02059173583984, -111.4275894165039, -107.83458709716797, -104.24158477783203, -100.6485824584961, -97.05558013916016, -93.46257019042969, -89.86956787109375, -86.27656555175781, -82.68356323242188, -79.09056091308594, -75.49755859375, -71.90455627441406, -68.31155395507812, -64.71855163574219, -61.125545501708984, -57.53253936767578, -53.939537048339844, -50.34653091430664, -46.7535285949707, -43.1605224609375, -39.56752014160156, -35.974517822265625, -32.38151550292969, -28.788511276245117, -25.195507049560547, -21.60250473022461, -18.009502410888672, -14.416498184204102, -10.823494911193848, -7.230491638183594, -3.6374893188476562, -0.04448509216308594, 3.5485191345214844, 7.141521453857422, 10.734524726867676, 14.32752799987793, 17.9205322265625, 21.513534545898438, 25.106536865234375, 28.699541091918945, 32.292545318603516, 35.88554763793945]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 10.0, 14.0, 9.0, 11.0, 14.0, 25.0, 23.0, 35.0, 36.0, 29.0, 38.0, 19.0, 44.0, 62.0, 42.0, 35.0, 41.0, 49.0, 43.0, 46.0, 41.0, 44.0, 37.0, 20.0, 22.0, 32.0, 27.0, 25.0, 15.0, 20.0, 16.0, 12.0, 11.0, 11.0, 5.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.61741638183594, -64.4090576171875, -62.2006950378418, -59.992332458496094, -57.783973693847656, -55.57561492919922, -53.367252349853516, -51.15888977050781, -48.950531005859375, -46.74217224121094, -44.533809661865234, -42.32544708251953, -40.117088317871094, -37.908729553222656, -35.70036697387695, -33.49200439453125, -31.283645629882812, -29.075284957885742, -26.866924285888672, -24.6585636138916, -22.45020294189453, -20.24184226989746, -18.03348159790039, -15.82512092590332, -13.61676025390625, -11.40839958190918, -9.20003890991211, -6.991678237915039, -4.783317565917969, -2.5749568939208984, -0.3665962219238281, 1.8417644500732422, 4.0501251220703125, 6.258485794067383, 8.466846466064453, 10.675207138061523, 12.883567810058594, 15.091928482055664, 17.300289154052734, 19.508649826049805, 21.717010498046875, 23.925371170043945, 26.133731842041016, 28.342092514038086, 30.550453186035156, 32.758811950683594, 34.9671745300293, 37.175537109375, 39.38389587402344, 41.592254638671875, 43.80061721801758, 46.00897979736328, 48.21733856201172, 50.425697326660156, 52.63405990600586, 54.84242248535156, 57.05078125, 59.25914001464844, 61.46750259399414, 63.675865173339844, 65.88422393798828, 68.09258270263672, 70.30094909667969, 72.50930786132812, 74.71766662597656]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 2.0, 10.0, 5.0, 5.0, 12.0, 9.0, 16.0, 16.0, 19.0, 15.0, 26.0, 20.0, 19.0, 24.0, 29.0, 31.0, 35.0, 35.0, 48.0, 48.0, 40.0, 37.0, 36.0, 45.0, 39.0, 37.0, 36.0, 30.0, 30.0, 16.0, 31.0, 25.0, 24.0, 23.0, 21.0, 15.0, 16.0, 10.0, 10.0, 9.0, 9.0, 7.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-9.2265625, -8.96807861328125, -8.7095947265625, -8.45111083984375, -8.192626953125, -7.93414306640625, -7.6756591796875, -7.41717529296875, -7.15869140625, -6.90020751953125, -6.6417236328125, -6.38323974609375, -6.124755859375, -5.86627197265625, -5.6077880859375, -5.34930419921875, -5.0908203125, -4.83233642578125, -4.5738525390625, -4.31536865234375, -4.056884765625, -3.79840087890625, -3.5399169921875, -3.28143310546875, -3.02294921875, -2.76446533203125, -2.5059814453125, -2.24749755859375, -1.989013671875, -1.73052978515625, -1.4720458984375, -1.21356201171875, -0.955078125, -0.69659423828125, -0.4381103515625, -0.17962646484375, 0.078857421875, 0.33734130859375, 0.5958251953125, 0.85430908203125, 1.11279296875, 1.37127685546875, 1.6297607421875, 1.88824462890625, 2.146728515625, 2.40521240234375, 2.6636962890625, 2.92218017578125, 3.1806640625, 3.43914794921875, 3.6976318359375, 3.95611572265625, 4.214599609375, 4.47308349609375, 4.7315673828125, 4.99005126953125, 5.24853515625, 5.50701904296875, 5.7655029296875, 6.02398681640625, 6.282470703125, 6.54095458984375, 6.7994384765625, 7.05792236328125, 7.31640625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 11.0, 9.0, 15.0, 16.0, 12.0, 17.0, 20.0, 21.0, 31.0, 29.0, 51.0, 47.0, 73.0, 86.0, 163.0, 286.0, 1053.0, 10018.0, 358288.0, 3151191.0, 652445.0, 17970.0, 1399.0, 349.0, 156.0, 111.0, 77.0, 47.0, 51.0, 44.0, 24.0, 23.0, 30.0, 17.0, 12.0, 21.0, 9.0, 8.0, 11.0, 6.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-28.53125, -27.7294921875, -26.927734375, -26.1259765625, -25.32421875, -24.5224609375, -23.720703125, -22.9189453125, -22.1171875, -21.3154296875, -20.513671875, -19.7119140625, -18.91015625, -18.1083984375, -17.306640625, -16.5048828125, -15.703125, -14.9013671875, -14.099609375, -13.2978515625, -12.49609375, -11.6943359375, -10.892578125, -10.0908203125, -9.2890625, -8.4873046875, -7.685546875, -6.8837890625, -6.08203125, -5.2802734375, -4.478515625, -3.6767578125, -2.875, -2.0732421875, -1.271484375, -0.4697265625, 0.33203125, 1.1337890625, 1.935546875, 2.7373046875, 3.5390625, 4.3408203125, 5.142578125, 5.9443359375, 6.74609375, 7.5478515625, 8.349609375, 9.1513671875, 9.953125, 10.7548828125, 11.556640625, 12.3583984375, 13.16015625, 13.9619140625, 14.763671875, 15.5654296875, 16.3671875, 17.1689453125, 17.970703125, 18.7724609375, 19.57421875, 20.3759765625, 21.177734375, 21.9794921875, 22.78125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 9.0, 4.0, 5.0, 14.0, 19.0, 18.0, 35.0, 38.0, 53.0, 55.0, 79.0, 131.0, 186.0, 236.0, 304.0, 345.0, 421.0, 435.0, 405.0, 323.0, 256.0, 169.0, 129.0, 103.0, 77.0, 52.0, 41.0, 36.0, 30.0, 21.0, 13.0, 9.0, 8.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.2421875, -14.7841796875, -14.326171875, -13.8681640625, -13.41015625, -12.9521484375, -12.494140625, -12.0361328125, -11.578125, -11.1201171875, -10.662109375, -10.2041015625, -9.74609375, -9.2880859375, -8.830078125, -8.3720703125, -7.9140625, -7.4560546875, -6.998046875, -6.5400390625, -6.08203125, -5.6240234375, -5.166015625, -4.7080078125, -4.25, -3.7919921875, -3.333984375, -2.8759765625, -2.41796875, -1.9599609375, -1.501953125, -1.0439453125, -0.5859375, -0.1279296875, 0.330078125, 0.7880859375, 1.24609375, 1.7041015625, 2.162109375, 2.6201171875, 3.078125, 3.5361328125, 3.994140625, 4.4521484375, 4.91015625, 5.3681640625, 5.826171875, 6.2841796875, 6.7421875, 7.2001953125, 7.658203125, 8.1162109375, 8.57421875, 9.0322265625, 9.490234375, 9.9482421875, 10.40625, 10.8642578125, 11.322265625, 11.7802734375, 12.23828125, 12.6962890625, 13.154296875, 13.6123046875, 14.0703125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 14.0, 5.0, 19.0, 27.0, 41.0, 48.0, 65.0, 82.0, 102.0, 139.0, 199.0, 277.0, 452.0, 1018.0, 8189.0, 606152.0, 3518667.0, 54515.0, 2206.0, 726.0, 406.0, 252.0, 202.0, 124.0, 86.0, 71.0, 52.0, 38.0, 32.0, 29.0, 11.0, 12.0, 12.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.28125, -51.6787109375, -50.076171875, -48.4736328125, -46.87109375, -45.2685546875, -43.666015625, -42.0634765625, -40.4609375, -38.8583984375, -37.255859375, -35.6533203125, -34.05078125, -32.4482421875, -30.845703125, -29.2431640625, -27.640625, -26.0380859375, -24.435546875, -22.8330078125, -21.23046875, -19.6279296875, -18.025390625, -16.4228515625, -14.8203125, -13.2177734375, -11.615234375, -10.0126953125, -8.41015625, -6.8076171875, -5.205078125, -3.6025390625, -2.0, -0.3974609375, 1.205078125, 2.8076171875, 4.41015625, 6.0126953125, 7.615234375, 9.2177734375, 10.8203125, 12.4228515625, 14.025390625, 15.6279296875, 17.23046875, 18.8330078125, 20.435546875, 22.0380859375, 23.640625, 25.2431640625, 26.845703125, 28.4482421875, 30.05078125, 31.6533203125, 33.255859375, 34.8583984375, 36.4609375, 38.0634765625, 39.666015625, 41.2685546875, 42.87109375, 44.4736328125, 46.076171875, 47.6787109375, 49.28125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 78.0, 684.0, 247.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.2712860107422, -128.9454345703125, -115.61957550048828, -102.2937240600586, -88.96786499023438, -75.64201354980469, -62.316162109375, -48.99030303955078, -35.664451599121094, -22.33859634399414, -9.01274299621582, 4.3131103515625, 17.638965606689453, 30.964820861816406, 44.290672302246094, 57.61653137207031, 70.9423828125, 84.26823425292969, 97.5940933227539, 110.9199447631836, 124.24580383300781, 137.5716552734375, 150.8975067138672, 164.22335815429688, 177.54922485351562, 190.8750762939453, 204.200927734375, 217.52679443359375, 230.85264587402344, 244.17849731445312, 257.50433349609375, 270.8302001953125, 284.1560363769531, 297.4819030761719, 310.8077392578125, 324.13360595703125, 337.4594421386719, 350.7853088378906, 364.11114501953125, 377.43701171875, 390.76287841796875, 404.0887451171875, 417.4145812988281, 430.7404479980469, 444.0662841796875, 457.39215087890625, 470.718017578125, 484.0438537597656, 497.36968994140625, 510.695556640625, 524.0214233398438, 537.3472290039062, 550.673095703125, 563.9989624023438, 577.3248291015625, 590.6506958007812, 603.9765625, 617.3024291992188, 630.6282958984375, 643.9541015625, 657.2799682617188, 670.6058349609375, 683.9317016601562, 697.257568359375, 710.5833740234375]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 9.0, 9.0, 11.0, 18.0, 8.0, 13.0, 23.0, 19.0, 15.0, 39.0, 34.0, 31.0, 40.0, 33.0, 28.0, 42.0, 36.0, 42.0, 43.0, 47.0, 38.0, 39.0, 35.0, 39.0, 28.0, 31.0, 43.0, 22.0, 34.0, 17.0, 20.0, 21.0, 10.0, 19.0, 9.0, 15.0, 8.0, 5.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 5.0, 1.0], "bins": [-59.062870025634766, -57.444156646728516, -55.82544708251953, -54.20673370361328, -52.5880241394043, -50.96931076049805, -49.35060119628906, -47.73188781738281, -46.11317443847656, -44.49446105957031, -42.87575149536133, -41.25703811645508, -39.638328552246094, -38.019615173339844, -36.400901794433594, -34.78219223022461, -33.163482666015625, -31.544771194458008, -29.92605972290039, -28.30734634399414, -26.688636779785156, -25.069923400878906, -23.45121192932129, -21.832500457763672, -20.213788986206055, -18.595077514648438, -16.97636604309082, -15.357653617858887, -13.73894214630127, -12.120230674743652, -10.501518249511719, -8.882806777954102, -7.264091491699219, -5.645380020141602, -4.026668071746826, -2.407956123352051, -0.7892446517944336, 0.8294668197631836, 2.448179244995117, 4.066890716552734, 5.685602188110352, 7.304313659667969, 8.923025131225586, 10.54173755645752, 12.160449028015137, 13.779160499572754, 15.397872924804688, 17.016584396362305, 18.635295867919922, 20.25400733947754, 21.872718811035156, 23.491432189941406, 25.11014175415039, 26.72885513305664, 28.347566604614258, 29.966278076171875, 31.584989547729492, 33.20370101928711, 34.82241439819336, 36.441123962402344, 38.059837341308594, 39.67854690551758, 41.29726028442383, 42.91596984863281, 44.53468322753906]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 6.0, 8.0, 8.0, 4.0, 6.0, 10.0, 11.0, 11.0, 18.0, 12.0, 30.0, 21.0, 23.0, 33.0, 22.0, 25.0, 30.0, 32.0, 28.0, 49.0, 40.0, 31.0, 32.0, 44.0, 50.0, 35.0, 48.0, 25.0, 35.0, 24.0, 32.0, 34.0, 17.0, 20.0, 16.0, 21.0, 14.0, 20.0, 13.0, 14.0, 15.0, 7.0, 9.0, 4.0, 2.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.77734375, -7.52630615234375, -7.2752685546875, -7.02423095703125, -6.773193359375, -6.52215576171875, -6.2711181640625, -6.02008056640625, -5.76904296875, -5.51800537109375, -5.2669677734375, -5.01593017578125, -4.764892578125, -4.51385498046875, -4.2628173828125, -4.01177978515625, -3.7607421875, -3.50970458984375, -3.2586669921875, -3.00762939453125, -2.756591796875, -2.50555419921875, -2.2545166015625, -2.00347900390625, -1.75244140625, -1.50140380859375, -1.2503662109375, -0.99932861328125, -0.748291015625, -0.49725341796875, -0.2462158203125, 0.00482177734375, 0.255859375, 0.50689697265625, 0.7579345703125, 1.00897216796875, 1.260009765625, 1.51104736328125, 1.7620849609375, 2.01312255859375, 2.26416015625, 2.51519775390625, 2.7662353515625, 3.01727294921875, 3.268310546875, 3.51934814453125, 3.7703857421875, 4.02142333984375, 4.2724609375, 4.52349853515625, 4.7745361328125, 5.02557373046875, 5.276611328125, 5.52764892578125, 5.7786865234375, 6.02972412109375, 6.28076171875, 6.53179931640625, 6.7828369140625, 7.03387451171875, 7.284912109375, 7.53594970703125, 7.7869873046875, 8.03802490234375, 8.2890625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 10.0, 19.0, 25.0, 45.0, 39.0, 91.0, 123.0, 186.0, 251.0, 363.0, 600.0, 940.0, 1298.0, 1957.0, 2762.0, 4192.0, 6038.0, 8907.0, 12507.0, 18892.0, 27768.0, 42301.0, 66879.0, 115665.0, 212271.0, 212599.0, 115895.0, 66322.0, 42488.0, 27713.0, 18802.0, 12877.0, 8685.0, 6058.0, 4222.0, 2825.0, 1939.0, 1322.0, 872.0, 598.0, 389.0, 285.0, 183.0, 114.0, 75.0, 55.0, 32.0, 30.0, 14.0, 13.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.314453125, -1.27337646484375, -1.2322998046875, -1.19122314453125, -1.150146484375, -1.10906982421875, -1.0679931640625, -1.02691650390625, -0.98583984375, -0.94476318359375, -0.9036865234375, -0.86260986328125, -0.821533203125, -0.78045654296875, -0.7393798828125, -0.69830322265625, -0.6572265625, -0.61614990234375, -0.5750732421875, -0.53399658203125, -0.492919921875, -0.45184326171875, -0.4107666015625, -0.36968994140625, -0.32861328125, -0.28753662109375, -0.2464599609375, -0.20538330078125, -0.164306640625, -0.12322998046875, -0.0821533203125, -0.04107666015625, 0.0, 0.04107666015625, 0.0821533203125, 0.12322998046875, 0.164306640625, 0.20538330078125, 0.2464599609375, 0.28753662109375, 0.32861328125, 0.36968994140625, 0.4107666015625, 0.45184326171875, 0.492919921875, 0.53399658203125, 0.5750732421875, 0.61614990234375, 0.6572265625, 0.69830322265625, 0.7393798828125, 0.78045654296875, 0.821533203125, 0.86260986328125, 0.9036865234375, 0.94476318359375, 0.98583984375, 1.02691650390625, 1.0679931640625, 1.10906982421875, 1.150146484375, 1.19122314453125, 1.2322998046875, 1.27337646484375, 1.314453125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 1.0, 10.0, 4.0, 16.0, 11.0, 13.0, 24.0, 16.0, 31.0, 25.0, 34.0, 32.0, 48.0, 34.0, 38.0, 45.0, 41.0, 39.0, 1066.0, 57.0, 42.0, 38.0, 42.0, 38.0, 37.0, 32.0, 23.0, 29.0, 20.0, 20.0, 22.0, 10.0, 12.0, 18.0, 6.0, 10.0, 4.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.1640625, -5.98046875, -5.796875, -5.61328125, -5.4296875, -5.24609375, -5.0625, -4.87890625, -4.6953125, -4.51171875, -4.328125, -4.14453125, -3.9609375, -3.77734375, -3.59375, -3.41015625, -3.2265625, -3.04296875, -2.859375, -2.67578125, -2.4921875, -2.30859375, -2.125, -1.94140625, -1.7578125, -1.57421875, -1.390625, -1.20703125, -1.0234375, -0.83984375, -0.65625, -0.47265625, -0.2890625, -0.10546875, 0.078125, 0.26171875, 0.4453125, 0.62890625, 0.8125, 0.99609375, 1.1796875, 1.36328125, 1.546875, 1.73046875, 1.9140625, 2.09765625, 2.28125, 2.46484375, 2.6484375, 2.83203125, 3.015625, 3.19921875, 3.3828125, 3.56640625, 3.75, 3.93359375, 4.1171875, 4.30078125, 4.484375, 4.66796875, 4.8515625, 5.03515625, 5.21875, 5.40234375, 5.5859375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 10.0, 8.0, 4.0, 16.0, 16.0, 21.0, 35.0, 54.0, 71.0, 87.0, 159.0, 249.0, 325.0, 459.0, 667.0, 1023.0, 1590.0, 2462.0, 3865.0, 5917.0, 9648.0, 15743.0, 25928.0, 43709.0, 79084.0, 157370.0, 1351409.0, 183192.0, 90333.0, 48770.0, 28285.0, 17099.0, 10538.0, 6674.0, 4234.0, 2705.0, 1762.0, 1158.0, 785.0, 532.0, 345.0, 251.0, 168.0, 112.0, 79.0, 51.0, 40.0, 35.0, 21.0, 19.0, 7.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.546875, -1.4963226318359375, -1.445770263671875, -1.3952178955078125, -1.34466552734375, -1.2941131591796875, -1.243560791015625, -1.1930084228515625, -1.1424560546875, -1.0919036865234375, -1.041351318359375, -0.9907989501953125, -0.94024658203125, -0.8896942138671875, -0.839141845703125, -0.7885894775390625, -0.738037109375, -0.6874847412109375, -0.636932373046875, -0.5863800048828125, -0.53582763671875, -0.4852752685546875, -0.434722900390625, -0.3841705322265625, -0.3336181640625, -0.2830657958984375, -0.232513427734375, -0.1819610595703125, -0.13140869140625, -0.0808563232421875, -0.030303955078125, 0.0202484130859375, 0.07080078125, 0.1213531494140625, 0.171905517578125, 0.2224578857421875, 0.27301025390625, 0.3235626220703125, 0.374114990234375, 0.4246673583984375, 0.4752197265625, 0.5257720947265625, 0.576324462890625, 0.6268768310546875, 0.67742919921875, 0.7279815673828125, 0.778533935546875, 0.8290863037109375, 0.879638671875, 0.9301910400390625, 0.980743408203125, 1.0312957763671875, 1.08184814453125, 1.1324005126953125, 1.182952880859375, 1.2335052490234375, 1.2840576171875, 1.3346099853515625, 1.385162353515625, 1.4357147216796875, 1.48626708984375, 1.5368194580078125, 1.587371826171875, 1.6379241943359375, 1.6884765625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 9.0, 12.0, 8.0, 8.0, 15.0, 25.0, 24.0, 44.0, 51.0, 57.0, 63.0, 88.0, 99.0, 102.0, 89.0, 61.0, 52.0, 44.0, 41.0, 28.0, 19.0, 12.0, 11.0, 13.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0025196075439453125, -0.0024425387382507324, -0.0023654699325561523, -0.0022884011268615723, -0.002211332321166992, -0.002134263515472412, -0.002057194709777832, -0.001980125904083252, -0.0019030570983886719, -0.0018259882926940918, -0.0017489194869995117, -0.0016718506813049316, -0.0015947818756103516, -0.0015177130699157715, -0.0014406442642211914, -0.0013635754585266113, -0.0012865066528320312, -0.0012094378471374512, -0.001132369041442871, -0.001055300235748291, -0.000978231430053711, -0.0009011626243591309, -0.0008240938186645508, -0.0007470250129699707, -0.0006699562072753906, -0.0005928874015808105, -0.0005158185958862305, -0.0004387497901916504, -0.0003616809844970703, -0.00028461217880249023, -0.00020754337310791016, -0.00013047456741333008, -5.340576171875e-05, 2.3663043975830078e-05, 0.00010073184967041016, 0.00017780065536499023, 0.0002548694610595703, 0.0003319382667541504, 0.00040900707244873047, 0.00048607587814331055, 0.0005631446838378906, 0.0006402134895324707, 0.0007172822952270508, 0.0007943511009216309, 0.0008714199066162109, 0.000948488712310791, 0.001025557518005371, 0.0011026263236999512, 0.0011796951293945312, 0.0012567639350891113, 0.0013338327407836914, 0.0014109015464782715, 0.0014879703521728516, 0.0015650391578674316, 0.0016421079635620117, 0.0017191767692565918, 0.0017962455749511719, 0.001873314380645752, 0.001950383186340332, 0.002027451992034912, 0.002104520797729492, 0.0021815896034240723, 0.0022586584091186523, 0.0023357272148132324, 0.0024127960205078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 11.0, 13.0, 18.0, 20.0, 18.0, 44.0, 54.0, 82.0, 101.0, 189.0, 307.0, 757.0, 15221.0, 1029119.0, 1491.0, 444.0, 236.0, 122.0, 89.0, 63.0, 36.0, 28.0, 27.0, 17.0, 16.0, 5.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049407958984375, -0.047827720642089844, -0.04624748229980469, -0.04466724395751953, -0.043087005615234375, -0.04150676727294922, -0.03992652893066406, -0.038346290588378906, -0.03676605224609375, -0.035185813903808594, -0.03360557556152344, -0.03202533721923828, -0.030445098876953125, -0.02886486053466797, -0.027284622192382812, -0.025704383850097656, -0.0241241455078125, -0.022543907165527344, -0.020963668823242188, -0.01938343048095703, -0.017803192138671875, -0.01622295379638672, -0.014642715454101562, -0.013062477111816406, -0.01148223876953125, -0.009902000427246094, -0.008321762084960938, -0.006741523742675781, -0.005161285400390625, -0.0035810470581054688, -0.0020008087158203125, -0.00042057037353515625, 0.00115966796875, 0.0027399063110351562, 0.0043201446533203125, 0.005900382995605469, 0.007480621337890625, 0.009060859680175781, 0.010641098022460938, 0.012221336364746094, 0.01380157470703125, 0.015381813049316406, 0.016962051391601562, 0.01854228973388672, 0.020122528076171875, 0.02170276641845703, 0.023283004760742188, 0.024863243103027344, 0.0264434814453125, 0.028023719787597656, 0.029603958129882812, 0.03118419647216797, 0.032764434814453125, 0.03434467315673828, 0.03592491149902344, 0.037505149841308594, 0.03908538818359375, 0.040665626525878906, 0.04224586486816406, 0.04382610321044922, 0.045406341552734375, 0.04698657989501953, 0.04856681823730469, 0.050147056579589844, 0.051727294921875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 12.0, 33.0, 111.0, 200.0, 259.0, 222.0, 115.0, 47.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002450825646519661, -0.002383795566856861, -0.002316765720024705, -0.002249735640361905, -0.0021827055606991053, -0.002115675713866949, -0.0020486456342041492, -0.0019816155545413494, -0.0019145855912938714, -0.0018475556280463934, -0.0017805255483835936, -0.0017134955851361156, -0.0016464656218886375, -0.0015794355422258377, -0.0015124055789783597, -0.0014453756157308817, -0.0013783455360680819, -0.0013113155728206038, -0.001244285493157804, -0.001177255529910326, -0.0011102254502475262, -0.0010431954870000482, -0.0009761655237525702, -0.0009091355022974312, -0.0008421054808422923, -0.0007750754593871534, -0.0007080454379320145, -0.0006410154746845365, -0.0005739854532293975, -0.0005069554317742586, -0.00043992543942295015, -0.0003728954470716417, -0.0003058655420318246, -0.0002388355351286009, -0.0001718055282253772, -0.00010477552132215351, -3.7745514418929815e-05, 2.9284507036209106e-05, 9.631449938751757e-05, 0.00016334449173882604, 0.00023037451319396496, 0.0002974045346491039, 0.00036443452700041234, 0.0004314645193517208, 0.0004984945408068597, 0.0005655245622619987, 0.0006325545255094767, 0.0006995845469646156, 0.0007666145684197545, 0.0008336445898748934, 0.0009006746113300323, 0.0009677045745775104, 0.0010347345378249884, 0.0011017646174877882, 0.0011687945807352662, 0.0012358245439827442, 0.001302854623645544, 0.001369884586893022, 0.001436914666555822, 0.0015039446298033, 0.0015709747094660997, 0.0016380046727135777, 0.0017050346359610558, 0.0017720647156238556, 0.0018390946788713336]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 15.0, 18.0, 12.0, 22.0, 17.0, 16.0, 28.0, 36.0, 20.0, 34.0, 22.0, 31.0, 41.0, 40.0, 51.0, 32.0, 45.0, 41.0, 41.0, 32.0, 48.0, 39.0, 37.0, 40.0, 33.0, 33.0, 27.0, 31.0, 17.0, 15.0, 12.0, 14.0, 10.0, 7.0, 10.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0009078383445739746, -0.0008779633790254593, -0.000848088413476944, -0.0008182134479284286, -0.0007883384823799133, -0.000758463516831398, -0.0007285885512828827, -0.0006987135857343674, -0.000668838620185852, -0.0006389636546373367, -0.0006090886890888214, -0.0005792137235403061, -0.0005493387579917908, -0.0005194637924432755, -0.0004895888268947601, -0.0004597138613462448, -0.0004298388957977295, -0.00039996393024921417, -0.00037008896470069885, -0.00034021399915218353, -0.0003103390336036682, -0.0002804640680551529, -0.0002505891025066376, -0.00022071413695812225, -0.00019083917140960693, -0.00016096420586109161, -0.0001310892403125763, -0.00010121427476406097, -7.133930921554565e-05, -4.1464343667030334e-05, -1.1589378118515015e-05, 1.8285587430000305e-05, 4.8160552978515625e-05, 7.803551852703094e-05, 0.00010791048407554626, 0.00013778544962406158, 0.0001676604151725769, 0.00019753538072109222, 0.00022741034626960754, 0.00025728531181812286, 0.0002871602773666382, 0.0003170352429151535, 0.0003469102084636688, 0.00037678517401218414, 0.00040666013956069946, 0.0004365351051092148, 0.0004664100706577301, 0.0004962850362062454, 0.0005261600017547607, 0.0005560349673032761, 0.0005859099328517914, 0.0006157848984003067, 0.000645659863948822, 0.0006755348294973373, 0.0007054097950458527, 0.000735284760594368, 0.0007651597261428833, 0.0007950346916913986, 0.0008249096572399139, 0.0008547846227884293, 0.0008846595883369446, 0.0009145345538854599, 0.0009444095194339752, 0.0009742844849824905, 0.0010041594505310059]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 6.0, 8.0, 8.0, 4.0, 6.0, 10.0, 11.0, 11.0, 18.0, 12.0, 30.0, 21.0, 23.0, 33.0, 22.0, 25.0, 30.0, 32.0, 28.0, 49.0, 40.0, 31.0, 32.0, 43.0, 51.0, 35.0, 48.0, 25.0, 35.0, 24.0, 32.0, 34.0, 17.0, 20.0, 16.0, 21.0, 14.0, 20.0, 13.0, 14.0, 15.0, 7.0, 9.0, 4.0, 2.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.77734375, -7.52630615234375, -7.2752685546875, -7.02423095703125, -6.773193359375, -6.52215576171875, -6.2711181640625, -6.02008056640625, -5.76904296875, -5.51800537109375, -5.2669677734375, -5.01593017578125, -4.764892578125, -4.51385498046875, -4.2628173828125, -4.01177978515625, -3.7607421875, -3.50970458984375, -3.2586669921875, -3.00762939453125, -2.756591796875, -2.50555419921875, -2.2545166015625, -2.00347900390625, -1.75244140625, -1.50140380859375, -1.2503662109375, -0.99932861328125, -0.748291015625, -0.49725341796875, -0.2462158203125, 0.00482177734375, 0.255859375, 0.50689697265625, 0.7579345703125, 1.00897216796875, 1.260009765625, 1.51104736328125, 1.7620849609375, 2.01312255859375, 2.26416015625, 2.51519775390625, 2.7662353515625, 3.01727294921875, 3.268310546875, 3.51934814453125, 3.7703857421875, 4.02142333984375, 4.2724609375, 4.52349853515625, 4.7745361328125, 5.02557373046875, 5.276611328125, 5.52764892578125, 5.7786865234375, 6.02972412109375, 6.28076171875, 6.53179931640625, 6.7828369140625, 7.03387451171875, 7.284912109375, 7.53594970703125, 7.7869873046875, 8.03802490234375, 8.2890625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 9.0, 5.0, 10.0, 11.0, 19.0, 20.0, 19.0, 36.0, 42.0, 54.0, 76.0, 109.0, 146.0, 176.0, 266.0, 440.0, 917.0, 2997.0, 11332.0, 45516.0, 233363.0, 566704.0, 144126.0, 30442.0, 7561.0, 2073.0, 766.0, 386.0, 246.0, 158.0, 130.0, 94.0, 67.0, 56.0, 37.0, 34.0, 32.0, 21.0, 18.0, 11.0, 3.0, 6.0, 7.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.7730712890625, -13.303955078125, -12.8348388671875, -12.36572265625, -11.8966064453125, -11.427490234375, -10.9583740234375, -10.4892578125, -10.0201416015625, -9.551025390625, -9.0819091796875, -8.61279296875, -8.1436767578125, -7.674560546875, -7.2054443359375, -6.736328125, -6.2672119140625, -5.798095703125, -5.3289794921875, -4.85986328125, -4.3907470703125, -3.921630859375, -3.4525146484375, -2.9833984375, -2.5142822265625, -2.045166015625, -1.5760498046875, -1.10693359375, -0.6378173828125, -0.168701171875, 0.3004150390625, 0.76953125, 1.2386474609375, 1.707763671875, 2.1768798828125, 2.64599609375, 3.1151123046875, 3.584228515625, 4.0533447265625, 4.5224609375, 4.9915771484375, 5.460693359375, 5.9298095703125, 6.39892578125, 6.8680419921875, 7.337158203125, 7.8062744140625, 8.275390625, 8.7445068359375, 9.213623046875, 9.6827392578125, 10.15185546875, 10.6209716796875, 11.090087890625, 11.5592041015625, 12.0283203125, 12.4974365234375, 12.966552734375, 13.4356689453125, 13.90478515625, 14.3739013671875, 14.843017578125, 15.3121337890625, 15.78125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 2.0, 8.0, 7.0, 7.0, 9.0, 12.0, 11.0, 11.0, 14.0, 15.0, 15.0, 15.0, 21.0, 25.0, 21.0, 36.0, 46.0, 48.0, 43.0, 61.0, 69.0, 173.0, 1469.0, 307.0, 121.0, 75.0, 60.0, 43.0, 36.0, 33.0, 29.0, 30.0, 24.0, 25.0, 20.0, 22.0, 19.0, 11.0, 14.0, 8.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.0, -25.15576171875, -24.3115234375, -23.46728515625, -22.623046875, -21.77880859375, -20.9345703125, -20.09033203125, -19.24609375, -18.40185546875, -17.5576171875, -16.71337890625, -15.869140625, -15.02490234375, -14.1806640625, -13.33642578125, -12.4921875, -11.64794921875, -10.8037109375, -9.95947265625, -9.115234375, -8.27099609375, -7.4267578125, -6.58251953125, -5.73828125, -4.89404296875, -4.0498046875, -3.20556640625, -2.361328125, -1.51708984375, -0.6728515625, 0.17138671875, 1.015625, 1.85986328125, 2.7041015625, 3.54833984375, 4.392578125, 5.23681640625, 6.0810546875, 6.92529296875, 7.76953125, 8.61376953125, 9.4580078125, 10.30224609375, 11.146484375, 11.99072265625, 12.8349609375, 13.67919921875, 14.5234375, 15.36767578125, 16.2119140625, 17.05615234375, 17.900390625, 18.74462890625, 19.5888671875, 20.43310546875, 21.27734375, 22.12158203125, 22.9658203125, 23.81005859375, 24.654296875, 25.49853515625, 26.3427734375, 27.18701171875, 28.03125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 4.0, 3.0, 8.0, 13.0, 19.0, 22.0, 22.0, 32.0, 31.0, 41.0, 46.0, 72.0, 75.0, 134.0, 178.0, 291.0, 536.0, 1515.0, 17326.0, 3011992.0, 108846.0, 2570.0, 747.0, 368.0, 235.0, 121.0, 94.0, 72.0, 49.0, 42.0, 30.0, 19.0, 28.0, 27.0, 20.0, 6.0, 9.0, 16.0, 10.0, 8.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.125, -61.0673828125, -59.009765625, -56.9521484375, -54.89453125, -52.8369140625, -50.779296875, -48.7216796875, -46.6640625, -44.6064453125, -42.548828125, -40.4912109375, -38.43359375, -36.3759765625, -34.318359375, -32.2607421875, -30.203125, -28.1455078125, -26.087890625, -24.0302734375, -21.97265625, -19.9150390625, -17.857421875, -15.7998046875, -13.7421875, -11.6845703125, -9.626953125, -7.5693359375, -5.51171875, -3.4541015625, -1.396484375, 0.6611328125, 2.71875, 4.7763671875, 6.833984375, 8.8916015625, 10.94921875, 13.0068359375, 15.064453125, 17.1220703125, 19.1796875, 21.2373046875, 23.294921875, 25.3525390625, 27.41015625, 29.4677734375, 31.525390625, 33.5830078125, 35.640625, 37.6982421875, 39.755859375, 41.8134765625, 43.87109375, 45.9287109375, 47.986328125, 50.0439453125, 52.1015625, 54.1591796875, 56.216796875, 58.2744140625, 60.33203125, 62.3896484375, 64.447265625, 66.5048828125, 68.5625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 24.0, 393.0, 549.0, 50.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.83131408691406, -229.30050659179688, -222.7696990966797, -216.2388916015625, -209.70806884765625, -203.17726135253906, -196.64645385742188, -190.1156463623047, -183.5848388671875, -177.0540313720703, -170.52322387695312, -163.99240112304688, -157.4615936279297, -150.9307861328125, -144.3999786376953, -137.86917114257812, -131.33834838867188, -124.80754089355469, -118.27672576904297, -111.74591827392578, -105.21510314941406, -98.68429565429688, -92.15348815917969, -85.6226806640625, -79.09186553955078, -72.5610580444336, -66.03024291992188, -59.49943542480469, -52.968624114990234, -46.43781280517578, -39.907005310058594, -33.37619400024414, -26.845382690429688, -20.314571380615234, -13.783761978149414, -7.252952575683594, -0.7221412658691406, 5.8086700439453125, 12.3394775390625, 18.870288848876953, 25.401100158691406, 31.93191146850586, 38.46272277832031, 44.9935302734375, 51.52434158325195, 58.055152893066406, 64.5859603881836, 71.11677551269531, 77.6475830078125, 84.17839050292969, 90.7092056274414, 97.2400131225586, 103.77082824707031, 110.3016357421875, 116.83244323730469, 123.36325073242188, 129.89407348632812, 136.4248809814453, 142.9556884765625, 149.48651123046875, 156.01731872558594, 162.54812622070312, 169.0789337158203, 175.6097412109375, 182.1405487060547]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 7.0, 7.0, 8.0, 9.0, 4.0, 12.0, 14.0, 12.0, 16.0, 16.0, 24.0, 20.0, 30.0, 37.0, 22.0, 43.0, 24.0, 38.0, 37.0, 33.0, 38.0, 30.0, 45.0, 42.0, 39.0, 40.0, 34.0, 34.0, 32.0, 31.0, 23.0, 26.0, 30.0, 18.0, 13.0, 18.0, 14.0, 13.0, 9.0, 17.0, 11.0, 5.0, 6.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-70.77459716796875, -68.72064971923828, -66.66670989990234, -64.61276245117188, -62.55881881713867, -60.50487518310547, -58.450927734375, -56.3969841003418, -54.343040466308594, -52.28909683227539, -50.23515319824219, -48.18120574951172, -46.127262115478516, -44.07331848144531, -42.019371032714844, -39.96542739868164, -37.91148376464844, -35.857540130615234, -33.80359649658203, -31.749649047851562, -29.69570541381836, -27.641761779785156, -25.58781623840332, -23.533870697021484, -21.47992706298828, -19.425983428955078, -17.372037887573242, -15.318093299865723, -13.264148712158203, -11.210204124450684, -9.156259536743164, -7.1023149490356445, -5.048374176025391, -2.994429588317871, -0.9404850006103516, 1.113459587097168, 3.1674041748046875, 5.221348762512207, 7.275293350219727, 9.329237937927246, 11.383182525634766, 13.437127113342285, 15.491071701049805, 17.54501724243164, 19.598960876464844, 21.652904510498047, 23.706850051879883, 25.76079559326172, 27.814739227294922, 29.868682861328125, 31.92262840270996, 33.9765739440918, 36.030517578125, 38.0844612121582, 40.138404846191406, 42.192352294921875, 44.24629592895508, 46.30023956298828, 48.35418701171875, 50.40813064575195, 52.462074279785156, 54.51601791381836, 56.56996154785156, 58.62390899658203, 60.677852630615234]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 8.0, 7.0, 8.0, 20.0, 12.0, 16.0, 20.0, 17.0, 26.0, 21.0, 28.0, 26.0, 28.0, 33.0, 38.0, 31.0, 41.0, 42.0, 28.0, 39.0, 47.0, 34.0, 36.0, 45.0, 27.0, 31.0, 32.0, 27.0, 24.0, 29.0, 25.0, 25.0, 24.0, 10.0, 14.0, 15.0, 12.0, 9.0, 9.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-8.2421875, -7.9732666015625, -7.704345703125, -7.4354248046875, -7.16650390625, -6.8975830078125, -6.628662109375, -6.3597412109375, -6.0908203125, -5.8218994140625, -5.552978515625, -5.2840576171875, -5.01513671875, -4.7462158203125, -4.477294921875, -4.2083740234375, -3.939453125, -3.6705322265625, -3.401611328125, -3.1326904296875, -2.86376953125, -2.5948486328125, -2.325927734375, -2.0570068359375, -1.7880859375, -1.5191650390625, -1.250244140625, -0.9813232421875, -0.71240234375, -0.4434814453125, -0.174560546875, 0.0943603515625, 0.36328125, 0.6322021484375, 0.901123046875, 1.1700439453125, 1.43896484375, 1.7078857421875, 1.976806640625, 2.2457275390625, 2.5146484375, 2.7835693359375, 3.052490234375, 3.3214111328125, 3.59033203125, 3.8592529296875, 4.128173828125, 4.3970947265625, 4.666015625, 4.9349365234375, 5.203857421875, 5.4727783203125, 5.74169921875, 6.0106201171875, 6.279541015625, 6.5484619140625, 6.8173828125, 7.0863037109375, 7.355224609375, 7.6241455078125, 7.89306640625, 8.1619873046875, 8.430908203125, 8.6998291015625, 8.96875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 6.0, 11.0, 8.0, 9.0, 13.0, 13.0, 17.0, 22.0, 28.0, 35.0, 48.0, 52.0, 54.0, 88.0, 179.0, 342.0, 1307.0, 9763.0, 160593.0, 1953989.0, 1905764.0, 150367.0, 9421.0, 1211.0, 346.0, 169.0, 94.0, 59.0, 46.0, 41.0, 28.0, 27.0, 19.0, 20.0, 20.0, 12.0, 15.0, 10.0, 5.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.875, -20.178955078125, -19.48291015625, -18.786865234375, -18.0908203125, -17.394775390625, -16.69873046875, -16.002685546875, -15.306640625, -14.610595703125, -13.91455078125, -13.218505859375, -12.5224609375, -11.826416015625, -11.13037109375, -10.434326171875, -9.73828125, -9.042236328125, -8.34619140625, -7.650146484375, -6.9541015625, -6.258056640625, -5.56201171875, -4.865966796875, -4.169921875, -3.473876953125, -2.77783203125, -2.081787109375, -1.3857421875, -0.689697265625, 0.00634765625, 0.702392578125, 1.3984375, 2.094482421875, 2.79052734375, 3.486572265625, 4.1826171875, 4.878662109375, 5.57470703125, 6.270751953125, 6.966796875, 7.662841796875, 8.35888671875, 9.054931640625, 9.7509765625, 10.447021484375, 11.14306640625, 11.839111328125, 12.53515625, 13.231201171875, 13.92724609375, 14.623291015625, 15.3193359375, 16.015380859375, 16.71142578125, 17.407470703125, 18.103515625, 18.799560546875, 19.49560546875, 20.191650390625, 20.8876953125, 21.583740234375, 22.27978515625, 22.975830078125, 23.671875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 7.0, 7.0, 13.0, 15.0, 28.0, 28.0, 40.0, 51.0, 99.0, 128.0, 173.0, 250.0, 326.0, 447.0, 474.0, 486.0, 417.0, 321.0, 220.0, 172.0, 119.0, 78.0, 46.0, 45.0, 16.0, 16.0, 15.0, 12.0, 9.0, 2.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.296875, -18.7735595703125, -18.250244140625, -17.7269287109375, -17.20361328125, -16.6802978515625, -16.156982421875, -15.6336669921875, -15.1103515625, -14.5870361328125, -14.063720703125, -13.5404052734375, -13.01708984375, -12.4937744140625, -11.970458984375, -11.4471435546875, -10.923828125, -10.4005126953125, -9.877197265625, -9.3538818359375, -8.83056640625, -8.3072509765625, -7.783935546875, -7.2606201171875, -6.7373046875, -6.2139892578125, -5.690673828125, -5.1673583984375, -4.64404296875, -4.1207275390625, -3.597412109375, -3.0740966796875, -2.55078125, -2.0274658203125, -1.504150390625, -0.9808349609375, -0.45751953125, 0.0657958984375, 0.589111328125, 1.1124267578125, 1.6357421875, 2.1590576171875, 2.682373046875, 3.2056884765625, 3.72900390625, 4.2523193359375, 4.775634765625, 5.2989501953125, 5.822265625, 6.3455810546875, 6.868896484375, 7.3922119140625, 7.91552734375, 8.4388427734375, 8.962158203125, 9.4854736328125, 10.0087890625, 10.5321044921875, 11.055419921875, 11.5787353515625, 12.10205078125, 12.6253662109375, 13.148681640625, 13.6719970703125, 14.1953125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 9.0, 19.0, 21.0, 29.0, 42.0, 57.0, 74.0, 100.0, 120.0, 183.0, 285.0, 424.0, 845.0, 2887.0, 24758.0, 741825.0, 3269921.0, 141372.0, 8072.0, 1454.0, 607.0, 333.0, 226.0, 160.0, 122.0, 78.0, 75.0, 46.0, 40.0, 25.0, 15.0, 15.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.78125, -33.59326171875, -32.4052734375, -31.21728515625, -30.029296875, -28.84130859375, -27.6533203125, -26.46533203125, -25.27734375, -24.08935546875, -22.9013671875, -21.71337890625, -20.525390625, -19.33740234375, -18.1494140625, -16.96142578125, -15.7734375, -14.58544921875, -13.3974609375, -12.20947265625, -11.021484375, -9.83349609375, -8.6455078125, -7.45751953125, -6.26953125, -5.08154296875, -3.8935546875, -2.70556640625, -1.517578125, -0.32958984375, 0.8583984375, 2.04638671875, 3.234375, 4.42236328125, 5.6103515625, 6.79833984375, 7.986328125, 9.17431640625, 10.3623046875, 11.55029296875, 12.73828125, 13.92626953125, 15.1142578125, 16.30224609375, 17.490234375, 18.67822265625, 19.8662109375, 21.05419921875, 22.2421875, 23.43017578125, 24.6181640625, 25.80615234375, 26.994140625, 28.18212890625, 29.3701171875, 30.55810546875, 31.74609375, 32.93408203125, 34.1220703125, 35.31005859375, 36.498046875, 37.68603515625, 38.8740234375, 40.06201171875, 41.25]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 3.0, 12.0, 370.0, 594.0, 38.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.25001525878906, -43.489776611328125, -29.729541778564453, -15.969306945800781, -2.2090682983398438, 11.551170349121094, 25.3114013671875, 39.07164001464844, 52.831878662109375, 66.59211730957031, 80.35235595703125, 94.11258697509766, 107.8728256225586, 121.63306427001953, 135.39329528808594, 149.15353393554688, 162.9137725830078, 176.67401123046875, 190.4342498779297, 204.19448852539062, 217.9547119140625, 231.7149658203125, 245.47518920898438, 259.23541259765625, 272.99566650390625, 286.7558898925781, 300.5161437988281, 314.2763671875, 328.03662109375, 341.7968444824219, 355.55706787109375, 369.31732177734375, 383.07757568359375, 396.8377990722656, 410.5980529785156, 424.3582763671875, 438.1185302734375, 451.8787536621094, 465.63897705078125, 479.39923095703125, 493.15948486328125, 506.9197082519531, 520.679931640625, 534.440185546875, 548.200439453125, 561.960693359375, 575.7208862304688, 589.4811401367188, 603.2413330078125, 617.0015869140625, 630.7617797851562, 644.5220336914062, 658.2822875976562, 672.0425415039062, 685.802734375, 699.56298828125, 713.3232421875, 727.08349609375, 740.8436889648438, 754.6039428710938, 768.3641967773438, 782.1244506835938, 795.8846435546875, 809.6448974609375, 823.4051513671875]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 8.0, 14.0, 11.0, 12.0, 12.0, 22.0, 26.0, 17.0, 16.0, 25.0, 29.0, 34.0, 41.0, 32.0, 33.0, 31.0, 41.0, 36.0, 38.0, 45.0, 39.0, 34.0, 39.0, 33.0, 44.0, 34.0, 24.0, 31.0, 30.0, 29.0, 14.0, 21.0, 16.0, 16.0, 10.0, 11.0, 8.0, 6.0, 8.0, 6.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-53.6789665222168, -52.08578872680664, -50.492610931396484, -48.89943313598633, -47.30625915527344, -45.71308135986328, -44.119903564453125, -42.52672576904297, -40.93354797363281, -39.340370178222656, -37.7471923828125, -36.154014587402344, -34.56083679199219, -32.9676628112793, -31.37448501586914, -29.781307220458984, -28.188129425048828, -26.594951629638672, -25.001773834228516, -23.408597946166992, -21.815420150756836, -20.22224235534668, -18.629066467285156, -17.035888671875, -15.442710876464844, -13.849533081054688, -12.256356239318848, -10.663179397583008, -9.070001602172852, -7.4768242835998535, -5.8836469650268555, -4.290470123291016, -2.6972923278808594, -1.1041150093078613, 0.4890623092651367, 2.0822396278381348, 3.675416946411133, 5.268594264984131, 6.861771583557129, 8.454948425292969, 10.048126220703125, 11.641304016113281, 13.234480857849121, 14.827657699584961, 16.420835494995117, 18.014013290405273, 19.607189178466797, 21.200366973876953, 22.79354476928711, 24.386722564697266, 25.979900360107422, 27.573076248168945, 29.1662540435791, 30.759431838989258, 32.35260772705078, 33.94578552246094, 35.538963317871094, 37.13214111328125, 38.725318908691406, 40.31849670410156, 41.91167449951172, 43.50484848022461, 45.098026275634766, 46.69120407104492, 48.28438186645508]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 11.0, 11.0, 9.0, 16.0, 11.0, 14.0, 20.0, 26.0, 27.0, 29.0, 17.0, 30.0, 35.0, 31.0, 32.0, 25.0, 36.0, 33.0, 39.0, 52.0, 38.0, 42.0, 49.0, 28.0, 42.0, 31.0, 42.0, 18.0, 26.0, 28.0, 23.0, 16.0, 19.0, 8.0, 15.0, 12.0, 7.0, 6.0, 6.0, 10.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.954345703125, -7.67431640625, -7.394287109375, -7.1142578125, -6.834228515625, -6.55419921875, -6.274169921875, -5.994140625, -5.714111328125, -5.43408203125, -5.154052734375, -4.8740234375, -4.593994140625, -4.31396484375, -4.033935546875, -3.75390625, -3.473876953125, -3.19384765625, -2.913818359375, -2.6337890625, -2.353759765625, -2.07373046875, -1.793701171875, -1.513671875, -1.233642578125, -0.95361328125, -0.673583984375, -0.3935546875, -0.113525390625, 0.16650390625, 0.446533203125, 0.7265625, 1.006591796875, 1.28662109375, 1.566650390625, 1.8466796875, 2.126708984375, 2.40673828125, 2.686767578125, 2.966796875, 3.246826171875, 3.52685546875, 3.806884765625, 4.0869140625, 4.366943359375, 4.64697265625, 4.927001953125, 5.20703125, 5.487060546875, 5.76708984375, 6.047119140625, 6.3271484375, 6.607177734375, 6.88720703125, 7.167236328125, 7.447265625, 7.727294921875, 8.00732421875, 8.287353515625, 8.5673828125, 8.847412109375, 9.12744140625, 9.407470703125, 9.6875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 9.0, 4.0, 22.0, 20.0, 38.0, 47.0, 64.0, 112.0, 165.0, 232.0, 362.0, 516.0, 858.0, 1235.0, 1801.0, 2998.0, 4770.0, 7420.0, 12060.0, 20361.0, 34497.0, 60416.0, 112154.0, 240919.0, 266268.0, 122022.0, 65438.0, 36883.0, 21851.0, 13030.0, 7993.0, 5019.0, 3126.0, 2020.0, 1203.0, 878.0, 558.0, 369.0, 252.0, 188.0, 104.0, 87.0, 66.0, 28.0, 27.0, 25.0, 11.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0], "bins": [-1.9775390625, -1.921142578125, -1.86474609375, -1.808349609375, -1.751953125, -1.695556640625, -1.63916015625, -1.582763671875, -1.5263671875, -1.469970703125, -1.41357421875, -1.357177734375, -1.30078125, -1.244384765625, -1.18798828125, -1.131591796875, -1.0751953125, -1.018798828125, -0.96240234375, -0.906005859375, -0.849609375, -0.793212890625, -0.73681640625, -0.680419921875, -0.6240234375, -0.567626953125, -0.51123046875, -0.454833984375, -0.3984375, -0.342041015625, -0.28564453125, -0.229248046875, -0.1728515625, -0.116455078125, -0.06005859375, -0.003662109375, 0.052734375, 0.109130859375, 0.16552734375, 0.221923828125, 0.2783203125, 0.334716796875, 0.39111328125, 0.447509765625, 0.50390625, 0.560302734375, 0.61669921875, 0.673095703125, 0.7294921875, 0.785888671875, 0.84228515625, 0.898681640625, 0.955078125, 1.011474609375, 1.06787109375, 1.124267578125, 1.1806640625, 1.237060546875, 1.29345703125, 1.349853515625, 1.40625, 1.462646484375, 1.51904296875, 1.575439453125, 1.6318359375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 8.0, 9.0, 9.0, 9.0, 8.0, 12.0, 16.0, 18.0, 13.0, 13.0, 21.0, 18.0, 19.0, 29.0, 28.0, 19.0, 29.0, 32.0, 38.0, 26.0, 40.0, 28.0, 1058.0, 43.0, 41.0, 47.0, 47.0, 37.0, 37.0, 22.0, 27.0, 19.0, 19.0, 20.0, 16.0, 18.0, 20.0, 18.0, 16.0, 13.0, 10.0, 13.0, 10.0, 9.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 4.0, 3.0], "bins": [-5.75, -5.5845947265625, -5.419189453125, -5.2537841796875, -5.08837890625, -4.9229736328125, -4.757568359375, -4.5921630859375, -4.4267578125, -4.2613525390625, -4.095947265625, -3.9305419921875, -3.76513671875, -3.5997314453125, -3.434326171875, -3.2689208984375, -3.103515625, -2.9381103515625, -2.772705078125, -2.6072998046875, -2.44189453125, -2.2764892578125, -2.111083984375, -1.9456787109375, -1.7802734375, -1.6148681640625, -1.449462890625, -1.2840576171875, -1.11865234375, -0.9532470703125, -0.787841796875, -0.6224365234375, -0.45703125, -0.2916259765625, -0.126220703125, 0.0391845703125, 0.20458984375, 0.3699951171875, 0.535400390625, 0.7008056640625, 0.8662109375, 1.0316162109375, 1.197021484375, 1.3624267578125, 1.52783203125, 1.6932373046875, 1.858642578125, 2.0240478515625, 2.189453125, 2.3548583984375, 2.520263671875, 2.6856689453125, 2.85107421875, 3.0164794921875, 3.181884765625, 3.3472900390625, 3.5126953125, 3.6781005859375, 3.843505859375, 4.0089111328125, 4.17431640625, 4.3397216796875, 4.505126953125, 4.6705322265625, 4.8359375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [7.0, 5.0, 15.0, 17.0, 22.0, 21.0, 42.0, 66.0, 62.0, 131.0, 155.0, 189.0, 291.0, 358.0, 581.0, 720.0, 1191.0, 1616.0, 2368.0, 3283.0, 5092.0, 7357.0, 10910.0, 16013.0, 23970.0, 36042.0, 58376.0, 102286.0, 201978.0, 1298563.0, 127855.0, 69891.0, 42479.0, 27613.0, 18248.0, 12554.0, 8297.0, 5626.0, 3944.0, 2699.0, 1909.0, 1253.0, 904.0, 628.0, 451.0, 288.0, 216.0, 155.0, 146.0, 75.0, 61.0, 39.0, 24.0, 19.0, 16.0, 13.0, 5.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3134765625, -1.2684478759765625, -1.223419189453125, -1.1783905029296875, -1.13336181640625, -1.0883331298828125, -1.043304443359375, -0.9982757568359375, -0.9532470703125, -0.9082183837890625, -0.863189697265625, -0.8181610107421875, -0.77313232421875, -0.7281036376953125, -0.683074951171875, -0.6380462646484375, -0.593017578125, -0.5479888916015625, -0.502960205078125, -0.4579315185546875, -0.41290283203125, -0.3678741455078125, -0.322845458984375, -0.2778167724609375, -0.2327880859375, -0.1877593994140625, -0.142730712890625, -0.0977020263671875, -0.05267333984375, -0.0076446533203125, 0.037384033203125, 0.0824127197265625, 0.12744140625, 0.1724700927734375, 0.217498779296875, 0.2625274658203125, 0.30755615234375, 0.3525848388671875, 0.397613525390625, 0.4426422119140625, 0.4876708984375, 0.5326995849609375, 0.577728271484375, 0.6227569580078125, 0.66778564453125, 0.7128143310546875, 0.757843017578125, 0.8028717041015625, 0.847900390625, 0.8929290771484375, 0.937957763671875, 0.9829864501953125, 1.02801513671875, 1.0730438232421875, 1.118072509765625, 1.1631011962890625, 1.2081298828125, 1.2531585693359375, 1.298187255859375, 1.3432159423828125, 1.38824462890625, 1.4332733154296875, 1.478302001953125, 1.5233306884765625, 1.568359375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 4.0, 0.0, 5.0, 4.0, 7.0, 14.0, 13.0, 11.0, 17.0, 17.0, 25.0, 19.0, 33.0, 41.0, 50.0, 76.0, 74.0, 85.0, 73.0, 63.0, 67.0, 54.0, 52.0, 48.0, 31.0, 22.0, 14.0, 21.0, 15.0, 15.0, 4.0, 5.0, 2.0, 4.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.002567291259765625, -0.002500012516975403, -0.0024327337741851807, -0.0023654550313949585, -0.0022981762886047363, -0.002230897545814514, -0.002163618803024292, -0.00209634006023407, -0.0020290613174438477, -0.0019617825746536255, -0.0018945038318634033, -0.0018272250890731812, -0.001759946346282959, -0.0016926676034927368, -0.0016253888607025146, -0.0015581101179122925, -0.0014908313751220703, -0.0014235526323318481, -0.001356273889541626, -0.0012889951467514038, -0.0012217164039611816, -0.0011544376611709595, -0.0010871589183807373, -0.0010198801755905151, -0.000952601432800293, -0.0008853226900100708, -0.0008180439472198486, -0.0007507652044296265, -0.0006834864616394043, -0.0006162077188491821, -0.00054892897605896, -0.0004816502332687378, -0.0004143714904785156, -0.00034709274768829346, -0.0002798140048980713, -0.00021253526210784912, -0.00014525651931762695, -7.797777652740479e-05, -1.0699033737182617e-05, 5.657970905303955e-05, 0.00012385845184326172, 0.0001911371946334839, 0.00025841593742370605, 0.0003256946802139282, 0.0003929734230041504, 0.00046025216579437256, 0.0005275309085845947, 0.0005948096513748169, 0.0006620883941650391, 0.0007293671369552612, 0.0007966458797454834, 0.0008639246225357056, 0.0009312033653259277, 0.00099848210811615, 0.001065760850906372, 0.0011330395936965942, 0.0012003183364868164, 0.0012675970792770386, 0.0013348758220672607, 0.001402154564857483, 0.001469433307647705, 0.0015367120504379272, 0.0016039907932281494, 0.0016712695360183716, 0.0017385482788085938]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 4.0, 11.0, 20.0, 10.0, 24.0, 37.0, 42.0, 49.0, 83.0, 109.0, 178.0, 314.0, 593.0, 2357.0, 1015118.0, 27607.0, 848.0, 394.0, 229.0, 123.0, 90.0, 73.0, 44.0, 32.0, 30.0, 19.0, 22.0, 27.0, 8.0, 8.0, 3.0, 7.0, 6.0, 4.0, 4.0, 4.0, 1.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033935546875, -0.03261566162109375, -0.0312957763671875, -0.02997589111328125, -0.028656005859375, -0.02733612060546875, -0.0260162353515625, -0.02469635009765625, -0.02337646484375, -0.02205657958984375, -0.0207366943359375, -0.01941680908203125, -0.018096923828125, -0.01677703857421875, -0.0154571533203125, -0.01413726806640625, -0.0128173828125, -0.01149749755859375, -0.0101776123046875, -0.00885772705078125, -0.007537841796875, -0.00621795654296875, -0.0048980712890625, -0.00357818603515625, -0.00225830078125, -0.00093841552734375, 0.0003814697265625, 0.00170135498046875, 0.003021240234375, 0.00434112548828125, 0.0056610107421875, 0.00698089599609375, 0.00830078125, 0.00962066650390625, 0.0109405517578125, 0.01226043701171875, 0.013580322265625, 0.01490020751953125, 0.0162200927734375, 0.01753997802734375, 0.01885986328125, 0.02017974853515625, 0.0214996337890625, 0.02281951904296875, 0.024139404296875, 0.02545928955078125, 0.0267791748046875, 0.02809906005859375, 0.0294189453125, 0.03073883056640625, 0.0320587158203125, 0.03337860107421875, 0.034698486328125, 0.03601837158203125, 0.0373382568359375, 0.03865814208984375, 0.03997802734375, 0.04129791259765625, 0.0426177978515625, 0.04393768310546875, 0.045257568359375, 0.04657745361328125, 0.0478973388671875, 0.04921722412109375, 0.050537109375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 20.0, 307.0, 571.0, 114.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008393684402108192, -0.008208485320210457, -0.008023286238312721, -0.007838087156414986, -0.007652888540178537, -0.007467689458280802, -0.007282490376383066, -0.007097291294485331, -0.006912092678248882, -0.006726893596351147, -0.006541694514453411, -0.0063564954325556755, -0.006171296816319227, -0.005986097734421492, -0.005800898652523756, -0.00561569957062602, -0.005430500488728285, -0.005245301406830549, -0.005060102324932814, -0.004874903708696365, -0.00468970462679863, -0.004504505544900894, -0.004319306463003159, -0.004134107381105423, -0.003948908299207687, -0.0037637092173099518, -0.00357851036824286, -0.0033933112863451242, -0.0032081124372780323, -0.0030229133553802967, -0.002837714273482561, -0.0026525151915848255, -0.00246731610968709, -0.0022821170277893543, -0.0020969181787222624, -0.0019117190968245268, -0.001726520131342113, -0.0015413211658596992, -0.0013561220839619637, -0.0011709231184795499, -0.0009857241529971361, -0.0008005251875147223, -0.0006153261638246477, -0.000430127140134573, -0.0002449281746521592, -5.9729209169745445e-05, 0.00012546987272799015, 0.0003106688382104039, 0.0004958678036928177, 0.0006810667691752315, 0.0008662657928653061, 0.0010514648165553808, 0.0012366637820377946, 0.0014218627475202084, 0.001607061829417944, 0.0017922607949003577, 0.0019774597603827715, 0.002162658842280507, 0.002347857691347599, 0.0025330567732453346, 0.0027182558551430702, 0.002903454704210162, 0.0030886537861078978, 0.0032738526351749897, 0.0034590517170727253]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 5.0, 7.0, 12.0, 9.0, 12.0, 14.0, 23.0, 26.0, 28.0, 30.0, 20.0, 38.0, 26.0, 31.0, 40.0, 41.0, 44.0, 37.0, 37.0, 50.0, 34.0, 41.0, 36.0, 33.0, 32.0, 33.0, 28.0, 30.0, 27.0, 34.0, 13.0, 28.0, 20.0, 13.0, 12.0, 11.0, 9.0, 3.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0011210441589355469, -0.0010897833853960037, -0.0010585226118564606, -0.0010272618383169174, -0.0009960010647773743, -0.0009647402912378311, -0.000933479517698288, -0.0009022187441587448, -0.0008709579706192017, -0.0008396971970796585, -0.0008084364235401154, -0.0007771756500005722, -0.000745914876461029, -0.0007146541029214859, -0.0006833933293819427, -0.0006521325558423996, -0.0006208717823028564, -0.0005896110087633133, -0.0005583502352237701, -0.000527089461684227, -0.0004958286881446838, -0.0004645679146051407, -0.00043330714106559753, -0.0004020463675260544, -0.00037078559398651123, -0.0003395248204469681, -0.0003082640469074249, -0.0002770032733678818, -0.0002457424998283386, -0.00021448172628879547, -0.00018322095274925232, -0.00015196017920970917, -0.00012069940567016602, -8.943863213062286e-05, -5.817785859107971e-05, -2.691708505153656e-05, 4.343688488006592e-06, 3.5604462027549744e-05, 6.68652355670929e-05, 9.812600910663605e-05, 0.0001293867826461792, 0.00016064755618572235, 0.0001919083297252655, 0.00022316910326480865, 0.0002544298768043518, 0.00028569065034389496, 0.0003169514238834381, 0.00034821219742298126, 0.0003794729709625244, 0.00041073374450206757, 0.0004419945180416107, 0.00047325529158115387, 0.000504516065120697, 0.0005357768386602402, 0.0005670376121997833, 0.0005982983857393265, 0.0006295591592788696, 0.0006608199328184128, 0.0006920807063579559, 0.0007233414798974991, 0.0007546022534370422, 0.0007858630269765854, 0.0008171238005161285, 0.0008483845740556717, 0.0008796453475952148]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 11.0, 11.0, 9.0, 16.0, 11.0, 14.0, 20.0, 26.0, 27.0, 29.0, 17.0, 30.0, 35.0, 31.0, 32.0, 25.0, 36.0, 33.0, 39.0, 52.0, 38.0, 42.0, 49.0, 28.0, 42.0, 31.0, 42.0, 18.0, 26.0, 28.0, 23.0, 16.0, 19.0, 8.0, 15.0, 12.0, 7.0, 6.0, 6.0, 10.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.954345703125, -7.67431640625, -7.394287109375, -7.1142578125, -6.834228515625, -6.55419921875, -6.274169921875, -5.994140625, -5.714111328125, -5.43408203125, -5.154052734375, -4.8740234375, -4.593994140625, -4.31396484375, -4.033935546875, -3.75390625, -3.473876953125, -3.19384765625, -2.913818359375, -2.6337890625, -2.353759765625, -2.07373046875, -1.793701171875, -1.513671875, -1.233642578125, -0.95361328125, -0.673583984375, -0.3935546875, -0.113525390625, 0.16650390625, 0.446533203125, 0.7265625, 1.006591796875, 1.28662109375, 1.566650390625, 1.8466796875, 2.126708984375, 2.40673828125, 2.686767578125, 2.966796875, 3.246826171875, 3.52685546875, 3.806884765625, 4.0869140625, 4.366943359375, 4.64697265625, 4.927001953125, 5.20703125, 5.487060546875, 5.76708984375, 6.047119140625, 6.3271484375, 6.607177734375, 6.88720703125, 7.167236328125, 7.447265625, 7.727294921875, 8.00732421875, 8.287353515625, 8.5673828125, 8.847412109375, 9.12744140625, 9.407470703125, 9.6875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 13.0, 4.0, 9.0, 18.0, 31.0, 32.0, 30.0, 52.0, 76.0, 72.0, 116.0, 124.0, 190.0, 246.0, 300.0, 435.0, 575.0, 1037.0, 2732.0, 10554.0, 53210.0, 600550.0, 330300.0, 35067.0, 7592.0, 2156.0, 858.0, 564.0, 388.0, 299.0, 221.0, 168.0, 131.0, 86.0, 71.0, 63.0, 36.0, 31.0, 23.0, 17.0, 14.0, 14.0, 9.0, 7.0, 11.0, 5.0, 4.0, 6.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.71875, -20.025390625, -19.33203125, -18.638671875, -17.9453125, -17.251953125, -16.55859375, -15.865234375, -15.171875, -14.478515625, -13.78515625, -13.091796875, -12.3984375, -11.705078125, -11.01171875, -10.318359375, -9.625, -8.931640625, -8.23828125, -7.544921875, -6.8515625, -6.158203125, -5.46484375, -4.771484375, -4.078125, -3.384765625, -2.69140625, -1.998046875, -1.3046875, -0.611328125, 0.08203125, 0.775390625, 1.46875, 2.162109375, 2.85546875, 3.548828125, 4.2421875, 4.935546875, 5.62890625, 6.322265625, 7.015625, 7.708984375, 8.40234375, 9.095703125, 9.7890625, 10.482421875, 11.17578125, 11.869140625, 12.5625, 13.255859375, 13.94921875, 14.642578125, 15.3359375, 16.029296875, 16.72265625, 17.416015625, 18.109375, 18.802734375, 19.49609375, 20.189453125, 20.8828125, 21.576171875, 22.26953125, 22.962890625, 23.65625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 9.0, 11.0, 9.0, 18.0, 6.0, 17.0, 19.0, 22.0, 29.0, 23.0, 47.0, 44.0, 40.0, 43.0, 60.0, 70.0, 173.0, 1546.0, 336.0, 114.0, 47.0, 46.0, 53.0, 44.0, 37.0, 21.0, 22.0, 25.0, 26.0, 28.0, 7.0, 12.0, 10.0, 13.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.78125, -32.77978515625, -31.7783203125, -30.77685546875, -29.775390625, -28.77392578125, -27.7724609375, -26.77099609375, -25.76953125, -24.76806640625, -23.7666015625, -22.76513671875, -21.763671875, -20.76220703125, -19.7607421875, -18.75927734375, -17.7578125, -16.75634765625, -15.7548828125, -14.75341796875, -13.751953125, -12.75048828125, -11.7490234375, -10.74755859375, -9.74609375, -8.74462890625, -7.7431640625, -6.74169921875, -5.740234375, -4.73876953125, -3.7373046875, -2.73583984375, -1.734375, -0.73291015625, 0.2685546875, 1.27001953125, 2.271484375, 3.27294921875, 4.2744140625, 5.27587890625, 6.27734375, 7.27880859375, 8.2802734375, 9.28173828125, 10.283203125, 11.28466796875, 12.2861328125, 13.28759765625, 14.2890625, 15.29052734375, 16.2919921875, 17.29345703125, 18.294921875, 19.29638671875, 20.2978515625, 21.29931640625, 22.30078125, 23.30224609375, 24.3037109375, 25.30517578125, 26.306640625, 27.30810546875, 28.3095703125, 29.31103515625, 30.3125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 12.0, 9.0, 20.0, 12.0, 16.0, 29.0, 27.0, 36.0, 29.0, 44.0, 72.0, 89.0, 156.0, 313.0, 636.0, 2486.0, 130690.0, 3000939.0, 7922.0, 1087.0, 366.0, 186.0, 131.0, 81.0, 73.0, 46.0, 44.0, 31.0, 27.0, 12.0, 16.0, 13.0, 14.0, 11.0, 7.0, 7.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.25, -81.4619140625, -78.673828125, -75.8857421875, -73.09765625, -70.3095703125, -67.521484375, -64.7333984375, -61.9453125, -59.1572265625, -56.369140625, -53.5810546875, -50.79296875, -48.0048828125, -45.216796875, -42.4287109375, -39.640625, -36.8525390625, -34.064453125, -31.2763671875, -28.48828125, -25.7001953125, -22.912109375, -20.1240234375, -17.3359375, -14.5478515625, -11.759765625, -8.9716796875, -6.18359375, -3.3955078125, -0.607421875, 2.1806640625, 4.96875, 7.7568359375, 10.544921875, 13.3330078125, 16.12109375, 18.9091796875, 21.697265625, 24.4853515625, 27.2734375, 30.0615234375, 32.849609375, 35.6376953125, 38.42578125, 41.2138671875, 44.001953125, 46.7900390625, 49.578125, 52.3662109375, 55.154296875, 57.9423828125, 60.73046875, 63.5185546875, 66.306640625, 69.0947265625, 71.8828125, 74.6708984375, 77.458984375, 80.2470703125, 83.03515625, 85.8232421875, 88.611328125, 91.3994140625, 94.1875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [3.0, 3.0, 42.0, 325.0, 484.0, 142.0, 17.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.861318588256836, -15.196775436401367, -10.532233238220215, -5.8676910400390625, -1.2031478881835938, 3.461395263671875, 8.125936508178711, 12.79047966003418, 17.45502281188965, 22.119565963745117, 26.784107208251953, 31.448650360107422, 36.11319351196289, 40.77773666381836, 45.44227600097656, 50.10681915283203, 54.7713623046875, 59.43590545654297, 64.10044860839844, 68.7649917602539, 73.42953491210938, 78.09407806396484, 82.75862121582031, 87.42315673828125, 92.08770751953125, 96.75225067138672, 101.41679382324219, 106.08133697509766, 110.74588012695312, 115.4104232788086, 120.07496643066406, 124.739501953125, 129.40403747558594, 134.06857299804688, 138.73312377929688, 143.3976593017578, 148.0622100830078, 152.72674560546875, 157.39129638671875, 162.0558319091797, 166.7203826904297, 171.38491821289062, 176.04946899414062, 180.71400451660156, 185.37855529785156, 190.0430908203125, 194.7076416015625, 199.37217712402344, 204.03671264648438, 208.7012481689453, 213.3657989501953, 218.03033447265625, 222.69488525390625, 227.3594207763672, 232.0239715576172, 236.68850708007812, 241.35305786132812, 246.01759338378906, 250.68214416503906, 255.3466796875, 260.01123046875, 264.67578125, 269.3403015136719, 274.0048522949219, 278.6694030761719]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 8.0, 3.0, 13.0, 5.0, 17.0, 10.0, 17.0, 22.0, 34.0, 25.0, 29.0, 24.0, 24.0, 21.0, 32.0, 31.0, 38.0, 36.0, 34.0, 41.0, 30.0, 42.0, 54.0, 43.0, 30.0, 29.0, 37.0, 34.0, 29.0, 24.0, 24.0, 20.0, 18.0, 24.0, 14.0, 20.0, 16.0, 15.0, 10.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.53705596923828, -72.21614837646484, -69.8952407836914, -67.57432556152344, -65.25341796875, -62.93251037597656, -60.611602783203125, -58.29069519042969, -55.969783782958984, -53.64887619018555, -51.327964782714844, -49.007057189941406, -46.68614959716797, -44.365238189697266, -42.04433059692383, -39.723419189453125, -37.40251159667969, -35.08160400390625, -32.76069259643555, -30.43978500366211, -28.11887550354004, -25.79796600341797, -23.47705841064453, -21.15614891052246, -18.83523941040039, -16.51432991027832, -14.193421363830566, -11.872512817382812, -9.551603317260742, -7.230693817138672, -4.909785270690918, -2.588876724243164, -0.267974853515625, 2.052934169769287, 4.373843193054199, 6.694752216339111, 9.015661239624023, 11.336570739746094, 13.657479286193848, 15.978387832641602, 18.299297332763672, 20.620206832885742, 22.941116333007812, 25.26202392578125, 27.58293342590332, 29.90384292602539, 32.22475051879883, 34.54566192626953, 36.86656951904297, 39.187477111816406, 41.50838851928711, 43.82929611206055, 46.15020751953125, 48.47111511230469, 50.792022705078125, 53.11293029785156, 55.433841705322266, 57.7547492980957, 60.075660705566406, 62.396568298339844, 64.71747589111328, 67.03839111328125, 69.35929870605469, 71.68020629882812, 74.00111389160156]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 1.0, 8.0, 8.0, 13.0, 9.0, 30.0, 20.0, 27.0, 18.0, 35.0, 37.0, 26.0, 23.0, 45.0, 29.0, 43.0, 36.0, 51.0, 41.0, 51.0, 41.0, 38.0, 54.0, 44.0, 22.0, 35.0, 29.0, 30.0, 24.0, 21.0, 13.0, 12.0, 17.0, 7.0, 10.0, 5.0, 8.0, 3.0, 8.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.7578125, -10.435546875, -10.11328125, -9.791015625, -9.46875, -9.146484375, -8.82421875, -8.501953125, -8.1796875, -7.857421875, -7.53515625, -7.212890625, -6.890625, -6.568359375, -6.24609375, -5.923828125, -5.6015625, -5.279296875, -4.95703125, -4.634765625, -4.3125, -3.990234375, -3.66796875, -3.345703125, -3.0234375, -2.701171875, -2.37890625, -2.056640625, -1.734375, -1.412109375, -1.08984375, -0.767578125, -0.4453125, -0.123046875, 0.19921875, 0.521484375, 0.84375, 1.166015625, 1.48828125, 1.810546875, 2.1328125, 2.455078125, 2.77734375, 3.099609375, 3.421875, 3.744140625, 4.06640625, 4.388671875, 4.7109375, 5.033203125, 5.35546875, 5.677734375, 6.0, 6.322265625, 6.64453125, 6.966796875, 7.2890625, 7.611328125, 7.93359375, 8.255859375, 8.578125, 8.900390625, 9.22265625, 9.544921875, 9.8671875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 14.0, 9.0, 11.0, 14.0, 18.0, 22.0, 29.0, 32.0, 57.0, 64.0, 82.0, 115.0, 139.0, 207.0, 271.0, 505.0, 1322.0, 5791.0, 46304.0, 530541.0, 2381272.0, 1103246.0, 109054.0, 11118.0, 2085.0, 731.0, 331.0, 222.0, 157.0, 128.0, 87.0, 63.0, 56.0, 36.0, 18.0, 31.0, 21.0, 16.0, 17.0, 15.0, 8.0, 2.0, 6.0, 5.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.0, -18.380615234375, -17.76123046875, -17.141845703125, -16.5224609375, -15.903076171875, -15.28369140625, -14.664306640625, -14.044921875, -13.425537109375, -12.80615234375, -12.186767578125, -11.5673828125, -10.947998046875, -10.32861328125, -9.709228515625, -9.08984375, -8.470458984375, -7.85107421875, -7.231689453125, -6.6123046875, -5.992919921875, -5.37353515625, -4.754150390625, -4.134765625, -3.515380859375, -2.89599609375, -2.276611328125, -1.6572265625, -1.037841796875, -0.41845703125, 0.200927734375, 0.8203125, 1.439697265625, 2.05908203125, 2.678466796875, 3.2978515625, 3.917236328125, 4.53662109375, 5.156005859375, 5.775390625, 6.394775390625, 7.01416015625, 7.633544921875, 8.2529296875, 8.872314453125, 9.49169921875, 10.111083984375, 10.73046875, 11.349853515625, 11.96923828125, 12.588623046875, 13.2080078125, 13.827392578125, 14.44677734375, 15.066162109375, 15.685546875, 16.304931640625, 16.92431640625, 17.543701171875, 18.1630859375, 18.782470703125, 19.40185546875, 20.021240234375, 20.640625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 7.0, 5.0, 5.0, 8.0, 8.0, 16.0, 22.0, 32.0, 34.0, 70.0, 63.0, 107.0, 163.0, 181.0, 263.0, 344.0, 352.0, 454.0, 439.0, 320.0, 303.0, 234.0, 165.0, 113.0, 104.0, 65.0, 39.0, 36.0, 23.0, 26.0, 16.0, 13.0, 11.0, 6.0, 3.0, 10.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-17.296875, -16.8123779296875, -16.327880859375, -15.8433837890625, -15.35888671875, -14.8743896484375, -14.389892578125, -13.9053955078125, -13.4208984375, -12.9364013671875, -12.451904296875, -11.9674072265625, -11.48291015625, -10.9984130859375, -10.513916015625, -10.0294189453125, -9.544921875, -9.0604248046875, -8.575927734375, -8.0914306640625, -7.60693359375, -7.1224365234375, -6.637939453125, -6.1534423828125, -5.6689453125, -5.1844482421875, -4.699951171875, -4.2154541015625, -3.73095703125, -3.2464599609375, -2.761962890625, -2.2774658203125, -1.79296875, -1.3084716796875, -0.823974609375, -0.3394775390625, 0.14501953125, 0.6295166015625, 1.114013671875, 1.5985107421875, 2.0830078125, 2.5675048828125, 3.052001953125, 3.5364990234375, 4.02099609375, 4.5054931640625, 4.989990234375, 5.4744873046875, 5.958984375, 6.4434814453125, 6.927978515625, 7.4124755859375, 7.89697265625, 8.3814697265625, 8.865966796875, 9.3504638671875, 9.8349609375, 10.3194580078125, 10.803955078125, 11.2884521484375, 11.77294921875, 12.2574462890625, 12.741943359375, 13.2264404296875, 13.7109375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 8.0, 10.0, 30.0, 29.0, 39.0, 73.0, 90.0, 112.0, 198.0, 309.0, 531.0, 968.0, 2866.0, 19056.0, 470511.0, 3513883.0, 170716.0, 10761.0, 2063.0, 799.0, 415.0, 275.0, 164.0, 104.0, 88.0, 42.0, 37.0, 20.0, 19.0, 12.0, 8.0, 17.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.75, -41.42919921875, -40.1083984375, -38.78759765625, -37.466796875, -36.14599609375, -34.8251953125, -33.50439453125, -32.18359375, -30.86279296875, -29.5419921875, -28.22119140625, -26.900390625, -25.57958984375, -24.2587890625, -22.93798828125, -21.6171875, -20.29638671875, -18.9755859375, -17.65478515625, -16.333984375, -15.01318359375, -13.6923828125, -12.37158203125, -11.05078125, -9.72998046875, -8.4091796875, -7.08837890625, -5.767578125, -4.44677734375, -3.1259765625, -1.80517578125, -0.484375, 0.83642578125, 2.1572265625, 3.47802734375, 4.798828125, 6.11962890625, 7.4404296875, 8.76123046875, 10.08203125, 11.40283203125, 12.7236328125, 14.04443359375, 15.365234375, 16.68603515625, 18.0068359375, 19.32763671875, 20.6484375, 21.96923828125, 23.2900390625, 24.61083984375, 25.931640625, 27.25244140625, 28.5732421875, 29.89404296875, 31.21484375, 32.53564453125, 33.8564453125, 35.17724609375, 36.498046875, 37.81884765625, 39.1396484375, 40.46044921875, 41.78125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 404.0, 584.0, 19.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.4840850830078, -152.35263061523438, -137.22117614746094, -122.08971405029297, -106.958251953125, -91.82679748535156, -76.69534301757812, -61.563880920410156, -46.43242645263672, -31.300968170166016, -16.169511795043945, -1.038055419921875, 14.093402862548828, 29.22486114501953, 44.35631561279297, 59.48777770996094, 74.61923217773438, 89.75068664550781, 104.88214874267578, 120.01360321044922, 135.1450653076172, 150.27651977539062, 165.40797424316406, 180.5394287109375, 195.6708984375, 210.80235290527344, 225.93380737304688, 241.06527709960938, 256.19671630859375, 271.32818603515625, 286.45965576171875, 301.5910949707031, 316.7225646972656, 331.8540344238281, 346.9854736328125, 362.116943359375, 377.2483825683594, 392.3798522949219, 407.51129150390625, 422.64276123046875, 437.77423095703125, 452.90570068359375, 468.0371398925781, 483.1686096191406, 498.300048828125, 513.4315185546875, 528.56298828125, 543.6944580078125, 558.8258666992188, 573.9573364257812, 589.0888061523438, 604.22021484375, 619.3516845703125, 634.483154296875, 649.6146240234375, 664.74609375, 679.8775634765625, 695.009033203125, 710.1405029296875, 725.2719116210938, 740.4033813476562, 755.5348510742188, 770.6663208007812, 785.7977905273438, 800.92919921875]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 13.0, 15.0, 9.0, 17.0, 9.0, 25.0, 27.0, 26.0, 30.0, 33.0, 39.0, 33.0, 46.0, 32.0, 49.0, 54.0, 52.0, 47.0, 37.0, 45.0, 38.0, 31.0, 32.0, 44.0, 24.0, 22.0, 23.0, 17.0, 22.0, 16.0, 17.0, 7.0, 13.0, 14.0, 11.0, 9.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-65.03279876708984, -63.19601058959961, -61.359222412109375, -59.52243423461914, -57.685646057128906, -55.84886169433594, -54.01206970214844, -52.17528533935547, -50.338497161865234, -48.501708984375, -46.664920806884766, -44.82813262939453, -42.9913444519043, -41.15455627441406, -39.317771911621094, -37.48098373413086, -35.644195556640625, -33.80740737915039, -31.970619201660156, -30.133831024169922, -28.29704475402832, -26.460256576538086, -24.62346839904785, -22.78668212890625, -20.94989013671875, -19.113101959228516, -17.27631378173828, -15.439526557922363, -13.602739334106445, -11.765951156616211, -9.929162979125977, -8.092375755310059, -6.255588531494141, -4.4188008308410645, -2.582012891769409, -0.7452249526977539, 1.0915627479553223, 2.9283504486083984, 4.765138626098633, 6.601925849914551, 8.438714027404785, 10.27550220489502, 12.112289428710938, 13.949077606201172, 15.785865783691406, 17.62265396118164, 19.459442138671875, 21.296228408813477, 23.13301658630371, 24.969804763793945, 26.80659294128418, 28.64337921142578, 30.480167388916016, 32.31695556640625, 34.153743743896484, 35.99053192138672, 37.82732009887695, 39.66410827636719, 41.50089645385742, 43.337684631347656, 45.17447280883789, 47.011260986328125, 48.848045349121094, 50.68483352661133, 52.52162170410156]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 9.0, 8.0, 17.0, 20.0, 14.0, 26.0, 27.0, 23.0, 33.0, 29.0, 32.0, 35.0, 48.0, 38.0, 44.0, 42.0, 56.0, 36.0, 38.0, 51.0, 44.0, 42.0, 46.0, 33.0, 25.0, 25.0, 18.0, 25.0, 25.0, 14.0, 15.0, 12.0, 7.0, 9.0, 6.0, 6.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.96875, -11.61279296875, -11.2568359375, -10.90087890625, -10.544921875, -10.18896484375, -9.8330078125, -9.47705078125, -9.12109375, -8.76513671875, -8.4091796875, -8.05322265625, -7.697265625, -7.34130859375, -6.9853515625, -6.62939453125, -6.2734375, -5.91748046875, -5.5615234375, -5.20556640625, -4.849609375, -4.49365234375, -4.1376953125, -3.78173828125, -3.42578125, -3.06982421875, -2.7138671875, -2.35791015625, -2.001953125, -1.64599609375, -1.2900390625, -0.93408203125, -0.578125, -0.22216796875, 0.1337890625, 0.48974609375, 0.845703125, 1.20166015625, 1.5576171875, 1.91357421875, 2.26953125, 2.62548828125, 2.9814453125, 3.33740234375, 3.693359375, 4.04931640625, 4.4052734375, 4.76123046875, 5.1171875, 5.47314453125, 5.8291015625, 6.18505859375, 6.541015625, 6.89697265625, 7.2529296875, 7.60888671875, 7.96484375, 8.32080078125, 8.6767578125, 9.03271484375, 9.388671875, 9.74462890625, 10.1005859375, 10.45654296875, 10.8125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 16.0, 11.0, 26.0, 39.0, 51.0, 81.0, 107.0, 167.0, 229.0, 366.0, 558.0, 846.0, 1243.0, 1935.0, 3156.0, 4742.0, 7559.0, 12493.0, 20764.0, 34768.0, 61530.0, 116430.0, 249036.0, 256323.0, 121483.0, 63216.0, 35702.0, 21195.0, 12765.0, 7851.0, 4950.0, 3174.0, 1983.0, 1254.0, 834.0, 565.0, 399.0, 224.0, 143.0, 110.0, 65.0, 49.0, 41.0, 22.0, 18.0, 11.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.0, -1.9394378662109375, -1.878875732421875, -1.8183135986328125, -1.75775146484375, -1.6971893310546875, -1.636627197265625, -1.5760650634765625, -1.5155029296875, -1.4549407958984375, -1.394378662109375, -1.3338165283203125, -1.27325439453125, -1.2126922607421875, -1.152130126953125, -1.0915679931640625, -1.031005859375, -0.9704437255859375, -0.909881591796875, -0.8493194580078125, -0.78875732421875, -0.7281951904296875, -0.667633056640625, -0.6070709228515625, -0.5465087890625, -0.4859466552734375, -0.425384521484375, -0.3648223876953125, -0.30426025390625, -0.2436981201171875, -0.183135986328125, -0.1225738525390625, -0.06201171875, -0.0014495849609375, 0.059112548828125, 0.1196746826171875, 0.18023681640625, 0.2407989501953125, 0.301361083984375, 0.3619232177734375, 0.4224853515625, 0.4830474853515625, 0.543609619140625, 0.6041717529296875, 0.66473388671875, 0.7252960205078125, 0.785858154296875, 0.8464202880859375, 0.906982421875, 0.9675445556640625, 1.028106689453125, 1.0886688232421875, 1.14923095703125, 1.2097930908203125, 1.270355224609375, 1.3309173583984375, 1.3914794921875, 1.4520416259765625, 1.512603759765625, 1.5731658935546875, 1.63372802734375, 1.6942901611328125, 1.754852294921875, 1.8154144287109375, 1.8759765625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 8.0, 14.0, 15.0, 16.0, 14.0, 28.0, 18.0, 26.0, 29.0, 33.0, 27.0, 33.0, 33.0, 37.0, 36.0, 38.0, 43.0, 1064.0, 37.0, 34.0, 36.0, 44.0, 31.0, 37.0, 32.0, 38.0, 27.0, 24.0, 20.0, 18.0, 17.0, 21.0, 14.0, 17.0, 11.0, 6.0, 8.0, 5.0, 9.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.20660400390625, -5.9991455078125, -5.79168701171875, -5.584228515625, -5.37677001953125, -5.1693115234375, -4.96185302734375, -4.75439453125, -4.54693603515625, -4.3394775390625, -4.13201904296875, -3.924560546875, -3.71710205078125, -3.5096435546875, -3.30218505859375, -3.0947265625, -2.88726806640625, -2.6798095703125, -2.47235107421875, -2.264892578125, -2.05743408203125, -1.8499755859375, -1.64251708984375, -1.43505859375, -1.22760009765625, -1.0201416015625, -0.81268310546875, -0.605224609375, -0.39776611328125, -0.1903076171875, 0.01715087890625, 0.224609375, 0.43206787109375, 0.6395263671875, 0.84698486328125, 1.054443359375, 1.26190185546875, 1.4693603515625, 1.67681884765625, 1.88427734375, 2.09173583984375, 2.2991943359375, 2.50665283203125, 2.714111328125, 2.92156982421875, 3.1290283203125, 3.33648681640625, 3.5439453125, 3.75140380859375, 3.9588623046875, 4.16632080078125, 4.373779296875, 4.58123779296875, 4.7886962890625, 4.99615478515625, 5.20361328125, 5.41107177734375, 5.6185302734375, 5.82598876953125, 6.033447265625, 6.24090576171875, 6.4483642578125, 6.65582275390625, 6.86328125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 5.0, 10.0, 16.0, 21.0, 26.0, 43.0, 74.0, 94.0, 133.0, 172.0, 285.0, 396.0, 626.0, 862.0, 1211.0, 1928.0, 3010.0, 4512.0, 6923.0, 11118.0, 16942.0, 26911.0, 42586.0, 71517.0, 131329.0, 1309561.0, 205896.0, 103081.0, 58035.0, 35642.0, 22775.0, 14269.0, 9338.0, 6108.0, 3857.0, 2593.0, 1602.0, 1187.0, 732.0, 518.0, 386.0, 261.0, 157.0, 120.0, 75.0, 55.0, 39.0, 32.0, 20.0, 18.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.75, -1.6949920654296875, -1.639984130859375, -1.5849761962890625, -1.52996826171875, -1.4749603271484375, -1.419952392578125, -1.3649444580078125, -1.3099365234375, -1.2549285888671875, -1.199920654296875, -1.1449127197265625, -1.08990478515625, -1.0348968505859375, -0.979888916015625, -0.9248809814453125, -0.869873046875, -0.8148651123046875, -0.759857177734375, -0.7048492431640625, -0.64984130859375, -0.5948333740234375, -0.539825439453125, -0.4848175048828125, -0.4298095703125, -0.3748016357421875, -0.319793701171875, -0.2647857666015625, -0.20977783203125, -0.1547698974609375, -0.099761962890625, -0.0447540283203125, 0.01025390625, 0.0652618408203125, 0.120269775390625, 0.1752777099609375, 0.23028564453125, 0.2852935791015625, 0.340301513671875, 0.3953094482421875, 0.4503173828125, 0.5053253173828125, 0.560333251953125, 0.6153411865234375, 0.67034912109375, 0.7253570556640625, 0.780364990234375, 0.8353729248046875, 0.890380859375, 0.9453887939453125, 1.000396728515625, 1.0554046630859375, 1.11041259765625, 1.1654205322265625, 1.220428466796875, 1.2754364013671875, 1.3304443359375, 1.3854522705078125, 1.440460205078125, 1.4954681396484375, 1.55047607421875, 1.6054840087890625, 1.660491943359375, 1.7154998779296875, 1.7705078125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 3.0, 5.0, 4.0, 5.0, 5.0, 2.0, 4.0, 7.0, 10.0, 4.0, 10.0, 14.0, 17.0, 23.0, 23.0, 29.0, 28.0, 29.0, 42.0, 40.0, 36.0, 53.0, 56.0, 51.0, 40.0, 53.0, 52.0, 50.0, 48.0, 41.0, 31.0, 26.0, 26.0, 16.0, 22.0, 16.0, 9.0, 14.0, 15.0, 6.0, 12.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0018529891967773438, -0.0017946064472198486, -0.0017362236976623535, -0.0016778409481048584, -0.0016194581985473633, -0.0015610754489898682, -0.001502692699432373, -0.001444309949874878, -0.0013859272003173828, -0.0013275444507598877, -0.0012691617012023926, -0.0012107789516448975, -0.0011523962020874023, -0.0010940134525299072, -0.0010356307029724121, -0.000977247953414917, -0.0009188652038574219, -0.0008604824542999268, -0.0008020997047424316, -0.0007437169551849365, -0.0006853342056274414, -0.0006269514560699463, -0.0005685687065124512, -0.0005101859569549561, -0.00045180320739746094, -0.0003934204578399658, -0.0003350377082824707, -0.0002766549587249756, -0.00021827220916748047, -0.00015988945960998535, -0.00010150671005249023, -4.312396049499512e-05, 1.52587890625e-05, 7.364153861999512e-05, 0.00013202428817749023, 0.00019040703773498535, 0.00024878978729248047, 0.0003071725368499756, 0.0003655552864074707, 0.0004239380359649658, 0.00048232078552246094, 0.0005407035350799561, 0.0005990862846374512, 0.0006574690341949463, 0.0007158517837524414, 0.0007742345333099365, 0.0008326172828674316, 0.0008910000324249268, 0.0009493827819824219, 0.001007765531539917, 0.0010661482810974121, 0.0011245310306549072, 0.0011829137802124023, 0.0012412965297698975, 0.0012996792793273926, 0.0013580620288848877, 0.0014164447784423828, 0.001474827527999878, 0.001533210277557373, 0.0015915930271148682, 0.0016499757766723633, 0.0017083585262298584, 0.0017667412757873535, 0.0018251240253448486, 0.0018835067749023438]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 3.0, 7.0, 4.0, 4.0, 9.0, 14.0, 10.0, 23.0, 21.0, 25.0, 27.0, 31.0, 36.0, 67.0, 64.0, 93.0, 118.0, 175.0, 243.0, 339.0, 663.0, 2151.0, 643545.0, 397279.0, 1757.0, 600.0, 325.0, 196.0, 169.0, 111.0, 89.0, 68.0, 61.0, 36.0, 31.0, 20.0, 24.0, 19.0, 9.0, 12.0, 8.0, 10.0, 9.0, 9.0, 8.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.03521728515625, -0.03411531448364258, -0.033013343811035156, -0.031911373138427734, -0.030809402465820312, -0.02970743179321289, -0.02860546112060547, -0.027503490447998047, -0.026401519775390625, -0.025299549102783203, -0.02419757843017578, -0.02309560775756836, -0.021993637084960938, -0.020891666412353516, -0.019789695739746094, -0.018687725067138672, -0.01758575439453125, -0.016483783721923828, -0.015381813049316406, -0.014279842376708984, -0.013177871704101562, -0.01207590103149414, -0.010973930358886719, -0.009871959686279297, -0.008769989013671875, -0.007668018341064453, -0.006566047668457031, -0.005464076995849609, -0.0043621063232421875, -0.0032601356506347656, -0.0021581649780273438, -0.0010561943054199219, 4.57763671875e-05, 0.0011477470397949219, 0.0022497177124023438, 0.0033516883850097656, 0.0044536590576171875, 0.005555629730224609, 0.006657600402832031, 0.007759571075439453, 0.008861541748046875, 0.009963512420654297, 0.011065483093261719, 0.01216745376586914, 0.013269424438476562, 0.014371395111083984, 0.015473365783691406, 0.016575336456298828, 0.01767730712890625, 0.018779277801513672, 0.019881248474121094, 0.020983219146728516, 0.022085189819335938, 0.02318716049194336, 0.02428913116455078, 0.025391101837158203, 0.026493072509765625, 0.027595043182373047, 0.02869701385498047, 0.02979898452758789, 0.030900955200195312, 0.032002925872802734, 0.033104896545410156, 0.03420686721801758, 0.035308837890625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 20.0, 48.0, 120.0, 204.0, 236.0, 187.0, 101.0, 52.0, 19.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012192301219329238, -0.0011452160542830825, -0.001071202103048563, -0.0009971880353987217, -0.0009231739677488804, -0.0008491599583067, -0.0007751459488645196, -0.0007011318812146783, -0.0006271178717724979, -0.0005531038623303175, -0.0004790897946804762, -0.0004050757852382958, -0.00033106174669228494, -0.0002570477081462741, -0.0001830336987040937, -0.00010901963105425239, -3.500562161207199e-05, 3.900840965798125e-05, 0.00011302244092803448, 0.0001870364649221301, 0.00026105050346814096, 0.0003350645420141518, 0.0004090785514563322, 0.0004830926191061735, 0.0005571066285483539, 0.0006311206379905343, 0.0007051347056403756, 0.000779148715082556, 0.0008531627245247364, 0.0009271767921745777, 0.001001190859824419, 0.0010752049274742603, 0.001149218762293458, 0.0012232328299432993, 0.0012972467811778188, 0.00137126084882766, 0.0014452749164775014, 0.0015192888677120209, 0.0015933029353618622, 0.0016673170030117035, 0.0017413310706615448, 0.001815345138311386, 0.0018893590895459056, 0.0019633732736110687, 0.0020373871084302664, 0.0021114011760801077, 0.002185415243729949, 0.0022594293113797903, 0.002333443146198988, 0.0024074572138488293, 0.0024814712814986706, 0.002555485349148512, 0.0026294991839677095, 0.002703513251617551, 0.002777527319267392, 0.0028515413869172335, 0.0029255554545670748, 0.002999569522216916, 0.0030735835898667574, 0.003147597424685955, 0.0032216114923357964, 0.0032956255599856377, 0.003369639627635479, 0.0034436536952853203, 0.0035176677629351616]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 4.0, 7.0, 6.0, 12.0, 11.0, 18.0, 15.0, 20.0, 29.0, 29.0, 32.0, 30.0, 39.0, 41.0, 48.0, 41.0, 50.0, 48.0, 54.0, 48.0, 41.0, 44.0, 49.0, 44.0, 39.0, 25.0, 29.0, 28.0, 19.0, 19.0, 20.0, 15.0, 13.0, 7.0, 3.0, 9.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0013067126274108887, -0.0012669125571846962, -0.0012271124869585037, -0.0011873124167323112, -0.0011475123465061188, -0.0011077122762799263, -0.0010679122060537338, -0.0010281121358275414, -0.0009883120656013489, -0.0009485119953751564, -0.0009087119251489639, -0.0008689118549227715, -0.000829111784696579, -0.0007893117144703865, -0.000749511644244194, -0.0007097115740180016, -0.0006699115037918091, -0.0006301114335656166, -0.0005903113633394241, -0.0005505112931132317, -0.0005107112228870392, -0.0004709111526608467, -0.00043111108243465424, -0.00039131101220846176, -0.0003515109419822693, -0.0003117108717560768, -0.00027191080152988434, -0.00023211073130369186, -0.0001923106610774994, -0.00015251059085130692, -0.00011271052062511444, -7.291045039892197e-05, -3.311038017272949e-05, 6.689690053462982e-06, 4.6489760279655457e-05, 8.628983050584793e-05, 0.0001260899007320404, 0.00016588997095823288, 0.00020569004118442535, 0.00024549011141061783, 0.0002852901816368103, 0.0003250902518630028, 0.00036489032208919525, 0.0004046903923153877, 0.0004444904625415802, 0.0004842905327677727, 0.0005240906029939651, 0.0005638906732201576, 0.0006036907434463501, 0.0006434908136725426, 0.000683290883898735, 0.0007230909541249275, 0.00076289102435112, 0.0008026910945773125, 0.0008424911648035049, 0.0008822912350296974, 0.0009220913052558899, 0.0009618913754820824, 0.0010016914457082748, 0.0010414915159344673, 0.0010812915861606598, 0.0011210916563868523, 0.0011608917266130447, 0.0012006917968392372, 0.0012404918670654297]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 9.0, 8.0, 17.0, 20.0, 14.0, 26.0, 27.0, 23.0, 33.0, 29.0, 32.0, 35.0, 48.0, 38.0, 44.0, 42.0, 56.0, 37.0, 37.0, 51.0, 44.0, 42.0, 46.0, 33.0, 25.0, 25.0, 18.0, 25.0, 25.0, 14.0, 15.0, 12.0, 7.0, 9.0, 6.0, 6.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.96875, -11.61279296875, -11.2568359375, -10.90087890625, -10.544921875, -10.18896484375, -9.8330078125, -9.47705078125, -9.12109375, -8.76513671875, -8.4091796875, -8.05322265625, -7.697265625, -7.34130859375, -6.9853515625, -6.62939453125, -6.2734375, -5.91748046875, -5.5615234375, -5.20556640625, -4.849609375, -4.49365234375, -4.1376953125, -3.78173828125, -3.42578125, -3.06982421875, -2.7138671875, -2.35791015625, -2.001953125, -1.64599609375, -1.2900390625, -0.93408203125, -0.578125, -0.22216796875, 0.1337890625, 0.48974609375, 0.845703125, 1.20166015625, 1.5576171875, 1.91357421875, 2.26953125, 2.62548828125, 2.9814453125, 3.33740234375, 3.693359375, 4.04931640625, 4.4052734375, 4.76123046875, 5.1171875, 5.47314453125, 5.8291015625, 6.18505859375, 6.541015625, 6.89697265625, 7.2529296875, 7.60888671875, 7.96484375, 8.32080078125, 8.6767578125, 9.03271484375, 9.388671875, 9.74462890625, 10.1005859375, 10.45654296875, 10.8125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 7.0, 10.0, 16.0, 19.0, 26.0, 36.0, 47.0, 66.0, 79.0, 119.0, 152.0, 271.0, 417.0, 701.0, 1338.0, 2724.0, 6240.0, 15410.0, 42784.0, 122643.0, 354440.0, 325930.0, 110797.0, 38725.0, 14312.0, 5594.0, 2540.0, 1231.0, 656.0, 373.0, 237.0, 181.0, 113.0, 92.0, 50.0, 45.0, 32.0, 37.0, 16.0, 13.0, 13.0, 3.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.453125, -14.0145263671875, -13.575927734375, -13.1373291015625, -12.69873046875, -12.2601318359375, -11.821533203125, -11.3829345703125, -10.9443359375, -10.5057373046875, -10.067138671875, -9.6285400390625, -9.18994140625, -8.7513427734375, -8.312744140625, -7.8741455078125, -7.435546875, -6.9969482421875, -6.558349609375, -6.1197509765625, -5.68115234375, -5.2425537109375, -4.803955078125, -4.3653564453125, -3.9267578125, -3.4881591796875, -3.049560546875, -2.6109619140625, -2.17236328125, -1.7337646484375, -1.295166015625, -0.8565673828125, -0.41796875, 0.0206298828125, 0.459228515625, 0.8978271484375, 1.33642578125, 1.7750244140625, 2.213623046875, 2.6522216796875, 3.0908203125, 3.5294189453125, 3.968017578125, 4.4066162109375, 4.84521484375, 5.2838134765625, 5.722412109375, 6.1610107421875, 6.599609375, 7.0382080078125, 7.476806640625, 7.9154052734375, 8.35400390625, 8.7926025390625, 9.231201171875, 9.6697998046875, 10.1083984375, 10.5469970703125, 10.985595703125, 11.4241943359375, 11.86279296875, 12.3013916015625, 12.739990234375, 13.1785888671875, 13.6171875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 3.0, 4.0, 8.0, 8.0, 11.0, 6.0, 6.0, 5.0, 14.0, 21.0, 24.0, 23.0, 21.0, 20.0, 30.0, 32.0, 26.0, 56.0, 52.0, 82.0, 119.0, 219.0, 1517.0, 198.0, 102.0, 46.0, 54.0, 48.0, 33.0, 27.0, 31.0, 19.0, 24.0, 22.0, 16.0, 18.0, 14.0, 21.0, 8.0, 11.0, 9.0, 9.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.671875, -27.75927734375, -26.8466796875, -25.93408203125, -25.021484375, -24.10888671875, -23.1962890625, -22.28369140625, -21.37109375, -20.45849609375, -19.5458984375, -18.63330078125, -17.720703125, -16.80810546875, -15.8955078125, -14.98291015625, -14.0703125, -13.15771484375, -12.2451171875, -11.33251953125, -10.419921875, -9.50732421875, -8.5947265625, -7.68212890625, -6.76953125, -5.85693359375, -4.9443359375, -4.03173828125, -3.119140625, -2.20654296875, -1.2939453125, -0.38134765625, 0.53125, 1.44384765625, 2.3564453125, 3.26904296875, 4.181640625, 5.09423828125, 6.0068359375, 6.91943359375, 7.83203125, 8.74462890625, 9.6572265625, 10.56982421875, 11.482421875, 12.39501953125, 13.3076171875, 14.22021484375, 15.1328125, 16.04541015625, 16.9580078125, 17.87060546875, 18.783203125, 19.69580078125, 20.6083984375, 21.52099609375, 22.43359375, 23.34619140625, 24.2587890625, 25.17138671875, 26.083984375, 26.99658203125, 27.9091796875, 28.82177734375, 29.734375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 8.0, 17.0, 12.0, 12.0, 17.0, 17.0, 29.0, 39.0, 44.0, 68.0, 137.0, 180.0, 317.0, 465.0, 860.0, 4877.0, 265748.0, 2840737.0, 28887.0, 1559.0, 612.0, 337.0, 232.0, 131.0, 99.0, 67.0, 47.0, 31.0, 31.0, 20.0, 15.0, 12.0, 7.0, 4.0, 2.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.53125, -56.38330078125, -54.2353515625, -52.08740234375, -49.939453125, -47.79150390625, -45.6435546875, -43.49560546875, -41.34765625, -39.19970703125, -37.0517578125, -34.90380859375, -32.755859375, -30.60791015625, -28.4599609375, -26.31201171875, -24.1640625, -22.01611328125, -19.8681640625, -17.72021484375, -15.572265625, -13.42431640625, -11.2763671875, -9.12841796875, -6.98046875, -4.83251953125, -2.6845703125, -0.53662109375, 1.611328125, 3.75927734375, 5.9072265625, 8.05517578125, 10.203125, 12.35107421875, 14.4990234375, 16.64697265625, 18.794921875, 20.94287109375, 23.0908203125, 25.23876953125, 27.38671875, 29.53466796875, 31.6826171875, 33.83056640625, 35.978515625, 38.12646484375, 40.2744140625, 42.42236328125, 44.5703125, 46.71826171875, 48.8662109375, 51.01416015625, 53.162109375, 55.31005859375, 57.4580078125, 59.60595703125, 61.75390625, 63.90185546875, 66.0498046875, 68.19775390625, 70.345703125, 72.49365234375, 74.6416015625, 76.78955078125, 78.9375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 37.0, 52.0, 134.0, 209.0, 229.0, 164.0, 99.0, 53.0, 17.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.11601257324219, -66.57567596435547, -64.03533935546875, -61.49501037597656, -58.954673767089844, -56.414337158203125, -53.87400436401367, -51.33367156982422, -48.7933349609375, -46.25299835205078, -43.71266555786133, -41.172332763671875, -38.631996154785156, -36.09165954589844, -33.551326751708984, -31.0109920501709, -28.470657348632812, -25.930322647094727, -23.38998794555664, -20.849653244018555, -18.30931854248047, -15.768983840942383, -13.228649139404297, -10.688314437866211, -8.147979736328125, -5.607645034790039, -3.067310333251953, -0.5269756317138672, 2.0133590698242188, 4.553693771362305, 7.094028472900391, 9.634363174438477, 12.174697875976562, 14.715032577514648, 17.255367279052734, 19.79570198059082, 22.336036682128906, 24.876371383666992, 27.416706085205078, 29.957040786743164, 32.49737548828125, 35.03771209716797, 37.57804489135742, 40.118377685546875, 42.658714294433594, 45.19905090332031, 47.739383697509766, 50.27971649169922, 52.82005310058594, 55.360389709472656, 57.90072250366211, 60.44105529785156, 62.98139190673828, 65.521728515625, 68.06205749511719, 70.6023941040039, 73.14273071289062, 75.68306732177734, 78.22340393066406, 80.76373291015625, 83.30406951904297, 85.84440612792969, 88.38473510742188, 90.9250717163086, 93.46540832519531]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 10.0, 6.0, 14.0, 7.0, 16.0, 15.0, 13.0, 20.0, 20.0, 27.0, 21.0, 22.0, 18.0, 29.0, 37.0, 33.0, 32.0, 37.0, 38.0, 37.0, 36.0, 41.0, 42.0, 49.0, 38.0, 37.0, 33.0, 35.0, 23.0, 30.0, 23.0, 20.0, 22.0, 18.0, 11.0, 7.0, 16.0, 8.0, 8.0, 9.0, 5.0, 8.0, 2.0, 4.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 4.0], "bins": [-70.0136947631836, -67.9543685913086, -65.8950424194336, -63.83572006225586, -61.77639389038086, -59.71706771850586, -57.657745361328125, -55.598419189453125, -53.539093017578125, -51.479766845703125, -49.420440673828125, -47.36111831665039, -45.30179214477539, -43.24246597290039, -41.183143615722656, -39.123817443847656, -37.064491271972656, -35.005165100097656, -32.945838928222656, -30.886516571044922, -28.827190399169922, -26.767864227294922, -24.708539962768555, -22.649215698242188, -20.589889526367188, -18.530563354492188, -16.47123908996582, -14.411913871765137, -12.352588653564453, -10.29326343536377, -8.233938217163086, -6.174612998962402, -4.115287780761719, -2.055962562561035, 0.0033626556396484375, 2.062687873840332, 4.122013092041016, 6.181338310241699, 8.240663528442383, 10.299988746643066, 12.35931396484375, 14.418639183044434, 16.477964401245117, 18.537288665771484, 20.596614837646484, 22.655941009521484, 24.71526527404785, 26.77458953857422, 28.83391571044922, 30.89324188232422, 32.95256805419922, 35.01189041137695, 37.07121658325195, 39.13054275512695, 41.18986511230469, 43.24919128417969, 45.30851745605469, 47.36784362792969, 49.42716979980469, 51.48649215698242, 53.54581832885742, 55.60514450073242, 57.664466857910156, 59.723793029785156, 61.783119201660156]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 11.0, 6.0, 13.0, 10.0, 18.0, 23.0, 19.0, 20.0, 28.0, 35.0, 39.0, 36.0, 40.0, 35.0, 36.0, 48.0, 41.0, 60.0, 34.0, 58.0, 52.0, 39.0, 48.0, 39.0, 28.0, 28.0, 32.0, 28.0, 16.0, 12.0, 13.0, 12.0, 5.0, 11.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.34375, -12.954345703125, -12.56494140625, -12.175537109375, -11.7861328125, -11.396728515625, -11.00732421875, -10.617919921875, -10.228515625, -9.839111328125, -9.44970703125, -9.060302734375, -8.6708984375, -8.281494140625, -7.89208984375, -7.502685546875, -7.11328125, -6.723876953125, -6.33447265625, -5.945068359375, -5.5556640625, -5.166259765625, -4.77685546875, -4.387451171875, -3.998046875, -3.608642578125, -3.21923828125, -2.829833984375, -2.4404296875, -2.051025390625, -1.66162109375, -1.272216796875, -0.8828125, -0.493408203125, -0.10400390625, 0.285400390625, 0.6748046875, 1.064208984375, 1.45361328125, 1.843017578125, 2.232421875, 2.621826171875, 3.01123046875, 3.400634765625, 3.7900390625, 4.179443359375, 4.56884765625, 4.958251953125, 5.34765625, 5.737060546875, 6.12646484375, 6.515869140625, 6.9052734375, 7.294677734375, 7.68408203125, 8.073486328125, 8.462890625, 8.852294921875, 9.24169921875, 9.631103515625, 10.0205078125, 10.409912109375, 10.79931640625, 11.188720703125, 11.578125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 7.0, 9.0, 8.0, 18.0, 15.0, 22.0, 24.0, 45.0, 46.0, 74.0, 100.0, 154.0, 255.0, 507.0, 986.0, 2425.0, 7829.0, 34535.0, 186863.0, 877943.0, 1825428.0, 980177.0, 222180.0, 40431.0, 9071.0, 2647.0, 1073.0, 541.0, 267.0, 143.0, 135.0, 90.0, 52.0, 34.0, 28.0, 23.0, 21.0, 12.0, 13.0, 11.0, 9.0, 9.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-14.640625, -14.1907958984375, -13.740966796875, -13.2911376953125, -12.84130859375, -12.3914794921875, -11.941650390625, -11.4918212890625, -11.0419921875, -10.5921630859375, -10.142333984375, -9.6925048828125, -9.24267578125, -8.7928466796875, -8.343017578125, -7.8931884765625, -7.443359375, -6.9935302734375, -6.543701171875, -6.0938720703125, -5.64404296875, -5.1942138671875, -4.744384765625, -4.2945556640625, -3.8447265625, -3.3948974609375, -2.945068359375, -2.4952392578125, -2.04541015625, -1.5955810546875, -1.145751953125, -0.6959228515625, -0.24609375, 0.2037353515625, 0.653564453125, 1.1033935546875, 1.55322265625, 2.0030517578125, 2.452880859375, 2.9027099609375, 3.3525390625, 3.8023681640625, 4.252197265625, 4.7020263671875, 5.15185546875, 5.6016845703125, 6.051513671875, 6.5013427734375, 6.951171875, 7.4010009765625, 7.850830078125, 8.3006591796875, 8.75048828125, 9.2003173828125, 9.650146484375, 10.0999755859375, 10.5498046875, 10.9996337890625, 11.449462890625, 11.8992919921875, 12.34912109375, 12.7989501953125, 13.248779296875, 13.6986083984375, 14.1484375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 9.0, 11.0, 6.0, 21.0, 36.0, 43.0, 47.0, 75.0, 81.0, 109.0, 200.0, 229.0, 388.0, 442.0, 498.0, 444.0, 403.0, 303.0, 213.0, 140.0, 127.0, 66.0, 43.0, 39.0, 25.0, 23.0, 14.0, 9.0, 7.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.953125, -18.435546875, -17.91796875, -17.400390625, -16.8828125, -16.365234375, -15.84765625, -15.330078125, -14.8125, -14.294921875, -13.77734375, -13.259765625, -12.7421875, -12.224609375, -11.70703125, -11.189453125, -10.671875, -10.154296875, -9.63671875, -9.119140625, -8.6015625, -8.083984375, -7.56640625, -7.048828125, -6.53125, -6.013671875, -5.49609375, -4.978515625, -4.4609375, -3.943359375, -3.42578125, -2.908203125, -2.390625, -1.873046875, -1.35546875, -0.837890625, -0.3203125, 0.197265625, 0.71484375, 1.232421875, 1.75, 2.267578125, 2.78515625, 3.302734375, 3.8203125, 4.337890625, 4.85546875, 5.373046875, 5.890625, 6.408203125, 6.92578125, 7.443359375, 7.9609375, 8.478515625, 8.99609375, 9.513671875, 10.03125, 10.548828125, 11.06640625, 11.583984375, 12.1015625, 12.619140625, 13.13671875, 13.654296875, 14.171875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 8.0, 8.0, 11.0, 17.0, 14.0, 48.0, 36.0, 80.0, 105.0, 207.0, 348.0, 680.0, 1737.0, 5279.0, 20509.0, 116384.0, 1144636.0, 2542105.0, 305497.0, 42473.0, 9195.0, 2658.0, 1080.0, 457.0, 260.0, 158.0, 92.0, 60.0, 30.0, 34.0, 15.0, 19.0, 11.0, 4.0, 10.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.203125, -24.444580078125, -23.68603515625, -22.927490234375, -22.1689453125, -21.410400390625, -20.65185546875, -19.893310546875, -19.134765625, -18.376220703125, -17.61767578125, -16.859130859375, -16.1005859375, -15.342041015625, -14.58349609375, -13.824951171875, -13.06640625, -12.307861328125, -11.54931640625, -10.790771484375, -10.0322265625, -9.273681640625, -8.51513671875, -7.756591796875, -6.998046875, -6.239501953125, -5.48095703125, -4.722412109375, -3.9638671875, -3.205322265625, -2.44677734375, -1.688232421875, -0.9296875, -0.171142578125, 0.58740234375, 1.345947265625, 2.1044921875, 2.863037109375, 3.62158203125, 4.380126953125, 5.138671875, 5.897216796875, 6.65576171875, 7.414306640625, 8.1728515625, 8.931396484375, 9.68994140625, 10.448486328125, 11.20703125, 11.965576171875, 12.72412109375, 13.482666015625, 14.2412109375, 14.999755859375, 15.75830078125, 16.516845703125, 17.275390625, 18.033935546875, 18.79248046875, 19.551025390625, 20.3095703125, 21.068115234375, 21.82666015625, 22.585205078125, 23.34375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 17.0, 200.0, 557.0, 223.0, 16.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-248.54029846191406, -238.80068969726562, -229.06106567382812, -219.3214569091797, -209.58184814453125, -199.8422393798828, -190.10263061523438, -180.36300659179688, -170.62339782714844, -160.8837890625, -151.1441650390625, -141.40455627441406, -131.66494750976562, -121.92533874511719, -112.18572235107422, -102.44610595703125, -92.70649719238281, -82.96688842773438, -73.2272720336914, -63.4876594543457, -53.748046875, -44.0084342956543, -34.268821716308594, -24.529205322265625, -14.789596557617188, -5.049983978271484, 4.689628601074219, 14.429241180419922, 24.168853759765625, 33.90846633911133, 43.64807891845703, 53.3876953125, 63.1273193359375, 72.86692810058594, 82.6065444946289, 92.34616088867188, 102.08576965332031, 111.82537841796875, 121.56499481201172, 131.3046112060547, 141.04421997070312, 150.78382873535156, 160.5234375, 170.2630615234375, 180.00267028808594, 189.74227905273438, 199.48190307617188, 209.2215118408203, 218.96112060546875, 228.7007293701172, 238.44033813476562, 248.17996215820312, 257.9195556640625, 267.6591796875, 277.3988037109375, 287.138427734375, 296.8780212402344, 306.6176452636719, 316.35723876953125, 326.09686279296875, 335.83648681640625, 345.5760803222656, 355.3157043457031, 365.0552978515625, 374.794921875]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 15.0, 8.0, 12.0, 13.0, 15.0, 19.0, 18.0, 30.0, 27.0, 28.0, 31.0, 29.0, 32.0, 47.0, 47.0, 51.0, 34.0, 47.0, 47.0, 49.0, 30.0, 43.0, 40.0, 30.0, 30.0, 34.0, 29.0, 34.0, 21.0, 19.0, 12.0, 15.0, 14.0, 9.0, 12.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-57.726356506347656, -55.976531982421875, -54.226707458496094, -52.47688293457031, -50.72705841064453, -48.97723388671875, -47.2274055480957, -45.47758102416992, -43.72775650024414, -41.97793197631836, -40.22810745239258, -38.4782829284668, -36.72845458984375, -34.97863006591797, -33.22880554199219, -31.478981018066406, -29.729156494140625, -27.979331970214844, -26.229507446289062, -24.47968101501465, -22.729856491088867, -20.980031967163086, -19.230205535888672, -17.48038101196289, -15.73055648803711, -13.980731964111328, -12.23090648651123, -10.481081008911133, -8.731256484985352, -6.98143196105957, -5.231606483459473, -3.481781005859375, -1.7319564819335938, 0.017868518829345703, 1.7676935195922852, 3.5175185203552246, 5.267343521118164, 7.017168045043945, 8.766993522644043, 10.51681900024414, 12.266643524169922, 14.016468048095703, 15.7662935256958, 17.5161190032959, 19.26594352722168, 21.01576805114746, 22.765594482421875, 24.515419006347656, 26.265243530273438, 28.01506805419922, 29.764892578125, 31.514719009399414, 33.26454162597656, 35.014366149902344, 36.76419448852539, 38.51401901245117, 40.26384353637695, 42.013668060302734, 43.763492584228516, 45.5133171081543, 47.263145446777344, 49.012969970703125, 50.762794494628906, 52.51261901855469, 54.26244354248047]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 5.0, 8.0, 5.0, 10.0, 10.0, 11.0, 16.0, 12.0, 19.0, 18.0, 21.0, 22.0, 27.0, 27.0, 36.0, 31.0, 42.0, 39.0, 39.0, 44.0, 46.0, 33.0, 41.0, 37.0, 37.0, 39.0, 39.0, 32.0, 28.0, 35.0, 24.0, 20.0, 26.0, 12.0, 16.0, 13.0, 13.0, 8.0, 7.0, 13.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-10.828125, -10.5028076171875, -10.177490234375, -9.8521728515625, -9.52685546875, -9.2015380859375, -8.876220703125, -8.5509033203125, -8.2255859375, -7.9002685546875, -7.574951171875, -7.2496337890625, -6.92431640625, -6.5989990234375, -6.273681640625, -5.9483642578125, -5.623046875, -5.2977294921875, -4.972412109375, -4.6470947265625, -4.32177734375, -3.9964599609375, -3.671142578125, -3.3458251953125, -3.0205078125, -2.6951904296875, -2.369873046875, -2.0445556640625, -1.71923828125, -1.3939208984375, -1.068603515625, -0.7432861328125, -0.41796875, -0.0926513671875, 0.232666015625, 0.5579833984375, 0.88330078125, 1.2086181640625, 1.533935546875, 1.8592529296875, 2.1845703125, 2.5098876953125, 2.835205078125, 3.1605224609375, 3.48583984375, 3.8111572265625, 4.136474609375, 4.4617919921875, 4.787109375, 5.1124267578125, 5.437744140625, 5.7630615234375, 6.08837890625, 6.4136962890625, 6.739013671875, 7.0643310546875, 7.3896484375, 7.7149658203125, 8.040283203125, 8.3656005859375, 8.69091796875, 9.0162353515625, 9.341552734375, 9.6668701171875, 9.9921875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 12.0, 9.0, 6.0, 19.0, 29.0, 41.0, 63.0, 82.0, 134.0, 221.0, 356.0, 594.0, 973.0, 1546.0, 2514.0, 4197.0, 6961.0, 11895.0, 19836.0, 35679.0, 66715.0, 140154.0, 333745.0, 218123.0, 92833.0, 47597.0, 26441.0, 15214.0, 8883.0, 5437.0, 3222.0, 1855.0, 1207.0, 747.0, 454.0, 298.0, 169.0, 119.0, 73.0, 38.0, 23.0, 14.0, 15.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.04351806640625, -1.9698486328125, -1.89617919921875, -1.822509765625, -1.74884033203125, -1.6751708984375, -1.60150146484375, -1.52783203125, -1.45416259765625, -1.3804931640625, -1.30682373046875, -1.233154296875, -1.15948486328125, -1.0858154296875, -1.01214599609375, -0.9384765625, -0.86480712890625, -0.7911376953125, -0.71746826171875, -0.643798828125, -0.57012939453125, -0.4964599609375, -0.42279052734375, -0.34912109375, -0.27545166015625, -0.2017822265625, -0.12811279296875, -0.054443359375, 0.01922607421875, 0.0928955078125, 0.16656494140625, 0.240234375, 0.31390380859375, 0.3875732421875, 0.46124267578125, 0.534912109375, 0.60858154296875, 0.6822509765625, 0.75592041015625, 0.82958984375, 0.90325927734375, 0.9769287109375, 1.05059814453125, 1.124267578125, 1.19793701171875, 1.2716064453125, 1.34527587890625, 1.4189453125, 1.49261474609375, 1.5662841796875, 1.63995361328125, 1.713623046875, 1.78729248046875, 1.8609619140625, 1.93463134765625, 2.00830078125, 2.08197021484375, 2.1556396484375, 2.22930908203125, 2.302978515625, 2.37664794921875, 2.4503173828125, 2.52398681640625, 2.59765625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 4.0, 2.0, 4.0, 6.0, 8.0, 12.0, 11.0, 14.0, 27.0, 18.0, 32.0, 27.0, 29.0, 32.0, 23.0, 40.0, 42.0, 34.0, 34.0, 35.0, 48.0, 1063.0, 45.0, 43.0, 41.0, 38.0, 36.0, 31.0, 29.0, 36.0, 28.0, 18.0, 15.0, 22.0, 23.0, 13.0, 10.0, 14.0, 7.0, 10.0, 4.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.94921875, -6.73419189453125, -6.5191650390625, -6.30413818359375, -6.089111328125, -5.87408447265625, -5.6590576171875, -5.44403076171875, -5.22900390625, -5.01397705078125, -4.7989501953125, -4.58392333984375, -4.368896484375, -4.15386962890625, -3.9388427734375, -3.72381591796875, -3.5087890625, -3.29376220703125, -3.0787353515625, -2.86370849609375, -2.648681640625, -2.43365478515625, -2.2186279296875, -2.00360107421875, -1.78857421875, -1.57354736328125, -1.3585205078125, -1.14349365234375, -0.928466796875, -0.71343994140625, -0.4984130859375, -0.28338623046875, -0.068359375, 0.14666748046875, 0.3616943359375, 0.57672119140625, 0.791748046875, 1.00677490234375, 1.2218017578125, 1.43682861328125, 1.65185546875, 1.86688232421875, 2.0819091796875, 2.29693603515625, 2.511962890625, 2.72698974609375, 2.9420166015625, 3.15704345703125, 3.3720703125, 3.58709716796875, 3.8021240234375, 4.01715087890625, 4.232177734375, 4.44720458984375, 4.6622314453125, 4.87725830078125, 5.09228515625, 5.30731201171875, 5.5223388671875, 5.73736572265625, 5.952392578125, 6.16741943359375, 6.3824462890625, 6.59747314453125, 6.8125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 5.0, 5.0, 8.0, 12.0, 15.0, 34.0, 45.0, 61.0, 113.0, 122.0, 155.0, 248.0, 353.0, 529.0, 739.0, 1014.0, 1506.0, 2406.0, 3570.0, 5246.0, 7964.0, 12338.0, 19112.0, 30163.0, 48486.0, 82960.0, 158891.0, 1327189.0, 168320.0, 86730.0, 50209.0, 31383.0, 19769.0, 12837.0, 8158.0, 5545.0, 3494.0, 2307.0, 1575.0, 1129.0, 757.0, 459.0, 364.0, 227.0, 166.0, 121.0, 85.0, 67.0, 39.0, 36.0, 23.0, 21.0, 11.0, 8.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6533203125, -1.59918212890625, -1.5450439453125, -1.49090576171875, -1.436767578125, -1.38262939453125, -1.3284912109375, -1.27435302734375, -1.22021484375, -1.16607666015625, -1.1119384765625, -1.05780029296875, -1.003662109375, -0.94952392578125, -0.8953857421875, -0.84124755859375, -0.787109375, -0.73297119140625, -0.6788330078125, -0.62469482421875, -0.570556640625, -0.51641845703125, -0.4622802734375, -0.40814208984375, -0.35400390625, -0.29986572265625, -0.2457275390625, -0.19158935546875, -0.137451171875, -0.08331298828125, -0.0291748046875, 0.02496337890625, 0.0791015625, 0.13323974609375, 0.1873779296875, 0.24151611328125, 0.295654296875, 0.34979248046875, 0.4039306640625, 0.45806884765625, 0.51220703125, 0.56634521484375, 0.6204833984375, 0.67462158203125, 0.728759765625, 0.78289794921875, 0.8370361328125, 0.89117431640625, 0.9453125, 0.99945068359375, 1.0535888671875, 1.10772705078125, 1.161865234375, 1.21600341796875, 1.2701416015625, 1.32427978515625, 1.37841796875, 1.43255615234375, 1.4866943359375, 1.54083251953125, 1.594970703125, 1.64910888671875, 1.7032470703125, 1.75738525390625, 1.8115234375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 7.0, 3.0, 9.0, 5.0, 5.0, 10.0, 9.0, 19.0, 15.0, 18.0, 26.0, 30.0, 35.0, 38.0, 54.0, 56.0, 65.0, 68.0, 61.0, 90.0, 77.0, 57.0, 39.0, 45.0, 22.0, 24.0, 24.0, 16.0, 7.0, 11.0, 13.0, 11.0, 7.0, 6.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023708343505859375, -0.002284109592437744, -0.0021973848342895508, -0.0021106600761413574, -0.002023935317993164, -0.0019372105598449707, -0.0018504858016967773, -0.001763761043548584, -0.0016770362854003906, -0.0015903115272521973, -0.001503586769104004, -0.0014168620109558105, -0.0013301372528076172, -0.0012434124946594238, -0.0011566877365112305, -0.0010699629783630371, -0.0009832382202148438, -0.0008965134620666504, -0.000809788703918457, -0.0007230639457702637, -0.0006363391876220703, -0.000549614429473877, -0.0004628896713256836, -0.00037616491317749023, -0.0002894401550292969, -0.00020271539688110352, -0.00011599063873291016, -2.9265880584716797e-05, 5.745887756347656e-05, 0.00014418363571166992, 0.00023090839385986328, 0.00031763315200805664, 0.00040435791015625, 0.0004910826683044434, 0.0005778074264526367, 0.0006645321846008301, 0.0007512569427490234, 0.0008379817008972168, 0.0009247064590454102, 0.0010114312171936035, 0.0010981559753417969, 0.0011848807334899902, 0.0012716054916381836, 0.001358330249786377, 0.0014450550079345703, 0.0015317797660827637, 0.001618504524230957, 0.0017052292823791504, 0.0017919540405273438, 0.0018786787986755371, 0.0019654035568237305, 0.002052128314971924, 0.002138853073120117, 0.0022255778312683105, 0.002312302589416504, 0.0023990273475646973, 0.0024857521057128906, 0.002572476863861084, 0.0026592016220092773, 0.0027459263801574707, 0.002832651138305664, 0.0029193758964538574, 0.0030061006546020508, 0.003092825412750244, 0.0031795501708984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 3.0, 3.0, 9.0, 7.0, 9.0, 13.0, 18.0, 18.0, 28.0, 22.0, 37.0, 49.0, 71.0, 77.0, 132.0, 202.0, 337.0, 593.0, 1797.0, 958040.0, 84551.0, 1077.0, 490.0, 269.0, 185.0, 121.0, 97.0, 64.0, 40.0, 36.0, 33.0, 26.0, 14.0, 16.0, 10.0, 13.0, 12.0, 10.0, 7.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.0601806640625, -0.05854654312133789, -0.05691242218017578, -0.05527830123901367, -0.05364418029785156, -0.05201005935668945, -0.050375938415527344, -0.048741817474365234, -0.047107696533203125, -0.045473575592041016, -0.043839454650878906, -0.0422053337097168, -0.04057121276855469, -0.03893709182739258, -0.03730297088623047, -0.03566884994506836, -0.03403472900390625, -0.03240060806274414, -0.03076648712158203, -0.029132366180419922, -0.027498245239257812, -0.025864124298095703, -0.024230003356933594, -0.022595882415771484, -0.020961761474609375, -0.019327640533447266, -0.017693519592285156, -0.016059398651123047, -0.014425277709960938, -0.012791156768798828, -0.011157035827636719, -0.00952291488647461, -0.0078887939453125, -0.006254673004150391, -0.004620552062988281, -0.002986431121826172, -0.0013523101806640625, 0.0002818107604980469, 0.0019159317016601562, 0.0035500526428222656, 0.005184173583984375, 0.006818294525146484, 0.008452415466308594, 0.010086536407470703, 0.011720657348632812, 0.013354778289794922, 0.014988899230957031, 0.01662302017211914, 0.01825714111328125, 0.01989126205444336, 0.02152538299560547, 0.023159503936767578, 0.024793624877929688, 0.026427745819091797, 0.028061866760253906, 0.029695987701416016, 0.031330108642578125, 0.032964229583740234, 0.034598350524902344, 0.03623247146606445, 0.03786659240722656, 0.03950071334838867, 0.04113483428955078, 0.04276895523071289, 0.044403076171875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 13.0, 35.0, 78.0, 157.0, 212.0, 187.0, 178.0, 83.0, 44.0, 13.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.003763421904295683, -0.0036912220530211926, -0.003619022434577346, -0.0035468225833028555, -0.003474622732028365, -0.0034024231135845184, -0.003330223262310028, -0.0032580234110355377, -0.0031858235597610474, -0.003113623708486557, -0.0030414240900427103, -0.00296922423876822, -0.0028970243874937296, -0.002824824769049883, -0.0027526249177753925, -0.002680425066500902, -0.0026082254480570555, -0.002536025596782565, -0.0024638259783387184, -0.002391626127064228, -0.0023194262757897377, -0.0022472264245152473, -0.0021750268060714006, -0.0021028269547969103, -0.0020306273363530636, -0.0019584274850785732, -0.0018862277502194047, -0.0018140280153602362, -0.0017418281640857458, -0.0016696284292265773, -0.0015974286943674088, -0.0015252288430929184, -0.0014530288754031062, -0.0013808291405439377, -0.0013086292892694473, -0.0012364295544102788, -0.0011642298195511103, -0.00109202996827662, -0.0010198302334174514, -0.0009476304403506219, -0.0008754306472837925, -0.000803230854216963, -0.0007310310611501336, -0.0006588313262909651, -0.0005866315332241356, -0.0005144317401573062, -0.0004422319761943072, -0.0003700322122313082, -0.0002978324191644788, -0.00022563264064956456, -0.00015343286213465035, -8.123308361973614e-05, -9.03330510482192e-06, 6.316648796200752e-05, 0.0001353662519250065, 0.0002075660158880055, 0.00027976580895483494, 0.0003519656020216644, 0.00042416536598466337, 0.0004963651299476624, 0.0005685649230144918, 0.0006407647160813212, 0.0007129644509404898, 0.0007851642440073192, 0.0008573640370741487]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 7.0, 10.0, 11.0, 13.0, 10.0, 17.0, 15.0, 25.0, 25.0, 28.0, 27.0, 31.0, 38.0, 27.0, 33.0, 29.0, 42.0, 44.0, 34.0, 40.0, 42.0, 38.0, 40.0, 39.0, 32.0, 38.0, 29.0, 30.0, 32.0, 22.0, 27.0, 20.0, 15.0, 17.0, 5.0, 12.0, 10.0, 11.0, 5.0, 4.0, 4.0, 1.0, 0.0, 4.0, 6.0, 2.0, 2.0], "bins": [-0.0014423131942749023, -0.0014021145179867744, -0.0013619158416986465, -0.0013217171654105186, -0.0012815184891223907, -0.0012413198128342628, -0.001201121136546135, -0.001160922460258007, -0.0011207237839698792, -0.0010805251076817513, -0.0010403264313936234, -0.0010001277551054955, -0.0009599290788173676, -0.0009197304025292397, -0.0008795317262411118, -0.0008393330499529839, -0.000799134373664856, -0.0007589356973767281, -0.0007187370210886002, -0.0006785383448004723, -0.0006383396685123444, -0.0005981409922242165, -0.0005579423159360886, -0.0005177436396479607, -0.00047754496335983276, -0.00043734628707170486, -0.00039714761078357697, -0.00035694893449544907, -0.00031675025820732117, -0.00027655158191919327, -0.00023635290563106537, -0.00019615422934293747, -0.00015595555305480957, -0.00011575687676668167, -7.555820047855377e-05, -3.535952419042587e-05, 4.839152097702026e-06, 4.5037828385829926e-05, 8.523650467395782e-05, 0.00012543518096208572, 0.00016563385725021362, 0.00020583253353834152, 0.0002460312098264694, 0.0002862298861145973, 0.0003264285624027252, 0.0003666272386908531, 0.000406825914978981, 0.0004470245912671089, 0.0004872232675552368, 0.0005274219438433647, 0.0005676206201314926, 0.0006078192964196205, 0.0006480179727077484, 0.0006882166489958763, 0.0007284153252840042, 0.0007686140015721321, 0.00080881267786026, 0.0008490113541483879, 0.0008892100304365158, 0.0009294087067246437, 0.0009696073830127716, 0.0010098060593008995, 0.0010500047355890274, 0.0010902034118771553, 0.0011304020881652832]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 5.0, 8.0, 5.0, 10.0, 10.0, 11.0, 16.0, 12.0, 19.0, 18.0, 21.0, 22.0, 27.0, 27.0, 36.0, 31.0, 42.0, 39.0, 39.0, 44.0, 46.0, 33.0, 41.0, 37.0, 37.0, 39.0, 39.0, 32.0, 28.0, 35.0, 24.0, 20.0, 26.0, 12.0, 16.0, 13.0, 13.0, 8.0, 7.0, 13.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-10.828125, -10.5028076171875, -10.177490234375, -9.8521728515625, -9.52685546875, -9.2015380859375, -8.876220703125, -8.5509033203125, -8.2255859375, -7.9002685546875, -7.574951171875, -7.2496337890625, -6.92431640625, -6.5989990234375, -6.273681640625, -5.9483642578125, -5.623046875, -5.2977294921875, -4.972412109375, -4.6470947265625, -4.32177734375, -3.9964599609375, -3.671142578125, -3.3458251953125, -3.0205078125, -2.6951904296875, -2.369873046875, -2.0445556640625, -1.71923828125, -1.3939208984375, -1.068603515625, -0.7432861328125, -0.41796875, -0.0926513671875, 0.232666015625, 0.5579833984375, 0.88330078125, 1.2086181640625, 1.533935546875, 1.8592529296875, 2.1845703125, 2.5098876953125, 2.835205078125, 3.1605224609375, 3.48583984375, 3.8111572265625, 4.136474609375, 4.4617919921875, 4.787109375, 5.1124267578125, 5.437744140625, 5.7630615234375, 6.08837890625, 6.4136962890625, 6.739013671875, 7.0643310546875, 7.3896484375, 7.7149658203125, 8.040283203125, 8.3656005859375, 8.69091796875, 9.0162353515625, 9.341552734375, 9.6668701171875, 9.9921875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 5.0, 10.0, 10.0, 18.0, 9.0, 15.0, 28.0, 34.0, 51.0, 59.0, 78.0, 100.0, 104.0, 172.0, 182.0, 287.0, 398.0, 652.0, 1074.0, 1949.0, 3914.0, 9524.0, 26620.0, 75934.0, 210137.0, 370306.0, 220045.0, 79751.0, 27622.0, 10000.0, 4016.0, 2066.0, 1099.0, 696.0, 418.0, 273.0, 217.0, 158.0, 122.0, 73.0, 85.0, 49.0, 41.0, 37.0, 31.0, 33.0, 20.0, 12.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.4296875, -13.003662109375, -12.57763671875, -12.151611328125, -11.7255859375, -11.299560546875, -10.87353515625, -10.447509765625, -10.021484375, -9.595458984375, -9.16943359375, -8.743408203125, -8.3173828125, -7.891357421875, -7.46533203125, -7.039306640625, -6.61328125, -6.187255859375, -5.76123046875, -5.335205078125, -4.9091796875, -4.483154296875, -4.05712890625, -3.631103515625, -3.205078125, -2.779052734375, -2.35302734375, -1.927001953125, -1.5009765625, -1.074951171875, -0.64892578125, -0.222900390625, 0.203125, 0.629150390625, 1.05517578125, 1.481201171875, 1.9072265625, 2.333251953125, 2.75927734375, 3.185302734375, 3.611328125, 4.037353515625, 4.46337890625, 4.889404296875, 5.3154296875, 5.741455078125, 6.16748046875, 6.593505859375, 7.01953125, 7.445556640625, 7.87158203125, 8.297607421875, 8.7236328125, 9.149658203125, 9.57568359375, 10.001708984375, 10.427734375, 10.853759765625, 11.27978515625, 11.705810546875, 12.1318359375, 12.557861328125, 12.98388671875, 13.409912109375, 13.8359375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 0.0, 5.0, 5.0, 7.0, 5.0, 8.0, 12.0, 16.0, 20.0, 22.0, 30.0, 40.0, 41.0, 45.0, 41.0, 77.0, 71.0, 197.0, 329.0, 1397.0, 190.0, 102.0, 72.0, 55.0, 42.0, 38.0, 25.0, 36.0, 22.0, 20.0, 11.0, 18.0, 14.0, 9.0, 9.0, 3.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.359375, -30.318603515625, -29.27783203125, -28.237060546875, -27.1962890625, -26.155517578125, -25.11474609375, -24.073974609375, -23.033203125, -21.992431640625, -20.95166015625, -19.910888671875, -18.8701171875, -17.829345703125, -16.78857421875, -15.747802734375, -14.70703125, -13.666259765625, -12.62548828125, -11.584716796875, -10.5439453125, -9.503173828125, -8.46240234375, -7.421630859375, -6.380859375, -5.340087890625, -4.29931640625, -3.258544921875, -2.2177734375, -1.177001953125, -0.13623046875, 0.904541015625, 1.9453125, 2.986083984375, 4.02685546875, 5.067626953125, 6.1083984375, 7.149169921875, 8.18994140625, 9.230712890625, 10.271484375, 11.312255859375, 12.35302734375, 13.393798828125, 14.4345703125, 15.475341796875, 16.51611328125, 17.556884765625, 18.59765625, 19.638427734375, 20.67919921875, 21.719970703125, 22.7607421875, 23.801513671875, 24.84228515625, 25.883056640625, 26.923828125, 27.964599609375, 29.00537109375, 30.046142578125, 31.0869140625, 32.127685546875, 33.16845703125, 34.209228515625, 35.25]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 3.0, 4.0, 9.0, 9.0, 18.0, 24.0, 27.0, 25.0, 35.0, 49.0, 69.0, 113.0, 180.0, 238.0, 403.0, 739.0, 1780.0, 32790.0, 2975149.0, 128757.0, 3011.0, 842.0, 512.0, 290.0, 183.0, 121.0, 88.0, 54.0, 36.0, 35.0, 26.0, 22.0, 21.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.03125, -60.83056640625, -58.6298828125, -56.42919921875, -54.228515625, -52.02783203125, -49.8271484375, -47.62646484375, -45.42578125, -43.22509765625, -41.0244140625, -38.82373046875, -36.623046875, -34.42236328125, -32.2216796875, -30.02099609375, -27.8203125, -25.61962890625, -23.4189453125, -21.21826171875, -19.017578125, -16.81689453125, -14.6162109375, -12.41552734375, -10.21484375, -8.01416015625, -5.8134765625, -3.61279296875, -1.412109375, 0.78857421875, 2.9892578125, 5.18994140625, 7.390625, 9.59130859375, 11.7919921875, 13.99267578125, 16.193359375, 18.39404296875, 20.5947265625, 22.79541015625, 24.99609375, 27.19677734375, 29.3974609375, 31.59814453125, 33.798828125, 35.99951171875, 38.2001953125, 40.40087890625, 42.6015625, 44.80224609375, 47.0029296875, 49.20361328125, 51.404296875, 53.60498046875, 55.8056640625, 58.00634765625, 60.20703125, 62.40771484375, 64.6083984375, 66.80908203125, 69.009765625, 71.21044921875, 73.4111328125, 75.61181640625, 77.8125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [2.0, 5.0, 40.0, 229.0, 464.0, 236.0, 38.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.76854133605957, -19.154367446899414, -13.540193557739258, -7.926019668579102, -2.3118457794189453, 3.302328109741211, 8.916501998901367, 14.530675888061523, 20.14484977722168, 25.759023666381836, 31.373197555541992, 36.98737335205078, 42.60154724121094, 48.215721130371094, 53.82989501953125, 59.444068908691406, 65.05824279785156, 70.67241668701172, 76.28659057617188, 81.90076446533203, 87.51493835449219, 93.12911224365234, 98.7432861328125, 104.35746002197266, 109.97163391113281, 115.58580780029297, 121.19998168945312, 126.81415557861328, 132.42832946777344, 138.04251098632812, 143.65667724609375, 149.27084350585938, 154.885009765625, 160.49917602539062, 166.1133575439453, 171.7275390625, 177.34170532226562, 182.95587158203125, 188.57005310058594, 194.18423461914062, 199.79840087890625, 205.41256713867188, 211.02674865722656, 216.64093017578125, 222.25509643554688, 227.8692626953125, 233.4834442138672, 239.09762573242188, 244.7117919921875, 250.32595825195312, 255.9401397705078, 261.5543212890625, 267.1684875488281, 272.78265380859375, 278.3968505859375, 284.0110168457031, 289.62518310546875, 295.2393493652344, 300.853515625, 306.46771240234375, 312.0818786621094, 317.696044921875, 323.31024169921875, 328.9244079589844, 334.53857421875]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 11.0, 11.0, 8.0, 16.0, 14.0, 19.0, 19.0, 26.0, 37.0, 36.0, 34.0, 34.0, 52.0, 44.0, 31.0, 38.0, 44.0, 48.0, 36.0, 37.0, 42.0, 43.0, 35.0, 38.0, 26.0, 38.0, 34.0, 26.0, 34.0, 19.0, 17.0, 16.0, 8.0, 13.0, 5.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.93299102783203, -56.68267059326172, -54.432350158691406, -52.182029724121094, -49.93170928955078, -47.68138885498047, -45.431068420410156, -43.180747985839844, -40.93042755126953, -38.68010711669922, -36.429786682128906, -34.179466247558594, -31.92914581298828, -29.67882537841797, -27.428504943847656, -25.178184509277344, -22.92786407470703, -20.67754364013672, -18.427223205566406, -16.176902770996094, -13.926582336425781, -11.676261901855469, -9.425941467285156, -7.175621032714844, -4.925300598144531, -2.6749801635742188, -0.42465972900390625, 1.8256607055664062, 4.075981140136719, 6.326301574707031, 8.576622009277344, 10.826942443847656, 13.077255249023438, 15.32757568359375, 17.577896118164062, 19.828216552734375, 22.078536987304688, 24.328857421875, 26.579177856445312, 28.829498291015625, 31.079818725585938, 33.33013916015625, 35.58045959472656, 37.830780029296875, 40.08110046386719, 42.3314208984375, 44.58174133300781, 46.832061767578125, 49.08238220214844, 51.33270263671875, 53.58302307128906, 55.833343505859375, 58.08366394042969, 60.333984375, 62.58430480957031, 64.83462524414062, 67.08494567871094, 69.33526611328125, 71.58558654785156, 73.83590698242188, 76.08622741699219, 78.3365478515625, 80.58686828613281, 82.83718872070312, 85.08750915527344]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 10.0, 4.0, 6.0, 5.0, 9.0, 18.0, 14.0, 16.0, 15.0, 13.0, 22.0, 16.0, 33.0, 34.0, 47.0, 32.0, 29.0, 38.0, 46.0, 51.0, 40.0, 46.0, 43.0, 42.0, 40.0, 33.0, 53.0, 39.0, 36.0, 28.0, 26.0, 23.0, 16.0, 11.0, 13.0, 16.0, 6.0, 7.0, 5.0, 11.0, 7.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0234375, -12.651611328125, -12.27978515625, -11.907958984375, -11.5361328125, -11.164306640625, -10.79248046875, -10.420654296875, -10.048828125, -9.677001953125, -9.30517578125, -8.933349609375, -8.5615234375, -8.189697265625, -7.81787109375, -7.446044921875, -7.07421875, -6.702392578125, -6.33056640625, -5.958740234375, -5.5869140625, -5.215087890625, -4.84326171875, -4.471435546875, -4.099609375, -3.727783203125, -3.35595703125, -2.984130859375, -2.6123046875, -2.240478515625, -1.86865234375, -1.496826171875, -1.125, -0.753173828125, -0.38134765625, -0.009521484375, 0.3623046875, 0.734130859375, 1.10595703125, 1.477783203125, 1.849609375, 2.221435546875, 2.59326171875, 2.965087890625, 3.3369140625, 3.708740234375, 4.08056640625, 4.452392578125, 4.82421875, 5.196044921875, 5.56787109375, 5.939697265625, 6.3115234375, 6.683349609375, 7.05517578125, 7.427001953125, 7.798828125, 8.170654296875, 8.54248046875, 8.914306640625, 9.2861328125, 9.657958984375, 10.02978515625, 10.401611328125, 10.7734375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 6.0, 9.0, 7.0, 8.0, 14.0, 17.0, 25.0, 24.0, 35.0, 29.0, 48.0, 63.0, 78.0, 116.0, 136.0, 202.0, 268.0, 337.0, 438.0, 1460.0, 3281591.0, 906614.0, 990.0, 391.0, 305.0, 251.0, 172.0, 157.0, 103.0, 70.0, 59.0, 53.0, 40.0, 34.0, 19.0, 24.0, 12.0, 12.0, 14.0, 13.0, 7.0, 8.0, 8.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-124.5, -120.7177734375, -116.935546875, -113.1533203125, -109.37109375, -105.5888671875, -101.806640625, -98.0244140625, -94.2421875, -90.4599609375, -86.677734375, -82.8955078125, -79.11328125, -75.3310546875, -71.548828125, -67.7666015625, -63.984375, -60.2021484375, -56.419921875, -52.6376953125, -48.85546875, -45.0732421875, -41.291015625, -37.5087890625, -33.7265625, -29.9443359375, -26.162109375, -22.3798828125, -18.59765625, -14.8154296875, -11.033203125, -7.2509765625, -3.46875, 0.3134765625, 4.095703125, 7.8779296875, 11.66015625, 15.4423828125, 19.224609375, 23.0068359375, 26.7890625, 30.5712890625, 34.353515625, 38.1357421875, 41.91796875, 45.7001953125, 49.482421875, 53.2646484375, 57.046875, 60.8291015625, 64.611328125, 68.3935546875, 72.17578125, 75.9580078125, 79.740234375, 83.5224609375, 87.3046875, 91.0869140625, 94.869140625, 98.6513671875, 102.43359375, 106.2158203125, 109.998046875, 113.7802734375, 117.5625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 4.0, 7.0, 9.0, 11.0, 19.0, 16.0, 20.0, 38.0, 51.0, 66.0, 93.0, 124.0, 159.0, 224.0, 312.0, 424.0, 512.0, 519.0, 377.0, 278.0, 234.0, 170.0, 96.0, 79.0, 52.0, 51.0, 18.0, 27.0, 13.0, 13.0, 11.0, 12.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 6.0, 1.0, 0.0, 1.0], "bins": [-21.171875, -20.627197265625, -20.08251953125, -19.537841796875, -18.9931640625, -18.448486328125, -17.90380859375, -17.359130859375, -16.814453125, -16.269775390625, -15.72509765625, -15.180419921875, -14.6357421875, -14.091064453125, -13.54638671875, -13.001708984375, -12.45703125, -11.912353515625, -11.36767578125, -10.822998046875, -10.2783203125, -9.733642578125, -9.18896484375, -8.644287109375, -8.099609375, -7.554931640625, -7.01025390625, -6.465576171875, -5.9208984375, -5.376220703125, -4.83154296875, -4.286865234375, -3.7421875, -3.197509765625, -2.65283203125, -2.108154296875, -1.5634765625, -1.018798828125, -0.47412109375, 0.070556640625, 0.615234375, 1.159912109375, 1.70458984375, 2.249267578125, 2.7939453125, 3.338623046875, 3.88330078125, 4.427978515625, 4.97265625, 5.517333984375, 6.06201171875, 6.606689453125, 7.1513671875, 7.696044921875, 8.24072265625, 8.785400390625, 9.330078125, 9.874755859375, 10.41943359375, 10.964111328125, 11.5087890625, 12.053466796875, 12.59814453125, 13.142822265625, 13.6875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 10.0, 8.0, 14.0, 18.0, 19.0, 24.0, 27.0, 37.0, 54.0, 61.0, 147.0, 342.0, 1528.0, 138800.0, 4032529.0, 19301.0, 759.0, 239.0, 102.0, 58.0, 49.0, 36.0, 30.0, 19.0, 22.0, 15.0, 6.0, 10.0, 7.0, 8.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.375, -61.4921875, -58.609375, -55.7265625, -52.84375, -49.9609375, -47.078125, -44.1953125, -41.3125, -38.4296875, -35.546875, -32.6640625, -29.78125, -26.8984375, -24.015625, -21.1328125, -18.25, -15.3671875, -12.484375, -9.6015625, -6.71875, -3.8359375, -0.953125, 1.9296875, 4.8125, 7.6953125, 10.578125, 13.4609375, 16.34375, 19.2265625, 22.109375, 24.9921875, 27.875, 30.7578125, 33.640625, 36.5234375, 39.40625, 42.2890625, 45.171875, 48.0546875, 50.9375, 53.8203125, 56.703125, 59.5859375, 62.46875, 65.3515625, 68.234375, 71.1171875, 74.0, 76.8828125, 79.765625, 82.6484375, 85.53125, 88.4140625, 91.296875, 94.1796875, 97.0625, 99.9453125, 102.828125, 105.7109375, 108.59375, 111.4765625, 114.359375, 117.2421875, 120.125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 102.0, 679.0, 220.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-422.70098876953125, -410.1365966796875, -397.5722351074219, -385.00787353515625, -372.4434814453125, -359.87908935546875, -347.3147277832031, -334.7503662109375, -322.18597412109375, -309.62158203125, -297.0572204589844, -284.49285888671875, -271.928466796875, -259.36407470703125, -246.79971313476562, -234.23533630371094, -221.67095947265625, -209.10658264160156, -196.54220581054688, -183.9778289794922, -171.4134521484375, -158.8490753173828, -146.28469848632812, -133.72032165527344, -121.15594482421875, -108.59156799316406, -96.02719116210938, -83.46281433105469, -70.8984375, -58.33406066894531, -45.769683837890625, -33.20530700683594, -20.64093017578125, -8.076553344726562, 4.487823486328125, 17.052200317382812, 29.6165771484375, 42.18095397949219, 54.745330810546875, 67.30970764160156, 79.87408447265625, 92.43846130371094, 105.00283813476562, 117.56721496582031, 130.131591796875, 142.6959686279297, 155.26034545898438, 167.82472229003906, 180.38909912109375, 192.95347595214844, 205.51785278320312, 218.0822296142578, 230.6466064453125, 243.2109832763672, 255.77536010742188, 268.3397216796875, 280.90411376953125, 293.468505859375, 306.0328674316406, 318.59722900390625, 331.16162109375, 343.72601318359375, 356.2903747558594, 368.854736328125, 381.41912841796875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 11.0, 6.0, 6.0, 8.0, 12.0, 7.0, 8.0, 9.0, 15.0, 18.0, 17.0, 22.0, 32.0, 25.0, 18.0, 34.0, 24.0, 30.0, 42.0, 28.0, 37.0, 39.0, 36.0, 47.0, 35.0, 26.0, 40.0, 39.0, 40.0, 36.0, 25.0, 33.0, 21.0, 22.0, 21.0, 16.0, 16.0, 12.0, 17.0, 13.0, 10.0, 11.0, 6.0, 8.0, 5.0, 5.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-55.753265380859375, -54.11888885498047, -52.48451232910156, -50.850135803222656, -49.21575927734375, -47.581382751464844, -45.94700622558594, -44.31262969970703, -42.678253173828125, -41.04387664794922, -39.40950012207031, -37.775123596191406, -36.1407470703125, -34.506370544433594, -32.87199401855469, -31.23761749267578, -29.603239059448242, -27.968862533569336, -26.33448600769043, -24.700109481811523, -23.065732955932617, -21.431354522705078, -19.796977996826172, -18.162601470947266, -16.52822494506836, -14.893848419189453, -13.259471893310547, -11.62509536743164, -9.990718841552734, -8.356341361999512, -6.7219648361206055, -5.087588310241699, -3.4532127380371094, -1.8188360929489136, -0.18445944786071777, 1.4499173164367676, 3.084293842315674, 4.718670845031738, 6.3530473709106445, 7.987423896789551, 9.621800422668457, 11.256176948547363, 12.89055347442627, 14.524930953979492, 16.1593074798584, 17.793684005737305, 19.42806053161621, 21.062437057495117, 22.696813583374023, 24.33119010925293, 25.965566635131836, 27.599943161010742, 29.23431968688965, 30.868698120117188, 32.503074645996094, 34.137451171875, 35.771827697753906, 37.40620422363281, 39.04058074951172, 40.674957275390625, 42.30933380126953, 43.94371032714844, 45.578086853027344, 47.21246337890625, 48.846839904785156]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 12.0, 10.0, 8.0, 13.0, 9.0, 14.0, 19.0, 26.0, 23.0, 31.0, 30.0, 17.0, 34.0, 35.0, 34.0, 31.0, 53.0, 39.0, 48.0, 40.0, 34.0, 32.0, 43.0, 37.0, 30.0, 35.0, 29.0, 36.0, 27.0, 20.0, 20.0, 24.0, 17.0, 10.0, 9.0, 11.0, 10.0, 9.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0], "bins": [-11.8984375, -11.5672607421875, -11.236083984375, -10.9049072265625, -10.57373046875, -10.2425537109375, -9.911376953125, -9.5802001953125, -9.2490234375, -8.9178466796875, -8.586669921875, -8.2554931640625, -7.92431640625, -7.5931396484375, -7.261962890625, -6.9307861328125, -6.599609375, -6.2684326171875, -5.937255859375, -5.6060791015625, -5.27490234375, -4.9437255859375, -4.612548828125, -4.2813720703125, -3.9501953125, -3.6190185546875, -3.287841796875, -2.9566650390625, -2.62548828125, -2.2943115234375, -1.963134765625, -1.6319580078125, -1.30078125, -0.9696044921875, -0.638427734375, -0.3072509765625, 0.02392578125, 0.3551025390625, 0.686279296875, 1.0174560546875, 1.3486328125, 1.6798095703125, 2.010986328125, 2.3421630859375, 2.67333984375, 3.0045166015625, 3.335693359375, 3.6668701171875, 3.998046875, 4.3292236328125, 4.660400390625, 4.9915771484375, 5.32275390625, 5.6539306640625, 5.985107421875, 6.3162841796875, 6.6474609375, 6.9786376953125, 7.309814453125, 7.6409912109375, 7.97216796875, 8.3033447265625, 8.634521484375, 8.9656982421875, 9.296875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 9.0, 14.0, 22.0, 31.0, 42.0, 59.0, 113.0, 132.0, 195.0, 284.0, 388.0, 638.0, 968.0, 1394.0, 2167.0, 3307.0, 5204.0, 8034.0, 13121.0, 21440.0, 36022.0, 64476.0, 124508.0, 270279.0, 240064.0, 110630.0, 58633.0, 33040.0, 19689.0, 12179.0, 7404.0, 4907.0, 3124.0, 2008.0, 1326.0, 840.0, 599.0, 404.0, 283.0, 166.0, 132.0, 83.0, 68.0, 43.0, 33.0, 19.0, 9.0, 10.0, 7.0, 0.0, 1.0, 2.0, 1.0, 4.0], "bins": [-2.244140625, -2.177978515625, -2.11181640625, -2.045654296875, -1.9794921875, -1.913330078125, -1.84716796875, -1.781005859375, -1.71484375, -1.648681640625, -1.58251953125, -1.516357421875, -1.4501953125, -1.384033203125, -1.31787109375, -1.251708984375, -1.185546875, -1.119384765625, -1.05322265625, -0.987060546875, -0.9208984375, -0.854736328125, -0.78857421875, -0.722412109375, -0.65625, -0.590087890625, -0.52392578125, -0.457763671875, -0.3916015625, -0.325439453125, -0.25927734375, -0.193115234375, -0.126953125, -0.060791015625, 0.00537109375, 0.071533203125, 0.1376953125, 0.203857421875, 0.27001953125, 0.336181640625, 0.40234375, 0.468505859375, 0.53466796875, 0.600830078125, 0.6669921875, 0.733154296875, 0.79931640625, 0.865478515625, 0.931640625, 0.997802734375, 1.06396484375, 1.130126953125, 1.1962890625, 1.262451171875, 1.32861328125, 1.394775390625, 1.4609375, 1.527099609375, 1.59326171875, 1.659423828125, 1.7255859375, 1.791748046875, 1.85791015625, 1.924072265625, 1.990234375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 2.0, 1.0, 6.0, 10.0, 15.0, 11.0, 13.0, 16.0, 15.0, 18.0, 24.0, 24.0, 30.0, 37.0, 28.0, 34.0, 31.0, 33.0, 33.0, 34.0, 48.0, 1064.0, 41.0, 30.0, 38.0, 36.0, 40.0, 26.0, 31.0, 30.0, 26.0, 31.0, 31.0, 16.0, 19.0, 8.0, 13.0, 15.0, 9.0, 10.0, 6.0, 11.0, 9.0, 4.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.9375, -5.7283935546875, -5.519287109375, -5.3101806640625, -5.10107421875, -4.8919677734375, -4.682861328125, -4.4737548828125, -4.2646484375, -4.0555419921875, -3.846435546875, -3.6373291015625, -3.42822265625, -3.2191162109375, -3.010009765625, -2.8009033203125, -2.591796875, -2.3826904296875, -2.173583984375, -1.9644775390625, -1.75537109375, -1.5462646484375, -1.337158203125, -1.1280517578125, -0.9189453125, -0.7098388671875, -0.500732421875, -0.2916259765625, -0.08251953125, 0.1265869140625, 0.335693359375, 0.5447998046875, 0.75390625, 0.9630126953125, 1.172119140625, 1.3812255859375, 1.59033203125, 1.7994384765625, 2.008544921875, 2.2176513671875, 2.4267578125, 2.6358642578125, 2.844970703125, 3.0540771484375, 3.26318359375, 3.4722900390625, 3.681396484375, 3.8905029296875, 4.099609375, 4.3087158203125, 4.517822265625, 4.7269287109375, 4.93603515625, 5.1451416015625, 5.354248046875, 5.5633544921875, 5.7724609375, 5.9815673828125, 6.190673828125, 6.3997802734375, 6.60888671875, 6.8179931640625, 7.027099609375, 7.2362060546875, 7.4453125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 4.0, 7.0, 12.0, 16.0, 15.0, 41.0, 63.0, 62.0, 114.0, 157.0, 195.0, 321.0, 436.0, 635.0, 903.0, 1370.0, 2087.0, 3162.0, 4601.0, 7144.0, 10632.0, 16431.0, 25730.0, 41887.0, 71456.0, 134231.0, 1312285.0, 205360.0, 102714.0, 57348.0, 34606.0, 21793.0, 13983.0, 8965.0, 6188.0, 3940.0, 2544.0, 1800.0, 1216.0, 830.0, 560.0, 365.0, 297.0, 189.0, 135.0, 98.0, 66.0, 45.0, 38.0, 20.0, 13.0, 11.0, 11.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.9609375, -1.902923583984375, -1.84490966796875, -1.786895751953125, -1.7288818359375, -1.670867919921875, -1.61285400390625, -1.554840087890625, -1.496826171875, -1.438812255859375, -1.38079833984375, -1.322784423828125, -1.2647705078125, -1.206756591796875, -1.14874267578125, -1.090728759765625, -1.03271484375, -0.974700927734375, -0.91668701171875, -0.858673095703125, -0.8006591796875, -0.742645263671875, -0.68463134765625, -0.626617431640625, -0.568603515625, -0.510589599609375, -0.45257568359375, -0.394561767578125, -0.3365478515625, -0.278533935546875, -0.22052001953125, -0.162506103515625, -0.1044921875, -0.046478271484375, 0.01153564453125, 0.069549560546875, 0.1275634765625, 0.185577392578125, 0.24359130859375, 0.301605224609375, 0.359619140625, 0.417633056640625, 0.47564697265625, 0.533660888671875, 0.5916748046875, 0.649688720703125, 0.70770263671875, 0.765716552734375, 0.82373046875, 0.881744384765625, 0.93975830078125, 0.997772216796875, 1.0557861328125, 1.113800048828125, 1.17181396484375, 1.229827880859375, 1.287841796875, 1.345855712890625, 1.40386962890625, 1.461883544921875, 1.5198974609375, 1.577911376953125, 1.63592529296875, 1.693939208984375, 1.751953125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 11.0, 9.0, 8.0, 16.0, 17.0, 16.0, 21.0, 44.0, 40.0, 45.0, 58.0, 72.0, 73.0, 82.0, 79.0, 54.0, 52.0, 52.0, 43.0, 43.0, 32.0, 29.0, 24.0, 19.0, 9.0, 12.0, 11.0, 6.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002109527587890625, -0.002039581537246704, -0.001969635486602783, -0.0018996894359588623, -0.0018297433853149414, -0.0017597973346710205, -0.0016898512840270996, -0.0016199052333831787, -0.0015499591827392578, -0.001480013132095337, -0.001410067081451416, -0.0013401210308074951, -0.0012701749801635742, -0.0012002289295196533, -0.0011302828788757324, -0.0010603368282318115, -0.0009903907775878906, -0.0009204447269439697, -0.0008504986763000488, -0.0007805526256561279, -0.000710606575012207, -0.0006406605243682861, -0.0005707144737243652, -0.0005007684230804443, -0.00043082237243652344, -0.00036087632179260254, -0.00029093027114868164, -0.00022098422050476074, -0.00015103816986083984, -8.109211921691895e-05, -1.1146068572998047e-05, 5.879998207092285e-05, 0.00012874603271484375, 0.00019869208335876465, 0.00026863813400268555, 0.00033858418464660645, 0.00040853023529052734, 0.00047847628593444824, 0.0005484223365783691, 0.00061836838722229, 0.0006883144378662109, 0.0007582604885101318, 0.0008282065391540527, 0.0008981525897979736, 0.0009680986404418945, 0.0010380446910858154, 0.0011079907417297363, 0.0011779367923736572, 0.0012478828430175781, 0.001317828893661499, 0.00138777494430542, 0.0014577209949493408, 0.0015276670455932617, 0.0015976130962371826, 0.0016675591468811035, 0.0017375051975250244, 0.0018074512481689453, 0.0018773972988128662, 0.0019473433494567871, 0.002017289400100708, 0.002087235450744629, 0.00215718150138855, 0.0022271275520324707, 0.0022970736026763916, 0.0023670196533203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 9.0, 11.0, 17.0, 13.0, 22.0, 23.0, 27.0, 49.0, 64.0, 59.0, 92.0, 164.0, 208.0, 406.0, 604.0, 1392.0, 395636.0, 646196.0, 1650.0, 676.0, 394.0, 245.0, 171.0, 100.0, 87.0, 60.0, 42.0, 27.0, 24.0, 22.0, 21.0, 15.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.041015625, -0.0398106575012207, -0.038605690002441406, -0.03740072250366211, -0.03619575500488281, -0.034990787506103516, -0.03378582000732422, -0.03258085250854492, -0.031375885009765625, -0.030170917510986328, -0.02896595001220703, -0.027760982513427734, -0.026556015014648438, -0.02535104751586914, -0.024146080017089844, -0.022941112518310547, -0.02173614501953125, -0.020531177520751953, -0.019326210021972656, -0.01812124252319336, -0.016916275024414062, -0.015711307525634766, -0.014506340026855469, -0.013301372528076172, -0.012096405029296875, -0.010891437530517578, -0.009686470031738281, -0.008481502532958984, -0.0072765350341796875, -0.006071567535400391, -0.004866600036621094, -0.003661632537841797, -0.0024566650390625, -0.0012516975402832031, -4.673004150390625e-05, 0.0011582374572753906, 0.0023632049560546875, 0.0035681724548339844, 0.004773139953613281, 0.005978107452392578, 0.007183074951171875, 0.008388042449951172, 0.009593009948730469, 0.010797977447509766, 0.012002944946289062, 0.01320791244506836, 0.014412879943847656, 0.015617847442626953, 0.01682281494140625, 0.018027782440185547, 0.019232749938964844, 0.02043771743774414, 0.021642684936523438, 0.022847652435302734, 0.02405261993408203, 0.025257587432861328, 0.026462554931640625, 0.027667522430419922, 0.02887248992919922, 0.030077457427978516, 0.03128242492675781, 0.03248739242553711, 0.033692359924316406, 0.0348973274230957, 0.036102294921875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 29.0, 101.0, 236.0, 279.0, 233.0, 91.0, 24.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0023880270309746265, -0.0022976913023740053, -0.002207355573773384, -0.0021170200780034065, -0.0020266843494027853, -0.001936348620802164, -0.0018460128922015429, -0.0017556771636009216, -0.0016653415514156222, -0.001575005822815001, -0.0014846702106297016, -0.0013943344820290804, -0.0013039987534284592, -0.0012136631412431598, -0.0011233274126425385, -0.0010329918004572392, -0.0009426560718566179, -0.0008523204014636576, -0.0007619847310706973, -0.0006716490024700761, -0.0005813133320771158, -0.0004909776616841555, -0.00040064193308353424, -0.00031030626269057393, -0.00021997059229761362, -0.00012963490735273808, -3.9299222407862544e-05, 5.103647708892822e-05, 0.00014137214748188853, 0.00023170781787484884, 0.00032204354647547007, 0.0004123792168684304, 0.000502714654430747, 0.0005930503248237073, 0.0006833859952166677, 0.0007737217238172889, 0.0008640573942102492, 0.0009543930646032095, 0.0010447287932038307, 0.001135064521804452, 0.0012254001339897513, 0.0013157358625903726, 0.001406071474775672, 0.0014964072033762932, 0.0015867429319769144, 0.0016770785441622138, 0.001767414272762835, 0.0018577498849481344, 0.0019480856135487556, 0.002038421342149377, 0.002128757070749998, 0.0022190925665199757, 0.002309428295120597, 0.002399764023721218, 0.0024900997523218393, 0.0025804354809224606, 0.002670770976692438, 0.0027611067052930593, 0.0028514424338936806, 0.002941777929663658, 0.0030321136582642794, 0.0031224493868649006, 0.003212785115465522, 0.003303120844066143, 0.0033934565726667643]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 7.0, 8.0, 6.0, 17.0, 18.0, 10.0, 23.0, 23.0, 11.0, 23.0, 22.0, 25.0, 30.0, 24.0, 30.0, 34.0, 28.0, 46.0, 39.0, 41.0, 37.0, 45.0, 42.0, 36.0, 38.0, 35.0, 38.0, 26.0, 28.0, 31.0, 32.0, 16.0, 21.0, 20.0, 19.0, 13.0, 7.0, 17.0, 8.0, 3.0, 8.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008754134178161621, -0.0008452590554952621, -0.0008151046931743622, -0.0007849503308534622, -0.0007547959685325623, -0.0007246416062116623, -0.0006944872438907623, -0.0006643328815698624, -0.0006341785192489624, -0.0006040241569280624, -0.0005738697946071625, -0.0005437154322862625, -0.0005135610699653625, -0.0004834067076444626, -0.0004532523453235626, -0.00042309798300266266, -0.0003929436206817627, -0.00036278925836086273, -0.00033263489603996277, -0.0003024805337190628, -0.00027232617139816284, -0.00024217180907726288, -0.00021201744675636292, -0.00018186308443546295, -0.000151708722114563, -0.00012155435979366302, -9.139999747276306e-05, -6.12456351518631e-05, -3.1091272830963135e-05, -9.369105100631714e-07, 2.9217451810836792e-05, 5.9371814131736755e-05, 8.952617645263672e-05, 0.00011968053877353668, 0.00014983490109443665, 0.0001799892634153366, 0.00021014362573623657, 0.00024029798805713654, 0.0002704523503780365, 0.00030060671269893646, 0.0003307610750198364, 0.0003609154373407364, 0.00039106979966163635, 0.0004212241619825363, 0.0004513785243034363, 0.00048153288662433624, 0.0005116872489452362, 0.0005418416112661362, 0.0005719959735870361, 0.0006021503359079361, 0.0006323046982288361, 0.000662459060549736, 0.000692613422870636, 0.000722767785191536, 0.0007529221475124359, 0.0007830765098333359, 0.0008132308721542358, 0.0008433852344751358, 0.0008735395967960358, 0.0009036939591169357, 0.0009338483214378357, 0.0009640026837587357, 0.0009941570460796356, 0.0010243114084005356, 0.0010544657707214355]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 12.0, 10.0, 8.0, 13.0, 9.0, 14.0, 19.0, 26.0, 23.0, 30.0, 31.0, 17.0, 33.0, 36.0, 34.0, 31.0, 53.0, 39.0, 48.0, 40.0, 34.0, 32.0, 43.0, 37.0, 30.0, 35.0, 29.0, 36.0, 27.0, 20.0, 20.0, 24.0, 17.0, 10.0, 9.0, 11.0, 10.0, 9.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0], "bins": [-11.8984375, -11.5672607421875, -11.236083984375, -10.9049072265625, -10.57373046875, -10.2425537109375, -9.911376953125, -9.5802001953125, -9.2490234375, -8.9178466796875, -8.586669921875, -8.2554931640625, -7.92431640625, -7.5931396484375, -7.261962890625, -6.9307861328125, -6.599609375, -6.2684326171875, -5.937255859375, -5.6060791015625, -5.27490234375, -4.9437255859375, -4.612548828125, -4.2813720703125, -3.9501953125, -3.6190185546875, -3.287841796875, -2.9566650390625, -2.62548828125, -2.2943115234375, -1.963134765625, -1.6319580078125, -1.30078125, -0.9696044921875, -0.638427734375, -0.3072509765625, 0.02392578125, 0.3551025390625, 0.686279296875, 1.0174560546875, 1.3486328125, 1.6798095703125, 2.010986328125, 2.3421630859375, 2.67333984375, 3.0045166015625, 3.335693359375, 3.6668701171875, 3.998046875, 4.3292236328125, 4.660400390625, 4.9915771484375, 5.32275390625, 5.6539306640625, 5.985107421875, 6.3162841796875, 6.6474609375, 6.9786376953125, 7.309814453125, 7.6409912109375, 7.97216796875, 8.3033447265625, 8.634521484375, 8.9656982421875, 9.296875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 13.0, 8.0, 11.0, 17.0, 32.0, 33.0, 54.0, 58.0, 93.0, 107.0, 146.0, 196.0, 250.0, 331.0, 411.0, 519.0, 753.0, 1047.0, 1584.0, 3047.0, 9292.0, 49043.0, 275395.0, 531539.0, 138320.0, 23575.0, 5498.0, 2213.0, 1345.0, 837.0, 700.0, 498.0, 376.0, 301.0, 220.0, 135.0, 144.0, 92.0, 79.0, 58.0, 43.0, 30.0, 25.0, 24.0, 17.0, 10.0, 8.0, 12.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-22.53125, -21.8544921875, -21.177734375, -20.5009765625, -19.82421875, -19.1474609375, -18.470703125, -17.7939453125, -17.1171875, -16.4404296875, -15.763671875, -15.0869140625, -14.41015625, -13.7333984375, -13.056640625, -12.3798828125, -11.703125, -11.0263671875, -10.349609375, -9.6728515625, -8.99609375, -8.3193359375, -7.642578125, -6.9658203125, -6.2890625, -5.6123046875, -4.935546875, -4.2587890625, -3.58203125, -2.9052734375, -2.228515625, -1.5517578125, -0.875, -0.1982421875, 0.478515625, 1.1552734375, 1.83203125, 2.5087890625, 3.185546875, 3.8623046875, 4.5390625, 5.2158203125, 5.892578125, 6.5693359375, 7.24609375, 7.9228515625, 8.599609375, 9.2763671875, 9.953125, 10.6298828125, 11.306640625, 11.9833984375, 12.66015625, 13.3369140625, 14.013671875, 14.6904296875, 15.3671875, 16.0439453125, 16.720703125, 17.3974609375, 18.07421875, 18.7509765625, 19.427734375, 20.1044921875, 20.78125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 9.0, 7.0, 12.0, 12.0, 18.0, 18.0, 22.0, 27.0, 26.0, 28.0, 32.0, 44.0, 42.0, 49.0, 54.0, 100.0, 186.0, 1380.0, 329.0, 146.0, 83.0, 64.0, 49.0, 45.0, 33.0, 32.0, 30.0, 28.0, 25.0, 12.0, 19.0, 17.0, 15.0, 6.0, 11.0, 6.0, 8.0, 4.0, 9.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.015625, -30.125244140625, -29.23486328125, -28.344482421875, -27.4541015625, -26.563720703125, -25.67333984375, -24.782958984375, -23.892578125, -23.002197265625, -22.11181640625, -21.221435546875, -20.3310546875, -19.440673828125, -18.55029296875, -17.659912109375, -16.76953125, -15.879150390625, -14.98876953125, -14.098388671875, -13.2080078125, -12.317626953125, -11.42724609375, -10.536865234375, -9.646484375, -8.756103515625, -7.86572265625, -6.975341796875, -6.0849609375, -5.194580078125, -4.30419921875, -3.413818359375, -2.5234375, -1.633056640625, -0.74267578125, 0.147705078125, 1.0380859375, 1.928466796875, 2.81884765625, 3.709228515625, 4.599609375, 5.489990234375, 6.38037109375, 7.270751953125, 8.1611328125, 9.051513671875, 9.94189453125, 10.832275390625, 11.72265625, 12.613037109375, 13.50341796875, 14.393798828125, 15.2841796875, 16.174560546875, 17.06494140625, 17.955322265625, 18.845703125, 19.736083984375, 20.62646484375, 21.516845703125, 22.4072265625, 23.297607421875, 24.18798828125, 25.078369140625, 25.96875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 8.0, 3.0, 4.0, 8.0, 13.0, 17.0, 17.0, 15.0, 19.0, 24.0, 55.0, 48.0, 71.0, 105.0, 180.0, 240.0, 420.0, 831.0, 2182.0, 2957047.0, 180868.0, 1673.0, 735.0, 346.0, 214.0, 144.0, 112.0, 73.0, 65.0, 44.0, 27.0, 13.0, 17.0, 19.0, 6.0, 6.0, 10.0, 6.0, 8.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-153.75, -148.9296875, -144.109375, -139.2890625, -134.46875, -129.6484375, -124.828125, -120.0078125, -115.1875, -110.3671875, -105.546875, -100.7265625, -95.90625, -91.0859375, -86.265625, -81.4453125, -76.625, -71.8046875, -66.984375, -62.1640625, -57.34375, -52.5234375, -47.703125, -42.8828125, -38.0625, -33.2421875, -28.421875, -23.6015625, -18.78125, -13.9609375, -9.140625, -4.3203125, 0.5, 5.3203125, 10.140625, 14.9609375, 19.78125, 24.6015625, 29.421875, 34.2421875, 39.0625, 43.8828125, 48.703125, 53.5234375, 58.34375, 63.1640625, 67.984375, 72.8046875, 77.625, 82.4453125, 87.265625, 92.0859375, 96.90625, 101.7265625, 106.546875, 111.3671875, 116.1875, 121.0078125, 125.828125, 130.6484375, 135.46875, 140.2890625, 145.109375, 149.9296875, 154.75]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 51.0, 125.0, 247.0, 294.0, 196.0, 57.0, 22.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.45406341552734, -76.62646484375, -72.79886627197266, -68.97126770019531, -65.14366149902344, -61.31606674194336, -57.48846435546875, -53.660865783691406, -49.83326721191406, -46.00566864013672, -42.178070068359375, -38.350467681884766, -34.52286911010742, -30.695270538330078, -26.8676700592041, -23.040069580078125, -19.21247100830078, -15.384871482849121, -11.557271957397461, -7.729672431945801, -3.9020729064941406, -0.07447433471679688, 3.7531261444091797, 7.580726623535156, 11.4083251953125, 15.23592472076416, 19.06352424621582, 22.891124725341797, 26.71872329711914, 30.546321868896484, 34.373924255371094, 38.20152282714844, 42.02911376953125, 45.856712341308594, 49.68431091308594, 53.51191329956055, 57.33951187133789, 61.167110443115234, 64.99471282958984, 68.82231140136719, 72.64990997314453, 76.47750854492188, 80.30510711669922, 84.13270568847656, 87.96031188964844, 91.78790283203125, 95.61550903320312, 99.44310760498047, 103.27070617675781, 107.09830474853516, 110.9259033203125, 114.75350189208984, 118.58110046386719, 122.40870666503906, 126.2363052368164, 130.06390380859375, 133.89151000976562, 137.7191162109375, 141.5467071533203, 145.3743133544922, 149.201904296875, 153.02951049804688, 156.8571014404297, 160.68470764160156, 164.51229858398438]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 17.0, 14.0, 21.0, 23.0, 32.0, 34.0, 34.0, 37.0, 39.0, 32.0, 42.0, 40.0, 55.0, 38.0, 50.0, 41.0, 51.0, 36.0, 33.0, 38.0, 32.0, 33.0, 31.0, 37.0, 24.0, 14.0, 13.0, 12.0, 11.0, 4.0, 14.0, 7.0, 8.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.38371276855469, -72.91327667236328, -70.44284057617188, -67.972412109375, -65.5019760131836, -63.03153991699219, -60.56110382080078, -58.090667724609375, -55.620235443115234, -53.14979934692383, -50.67936706542969, -48.20893096923828, -45.738494873046875, -43.268062591552734, -40.79762649536133, -38.32719421386719, -35.85675811767578, -33.386322021484375, -30.915889739990234, -28.445453643798828, -25.975019454956055, -23.50458526611328, -21.034149169921875, -18.5637149810791, -16.093280792236328, -13.622846603393555, -11.152411460876465, -8.681976318359375, -6.211542129516602, -3.741107940673828, -1.2706727981567383, 1.1997623443603516, 3.6701889038085938, 6.140623569488525, 8.611058235168457, 11.081493377685547, 13.55192756652832, 16.022361755371094, 18.4927978515625, 20.963232040405273, 23.433666229248047, 25.90410041809082, 28.374534606933594, 30.844970703125, 33.315406799316406, 35.78583908081055, 38.25627517700195, 40.726707458496094, 43.1971435546875, 45.667579650878906, 48.13801193237305, 50.60844802856445, 53.078880310058594, 55.54931640625, 58.019752502441406, 60.49018859863281, 62.96062088012695, 65.4310531616211, 67.9014892578125, 70.3719253540039, 72.84236145019531, 75.31278991699219, 77.7832260131836, 80.253662109375, 82.7240982055664]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 4.0, 9.0, 5.0, 5.0, 6.0, 6.0, 8.0, 12.0, 19.0, 9.0, 13.0, 19.0, 21.0, 25.0, 20.0, 33.0, 28.0, 28.0, 35.0, 27.0, 39.0, 26.0, 43.0, 39.0, 48.0, 47.0, 35.0, 35.0, 32.0, 32.0, 27.0, 31.0, 26.0, 23.0, 21.0, 30.0, 18.0, 16.0, 18.0, 19.0, 13.0, 8.0, 7.0, 6.0, 8.0, 5.0, 6.0, 6.0, 1.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.65625, -9.346923828125, -9.03759765625, -8.728271484375, -8.4189453125, -8.109619140625, -7.80029296875, -7.490966796875, -7.181640625, -6.872314453125, -6.56298828125, -6.253662109375, -5.9443359375, -5.635009765625, -5.32568359375, -5.016357421875, -4.70703125, -4.397705078125, -4.08837890625, -3.779052734375, -3.4697265625, -3.160400390625, -2.85107421875, -2.541748046875, -2.232421875, -1.923095703125, -1.61376953125, -1.304443359375, -0.9951171875, -0.685791015625, -0.37646484375, -0.067138671875, 0.2421875, 0.551513671875, 0.86083984375, 1.170166015625, 1.4794921875, 1.788818359375, 2.09814453125, 2.407470703125, 2.716796875, 3.026123046875, 3.33544921875, 3.644775390625, 3.9541015625, 4.263427734375, 4.57275390625, 4.882080078125, 5.19140625, 5.500732421875, 5.81005859375, 6.119384765625, 6.4287109375, 6.738037109375, 7.04736328125, 7.356689453125, 7.666015625, 7.975341796875, 8.28466796875, 8.593994140625, 8.9033203125, 9.212646484375, 9.52197265625, 9.831298828125, 10.140625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 7.0, 5.0, 6.0, 13.0, 20.0, 29.0, 40.0, 65.0, 101.0, 170.0, 301.0, 569.0, 1217.0, 3337.0, 14514.0, 139888.0, 1545580.0, 2195413.0, 263702.0, 22151.0, 4317.0, 1377.0, 638.0, 366.0, 184.0, 111.0, 62.0, 44.0, 27.0, 16.0, 9.0, 6.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.03125, -22.240234375, -21.44921875, -20.658203125, -19.8671875, -19.076171875, -18.28515625, -17.494140625, -16.703125, -15.912109375, -15.12109375, -14.330078125, -13.5390625, -12.748046875, -11.95703125, -11.166015625, -10.375, -9.583984375, -8.79296875, -8.001953125, -7.2109375, -6.419921875, -5.62890625, -4.837890625, -4.046875, -3.255859375, -2.46484375, -1.673828125, -0.8828125, -0.091796875, 0.69921875, 1.490234375, 2.28125, 3.072265625, 3.86328125, 4.654296875, 5.4453125, 6.236328125, 7.02734375, 7.818359375, 8.609375, 9.400390625, 10.19140625, 10.982421875, 11.7734375, 12.564453125, 13.35546875, 14.146484375, 14.9375, 15.728515625, 16.51953125, 17.310546875, 18.1015625, 18.892578125, 19.68359375, 20.474609375, 21.265625, 22.056640625, 22.84765625, 23.638671875, 24.4296875, 25.220703125, 26.01171875, 26.802734375, 27.59375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 9.0, 10.0, 12.0, 20.0, 25.0, 46.0, 67.0, 86.0, 120.0, 156.0, 203.0, 232.0, 365.0, 435.0, 504.0, 509.0, 338.0, 223.0, 166.0, 137.0, 127.0, 77.0, 50.0, 44.0, 21.0, 21.0, 20.0, 12.0, 11.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.645751953125, -13.99462890625, -13.343505859375, -12.6923828125, -12.041259765625, -11.39013671875, -10.739013671875, -10.087890625, -9.436767578125, -8.78564453125, -8.134521484375, -7.4833984375, -6.832275390625, -6.18115234375, -5.530029296875, -4.87890625, -4.227783203125, -3.57666015625, -2.925537109375, -2.2744140625, -1.623291015625, -0.97216796875, -0.321044921875, 0.330078125, 0.981201171875, 1.63232421875, 2.283447265625, 2.9345703125, 3.585693359375, 4.23681640625, 4.887939453125, 5.5390625, 6.190185546875, 6.84130859375, 7.492431640625, 8.1435546875, 8.794677734375, 9.44580078125, 10.096923828125, 10.748046875, 11.399169921875, 12.05029296875, 12.701416015625, 13.3525390625, 14.003662109375, 14.65478515625, 15.305908203125, 15.95703125, 16.608154296875, 17.25927734375, 17.910400390625, 18.5615234375, 19.212646484375, 19.86376953125, 20.514892578125, 21.166015625, 21.817138671875, 22.46826171875, 23.119384765625, 23.7705078125, 24.421630859375, 25.07275390625, 25.723876953125, 26.375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 11.0, 20.0, 37.0, 68.0, 96.0, 220.0, 429.0, 922.0, 2425.0, 12109.0, 583521.0, 3519782.0, 67115.0, 4717.0, 1556.0, 619.0, 295.0, 145.0, 84.0, 37.0, 32.0, 12.0, 10.0, 5.0, 5.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.71875, -57.09912109375, -55.4794921875, -53.85986328125, -52.240234375, -50.62060546875, -49.0009765625, -47.38134765625, -45.76171875, -44.14208984375, -42.5224609375, -40.90283203125, -39.283203125, -37.66357421875, -36.0439453125, -34.42431640625, -32.8046875, -31.18505859375, -29.5654296875, -27.94580078125, -26.326171875, -24.70654296875, -23.0869140625, -21.46728515625, -19.84765625, -18.22802734375, -16.6083984375, -14.98876953125, -13.369140625, -11.74951171875, -10.1298828125, -8.51025390625, -6.890625, -5.27099609375, -3.6513671875, -2.03173828125, -0.412109375, 1.20751953125, 2.8271484375, 4.44677734375, 6.06640625, 7.68603515625, 9.3056640625, 10.92529296875, 12.544921875, 14.16455078125, 15.7841796875, 17.40380859375, 19.0234375, 20.64306640625, 22.2626953125, 23.88232421875, 25.501953125, 27.12158203125, 28.7412109375, 30.36083984375, 31.98046875, 33.60009765625, 35.2197265625, 36.83935546875, 38.458984375, 40.07861328125, 41.6982421875, 43.31787109375, 44.9375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 31.0, 365.0, 541.0, 71.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-304.3949890136719, -290.6909484863281, -276.9869079589844, -263.2828369140625, -249.57879638671875, -235.874755859375, -222.17071533203125, -208.4666748046875, -194.7626190185547, -181.05857849121094, -167.35452270507812, -153.65048217773438, -139.94644165039062, -126.24238586425781, -112.53834533691406, -98.83429718017578, -85.1302490234375, -71.42620086669922, -57.7221565246582, -44.01811218261719, -30.314064025878906, -16.610015869140625, -2.905975341796875, 10.798072814941406, 24.502120971679688, 38.20616912841797, 51.910213470458984, 65.6142578125, 79.31830596923828, 93.02235412597656, 106.72639465332031, 120.4304428100586, 134.134521484375, 147.83856201171875, 161.54261779785156, 175.2466583251953, 188.95071411132812, 202.65475463867188, 216.35879516601562, 230.06283569335938, 243.7668914794922, 257.470947265625, 271.17498779296875, 284.8790283203125, 298.58306884765625, 312.287109375, 325.99114990234375, 339.6952209472656, 353.3992614746094, 367.1033020019531, 380.8073425292969, 394.51141357421875, 408.2154541015625, 421.91949462890625, 435.62353515625, 449.32757568359375, 463.0316162109375, 476.73565673828125, 490.439697265625, 504.14373779296875, 517.8477783203125, 531.5518798828125, 545.255859375, 558.9599609375, 572.6640014648438]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 1.0, 11.0, 8.0, 10.0, 14.0, 12.0, 19.0, 28.0, 20.0, 19.0, 34.0, 24.0, 32.0, 43.0, 48.0, 34.0, 36.0, 38.0, 37.0, 32.0, 49.0, 43.0, 40.0, 36.0, 38.0, 34.0, 23.0, 27.0, 34.0, 24.0, 28.0, 22.0, 16.0, 19.0, 14.0, 11.0, 8.0, 9.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-86.5997543334961, -84.2680435180664, -81.93633270263672, -79.60462188720703, -77.27291107177734, -74.94120025634766, -72.60948944091797, -70.27777862548828, -67.9460678100586, -65.6143569946289, -63.28264617919922, -60.95093536376953, -58.619224548339844, -56.287513732910156, -53.95580291748047, -51.62409210205078, -49.29238510131836, -46.96067428588867, -44.628963470458984, -42.2972526550293, -39.96554183959961, -37.63383102416992, -35.3021240234375, -32.97041320800781, -30.638700485229492, -28.306989669799805, -25.975278854370117, -23.643569946289062, -21.311859130859375, -18.980148315429688, -16.6484375, -14.316726684570312, -11.985015869140625, -9.653305053710938, -7.321594715118408, -4.989884376525879, -2.6581735610961914, -0.3264627456665039, 2.005247116088867, 4.336957931518555, 6.668668746948242, 9.00037956237793, 11.332090377807617, 13.663800239562988, 15.995511054992676, 18.327220916748047, 20.658931732177734, 22.990642547607422, 25.32235336303711, 27.654064178466797, 29.985774993896484, 32.31748580932617, 34.64919662475586, 36.98090744018555, 39.31261444091797, 41.644325256347656, 43.976036071777344, 46.30774688720703, 48.63945770263672, 50.971168518066406, 53.302879333496094, 55.63459014892578, 57.96630096435547, 60.298011779785156, 62.629722595214844]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 12.0, 10.0, 12.0, 19.0, 14.0, 20.0, 17.0, 22.0, 35.0, 40.0, 41.0, 35.0, 47.0, 42.0, 44.0, 44.0, 46.0, 57.0, 56.0, 55.0, 37.0, 40.0, 28.0, 29.0, 34.0, 24.0, 23.0, 14.0, 22.0, 13.0, 8.0, 10.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.830078125, -7.55078125, -7.271484375, -6.9921875, -6.712890625, -6.43359375, -6.154296875, -5.875, -5.595703125, -5.31640625, -5.037109375, -4.7578125, -4.478515625, -4.19921875, -3.919921875, -3.640625, -3.361328125, -3.08203125, -2.802734375, -2.5234375, -2.244140625, -1.96484375, -1.685546875, -1.40625, -1.126953125, -0.84765625, -0.568359375, -0.2890625, -0.009765625, 0.26953125, 0.548828125, 0.828125, 1.107421875, 1.38671875, 1.666015625, 1.9453125, 2.224609375, 2.50390625, 2.783203125, 3.0625, 3.341796875, 3.62109375, 3.900390625, 4.1796875, 4.458984375, 4.73828125, 5.017578125, 5.296875, 5.576171875, 5.85546875, 6.134765625, 6.4140625, 6.693359375, 6.97265625, 7.251953125, 7.53125, 7.810546875, 8.08984375, 8.369140625, 8.6484375, 8.927734375, 9.20703125, 9.486328125, 9.765625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 5.0, 13.0, 16.0, 21.0, 46.0, 53.0, 89.0, 139.0, 187.0, 252.0, 402.0, 556.0, 894.0, 1300.0, 1928.0, 3065.0, 4719.0, 7388.0, 11557.0, 18179.0, 29588.0, 49267.0, 86236.0, 168477.0, 302903.0, 156554.0, 80870.0, 47097.0, 28255.0, 17255.0, 10750.0, 7244.0, 4475.0, 2926.0, 1934.0, 1267.0, 903.0, 576.0, 358.0, 250.0, 172.0, 141.0, 76.0, 57.0, 40.0, 22.0, 14.0, 16.0, 11.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-1.59765625, -1.549896240234375, -1.50213623046875, -1.454376220703125, -1.4066162109375, -1.358856201171875, -1.31109619140625, -1.263336181640625, -1.215576171875, -1.167816162109375, -1.12005615234375, -1.072296142578125, -1.0245361328125, -0.976776123046875, -0.92901611328125, -0.881256103515625, -0.83349609375, -0.785736083984375, -0.73797607421875, -0.690216064453125, -0.6424560546875, -0.594696044921875, -0.54693603515625, -0.499176025390625, -0.451416015625, -0.403656005859375, -0.35589599609375, -0.308135986328125, -0.2603759765625, -0.212615966796875, -0.16485595703125, -0.117095947265625, -0.0693359375, -0.021575927734375, 0.02618408203125, 0.073944091796875, 0.1217041015625, 0.169464111328125, 0.21722412109375, 0.264984130859375, 0.312744140625, 0.360504150390625, 0.40826416015625, 0.456024169921875, 0.5037841796875, 0.551544189453125, 0.59930419921875, 0.647064208984375, 0.69482421875, 0.742584228515625, 0.79034423828125, 0.838104248046875, 0.8858642578125, 0.933624267578125, 0.98138427734375, 1.029144287109375, 1.076904296875, 1.124664306640625, 1.17242431640625, 1.220184326171875, 1.2679443359375, 1.315704345703125, 1.36346435546875, 1.411224365234375, 1.458984375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 5.0, 9.0, 7.0, 11.0, 12.0, 20.0, 12.0, 15.0, 19.0, 33.0, 24.0, 35.0, 42.0, 40.0, 28.0, 38.0, 30.0, 51.0, 45.0, 1067.0, 39.0, 36.0, 33.0, 45.0, 33.0, 34.0, 33.0, 28.0, 30.0, 16.0, 21.0, 20.0, 14.0, 16.0, 17.0, 17.0, 11.0, 9.0, 8.0, 3.0, 9.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.26580810546875, -5.1058349609375, -4.94586181640625, -4.785888671875, -4.62591552734375, -4.4659423828125, -4.30596923828125, -4.14599609375, -3.98602294921875, -3.8260498046875, -3.66607666015625, -3.506103515625, -3.34613037109375, -3.1861572265625, -3.02618408203125, -2.8662109375, -2.70623779296875, -2.5462646484375, -2.38629150390625, -2.226318359375, -2.06634521484375, -1.9063720703125, -1.74639892578125, -1.58642578125, -1.42645263671875, -1.2664794921875, -1.10650634765625, -0.946533203125, -0.78656005859375, -0.6265869140625, -0.46661376953125, -0.306640625, -0.14666748046875, 0.0133056640625, 0.17327880859375, 0.333251953125, 0.49322509765625, 0.6531982421875, 0.81317138671875, 0.97314453125, 1.13311767578125, 1.2930908203125, 1.45306396484375, 1.613037109375, 1.77301025390625, 1.9329833984375, 2.09295654296875, 2.2529296875, 2.41290283203125, 2.5728759765625, 2.73284912109375, 2.892822265625, 3.05279541015625, 3.2127685546875, 3.37274169921875, 3.53271484375, 3.69268798828125, 3.8526611328125, 4.01263427734375, 4.172607421875, 4.33258056640625, 4.4925537109375, 4.65252685546875, 4.8125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 10.0, 9.0, 12.0, 14.0, 28.0, 45.0, 69.0, 85.0, 114.0, 153.0, 260.0, 328.0, 479.0, 752.0, 1074.0, 1645.0, 2569.0, 4079.0, 6310.0, 10009.0, 16062.0, 25806.0, 42205.0, 73307.0, 138424.0, 1325299.0, 204662.0, 100038.0, 55248.0, 32813.0, 20083.0, 12314.0, 8114.0, 5136.0, 3208.0, 2048.0, 1428.0, 966.0, 642.0, 412.0, 285.0, 194.0, 124.0, 68.0, 68.0, 46.0, 27.0, 20.0, 11.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.3427734375, -1.2976531982421875, -1.252532958984375, -1.2074127197265625, -1.16229248046875, -1.1171722412109375, -1.072052001953125, -1.0269317626953125, -0.9818115234375, -0.9366912841796875, -0.891571044921875, -0.8464508056640625, -0.80133056640625, -0.7562103271484375, -0.711090087890625, -0.6659698486328125, -0.620849609375, -0.5757293701171875, -0.530609130859375, -0.4854888916015625, -0.44036865234375, -0.3952484130859375, -0.350128173828125, -0.3050079345703125, -0.2598876953125, -0.2147674560546875, -0.169647216796875, -0.1245269775390625, -0.07940673828125, -0.0342864990234375, 0.010833740234375, 0.0559539794921875, 0.10107421875, 0.1461944580078125, 0.191314697265625, 0.2364349365234375, 0.28155517578125, 0.3266754150390625, 0.371795654296875, 0.4169158935546875, 0.4620361328125, 0.5071563720703125, 0.552276611328125, 0.5973968505859375, 0.64251708984375, 0.6876373291015625, 0.732757568359375, 0.7778778076171875, 0.822998046875, 0.8681182861328125, 0.913238525390625, 0.9583587646484375, 1.00347900390625, 1.0485992431640625, 1.093719482421875, 1.1388397216796875, 1.1839599609375, 1.2290802001953125, 1.274200439453125, 1.3193206787109375, 1.36444091796875, 1.4095611572265625, 1.454681396484375, 1.4998016357421875, 1.544921875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 3.0, 8.0, 5.0, 9.0, 12.0, 20.0, 21.0, 24.0, 28.0, 47.0, 57.0, 82.0, 108.0, 86.0, 94.0, 78.0, 76.0, 51.0, 40.0, 26.0, 20.0, 16.0, 20.0, 9.0, 15.0, 12.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021381378173828125, -0.0020641982555389404, -0.0019902586936950684, -0.0019163191318511963, -0.0018423795700073242, -0.0017684400081634521, -0.00169450044631958, -0.001620560884475708, -0.001546621322631836, -0.0014726817607879639, -0.0013987421989440918, -0.0013248026371002197, -0.0012508630752563477, -0.0011769235134124756, -0.0011029839515686035, -0.0010290443897247314, -0.0009551048278808594, -0.0008811652660369873, -0.0008072257041931152, -0.0007332861423492432, -0.0006593465805053711, -0.000585407018661499, -0.000511467456817627, -0.0004375278949737549, -0.0003635883331298828, -0.00028964877128601074, -0.00021570920944213867, -0.0001417696475982666, -6.783008575439453e-05, 6.109476089477539e-06, 8.004903793334961e-05, 0.00015398859977722168, 0.00022792816162109375, 0.0003018677234649658, 0.0003758072853088379, 0.00044974684715270996, 0.000523686408996582, 0.0005976259708404541, 0.0006715655326843262, 0.0007455050945281982, 0.0008194446563720703, 0.0008933842182159424, 0.0009673237800598145, 0.0010412633419036865, 0.0011152029037475586, 0.0011891424655914307, 0.0012630820274353027, 0.0013370215892791748, 0.0014109611511230469, 0.001484900712966919, 0.001558840274810791, 0.001632779836654663, 0.0017067193984985352, 0.0017806589603424072, 0.0018545985221862793, 0.0019285380840301514, 0.0020024776458740234, 0.0020764172077178955, 0.0021503567695617676, 0.0022242963314056396, 0.0022982358932495117, 0.002372175455093384, 0.002446115016937256, 0.002520054578781128, 0.002593994140625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 7.0, 4.0, 8.0, 12.0, 21.0, 31.0, 32.0, 44.0, 39.0, 74.0, 88.0, 173.0, 283.0, 577.0, 1784.0, 994972.0, 48168.0, 1082.0, 435.0, 218.0, 154.0, 75.0, 74.0, 44.0, 37.0, 15.0, 22.0, 14.0, 11.0, 10.0, 4.0, 3.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.049346923828125, -0.047928810119628906, -0.04651069641113281, -0.04509258270263672, -0.043674468994140625, -0.04225635528564453, -0.04083824157714844, -0.039420127868652344, -0.03800201416015625, -0.036583900451660156, -0.03516578674316406, -0.03374767303466797, -0.032329559326171875, -0.03091144561767578, -0.029493331909179688, -0.028075218200683594, -0.0266571044921875, -0.025238990783691406, -0.023820877075195312, -0.02240276336669922, -0.020984649658203125, -0.01956653594970703, -0.018148422241210938, -0.016730308532714844, -0.01531219482421875, -0.013894081115722656, -0.012475967407226562, -0.011057853698730469, -0.009639739990234375, -0.008221626281738281, -0.0068035125732421875, -0.005385398864746094, -0.00396728515625, -0.0025491714477539062, -0.0011310577392578125, 0.00028705596923828125, 0.001705169677734375, 0.0031232833862304688, 0.0045413970947265625, 0.005959510803222656, 0.00737762451171875, 0.008795738220214844, 0.010213851928710938, 0.011631965637207031, 0.013050079345703125, 0.014468193054199219, 0.015886306762695312, 0.017304420471191406, 0.0187225341796875, 0.020140647888183594, 0.021558761596679688, 0.02297687530517578, 0.024394989013671875, 0.02581310272216797, 0.027231216430664062, 0.028649330139160156, 0.03006744384765625, 0.031485557556152344, 0.03290367126464844, 0.03432178497314453, 0.035739898681640625, 0.03715801239013672, 0.03857612609863281, 0.039994239807128906, 0.041412353515625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 52.0, 439.0, 468.0, 50.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007968557998538017, -0.007787508890032768, -0.007606459315866232, -0.007425410207360983, -0.007244361098855734, -0.007063311990350485, -0.0068822624161839485, -0.0067012133076786995, -0.0065201641991734505, -0.0063391150906682014, -0.006158065516501665, -0.005977016407996416, -0.005795967299491167, -0.005614918190985918, -0.005433868616819382, -0.005252819508314133, -0.005071770399808884, -0.004890721291303635, -0.004709671717137098, -0.004528622608631849, -0.0043475735001266, -0.004166524391621351, -0.003985474817454815, -0.003804425708949566, -0.0036233761347830296, -0.003442326793447137, -0.003261277684941888, -0.003080228343605995, -0.002899179235100746, -0.0027181298937648535, -0.002537080552428961, -0.0023560314439237118, -0.002174982102587819, -0.0019939327612519264, -0.0018128836527466774, -0.0016318343114107847, -0.0014507852029055357, -0.001269735861569643, -0.0010886866366490722, -0.0009076374117285013, -0.0007265881868079305, -0.0005455389618873596, -0.0003644897078629583, -0.000183440453838557, -2.3912289179861546e-06, 0.0001786579960025847, 0.00035970727913081646, 0.0005407565040513873, 0.0007218057289719582, 0.000902854953892529, 0.0010839041788130999, 0.0012649535201489925, 0.0014460026286542416, 0.0016270519699901342, 0.001808101194910705, 0.001989150419831276, 0.002170199528336525, 0.0023512488696724176, 0.0025322979781776667, 0.0027133473195135593, 0.0028943964280188084, 0.003075445769354701, 0.0032564951106905937, 0.0034375442191958427, 0.0036185935605317354]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 6.0, 7.0, 12.0, 12.0, 13.0, 18.0, 21.0, 24.0, 25.0, 39.0, 37.0, 38.0, 40.0, 41.0, 57.0, 57.0, 41.0, 52.0, 36.0, 49.0, 34.0, 28.0, 38.0, 38.0, 24.0, 30.0, 43.0, 23.0, 26.0, 22.0, 14.0, 15.0, 13.0, 9.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013026595115661621, -0.0012666219845414162, -0.0012305844575166702, -0.0011945469304919243, -0.0011585094034671783, -0.0011224718764424324, -0.0010864343494176865, -0.0010503968223929405, -0.0010143592953681946, -0.0009783217683434486, -0.0009422842413187027, -0.0009062467142939568, -0.0008702091872692108, -0.0008341716602444649, -0.0007981341332197189, -0.000762096606194973, -0.000726059079170227, -0.0006900215521454811, -0.0006539840251207352, -0.0006179464980959892, -0.0005819089710712433, -0.0005458714440464973, -0.0005098339170217514, -0.00047379638999700546, -0.0004377588629722595, -0.0004017213359475136, -0.00036568380892276764, -0.0003296462818980217, -0.00029360875487327576, -0.0002575712278485298, -0.00022153370082378387, -0.00018549617379903793, -0.000149458646774292, -0.00011342111974954605, -7.738359272480011e-05, -4.134606570005417e-05, -5.3085386753082275e-06, 3.0728988349437714e-05, 6.676651537418365e-05, 0.0001028040423989296, 0.00013884156942367554, 0.00017487909644842148, 0.00021091662347316742, 0.00024695415049791336, 0.0002829916775226593, 0.00031902920454740524, 0.0003550667315721512, 0.0003911042585968971, 0.00042714178562164307, 0.000463179312646389, 0.000499216839671135, 0.0005352543666958809, 0.0005712918937206268, 0.0006073294207453728, 0.0006433669477701187, 0.0006794044747948647, 0.0007154420018196106, 0.0007514795288443565, 0.0007875170558691025, 0.0008235545828938484, 0.0008595921099185944, 0.0008956296369433403, 0.0009316671639680862, 0.0009677046909928322, 0.0010037422180175781]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 12.0, 10.0, 12.0, 19.0, 14.0, 20.0, 17.0, 22.0, 35.0, 40.0, 41.0, 35.0, 47.0, 42.0, 44.0, 44.0, 46.0, 57.0, 56.0, 55.0, 37.0, 40.0, 28.0, 29.0, 34.0, 24.0, 23.0, 14.0, 22.0, 13.0, 8.0, 10.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.830078125, -7.55078125, -7.271484375, -6.9921875, -6.712890625, -6.43359375, -6.154296875, -5.875, -5.595703125, -5.31640625, -5.037109375, -4.7578125, -4.478515625, -4.19921875, -3.919921875, -3.640625, -3.361328125, -3.08203125, -2.802734375, -2.5234375, -2.244140625, -1.96484375, -1.685546875, -1.40625, -1.126953125, -0.84765625, -0.568359375, -0.2890625, -0.009765625, 0.26953125, 0.548828125, 0.828125, 1.107421875, 1.38671875, 1.666015625, 1.9453125, 2.224609375, 2.50390625, 2.783203125, 3.0625, 3.341796875, 3.62109375, 3.900390625, 4.1796875, 4.458984375, 4.73828125, 5.017578125, 5.296875, 5.576171875, 5.85546875, 6.134765625, 6.4140625, 6.693359375, 6.97265625, 7.251953125, 7.53125, 7.810546875, 8.08984375, 8.369140625, 8.6484375, 8.927734375, 9.20703125, 9.486328125, 9.765625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 11.0, 15.0, 25.0, 14.0, 35.0, 48.0, 68.0, 79.0, 119.0, 159.0, 191.0, 272.0, 365.0, 464.0, 675.0, 886.0, 1322.0, 1904.0, 2932.0, 5942.0, 24672.0, 217108.0, 667859.0, 97281.0, 13309.0, 4476.0, 2455.0, 1670.0, 1086.0, 776.0, 628.0, 440.0, 326.0, 249.0, 182.0, 119.0, 102.0, 75.0, 61.0, 50.0, 38.0, 20.0, 24.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.765625, -22.061279296875, -21.35693359375, -20.652587890625, -19.9482421875, -19.243896484375, -18.53955078125, -17.835205078125, -17.130859375, -16.426513671875, -15.72216796875, -15.017822265625, -14.3134765625, -13.609130859375, -12.90478515625, -12.200439453125, -11.49609375, -10.791748046875, -10.08740234375, -9.383056640625, -8.6787109375, -7.974365234375, -7.27001953125, -6.565673828125, -5.861328125, -5.156982421875, -4.45263671875, -3.748291015625, -3.0439453125, -2.339599609375, -1.63525390625, -0.930908203125, -0.2265625, 0.477783203125, 1.18212890625, 1.886474609375, 2.5908203125, 3.295166015625, 3.99951171875, 4.703857421875, 5.408203125, 6.112548828125, 6.81689453125, 7.521240234375, 8.2255859375, 8.929931640625, 9.63427734375, 10.338623046875, 11.04296875, 11.747314453125, 12.45166015625, 13.156005859375, 13.8603515625, 14.564697265625, 15.26904296875, 15.973388671875, 16.677734375, 17.382080078125, 18.08642578125, 18.790771484375, 19.4951171875, 20.199462890625, 20.90380859375, 21.608154296875, 22.3125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 6.0, 4.0, 4.0, 6.0, 6.0, 12.0, 11.0, 12.0, 14.0, 17.0, 25.0, 30.0, 26.0, 38.0, 40.0, 45.0, 53.0, 82.0, 104.0, 174.0, 1381.0, 296.0, 171.0, 95.0, 66.0, 50.0, 44.0, 29.0, 33.0, 29.0, 24.0, 17.0, 13.0, 16.0, 16.0, 11.0, 11.0, 7.0, 4.0, 4.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.3125, -19.673828125, -19.03515625, -18.396484375, -17.7578125, -17.119140625, -16.48046875, -15.841796875, -15.203125, -14.564453125, -13.92578125, -13.287109375, -12.6484375, -12.009765625, -11.37109375, -10.732421875, -10.09375, -9.455078125, -8.81640625, -8.177734375, -7.5390625, -6.900390625, -6.26171875, -5.623046875, -4.984375, -4.345703125, -3.70703125, -3.068359375, -2.4296875, -1.791015625, -1.15234375, -0.513671875, 0.125, 0.763671875, 1.40234375, 2.041015625, 2.6796875, 3.318359375, 3.95703125, 4.595703125, 5.234375, 5.873046875, 6.51171875, 7.150390625, 7.7890625, 8.427734375, 9.06640625, 9.705078125, 10.34375, 10.982421875, 11.62109375, 12.259765625, 12.8984375, 13.537109375, 14.17578125, 14.814453125, 15.453125, 16.091796875, 16.73046875, 17.369140625, 18.0078125, 18.646484375, 19.28515625, 19.923828125, 20.5625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 5.0, 7.0, 9.0, 5.0, 10.0, 11.0, 18.0, 20.0, 16.0, 24.0, 33.0, 35.0, 62.0, 80.0, 91.0, 187.0, 276.0, 475.0, 851.0, 1821.0, 9529.0, 3113808.0, 14021.0, 2040.0, 889.0, 480.0, 271.0, 165.0, 106.0, 83.0, 77.0, 36.0, 32.0, 28.0, 26.0, 17.0, 13.0, 15.0, 11.0, 6.0, 6.0, 1.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.1875, -74.4833984375, -71.779296875, -69.0751953125, -66.37109375, -63.6669921875, -60.962890625, -58.2587890625, -55.5546875, -52.8505859375, -50.146484375, -47.4423828125, -44.73828125, -42.0341796875, -39.330078125, -36.6259765625, -33.921875, -31.2177734375, -28.513671875, -25.8095703125, -23.10546875, -20.4013671875, -17.697265625, -14.9931640625, -12.2890625, -9.5849609375, -6.880859375, -4.1767578125, -1.47265625, 1.2314453125, 3.935546875, 6.6396484375, 9.34375, 12.0478515625, 14.751953125, 17.4560546875, 20.16015625, 22.8642578125, 25.568359375, 28.2724609375, 30.9765625, 33.6806640625, 36.384765625, 39.0888671875, 41.79296875, 44.4970703125, 47.201171875, 49.9052734375, 52.609375, 55.3134765625, 58.017578125, 60.7216796875, 63.42578125, 66.1298828125, 68.833984375, 71.5380859375, 74.2421875, 76.9462890625, 79.650390625, 82.3544921875, 85.05859375, 87.7626953125, 90.466796875, 93.1708984375, 95.875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 13.0, 40.0, 90.0, 131.0, 166.0, 197.0, 173.0, 103.0, 57.0, 15.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-143.60562133789062, -140.67494201660156, -137.7442626953125, -134.81358337402344, -131.88290405273438, -128.9522247314453, -126.02153778076172, -123.09085845947266, -120.1601791381836, -117.22949981689453, -114.29882049560547, -111.3681411743164, -108.43745422363281, -105.50677490234375, -102.57609558105469, -99.64541625976562, -96.71473693847656, -93.7840576171875, -90.85337829589844, -87.92269897460938, -84.99201965332031, -82.06133270263672, -79.13065338134766, -76.1999740600586, -73.26929473876953, -70.33861541748047, -67.4079360961914, -64.47725677490234, -61.546573638916016, -58.61589431762695, -55.685211181640625, -52.75453186035156, -49.82384490966797, -46.893165588378906, -43.962486267089844, -41.031803131103516, -38.10112380981445, -35.17044448852539, -32.23976135253906, -29.30908203125, -26.378402709960938, -23.447723388671875, -20.51704216003418, -17.586360931396484, -14.655681610107422, -11.725001335144043, -8.794321060180664, -5.863639831542969, -2.9329605102539062, -0.0022802352905273438, 2.9284000396728516, 5.8590803146362305, 8.78976058959961, 11.720440864562988, 14.651121139526367, 17.581802368164062, 20.512481689453125, 23.443161010742188, 26.373842239379883, 29.304523468017578, 32.23520278930664, 35.1658821105957, 38.09656524658203, 41.027244567871094, 43.957923889160156]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 9.0, 4.0, 5.0, 8.0, 13.0, 16.0, 8.0, 17.0, 12.0, 23.0, 16.0, 29.0, 26.0, 27.0, 20.0, 35.0, 38.0, 34.0, 47.0, 41.0, 34.0, 46.0, 36.0, 29.0, 30.0, 34.0, 41.0, 35.0, 43.0, 25.0, 28.0, 22.0, 19.0, 22.0, 15.0, 23.0, 16.0, 15.0, 6.0, 11.0, 6.0, 6.0, 9.0, 7.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-50.77208709716797, -49.114017486572266, -47.45595169067383, -45.797882080078125, -44.13981246948242, -42.48174285888672, -40.82367706298828, -39.16560745239258, -37.507537841796875, -35.84946823120117, -34.191402435302734, -32.53333282470703, -30.875263214111328, -29.217195510864258, -27.559127807617188, -25.901058197021484, -24.242990493774414, -22.584922790527344, -20.92685317993164, -19.26878547668457, -17.610715866088867, -15.952648162841797, -14.29457950592041, -12.636510848999023, -10.978442192077637, -9.32037353515625, -7.662304878234863, -6.004236698150635, -4.346168041229248, -2.6880998611450195, -1.0300312042236328, 0.6280374526977539, 2.2861061096191406, 3.9441747665405273, 5.602243423461914, 7.260311603546143, 8.918380737304688, 10.576448440551758, 12.234517097473145, 13.892585754394531, 15.550654411315918, 17.208723068237305, 18.866790771484375, 20.524860382080078, 22.18292808532715, 23.84099578857422, 25.499065399169922, 27.157135009765625, 28.815202713012695, 30.473270416259766, 32.13134002685547, 33.78940963745117, 35.44747543334961, 37.10554504394531, 38.763614654541016, 40.42168426513672, 42.079750061035156, 43.73781967163086, 45.3958854675293, 47.053955078125, 48.7120246887207, 50.370094299316406, 52.028160095214844, 53.68622970581055, 55.34429931640625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 8.0, 2.0, 8.0, 13.0, 9.0, 15.0, 16.0, 13.0, 15.0, 16.0, 23.0, 21.0, 26.0, 28.0, 27.0, 49.0, 41.0, 45.0, 52.0, 47.0, 48.0, 45.0, 43.0, 50.0, 47.0, 30.0, 44.0, 34.0, 28.0, 24.0, 20.0, 19.0, 17.0, 15.0, 12.0, 16.0, 8.0, 4.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.77734375, -7.50177001953125, -7.2261962890625, -6.95062255859375, -6.675048828125, -6.39947509765625, -6.1239013671875, -5.84832763671875, -5.57275390625, -5.29718017578125, -5.0216064453125, -4.74603271484375, -4.470458984375, -4.19488525390625, -3.9193115234375, -3.64373779296875, -3.3681640625, -3.09259033203125, -2.8170166015625, -2.54144287109375, -2.265869140625, -1.99029541015625, -1.7147216796875, -1.43914794921875, -1.16357421875, -0.88800048828125, -0.6124267578125, -0.33685302734375, -0.061279296875, 0.21429443359375, 0.4898681640625, 0.76544189453125, 1.041015625, 1.31658935546875, 1.5921630859375, 1.86773681640625, 2.143310546875, 2.41888427734375, 2.6944580078125, 2.97003173828125, 3.24560546875, 3.52117919921875, 3.7967529296875, 4.07232666015625, 4.347900390625, 4.62347412109375, 4.8990478515625, 5.17462158203125, 5.4501953125, 5.72576904296875, 6.0013427734375, 6.27691650390625, 6.552490234375, 6.82806396484375, 7.1036376953125, 7.37921142578125, 7.65478515625, 7.93035888671875, 8.2059326171875, 8.48150634765625, 8.757080078125, 9.03265380859375, 9.3082275390625, 9.58380126953125, 9.859375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 5.0, 8.0, 5.0, 9.0, 15.0, 16.0, 20.0, 36.0, 30.0, 41.0, 50.0, 81.0, 115.0, 166.0, 266.0, 515.0, 994.0, 2269.0, 6251.0, 24271.0, 199049.0, 1773990.0, 1916626.0, 231688.0, 26442.0, 6589.0, 2369.0, 964.0, 496.0, 275.0, 164.0, 130.0, 88.0, 47.0, 51.0, 41.0, 29.0, 21.0, 9.0, 12.0, 12.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.671875, -18.070068359375, -17.46826171875, -16.866455078125, -16.2646484375, -15.662841796875, -15.06103515625, -14.459228515625, -13.857421875, -13.255615234375, -12.65380859375, -12.052001953125, -11.4501953125, -10.848388671875, -10.24658203125, -9.644775390625, -9.04296875, -8.441162109375, -7.83935546875, -7.237548828125, -6.6357421875, -6.033935546875, -5.43212890625, -4.830322265625, -4.228515625, -3.626708984375, -3.02490234375, -2.423095703125, -1.8212890625, -1.219482421875, -0.61767578125, -0.015869140625, 0.5859375, 1.187744140625, 1.78955078125, 2.391357421875, 2.9931640625, 3.594970703125, 4.19677734375, 4.798583984375, 5.400390625, 6.002197265625, 6.60400390625, 7.205810546875, 7.8076171875, 8.409423828125, 9.01123046875, 9.613037109375, 10.21484375, 10.816650390625, 11.41845703125, 12.020263671875, 12.6220703125, 13.223876953125, 13.82568359375, 14.427490234375, 15.029296875, 15.631103515625, 16.23291015625, 16.834716796875, 17.4365234375, 18.038330078125, 18.64013671875, 19.241943359375, 19.84375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 18.0, 30.0, 53.0, 76.0, 149.0, 226.0, 372.0, 628.0, 807.0, 693.0, 426.0, 243.0, 140.0, 85.0, 45.0, 30.0, 16.0, 10.0, 9.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.125, -28.283935546875, -27.44287109375, -26.601806640625, -25.7607421875, -24.919677734375, -24.07861328125, -23.237548828125, -22.396484375, -21.555419921875, -20.71435546875, -19.873291015625, -19.0322265625, -18.191162109375, -17.35009765625, -16.509033203125, -15.66796875, -14.826904296875, -13.98583984375, -13.144775390625, -12.3037109375, -11.462646484375, -10.62158203125, -9.780517578125, -8.939453125, -8.098388671875, -7.25732421875, -6.416259765625, -5.5751953125, -4.734130859375, -3.89306640625, -3.052001953125, -2.2109375, -1.369873046875, -0.52880859375, 0.312255859375, 1.1533203125, 1.994384765625, 2.83544921875, 3.676513671875, 4.517578125, 5.358642578125, 6.19970703125, 7.040771484375, 7.8818359375, 8.722900390625, 9.56396484375, 10.405029296875, 11.24609375, 12.087158203125, 12.92822265625, 13.769287109375, 14.6103515625, 15.451416015625, 16.29248046875, 17.133544921875, 17.974609375, 18.815673828125, 19.65673828125, 20.497802734375, 21.3388671875, 22.179931640625, 23.02099609375, 23.862060546875, 24.703125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 11.0, 11.0, 22.0, 41.0, 81.0, 178.0, 413.0, 1384.0, 7693.0, 3202234.0, 974878.0, 5364.0, 1163.0, 468.0, 174.0, 75.0, 45.0, 14.0, 12.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.8125, -65.619140625, -63.42578125, -61.232421875, -59.0390625, -56.845703125, -54.65234375, -52.458984375, -50.265625, -48.072265625, -45.87890625, -43.685546875, -41.4921875, -39.298828125, -37.10546875, -34.912109375, -32.71875, -30.525390625, -28.33203125, -26.138671875, -23.9453125, -21.751953125, -19.55859375, -17.365234375, -15.171875, -12.978515625, -10.78515625, -8.591796875, -6.3984375, -4.205078125, -2.01171875, 0.181640625, 2.375, 4.568359375, 6.76171875, 8.955078125, 11.1484375, 13.341796875, 15.53515625, 17.728515625, 19.921875, 22.115234375, 24.30859375, 26.501953125, 28.6953125, 30.888671875, 33.08203125, 35.275390625, 37.46875, 39.662109375, 41.85546875, 44.048828125, 46.2421875, 48.435546875, 50.62890625, 52.822265625, 55.015625, 57.208984375, 59.40234375, 61.595703125, 63.7890625, 65.982421875, 68.17578125, 70.369140625, 72.5625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 116.0, 683.0, 205.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-351.81243896484375, -338.5679016113281, -325.3233337402344, -312.07879638671875, -298.834228515625, -285.5896911621094, -272.34515380859375, -259.1005859375, -245.85604858398438, -232.6114959716797, -219.366943359375, -206.12240600585938, -192.8778533935547, -179.63330078125, -166.38876342773438, -153.1442108154297, -139.899658203125, -126.65510559082031, -113.41056060791016, -100.166015625, -86.92146301269531, -73.67691040039062, -60.43236541748047, -47.18782043457031, -33.943267822265625, -20.698719024658203, -7.454170227050781, 5.790378570556641, 19.034927368164062, 32.27947998046875, 45.524024963378906, 58.76856994628906, 72.01309204101562, 85.25764465332031, 98.50218963623047, 111.74673461914062, 124.99128723144531, 138.23583984375, 151.48037719726562, 164.7249298095703, 177.969482421875, 191.2140350341797, 204.45858764648438, 217.703125, 230.9476776123047, 244.19223022460938, 257.436767578125, 270.68133544921875, 283.9258728027344, 297.17041015625, 310.41497802734375, 323.6595153808594, 336.904052734375, 350.14862060546875, 363.3931579589844, 376.6376953125, 389.88226318359375, 403.1268005371094, 416.3713684082031, 429.61590576171875, 442.8604736328125, 456.1050109863281, 469.34954833984375, 482.5941162109375, 495.8386535644531]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 13.0, 12.0, 14.0, 16.0, 14.0, 18.0, 25.0, 33.0, 36.0, 34.0, 37.0, 39.0, 32.0, 36.0, 48.0, 38.0, 49.0, 47.0, 46.0, 43.0, 40.0, 39.0, 44.0, 29.0, 36.0, 26.0, 38.0, 22.0, 19.0, 16.0, 12.0, 8.0, 15.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.49935913085938, -63.37350082397461, -61.247642517089844, -59.12178421020508, -56.99592590332031, -54.87006759643555, -52.74420928955078, -50.618350982666016, -48.49249267578125, -46.366634368896484, -44.24077606201172, -42.11491775512695, -39.98905944824219, -37.86320114135742, -35.737342834472656, -33.61148452758789, -31.485626220703125, -29.35976791381836, -27.233909606933594, -25.108051300048828, -22.982192993164062, -20.856334686279297, -18.73047637939453, -16.604618072509766, -14.478759765625, -12.352901458740234, -10.227043151855469, -8.101184844970703, -5.9753265380859375, -3.849468231201172, -1.7236099243164062, 0.4022483825683594, 2.5281143188476562, 4.653972625732422, 6.7798309326171875, 8.905689239501953, 11.031547546386719, 13.157405853271484, 15.28326416015625, 17.409122467041016, 19.53498077392578, 21.660839080810547, 23.786697387695312, 25.912555694580078, 28.038414001464844, 30.16427230834961, 32.290130615234375, 34.41598892211914, 36.541847229003906, 38.66770553588867, 40.79356384277344, 42.9194221496582, 45.04528045654297, 47.171138763427734, 49.2969970703125, 51.422855377197266, 53.54871368408203, 55.6745719909668, 57.80043029785156, 59.92628860473633, 62.052146911621094, 64.17800903320312, 66.30386352539062, 68.42971801757812, 70.55558013916016]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 4.0, 4.0, 8.0, 3.0, 6.0, 12.0, 9.0, 8.0, 15.0, 16.0, 16.0, 26.0, 21.0, 21.0, 44.0, 28.0, 27.0, 27.0, 43.0, 49.0, 47.0, 57.0, 37.0, 50.0, 40.0, 39.0, 39.0, 35.0, 29.0, 37.0, 22.0, 33.0, 20.0, 20.0, 26.0, 21.0, 6.0, 13.0, 7.0, 13.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.91015625, -6.70269775390625, -6.4952392578125, -6.28778076171875, -6.080322265625, -5.87286376953125, -5.6654052734375, -5.45794677734375, -5.25048828125, -5.04302978515625, -4.8355712890625, -4.62811279296875, -4.420654296875, -4.21319580078125, -4.0057373046875, -3.79827880859375, -3.5908203125, -3.38336181640625, -3.1759033203125, -2.96844482421875, -2.760986328125, -2.55352783203125, -2.3460693359375, -2.13861083984375, -1.93115234375, -1.72369384765625, -1.5162353515625, -1.30877685546875, -1.101318359375, -0.89385986328125, -0.6864013671875, -0.47894287109375, -0.271484375, -0.06402587890625, 0.1434326171875, 0.35089111328125, 0.558349609375, 0.76580810546875, 0.9732666015625, 1.18072509765625, 1.38818359375, 1.59564208984375, 1.8031005859375, 2.01055908203125, 2.218017578125, 2.42547607421875, 2.6329345703125, 2.84039306640625, 3.0478515625, 3.25531005859375, 3.4627685546875, 3.67022705078125, 3.877685546875, 4.08514404296875, 4.2926025390625, 4.50006103515625, 4.70751953125, 4.91497802734375, 5.1224365234375, 5.32989501953125, 5.537353515625, 5.74481201171875, 5.9522705078125, 6.15972900390625, 6.3671875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 10.0, 10.0, 30.0, 24.0, 42.0, 54.0, 80.0, 147.0, 176.0, 268.0, 368.0, 506.0, 733.0, 998.0, 1409.0, 2040.0, 2853.0, 4315.0, 5991.0, 8585.0, 12674.0, 18621.0, 27352.0, 41704.0, 67471.0, 119487.0, 229991.0, 209668.0, 108203.0, 63007.0, 39358.0, 25947.0, 17449.0, 11811.0, 8241.0, 5689.0, 3907.0, 2762.0, 1960.0, 1345.0, 956.0, 673.0, 482.0, 363.0, 228.0, 176.0, 151.0, 92.0, 62.0, 38.0, 22.0, 13.0, 10.0, 6.0, 7.0, 0.0, 2.0, 2.0], "bins": [-0.98095703125, -0.9511642456054688, -0.9213714599609375, -0.8915786743164062, -0.861785888671875, -0.8319931030273438, -0.8022003173828125, -0.7724075317382812, -0.74261474609375, -0.7128219604492188, -0.6830291748046875, -0.6532363891601562, -0.623443603515625, -0.5936508178710938, -0.5638580322265625, -0.5340652465820312, -0.5042724609375, -0.47447967529296875, -0.4446868896484375, -0.41489410400390625, -0.385101318359375, -0.35530853271484375, -0.3255157470703125, -0.29572296142578125, -0.26593017578125, -0.23613739013671875, -0.2063446044921875, -0.17655181884765625, -0.146759033203125, -0.11696624755859375, -0.0871734619140625, -0.05738067626953125, -0.027587890625, 0.00220489501953125, 0.0319976806640625, 0.06179046630859375, 0.091583251953125, 0.12137603759765625, 0.1511688232421875, 0.18096160888671875, 0.21075439453125, 0.24054718017578125, 0.2703399658203125, 0.30013275146484375, 0.329925537109375, 0.35971832275390625, 0.3895111083984375, 0.41930389404296875, 0.4490966796875, 0.47888946533203125, 0.5086822509765625, 0.5384750366210938, 0.568267822265625, 0.5980606079101562, 0.6278533935546875, 0.6576461791992188, 0.68743896484375, 0.7172317504882812, 0.7470245361328125, 0.7768173217773438, 0.806610107421875, 0.8364028930664062, 0.8661956787109375, 0.8959884643554688, 0.92578125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 3.0, 6.0, 6.0, 6.0, 13.0, 10.0, 22.0, 16.0, 17.0, 19.0, 36.0, 40.0, 32.0, 23.0, 38.0, 35.0, 49.0, 46.0, 35.0, 48.0, 1053.0, 45.0, 49.0, 45.0, 50.0, 26.0, 33.0, 33.0, 28.0, 32.0, 28.0, 15.0, 23.0, 15.0, 8.0, 7.0, 12.0, 9.0, 5.0, 7.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.0185546875, -3.876953125, -3.7353515625, -3.59375, -3.4521484375, -3.310546875, -3.1689453125, -3.02734375, -2.8857421875, -2.744140625, -2.6025390625, -2.4609375, -2.3193359375, -2.177734375, -2.0361328125, -1.89453125, -1.7529296875, -1.611328125, -1.4697265625, -1.328125, -1.1865234375, -1.044921875, -0.9033203125, -0.76171875, -0.6201171875, -0.478515625, -0.3369140625, -0.1953125, -0.0537109375, 0.087890625, 0.2294921875, 0.37109375, 0.5126953125, 0.654296875, 0.7958984375, 0.9375, 1.0791015625, 1.220703125, 1.3623046875, 1.50390625, 1.6455078125, 1.787109375, 1.9287109375, 2.0703125, 2.2119140625, 2.353515625, 2.4951171875, 2.63671875, 2.7783203125, 2.919921875, 3.0615234375, 3.203125, 3.3447265625, 3.486328125, 3.6279296875, 3.76953125, 3.9111328125, 4.052734375, 4.1943359375, 4.3359375, 4.4775390625, 4.619140625, 4.7607421875, 4.90234375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 11.0, 21.0, 25.0, 26.0, 52.0, 61.0, 101.0, 149.0, 215.0, 300.0, 497.0, 772.0, 1112.0, 1815.0, 2851.0, 4455.0, 7497.0, 12290.0, 19990.0, 33657.0, 57655.0, 106570.0, 237350.0, 1328073.0, 122602.0, 64310.0, 37225.0, 22223.0, 13430.0, 8100.0, 4827.0, 3089.0, 1995.0, 1256.0, 800.0, 556.0, 363.0, 273.0, 145.0, 125.0, 82.0, 49.0, 35.0, 29.0, 17.0, 13.0, 8.0, 6.0, 8.0, 4.0, 1.0, 3.0, 3.0], "bins": [-1.3154296875, -1.27685546875, -1.23828125, -1.19970703125, -1.1611328125, -1.12255859375, -1.083984375, -1.04541015625, -1.0068359375, -0.96826171875, -0.9296875, -0.89111328125, -0.8525390625, -0.81396484375, -0.775390625, -0.73681640625, -0.6982421875, -0.65966796875, -0.62109375, -0.58251953125, -0.5439453125, -0.50537109375, -0.466796875, -0.42822265625, -0.3896484375, -0.35107421875, -0.3125, -0.27392578125, -0.2353515625, -0.19677734375, -0.158203125, -0.11962890625, -0.0810546875, -0.04248046875, -0.00390625, 0.03466796875, 0.0732421875, 0.11181640625, 0.150390625, 0.18896484375, 0.2275390625, 0.26611328125, 0.3046875, 0.34326171875, 0.3818359375, 0.42041015625, 0.458984375, 0.49755859375, 0.5361328125, 0.57470703125, 0.61328125, 0.65185546875, 0.6904296875, 0.72900390625, 0.767578125, 0.80615234375, 0.8447265625, 0.88330078125, 0.921875, 0.96044921875, 0.9990234375, 1.03759765625, 1.076171875, 1.11474609375, 1.1533203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 9.0, 11.0, 10.0, 15.0, 20.0, 23.0, 33.0, 44.0, 65.0, 68.0, 93.0, 102.0, 91.0, 81.0, 62.0, 64.0, 53.0, 27.0, 27.0, 27.0, 17.0, 16.0, 8.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00255584716796875, -0.0024900883436203003, -0.0024243295192718506, -0.002358570694923401, -0.002292811870574951, -0.0022270530462265015, -0.0021612942218780518, -0.002095535397529602, -0.0020297765731811523, -0.0019640177488327026, -0.001898258924484253, -0.0018325001001358032, -0.0017667412757873535, -0.0017009824514389038, -0.001635223627090454, -0.0015694648027420044, -0.0015037059783935547, -0.001437947154045105, -0.0013721883296966553, -0.0013064295053482056, -0.0012406706809997559, -0.0011749118566513062, -0.0011091530323028564, -0.0010433942079544067, -0.000977635383605957, -0.0009118765592575073, -0.0008461177349090576, -0.0007803589105606079, -0.0007146000862121582, -0.0006488412618637085, -0.0005830824375152588, -0.0005173236131668091, -0.0004515647888183594, -0.00038580596446990967, -0.00032004714012145996, -0.00025428831577301025, -0.00018852949142456055, -0.00012277066707611084, -5.701184272766113e-05, 8.746981620788574e-06, 7.450580596923828e-05, 0.000140264630317688, 0.0002060234546661377, 0.0002717822790145874, 0.0003375411033630371, 0.0004032999277114868, 0.0004690587520599365, 0.0005348175764083862, 0.0006005764007568359, 0.0006663352251052856, 0.0007320940494537354, 0.0007978528738021851, 0.0008636116981506348, 0.0009293705224990845, 0.0009951293468475342, 0.0010608881711959839, 0.0011266469955444336, 0.0011924058198928833, 0.001258164644241333, 0.0013239234685897827, 0.0013896822929382324, 0.0014554411172866821, 0.0015211999416351318, 0.0015869587659835815, 0.0016527175903320312]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 7.0, 6.0, 4.0, 8.0, 7.0, 12.0, 13.0, 20.0, 36.0, 50.0, 58.0, 85.0, 103.0, 189.0, 312.0, 545.0, 1312.0, 661133.0, 382112.0, 1223.0, 531.0, 280.0, 156.0, 113.0, 59.0, 49.0, 34.0, 27.0, 23.0, 15.0, 11.0, 15.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0285491943359375, -0.027405977249145508, -0.026262760162353516, -0.025119543075561523, -0.02397632598876953, -0.02283310890197754, -0.021689891815185547, -0.020546674728393555, -0.019403457641601562, -0.01826024055480957, -0.017117023468017578, -0.015973806381225586, -0.014830589294433594, -0.013687372207641602, -0.01254415512084961, -0.011400938034057617, -0.010257720947265625, -0.009114503860473633, -0.00797128677368164, -0.0068280696868896484, -0.005684852600097656, -0.004541635513305664, -0.003398418426513672, -0.0022552013397216797, -0.0011119842529296875, 3.123283386230469e-05, 0.0011744499206542969, 0.002317667007446289, 0.0034608840942382812, 0.0046041011810302734, 0.005747318267822266, 0.006890535354614258, 0.00803375244140625, 0.009176969528198242, 0.010320186614990234, 0.011463403701782227, 0.012606620788574219, 0.013749837875366211, 0.014893054962158203, 0.016036272048950195, 0.017179489135742188, 0.01832270622253418, 0.019465923309326172, 0.020609140396118164, 0.021752357482910156, 0.02289557456970215, 0.02403879165649414, 0.025182008743286133, 0.026325225830078125, 0.027468442916870117, 0.02861166000366211, 0.0297548770904541, 0.030898094177246094, 0.032041311264038086, 0.03318452835083008, 0.03432774543762207, 0.03547096252441406, 0.036614179611206055, 0.03775739669799805, 0.03890061378479004, 0.04004383087158203, 0.04118704795837402, 0.042330265045166016, 0.04347348213195801, 0.04461669921875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 27.0, 139.0, 456.0, 330.0, 54.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030125004705041647, -0.0029232713859528303, -0.002834042301401496, -0.002744813449680805, -0.002655584365129471, -0.0025663552805781364, -0.002477126196026802, -0.0023878971114754677, -0.0022986680269241333, -0.002209438942372799, -0.0021202098578214645, -0.00203098077327013, -0.0019417519215494394, -0.001852522836998105, -0.0017632937524467707, -0.0016740646678954363, -0.0015848358161747456, -0.0014956067316234112, -0.0014063777634873986, -0.0013171486789360642, -0.0012279197108000517, -0.0011386906262487173, -0.001049461541697383, -0.0009602325153537095, -0.000871003489010036, -0.0007817744626663625, -0.0006925454363226891, -0.0006033163517713547, -0.0005140873254276812, -0.00042485829908400774, -0.00033562921453267336, -0.0002464001881889999, -0.00015717116184532642, -6.794212094973773e-05, 2.128691994585097e-05, 0.00011051597539335489, 0.00019974500173702836, 0.00028897402808070183, 0.0003782031126320362, 0.0004674321389757097, 0.0005566611653193831, 0.0006458901916630566, 0.0007351192180067301, 0.0008243483025580645, 0.0009135773289017379, 0.0010028063552454114, 0.0010920354397967458, 0.0011812644079327583, 0.0012704934924840927, 0.001359722577035427, 0.0014489515451714396, 0.001538180629722774, 0.0016274095978587866, 0.001716638682410121, 0.0018058677669614553, 0.0018950968515127897, 0.0019843257032334805, 0.002073554787784815, 0.002162783872336149, 0.0022520129568874836, 0.0023412418086081743, 0.0024304708931595087, 0.002519699977710843, 0.0026089290622621775, 0.002698158146813512]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 12.0, 12.0, 13.0, 11.0, 16.0, 16.0, 21.0, 27.0, 22.0, 37.0, 23.0, 36.0, 28.0, 38.0, 38.0, 31.0, 41.0, 37.0, 37.0, 40.0, 36.0, 41.0, 48.0, 46.0, 31.0, 27.0, 42.0, 32.0, 31.0, 17.0, 15.0, 21.0, 14.0, 10.0, 6.0, 7.0, 5.0, 3.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0008577704429626465, -0.0008324626833200455, -0.0008071549236774445, -0.0007818471640348434, -0.0007565394043922424, -0.0007312316447496414, -0.0007059238851070404, -0.0006806161254644394, -0.0006553083658218384, -0.0006300006061792374, -0.0006046928465366364, -0.0005793850868940353, -0.0005540773272514343, -0.0005287695676088333, -0.0005034618079662323, -0.0004781540483236313, -0.0004528462886810303, -0.00042753852903842926, -0.00040223076939582825, -0.00037692300975322723, -0.0003516152501106262, -0.0003263074904680252, -0.0003009997308254242, -0.0002756919711828232, -0.00025038421154022217, -0.00022507645189762115, -0.00019976869225502014, -0.00017446093261241913, -0.00014915317296981812, -0.0001238454133272171, -9.853765368461609e-05, -7.322989404201508e-05, -4.792213439941406e-05, -2.261437475681305e-05, 2.693384885787964e-06, 2.8001144528388977e-05, 5.330890417098999e-05, 7.8616663813591e-05, 0.00010392442345619202, 0.00012923218309879303, 0.00015453994274139404, 0.00017984770238399506, 0.00020515546202659607, 0.00023046322166919708, 0.0002557709813117981, 0.0002810787409543991, 0.0003063865005970001, 0.00033169426023960114, 0.00035700201988220215, 0.00038230977952480316, 0.0004076175391674042, 0.0004329252988100052, 0.0004582330584526062, 0.0004835408180952072, 0.0005088485777378082, 0.0005341563373804092, 0.0005594640970230103, 0.0005847718566656113, 0.0006100796163082123, 0.0006353873759508133, 0.0006606951355934143, 0.0006860028952360153, 0.0007113106548786163, 0.0007366184145212173, 0.0007619261741638184]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 4.0, 4.0, 8.0, 3.0, 6.0, 12.0, 9.0, 8.0, 15.0, 16.0, 16.0, 26.0, 21.0, 21.0, 44.0, 28.0, 27.0, 27.0, 43.0, 49.0, 47.0, 57.0, 37.0, 50.0, 40.0, 39.0, 39.0, 36.0, 28.0, 37.0, 22.0, 33.0, 20.0, 20.0, 26.0, 21.0, 6.0, 13.0, 7.0, 13.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.91015625, -6.70269775390625, -6.4952392578125, -6.28778076171875, -6.080322265625, -5.87286376953125, -5.6654052734375, -5.45794677734375, -5.25048828125, -5.04302978515625, -4.8355712890625, -4.62811279296875, -4.420654296875, -4.21319580078125, -4.0057373046875, -3.79827880859375, -3.5908203125, -3.38336181640625, -3.1759033203125, -2.96844482421875, -2.760986328125, -2.55352783203125, -2.3460693359375, -2.13861083984375, -1.93115234375, -1.72369384765625, -1.5162353515625, -1.30877685546875, -1.101318359375, -0.89385986328125, -0.6864013671875, -0.47894287109375, -0.271484375, -0.06402587890625, 0.1434326171875, 0.35089111328125, 0.558349609375, 0.76580810546875, 0.9732666015625, 1.18072509765625, 1.38818359375, 1.59564208984375, 1.8031005859375, 2.01055908203125, 2.218017578125, 2.42547607421875, 2.6329345703125, 2.84039306640625, 3.0478515625, 3.25531005859375, 3.4627685546875, 3.67022705078125, 3.877685546875, 4.08514404296875, 4.2926025390625, 4.50006103515625, 4.70751953125, 4.91497802734375, 5.1224365234375, 5.32989501953125, 5.537353515625, 5.74481201171875, 5.9522705078125, 6.15972900390625, 6.3671875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 12.0, 12.0, 15.0, 28.0, 20.0, 27.0, 50.0, 59.0, 87.0, 108.0, 164.0, 259.0, 327.0, 544.0, 885.0, 1487.0, 2928.0, 7583.0, 29451.0, 208736.0, 649496.0, 115386.0, 19187.0, 5778.0, 2412.0, 1246.0, 715.0, 455.0, 307.0, 223.0, 162.0, 106.0, 81.0, 60.0, 44.0, 39.0, 21.0, 11.0, 12.0, 8.0, 9.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8359375, -13.3802490234375, -12.924560546875, -12.4688720703125, -12.01318359375, -11.5574951171875, -11.101806640625, -10.6461181640625, -10.1904296875, -9.7347412109375, -9.279052734375, -8.8233642578125, -8.36767578125, -7.9119873046875, -7.456298828125, -7.0006103515625, -6.544921875, -6.0892333984375, -5.633544921875, -5.1778564453125, -4.72216796875, -4.2664794921875, -3.810791015625, -3.3551025390625, -2.8994140625, -2.4437255859375, -1.988037109375, -1.5323486328125, -1.07666015625, -0.6209716796875, -0.165283203125, 0.2904052734375, 0.74609375, 1.2017822265625, 1.657470703125, 2.1131591796875, 2.56884765625, 3.0245361328125, 3.480224609375, 3.9359130859375, 4.3916015625, 4.8472900390625, 5.302978515625, 5.7586669921875, 6.21435546875, 6.6700439453125, 7.125732421875, 7.5814208984375, 8.037109375, 8.4927978515625, 8.948486328125, 9.4041748046875, 9.85986328125, 10.3155517578125, 10.771240234375, 11.2269287109375, 11.6826171875, 12.1383056640625, 12.593994140625, 13.0496826171875, 13.50537109375, 13.9610595703125, 14.416748046875, 14.8724365234375, 15.328125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 4.0, 9.0, 6.0, 11.0, 9.0, 14.0, 21.0, 25.0, 24.0, 25.0, 32.0, 56.0, 61.0, 86.0, 144.0, 297.0, 1500.0, 225.0, 110.0, 60.0, 71.0, 49.0, 37.0, 29.0, 20.0, 17.0, 22.0, 15.0, 12.0, 10.0, 6.0, 15.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-23.875, -23.158203125, -22.44140625, -21.724609375, -21.0078125, -20.291015625, -19.57421875, -18.857421875, -18.140625, -17.423828125, -16.70703125, -15.990234375, -15.2734375, -14.556640625, -13.83984375, -13.123046875, -12.40625, -11.689453125, -10.97265625, -10.255859375, -9.5390625, -8.822265625, -8.10546875, -7.388671875, -6.671875, -5.955078125, -5.23828125, -4.521484375, -3.8046875, -3.087890625, -2.37109375, -1.654296875, -0.9375, -0.220703125, 0.49609375, 1.212890625, 1.9296875, 2.646484375, 3.36328125, 4.080078125, 4.796875, 5.513671875, 6.23046875, 6.947265625, 7.6640625, 8.380859375, 9.09765625, 9.814453125, 10.53125, 11.248046875, 11.96484375, 12.681640625, 13.3984375, 14.115234375, 14.83203125, 15.548828125, 16.265625, 16.982421875, 17.69921875, 18.416015625, 19.1328125, 19.849609375, 20.56640625, 21.283203125, 22.0]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 11.0, 25.0, 21.0, 23.0, 40.0, 46.0, 37.0, 79.0, 122.0, 129.0, 224.0, 369.0, 832.0, 2556.0, 65456.0, 3064877.0, 7854.0, 1533.0, 530.0, 300.0, 166.0, 132.0, 80.0, 47.0, 39.0, 40.0, 30.0, 12.0, 18.0, 12.0, 13.0, 15.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.03125, -48.61328125, -47.1953125, -45.77734375, -44.359375, -42.94140625, -41.5234375, -40.10546875, -38.6875, -37.26953125, -35.8515625, -34.43359375, -33.015625, -31.59765625, -30.1796875, -28.76171875, -27.34375, -25.92578125, -24.5078125, -23.08984375, -21.671875, -20.25390625, -18.8359375, -17.41796875, -16.0, -14.58203125, -13.1640625, -11.74609375, -10.328125, -8.91015625, -7.4921875, -6.07421875, -4.65625, -3.23828125, -1.8203125, -0.40234375, 1.015625, 2.43359375, 3.8515625, 5.26953125, 6.6875, 8.10546875, 9.5234375, 10.94140625, 12.359375, 13.77734375, 15.1953125, 16.61328125, 18.03125, 19.44921875, 20.8671875, 22.28515625, 23.703125, 25.12109375, 26.5390625, 27.95703125, 29.375, 30.79296875, 32.2109375, 33.62890625, 35.046875, 36.46484375, 37.8828125, 39.30078125, 40.71875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 741.0, 269.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.532894134521484, -44.8148193359375, -33.09674835205078, -21.378673553466797, -9.660598754882812, 2.057476043701172, 13.77554702758789, 25.49362564086914, 37.21169662475586, 48.929771423339844, 60.64784240722656, 72.36592102050781, 84.08399200439453, 95.80206298828125, 107.5201416015625, 119.23822021484375, 130.95628356933594, 142.6743621826172, 154.39242553710938, 166.11050415039062, 177.82858276367188, 189.54666137695312, 201.2647247314453, 212.98280334472656, 224.7008819580078, 236.41896057128906, 248.13702392578125, 259.8551025390625, 271.57318115234375, 283.291259765625, 295.00933837890625, 306.7274169921875, 318.4454650878906, 330.1635437011719, 341.8816223144531, 353.59967041015625, 365.3177490234375, 377.03582763671875, 388.75390625, 400.47198486328125, 412.1900634765625, 423.90814208984375, 435.626220703125, 447.34429931640625, 459.0623474121094, 470.7804260253906, 482.4985046386719, 494.2165832519531, 505.93463134765625, 517.6527099609375, 529.3707885742188, 541.0888671875, 552.8069458007812, 564.5250244140625, 576.2430419921875, 587.961181640625, 599.6792602539062, 611.3973388671875, 623.1154174804688, 634.83349609375, 646.5515747070312, 658.2696533203125, 669.9876708984375, 681.705810546875, 693.423828125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 12.0, 5.0, 7.0, 5.0, 14.0, 15.0, 21.0, 21.0, 19.0, 24.0, 25.0, 46.0, 16.0, 37.0, 39.0, 50.0, 69.0, 36.0, 37.0, 34.0, 47.0, 38.0, 51.0, 41.0, 38.0, 30.0, 27.0, 29.0, 27.0, 21.0, 18.0, 16.0, 12.0, 17.0, 16.0, 8.0, 12.0, 8.0, 4.0, 3.0, 2.0, 6.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.21110534667969, -43.72639465332031, -42.24168014526367, -40.7569694519043, -39.27225875854492, -37.78754425048828, -36.302833557128906, -34.81812286376953, -33.333412170410156, -31.84869956970215, -30.363988876342773, -28.879276275634766, -27.39456558227539, -25.909852981567383, -24.425140380859375, -22.9404296875, -21.45571517944336, -19.97100257873535, -18.486291885375977, -17.00157928466797, -15.516867637634277, -14.032155990600586, -12.547443389892578, -11.062731742858887, -9.578020095825195, -8.093308448791504, -6.608596324920654, -5.123884201049805, -3.6391725540161133, -2.154460906982422, -0.6697483062744141, 0.8149633407592773, 2.2996749877929688, 3.7843868732452393, 5.26909875869751, 6.753810882568359, 8.23852252960205, 9.723234176635742, 11.20794677734375, 12.692658424377441, 14.177370071411133, 15.662081718444824, 17.146793365478516, 18.631505966186523, 20.11621856689453, 21.600929260253906, 23.085641860961914, 24.570354461669922, 26.055065155029297, 27.539777755737305, 29.02448844909668, 30.509201049804688, 31.993911743164062, 33.47862243652344, 34.96333694458008, 36.44804763793945, 37.932762145996094, 39.41747283935547, 40.90218734741211, 42.386898040771484, 43.87160873413086, 45.3563232421875, 46.841033935546875, 48.32574462890625, 49.810455322265625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 6.0, 8.0, 6.0, 8.0, 10.0, 10.0, 26.0, 18.0, 15.0, 20.0, 29.0, 35.0, 38.0, 44.0, 46.0, 48.0, 44.0, 46.0, 60.0, 45.0, 49.0, 43.0, 44.0, 35.0, 45.0, 32.0, 27.0, 24.0, 29.0, 24.0, 13.0, 19.0, 17.0, 11.0, 9.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.52215576171875, -9.2552490234375, -8.98834228515625, -8.721435546875, -8.45452880859375, -8.1876220703125, -7.92071533203125, -7.65380859375, -7.38690185546875, -7.1199951171875, -6.85308837890625, -6.586181640625, -6.31927490234375, -6.0523681640625, -5.78546142578125, -5.5185546875, -5.25164794921875, -4.9847412109375, -4.71783447265625, -4.450927734375, -4.18402099609375, -3.9171142578125, -3.65020751953125, -3.38330078125, -3.11639404296875, -2.8494873046875, -2.58258056640625, -2.315673828125, -2.04876708984375, -1.7818603515625, -1.51495361328125, -1.248046875, -0.98114013671875, -0.7142333984375, -0.44732666015625, -0.180419921875, 0.08648681640625, 0.3533935546875, 0.62030029296875, 0.88720703125, 1.15411376953125, 1.4210205078125, 1.68792724609375, 1.954833984375, 2.22174072265625, 2.4886474609375, 2.75555419921875, 3.0224609375, 3.28936767578125, 3.5562744140625, 3.82318115234375, 4.090087890625, 4.35699462890625, 4.6239013671875, 4.89080810546875, 5.15771484375, 5.42462158203125, 5.6915283203125, 5.95843505859375, 6.225341796875, 6.49224853515625, 6.7591552734375, 7.02606201171875, 7.29296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 7.0, 9.0, 17.0, 7.0, 28.0, 23.0, 24.0, 50.0, 56.0, 81.0, 113.0, 168.0, 231.0, 392.0, 580.0, 963.0, 2230.0, 12481.0, 1253060.0, 2888677.0, 29017.0, 2911.0, 1151.0, 660.0, 425.0, 237.0, 205.0, 144.0, 100.0, 63.0, 45.0, 32.0, 26.0, 23.0, 6.0, 13.0, 7.0, 13.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-53.5, -52.0966796875, -50.693359375, -49.2900390625, -47.88671875, -46.4833984375, -45.080078125, -43.6767578125, -42.2734375, -40.8701171875, -39.466796875, -38.0634765625, -36.66015625, -35.2568359375, -33.853515625, -32.4501953125, -31.046875, -29.6435546875, -28.240234375, -26.8369140625, -25.43359375, -24.0302734375, -22.626953125, -21.2236328125, -19.8203125, -18.4169921875, -17.013671875, -15.6103515625, -14.20703125, -12.8037109375, -11.400390625, -9.9970703125, -8.59375, -7.1904296875, -5.787109375, -4.3837890625, -2.98046875, -1.5771484375, -0.173828125, 1.2294921875, 2.6328125, 4.0361328125, 5.439453125, 6.8427734375, 8.24609375, 9.6494140625, 11.052734375, 12.4560546875, 13.859375, 15.2626953125, 16.666015625, 18.0693359375, 19.47265625, 20.8759765625, 22.279296875, 23.6826171875, 25.0859375, 26.4892578125, 27.892578125, 29.2958984375, 30.69921875, 32.1025390625, 33.505859375, 34.9091796875, 36.3125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 10.0, 14.0, 32.0, 57.0, 112.0, 236.0, 552.0, 907.0, 979.0, 607.0, 314.0, 129.0, 57.0, 32.0, 12.0, 7.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.328125, -30.43603515625, -29.5439453125, -28.65185546875, -27.759765625, -26.86767578125, -25.9755859375, -25.08349609375, -24.19140625, -23.29931640625, -22.4072265625, -21.51513671875, -20.623046875, -19.73095703125, -18.8388671875, -17.94677734375, -17.0546875, -16.16259765625, -15.2705078125, -14.37841796875, -13.486328125, -12.59423828125, -11.7021484375, -10.81005859375, -9.91796875, -9.02587890625, -8.1337890625, -7.24169921875, -6.349609375, -5.45751953125, -4.5654296875, -3.67333984375, -2.78125, -1.88916015625, -0.9970703125, -0.10498046875, 0.787109375, 1.67919921875, 2.5712890625, 3.46337890625, 4.35546875, 5.24755859375, 6.1396484375, 7.03173828125, 7.923828125, 8.81591796875, 9.7080078125, 10.60009765625, 11.4921875, 12.38427734375, 13.2763671875, 14.16845703125, 15.060546875, 15.95263671875, 16.8447265625, 17.73681640625, 18.62890625, 19.52099609375, 20.4130859375, 21.30517578125, 22.197265625, 23.08935546875, 23.9814453125, 24.87353515625, 25.765625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 13.0, 20.0, 31.0, 56.0, 123.0, 229.0, 473.0, 1232.0, 3946.0, 30324.0, 1776335.0, 2336628.0, 38189.0, 4286.0, 1374.0, 536.0, 237.0, 99.0, 51.0, 37.0, 15.0, 10.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.8125, -35.8447265625, -34.876953125, -33.9091796875, -32.94140625, -31.9736328125, -31.005859375, -30.0380859375, -29.0703125, -28.1025390625, -27.134765625, -26.1669921875, -25.19921875, -24.2314453125, -23.263671875, -22.2958984375, -21.328125, -20.3603515625, -19.392578125, -18.4248046875, -17.45703125, -16.4892578125, -15.521484375, -14.5537109375, -13.5859375, -12.6181640625, -11.650390625, -10.6826171875, -9.71484375, -8.7470703125, -7.779296875, -6.8115234375, -5.84375, -4.8759765625, -3.908203125, -2.9404296875, -1.97265625, -1.0048828125, -0.037109375, 0.9306640625, 1.8984375, 2.8662109375, 3.833984375, 4.8017578125, 5.76953125, 6.7373046875, 7.705078125, 8.6728515625, 9.640625, 10.6083984375, 11.576171875, 12.5439453125, 13.51171875, 14.4794921875, 15.447265625, 16.4150390625, 17.3828125, 18.3505859375, 19.318359375, 20.2861328125, 21.25390625, 22.2216796875, 23.189453125, 24.1572265625, 25.125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 9.0, 9.0, 15.0, 17.0, 21.0, 27.0, 39.0, 30.0, 42.0, 56.0, 42.0, 50.0, 50.0, 58.0, 66.0, 67.0, 53.0, 52.0, 50.0, 42.0, 30.0, 24.0, 25.0, 25.0, 22.0, 24.0, 11.0, 12.0, 6.0, 7.0, 2.0, 6.0, 2.0, 3.0], "bins": [-77.31253814697266, -75.52256774902344, -73.73259735107422, -71.942626953125, -70.15265655517578, -68.36268615722656, -66.57271575927734, -64.78274536132812, -62.992774963378906, -61.20280456542969, -59.41283416748047, -57.62286376953125, -55.83289337158203, -54.04292297363281, -52.252952575683594, -50.462982177734375, -48.67301559448242, -46.8830451965332, -45.093074798583984, -43.303104400634766, -41.51313400268555, -39.72316360473633, -37.933197021484375, -36.143226623535156, -34.35325622558594, -32.56328582763672, -30.7733154296875, -28.98334503173828, -27.193374633789062, -25.403404235839844, -23.613435745239258, -21.82346534729004, -20.033496856689453, -18.243526458740234, -16.453556060791016, -14.663586616516113, -12.873616218566895, -11.083645820617676, -9.293676376342773, -7.503705978393555, -5.713735580444336, -3.9237654209136963, -2.1337952613830566, -0.3438253402709961, 1.4461450576782227, 3.2361154556274414, 5.026084899902344, 6.8160552978515625, 8.606025695800781, 10.39599609375, 12.185966491699219, 13.975935935974121, 15.76590633392334, 17.555877685546875, 19.34584617614746, 21.13581657409668, 22.9257869720459, 24.715757369995117, 26.505727767944336, 28.295696258544922, 30.08566665649414, 31.87563705444336, 33.66560745239258, 35.4555778503418, 37.245548248291016]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 6.0, 12.0, 11.0, 15.0, 14.0, 14.0, 25.0, 32.0, 28.0, 25.0, 34.0, 40.0, 55.0, 39.0, 42.0, 53.0, 56.0, 45.0, 40.0, 46.0, 38.0, 41.0, 35.0, 27.0, 32.0, 28.0, 21.0, 23.0, 29.0, 12.0, 17.0, 13.0, 9.0, 12.0, 6.0, 4.0, 7.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.723941802978516, -39.10563659667969, -37.48733139038086, -35.86902618408203, -34.2507209777832, -32.632415771484375, -31.01411247253418, -29.39580726623535, -27.777502059936523, -26.159196853637695, -24.540891647338867, -22.922588348388672, -21.304283142089844, -19.685977935791016, -18.067672729492188, -16.44936752319336, -14.831062316894531, -13.212757110595703, -11.594451904296875, -9.976147651672363, -8.357842445373535, -6.739537239074707, -5.121232986450195, -3.502927780151367, -1.884622573852539, -0.26631760597229004, 1.351987361907959, 2.970292091369629, 4.588597297668457, 6.206902503967285, 7.825206756591797, 9.443511962890625, 11.061820983886719, 12.680126190185547, 14.298431396484375, 15.916735649108887, 17.53504180908203, 19.15334701538086, 20.771650314331055, 22.389955520629883, 24.00826072692871, 25.62656593322754, 27.244871139526367, 28.863174438476562, 30.48147964477539, 32.09978485107422, 33.71809005737305, 35.336395263671875, 36.9547004699707, 38.57300567626953, 40.19131088256836, 41.80961608886719, 43.427921295166016, 45.046226501464844, 46.664527893066406, 48.2828369140625, 49.90113830566406, 51.51944351196289, 53.13774871826172, 54.75605392456055, 56.374359130859375, 57.9926643371582, 59.61096954345703, 61.229270935058594, 62.84757995605469]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 7.0, 11.0, 22.0, 25.0, 17.0, 25.0, 26.0, 32.0, 24.0, 45.0, 39.0, 52.0, 44.0, 40.0, 64.0, 50.0, 53.0, 47.0, 40.0, 35.0, 37.0, 31.0, 29.0, 33.0, 23.0, 20.0, 18.0, 19.0, 14.0, 14.0, 15.0, 8.0, 9.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.4375, -78.5595703125, -75.681640625, -72.8037109375, -69.92578125, -67.0478515625, -64.169921875, -61.2919921875, -58.4140625, -55.5361328125, -52.658203125, -49.7802734375, -46.90234375, -44.0244140625, -41.146484375, -38.2685546875, -35.390625, -32.5126953125, -29.634765625, -26.7568359375, -23.87890625, -21.0009765625, -18.123046875, -15.2451171875, -12.3671875, -9.4892578125, -6.611328125, -3.7333984375, -0.85546875, 2.0224609375, 4.900390625, 7.7783203125, 10.65625, 13.5341796875, 16.412109375, 19.2900390625, 22.16796875, 25.0458984375, 27.923828125, 30.8017578125, 33.6796875, 36.5576171875, 39.435546875, 42.3134765625, 45.19140625, 48.0693359375, 50.947265625, 53.8251953125, 56.703125, 59.5810546875, 62.458984375, 65.3369140625, 68.21484375, 71.0927734375, 73.970703125, 76.8486328125, 79.7265625, 82.6044921875, 85.482421875, 88.3603515625, 91.23828125, 94.1162109375, 96.994140625, 99.8720703125, 102.75]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 8.0, 13.0, 44.0, 55.0, 75.0, 107.0, 175.0, 248.0, 386.0, 601.0, 979.0, 1576.0, 2518.0, 4034.0, 6635.0, 10675.0, 17394.0, 28494.0, 49090.0, 86957.0, 167322.0, 279392.0, 173430.0, 91271.0, 50826.0, 29746.0, 17885.0, 10775.0, 6709.0, 4095.0, 2638.0, 1609.0, 997.0, 644.0, 406.0, 231.0, 182.0, 96.0, 76.0, 46.0, 22.0, 27.0, 21.0, 12.0, 5.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1171875, -13.65478515625, -13.1923828125, -12.72998046875, -12.267578125, -11.80517578125, -11.3427734375, -10.88037109375, -10.41796875, -9.95556640625, -9.4931640625, -9.03076171875, -8.568359375, -8.10595703125, -7.6435546875, -7.18115234375, -6.71875, -6.25634765625, -5.7939453125, -5.33154296875, -4.869140625, -4.40673828125, -3.9443359375, -3.48193359375, -3.01953125, -2.55712890625, -2.0947265625, -1.63232421875, -1.169921875, -0.70751953125, -0.2451171875, 0.21728515625, 0.6796875, 1.14208984375, 1.6044921875, 2.06689453125, 2.529296875, 2.99169921875, 3.4541015625, 3.91650390625, 4.37890625, 4.84130859375, 5.3037109375, 5.76611328125, 6.228515625, 6.69091796875, 7.1533203125, 7.61572265625, 8.078125, 8.54052734375, 9.0029296875, 9.46533203125, 9.927734375, 10.39013671875, 10.8525390625, 11.31494140625, 11.77734375, 12.23974609375, 12.7021484375, 13.16455078125, 13.626953125, 14.08935546875, 14.5517578125, 15.01416015625, 15.4765625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 6.0, 4.0, 7.0, 2.0, 6.0, 7.0, 14.0, 15.0, 16.0, 27.0, 19.0, 22.0, 23.0, 29.0, 28.0, 35.0, 31.0, 41.0, 41.0, 41.0, 40.0, 1078.0, 45.0, 44.0, 36.0, 42.0, 46.0, 36.0, 32.0, 28.0, 26.0, 18.0, 22.0, 33.0, 29.0, 16.0, 10.0, 5.0, 10.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.25, -55.443359375, -53.63671875, -51.830078125, -50.0234375, -48.216796875, -46.41015625, -44.603515625, -42.796875, -40.990234375, -39.18359375, -37.376953125, -35.5703125, -33.763671875, -31.95703125, -30.150390625, -28.34375, -26.537109375, -24.73046875, -22.923828125, -21.1171875, -19.310546875, -17.50390625, -15.697265625, -13.890625, -12.083984375, -10.27734375, -8.470703125, -6.6640625, -4.857421875, -3.05078125, -1.244140625, 0.5625, 2.369140625, 4.17578125, 5.982421875, 7.7890625, 9.595703125, 11.40234375, 13.208984375, 15.015625, 16.822265625, 18.62890625, 20.435546875, 22.2421875, 24.048828125, 25.85546875, 27.662109375, 29.46875, 31.275390625, 33.08203125, 34.888671875, 36.6953125, 38.501953125, 40.30859375, 42.115234375, 43.921875, 45.728515625, 47.53515625, 49.341796875, 51.1484375, 52.955078125, 54.76171875, 56.568359375, 58.375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 8.0, 15.0, 20.0, 39.0, 36.0, 59.0, 80.0, 132.0, 166.0, 265.0, 382.0, 554.0, 818.0, 1219.0, 1750.0, 2831.0, 4443.0, 6825.0, 10979.0, 17290.0, 27829.0, 46087.0, 80279.0, 151637.0, 1322181.0, 184133.0, 95977.0, 54250.0, 32175.0, 19898.0, 12357.0, 7814.0, 5014.0, 3246.0, 2074.0, 1331.0, 947.0, 601.0, 460.0, 319.0, 192.0, 113.0, 83.0, 73.0, 49.0, 32.0, 21.0, 14.0, 11.0, 8.0, 4.0, 0.0, 5.0, 3.0, 2.0, 1.0], "bins": [-15.0546875, -14.593505859375, -14.13232421875, -13.671142578125, -13.2099609375, -12.748779296875, -12.28759765625, -11.826416015625, -11.365234375, -10.904052734375, -10.44287109375, -9.981689453125, -9.5205078125, -9.059326171875, -8.59814453125, -8.136962890625, -7.67578125, -7.214599609375, -6.75341796875, -6.292236328125, -5.8310546875, -5.369873046875, -4.90869140625, -4.447509765625, -3.986328125, -3.525146484375, -3.06396484375, -2.602783203125, -2.1416015625, -1.680419921875, -1.21923828125, -0.758056640625, -0.296875, 0.164306640625, 0.62548828125, 1.086669921875, 1.5478515625, 2.009033203125, 2.47021484375, 2.931396484375, 3.392578125, 3.853759765625, 4.31494140625, 4.776123046875, 5.2373046875, 5.698486328125, 6.15966796875, 6.620849609375, 7.08203125, 7.543212890625, 8.00439453125, 8.465576171875, 8.9267578125, 9.387939453125, 9.84912109375, 10.310302734375, 10.771484375, 11.232666015625, 11.69384765625, 12.155029296875, 12.6162109375, 13.077392578125, 13.53857421875, 13.999755859375, 14.4609375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 5.0, 7.0, 14.0, 14.0, 23.0, 18.0, 23.0, 27.0, 50.0, 50.0, 51.0, 83.0, 72.0, 103.0, 77.0, 80.0, 56.0, 46.0, 34.0, 32.0, 27.0, 18.0, 12.0, 9.0, 13.0, 4.0, 10.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03900146484375, -0.03766012191772461, -0.03631877899169922, -0.03497743606567383, -0.03363609313964844, -0.03229475021362305, -0.030953407287597656, -0.029612064361572266, -0.028270721435546875, -0.026929378509521484, -0.025588035583496094, -0.024246692657470703, -0.022905349731445312, -0.021564006805419922, -0.02022266387939453, -0.01888132095336914, -0.01753997802734375, -0.01619863510131836, -0.014857292175292969, -0.013515949249267578, -0.012174606323242188, -0.010833263397216797, -0.009491920471191406, -0.008150577545166016, -0.006809234619140625, -0.005467891693115234, -0.004126548767089844, -0.002785205841064453, -0.0014438629150390625, -0.00010251998901367188, 0.0012388229370117188, 0.0025801658630371094, 0.0039215087890625, 0.005262851715087891, 0.006604194641113281, 0.007945537567138672, 0.009286880493164062, 0.010628223419189453, 0.011969566345214844, 0.013310909271240234, 0.014652252197265625, 0.015993595123291016, 0.017334938049316406, 0.018676280975341797, 0.020017623901367188, 0.021358966827392578, 0.02270030975341797, 0.02404165267944336, 0.02538299560546875, 0.02672433853149414, 0.02806568145751953, 0.029407024383544922, 0.030748367309570312, 0.0320897102355957, 0.033431053161621094, 0.034772396087646484, 0.036113739013671875, 0.037455081939697266, 0.038796424865722656, 0.04013776779174805, 0.04147911071777344, 0.04282045364379883, 0.04416179656982422, 0.04550313949584961, 0.046844482421875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 10.0, 8.0, 13.0, 12.0, 10.0, 28.0, 36.0, 43.0, 65.0, 84.0, 114.0, 164.0, 310.0, 486.0, 854.0, 1817.0, 4473.0, 15813.0, 91870.0, 612723.0, 270868.0, 35097.0, 7928.0, 2607.0, 1298.0, 653.0, 368.0, 238.0, 165.0, 95.0, 68.0, 49.0, 36.0, 37.0, 21.0, 19.0, 13.0, 14.0, 15.0, 2.0, 4.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23337173461914062, -0.22602081298828125, -0.21866989135742188, -0.2113189697265625, -0.20396804809570312, -0.19661712646484375, -0.18926620483398438, -0.181915283203125, -0.17456436157226562, -0.16721343994140625, -0.15986251831054688, -0.1525115966796875, -0.14516067504882812, -0.13780975341796875, -0.13045883178710938, -0.12310791015625, -0.11575698852539062, -0.10840606689453125, -0.10105514526367188, -0.0937042236328125, -0.08635330200195312, -0.07900238037109375, -0.07165145874023438, -0.064300537109375, -0.056949615478515625, -0.04959869384765625, -0.042247772216796875, -0.0348968505859375, -0.027545928955078125, -0.02019500732421875, -0.012844085693359375, -0.0054931640625, 0.001857757568359375, 0.00920867919921875, 0.016559600830078125, 0.0239105224609375, 0.031261444091796875, 0.03861236572265625, 0.045963287353515625, 0.053314208984375, 0.060665130615234375, 0.06801605224609375, 0.07536697387695312, 0.0827178955078125, 0.09006881713867188, 0.09741973876953125, 0.10477066040039062, 0.11212158203125, 0.11947250366210938, 0.12682342529296875, 0.13417434692382812, 0.1415252685546875, 0.14887619018554688, 0.15622711181640625, 0.16357803344726562, 0.170928955078125, 0.17827987670898438, 0.18563079833984375, 0.19298171997070312, 0.2003326416015625, 0.20768356323242188, 0.21503448486328125, 0.22238540649414062, 0.229736328125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 18.0, 36.0, 92.0, 179.0, 266.0, 207.0, 116.0, 44.0, 18.0, 11.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08062899857759476, -0.07869229465723038, -0.0767555981874466, -0.07481889426708221, -0.07288219779729843, -0.07094549387693405, -0.06900879740715027, -0.06707209348678589, -0.06513538956642151, -0.06319868564605713, -0.061261989176273346, -0.059325288981199265, -0.05738858878612518, -0.0554518848657608, -0.05351518467068672, -0.05157848447561264, -0.04964178800582886, -0.047705087810754776, -0.045768387615680695, -0.04383168742060661, -0.04189498722553253, -0.03995828330516815, -0.03802158311009407, -0.03608488291501999, -0.03414818271994591, -0.032211482524871826, -0.030274782329797745, -0.028338080272078514, -0.026401380077004433, -0.02446467988193035, -0.02252797782421112, -0.02059127762913704, -0.01865457370877266, -0.016717873513698578, -0.014781172387301922, -0.012844471260905266, -0.010907771065831184, -0.008971070870757103, -0.007034369744360447, -0.005097668617963791, -0.0031609684228897095, -0.0012242677621543407, 0.000712432898581028, 0.0026491335593163967, 0.0045858342200517654, 0.006522534415125847, 0.008459235541522503, 0.010395936667919159, 0.01233263686299324, 0.014269337058067322, 0.016206037253141403, 0.018142739310860634, 0.020079439505934715, 0.022016139701008797, 0.023952841758728027, 0.02588954195380211, 0.02782624214887619, 0.02976294234395027, 0.03169964253902435, 0.033636342734098434, 0.035573042929172516, 0.037509746849536896, 0.03944644704461098, 0.04138314723968506, 0.04331984743475914]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 7.0, 4.0, 4.0, 7.0, 9.0, 7.0, 13.0, 10.0, 12.0, 21.0, 12.0, 20.0, 20.0, 23.0, 27.0, 27.0, 19.0, 29.0, 32.0, 31.0, 42.0, 45.0, 39.0, 44.0, 42.0, 39.0, 34.0, 43.0, 39.0, 40.0, 33.0, 27.0, 26.0, 30.0, 31.0, 19.0, 17.0, 15.0, 15.0, 8.0, 13.0, 7.0, 8.0, 11.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.019526362419128418, -0.01888122223317623, -0.018236082047224045, -0.017590941861271858, -0.01694580167531967, -0.016300661489367485, -0.0156555213034153, -0.015010381117463112, -0.014365240931510925, -0.013720100745558739, -0.013074960559606552, -0.012429820373654366, -0.011784680187702179, -0.011139540001749992, -0.010494399815797806, -0.00984925962984562, -0.009204119443893433, -0.008558979257941246, -0.00791383907198906, -0.007268698886036873, -0.006623558700084686, -0.0059784185141325, -0.005333278328180313, -0.0046881381422281265, -0.00404299795627594, -0.0033978577703237534, -0.0027527175843715668, -0.00210757739841938, -0.0014624372124671936, -0.000817297026515007, -0.00017215684056282043, 0.00047298334538936615, 0.0011181235313415527, 0.0017632637172937393, 0.002408403903245926, 0.0030535440891981125, 0.003698684275150299, 0.004343824461102486, 0.004988964647054672, 0.005634104833006859, 0.006279245018959045, 0.006924385204911232, 0.007569525390863419, 0.008214665576815605, 0.008859805762767792, 0.009504945948719978, 0.010150086134672165, 0.010795226320624352, 0.011440366506576538, 0.012085506692528725, 0.012730646878480911, 0.013375787064433098, 0.014020927250385284, 0.014666067436337471, 0.015311207622289658, 0.015956347808241844, 0.01660148799419403, 0.017246628180146217, 0.017891768366098404, 0.01853690855205059, 0.019182048738002777, 0.019827188923954964, 0.02047232910990715, 0.021117469295859337, 0.021762609481811523]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 8.0, 10.0, 22.0, 27.0, 16.0, 24.0, 26.0, 35.0, 21.0, 45.0, 40.0, 53.0, 42.0, 42.0, 63.0, 52.0, 52.0, 46.0, 40.0, 35.0, 37.0, 30.0, 30.0, 32.0, 24.0, 19.0, 18.0, 21.0, 12.0, 14.0, 16.0, 7.0, 9.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.3125, -78.4365234375, -75.560546875, -72.6845703125, -69.80859375, -66.9326171875, -64.056640625, -61.1806640625, -58.3046875, -55.4287109375, -52.552734375, -49.6767578125, -46.80078125, -43.9248046875, -41.048828125, -38.1728515625, -35.296875, -32.4208984375, -29.544921875, -26.6689453125, -23.79296875, -20.9169921875, -18.041015625, -15.1650390625, -12.2890625, -9.4130859375, -6.537109375, -3.6611328125, -0.78515625, 2.0908203125, 4.966796875, 7.8427734375, 10.71875, 13.5947265625, 16.470703125, 19.3466796875, 22.22265625, 25.0986328125, 27.974609375, 30.8505859375, 33.7265625, 36.6025390625, 39.478515625, 42.3544921875, 45.23046875, 48.1064453125, 50.982421875, 53.8583984375, 56.734375, 59.6103515625, 62.486328125, 65.3623046875, 68.23828125, 71.1142578125, 73.990234375, 76.8662109375, 79.7421875, 82.6181640625, 85.494140625, 88.3701171875, 91.24609375, 94.1220703125, 96.998046875, 99.8740234375, 102.75]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 6.0, 18.0, 21.0, 37.0, 43.0, 58.0, 102.0, 121.0, 219.0, 312.0, 602.0, 1115.0, 2131.0, 4909.0, 13976.0, 56643.0, 268684.0, 505870.0, 146256.0, 31405.0, 8783.0, 3478.0, 1589.0, 837.0, 479.0, 267.0, 194.0, 111.0, 66.0, 53.0, 42.0, 28.0, 26.0, 16.0, 11.0, 8.0, 11.0, 4.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.546875, -13.011474609375, -12.47607421875, -11.940673828125, -11.4052734375, -10.869873046875, -10.33447265625, -9.799072265625, -9.263671875, -8.728271484375, -8.19287109375, -7.657470703125, -7.1220703125, -6.586669921875, -6.05126953125, -5.515869140625, -4.98046875, -4.445068359375, -3.90966796875, -3.374267578125, -2.8388671875, -2.303466796875, -1.76806640625, -1.232666015625, -0.697265625, -0.161865234375, 0.37353515625, 0.908935546875, 1.4443359375, 1.979736328125, 2.51513671875, 3.050537109375, 3.5859375, 4.121337890625, 4.65673828125, 5.192138671875, 5.7275390625, 6.262939453125, 6.79833984375, 7.333740234375, 7.869140625, 8.404541015625, 8.93994140625, 9.475341796875, 10.0107421875, 10.546142578125, 11.08154296875, 11.616943359375, 12.15234375, 12.687744140625, 13.22314453125, 13.758544921875, 14.2939453125, 14.829345703125, 15.36474609375, 15.900146484375, 16.435546875, 16.970947265625, 17.50634765625, 18.041748046875, 18.5771484375, 19.112548828125, 19.64794921875, 20.183349609375, 20.71875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 7.0, 2.0, 3.0, 5.0, 9.0, 14.0, 12.0, 20.0, 38.0, 25.0, 22.0, 36.0, 27.0, 35.0, 52.0, 41.0, 51.0, 41.0, 42.0, 1913.0, 214.0, 56.0, 47.0, 35.0, 25.0, 26.0, 38.0, 33.0, 31.0, 18.0, 22.0, 13.0, 18.0, 11.0, 13.0, 7.0, 8.0, 10.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0], "bins": [-144.0, -140.0947265625, -136.189453125, -132.2841796875, -128.37890625, -124.4736328125, -120.568359375, -116.6630859375, -112.7578125, -108.8525390625, -104.947265625, -101.0419921875, -97.13671875, -93.2314453125, -89.326171875, -85.4208984375, -81.515625, -77.6103515625, -73.705078125, -69.7998046875, -65.89453125, -61.9892578125, -58.083984375, -54.1787109375, -50.2734375, -46.3681640625, -42.462890625, -38.5576171875, -34.65234375, -30.7470703125, -26.841796875, -22.9365234375, -19.03125, -15.1259765625, -11.220703125, -7.3154296875, -3.41015625, 0.4951171875, 4.400390625, 8.3056640625, 12.2109375, 16.1162109375, 20.021484375, 23.9267578125, 27.83203125, 31.7373046875, 35.642578125, 39.5478515625, 43.453125, 47.3583984375, 51.263671875, 55.1689453125, 59.07421875, 62.9794921875, 66.884765625, 70.7900390625, 74.6953125, 78.6005859375, 82.505859375, 86.4111328125, 90.31640625, 94.2216796875, 98.126953125, 102.0322265625, 105.9375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 2.0, 3.0, 6.0, 10.0, 13.0, 16.0, 28.0, 47.0, 59.0, 63.0, 99.0, 124.0, 179.0, 244.0, 374.0, 560.0, 900.0, 1813.0, 5106.0, 27607.0, 253294.0, 2732022.0, 103113.0, 12984.0, 3238.0, 1323.0, 776.0, 500.0, 336.0, 241.0, 164.0, 103.0, 90.0, 64.0, 52.0, 33.0, 27.0, 23.0, 20.0, 12.0, 11.0, 7.0, 4.0, 3.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.734375, -23.96875, -23.203125, -22.4375, -21.671875, -20.90625, -20.140625, -19.375, -18.609375, -17.84375, -17.078125, -16.3125, -15.546875, -14.78125, -14.015625, -13.25, -12.484375, -11.71875, -10.953125, -10.1875, -9.421875, -8.65625, -7.890625, -7.125, -6.359375, -5.59375, -4.828125, -4.0625, -3.296875, -2.53125, -1.765625, -1.0, -0.234375, 0.53125, 1.296875, 2.0625, 2.828125, 3.59375, 4.359375, 5.125, 5.890625, 6.65625, 7.421875, 8.1875, 8.953125, 9.71875, 10.484375, 11.25, 12.015625, 12.78125, 13.546875, 14.3125, 15.078125, 15.84375, 16.609375, 17.375, 18.140625, 18.90625, 19.671875, 20.4375, 21.203125, 21.96875, 22.734375, 23.5, 24.265625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 5.0, 29.0, 72.0, 164.0, 246.0, 237.0, 112.0, 56.0, 29.0, 11.0, 13.0, 3.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-178.3229217529297, -167.10427856445312, -155.8856201171875, -144.66697692871094, -133.44833374023438, -122.22969055175781, -111.01103973388672, -99.79238891601562, -88.57374572753906, -77.3551025390625, -66.1364517211914, -54.91780471801758, -43.69915771484375, -32.48051071166992, -21.261863708496094, -10.043212890625, 1.1754302978515625, 12.39407730102539, 23.61272430419922, 34.83137130737305, 46.050018310546875, 57.2686653137207, 68.48731231689453, 79.70596313476562, 90.92460632324219, 102.14324951171875, 113.36190032958984, 124.58055114746094, 135.7991943359375, 147.01783752441406, 158.23648071289062, 169.45513916015625, 180.67376708984375, 191.8924102783203, 203.11105346679688, 214.3297119140625, 225.54835510253906, 236.76699829101562, 247.98565673828125, 259.20428466796875, 270.4229431152344, 281.6416015625, 292.8602294921875, 304.0788879394531, 315.29754638671875, 326.51617431640625, 337.7348327636719, 348.9534912109375, 360.172119140625, 371.3907775878906, 382.6094055175781, 393.82806396484375, 405.04669189453125, 416.2653503417969, 427.4840087890625, 438.70263671875, 449.9212951660156, 461.13995361328125, 472.35858154296875, 483.5772399902344, 494.7958984375, 506.0145263671875, 517.233154296875, 528.4518432617188, 539.6704711914062]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 8.0, 8.0, 5.0, 8.0, 10.0, 7.0, 12.0, 13.0, 16.0, 18.0, 23.0, 28.0, 21.0, 36.0, 27.0, 45.0, 47.0, 46.0, 45.0, 43.0, 56.0, 36.0, 43.0, 49.0, 41.0, 35.0, 45.0, 26.0, 38.0, 27.0, 24.0, 21.0, 20.0, 13.0, 9.0, 12.0, 3.0, 6.0, 8.0, 8.0, 9.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-181.45619201660156, -176.06277465820312, -170.66934204101562, -165.2759246826172, -159.88250732421875, -154.4890899658203, -149.0956573486328, -143.70223999023438, -138.30882263183594, -132.9154052734375, -127.52198028564453, -122.12855529785156, -116.73513793945312, -111.34171295166016, -105.94828796386719, -100.55487060546875, -95.16144561767578, -89.76802062988281, -84.37460327148438, -78.9811782836914, -73.58776092529297, -68.1943359375, -62.8009147644043, -57.407493591308594, -52.01407241821289, -46.62065124511719, -41.227230072021484, -35.83380889892578, -30.440385818481445, -25.046964645385742, -19.653541564941406, -14.260120391845703, -8.86669921875, -3.4732775688171387, 1.9201440811157227, 7.313566207885742, 12.706987380981445, 18.10040855407715, 23.493831634521484, 28.887252807617188, 34.28067398071289, 39.674095153808594, 45.0675163269043, 50.4609375, 55.85436248779297, 61.247779846191406, 66.64120483398438, 72.03462219238281, 77.42804718017578, 82.82147216796875, 88.21488952636719, 93.60831451416016, 99.0017318725586, 104.39515686035156, 109.78857421875, 115.18199920654297, 120.57542419433594, 125.9688491821289, 131.36227416992188, 136.7556915283203, 142.14910888671875, 147.5425262451172, 152.9359588623047, 158.32937622070312, 163.72279357910156]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 16.0, 13.0, 23.0, 47.0, 46.0, 83.0, 118.0, 179.0, 257.0, 370.0, 513.0, 797.0, 1041.0, 1541.0, 2198.0, 2950.0, 4153.0, 1015315.0, 6154.0, 3711.0, 2603.0, 1946.0, 1337.0, 921.0, 663.0, 455.0, 320.0, 257.0, 161.0, 108.0, 69.0, 63.0, 45.0, 21.0, 11.0, 13.0, 11.0, 3.0, 1.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.211097717285156, -32.134246826171875, -31.057397842407227, -29.980546951293945, -28.903697967529297, -27.826847076416016, -26.749996185302734, -25.673145294189453, -24.596296310424805, -23.519445419311523, -22.442596435546875, -21.365745544433594, -20.288894653320312, -19.212045669555664, -18.135194778442383, -17.058345794677734, -15.981494903564453, -14.904644966125488, -13.827795028686523, -12.750944137573242, -11.674094200134277, -10.597244262695312, -9.520393371582031, -8.443543434143066, -7.366693496704102, -6.289843559265137, -5.212993144989014, -4.136142730712891, -3.059292793273926, -1.982442855834961, -0.9055924415588379, 0.17125797271728516, 1.24810791015625, 2.324958086013794, 3.401808261871338, 4.478658676147461, 5.555508613586426, 6.632358551025391, 7.709208965301514, 8.786059379577637, 9.862909317016602, 10.939759254455566, 12.016609191894531, 13.093460083007812, 14.170310020446777, 15.247159957885742, 16.324010848999023, 17.400859832763672, 18.477710723876953, 19.554561614990234, 20.631410598754883, 21.708261489868164, 22.785110473632812, 23.861961364746094, 24.938812255859375, 26.015663146972656, 27.092512130737305, 28.169363021850586, 29.246212005615234, 30.323062896728516, 31.399913787841797, 32.47676086425781, 33.553611755371094, 34.630462646484375, 35.707313537597656]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 18.0, 35.0, 86.0, 89.0, 221.0, 51461384.0, 926.0, 160.0, 41.0, 41.0, 34.0, 45.0, 29.0, 15.0, 7.0, 10.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7336.69287109375, -7052.1484375, -6767.6044921875, -6483.06005859375, -6198.51611328125, -5913.9716796875, -5629.427734375, -5344.88330078125, -5060.3388671875, -4775.79443359375, -4491.25048828125, -4206.7060546875, -3922.162109375, -3637.61767578125, -3353.073486328125, -3068.529296875, -2783.9853515625, -2499.441162109375, -2214.89697265625, -1930.3526611328125, -1645.8084716796875, -1361.2642822265625, -1076.719970703125, -792.17578125, -507.631591796875, -223.08737182617188, 61.45684814453125, 346.0010986328125, 630.5452880859375, 915.0894775390625, 1199.6337890625, 1484.177978515625, 1768.72265625, 2053.266845703125, 2337.81103515625, 2622.35546875, 2906.8994140625, 3191.44384765625, 3475.988037109375, 3760.5322265625, 4045.076416015625, 4329.62060546875, 4614.1650390625, 4898.708984375, 5183.25341796875, 5467.79736328125, 5752.341796875, 6036.8857421875, 6321.43017578125, 6605.974609375, 6890.5185546875, 7175.06298828125, 7459.60693359375, 7744.1513671875, 8028.6953125, 8313.240234375, 8597.7841796875, 8882.328125, 9166.873046875, 9451.4169921875, 9735.9609375, 10020.5048828125, 10305.0498046875, 10589.59375, 10874.1376953125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 18.0, 7.0, 13.0, 20.0, 31.0, 65.0, 103.0, 148.0, 212.0, 378.0, 560.0, 842.0, 1480.0, 2297.0, 3838.0, 5921.0, 10031.0, 16101.0, 26197.0, 44441.0, 74961.0, 132122.0, 251395.0, 598793.0, 4046342.0, 536850.0, 233926.0, 125649.0, 72097.0, 42158.0, 24790.0, 15549.0, 9171.0, 5607.0, 3494.0, 2201.0, 1316.0, 918.0, 509.0, 334.0, 182.0, 136.0, 68.0, 57.0, 43.0, 17.0, 18.0, 6.0, 7.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-8.0546875, -7.798583984375, -7.54248046875, -7.286376953125, -7.0302734375, -6.774169921875, -6.51806640625, -6.261962890625, -6.005859375, -5.749755859375, -5.49365234375, -5.237548828125, -4.9814453125, -4.725341796875, -4.46923828125, -4.213134765625, -3.95703125, -3.700927734375, -3.44482421875, -3.188720703125, -2.9326171875, -2.676513671875, -2.42041015625, -2.164306640625, -1.908203125, -1.652099609375, -1.39599609375, -1.139892578125, -0.8837890625, -0.627685546875, -0.37158203125, -0.115478515625, 0.140625, 0.396728515625, 0.65283203125, 0.908935546875, 1.1650390625, 1.421142578125, 1.67724609375, 1.933349609375, 2.189453125, 2.445556640625, 2.70166015625, 2.957763671875, 3.2138671875, 3.469970703125, 3.72607421875, 3.982177734375, 4.23828125, 4.494384765625, 4.75048828125, 5.006591796875, 5.2626953125, 5.518798828125, 5.77490234375, 6.031005859375, 6.287109375, 6.543212890625, 6.79931640625, 7.055419921875, 7.3115234375, 7.567626953125, 7.82373046875, 8.079833984375, 8.3359375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 9.0, 7.0, 8.0, 11.0, 15.0, 16.0, 33.0, 25.0, 30.0, 32.0, 30.0, 26.0, 32.0, 37.0, 36.0, 47.0, 90.0, 325.0, 650.0, 100.0, 46.0, 37.0, 46.0, 45.0, 32.0, 27.0, 36.0, 24.0, 21.0, 19.0, 19.0, 20.0, 8.0, 17.0, 11.0, 11.0, 6.0, 4.0, 5.0, 5.0, 5.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.390625, -17.802978515625, -17.21533203125, -16.627685546875, -16.0400390625, -15.452392578125, -14.86474609375, -14.277099609375, -13.689453125, -13.101806640625, -12.51416015625, -11.926513671875, -11.3388671875, -10.751220703125, -10.16357421875, -9.575927734375, -8.98828125, -8.400634765625, -7.81298828125, -7.225341796875, -6.6376953125, -6.050048828125, -5.46240234375, -4.874755859375, -4.287109375, -3.699462890625, -3.11181640625, -2.524169921875, -1.9365234375, -1.348876953125, -0.76123046875, -0.173583984375, 0.4140625, 1.001708984375, 1.58935546875, 2.177001953125, 2.7646484375, 3.352294921875, 3.93994140625, 4.527587890625, 5.115234375, 5.702880859375, 6.29052734375, 6.878173828125, 7.4658203125, 8.053466796875, 8.64111328125, 9.228759765625, 9.81640625, 10.404052734375, 10.99169921875, 11.579345703125, 12.1669921875, 12.754638671875, 13.34228515625, 13.929931640625, 14.517578125, 15.105224609375, 15.69287109375, 16.280517578125, 16.8681640625, 17.455810546875, 18.04345703125, 18.631103515625, 19.21875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 6.0, 4.0, 5.0, 6.0, 7.0, 9.0, 21.0, 39.0, 58.0, 54.0, 44.0, 93.0, 148.0, 241.0, 311.0, 388.0, 641.0, 940.0, 1421.0, 2219.0, 3145.0, 4870.0, 7784.0, 11623.0, 19570.0, 30931.0, 50964.0, 86846.0, 157672.0, 329772.0, 1769271.0, 3062173.0, 353259.0, 165532.0, 90093.0, 53456.0, 31872.0, 19778.0, 12788.0, 7734.0, 5159.0, 3501.0, 2254.0, 1449.0, 1103.0, 635.0, 397.0, 285.0, 283.0, 233.0, 99.0, 54.0, 47.0, 41.0, 42.0, 37.0, 13.0, 9.0, 6.0, 3.0, 3.0, 7.0, 5.0], "bins": [-9.28125, -8.9915771484375, -8.701904296875, -8.4122314453125, -8.12255859375, -7.8328857421875, -7.543212890625, -7.2535400390625, -6.9638671875, -6.6741943359375, -6.384521484375, -6.0948486328125, -5.80517578125, -5.5155029296875, -5.225830078125, -4.9361572265625, -4.646484375, -4.3568115234375, -4.067138671875, -3.7774658203125, -3.48779296875, -3.1981201171875, -2.908447265625, -2.6187744140625, -2.3291015625, -2.0394287109375, -1.749755859375, -1.4600830078125, -1.17041015625, -0.8807373046875, -0.591064453125, -0.3013916015625, -0.01171875, 0.2779541015625, 0.567626953125, 0.8572998046875, 1.14697265625, 1.4366455078125, 1.726318359375, 2.0159912109375, 2.3056640625, 2.5953369140625, 2.885009765625, 3.1746826171875, 3.46435546875, 3.7540283203125, 4.043701171875, 4.3333740234375, 4.623046875, 4.9127197265625, 5.202392578125, 5.4920654296875, 5.78173828125, 6.0714111328125, 6.361083984375, 6.6507568359375, 6.9404296875, 7.2301025390625, 7.519775390625, 7.8094482421875, 8.09912109375, 8.3887939453125, 8.678466796875, 8.9681396484375, 9.2578125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 9.0, 19.0, 18.0, 29.0, 35.0, 32.0, 36.0, 39.0, 50.0, 38.0, 61.0, 128.0, 407.0, 591.0, 106.0, 62.0, 52.0, 50.0, 36.0, 29.0, 36.0, 31.0, 19.0, 16.0, 13.0, 18.0, 9.0, 7.0, 9.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.029052734375, -16.46435546875, -15.899658203125, -15.3349609375, -14.770263671875, -14.20556640625, -13.640869140625, -13.076171875, -12.511474609375, -11.94677734375, -11.382080078125, -10.8173828125, -10.252685546875, -9.68798828125, -9.123291015625, -8.55859375, -7.993896484375, -7.42919921875, -6.864501953125, -6.2998046875, -5.735107421875, -5.17041015625, -4.605712890625, -4.041015625, -3.476318359375, -2.91162109375, -2.346923828125, -1.7822265625, -1.217529296875, -0.65283203125, -0.088134765625, 0.4765625, 1.041259765625, 1.60595703125, 2.170654296875, 2.7353515625, 3.300048828125, 3.86474609375, 4.429443359375, 4.994140625, 5.558837890625, 6.12353515625, 6.688232421875, 7.2529296875, 7.817626953125, 8.38232421875, 8.947021484375, 9.51171875, 10.076416015625, 10.64111328125, 11.205810546875, 11.7705078125, 12.335205078125, 12.89990234375, 13.464599609375, 14.029296875, 14.593994140625, 15.15869140625, 15.723388671875, 16.2880859375, 16.852783203125, 17.41748046875, 17.982177734375, 18.546875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 11.0, 5.0, 3.0, 3.0, 7.0, 14.0, 20.0, 16.0, 22.0, 53.0, 110.0, 73.0, 69.0, 94.0, 140.0, 189.0, 380.0, 390.0, 476.0, 775.0, 1128.0, 1601.0, 2698.0, 4303.0, 8135.0, 17053.0, 46567.0, 308839.0, 5791029.0, 62661.0, 21233.0, 9246.0, 5075.0, 2814.0, 1993.0, 1193.0, 757.0, 600.0, 409.0, 317.0, 250.0, 166.0, 104.0, 112.0, 83.0, 37.0, 44.0, 50.0, 43.0, 9.0, 10.0, 8.0, 9.0, 4.0, 3.0, 0.0, 6.0, 1.0, 2.0, 6.0], "bins": [-28.59375, -27.703369140625, -26.81298828125, -25.922607421875, -25.0322265625, -24.141845703125, -23.25146484375, -22.361083984375, -21.470703125, -20.580322265625, -19.68994140625, -18.799560546875, -17.9091796875, -17.018798828125, -16.12841796875, -15.238037109375, -14.34765625, -13.457275390625, -12.56689453125, -11.676513671875, -10.7861328125, -9.895751953125, -9.00537109375, -8.114990234375, -7.224609375, -6.334228515625, -5.44384765625, -4.553466796875, -3.6630859375, -2.772705078125, -1.88232421875, -0.991943359375, -0.1015625, 0.788818359375, 1.67919921875, 2.569580078125, 3.4599609375, 4.350341796875, 5.24072265625, 6.131103515625, 7.021484375, 7.911865234375, 8.80224609375, 9.692626953125, 10.5830078125, 11.473388671875, 12.36376953125, 13.254150390625, 14.14453125, 15.034912109375, 15.92529296875, 16.815673828125, 17.7060546875, 18.596435546875, 19.48681640625, 20.377197265625, 21.267578125, 22.157958984375, 23.04833984375, 23.938720703125, 24.8291015625, 25.719482421875, 26.60986328125, 27.500244140625, 28.390625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 11.0, 9.0, 6.0, 9.0, 12.0, 13.0, 9.0, 15.0, 22.0, 21.0, 29.0, 37.0, 45.0, 38.0, 41.0, 58.0, 89.0, 172.0, 409.0, 400.0, 114.0, 74.0, 51.0, 42.0, 27.0, 35.0, 28.0, 32.0, 29.0, 29.0, 18.0, 20.0, 16.0, 10.0, 8.0, 9.0, 17.0, 5.0, 2.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8515625, -9.511962890625, -9.17236328125, -8.832763671875, -8.4931640625, -8.153564453125, -7.81396484375, -7.474365234375, -7.134765625, -6.795166015625, -6.45556640625, -6.115966796875, -5.7763671875, -5.436767578125, -5.09716796875, -4.757568359375, -4.41796875, -4.078369140625, -3.73876953125, -3.399169921875, -3.0595703125, -2.719970703125, -2.38037109375, -2.040771484375, -1.701171875, -1.361572265625, -1.02197265625, -0.682373046875, -0.3427734375, -0.003173828125, 0.33642578125, 0.676025390625, 1.015625, 1.355224609375, 1.69482421875, 2.034423828125, 2.3740234375, 2.713623046875, 3.05322265625, 3.392822265625, 3.732421875, 4.072021484375, 4.41162109375, 4.751220703125, 5.0908203125, 5.430419921875, 5.77001953125, 6.109619140625, 6.44921875, 6.788818359375, 7.12841796875, 7.468017578125, 7.8076171875, 8.147216796875, 8.48681640625, 8.826416015625, 9.166015625, 9.505615234375, 9.84521484375, 10.184814453125, 10.5244140625, 10.864013671875, 11.20361328125, 11.543212890625, 11.8828125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 10.0, 26.0, 62.0, 205.0, 469.0, 139.0, 49.0, 24.0, 8.0, 4.0, 2.0, 1.0], "bins": [-125.38099670410156, -123.1585922241211, -120.93618774414062, -118.71378326416016, -116.49137878417969, -114.26897430419922, -112.04656982421875, -109.82416534423828, -107.60176086425781, -105.37935638427734, -103.15695190429688, -100.9345474243164, -98.71214294433594, -96.48973846435547, -94.267333984375, -92.04492950439453, -89.82252502441406, -87.6001205444336, -85.37771606445312, -83.15531158447266, -80.93290710449219, -78.71050262451172, -76.48809814453125, -74.26569366455078, -72.04329681396484, -69.82089233398438, -67.5984878540039, -65.37608337402344, -63.15367889404297, -60.9312744140625, -58.70886993408203, -56.48646545410156, -54.264060974121094, -52.041656494140625, -49.819252014160156, -47.59684753417969, -45.37444305419922, -43.15203857421875, -40.92963409423828, -38.70722961425781, -36.48482894897461, -34.26242446899414, -32.04001998901367, -29.817615509033203, -27.595211029052734, -25.372806549072266, -23.15040397644043, -20.92799949645996, -18.705595016479492, -16.483190536499023, -14.260786056518555, -12.038382530212402, -9.815978050231934, -7.593573570251465, -5.3711700439453125, -3.1487655639648438, -0.926361083984375, 1.2960431575775146, 3.5184473991394043, 5.740851402282715, 7.963255882263184, 10.185660362243652, 12.408063888549805, 14.630468368530273, 16.852872848510742]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 6.0, 13.0, 15.0, 16.0, 25.0, 19.0, 27.0, 29.0, 37.0, 33.0, 37.0, 32.0, 40.0, 50.0, 41.0, 51.0, 48.0, 46.0, 39.0, 49.0, 38.0, 44.0, 34.0, 40.0, 33.0, 26.0, 24.0, 16.0, 16.0, 12.0, 14.0, 10.0, 5.0, 11.0, 7.0, 5.0, 1.0, 2.0, 2.0, 4.0], "bins": [-22.12297821044922, -21.571548461914062, -21.020118713378906, -20.46868896484375, -19.917259216308594, -19.365829467773438, -18.81439971923828, -18.262969970703125, -17.71154022216797, -17.160110473632812, -16.608680725097656, -16.0572509765625, -15.505821228027344, -14.954391479492188, -14.402961730957031, -13.851531982421875, -13.300103187561035, -12.748673439025879, -12.197243690490723, -11.645813941955566, -11.09438419342041, -10.542954444885254, -9.991525650024414, -9.440095901489258, -8.888666152954102, -8.337236404418945, -7.785806655883789, -7.234376907348633, -6.682947158813477, -6.13151741027832, -5.580088138580322, -5.028658390045166, -4.477227210998535, -3.925797462463379, -3.3743677139282227, -2.8229382038116455, -2.2715084552764893, -1.720078706741333, -1.1686491966247559, -0.6172194480895996, -0.06578969955444336, 0.4856399893760681, 1.0370696783065796, 1.5884993076324463, 2.1399290561676025, 2.691358804702759, 3.242788314819336, 3.794218063354492, 4.345647811889648, 4.897077560424805, 5.448507308959961, 5.999937057495117, 6.551366806030273, 7.10279655456543, 7.654225826263428, 8.205656051635742, 8.757085800170898, 9.308515548706055, 9.859945297241211, 10.411375045776367, 10.962804794311523, 11.51423454284668, 12.065664291381836, 12.617094039916992, 13.168522834777832]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 3.0, 1.0, 2.0, 6.0, 6.0, 8.0, 6.0, 16.0, 19.0, 12.0, 28.0, 28.0, 40.0, 44.0, 66.0, 82.0, 128.0, 190.0, 243.0, 359.0, 566.0, 844.0, 1289.0, 2090.0, 3455.0, 6220.0, 12349.0, 29927.0, 104418.0, 3822134.0, 144269.0, 35747.0, 13986.0, 6588.0, 3525.0, 1982.0, 1225.0, 780.0, 448.0, 305.0, 220.0, 162.0, 130.0, 88.0, 51.0, 50.0, 40.0, 24.0, 24.0, 16.0, 9.0, 18.0, 4.0, 8.0, 2.0, 6.0, 4.0, 0.0, 6.0, 0.0, 1.0], "bins": [-0.1090087890625, -0.10566329956054688, -0.10231781005859375, -0.09897232055664062, -0.0956268310546875, -0.09228134155273438, -0.08893585205078125, -0.08559036254882812, -0.082244873046875, -0.07889938354492188, -0.07555389404296875, -0.07220840454101562, -0.0688629150390625, -0.06551742553710938, -0.06217193603515625, -0.058826446533203125, -0.05548095703125, -0.052135467529296875, -0.04878997802734375, -0.045444488525390625, -0.0420989990234375, -0.038753509521484375, -0.03540802001953125, -0.032062530517578125, -0.028717041015625, -0.025371551513671875, -0.02202606201171875, -0.018680572509765625, -0.0153350830078125, -0.011989593505859375, -0.00864410400390625, -0.005298614501953125, -0.001953125, 0.001392364501953125, 0.00473785400390625, 0.008083343505859375, 0.0114288330078125, 0.014774322509765625, 0.01811981201171875, 0.021465301513671875, 0.024810791015625, 0.028156280517578125, 0.03150177001953125, 0.034847259521484375, 0.0381927490234375, 0.041538238525390625, 0.04488372802734375, 0.048229217529296875, 0.05157470703125, 0.054920196533203125, 0.05826568603515625, 0.061611175537109375, 0.0649566650390625, 0.06830215454101562, 0.07164764404296875, 0.07499313354492188, 0.078338623046875, 0.08168411254882812, 0.08502960205078125, 0.08837509155273438, 0.0917205810546875, 0.09506607055664062, 0.09841156005859375, 0.10175704956054688, 0.1051025390625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 8.0, 5.0, 8.0, 6.0, 4.0, 11.0, 15.0, 18.0, 83.0, 712.0, 13.0, 14.0, 12.0, 9.0, 5.0, 4.0, 8.0, 7.0, 3.0, 12.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03173828125, -0.030810117721557617, -0.029881954193115234, -0.02895379066467285, -0.02802562713623047, -0.027097463607788086, -0.026169300079345703, -0.02524113655090332, -0.024312973022460938, -0.023384809494018555, -0.022456645965576172, -0.02152848243713379, -0.020600318908691406, -0.019672155380249023, -0.01874399185180664, -0.017815828323364258, -0.016887664794921875, -0.015959501266479492, -0.01503133773803711, -0.014103174209594727, -0.013175010681152344, -0.012246847152709961, -0.011318683624267578, -0.010390520095825195, -0.009462356567382812, -0.00853419303894043, -0.007606029510498047, -0.006677865982055664, -0.005749702453613281, -0.0048215389251708984, -0.0038933753967285156, -0.002965211868286133, -0.00203704833984375, -0.0011088848114013672, -0.00018072128295898438, 0.0007474422454833984, 0.0016756057739257812, 0.002603769302368164, 0.003531932830810547, 0.00446009635925293, 0.0053882598876953125, 0.006316423416137695, 0.007244586944580078, 0.008172750473022461, 0.009100914001464844, 0.010029077529907227, 0.01095724105834961, 0.011885404586791992, 0.012813568115234375, 0.013741731643676758, 0.01466989517211914, 0.015598058700561523, 0.016526222229003906, 0.01745438575744629, 0.018382549285888672, 0.019310712814331055, 0.020238876342773438, 0.02116703987121582, 0.022095203399658203, 0.023023366928100586, 0.02395153045654297, 0.02487969398498535, 0.025807857513427734, 0.026736021041870117, 0.0276641845703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 6.0, 3.0, 5.0, 13.0, 16.0, 13.0, 31.0, 36.0, 108.0, 268.0, 641.0, 1746.0, 6129.0, 30586.0, 295329.0, 3509286.0, 308529.0, 31990.0, 6469.0, 1874.0, 649.0, 273.0, 138.0, 55.0, 33.0, 15.0, 12.0, 10.0, 8.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.1596813201904297, -0.15407943725585938, -0.14847755432128906, -0.14287567138671875, -0.13727378845214844, -0.13167190551757812, -0.1260700225830078, -0.1204681396484375, -0.11486625671386719, -0.10926437377929688, -0.10366249084472656, -0.09806060791015625, -0.09245872497558594, -0.08685684204101562, -0.08125495910644531, -0.075653076171875, -0.07005119323730469, -0.06444931030273438, -0.05884742736816406, -0.05324554443359375, -0.04764366149902344, -0.042041778564453125, -0.03643989562988281, -0.0308380126953125, -0.025236129760742188, -0.019634246826171875, -0.014032363891601562, -0.00843048095703125, -0.0028285980224609375, 0.002773284912109375, 0.008375167846679688, 0.01397705078125, 0.019578933715820312, 0.025180816650390625, 0.030782699584960938, 0.03638458251953125, 0.04198646545410156, 0.047588348388671875, 0.05319023132324219, 0.0587921142578125, 0.06439399719238281, 0.06999588012695312, 0.07559776306152344, 0.08119964599609375, 0.08680152893066406, 0.09240341186523438, 0.09800529479980469, 0.103607177734375, 0.10920906066894531, 0.11481094360351562, 0.12041282653808594, 0.12601470947265625, 0.13161659240722656, 0.13721847534179688, 0.1428203582763672, 0.1484222412109375, 0.1540241241455078, 0.15962600708007812, 0.16522789001464844, 0.17082977294921875, 0.17643165588378906, 0.18203353881835938, 0.1876354217529297, 0.1932373046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 9.0, 11.0, 8.0, 14.0, 28.0, 27.0, 43.0, 68.0, 103.0, 124.0, 219.0, 342.0, 628.0, 918.0, 533.0, 320.0, 188.0, 144.0, 82.0, 63.0, 54.0, 43.0, 25.0, 23.0, 13.0, 7.0, 4.0, 8.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.045501708984375, -0.04414081573486328, -0.04277992248535156, -0.041419029235839844, -0.040058135986328125, -0.038697242736816406, -0.03733634948730469, -0.03597545623779297, -0.03461456298828125, -0.03325366973876953, -0.03189277648925781, -0.030531883239746094, -0.029170989990234375, -0.027810096740722656, -0.026449203491210938, -0.02508831024169922, -0.0237274169921875, -0.02236652374267578, -0.021005630493164062, -0.019644737243652344, -0.018283843994140625, -0.016922950744628906, -0.015562057495117188, -0.014201164245605469, -0.01284027099609375, -0.011479377746582031, -0.010118484497070312, -0.008757591247558594, -0.007396697998046875, -0.006035804748535156, -0.0046749114990234375, -0.0033140182495117188, -0.001953125, -0.0005922317504882812, 0.0007686614990234375, 0.0021295547485351562, 0.003490447998046875, 0.004851341247558594, 0.0062122344970703125, 0.007573127746582031, 0.00893402099609375, 0.010294914245605469, 0.011655807495117188, 0.013016700744628906, 0.014377593994140625, 0.015738487243652344, 0.017099380493164062, 0.01846027374267578, 0.0198211669921875, 0.02118206024169922, 0.022542953491210938, 0.023903846740722656, 0.025264739990234375, 0.026625633239746094, 0.027986526489257812, 0.02934741973876953, 0.03070831298828125, 0.03206920623779297, 0.03343009948730469, 0.034790992736816406, 0.036151885986328125, 0.037512779235839844, 0.03887367248535156, 0.04023456573486328, 0.041595458984375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 39.0, 65.0, 145.0, 280.0, 253.0, 116.0, 50.0, 29.0, 15.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6133080720901489, -0.597533643245697, -0.5817592144012451, -0.5659847855567932, -0.5502103567123413, -0.5344359278678894, -0.5186614990234375, -0.5028870701789856, -0.4871126413345337, -0.4713382124900818, -0.4555637836456299, -0.439789354801178, -0.4240149259567261, -0.40824049711227417, -0.39246606826782227, -0.37669163942337036, -0.36091718077659607, -0.34514275193214417, -0.32936832308769226, -0.31359389424324036, -0.29781946539878845, -0.28204503655433655, -0.26627057790756226, -0.25049614906311035, -0.23472173511981964, -0.21894730627536774, -0.20317287743091583, -0.18739843368530273, -0.17162400484085083, -0.15584957599639893, -0.14007514715194702, -0.12430071830749512, -0.10852628946304321, -0.09275186061859131, -0.0769774317741394, -0.0612029954791069, -0.045428566634655, -0.029654137790203094, -0.013879701495170593, 0.001894727349281311, 0.017669156193733215, 0.03344358503818512, 0.04921801760792732, 0.06499245017766953, 0.08076687902212143, 0.09654130786657333, 0.11231574416160583, 0.12809017300605774, 0.14386460185050964, 0.15963903069496155, 0.17541345953941345, 0.19118788838386536, 0.20696231722831726, 0.22273674607276917, 0.23851118981838226, 0.25428563356399536, 0.27006006240844727, 0.28583449125289917, 0.3016089200973511, 0.317383348941803, 0.3331577777862549, 0.3489322066307068, 0.3647066354751587, 0.3804810643196106, 0.3962554931640625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 1.0, 6.0, 8.0, 7.0, 11.0, 19.0, 24.0, 35.0, 44.0, 36.0, 49.0, 52.0, 60.0, 63.0, 65.0, 62.0, 58.0, 76.0, 60.0, 51.0, 44.0, 32.0, 29.0, 19.0, 19.0, 12.0, 16.0, 9.0, 8.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23663735389709473, -0.23024378716945648, -0.22385022044181824, -0.21745665371418, -0.21106308698654175, -0.2046695202589035, -0.19827595353126526, -0.1918824017047882, -0.18548882007598877, -0.17909525334835052, -0.17270168662071228, -0.16630811989307404, -0.1599145531654358, -0.15352098643779755, -0.1471274197101593, -0.14073386788368225, -0.134340301156044, -0.12794673442840576, -0.12155316770076752, -0.11515960097312927, -0.10876603424549103, -0.10237246751785278, -0.09597890824079514, -0.08958534151315689, -0.08319177478551865, -0.0767982080578804, -0.07040464133024216, -0.06401108205318451, -0.057617511600255966, -0.05122394487261772, -0.044830381870269775, -0.03843681514263153, -0.032043248414993286, -0.02564968168735504, -0.019256116822361946, -0.01286255195736885, -0.006468985229730606, -7.541850209236145e-05, 0.006318144500255585, 0.01271171122789383, 0.019105277955532074, 0.02549884468317032, 0.03189241141080856, 0.03828597441315651, 0.044679541140794754, 0.051073107868433, 0.057466670870780945, 0.06386023759841919, 0.07025380432605743, 0.07664737105369568, 0.08304093778133392, 0.08943450450897217, 0.09582807123661041, 0.10222163796424866, 0.1086151972413063, 0.11500876396894455, 0.1214023306965828, 0.12779588997364044, 0.1341894567012787, 0.14058302342891693, 0.14697659015655518, 0.15337015688419342, 0.15976372361183167, 0.1661572903394699, 0.17255085706710815]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 5.0, 16.0, 10.0, 20.0, 32.0, 33.0, 36.0, 69.0, 88.0, 133.0, 176.0, 271.0, 383.0, 520.0, 786.0, 1102.0, 1771.0, 2560.0, 4083.0, 6916.0, 12463.0, 26626.0, 249228.0, 672147.0, 33355.0, 14429.0, 7841.0, 4578.0, 2962.0, 1865.0, 1238.0, 830.0, 582.0, 410.0, 285.0, 199.0, 148.0, 95.0, 72.0, 52.0, 33.0, 39.0, 11.0, 20.0, 10.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.157470703125, -0.15256690979003906, -0.14766311645507812, -0.1427593231201172, -0.13785552978515625, -0.1329517364501953, -0.12804794311523438, -0.12314414978027344, -0.1182403564453125, -0.11333656311035156, -0.10843276977539062, -0.10352897644042969, -0.09862518310546875, -0.09372138977050781, -0.08881759643554688, -0.08391380310058594, -0.079010009765625, -0.07410621643066406, -0.06920242309570312, -0.06429862976074219, -0.05939483642578125, -0.05449104309082031, -0.049587249755859375, -0.04468345642089844, -0.0397796630859375, -0.03487586975097656, -0.029972076416015625, -0.025068283081054688, -0.02016448974609375, -0.015260696411132812, -0.010356903076171875, -0.0054531097412109375, -0.00054931640625, 0.0043544769287109375, 0.009258270263671875, 0.014162063598632812, 0.01906585693359375, 0.023969650268554688, 0.028873443603515625, 0.03377723693847656, 0.0386810302734375, 0.04358482360839844, 0.048488616943359375, 0.05339241027832031, 0.05829620361328125, 0.06319999694824219, 0.06810379028320312, 0.07300758361816406, 0.077911376953125, 0.08281517028808594, 0.08771896362304688, 0.09262275695800781, 0.09752655029296875, 0.10243034362792969, 0.10733413696289062, 0.11223793029785156, 0.1171417236328125, 0.12204551696777344, 0.12694931030273438, 0.1318531036376953, 0.13675689697265625, 0.1416606903076172, 0.14656448364257812, 0.15146827697753906, 0.1563720703125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 6.0, 10.0, 9.0, 11.0, 13.0, 24.0, 92.0, 301.0, 298.0, 96.0, 22.0, 17.0, 13.0, 5.0, 6.0, 7.0, 7.0, 7.0, 4.0, 4.0, 7.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.030303955078125, -0.029439926147460938, -0.028575897216796875, -0.027711868286132812, -0.02684783935546875, -0.025983810424804688, -0.025119781494140625, -0.024255752563476562, -0.0233917236328125, -0.022527694702148438, -0.021663665771484375, -0.020799636840820312, -0.01993560791015625, -0.019071578979492188, -0.018207550048828125, -0.017343521118164062, -0.0164794921875, -0.015615463256835938, -0.014751434326171875, -0.013887405395507812, -0.01302337646484375, -0.012159347534179688, -0.011295318603515625, -0.010431289672851562, -0.0095672607421875, -0.008703231811523438, -0.007839202880859375, -0.0069751739501953125, -0.00611114501953125, -0.0052471160888671875, -0.004383087158203125, -0.0035190582275390625, -0.002655029296875, -0.0017910003662109375, -0.000926971435546875, -6.29425048828125e-05, 0.00080108642578125, 0.0016651153564453125, 0.002529144287109375, 0.0033931732177734375, 0.0042572021484375, 0.0051212310791015625, 0.005985260009765625, 0.0068492889404296875, 0.00771331787109375, 0.008577346801757812, 0.009441375732421875, 0.010305404663085938, 0.01116943359375, 0.012033462524414062, 0.012897491455078125, 0.013761520385742188, 0.01462554931640625, 0.015489578247070312, 0.016353607177734375, 0.017217636108398438, 0.0180816650390625, 0.018945693969726562, 0.019809722900390625, 0.020673751831054688, 0.02153778076171875, 0.022401809692382812, 0.023265838623046875, 0.024129867553710938, 0.024993896484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 8.0, 10.0, 11.0, 12.0, 15.0, 32.0, 55.0, 77.0, 127.0, 230.0, 511.0, 1373.0, 5592.0, 69179.0, 904948.0, 58975.0, 5081.0, 1269.0, 467.0, 221.0, 138.0, 82.0, 50.0, 23.0, 25.0, 15.0, 7.0, 6.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42626953125, -0.4118080139160156, -0.39734649658203125, -0.3828849792480469, -0.3684234619140625, -0.3539619445800781, -0.33950042724609375, -0.3250389099121094, -0.310577392578125, -0.2961158752441406, -0.28165435791015625, -0.2671928405761719, -0.2527313232421875, -0.23826980590820312, -0.22380828857421875, -0.20934677124023438, -0.19488525390625, -0.18042373657226562, -0.16596221923828125, -0.15150070190429688, -0.1370391845703125, -0.12257766723632812, -0.10811614990234375, -0.09365463256835938, -0.079193115234375, -0.06473159790039062, -0.05027008056640625, -0.035808563232421875, -0.0213470458984375, -0.006885528564453125, 0.00757598876953125, 0.022037506103515625, 0.0364990234375, 0.050960540771484375, 0.06542205810546875, 0.07988357543945312, 0.0943450927734375, 0.10880661010742188, 0.12326812744140625, 0.13772964477539062, 0.152191162109375, 0.16665267944335938, 0.18111419677734375, 0.19557571411132812, 0.2100372314453125, 0.22449874877929688, 0.23896026611328125, 0.2534217834472656, 0.26788330078125, 0.2823448181152344, 0.29680633544921875, 0.3112678527832031, 0.3257293701171875, 0.3401908874511719, 0.35465240478515625, 0.3691139221191406, 0.383575439453125, 0.3980369567871094, 0.41249847412109375, 0.4269599914550781, 0.4414215087890625, 0.4558830261230469, 0.47034454345703125, 0.4848060607910156, 0.499267578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 11.0, 7.0, 9.0, 11.0, 21.0, 16.0, 13.0, 21.0, 19.0, 26.0, 26.0, 24.0, 33.0, 45.0, 35.0, 31.0, 43.0, 48.0, 37.0, 42.0, 38.0, 46.0, 48.0, 29.0, 34.0, 27.0, 35.0, 43.0, 25.0, 24.0, 17.0, 30.0, 9.0, 18.0, 11.0, 4.0, 9.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1298828125, -0.12615203857421875, -0.1224212646484375, -0.11869049072265625, -0.114959716796875, -0.11122894287109375, -0.1074981689453125, -0.10376739501953125, -0.10003662109375, -0.09630584716796875, -0.0925750732421875, -0.08884429931640625, -0.085113525390625, -0.08138275146484375, -0.0776519775390625, -0.07392120361328125, -0.0701904296875, -0.06645965576171875, -0.0627288818359375, -0.05899810791015625, -0.055267333984375, -0.05153656005859375, -0.0478057861328125, -0.04407501220703125, -0.04034423828125, -0.03661346435546875, -0.0328826904296875, -0.02915191650390625, -0.025421142578125, -0.02169036865234375, -0.0179595947265625, -0.01422882080078125, -0.010498046875, -0.00676727294921875, -0.0030364990234375, 0.00069427490234375, 0.004425048828125, 0.00815582275390625, 0.0118865966796875, 0.01561737060546875, 0.01934814453125, 0.02307891845703125, 0.0268096923828125, 0.03054046630859375, 0.034271240234375, 0.03800201416015625, 0.0417327880859375, 0.04546356201171875, 0.0491943359375, 0.05292510986328125, 0.0566558837890625, 0.06038665771484375, 0.064117431640625, 0.06784820556640625, 0.0715789794921875, 0.07530975341796875, 0.07904052734375, 0.08277130126953125, 0.0865020751953125, 0.09023284912109375, 0.093963623046875, 0.09769439697265625, 0.1014251708984375, 0.10515594482421875, 0.10888671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 10.0, 18.0, 24.0, 50.0, 65.0, 88.0, 209.0, 369.0, 820.0, 2678.0, 15492.0, 968493.0, 53306.0, 4559.0, 1299.0, 442.0, 278.0, 128.0, 73.0, 37.0, 28.0, 20.0, 14.0, 8.0, 10.0, 3.0, 7.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4326171875, -0.4180450439453125, -0.403472900390625, -0.3889007568359375, -0.37432861328125, -0.3597564697265625, -0.345184326171875, -0.3306121826171875, -0.3160400390625, -0.3014678955078125, -0.286895751953125, -0.2723236083984375, -0.25775146484375, -0.2431793212890625, -0.228607177734375, -0.2140350341796875, -0.199462890625, -0.1848907470703125, -0.170318603515625, -0.1557464599609375, -0.14117431640625, -0.1266021728515625, -0.112030029296875, -0.0974578857421875, -0.0828857421875, -0.0683135986328125, -0.053741455078125, -0.0391693115234375, -0.02459716796875, -0.0100250244140625, 0.004547119140625, 0.0191192626953125, 0.03369140625, 0.0482635498046875, 0.062835693359375, 0.0774078369140625, 0.09197998046875, 0.1065521240234375, 0.121124267578125, 0.1356964111328125, 0.1502685546875, 0.1648406982421875, 0.179412841796875, 0.1939849853515625, 0.20855712890625, 0.2231292724609375, 0.237701416015625, 0.2522735595703125, 0.266845703125, 0.2814178466796875, 0.295989990234375, 0.3105621337890625, 0.32513427734375, 0.3397064208984375, 0.354278564453125, 0.3688507080078125, 0.3834228515625, 0.3979949951171875, 0.412567138671875, 0.4271392822265625, 0.44171142578125, 0.4562835693359375, 0.470855712890625, 0.4854278564453125, 0.5]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 7.0, 7.0, 11.0, 13.0, 9.0, 11.0, 18.0, 21.0, 26.0, 36.0, 38.0, 44.0, 46.0, 98.0, 149.0, 86.0, 68.0, 69.0, 48.0, 27.0, 29.0, 25.0, 22.0, 12.0, 19.0, 8.0, 10.0, 9.0, 4.0, 6.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0016937255859375, -0.0016447901725769043, -0.0015958547592163086, -0.0015469193458557129, -0.0014979839324951172, -0.0014490485191345215, -0.0014001131057739258, -0.00135117769241333, -0.0013022422790527344, -0.0012533068656921387, -0.001204371452331543, -0.0011554360389709473, -0.0011065006256103516, -0.0010575652122497559, -0.0010086297988891602, -0.0009596943855285645, -0.0009107589721679688, -0.000861823558807373, -0.0008128881454467773, -0.0007639527320861816, -0.0007150173187255859, -0.0006660819053649902, -0.0006171464920043945, -0.0005682110786437988, -0.0005192756652832031, -0.0004703402519226074, -0.0004214048385620117, -0.000372469425201416, -0.0003235340118408203, -0.0002745985984802246, -0.0002256631851196289, -0.0001767277717590332, -0.0001277923583984375, -7.88569450378418e-05, -2.9921531677246094e-05, 1.901388168334961e-05, 6.794929504394531e-05, 0.00011688470840454102, 0.00016582012176513672, 0.00021475553512573242, 0.0002636909484863281, 0.00031262636184692383, 0.00036156177520751953, 0.00041049718856811523, 0.00045943260192871094, 0.0005083680152893066, 0.0005573034286499023, 0.000606238842010498, 0.0006551742553710938, 0.0007041096687316895, 0.0007530450820922852, 0.0008019804954528809, 0.0008509159088134766, 0.0008998513221740723, 0.000948786735534668, 0.0009977221488952637, 0.0010466575622558594, 0.001095592975616455, 0.0011445283889770508, 0.0011934638023376465, 0.0012423992156982422, 0.0012913346290588379, 0.0013402700424194336, 0.0013892054557800293, 0.001438140869140625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 10.0, 6.0, 5.0, 15.0, 19.0, 19.0, 34.0, 59.0, 77.0, 125.0, 169.0, 317.0, 534.0, 961.0, 1783.0, 3831.0, 9479.0, 29937.0, 170627.0, 693493.0, 101356.0, 21657.0, 7468.0, 3120.0, 1473.0, 791.0, 424.0, 264.0, 154.0, 101.0, 76.0, 43.0, 33.0, 31.0, 19.0, 8.0, 8.0, 8.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1461181640625, -0.14130783081054688, -0.13649749755859375, -0.13168716430664062, -0.1268768310546875, -0.12206649780273438, -0.11725616455078125, -0.11244583129882812, -0.107635498046875, -0.10282516479492188, -0.09801483154296875, -0.09320449829101562, -0.0883941650390625, -0.08358383178710938, -0.07877349853515625, -0.07396316528320312, -0.06915283203125, -0.06434249877929688, -0.05953216552734375, -0.054721832275390625, -0.0499114990234375, -0.045101165771484375, -0.04029083251953125, -0.035480499267578125, -0.030670166015625, -0.025859832763671875, -0.02104949951171875, -0.016239166259765625, -0.0114288330078125, -0.006618499755859375, -0.00180816650390625, 0.003002166748046875, 0.0078125, 0.012622833251953125, 0.01743316650390625, 0.022243499755859375, 0.0270538330078125, 0.031864166259765625, 0.03667449951171875, 0.041484832763671875, 0.046295166015625, 0.051105499267578125, 0.05591583251953125, 0.060726165771484375, 0.0655364990234375, 0.07034683227539062, 0.07515716552734375, 0.07996749877929688, 0.08477783203125, 0.08958816528320312, 0.09439849853515625, 0.09920883178710938, 0.1040191650390625, 0.10882949829101562, 0.11363983154296875, 0.11845016479492188, 0.123260498046875, 0.12807083129882812, 0.13288116455078125, 0.13769149780273438, 0.1425018310546875, 0.14731216430664062, 0.15212249755859375, 0.15693283081054688, 0.1617431640625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 5.0, 8.0, 11.0, 10.0, 21.0, 20.0, 31.0, 44.0, 43.0, 50.0, 78.0, 102.0, 93.0, 89.0, 72.0, 62.0, 38.0, 35.0, 39.0, 21.0, 14.0, 17.0, 18.0, 10.0, 11.0, 10.0, 5.0, 4.0, 10.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1387939453125, -0.13465118408203125, -0.1305084228515625, -0.12636566162109375, -0.122222900390625, -0.11808013916015625, -0.1139373779296875, -0.10979461669921875, -0.10565185546875, -0.10150909423828125, -0.0973663330078125, -0.09322357177734375, -0.089080810546875, -0.08493804931640625, -0.0807952880859375, -0.07665252685546875, -0.072509765625, -0.06836700439453125, -0.0642242431640625, -0.06008148193359375, -0.055938720703125, -0.05179595947265625, -0.0476531982421875, -0.04351043701171875, -0.03936767578125, -0.03522491455078125, -0.0310821533203125, -0.02693939208984375, -0.022796630859375, -0.01865386962890625, -0.0145111083984375, -0.01036834716796875, -0.0062255859375, -0.00208282470703125, 0.0020599365234375, 0.00620269775390625, 0.010345458984375, 0.01448822021484375, 0.0186309814453125, 0.02277374267578125, 0.02691650390625, 0.03105926513671875, 0.0352020263671875, 0.03934478759765625, 0.043487548828125, 0.04763031005859375, 0.0517730712890625, 0.05591583251953125, 0.06005859375, 0.06420135498046875, 0.0683441162109375, 0.07248687744140625, 0.076629638671875, 0.08077239990234375, 0.0849151611328125, 0.08905792236328125, 0.09320068359375, 0.09734344482421875, 0.1014862060546875, 0.10562896728515625, 0.109771728515625, 0.11391448974609375, 0.1180572509765625, 0.12220001220703125, 0.1263427734375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 3.0, 3.0, 4.0, 9.0, 5.0, 15.0, 11.0, 43.0, 84.0, 188.0, 346.0, 157.0, 57.0, 31.0, 17.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.265544891357422, -2.198141574859619, -2.1307382583618164, -2.0633351802825928, -1.99593186378479, -1.9285285472869873, -1.8611253499984741, -1.793722152709961, -1.7263188362121582, -1.6589155197143555, -1.5915123224258423, -1.524109125137329, -1.4567058086395264, -1.3893024921417236, -1.3218992948532104, -1.2544960975646973, -1.1870927810668945, -1.1196894645690918, -1.0522862672805786, -0.9848830103874207, -0.9174797534942627, -0.8500764966011047, -0.7826732397079468, -0.7152699828147888, -0.6478667259216309, -0.5804634690284729, -0.5130602121353149, -0.445656955242157, -0.378253698348999, -0.31085044145584106, -0.2434471845626831, -0.17604392766952515, -0.10864090919494629, -0.04123765230178833, 0.02616560459136963, 0.09356886148452759, 0.16097211837768555, 0.2283753752708435, 0.29577863216400146, 0.3631818890571594, 0.4305851459503174, 0.49798840284347534, 0.5653916597366333, 0.6327949166297913, 0.7001981735229492, 0.7676014304161072, 0.8350046873092651, 0.9024079442024231, 0.969811201095581, 1.0372145175933838, 1.104617714881897, 1.1720209121704102, 1.239424228668213, 1.3068275451660156, 1.3742307424545288, 1.441633939743042, 1.5090372562408447, 1.5764405727386475, 1.6438437700271606, 1.7112469673156738, 1.7786502838134766, 1.8460536003112793, 1.9134567975997925, 1.9808599948883057, 2.0482633113861084]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 7.0, 13.0, 13.0, 20.0, 22.0, 64.0, 86.0, 117.0, 168.0, 158.0, 116.0, 60.0, 35.0, 27.0, 16.0, 13.0, 9.0, 8.0, 3.0, 3.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1231069564819336, -2.040691375732422, -1.9582756757736206, -1.8758600950241089, -1.7934445142745972, -1.711028814315796, -1.6286132335662842, -1.5461976528167725, -1.4637820720672607, -1.381366491317749, -1.2989507913589478, -1.216535210609436, -1.1341196298599243, -1.051703929901123, -0.9692883491516113, -0.8868727684020996, -0.8044570684432983, -0.7220414280891418, -0.6396258473396301, -0.5572102069854736, -0.4747945964336395, -0.3923789858818054, -0.3099633455276489, -0.2275477647781372, -0.1451321244239807, -0.06271650642156601, 0.019699111580848694, 0.102114737033844, 0.1845303475856781, 0.2669459581375122, 0.3493615984916687, 0.4317771792411804, 0.5141928195953369, 0.5966084599494934, 0.6790240406990051, 0.7614396810531616, 0.8438552618026733, 0.9262709021568298, 1.0086865425109863, 1.091102123260498, 1.1735177040100098, 1.2559332847595215, 1.3383489847183228, 1.4207645654678345, 1.5031801462173462, 1.5855958461761475, 1.6680114269256592, 1.750427007675171, 1.8328427076339722, 1.9152582883834839, 1.9976739883422852, 2.080089569091797, 2.1625051498413086, 2.2449207305908203, 2.327336311340332, 2.4097518920898438, 2.4921677112579346, 2.5745832920074463, 2.656998872756958, 2.739414691925049, 2.8218302726745605, 2.9042458534240723, 2.986661434173584, 3.0690770149230957, 3.1514925956726074]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 3.0, 5.0, 10.0, 18.0, 26.0, 30.0, 46.0, 111.0, 476.0, 27133.0, 4165389.0, 844.0, 75.0, 37.0, 26.0, 14.0, 13.0, 6.0, 3.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.491119384765625, -8.29473876953125, -8.098358154296875, -7.9019775390625, -7.705596923828125, -7.50921630859375, -7.312835693359375, -7.116455078125, -6.920074462890625, -6.72369384765625, -6.527313232421875, -6.3309326171875, -6.134552001953125, -5.93817138671875, -5.741790771484375, -5.54541015625, -5.349029541015625, -5.15264892578125, -4.956268310546875, -4.7598876953125, -4.563507080078125, -4.36712646484375, -4.170745849609375, -3.974365234375, -3.777984619140625, -3.58160400390625, -3.385223388671875, -3.1888427734375, -2.992462158203125, -2.79608154296875, -2.599700927734375, -2.4033203125, -2.206939697265625, -2.01055908203125, -1.814178466796875, -1.6177978515625, -1.421417236328125, -1.22503662109375, -1.028656005859375, -0.832275390625, -0.635894775390625, -0.43951416015625, -0.243133544921875, -0.0467529296875, 0.149627685546875, 0.34600830078125, 0.542388916015625, 0.73876953125, 0.935150146484375, 1.13153076171875, 1.327911376953125, 1.5242919921875, 1.720672607421875, 1.91705322265625, 2.113433837890625, 2.309814453125, 2.506195068359375, 2.70257568359375, 2.898956298828125, 3.0953369140625, 3.291717529296875, 3.48809814453125, 3.684478759765625, 3.880859375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 3.0, 6.0, 16.0, 16.0, 38.0, 57.0, 114.0, 178.0, 199.0, 138.0, 64.0, 41.0, 16.0, 15.0, 10.0, 10.0, 7.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0254364013671875, -0.024671077728271484, -0.02390575408935547, -0.023140430450439453, -0.022375106811523438, -0.021609783172607422, -0.020844459533691406, -0.02007913589477539, -0.019313812255859375, -0.01854848861694336, -0.017783164978027344, -0.017017841339111328, -0.016252517700195312, -0.015487194061279297, -0.014721870422363281, -0.013956546783447266, -0.01319122314453125, -0.012425899505615234, -0.011660575866699219, -0.010895252227783203, -0.010129928588867188, -0.009364604949951172, -0.008599281311035156, -0.00783395767211914, -0.007068634033203125, -0.006303310394287109, -0.005537986755371094, -0.004772663116455078, -0.0040073394775390625, -0.003242015838623047, -0.0024766921997070312, -0.0017113685607910156, -0.000946044921875, -0.00018072128295898438, 0.0005846023559570312, 0.0013499259948730469, 0.0021152496337890625, 0.002880573272705078, 0.0036458969116210938, 0.004411220550537109, 0.005176544189453125, 0.005941867828369141, 0.006707191467285156, 0.007472515106201172, 0.008237838745117188, 0.009003162384033203, 0.009768486022949219, 0.010533809661865234, 0.01129913330078125, 0.012064456939697266, 0.012829780578613281, 0.013595104217529297, 0.014360427856445312, 0.015125751495361328, 0.015891075134277344, 0.01665639877319336, 0.017421722412109375, 0.01818704605102539, 0.018952369689941406, 0.019717693328857422, 0.020483016967773438, 0.021248340606689453, 0.02201366424560547, 0.022778987884521484, 0.0235443115234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 9.0, 17.0, 29.0, 46.0, 86.0, 231.0, 2059.0, 3775002.0, 414531.0, 1395.0, 283.0, 188.0, 145.0, 100.0, 73.0, 39.0, 35.0, 9.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66162109375, -0.6141128540039062, -0.5666046142578125, -0.5190963745117188, -0.471588134765625, -0.42407989501953125, -0.3765716552734375, -0.32906341552734375, -0.28155517578125, -0.23404693603515625, -0.1865386962890625, -0.13903045654296875, -0.091522216796875, -0.04401397705078125, 0.0034942626953125, 0.05100250244140625, 0.0985107421875, 0.14601898193359375, 0.1935272216796875, 0.24103546142578125, 0.288543701171875, 0.33605194091796875, 0.3835601806640625, 0.43106842041015625, 0.47857666015625, 0.5260848999023438, 0.5735931396484375, 0.6211013793945312, 0.668609619140625, 0.7161178588867188, 0.7636260986328125, 0.8111343383789062, 0.858642578125, 0.9061508178710938, 0.9536590576171875, 1.0011672973632812, 1.048675537109375, 1.0961837768554688, 1.1436920166015625, 1.1912002563476562, 1.23870849609375, 1.2862167358398438, 1.3337249755859375, 1.3812332153320312, 1.428741455078125, 1.4762496948242188, 1.5237579345703125, 1.5712661743164062, 1.6187744140625, 1.6662826538085938, 1.7137908935546875, 1.7612991333007812, 1.808807373046875, 1.8563156127929688, 1.9038238525390625, 1.9513320922851562, 1.99884033203125, 2.0463485717773438, 2.0938568115234375, 2.1413650512695312, 2.188873291015625, 2.2363815307617188, 2.2838897705078125, 2.3313980102539062, 2.37890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 11.0, 24.0, 25.0, 29.0, 52.0, 76.0, 146.0, 275.0, 658.0, 1309.0, 752.0, 330.0, 151.0, 68.0, 34.0, 24.0, 18.0, 8.0, 12.0, 9.0, 14.0, 5.0, 5.0, 4.0, 5.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043487548828125, -0.04218769073486328, -0.04088783264160156, -0.039587974548339844, -0.038288116455078125, -0.036988258361816406, -0.03568840026855469, -0.03438854217529297, -0.03308868408203125, -0.03178882598876953, -0.030488967895507812, -0.029189109802246094, -0.027889251708984375, -0.026589393615722656, -0.025289535522460938, -0.02398967742919922, -0.0226898193359375, -0.02138996124267578, -0.020090103149414062, -0.018790245056152344, -0.017490386962890625, -0.016190528869628906, -0.014890670776367188, -0.013590812683105469, -0.01229095458984375, -0.010991096496582031, -0.009691238403320312, -0.008391380310058594, -0.007091522216796875, -0.005791664123535156, -0.0044918060302734375, -0.0031919479370117188, -0.00189208984375, -0.0005922317504882812, 0.0007076263427734375, 0.0020074844360351562, 0.003307342529296875, 0.004607200622558594, 0.0059070587158203125, 0.007206916809082031, 0.00850677490234375, 0.009806632995605469, 0.011106491088867188, 0.012406349182128906, 0.013706207275390625, 0.015006065368652344, 0.016305923461914062, 0.01760578155517578, 0.0189056396484375, 0.02020549774169922, 0.021505355834960938, 0.022805213928222656, 0.024105072021484375, 0.025404930114746094, 0.026704788208007812, 0.02800464630126953, 0.02930450439453125, 0.03060436248779297, 0.03190422058105469, 0.033204078674316406, 0.034503936767578125, 0.035803794860839844, 0.03710365295410156, 0.03840351104736328, 0.039703369140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [778.0, 230.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12951700389385223, 0.027795732021331787, 0.1851084679365158, 0.34242117404937744, 0.49973392486572266, 0.6570466756820679, 0.8143593668937683, 0.9716721177101135, 1.1289849281311035, 1.2862976789474487, 1.443610429763794, 1.6009230613708496, 1.7582359313964844, 1.91554856300354, 2.0728611946105957, 2.2301740646362305, 2.387486696243286, 2.544799327850342, 2.7021121978759766, 2.8594248294830322, 3.016737699508667, 3.1740503311157227, 3.3313632011413574, 3.488675832748413, 3.645988702774048, 3.8033013343811035, 3.9606142044067383, 4.117927074432373, 4.27523946762085, 4.432552337646484, 4.589865207672119, 4.747178077697754, 4.904490947723389, 5.061803817749023, 5.2191162109375, 5.376429080963135, 5.5337419509887695, 5.691054821014404, 5.848367214202881, 6.005680084228516, 6.16299295425415, 6.320305824279785, 6.477618217468262, 6.6349310874938965, 6.792243957519531, 6.949556827545166, 7.106869220733643, 7.264182090759277, 7.421494483947754, 7.578807353973389, 7.736119747161865, 7.8934326171875, 8.050745010375977, 8.20805835723877, 8.365370750427246, 8.522684097290039, 8.679996490478516, 8.837308883666992, 8.994622230529785, 9.151934623718262, 9.309247016906738, 9.466560363769531, 9.623872756958008, 9.781185150146484, 9.938498497009277]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 7.0, 6.0, 10.0, 7.0, 22.0, 35.0, 38.0, 47.0, 66.0, 98.0, 83.0, 119.0, 88.0, 87.0, 73.0, 48.0, 43.0, 35.0, 14.0, 17.0, 10.0, 9.0, 4.0, 3.0, 7.0, 4.0, 1.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23453474044799805, -0.22675292193889618, -0.2189711034297943, -0.21118929982185364, -0.20340748131275177, -0.1956256628036499, -0.18784385919570923, -0.18006204068660736, -0.1722802221775055, -0.16449840366840363, -0.15671658515930176, -0.14893478155136108, -0.14115296304225922, -0.13337114453315735, -0.12558934092521667, -0.11780752241611481, -0.11002570390701294, -0.10224388539791107, -0.0944620743393898, -0.08668026328086853, -0.07889844477176666, -0.0711166262626648, -0.06333481520414352, -0.055553000420331955, -0.047771185636520386, -0.039989370852708817, -0.03220755606889725, -0.024425741285085678, -0.01664392650127411, -0.00886211171746254, -0.0010802969336509705, 0.006701517850160599, 0.014483332633972168, 0.022265147417783737, 0.030046962201595306, 0.037828776985406876, 0.045610591769218445, 0.053392406553030014, 0.06117422133684158, 0.06895603239536285, 0.07673785090446472, 0.08451966941356659, 0.09230148047208786, 0.10008329153060913, 0.107865110039711, 0.11564692854881287, 0.12342873960733414, 0.1312105506658554, 0.13899236917495728, 0.14677418768405914, 0.154556006193161, 0.16233780980110168, 0.17011962831020355, 0.17790144681930542, 0.1856832504272461, 0.19346506893634796, 0.20124688744544983, 0.2090287059545517, 0.21681052446365356, 0.22459232807159424, 0.2323741465806961, 0.24015596508979797, 0.24793776869773865, 0.2557196021080017, 0.2635014057159424]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 8.0, 12.0, 6.0, 13.0, 22.0, 28.0, 17.0, 38.0, 48.0, 63.0, 145.0, 673.0, 3504.0, 27875.0, 907262.0, 99286.0, 7694.0, 1264.0, 283.0, 74.0, 34.0, 46.0, 23.0, 24.0, 14.0, 9.0, 20.0, 11.0, 12.0, 3.0, 5.0, 4.0, 6.0, 1.0, 8.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397705078125, -0.38385009765625, -0.3699951171875, -0.35614013671875, -0.34228515625, -0.32843017578125, -0.3145751953125, -0.30072021484375, -0.286865234375, -0.27301025390625, -0.2591552734375, -0.24530029296875, -0.2314453125, -0.21759033203125, -0.2037353515625, -0.18988037109375, -0.176025390625, -0.16217041015625, -0.1483154296875, -0.13446044921875, -0.12060546875, -0.10675048828125, -0.0928955078125, -0.07904052734375, -0.065185546875, -0.05133056640625, -0.0374755859375, -0.02362060546875, -0.009765625, 0.00408935546875, 0.0179443359375, 0.03179931640625, 0.045654296875, 0.05950927734375, 0.0733642578125, 0.08721923828125, 0.10107421875, 0.11492919921875, 0.1287841796875, 0.14263916015625, 0.156494140625, 0.17034912109375, 0.1842041015625, 0.19805908203125, 0.2119140625, 0.22576904296875, 0.2396240234375, 0.25347900390625, 0.267333984375, 0.28118896484375, 0.2950439453125, 0.30889892578125, 0.32275390625, 0.33660888671875, 0.3504638671875, 0.36431884765625, 0.378173828125, 0.39202880859375, 0.4058837890625, 0.41973876953125, 0.43359375, 0.44744873046875, 0.4613037109375, 0.47515869140625, 0.489013671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 5.0, 18.0, 19.0, 29.0, 119.0, 275.0, 296.0, 144.0, 30.0, 21.0, 10.0, 13.0, 8.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.07470703125, -0.07324361801147461, -0.07178020477294922, -0.07031679153442383, -0.06885337829589844, -0.06738996505737305, -0.06592655181884766, -0.06446313858032227, -0.06299972534179688, -0.061536312103271484, -0.060072898864746094, -0.0586094856262207, -0.05714607238769531, -0.05568265914916992, -0.05421924591064453, -0.05275583267211914, -0.05129241943359375, -0.04982900619506836, -0.04836559295654297, -0.04690217971801758, -0.04543876647949219, -0.0439753532409668, -0.042511940002441406, -0.041048526763916016, -0.039585113525390625, -0.038121700286865234, -0.036658287048339844, -0.03519487380981445, -0.03373146057128906, -0.03226804733276367, -0.03080463409423828, -0.02934122085571289, -0.0278778076171875, -0.02641439437866211, -0.02495098114013672, -0.023487567901611328, -0.022024154663085938, -0.020560741424560547, -0.019097328186035156, -0.017633914947509766, -0.016170501708984375, -0.014707088470458984, -0.013243675231933594, -0.011780261993408203, -0.010316848754882812, -0.008853435516357422, -0.007390022277832031, -0.005926609039306641, -0.00446319580078125, -0.0029997825622558594, -0.0015363693237304688, -7.295608520507812e-05, 0.0013904571533203125, 0.002853870391845703, 0.004317283630371094, 0.005780696868896484, 0.007244110107421875, 0.008707523345947266, 0.010170936584472656, 0.011634349822998047, 0.013097763061523438, 0.014561176300048828, 0.01602458953857422, 0.01748800277709961, 0.018951416015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 12.0, 17.0, 21.0, 53.0, 127.0, 713.0, 15961.0, 959774.0, 70130.0, 1384.0, 202.0, 55.0, 30.0, 12.0, 13.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6650390625, -0.6468925476074219, -0.6287460327148438, -0.6105995178222656, -0.5924530029296875, -0.5743064880371094, -0.5561599731445312, -0.5380134582519531, -0.519866943359375, -0.5017204284667969, -0.48357391357421875, -0.4654273986816406, -0.4472808837890625, -0.4291343688964844, -0.41098785400390625, -0.3928413391113281, -0.37469482421875, -0.3565483093261719, -0.33840179443359375, -0.3202552795410156, -0.3021087646484375, -0.2839622497558594, -0.26581573486328125, -0.24766921997070312, -0.229522705078125, -0.21137619018554688, -0.19322967529296875, -0.17508316040039062, -0.1569366455078125, -0.13879013061523438, -0.12064361572265625, -0.10249710083007812, -0.0843505859375, -0.06620407104492188, -0.04805755615234375, -0.029911041259765625, -0.0117645263671875, 0.006381988525390625, 0.02452850341796875, 0.042675018310546875, 0.060821533203125, 0.07896804809570312, 0.09711456298828125, 0.11526107788085938, 0.1334075927734375, 0.15155410766601562, 0.16970062255859375, 0.18784713745117188, 0.20599365234375, 0.22414016723632812, 0.24228668212890625, 0.2604331970214844, 0.2785797119140625, 0.2967262268066406, 0.31487274169921875, 0.3330192565917969, 0.351165771484375, 0.3693122863769531, 0.38745880126953125, 0.4056053161621094, 0.4237518310546875, 0.4418983459472656, 0.46004486083984375, 0.4781913757324219, 0.496337890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 9.0, 3.0, 7.0, 5.0, 5.0, 9.0, 15.0, 22.0, 19.0, 22.0, 25.0, 25.0, 31.0, 32.0, 38.0, 38.0, 41.0, 43.0, 50.0, 41.0, 32.0, 32.0, 33.0, 41.0, 31.0, 29.0, 46.0, 45.0, 31.0, 21.0, 31.0, 33.0, 11.0, 21.0, 14.0, 15.0, 11.0, 11.0, 5.0, 5.0, 3.0, 3.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06683349609375, -0.06458473205566406, -0.062335968017578125, -0.06008720397949219, -0.05783843994140625, -0.05558967590332031, -0.053340911865234375, -0.05109214782714844, -0.0488433837890625, -0.04659461975097656, -0.044345855712890625, -0.04209709167480469, -0.03984832763671875, -0.03759956359863281, -0.035350799560546875, -0.03310203552246094, -0.030853271484375, -0.028604507446289062, -0.026355743408203125, -0.024106979370117188, -0.02185821533203125, -0.019609451293945312, -0.017360687255859375, -0.015111923217773438, -0.0128631591796875, -0.010614395141601562, -0.008365631103515625, -0.0061168670654296875, -0.00386810302734375, -0.0016193389892578125, 0.000629425048828125, 0.0028781890869140625, 0.005126953125, 0.0073757171630859375, 0.009624481201171875, 0.011873245239257812, 0.01412200927734375, 0.016370773315429688, 0.018619537353515625, 0.020868301391601562, 0.0231170654296875, 0.025365829467773438, 0.027614593505859375, 0.029863357543945312, 0.03211212158203125, 0.03436088562011719, 0.036609649658203125, 0.03885841369628906, 0.041107177734375, 0.04335594177246094, 0.045604705810546875, 0.04785346984863281, 0.05010223388671875, 0.05235099792480469, 0.054599761962890625, 0.05684852600097656, 0.0590972900390625, 0.06134605407714844, 0.06359481811523438, 0.06584358215332031, 0.06809234619140625, 0.07034111022949219, 0.07258987426757812, 0.07483863830566406, 0.07708740234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 18.0, 56.0, 267.0, 1850.0, 994066.0, 51125.0, 890.0, 152.0, 41.0, 19.0, 9.0, 7.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.005859375, -0.9709930419921875, -0.936126708984375, -0.9012603759765625, -0.86639404296875, -0.8315277099609375, -0.796661376953125, -0.7617950439453125, -0.7269287109375, -0.6920623779296875, -0.657196044921875, -0.6223297119140625, -0.58746337890625, -0.5525970458984375, -0.517730712890625, -0.4828643798828125, -0.447998046875, -0.4131317138671875, -0.378265380859375, -0.3433990478515625, -0.30853271484375, -0.2736663818359375, -0.238800048828125, -0.2039337158203125, -0.1690673828125, -0.1342010498046875, -0.099334716796875, -0.0644683837890625, -0.02960205078125, 0.0052642822265625, 0.040130615234375, 0.0749969482421875, 0.10986328125, 0.1447296142578125, 0.179595947265625, 0.2144622802734375, 0.24932861328125, 0.2841949462890625, 0.319061279296875, 0.3539276123046875, 0.3887939453125, 0.4236602783203125, 0.458526611328125, 0.4933929443359375, 0.52825927734375, 0.5631256103515625, 0.597991943359375, 0.6328582763671875, 0.667724609375, 0.7025909423828125, 0.737457275390625, 0.7723236083984375, 0.80718994140625, 0.8420562744140625, 0.876922607421875, 0.9117889404296875, 0.9466552734375, 0.9815216064453125, 1.016387939453125, 1.0512542724609375, 1.08612060546875, 1.1209869384765625, 1.155853271484375, 1.1907196044921875, 1.2255859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 5.0, 3.0, 11.0, 12.0, 12.0, 25.0, 39.0, 169.0, 544.0, 65.0, 37.0, 22.0, 16.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029354095458984375, -0.0028274953365325928, -0.002719581127166748, -0.0026116669178009033, -0.0025037527084350586, -0.002395838499069214, -0.002287924289703369, -0.0021800100803375244, -0.0020720958709716797, -0.001964181661605835, -0.0018562674522399902, -0.0017483532428741455, -0.0016404390335083008, -0.001532524824142456, -0.0014246106147766113, -0.0013166964054107666, -0.0012087821960449219, -0.0011008679866790771, -0.0009929537773132324, -0.0008850395679473877, -0.000777125358581543, -0.0006692111492156982, -0.0005612969398498535, -0.0004533827304840088, -0.00034546852111816406, -0.00023755431175231934, -0.0001296401023864746, -2.1725893020629883e-05, 8.618831634521484e-05, 0.00019410252571105957, 0.0003020167350769043, 0.000409930944442749, 0.0005178451538085938, 0.0006257593631744385, 0.0007336735725402832, 0.0008415877819061279, 0.0009495019912719727, 0.0010574162006378174, 0.0011653304100036621, 0.0012732446193695068, 0.0013811588287353516, 0.0014890730381011963, 0.001596987247467041, 0.0017049014568328857, 0.0018128156661987305, 0.0019207298755645752, 0.00202864408493042, 0.0021365582942962646, 0.0022444725036621094, 0.002352386713027954, 0.002460300922393799, 0.0025682151317596436, 0.0026761293411254883, 0.002784043550491333, 0.0028919577598571777, 0.0029998719692230225, 0.003107786178588867, 0.003215700387954712, 0.0033236145973205566, 0.0034315288066864014, 0.003539443016052246, 0.003647357225418091, 0.0037552714347839355, 0.0038631856441497803, 0.003971099853515625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 2.0, 8.0, 15.0, 22.0, 21.0, 23.0, 35.0, 70.0, 86.0, 134.0, 210.0, 388.0, 799.0, 1922.0, 7112.0, 53185.0, 829934.0, 137549.0, 11981.0, 2942.0, 1039.0, 418.0, 259.0, 139.0, 85.0, 66.0, 33.0, 26.0, 18.0, 9.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25244140625, -0.24446487426757812, -0.23648834228515625, -0.22851181030273438, -0.2205352783203125, -0.21255874633789062, -0.20458221435546875, -0.19660568237304688, -0.188629150390625, -0.18065261840820312, -0.17267608642578125, -0.16469955444335938, -0.1567230224609375, -0.14874649047851562, -0.14076995849609375, -0.13279342651367188, -0.12481689453125, -0.11684036254882812, -0.10886383056640625, -0.10088729858398438, -0.0929107666015625, -0.08493423461914062, -0.07695770263671875, -0.06898117065429688, -0.061004638671875, -0.053028106689453125, -0.04505157470703125, -0.037075042724609375, -0.0290985107421875, -0.021121978759765625, -0.01314544677734375, -0.005168914794921875, 0.0028076171875, 0.010784149169921875, 0.01876068115234375, 0.026737213134765625, 0.0347137451171875, 0.042690277099609375, 0.05066680908203125, 0.058643341064453125, 0.066619873046875, 0.07459640502929688, 0.08257293701171875, 0.09054946899414062, 0.0985260009765625, 0.10650253295898438, 0.11447906494140625, 0.12245559692382812, 0.13043212890625, 0.13840866088867188, 0.14638519287109375, 0.15436172485351562, 0.1623382568359375, 0.17031478881835938, 0.17829132080078125, 0.18626785278320312, 0.194244384765625, 0.20222091674804688, 0.21019744873046875, 0.21817398071289062, 0.2261505126953125, 0.23412704467773438, 0.24210357666015625, 0.2500801086425781, 0.258056640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 15.0, 16.0, 24.0, 36.0, 71.0, 107.0, 148.0, 155.0, 130.0, 102.0, 67.0, 44.0, 22.0, 25.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1883544921875, -0.18403053283691406, -0.17970657348632812, -0.1753826141357422, -0.17105865478515625, -0.1667346954345703, -0.16241073608398438, -0.15808677673339844, -0.1537628173828125, -0.14943885803222656, -0.14511489868164062, -0.1407909393310547, -0.13646697998046875, -0.1321430206298828, -0.12781906127929688, -0.12349510192871094, -0.119171142578125, -0.11484718322753906, -0.11052322387695312, -0.10619926452636719, -0.10187530517578125, -0.09755134582519531, -0.09322738647460938, -0.08890342712402344, -0.0845794677734375, -0.08025550842285156, -0.07593154907226562, -0.07160758972167969, -0.06728363037109375, -0.06295967102050781, -0.058635711669921875, -0.05431175231933594, -0.04998779296875, -0.04566383361816406, -0.041339874267578125, -0.03701591491699219, -0.03269195556640625, -0.028367996215820312, -0.024044036865234375, -0.019720077514648438, -0.0153961181640625, -0.011072158813476562, -0.006748199462890625, -0.0024242401123046875, 0.00189971923828125, 0.0062236785888671875, 0.010547637939453125, 0.014871597290039062, 0.019195556640625, 0.023519515991210938, 0.027843475341796875, 0.03216743469238281, 0.03649139404296875, 0.04081535339355469, 0.045139312744140625, 0.04946327209472656, 0.0537872314453125, 0.05811119079589844, 0.062435150146484375, 0.06675910949707031, 0.07108306884765625, 0.07540702819824219, 0.07973098754882812, 0.08405494689941406, 0.08837890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 10.0, 12.0, 18.0, 38.0, 63.0, 105.0, 178.0, 195.0, 153.0, 114.0, 36.0, 27.0, 15.0, 10.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.082637071609497, -1.0558706521987915, -1.029104232788086, -1.00233793258667, -0.9755715131759644, -0.9488050937652588, -0.9220386743545532, -0.8952723145484924, -0.8685059547424316, -0.8417395353317261, -0.8149731755256653, -0.7882067561149597, -0.7614403963088989, -0.7346739768981934, -0.7079075574874878, -0.681141197681427, -0.6543747782707214, -0.6276083588600159, -0.6008419990539551, -0.5740755796432495, -0.5473092198371887, -0.5205428004264832, -0.4937764108181, -0.4670100212097168, -0.4402436316013336, -0.41347724199295044, -0.38671085238456726, -0.3599444627761841, -0.3331780433654785, -0.3064116835594177, -0.27964526414871216, -0.252878874540329, -0.22611242532730103, -0.19934603571891785, -0.17257964611053467, -0.1458132416009903, -0.11904685199260712, -0.09228046238422394, -0.06551405787467957, -0.03874766826629639, -0.011981278657913208, 0.01478511467576027, 0.041551508009433746, 0.06831790506839752, 0.0950842946767807, 0.12185068428516388, 0.14861708879470825, 0.17538347840309143, 0.2021498680114746, 0.2289162576198578, 0.25568264722824097, 0.28244906663894653, 0.3092154264450073, 0.3359818458557129, 0.36274823546409607, 0.38951462507247925, 0.4162810146808624, 0.4430474042892456, 0.4698137938976288, 0.49658018350601196, 0.5233466029167175, 0.5501129627227783, 0.5768793821334839, 0.6036458015441895, 0.6304121613502502]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 11.0, 9.0, 10.0, 13.0, 13.0, 26.0, 46.0, 47.0, 63.0, 105.0, 89.0, 111.0, 112.0, 71.0, 74.0, 51.0, 47.0, 28.0, 19.0, 13.0, 6.0, 8.0, 4.0, 2.0, 3.0, 3.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1939961910247803, -1.161128044128418, -1.1282597780227661, -1.0953916311264038, -1.062523365020752, -1.0296552181243896, -0.9967870712280273, -0.9639188647270203, -0.9310506582260132, -0.8981824517250061, -0.865314245223999, -0.8324460983276367, -0.7995778918266296, -0.7667096853256226, -0.7338415384292603, -0.7009733319282532, -0.6681051254272461, -0.635236918926239, -0.6023687124252319, -0.5695005655288696, -0.5366323590278625, -0.5037641525268555, -0.4708959758281708, -0.4380277991294861, -0.405159592628479, -0.3722913861274719, -0.33942320942878723, -0.30655503273010254, -0.27368682622909546, -0.24081863462924957, -0.2079504430294037, -0.1750822514295578, -0.14221394062042236, -0.10934574902057648, -0.07647755742073059, -0.043609365820884705, -0.010741174221038818, 0.022127017378807068, 0.054995208978652954, 0.08786340057849884, 0.12073159217834473, 0.1535997837781906, 0.1864679753780365, 0.21933616697788239, 0.25220435857772827, 0.28507256507873535, 0.31794074177742004, 0.35080891847610474, 0.3836771249771118, 0.4165453314781189, 0.4494135081768036, 0.4822816848754883, 0.5151498913764954, 0.5480180978775024, 0.5808862447738647, 0.6137544512748718, 0.6466226577758789, 0.679490864276886, 0.7123590707778931, 0.7452272176742554, 0.7780954241752625, 0.8109636306762695, 0.8438317775726318, 0.8766999840736389, 0.909568190574646]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 6.0, 8.0, 0.0, 6.0, 13.0, 11.0, 15.0, 17.0, 26.0, 21.0, 24.0, 25.0, 33.0, 62.0, 100.0, 533.0, 6077.0, 4161316.0, 24273.0, 1305.0, 194.0, 53.0, 30.0, 24.0, 14.0, 18.0, 10.0, 4.0, 8.0, 2.0, 6.0, 8.0, 0.0, 0.0, 2.0, 6.0, 2.0, 6.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1796875, -2.118560791015625, -2.05743408203125, -1.996307373046875, -1.9351806640625, -1.874053955078125, -1.81292724609375, -1.751800537109375, -1.690673828125, -1.629547119140625, -1.56842041015625, -1.507293701171875, -1.4461669921875, -1.385040283203125, -1.32391357421875, -1.262786865234375, -1.20166015625, -1.140533447265625, -1.07940673828125, -1.018280029296875, -0.9571533203125, -0.896026611328125, -0.83489990234375, -0.773773193359375, -0.712646484375, -0.651519775390625, -0.59039306640625, -0.529266357421875, -0.4681396484375, -0.407012939453125, -0.34588623046875, -0.284759521484375, -0.2236328125, -0.162506103515625, -0.10137939453125, -0.040252685546875, 0.0208740234375, 0.082000732421875, 0.14312744140625, 0.204254150390625, 0.265380859375, 0.326507568359375, 0.38763427734375, 0.448760986328125, 0.5098876953125, 0.571014404296875, 0.63214111328125, 0.693267822265625, 0.75439453125, 0.815521240234375, 0.87664794921875, 0.937774658203125, 0.9989013671875, 1.060028076171875, 1.12115478515625, 1.182281494140625, 1.243408203125, 1.304534912109375, 1.36566162109375, 1.426788330078125, 1.4879150390625, 1.549041748046875, 1.61016845703125, 1.671295166015625, 1.732421875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 5.0, 11.0, 15.0, 26.0, 55.0, 89.0, 145.0, 203.0, 186.0, 109.0, 61.0, 32.0, 18.0, 10.0, 6.0, 7.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0401611328125, -0.03921937942504883, -0.038277626037597656, -0.037335872650146484, -0.03639411926269531, -0.03545236587524414, -0.03451061248779297, -0.0335688591003418, -0.032627105712890625, -0.03168535232543945, -0.03074359893798828, -0.02980184555053711, -0.028860092163085938, -0.027918338775634766, -0.026976585388183594, -0.026034832000732422, -0.02509307861328125, -0.024151325225830078, -0.023209571838378906, -0.022267818450927734, -0.021326065063476562, -0.02038431167602539, -0.01944255828857422, -0.018500804901123047, -0.017559051513671875, -0.016617298126220703, -0.01567554473876953, -0.01473379135131836, -0.013792037963867188, -0.012850284576416016, -0.011908531188964844, -0.010966777801513672, -0.0100250244140625, -0.009083271026611328, -0.008141517639160156, -0.007199764251708984, -0.0062580108642578125, -0.005316257476806641, -0.004374504089355469, -0.003432750701904297, -0.002490997314453125, -0.0015492439270019531, -0.0006074905395507812, 0.0003342628479003906, 0.0012760162353515625, 0.0022177696228027344, 0.0031595230102539062, 0.004101276397705078, 0.00504302978515625, 0.005984783172607422, 0.006926536560058594, 0.007868289947509766, 0.008810043334960938, 0.00975179672241211, 0.010693550109863281, 0.011635303497314453, 0.012577056884765625, 0.013518810272216797, 0.014460563659667969, 0.01540231704711914, 0.016344070434570312, 0.017285823822021484, 0.018227577209472656, 0.019169330596923828, 0.020111083984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 16.0, 99.0, 748.0, 4187702.0, 5509.0, 185.0, 36.0], "bins": [-6.7734375, -6.661884307861328, -6.550331115722656, -6.438777923583984, -6.3272247314453125, -6.215671539306641, -6.104118347167969, -5.992565155029297, -5.881011962890625, -5.769458770751953, -5.657905578613281, -5.546352386474609, -5.4347991943359375, -5.323246002197266, -5.211692810058594, -5.100139617919922, -4.98858642578125, -4.877033233642578, -4.765480041503906, -4.653926849365234, -4.5423736572265625, -4.430820465087891, -4.319267272949219, -4.207714080810547, -4.096160888671875, -3.984607696533203, -3.8730545043945312, -3.7615013122558594, -3.6499481201171875, -3.5383949279785156, -3.4268417358398438, -3.315288543701172, -3.2037353515625, -3.092182159423828, -2.9806289672851562, -2.8690757751464844, -2.7575225830078125, -2.6459693908691406, -2.5344161987304688, -2.422863006591797, -2.311309814453125, -2.199756622314453, -2.0882034301757812, -1.9766502380371094, -1.8650970458984375, -1.7535438537597656, -1.6419906616210938, -1.5304374694824219, -1.41888427734375, -1.3073310852050781, -1.1957778930664062, -1.0842247009277344, -0.9726715087890625, -0.8611183166503906, -0.7495651245117188, -0.6380119323730469, -0.526458740234375, -0.4149055480957031, -0.30335235595703125, -0.19179916381835938, -0.0802459716796875, 0.031307220458984375, 0.14286041259765625, 0.2544136047363281, 0.365966796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 7.0, 9.0, 15.0, 32.0, 51.0, 174.0, 864.0, 2369.0, 349.0, 109.0, 46.0, 34.0, 12.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1461181640625, -0.1429586410522461, -0.1397991180419922, -0.13663959503173828, -0.13348007202148438, -0.13032054901123047, -0.12716102600097656, -0.12400150299072266, -0.12084197998046875, -0.11768245697021484, -0.11452293395996094, -0.11136341094970703, -0.10820388793945312, -0.10504436492919922, -0.10188484191894531, -0.0987253189086914, -0.0955657958984375, -0.0924062728881836, -0.08924674987792969, -0.08608722686767578, -0.08292770385742188, -0.07976818084716797, -0.07660865783691406, -0.07344913482666016, -0.07028961181640625, -0.06713008880615234, -0.06397056579589844, -0.06081104278564453, -0.057651519775390625, -0.05449199676513672, -0.05133247375488281, -0.048172950744628906, -0.045013427734375, -0.041853904724121094, -0.03869438171386719, -0.03553485870361328, -0.032375335693359375, -0.02921581268310547, -0.026056289672851562, -0.022896766662597656, -0.01973724365234375, -0.016577720642089844, -0.013418197631835938, -0.010258674621582031, -0.007099151611328125, -0.003939628601074219, -0.0007801055908203125, 0.0023794174194335938, 0.0055389404296875, 0.008698463439941406, 0.011857986450195312, 0.015017509460449219, 0.018177032470703125, 0.02133655548095703, 0.024496078491210938, 0.027655601501464844, 0.03081512451171875, 0.033974647521972656, 0.03713417053222656, 0.04029369354248047, 0.043453216552734375, 0.04661273956298828, 0.04977226257324219, 0.052931785583496094, 0.05609130859375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 363.0, 644.0, 8.0, 1.0, 1.0], "bins": [-16.237573623657227, -15.967021942138672, -15.696470260620117, -15.425917625427246, -15.155365943908691, -14.884814262390137, -14.614261627197266, -14.343709945678711, -14.073158264160156, -13.802606582641602, -13.532054901123047, -13.261502265930176, -12.990950584411621, -12.720398902893066, -12.449846267700195, -12.17929458618164, -11.908742904663086, -11.638191223144531, -11.367639541625977, -11.097086906433105, -10.82653522491455, -10.555983543395996, -10.285430908203125, -10.01487922668457, -9.744327545166016, -9.473775863647461, -9.203224182128906, -8.932671546936035, -8.66211986541748, -8.391568183898926, -8.121015548706055, -7.8504638671875, -7.579912185668945, -7.309360504150391, -7.038808345794678, -6.768256187438965, -6.49770450592041, -6.2271528244018555, -5.956600666046143, -5.68604850769043, -5.415496826171875, -5.14494514465332, -4.874392986297607, -4.6038408279418945, -4.33328914642334, -4.062737464904785, -3.7921853065490723, -3.5216333866119385, -3.251081705093384, -2.98052978515625, -2.709977865219116, -2.4394259452819824, -2.1688740253448486, -1.8983221054077148, -1.627770185470581, -1.3572182655334473, -1.0866663455963135, -0.8161144256591797, -0.5455625057220459, -0.2750105857849121, -0.00445866584777832, 0.26609325408935547, 0.5366451740264893, 0.807197093963623, 1.0777490139007568]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 15.0, 30.0, 112.0, 211.0, 282.0, 192.0, 109.0, 40.0, 14.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.9985620975494385, -2.9411702156066895, -2.8837780952453613, -2.8263862133026123, -2.768994092941284, -2.711602210998535, -2.654210329055786, -2.596818208694458, -2.539426326751709, -2.48203444480896, -2.424642324447632, -2.367250442504883, -2.3098583221435547, -2.2524664402008057, -2.1950745582580566, -2.1376824378967285, -2.0802905559539795, -2.0228986740112305, -1.9655065536499023, -1.9081146717071533, -1.8507226705551147, -1.7933306694030762, -1.7359386682510376, -1.678546667098999, -1.6211546659469604, -1.5637626647949219, -1.5063706636428833, -1.4489787817001343, -1.3915867805480957, -1.3341947793960571, -1.2768027782440186, -1.2194108963012695, -1.1620190143585205, -1.104627013206482, -1.0472350120544434, -0.9898430705070496, -0.9324511289596558, -0.8750591278076172, -0.8176671266555786, -0.7602751851081848, -0.7028831243515015, -0.6454911231994629, -0.5880991816520691, -0.5307071805000305, -0.4733152389526367, -0.41592323780059814, -0.35853126645088196, -0.30113929510116577, -0.24374735355377197, -0.1863553822040558, -0.1289634108543396, -0.07157142460346222, -0.014179453253746033, 0.04321253299713135, 0.10060450434684753, 0.15799647569656372, 0.2153884470462799, 0.2727804183959961, 0.3301723897457123, 0.38756436109542847, 0.44495636224746704, 0.5023483037948608, 0.5597403049468994, 0.617132306098938, 0.6745242476463318]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 7.0, 6.0, 5.0, 6.0, 22.0, 13.0, 19.0, 19.0, 24.0, 35.0, 26.0, 29.0, 47.0, 52.0, 37.0, 73.0, 6758.0, 1040878.0, 89.0, 57.0, 59.0, 43.0, 35.0, 38.0, 18.0, 30.0, 20.0, 16.0, 19.0, 12.0, 12.0, 4.0, 9.0, 6.0, 3.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44921875, -3.3311767578125, -3.213134765625, -3.0950927734375, -2.97705078125, -2.8590087890625, -2.740966796875, -2.6229248046875, -2.5048828125, -2.3868408203125, -2.268798828125, -2.1507568359375, -2.03271484375, -1.9146728515625, -1.796630859375, -1.6785888671875, -1.560546875, -1.4425048828125, -1.324462890625, -1.2064208984375, -1.08837890625, -0.9703369140625, -0.852294921875, -0.7342529296875, -0.6162109375, -0.4981689453125, -0.380126953125, -0.2620849609375, -0.14404296875, -0.0260009765625, 0.092041015625, 0.2100830078125, 0.328125, 0.4461669921875, 0.564208984375, 0.6822509765625, 0.80029296875, 0.9183349609375, 1.036376953125, 1.1544189453125, 1.2724609375, 1.3905029296875, 1.508544921875, 1.6265869140625, 1.74462890625, 1.8626708984375, 1.980712890625, 2.0987548828125, 2.216796875, 2.3348388671875, 2.452880859375, 2.5709228515625, 2.68896484375, 2.8070068359375, 2.925048828125, 3.0430908203125, 3.1611328125, 3.2791748046875, 3.397216796875, 3.5152587890625, 3.63330078125, 3.7513427734375, 3.869384765625, 3.9874267578125, 4.10546875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 150.0, 771.0, 95.0, 2.0], "bins": [-0.84716796875, -0.8333635330200195, -0.8195590972900391, -0.8057546615600586, -0.7919502258300781, -0.7781457901000977, -0.7643413543701172, -0.7505369186401367, -0.7367324829101562, -0.7229280471801758, -0.7091236114501953, -0.6953191757202148, -0.6815147399902344, -0.6677103042602539, -0.6539058685302734, -0.640101432800293, -0.6262969970703125, -0.612492561340332, -0.5986881256103516, -0.5848836898803711, -0.5710792541503906, -0.5572748184204102, -0.5434703826904297, -0.5296659469604492, -0.5158615112304688, -0.5020570755004883, -0.4882526397705078, -0.47444820404052734, -0.4606437683105469, -0.4468393325805664, -0.43303489685058594, -0.41923046112060547, -0.405426025390625, -0.39162158966064453, -0.37781715393066406, -0.3640127182006836, -0.3502082824707031, -0.33640384674072266, -0.3225994110107422, -0.3087949752807617, -0.29499053955078125, -0.2811861038208008, -0.2673816680908203, -0.25357723236083984, -0.23977279663085938, -0.2259683609008789, -0.21216392517089844, -0.19835948944091797, -0.1845550537109375, -0.17075061798095703, -0.15694618225097656, -0.1431417465209961, -0.12933731079101562, -0.11553287506103516, -0.10172843933105469, -0.08792400360107422, -0.07411956787109375, -0.06031513214111328, -0.04651069641113281, -0.032706260681152344, -0.018901824951171875, -0.005097389221191406, 0.008707046508789062, 0.02251148223876953, 0.03631591796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 7.0, 10.0, 9.0, 14.0, 19.0, 26.0, 45.0, 73.0, 157.0, 249.0, 509.0, 1092.0, 2718.0, 7804.0, 29410.0, 173878.0, 704239.0, 98796.0, 19934.0, 5741.0, 2031.0, 814.0, 411.0, 211.0, 111.0, 77.0, 43.0, 43.0, 19.0, 9.0, 9.0, 8.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.73388671875, -0.708892822265625, -0.68389892578125, -0.658905029296875, -0.6339111328125, -0.608917236328125, -0.58392333984375, -0.558929443359375, -0.533935546875, -0.508941650390625, -0.48394775390625, -0.458953857421875, -0.4339599609375, -0.408966064453125, -0.38397216796875, -0.358978271484375, -0.333984375, -0.308990478515625, -0.28399658203125, -0.259002685546875, -0.2340087890625, -0.209014892578125, -0.18402099609375, -0.159027099609375, -0.134033203125, -0.109039306640625, -0.08404541015625, -0.059051513671875, -0.0340576171875, -0.009063720703125, 0.01593017578125, 0.040924072265625, 0.06591796875, 0.090911865234375, 0.11590576171875, 0.140899658203125, 0.1658935546875, 0.190887451171875, 0.21588134765625, 0.240875244140625, 0.265869140625, 0.290863037109375, 0.31585693359375, 0.340850830078125, 0.3658447265625, 0.390838623046875, 0.41583251953125, 0.440826416015625, 0.4658203125, 0.490814208984375, 0.51580810546875, 0.540802001953125, 0.5657958984375, 0.590789794921875, 0.61578369140625, 0.640777587890625, 0.665771484375, 0.690765380859375, 0.71575927734375, 0.740753173828125, 0.7657470703125, 0.790740966796875, 0.81573486328125, 0.840728759765625, 0.86572265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 7.0, 13.0, 7.0, 11.0, 11.0, 25.0, 32.0, 38.0, 50.0, 54.0, 50.0, 52.0, 75.0, 80.0, 59.0, 72.0, 71.0, 59.0, 39.0, 29.0, 40.0, 25.0, 25.0, 16.0, 11.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5417861938476562, -0.5215606689453125, -0.5013351440429688, -0.481109619140625, -0.46088409423828125, -0.4406585693359375, -0.42043304443359375, -0.40020751953125, -0.37998199462890625, -0.3597564697265625, -0.33953094482421875, -0.319305419921875, -0.29907989501953125, -0.2788543701171875, -0.25862884521484375, -0.2384033203125, -0.21817779541015625, -0.1979522705078125, -0.17772674560546875, -0.157501220703125, -0.13727569580078125, -0.1170501708984375, -0.09682464599609375, -0.07659912109375, -0.05637359619140625, -0.0361480712890625, -0.01592254638671875, 0.004302978515625, 0.02452850341796875, 0.0447540283203125, 0.06497955322265625, 0.085205078125, 0.10543060302734375, 0.1256561279296875, 0.14588165283203125, 0.166107177734375, 0.18633270263671875, 0.2065582275390625, 0.22678375244140625, 0.24700927734375, 0.26723480224609375, 0.2874603271484375, 0.30768585205078125, 0.327911376953125, 0.34813690185546875, 0.3683624267578125, 0.38858795166015625, 0.4088134765625, 0.42903900146484375, 0.4492645263671875, 0.46949005126953125, 0.489715576171875, 0.5099411010742188, 0.5301666259765625, 0.5503921508789062, 0.57061767578125, 0.5908432006835938, 0.6110687255859375, 0.6312942504882812, 0.651519775390625, 0.6717453002929688, 0.6919708251953125, 0.7121963500976562, 0.732421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 5.0, 8.0, 6.0, 12.0, 12.0, 20.0, 18.0, 32.0, 53.0, 68.0, 149.0, 304.0, 924.0, 4040.0, 52803.0, 932467.0, 52031.0, 4000.0, 865.0, 320.0, 145.0, 69.0, 53.0, 29.0, 21.0, 17.0, 16.0, 14.0, 11.0, 4.0, 2.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.369140625, -1.3270111083984375, -1.284881591796875, -1.2427520751953125, -1.20062255859375, -1.1584930419921875, -1.116363525390625, -1.0742340087890625, -1.0321044921875, -0.9899749755859375, -0.947845458984375, -0.9057159423828125, -0.86358642578125, -0.8214569091796875, -0.779327392578125, -0.7371978759765625, -0.695068359375, -0.6529388427734375, -0.610809326171875, -0.5686798095703125, -0.52655029296875, -0.4844207763671875, -0.442291259765625, -0.4001617431640625, -0.3580322265625, -0.3159027099609375, -0.273773193359375, -0.2316436767578125, -0.18951416015625, -0.1473846435546875, -0.105255126953125, -0.0631256103515625, -0.02099609375, 0.0211334228515625, 0.063262939453125, 0.1053924560546875, 0.14752197265625, 0.1896514892578125, 0.231781005859375, 0.2739105224609375, 0.3160400390625, 0.3581695556640625, 0.400299072265625, 0.4424285888671875, 0.48455810546875, 0.5266876220703125, 0.568817138671875, 0.6109466552734375, 0.653076171875, 0.6952056884765625, 0.737335205078125, 0.7794647216796875, 0.82159423828125, 0.8637237548828125, 0.905853271484375, 0.9479827880859375, 0.9901123046875, 1.0322418212890625, 1.074371337890625, 1.1165008544921875, 1.15863037109375, 1.2007598876953125, 1.242889404296875, 1.2850189208984375, 1.3271484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 3.0, 4.0, 8.0, 10.0, 16.0, 18.0, 21.0, 40.0, 49.0, 82.0, 97.0, 181.0, 155.0, 91.0, 56.0, 46.0, 31.0, 23.0, 18.0, 12.0, 12.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0008244514465332031, -0.0008032247424125671, -0.0007819980382919312, -0.0007607713341712952, -0.0007395446300506592, -0.0007183179259300232, -0.0006970912218093872, -0.0006758645176887512, -0.0006546378135681152, -0.0006334111094474792, -0.0006121844053268433, -0.0005909577012062073, -0.0005697309970855713, -0.0005485042929649353, -0.0005272775888442993, -0.0005060508847236633, -0.00048482418060302734, -0.00046359747648239136, -0.00044237077236175537, -0.0004211440682411194, -0.0003999173641204834, -0.0003786906599998474, -0.0003574639558792114, -0.00033623725175857544, -0.00031501054763793945, -0.00029378384351730347, -0.0002725571393966675, -0.0002513304352760315, -0.0002301037311553955, -0.00020887702703475952, -0.00018765032291412354, -0.00016642361879348755, -0.00014519691467285156, -0.00012397021055221558, -0.00010274350643157959, -8.15168023109436e-05, -6.029009819030762e-05, -3.906339406967163e-05, -1.7836689949035645e-05, 3.390014171600342e-06, 2.4616718292236328e-05, 4.5843422412872314e-05, 6.70701265335083e-05, 8.829683065414429e-05, 0.00010952353477478027, 0.00013075023889541626, 0.00015197694301605225, 0.00017320364713668823, 0.00019443035125732422, 0.0002156570553779602, 0.0002368837594985962, 0.0002581104636192322, 0.00027933716773986816, 0.00030056387186050415, 0.00032179057598114014, 0.0003430172801017761, 0.0003642439842224121, 0.0003854706883430481, 0.0004066973924636841, 0.00042792409658432007, 0.00044915080070495605, 0.00047037750482559204, 0.000491604208946228, 0.000512830913066864, 0.0005340576171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 4.0, 5.0, 6.0, 4.0, 11.0, 22.0, 48.0, 81.0, 166.0, 447.0, 1284.0, 4679.0, 25142.0, 690337.0, 302818.0, 17742.0, 3872.0, 1121.0, 406.0, 157.0, 75.0, 45.0, 26.0, 10.0, 7.0, 9.0, 7.0, 5.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1591796875, -1.110687255859375, -1.06219482421875, -1.013702392578125, -0.9652099609375, -0.916717529296875, -0.86822509765625, -0.819732666015625, -0.771240234375, -0.722747802734375, -0.67425537109375, -0.625762939453125, -0.5772705078125, -0.528778076171875, -0.48028564453125, -0.431793212890625, -0.38330078125, -0.334808349609375, -0.28631591796875, -0.237823486328125, -0.1893310546875, -0.140838623046875, -0.09234619140625, -0.043853759765625, 0.004638671875, 0.053131103515625, 0.10162353515625, 0.150115966796875, 0.1986083984375, 0.247100830078125, 0.29559326171875, 0.344085693359375, 0.392578125, 0.441070556640625, 0.48956298828125, 0.538055419921875, 0.5865478515625, 0.635040283203125, 0.68353271484375, 0.732025146484375, 0.780517578125, 0.829010009765625, 0.87750244140625, 0.925994873046875, 0.9744873046875, 1.022979736328125, 1.07147216796875, 1.119964599609375, 1.16845703125, 1.216949462890625, 1.26544189453125, 1.313934326171875, 1.3624267578125, 1.410919189453125, 1.45941162109375, 1.507904052734375, 1.556396484375, 1.604888916015625, 1.65338134765625, 1.701873779296875, 1.7503662109375, 1.798858642578125, 1.84735107421875, 1.895843505859375, 1.9443359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 15.0, 12.0, 28.0, 41.0, 64.0, 134.0, 277.0, 157.0, 87.0, 54.0, 32.0, 20.0, 13.0, 5.0, 6.0, 3.0, 4.0, 4.0, 5.0, 3.0, 1.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65087890625, -0.6244277954101562, -0.5979766845703125, -0.5715255737304688, -0.545074462890625, -0.5186233520507812, -0.4921722412109375, -0.46572113037109375, -0.43927001953125, -0.41281890869140625, -0.3863677978515625, -0.35991668701171875, -0.333465576171875, -0.30701446533203125, -0.2805633544921875, -0.25411224365234375, -0.2276611328125, -0.20121002197265625, -0.1747589111328125, -0.14830780029296875, -0.121856689453125, -0.09540557861328125, -0.0689544677734375, -0.04250335693359375, -0.01605224609375, 0.01039886474609375, 0.0368499755859375, 0.06330108642578125, 0.089752197265625, 0.11620330810546875, 0.1426544189453125, 0.16910552978515625, 0.195556640625, 0.22200775146484375, 0.2484588623046875, 0.27490997314453125, 0.301361083984375, 0.32781219482421875, 0.3542633056640625, 0.38071441650390625, 0.40716552734375, 0.43361663818359375, 0.4600677490234375, 0.48651885986328125, 0.512969970703125, 0.5394210815429688, 0.5658721923828125, 0.5923233032226562, 0.6187744140625, 0.6452255249023438, 0.6716766357421875, 0.6981277465820312, 0.724578857421875, 0.7510299682617188, 0.7774810791015625, 0.8039321899414062, 0.83038330078125, 0.8568344116210938, 0.8832855224609375, 0.9097366333007812, 0.936187744140625, 0.9626388549804688, 0.9890899658203125, 1.0155410766601562, 1.0419921875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 51.0, 929.0, 32.0, 7.0], "bins": [-121.34996032714844, -119.36675262451172, -117.38353729248047, -115.40032958984375, -113.41712188720703, -111.43391418457031, -109.45069885253906, -107.46749114990234, -105.48428344726562, -103.5010757446289, -101.51786041259766, -99.53465270996094, -97.55144500732422, -95.5682373046875, -93.58502197265625, -91.60181427001953, -89.61859893798828, -87.63539123535156, -85.65217590332031, -83.6689682006836, -81.68576049804688, -79.70254516601562, -77.7193374633789, -75.73612976074219, -73.75291442871094, -71.76970672607422, -69.78649139404297, -67.80328369140625, -65.82007598876953, -63.83686447143555, -61.85365295410156, -59.870445251464844, -57.88724136352539, -55.904029846191406, -53.92082214355469, -51.9376106262207, -49.95439910888672, -47.97119140625, -45.987979888916016, -44.00476837158203, -42.02156066894531, -40.03834915161133, -38.05514144897461, -36.071929931640625, -34.088722229003906, -32.10551071166992, -30.122299194335938, -28.139089584350586, -26.155879974365234, -24.172670364379883, -22.18946075439453, -20.206249237060547, -18.223039627075195, -16.239830017089844, -14.256619453430176, -12.273408889770508, -10.29019832611084, -8.306987762451172, -6.32377815246582, -4.3405680656433105, -2.357357978820801, -0.3741483688354492, 1.6090621948242188, 3.5922727584838867, 5.575482368469238]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 10.0, 23.0, 44.0, 65.0, 77.0, 109.0, 121.0, 132.0, 128.0, 100.0, 82.0, 46.0, 29.0, 24.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.445422172546387, -14.167328834533691, -13.889235496520996, -13.611141204833984, -13.333047866821289, -13.054954528808594, -12.776861190795898, -12.498767852783203, -12.220673561096191, -11.942580223083496, -11.6644868850708, -11.386392593383789, -11.108299255371094, -10.830205917358398, -10.552112579345703, -10.274019241333008, -9.995925903320312, -9.717832565307617, -9.439739227294922, -9.16164493560791, -8.883551597595215, -8.60545825958252, -8.327364921569824, -8.049270629882812, -7.771177291870117, -7.493083953857422, -7.214990139007568, -6.936896800994873, -6.6588029861450195, -6.380709648132324, -6.102616310119629, -5.824522495269775, -5.546428680419922, -5.268335342407227, -4.990241527557373, -4.712148189544678, -4.434054374694824, -4.155961036682129, -3.8778674602508545, -3.59977388381958, -3.3216803073883057, -3.0435867309570312, -2.765493154525757, -2.4873995780944824, -2.209306240081787, -1.9312125444412231, -1.6531190872192383, -1.3750255107879639, -1.0969319343566895, -0.818838357925415, -0.5407448410987854, -0.26265132427215576, 0.015442252159118652, 0.29353582859039307, 0.5716292858123779, 0.8497228622436523, 1.1278164386749268, 1.4059100151062012, 1.6840035915374756, 1.9620970487594604, 2.2401905059814453, 2.518284320831299, 2.796377658843994, 3.0744712352752686, 3.352564811706543]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 10.0, 11.0, 12.0, 28.0, 39.0, 44.0, 100.0, 141.0, 357.0, 2312.0, 4190913.0, 251.0, 62.0, 12.0, 3.0], "bins": [-34.4375, -33.85693359375, -33.2763671875, -32.69580078125, -32.115234375, -31.53466796875, -30.9541015625, -30.37353515625, -29.79296875, -29.21240234375, -28.6318359375, -28.05126953125, -27.470703125, -26.89013671875, -26.3095703125, -25.72900390625, -25.1484375, -24.56787109375, -23.9873046875, -23.40673828125, -22.826171875, -22.24560546875, -21.6650390625, -21.08447265625, -20.50390625, -19.92333984375, -19.3427734375, -18.76220703125, -18.181640625, -17.60107421875, -17.0205078125, -16.43994140625, -15.859375, -15.27880859375, -14.6982421875, -14.11767578125, -13.537109375, -12.95654296875, -12.3759765625, -11.79541015625, -11.21484375, -10.63427734375, -10.0537109375, -9.47314453125, -8.892578125, -8.31201171875, -7.7314453125, -7.15087890625, -6.5703125, -5.98974609375, -5.4091796875, -4.82861328125, -4.248046875, -3.66748046875, -3.0869140625, -2.50634765625, -1.92578125, -1.34521484375, -0.7646484375, -0.18408203125, 0.396484375, 0.97705078125, 1.5576171875, 2.13818359375, 2.71875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 16.0, 74.0, 247.0, 383.0, 215.0, 67.0, 13.0, 3.0], "bins": [-0.99462890625, -0.977874755859375, -0.96112060546875, -0.944366455078125, -0.9276123046875, -0.910858154296875, -0.89410400390625, -0.877349853515625, -0.860595703125, -0.843841552734375, -0.82708740234375, -0.810333251953125, -0.7935791015625, -0.776824951171875, -0.76007080078125, -0.743316650390625, -0.7265625, -0.709808349609375, -0.69305419921875, -0.676300048828125, -0.6595458984375, -0.642791748046875, -0.62603759765625, -0.609283447265625, -0.592529296875, -0.575775146484375, -0.55902099609375, -0.542266845703125, -0.5255126953125, -0.508758544921875, -0.49200439453125, -0.475250244140625, -0.45849609375, -0.441741943359375, -0.42498779296875, -0.408233642578125, -0.3914794921875, -0.374725341796875, -0.35797119140625, -0.341217041015625, -0.324462890625, -0.307708740234375, -0.29095458984375, -0.274200439453125, -0.2574462890625, -0.240692138671875, -0.22393798828125, -0.207183837890625, -0.1904296875, -0.173675537109375, -0.15692138671875, -0.140167236328125, -0.1234130859375, -0.106658935546875, -0.08990478515625, -0.073150634765625, -0.056396484375, -0.039642333984375, -0.02288818359375, -0.006134033203125, 0.0106201171875, 0.027374267578125, 0.04412841796875, 0.060882568359375, 0.07763671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 11.0, 21.0, 41.0, 45.0, 80.0, 126.0, 231.0, 675.0, 22648.0, 4167945.0, 1879.0, 331.0, 117.0, 61.0, 28.0, 25.0, 8.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.3125, -20.87042236328125, -20.4283447265625, -19.98626708984375, -19.544189453125, -19.10211181640625, -18.6600341796875, -18.21795654296875, -17.77587890625, -17.33380126953125, -16.8917236328125, -16.44964599609375, -16.007568359375, -15.56549072265625, -15.1234130859375, -14.68133544921875, -14.2392578125, -13.79718017578125, -13.3551025390625, -12.91302490234375, -12.470947265625, -12.02886962890625, -11.5867919921875, -11.14471435546875, -10.70263671875, -10.26055908203125, -9.8184814453125, -9.37640380859375, -8.934326171875, -8.49224853515625, -8.0501708984375, -7.60809326171875, -7.166015625, -6.72393798828125, -6.2818603515625, -5.83978271484375, -5.397705078125, -4.95562744140625, -4.5135498046875, -4.07147216796875, -3.62939453125, -3.18731689453125, -2.7452392578125, -2.30316162109375, -1.861083984375, -1.41900634765625, -0.9769287109375, -0.53485107421875, -0.0927734375, 0.34930419921875, 0.7913818359375, 1.23345947265625, 1.675537109375, 2.11761474609375, 2.5596923828125, 3.00177001953125, 3.44384765625, 3.88592529296875, 4.3280029296875, 4.77008056640625, 5.212158203125, 5.65423583984375, 6.0963134765625, 6.53839111328125, 6.98046875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 32.0, 2979.0, 949.0, 88.0, 22.0, 8.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.9237060546875, -2.857177734375, -2.7906494140625, -2.72412109375, -2.6575927734375, -2.591064453125, -2.5245361328125, -2.4580078125, -2.3914794921875, -2.324951171875, -2.2584228515625, -2.19189453125, -2.1253662109375, -2.058837890625, -1.9923095703125, -1.92578125, -1.8592529296875, -1.792724609375, -1.7261962890625, -1.65966796875, -1.5931396484375, -1.526611328125, -1.4600830078125, -1.3935546875, -1.3270263671875, -1.260498046875, -1.1939697265625, -1.12744140625, -1.0609130859375, -0.994384765625, -0.9278564453125, -0.861328125, -0.7947998046875, -0.728271484375, -0.6617431640625, -0.59521484375, -0.5286865234375, -0.462158203125, -0.3956298828125, -0.3291015625, -0.2625732421875, -0.196044921875, -0.1295166015625, -0.06298828125, 0.0035400390625, 0.070068359375, 0.1365966796875, 0.203125, 0.2696533203125, 0.336181640625, 0.4027099609375, 0.46923828125, 0.5357666015625, 0.602294921875, 0.6688232421875, 0.7353515625, 0.8018798828125, 0.868408203125, 0.9349365234375, 1.00146484375, 1.0679931640625, 1.134521484375, 1.2010498046875, 1.267578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 10.0, 77.0, 525.0, 320.0, 42.0, 22.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-22.40868377685547, -21.999893188476562, -21.591102600097656, -21.18231201171875, -20.773521423339844, -20.364730834960938, -19.95594024658203, -19.547149658203125, -19.138357162475586, -18.72956657409668, -18.320775985717773, -17.911985397338867, -17.50319480895996, -17.094404220581055, -16.685611724853516, -16.27682113647461, -15.868032455444336, -15.45924186706543, -15.050451278686523, -14.641660690307617, -14.232869148254395, -13.824078559875488, -13.415287971496582, -13.006497383117676, -12.597705841064453, -12.188915252685547, -11.78012466430664, -11.371334075927734, -10.962542533874512, -10.553751945495605, -10.1449613571167, -9.736170768737793, -9.32737922668457, -8.918588638305664, -8.509798049926758, -8.101007461547852, -7.692216396331787, -7.283425331115723, -6.874634742736816, -6.46584415435791, -6.057053565979004, -5.648262977600098, -5.239471912384033, -4.830681324005127, -4.421890735626221, -4.013099670410156, -3.60430908203125, -3.1955184936523438, -2.7867279052734375, -2.377937078475952, -1.969146490097046, -1.5603556632995605, -1.1515649557113647, -0.742774248123169, -0.3339834213256836, 0.07480716705322266, 0.483597993850708, 0.8923887014389038, 1.3011794090270996, 1.709970235824585, 2.1187610626220703, 2.5275516510009766, 2.936342477798462, 3.345133066177368, 3.7539238929748535]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 12.0, 17.0, 44.0, 72.0, 103.0, 149.0, 152.0, 148.0, 115.0, 82.0, 51.0, 23.0, 21.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.61284065246582, -9.29484748840332, -8.97685432434082, -8.65886116027832, -8.34086799621582, -8.02287483215332, -7.704881191253662, -7.386888027191162, -7.068894863128662, -6.750901699066162, -6.432908535003662, -6.114915370941162, -5.796921730041504, -5.478928565979004, -5.160935401916504, -4.842942237854004, -4.524949073791504, -4.206955909729004, -3.888962745666504, -3.570969343185425, -3.252976179122925, -2.934983015060425, -2.6169896125793457, -2.2989964485168457, -1.9810032844543457, -1.6630101203918457, -1.3450168371200562, -1.0270235538482666, -0.7090303897857666, -0.3910372257232666, -0.07304394245147705, 0.2449493408203125, 0.5629415512084961, 0.8809347748756409, 1.1989279985427856, 1.5169212818145752, 1.8349144458770752, 2.152907609939575, 2.4709010124206543, 2.7888941764831543, 3.1068873405456543, 3.4248805046081543, 3.7428736686706543, 4.060866832733154, 4.3788604736328125, 4.6968536376953125, 5.0148468017578125, 5.3328399658203125, 5.6508331298828125, 5.9688262939453125, 6.2868194580078125, 6.6048126220703125, 6.9228057861328125, 7.2407989501953125, 7.558792591094971, 7.876785755157471, 8.194778442382812, 8.512771606445312, 8.830764770507812, 9.148757934570312, 9.466751098632812, 9.784744262695312, 10.102737426757812, 10.420730590820312, 10.738724708557129]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 7.0, 3.0, 2.0, 10.0, 16.0, 15.0, 22.0, 26.0, 46.0, 61.0, 105.0, 185.0, 570.0, 2640.0, 54527.0, 971174.0, 16665.0, 1605.0, 419.0, 179.0, 83.0, 51.0, 38.0, 28.0, 16.0, 12.0, 13.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.37109375, -5.205078125, -5.0390625, -4.873046875, -4.70703125, -4.541015625, -4.375, -4.208984375, -4.04296875, -3.876953125, -3.7109375, -3.544921875, -3.37890625, -3.212890625, -3.046875, -2.880859375, -2.71484375, -2.548828125, -2.3828125, -2.216796875, -2.05078125, -1.884765625, -1.71875, -1.552734375, -1.38671875, -1.220703125, -1.0546875, -0.888671875, -0.72265625, -0.556640625, -0.390625, -0.224609375, -0.05859375, 0.107421875, 0.2734375, 0.439453125, 0.60546875, 0.771484375, 0.9375, 1.103515625, 1.26953125, 1.435546875, 1.6015625, 1.767578125, 1.93359375, 2.099609375, 2.265625, 2.431640625, 2.59765625, 2.763671875, 2.9296875, 3.095703125, 3.26171875, 3.427734375, 3.59375, 3.759765625, 3.92578125, 4.091796875, 4.2578125, 4.423828125, 4.58984375, 4.755859375, 4.921875, 5.087890625, 5.25390625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 23.0, 48.0, 116.0, 176.0, 230.0, 209.0, 116.0, 50.0, 23.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2392578125, -1.2136955261230469, -1.1881332397460938, -1.1625709533691406, -1.1370086669921875, -1.1114463806152344, -1.0858840942382812, -1.0603218078613281, -1.034759521484375, -1.0091972351074219, -0.9836349487304688, -0.9580726623535156, -0.9325103759765625, -0.9069480895996094, -0.8813858032226562, -0.8558235168457031, -0.83026123046875, -0.8046989440917969, -0.7791366577148438, -0.7535743713378906, -0.7280120849609375, -0.7024497985839844, -0.6768875122070312, -0.6513252258300781, -0.625762939453125, -0.6002006530761719, -0.5746383666992188, -0.5490760803222656, -0.5235137939453125, -0.4979515075683594, -0.47238922119140625, -0.4468269348144531, -0.4212646484375, -0.3957023620605469, -0.37014007568359375, -0.3445777893066406, -0.3190155029296875, -0.2934532165527344, -0.26789093017578125, -0.24232864379882812, -0.216766357421875, -0.19120407104492188, -0.16564178466796875, -0.14007949829101562, -0.1145172119140625, -0.08895492553710938, -0.06339263916015625, -0.037830352783203125, -0.01226806640625, 0.013294219970703125, 0.03885650634765625, 0.06441879272460938, 0.0899810791015625, 0.11554336547851562, 0.14110565185546875, 0.16666793823242188, 0.192230224609375, 0.21779251098632812, 0.24335479736328125, 0.2689170837402344, 0.2944793701171875, 0.3200416564941406, 0.34560394287109375, 0.3711662292480469, 0.396728515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 17.0, 14.0, 17.0, 15.0, 30.0, 57.0, 80.0, 232.0, 632.0, 3074.0, 40184.0, 910688.0, 87258.0, 4907.0, 815.0, 259.0, 101.0, 54.0, 17.0, 25.0, 17.0, 13.0, 11.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.458984375, -2.373046875, -2.287109375, -2.201171875, -2.115234375, -2.029296875, -1.943359375, -1.857421875, -1.771484375, -1.685546875, -1.599609375, -1.513671875, -1.427734375, -1.341796875, -1.255859375, -1.169921875, -1.083984375, -0.998046875, -0.912109375, -0.826171875, -0.740234375, -0.654296875, -0.568359375, -0.482421875, -0.396484375, -0.310546875, -0.224609375, -0.138671875, -0.052734375, 0.033203125, 0.119140625, 0.205078125, 0.291015625, 0.376953125, 0.462890625, 0.548828125, 0.634765625, 0.720703125, 0.806640625, 0.892578125, 0.978515625, 1.064453125, 1.150390625, 1.236328125, 1.322265625, 1.408203125, 1.494140625, 1.580078125, 1.666015625, 1.751953125, 1.837890625, 1.923828125, 2.009765625, 2.095703125, 2.181640625, 2.267578125, 2.353515625, 2.439453125, 2.525390625, 2.611328125, 2.697265625, 2.783203125, 2.869140625, 2.955078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 9.0, 9.0, 15.0, 16.0, 21.0, 23.0, 36.0, 31.0, 43.0, 42.0, 53.0, 64.0, 79.0, 73.0, 67.0, 71.0, 61.0, 52.0, 50.0, 37.0, 32.0, 24.0, 21.0, 16.0, 9.0, 13.0, 8.0, 6.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2353515625, -1.19635009765625, -1.1573486328125, -1.11834716796875, -1.079345703125, -1.04034423828125, -1.0013427734375, -0.96234130859375, -0.92333984375, -0.88433837890625, -0.8453369140625, -0.80633544921875, -0.767333984375, -0.72833251953125, -0.6893310546875, -0.65032958984375, -0.611328125, -0.57232666015625, -0.5333251953125, -0.49432373046875, -0.455322265625, -0.41632080078125, -0.3773193359375, -0.33831787109375, -0.29931640625, -0.26031494140625, -0.2213134765625, -0.18231201171875, -0.143310546875, -0.10430908203125, -0.0653076171875, -0.02630615234375, 0.0126953125, 0.05169677734375, 0.0906982421875, 0.12969970703125, 0.168701171875, 0.20770263671875, 0.2467041015625, 0.28570556640625, 0.32470703125, 0.36370849609375, 0.4027099609375, 0.44171142578125, 0.480712890625, 0.51971435546875, 0.5587158203125, 0.59771728515625, 0.63671875, 0.67572021484375, 0.7147216796875, 0.75372314453125, 0.792724609375, 0.83172607421875, 0.8707275390625, 0.90972900390625, 0.94873046875, 0.98773193359375, 1.0267333984375, 1.06573486328125, 1.104736328125, 1.14373779296875, 1.1827392578125, 1.22174072265625, 1.2607421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 12.0, 20.0, 24.0, 48.0, 86.0, 180.0, 373.0, 1053.0, 4308.0, 46893.0, 857943.0, 127333.0, 7764.0, 1549.0, 522.0, 204.0, 109.0, 51.0, 32.0, 16.0, 9.0, 8.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3251953125, -1.2858123779296875, -1.246429443359375, -1.2070465087890625, -1.16766357421875, -1.1282806396484375, -1.088897705078125, -1.0495147705078125, -1.0101318359375, -0.9707489013671875, -0.931365966796875, -0.8919830322265625, -0.85260009765625, -0.8132171630859375, -0.773834228515625, -0.7344512939453125, -0.695068359375, -0.6556854248046875, -0.616302490234375, -0.5769195556640625, -0.53753662109375, -0.4981536865234375, -0.458770751953125, -0.4193878173828125, -0.3800048828125, -0.3406219482421875, -0.301239013671875, -0.2618560791015625, -0.22247314453125, -0.1830902099609375, -0.143707275390625, -0.1043243408203125, -0.06494140625, -0.0255584716796875, 0.013824462890625, 0.0532073974609375, 0.09259033203125, 0.1319732666015625, 0.171356201171875, 0.2107391357421875, 0.2501220703125, 0.2895050048828125, 0.328887939453125, 0.3682708740234375, 0.40765380859375, 0.4470367431640625, 0.486419677734375, 0.5258026123046875, 0.565185546875, 0.6045684814453125, 0.643951416015625, 0.6833343505859375, 0.72271728515625, 0.7621002197265625, 0.801483154296875, 0.8408660888671875, 0.8802490234375, 0.9196319580078125, 0.959014892578125, 0.9983978271484375, 1.03778076171875, 1.0771636962890625, 1.116546630859375, 1.1559295654296875, 1.1953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 6.0, 10.0, 6.0, 9.0, 10.0, 13.0, 14.0, 13.0, 19.0, 27.0, 30.0, 43.0, 54.0, 88.0, 163.0, 132.0, 89.0, 46.0, 23.0, 33.0, 24.0, 19.0, 15.0, 19.0, 14.0, 15.0, 14.0, 4.0, 8.0, 3.0, 4.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0004858970642089844, -0.00047066062688827515, -0.0004554241895675659, -0.0004401877522468567, -0.00042495131492614746, -0.00040971487760543823, -0.000394478440284729, -0.0003792420029640198, -0.00036400556564331055, -0.0003487691283226013, -0.0003335326910018921, -0.00031829625368118286, -0.00030305981636047363, -0.0002878233790397644, -0.0002725869417190552, -0.00025735050439834595, -0.00024211406707763672, -0.0002268776297569275, -0.00021164119243621826, -0.00019640475511550903, -0.0001811683177947998, -0.00016593188047409058, -0.00015069544315338135, -0.00013545900583267212, -0.00012022256851196289, -0.00010498613119125366, -8.974969387054443e-05, -7.45132565498352e-05, -5.9276819229125977e-05, -4.404038190841675e-05, -2.880394458770752e-05, -1.3567507266998291e-05, 1.6689300537109375e-06, 1.6905367374420166e-05, 3.2141804695129395e-05, 4.737824201583862e-05, 6.261467933654785e-05, 7.785111665725708e-05, 9.308755397796631e-05, 0.00010832399129867554, 0.00012356042861938477, 0.000138796865940094, 0.00015403330326080322, 0.00016926974058151245, 0.00018450617790222168, 0.0001997426152229309, 0.00021497905254364014, 0.00023021548986434937, 0.0002454519271850586, 0.0002606883645057678, 0.00027592480182647705, 0.0002911612391471863, 0.0003063976764678955, 0.00032163411378860474, 0.00033687055110931396, 0.0003521069884300232, 0.0003673434257507324, 0.00038257986307144165, 0.0003978163003921509, 0.0004130527377128601, 0.00042828917503356934, 0.00044352561235427856, 0.0004587620496749878, 0.000473998486995697, 0.0004892349243164062]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 15.0, 21.0, 38.0, 81.0, 249.0, 760.0, 2866.0, 24839.0, 865952.0, 144979.0, 6822.0, 1289.0, 377.0, 131.0, 61.0, 31.0, 16.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.203125, -2.1490478515625, -2.094970703125, -2.0408935546875, -1.98681640625, -1.9327392578125, -1.878662109375, -1.8245849609375, -1.7705078125, -1.7164306640625, -1.662353515625, -1.6082763671875, -1.55419921875, -1.5001220703125, -1.446044921875, -1.3919677734375, -1.337890625, -1.2838134765625, -1.229736328125, -1.1756591796875, -1.12158203125, -1.0675048828125, -1.013427734375, -0.9593505859375, -0.9052734375, -0.8511962890625, -0.797119140625, -0.7430419921875, -0.68896484375, -0.6348876953125, -0.580810546875, -0.5267333984375, -0.47265625, -0.4185791015625, -0.364501953125, -0.3104248046875, -0.25634765625, -0.2022705078125, -0.148193359375, -0.0941162109375, -0.0400390625, 0.0140380859375, 0.068115234375, 0.1221923828125, 0.17626953125, 0.2303466796875, 0.284423828125, 0.3385009765625, 0.392578125, 0.4466552734375, 0.500732421875, 0.5548095703125, 0.60888671875, 0.6629638671875, 0.717041015625, 0.7711181640625, 0.8251953125, 0.8792724609375, 0.933349609375, 0.9874267578125, 1.04150390625, 1.0955810546875, 1.149658203125, 1.2037353515625, 1.2578125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 11.0, 22.0, 35.0, 51.0, 77.0, 130.0, 202.0, 167.0, 114.0, 61.0, 48.0, 29.0, 21.0, 10.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -1.0053787231445312, -0.9795074462890625, -0.9536361694335938, -0.927764892578125, -0.9018936157226562, -0.8760223388671875, -0.8501510620117188, -0.82427978515625, -0.7984085083007812, -0.7725372314453125, -0.7466659545898438, -0.720794677734375, -0.6949234008789062, -0.6690521240234375, -0.6431808471679688, -0.6173095703125, -0.5914382934570312, -0.5655670166015625, -0.5396957397460938, -0.513824462890625, -0.48795318603515625, -0.4620819091796875, -0.43621063232421875, -0.41033935546875, -0.38446807861328125, -0.3585968017578125, -0.33272552490234375, -0.306854248046875, -0.28098297119140625, -0.2551116943359375, -0.22924041748046875, -0.203369140625, -0.17749786376953125, -0.1516265869140625, -0.12575531005859375, -0.099884033203125, -0.07401275634765625, -0.0481414794921875, -0.02227020263671875, 0.00360107421875, 0.02947235107421875, 0.0553436279296875, 0.08121490478515625, 0.107086181640625, 0.13295745849609375, 0.1588287353515625, 0.18470001220703125, 0.2105712890625, 0.23644256591796875, 0.2623138427734375, 0.28818511962890625, 0.314056396484375, 0.33992767333984375, 0.3657989501953125, 0.39167022705078125, 0.41754150390625, 0.44341278076171875, 0.4692840576171875, 0.49515533447265625, 0.521026611328125, 0.5468978881835938, 0.5727691650390625, 0.5986404418945312, 0.62451171875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 26.0, 99.0, 391.0, 357.0, 92.0, 24.0, 11.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.354442596435547, -19.86855125427246, -19.382659912109375, -18.89676856994629, -18.410877227783203, -17.924985885620117, -17.43909454345703, -16.953205108642578, -16.46731185913086, -15.981420516967773, -15.495529174804688, -15.009637832641602, -14.523746490478516, -14.03785514831543, -13.55196475982666, -13.066073417663574, -12.580183029174805, -12.094291687011719, -11.608400344848633, -11.122509002685547, -10.636617660522461, -10.150726318359375, -9.664835929870605, -9.17894458770752, -8.693053245544434, -8.207161903381348, -7.721270561218262, -7.235379695892334, -6.749488353729248, -6.263597011566162, -5.777706146240234, -5.291814804077148, -4.8059234619140625, -4.320032119750977, -3.8341410160064697, -3.348249912261963, -2.862358570098877, -2.376467227935791, -1.8905761241912842, -1.4046850204467773, -0.9187936782836914, -0.432902455329895, 0.05298876762390137, 0.5388799905776978, 1.0247712135314941, 1.51066255569458, 1.996553659439087, 2.4824447631835938, 2.9683361053466797, 3.4542274475097656, 3.9401185512542725, 4.426009654998779, 4.911900997161865, 5.397792339324951, 5.883683204650879, 6.369574546813965, 6.855465888977051, 7.341357231140137, 7.827248573303223, 8.313139915466309, 8.799030303955078, 9.284921646118164, 9.77081298828125, 10.256704330444336, 10.742595672607422]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 6.0, 18.0, 13.0, 13.0, 25.0, 29.0, 38.0, 52.0, 65.0, 63.0, 58.0, 70.0, 54.0, 59.0, 62.0, 60.0, 57.0, 53.0, 46.0, 35.0, 28.0, 26.0, 22.0, 18.0, 9.0, 7.0, 6.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9454803466796875, -6.694910526275635, -6.444340705871582, -6.1937713623046875, -5.943201541900635, -5.692631721496582, -5.442061901092529, -5.191492080688477, -4.940922737121582, -4.690352916717529, -4.439783096313477, -4.189213752746582, -3.9386439323425293, -3.6880741119384766, -3.437504291534424, -3.186934471130371, -2.9363646507263184, -2.6857948303222656, -2.435225248336792, -2.1846554279327393, -1.934085726737976, -1.683516025543213, -1.4329462051391602, -1.182376503944397, -0.9318068027496338, -0.6812371015548706, -0.43066734075546265, -0.1800975799560547, 0.0704721212387085, 0.3210418224334717, 0.5716116428375244, 0.8221813440322876, 1.0727510452270508, 1.323320746421814, 1.5738904476165771, 1.8244602680206299, 2.0750298500061035, 2.3255996704101562, 2.576169490814209, 2.8267393112182617, 3.0773088932037354, 3.327878713607788, 3.5784482955932617, 3.8290181159973145, 4.079587936401367, 4.330157279968262, 4.580727577209473, 4.831296920776367, 5.08186674118042, 5.332436561584473, 5.583006381988525, 5.833576202392578, 6.084145545959473, 6.334715366363525, 6.585285186767578, 6.835855007171631, 7.086424827575684, 7.336994647979736, 7.587564468383789, 7.838133811950684, 8.088704109191895, 8.339273452758789, 8.58984375, 8.840413093566895, 9.090982437133789]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 6.0, 17.0, 17.0, 23.0, 16.0, 22.0, 33.0, 25.0, 44.0, 53.0, 67.0, 123.0, 192.0, 428.0, 1353.0, 12059.0, 4001603.0, 172674.0, 4670.0, 618.0, 152.0, 54.0, 18.0, 7.0, 3.0, 0.0, 0.0, 2.0], "bins": [-11.2890625, -11.0753173828125, -10.861572265625, -10.6478271484375, -10.43408203125, -10.2203369140625, -10.006591796875, -9.7928466796875, -9.5791015625, -9.3653564453125, -9.151611328125, -8.9378662109375, -8.72412109375, -8.5103759765625, -8.296630859375, -8.0828857421875, -7.869140625, -7.6553955078125, -7.441650390625, -7.2279052734375, -7.01416015625, -6.8004150390625, -6.586669921875, -6.3729248046875, -6.1591796875, -5.9454345703125, -5.731689453125, -5.5179443359375, -5.30419921875, -5.0904541015625, -4.876708984375, -4.6629638671875, -4.44921875, -4.2354736328125, -4.021728515625, -3.8079833984375, -3.59423828125, -3.3804931640625, -3.166748046875, -2.9530029296875, -2.7392578125, -2.5255126953125, -2.311767578125, -2.0980224609375, -1.88427734375, -1.6705322265625, -1.456787109375, -1.2430419921875, -1.029296875, -0.8155517578125, -0.601806640625, -0.3880615234375, -0.17431640625, 0.0394287109375, 0.253173828125, 0.4669189453125, 0.6806640625, 0.8944091796875, 1.108154296875, 1.3218994140625, 1.53564453125, 1.7493896484375, 1.963134765625, 2.1768798828125, 2.390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 12.0, 26.0, 63.0, 98.0, 187.0, 194.0, 182.0, 113.0, 71.0, 25.0, 21.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.2275390625, -1.2041969299316406, -1.1808547973632812, -1.1575126647949219, -1.1341705322265625, -1.1108283996582031, -1.0874862670898438, -1.0641441345214844, -1.040802001953125, -1.0174598693847656, -0.9941177368164062, -0.9707756042480469, -0.9474334716796875, -0.9240913391113281, -0.9007492065429688, -0.8774070739746094, -0.85406494140625, -0.8307228088378906, -0.8073806762695312, -0.7840385437011719, -0.7606964111328125, -0.7373542785644531, -0.7140121459960938, -0.6906700134277344, -0.667327880859375, -0.6439857482910156, -0.6206436157226562, -0.5973014831542969, -0.5739593505859375, -0.5506172180175781, -0.5272750854492188, -0.5039329528808594, -0.4805908203125, -0.4572486877441406, -0.43390655517578125, -0.4105644226074219, -0.3872222900390625, -0.3638801574707031, -0.34053802490234375, -0.3171958923339844, -0.293853759765625, -0.2705116271972656, -0.24716949462890625, -0.22382736206054688, -0.2004852294921875, -0.17714309692382812, -0.15380096435546875, -0.13045883178710938, -0.10711669921875, -0.08377456665039062, -0.06043243408203125, -0.037090301513671875, -0.0137481689453125, 0.009593963623046875, 0.03293609619140625, 0.056278228759765625, 0.079620361328125, 0.10296249389648438, 0.12630462646484375, 0.14964675903320312, 0.1729888916015625, 0.19633102416992188, 0.21967315673828125, 0.24301528930664062, 0.266357421875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 10.0, 14.0, 32.0, 46.0, 92.0, 150.0, 401.0, 2776.0, 4188023.0, 2273.0, 262.0, 87.0, 49.0, 38.0, 17.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -33.466552734375, -32.77685546875, -32.087158203125, -31.3974609375, -30.707763671875, -30.01806640625, -29.328369140625, -28.638671875, -27.948974609375, -27.25927734375, -26.569580078125, -25.8798828125, -25.190185546875, -24.50048828125, -23.810791015625, -23.12109375, -22.431396484375, -21.74169921875, -21.052001953125, -20.3623046875, -19.672607421875, -18.98291015625, -18.293212890625, -17.603515625, -16.913818359375, -16.22412109375, -15.534423828125, -14.8447265625, -14.155029296875, -13.46533203125, -12.775634765625, -12.0859375, -11.396240234375, -10.70654296875, -10.016845703125, -9.3271484375, -8.637451171875, -7.94775390625, -7.258056640625, -6.568359375, -5.878662109375, -5.18896484375, -4.499267578125, -3.8095703125, -3.119873046875, -2.43017578125, -1.740478515625, -1.05078125, -0.361083984375, 0.32861328125, 1.018310546875, 1.7080078125, 2.397705078125, 3.08740234375, 3.777099609375, 4.466796875, 5.156494140625, 5.84619140625, 6.535888671875, 7.2255859375, 7.915283203125, 8.60498046875, 9.294677734375, 9.984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 19.0, 102.0, 3427.0, 453.0, 44.0, 16.0, 8.0, 6.0], "bins": [-4.68359375, -4.6039276123046875, -4.524261474609375, -4.4445953369140625, -4.36492919921875, -4.2852630615234375, -4.205596923828125, -4.1259307861328125, -4.0462646484375, -3.9665985107421875, -3.886932373046875, -3.8072662353515625, -3.72760009765625, -3.6479339599609375, -3.568267822265625, -3.4886016845703125, -3.408935546875, -3.3292694091796875, -3.249603271484375, -3.1699371337890625, -3.09027099609375, -3.0106048583984375, -2.930938720703125, -2.8512725830078125, -2.7716064453125, -2.6919403076171875, -2.612274169921875, -2.5326080322265625, -2.45294189453125, -2.3732757568359375, -2.293609619140625, -2.2139434814453125, -2.13427734375, -2.0546112060546875, -1.974945068359375, -1.8952789306640625, -1.81561279296875, -1.7359466552734375, -1.656280517578125, -1.5766143798828125, -1.4969482421875, -1.4172821044921875, -1.337615966796875, -1.2579498291015625, -1.17828369140625, -1.0986175537109375, -1.018951416015625, -0.9392852783203125, -0.859619140625, -0.7799530029296875, -0.700286865234375, -0.6206207275390625, -0.54095458984375, -0.4612884521484375, -0.381622314453125, -0.3019561767578125, -0.2222900390625, -0.1426239013671875, -0.062957763671875, 0.0167083740234375, 0.09637451171875, 0.1760406494140625, 0.255706787109375, 0.3353729248046875, 0.4150390625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 10.0, 9.0, 22.0, 55.0, 179.0, 476.0, 183.0, 45.0, 8.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.767427444458008, -15.442994117736816, -15.118560791015625, -14.794127464294434, -14.469694137573242, -14.145259857177734, -13.820826530456543, -13.496393203735352, -13.17195987701416, -12.847526550292969, -12.523093223571777, -12.198659896850586, -11.874225616455078, -11.549792289733887, -11.225358963012695, -10.900925636291504, -10.576492309570312, -10.252058982849121, -9.92762565612793, -9.603192329406738, -9.278759002685547, -8.954324722290039, -8.629891395568848, -8.305458068847656, -7.981024742126465, -7.656591415405273, -7.332158088684082, -7.007724285125732, -6.683290958404541, -6.35885763168335, -6.034423828125, -5.709990501403809, -5.385556221008301, -5.061122894287109, -4.736689567565918, -4.412255764007568, -4.087822437286377, -3.7633891105651855, -3.438955545425415, -3.1145219802856445, -2.790088653564453, -2.4656553268432617, -2.141221761703491, -1.8167883157730103, -1.4923548698425293, -1.1679214239120483, -0.8434879779815674, -0.5190544128417969, -0.19462108612060547, 0.1298123598098755, 0.45424580574035645, 0.7786792516708374, 1.1031126976013184, 1.4275461435317993, 1.7519795894622803, 2.076413154602051, 2.400846481323242, 2.7252798080444336, 3.049713373184204, 3.3741469383239746, 3.698580265045166, 4.023013591766357, 4.347447395324707, 4.671880722045898, 4.99631404876709]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 2.0, 10.0, 19.0, 35.0, 49.0, 68.0, 93.0, 121.0, 131.0, 118.0, 90.0, 106.0, 64.0, 40.0, 23.0, 14.0, 8.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.52816390991211, -10.221487998962402, -9.914811134338379, -9.608135223388672, -9.301459312438965, -8.994783401489258, -8.688106536865234, -8.381430625915527, -8.07475471496582, -7.768078327178955, -7.461402416229248, -7.154726028442383, -6.848050117492676, -6.5413737297058105, -6.234697341918945, -5.928021430969238, -5.621345043182373, -5.314668655395508, -5.007992744445801, -4.7013163566589355, -4.3946404457092285, -4.087964057922363, -3.781287908554077, -3.474611759185791, -3.167935609817505, -2.8612594604492188, -2.5545833110809326, -2.2479071617126465, -1.9412308931350708, -1.6345547437667847, -1.327878475189209, -1.0212023258209229, -0.7145261764526367, -0.4078499972820282, -0.10117381811141968, 0.20550239086151123, 0.5121785402297974, 0.8188546895980835, 1.1255309581756592, 1.4322071075439453, 1.7388832569122314, 2.0455594062805176, 2.3522355556488037, 2.65891170501709, 2.965588092803955, 3.272264003753662, 3.5789403915405273, 3.8856165409088135, 4.1922926902771, 4.498969078063965, 4.805644989013672, 5.112321376800537, 5.418997287750244, 5.725673675537109, 6.032349586486816, 6.339025974273682, 6.645702362060547, 6.952378749847412, 7.259054660797119, 7.565731048583984, 7.872406959533691, 8.179082870483398, 8.485759735107422, 8.792435646057129, 9.099111557006836]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 8.0, 14.0, 17.0, 15.0, 20.0, 41.0, 45.0, 75.0, 91.0, 135.0, 237.0, 389.0, 839.0, 2351.0, 9018.0, 63009.0, 795173.0, 154951.0, 16090.0, 3551.0, 1163.0, 463.0, 276.0, 174.0, 106.0, 63.0, 56.0, 42.0, 22.0, 28.0, 18.0, 16.0, 13.0, 4.0, 7.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.748046875, -3.642974853515625, -3.53790283203125, -3.432830810546875, -3.3277587890625, -3.222686767578125, -3.11761474609375, -3.012542724609375, -2.907470703125, -2.802398681640625, -2.69732666015625, -2.592254638671875, -2.4871826171875, -2.382110595703125, -2.27703857421875, -2.171966552734375, -2.06689453125, -1.961822509765625, -1.85675048828125, -1.751678466796875, -1.6466064453125, -1.541534423828125, -1.43646240234375, -1.331390380859375, -1.226318359375, -1.121246337890625, -1.01617431640625, -0.911102294921875, -0.8060302734375, -0.700958251953125, -0.59588623046875, -0.490814208984375, -0.3857421875, -0.280670166015625, -0.17559814453125, -0.070526123046875, 0.0345458984375, 0.139617919921875, 0.24468994140625, 0.349761962890625, 0.454833984375, 0.559906005859375, 0.66497802734375, 0.770050048828125, 0.8751220703125, 0.980194091796875, 1.08526611328125, 1.190338134765625, 1.29541015625, 1.400482177734375, 1.50555419921875, 1.610626220703125, 1.7156982421875, 1.820770263671875, 1.92584228515625, 2.030914306640625, 2.135986328125, 2.241058349609375, 2.34613037109375, 2.451202392578125, 2.5562744140625, 2.661346435546875, 2.76641845703125, 2.871490478515625, 2.9765625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 7.0, 19.0, 36.0, 53.0, 77.0, 93.0, 138.0, 138.0, 132.0, 102.0, 82.0, 51.0, 39.0, 15.0, 10.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.287109375, -1.2581939697265625, -1.229278564453125, -1.2003631591796875, -1.17144775390625, -1.1425323486328125, -1.113616943359375, -1.0847015380859375, -1.0557861328125, -1.0268707275390625, -0.997955322265625, -0.9690399169921875, -0.94012451171875, -0.9112091064453125, -0.882293701171875, -0.8533782958984375, -0.824462890625, -0.7955474853515625, -0.766632080078125, -0.7377166748046875, -0.70880126953125, -0.6798858642578125, -0.650970458984375, -0.6220550537109375, -0.5931396484375, -0.5642242431640625, -0.535308837890625, -0.5063934326171875, -0.47747802734375, -0.4485626220703125, -0.419647216796875, -0.3907318115234375, -0.36181640625, -0.3329010009765625, -0.303985595703125, -0.2750701904296875, -0.24615478515625, -0.2172393798828125, -0.188323974609375, -0.1594085693359375, -0.1304931640625, -0.1015777587890625, -0.072662353515625, -0.0437469482421875, -0.01483154296875, 0.0140838623046875, 0.042999267578125, 0.0719146728515625, 0.100830078125, 0.1297454833984375, 0.158660888671875, 0.1875762939453125, 0.21649169921875, 0.2454071044921875, 0.274322509765625, 0.3032379150390625, 0.3321533203125, 0.3610687255859375, 0.389984130859375, 0.4188995361328125, 0.44781494140625, 0.4767303466796875, 0.505645751953125, 0.5345611572265625, 0.5634765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 12.0, 12.0, 13.0, 18.0, 29.0, 59.0, 60.0, 109.0, 186.0, 373.0, 706.0, 1826.0, 5173.0, 18923.0, 103757.0, 733511.0, 149160.0, 24376.0, 6258.0, 2078.0, 888.0, 440.0, 215.0, 114.0, 70.0, 45.0, 34.0, 22.0, 24.0, 8.0, 11.0, 6.0, 12.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8046875, -1.741546630859375, -1.67840576171875, -1.615264892578125, -1.5521240234375, -1.488983154296875, -1.42584228515625, -1.362701416015625, -1.299560546875, -1.236419677734375, -1.17327880859375, -1.110137939453125, -1.0469970703125, -0.983856201171875, -0.92071533203125, -0.857574462890625, -0.79443359375, -0.731292724609375, -0.66815185546875, -0.605010986328125, -0.5418701171875, -0.478729248046875, -0.41558837890625, -0.352447509765625, -0.289306640625, -0.226165771484375, -0.16302490234375, -0.099884033203125, -0.0367431640625, 0.026397705078125, 0.08953857421875, 0.152679443359375, 0.2158203125, 0.278961181640625, 0.34210205078125, 0.405242919921875, 0.4683837890625, 0.531524658203125, 0.59466552734375, 0.657806396484375, 0.720947265625, 0.784088134765625, 0.84722900390625, 0.910369873046875, 0.9735107421875, 1.036651611328125, 1.09979248046875, 1.162933349609375, 1.22607421875, 1.289215087890625, 1.35235595703125, 1.415496826171875, 1.4786376953125, 1.541778564453125, 1.60491943359375, 1.668060302734375, 1.731201171875, 1.794342041015625, 1.85748291015625, 1.920623779296875, 1.9837646484375, 2.046905517578125, 2.11004638671875, 2.173187255859375, 2.236328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 7.0, 9.0, 8.0, 11.0, 14.0, 19.0, 23.0, 31.0, 32.0, 29.0, 37.0, 35.0, 53.0, 62.0, 56.0, 63.0, 58.0, 54.0, 55.0, 58.0, 39.0, 41.0, 42.0, 30.0, 23.0, 24.0, 18.0, 15.0, 11.0, 11.0, 5.0, 8.0, 4.0, 7.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.607421875, -1.551849365234375, -1.49627685546875, -1.440704345703125, -1.3851318359375, -1.329559326171875, -1.27398681640625, -1.218414306640625, -1.162841796875, -1.107269287109375, -1.05169677734375, -0.996124267578125, -0.9405517578125, -0.884979248046875, -0.82940673828125, -0.773834228515625, -0.71826171875, -0.662689208984375, -0.60711669921875, -0.551544189453125, -0.4959716796875, -0.440399169921875, -0.38482666015625, -0.329254150390625, -0.273681640625, -0.218109130859375, -0.16253662109375, -0.106964111328125, -0.0513916015625, 0.004180908203125, 0.05975341796875, 0.115325927734375, 0.1708984375, 0.226470947265625, 0.28204345703125, 0.337615966796875, 0.3931884765625, 0.448760986328125, 0.50433349609375, 0.559906005859375, 0.615478515625, 0.671051025390625, 0.72662353515625, 0.782196044921875, 0.8377685546875, 0.893341064453125, 0.94891357421875, 1.004486083984375, 1.06005859375, 1.115631103515625, 1.17120361328125, 1.226776123046875, 1.2823486328125, 1.337921142578125, 1.39349365234375, 1.449066162109375, 1.504638671875, 1.560211181640625, 1.61578369140625, 1.671356201171875, 1.7269287109375, 1.782501220703125, 1.83807373046875, 1.893646240234375, 1.94921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 10.0, 15.0, 13.0, 34.0, 46.0, 98.0, 155.0, 271.0, 594.0, 1257.0, 3050.0, 8924.0, 37875.0, 630545.0, 328150.0, 25985.0, 6880.0, 2478.0, 1111.0, 461.0, 217.0, 128.0, 79.0, 52.0, 38.0, 19.0, 12.0, 11.0, 12.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9375, -0.9071502685546875, -0.876800537109375, -0.8464508056640625, -0.81610107421875, -0.7857513427734375, -0.755401611328125, -0.7250518798828125, -0.6947021484375, -0.6643524169921875, -0.634002685546875, -0.6036529541015625, -0.57330322265625, -0.5429534912109375, -0.512603759765625, -0.4822540283203125, -0.451904296875, -0.4215545654296875, -0.391204833984375, -0.3608551025390625, -0.33050537109375, -0.3001556396484375, -0.269805908203125, -0.2394561767578125, -0.2091064453125, -0.1787567138671875, -0.148406982421875, -0.1180572509765625, -0.08770751953125, -0.0573577880859375, -0.027008056640625, 0.0033416748046875, 0.03369140625, 0.0640411376953125, 0.094390869140625, 0.1247406005859375, 0.15509033203125, 0.1854400634765625, 0.215789794921875, 0.2461395263671875, 0.2764892578125, 0.3068389892578125, 0.337188720703125, 0.3675384521484375, 0.39788818359375, 0.4282379150390625, 0.458587646484375, 0.4889373779296875, 0.519287109375, 0.5496368408203125, 0.579986572265625, 0.6103363037109375, 0.64068603515625, 0.6710357666015625, 0.701385498046875, 0.7317352294921875, 0.7620849609375, 0.7924346923828125, 0.822784423828125, 0.8531341552734375, 0.88348388671875, 0.9138336181640625, 0.944183349609375, 0.9745330810546875, 1.0048828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 17.0, 26.0, 32.0, 36.0, 74.0, 110.0, 163.0, 164.0, 129.0, 81.0, 52.0, 37.0, 28.0, 10.0, 5.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003216266632080078, -0.0003131777048110962, -0.00030472874641418457, -0.00029627978801727295, -0.00028783082962036133, -0.0002793818712234497, -0.0002709329128265381, -0.00026248395442962646, -0.00025403499603271484, -0.0002455860376358032, -0.0002371370792388916, -0.00022868812084197998, -0.00022023916244506836, -0.00021179020404815674, -0.00020334124565124512, -0.0001948922872543335, -0.00018644332885742188, -0.00017799437046051025, -0.00016954541206359863, -0.000161096453666687, -0.0001526474952697754, -0.00014419853687286377, -0.00013574957847595215, -0.00012730062007904053, -0.0001188516616821289, -0.00011040270328521729, -0.00010195374488830566, -9.350478649139404e-05, -8.505582809448242e-05, -7.66068696975708e-05, -6.815791130065918e-05, -5.970895290374756e-05, -5.125999450683594e-05, -4.2811036109924316e-05, -3.4362077713012695e-05, -2.5913119316101074e-05, -1.7464160919189453e-05, -9.015202522277832e-06, -5.662441253662109e-07, 7.88271427154541e-06, 1.633167266845703e-05, 2.4780631065368652e-05, 3.3229589462280273e-05, 4.1678547859191895e-05, 5.0127506256103516e-05, 5.857646465301514e-05, 6.702542304992676e-05, 7.547438144683838e-05, 8.392333984375e-05, 9.237229824066162e-05, 0.00010082125663757324, 0.00010927021503448486, 0.00011771917343139648, 0.0001261681318283081, 0.00013461709022521973, 0.00014306604862213135, 0.00015151500701904297, 0.0001599639654159546, 0.0001684129238128662, 0.00017686188220977783, 0.00018531084060668945, 0.00019375979900360107, 0.0002022087574005127, 0.00021065771579742432, 0.00021910667419433594]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 7.0, 8.0, 19.0, 27.0, 35.0, 53.0, 92.0, 170.0, 291.0, 484.0, 959.0, 2428.0, 6982.0, 32149.0, 555157.0, 412548.0, 26654.0, 6254.0, 2087.0, 1011.0, 483.0, 252.0, 131.0, 84.0, 55.0, 41.0, 26.0, 16.0, 14.0, 9.0, 9.0, 3.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.189453125, -1.158111572265625, -1.12677001953125, -1.095428466796875, -1.0640869140625, -1.032745361328125, -1.00140380859375, -0.970062255859375, -0.938720703125, -0.907379150390625, -0.87603759765625, -0.844696044921875, -0.8133544921875, -0.782012939453125, -0.75067138671875, -0.719329833984375, -0.68798828125, -0.656646728515625, -0.62530517578125, -0.593963623046875, -0.5626220703125, -0.531280517578125, -0.49993896484375, -0.468597412109375, -0.437255859375, -0.405914306640625, -0.37457275390625, -0.343231201171875, -0.3118896484375, -0.280548095703125, -0.24920654296875, -0.217864990234375, -0.1865234375, -0.155181884765625, -0.12384033203125, -0.092498779296875, -0.0611572265625, -0.029815673828125, 0.00152587890625, 0.032867431640625, 0.064208984375, 0.095550537109375, 0.12689208984375, 0.158233642578125, 0.1895751953125, 0.220916748046875, 0.25225830078125, 0.283599853515625, 0.31494140625, 0.346282958984375, 0.37762451171875, 0.408966064453125, 0.4403076171875, 0.471649169921875, 0.50299072265625, 0.534332275390625, 0.565673828125, 0.597015380859375, 0.62835693359375, 0.659698486328125, 0.6910400390625, 0.722381591796875, 0.75372314453125, 0.785064697265625, 0.81640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 4.0, 3.0, 5.0, 8.0, 18.0, 33.0, 39.0, 82.0, 175.0, 175.0, 184.0, 128.0, 67.0, 23.0, 23.0, 12.0, 8.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98876953125, -0.9632339477539062, -0.9376983642578125, -0.9121627807617188, -0.886627197265625, -0.8610916137695312, -0.8355560302734375, -0.8100204467773438, -0.78448486328125, -0.7589492797851562, -0.7334136962890625, -0.7078781127929688, -0.682342529296875, -0.6568069458007812, -0.6312713623046875, -0.6057357788085938, -0.5802001953125, -0.5546646118164062, -0.5291290283203125, -0.5035934448242188, -0.478057861328125, -0.45252227783203125, -0.4269866943359375, -0.40145111083984375, -0.37591552734375, -0.35037994384765625, -0.3248443603515625, -0.29930877685546875, -0.273773193359375, -0.24823760986328125, -0.2227020263671875, -0.19716644287109375, -0.171630859375, -0.14609527587890625, -0.1205596923828125, -0.09502410888671875, -0.069488525390625, -0.04395294189453125, -0.0184173583984375, 0.00711822509765625, 0.03265380859375, 0.05818939208984375, 0.0837249755859375, 0.10926055908203125, 0.134796142578125, 0.16033172607421875, 0.1858673095703125, 0.21140289306640625, 0.2369384765625, 0.26247406005859375, 0.2880096435546875, 0.31354522705078125, 0.339080810546875, 0.36461639404296875, 0.3901519775390625, 0.41568756103515625, 0.44122314453125, 0.46675872802734375, 0.4922943115234375, 0.5178298950195312, 0.543365478515625, 0.5689010620117188, 0.5944366455078125, 0.6199722290039062, 0.6455078125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 10.0, 28.0, 125.0, 377.0, 305.0, 105.0, 25.0, 14.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.373247146606445, -27.724830627441406, -27.076416015625, -26.42799949645996, -25.779582977294922, -25.131168365478516, -24.482751846313477, -23.834335327148438, -23.18592071533203, -22.537504196166992, -21.889089584350586, -21.240673065185547, -20.592256546020508, -19.94384002685547, -19.295425415039062, -18.647008895874023, -17.998592376708984, -17.350175857543945, -16.70176124572754, -16.0533447265625, -15.404928207397461, -14.756512641906738, -14.108097076416016, -13.459680557250977, -12.811264991760254, -12.162849426269531, -11.514432907104492, -10.86601734161377, -10.217601776123047, -9.569185256958008, -8.920769691467285, -8.272354125976562, -7.623935699462891, -6.97551965713501, -6.327103614807129, -5.678688049316406, -5.030272006988525, -4.3818559646606445, -3.7334401607513428, -3.085024356842041, -2.43660831451416, -1.7881923913955688, -1.1397764682769775, -0.49136054515838623, 0.15705537796020508, 0.8054714202880859, 1.4538872241973877, 2.1023030281066895, 2.7507190704345703, 3.399135112762451, 4.047551155090332, 4.695966720581055, 5.3443827629089355, 5.992798805236816, 6.641214370727539, 7.28963041305542, 7.938046455383301, 8.586462020874023, 9.234878540039062, 9.883294105529785, 10.531709671020508, 11.180126190185547, 11.82854175567627, 12.476957321166992, 13.125373840332031]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 7.0, 8.0, 9.0, 7.0, 6.0, 11.0, 21.0, 29.0, 22.0, 36.0, 30.0, 39.0, 42.0, 48.0, 60.0, 50.0, 58.0, 59.0, 56.0, 51.0, 46.0, 37.0, 28.0, 42.0, 32.0, 38.0, 29.0, 23.0, 16.0, 16.0, 13.0, 13.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.747722625732422, -9.450126647949219, -9.1525297164917, -8.85493278503418, -8.557336807250977, -8.259740829467773, -7.962143898010254, -7.664547443389893, -7.366950988769531, -7.06935453414917, -6.771758079528809, -6.474161624908447, -6.176565170288086, -5.878968715667725, -5.581372261047363, -5.283775806427002, -4.986179351806641, -4.688582897186279, -4.390986442565918, -4.093389987945557, -3.7957935333251953, -3.498197078704834, -3.2006006240844727, -2.9030041694641113, -2.60540771484375, -2.3078112602233887, -2.0102148056030273, -1.712618350982666, -1.4150218963623047, -1.1174254417419434, -0.819828987121582, -0.5222325325012207, -0.22463607788085938, 0.07296037673950195, 0.3705568313598633, 0.6681532859802246, 0.9657497406005859, 1.2633461952209473, 1.5609426498413086, 1.85853910446167, 2.1561355590820312, 2.4537320137023926, 2.751328468322754, 3.0489249229431152, 3.3465213775634766, 3.644117832183838, 3.941714286804199, 4.2393107414245605, 4.536907196044922, 4.834503650665283, 5.1321001052856445, 5.429696559906006, 5.727293014526367, 6.0248894691467285, 6.32248592376709, 6.620082378387451, 6.9176788330078125, 7.215275287628174, 7.512871742248535, 7.8104681968688965, 8.108064651489258, 8.405660629272461, 8.70325756072998, 9.0008544921875, 9.298450469970703]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 13.0, 11.0, 15.0, 25.0, 28.0, 24.0, 43.0, 53.0, 100.0, 98.0, 176.0, 356.0, 801.0, 2045.0, 7804.0, 69795.0, 4053531.0, 49648.0, 6770.0, 1774.0, 642.0, 249.0, 107.0, 55.0, 31.0, 26.0, 15.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73828125, -5.59637451171875, -5.4544677734375, -5.31256103515625, -5.170654296875, -5.02874755859375, -4.8868408203125, -4.74493408203125, -4.60302734375, -4.46112060546875, -4.3192138671875, -4.17730712890625, -4.035400390625, -3.89349365234375, -3.7515869140625, -3.60968017578125, -3.4677734375, -3.32586669921875, -3.1839599609375, -3.04205322265625, -2.900146484375, -2.75823974609375, -2.6163330078125, -2.47442626953125, -2.33251953125, -2.19061279296875, -2.0487060546875, -1.90679931640625, -1.764892578125, -1.62298583984375, -1.4810791015625, -1.33917236328125, -1.197265625, -1.05535888671875, -0.9134521484375, -0.77154541015625, -0.629638671875, -0.48773193359375, -0.3458251953125, -0.20391845703125, -0.06201171875, 0.07989501953125, 0.2218017578125, 0.36370849609375, 0.505615234375, 0.64752197265625, 0.7894287109375, 0.93133544921875, 1.0732421875, 1.21514892578125, 1.3570556640625, 1.49896240234375, 1.640869140625, 1.78277587890625, 1.9246826171875, 2.06658935546875, 2.20849609375, 2.35040283203125, 2.4923095703125, 2.63421630859375, 2.776123046875, 2.91802978515625, 3.0599365234375, 3.20184326171875, 3.34375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 7.0, 15.0, 17.0, 43.0, 63.0, 78.0, 124.0, 121.0, 140.0, 100.0, 89.0, 83.0, 46.0, 31.0, 22.0, 12.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3369140625, -1.3079910278320312, -1.2790679931640625, -1.2501449584960938, -1.221221923828125, -1.1922988891601562, -1.1633758544921875, -1.1344528198242188, -1.10552978515625, -1.0766067504882812, -1.0476837158203125, -1.0187606811523438, -0.989837646484375, -0.9609146118164062, -0.9319915771484375, -0.9030685424804688, -0.8741455078125, -0.8452224731445312, -0.8162994384765625, -0.7873764038085938, -0.758453369140625, -0.7295303344726562, -0.7006072998046875, -0.6716842651367188, -0.64276123046875, -0.6138381958007812, -0.5849151611328125, -0.5559921264648438, -0.527069091796875, -0.49814605712890625, -0.4692230224609375, -0.44029998779296875, -0.411376953125, -0.38245391845703125, -0.3535308837890625, -0.32460784912109375, -0.295684814453125, -0.26676177978515625, -0.2378387451171875, -0.20891571044921875, -0.17999267578125, -0.15106964111328125, -0.1221466064453125, -0.09322357177734375, -0.064300537109375, -0.03537750244140625, -0.0064544677734375, 0.02246856689453125, 0.0513916015625, 0.08031463623046875, 0.1092376708984375, 0.13816070556640625, 0.167083740234375, 0.19600677490234375, 0.2249298095703125, 0.25385284423828125, 0.28277587890625, 0.31169891357421875, 0.3406219482421875, 0.36954498291015625, 0.398468017578125, 0.42739105224609375, 0.4563140869140625, 0.48523712158203125, 0.51416015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 11.0, 29.0, 31.0, 64.0, 120.0, 190.0, 387.0, 1505.0, 464747.0, 3724303.0, 1859.0, 500.0, 229.0, 136.0, 73.0, 46.0, 20.0, 19.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.8482666015625, -9.509033203125, -9.1697998046875, -8.83056640625, -8.4913330078125, -8.152099609375, -7.8128662109375, -7.4736328125, -7.1343994140625, -6.795166015625, -6.4559326171875, -6.11669921875, -5.7774658203125, -5.438232421875, -5.0989990234375, -4.759765625, -4.4205322265625, -4.081298828125, -3.7420654296875, -3.40283203125, -3.0635986328125, -2.724365234375, -2.3851318359375, -2.0458984375, -1.7066650390625, -1.367431640625, -1.0281982421875, -0.68896484375, -0.3497314453125, -0.010498046875, 0.3287353515625, 0.66796875, 1.0072021484375, 1.346435546875, 1.6856689453125, 2.02490234375, 2.3641357421875, 2.703369140625, 3.0426025390625, 3.3818359375, 3.7210693359375, 4.060302734375, 4.3995361328125, 4.73876953125, 5.0780029296875, 5.417236328125, 5.7564697265625, 6.095703125, 6.4349365234375, 6.774169921875, 7.1134033203125, 7.45263671875, 7.7918701171875, 8.131103515625, 8.4703369140625, 8.8095703125, 9.1488037109375, 9.488037109375, 9.8272705078125, 10.16650390625, 10.5057373046875, 10.844970703125, 11.1842041015625, 11.5234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 38.0, 178.0, 3619.0, 198.0, 27.0, 17.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.456939697265625, -2.37091064453125, -2.284881591796875, -2.1988525390625, -2.112823486328125, -2.02679443359375, -1.940765380859375, -1.854736328125, -1.768707275390625, -1.68267822265625, -1.596649169921875, -1.5106201171875, -1.424591064453125, -1.33856201171875, -1.252532958984375, -1.16650390625, -1.080474853515625, -0.99444580078125, -0.908416748046875, -0.8223876953125, -0.736358642578125, -0.65032958984375, -0.564300537109375, -0.478271484375, -0.392242431640625, -0.30621337890625, -0.220184326171875, -0.1341552734375, -0.048126220703125, 0.03790283203125, 0.123931884765625, 0.2099609375, 0.295989990234375, 0.38201904296875, 0.468048095703125, 0.5540771484375, 0.640106201171875, 0.72613525390625, 0.812164306640625, 0.898193359375, 0.984222412109375, 1.07025146484375, 1.156280517578125, 1.2423095703125, 1.328338623046875, 1.41436767578125, 1.500396728515625, 1.58642578125, 1.672454833984375, 1.75848388671875, 1.844512939453125, 1.9305419921875, 2.016571044921875, 2.10260009765625, 2.188629150390625, 2.274658203125, 2.360687255859375, 2.44671630859375, 2.532745361328125, 2.6187744140625, 2.704803466796875, 2.79083251953125, 2.876861572265625, 2.962890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 9.0, 18.0, 71.0, 268.0, 404.0, 170.0, 35.0, 15.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.647691249847412, -6.404347896575928, -6.161004066467285, -5.917660713195801, -5.674317359924316, -5.430974006652832, -5.1876301765441895, -4.944286823272705, -4.7009429931640625, -4.457599639892578, -4.2142558097839355, -3.970912456512451, -3.727569103240967, -3.4842255115509033, -3.24088191986084, -2.9975385665893555, -2.754195213317871, -2.5108516216278076, -2.2675082683563232, -2.0241646766662598, -1.7808212041854858, -1.537477731704712, -1.2941341400146484, -1.0507906675338745, -0.8074471950531006, -0.5641037225723267, -0.32076019048690796, -0.07741665840148926, 0.16592681407928467, 0.4092702865600586, 0.6526138782501221, 0.895957350730896, 1.1393003463745117, 1.3826438188552856, 1.6259872913360596, 1.869330883026123, 2.1126742362976074, 2.356017827987671, 2.5993614196777344, 2.8427047729492188, 3.0860483646392822, 3.3293919563293457, 3.57273530960083, 3.8160789012908936, 4.059422492980957, 4.302765846252441, 4.546109199523926, 4.789453029632568, 5.032796382904053, 5.276139736175537, 5.51948356628418, 5.762826919555664, 6.006170272827148, 6.249513626098633, 6.492857456207275, 6.73620080947876, 6.979544639587402, 7.222887992858887, 7.466231822967529, 7.709575176239014, 7.952918529510498, 8.19626235961914, 8.439605712890625, 8.68294906616211, 8.926292419433594]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 7.0, 9.0, 26.0, 29.0, 41.0, 66.0, 57.0, 83.0, 96.0, 90.0, 103.0, 90.0, 77.0, 79.0, 46.0, 37.0, 28.0, 9.0, 15.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.543935775756836, -4.413177490234375, -4.282419204711914, -4.151660442352295, -4.020902156829834, -3.890143871307373, -3.759385347366333, -3.628626823425293, -3.497868537902832, -3.367110252380371, -3.236351728439331, -3.105593204498291, -2.97483491897583, -2.844076633453369, -2.713318109512329, -2.582559585571289, -2.451801300048828, -2.321043014526367, -2.190284490585327, -2.059525966644287, -1.9287676811218262, -1.7980092763900757, -1.6672508716583252, -1.5364924669265747, -1.4057340621948242, -1.2749756574630737, -1.1442172527313232, -1.0134588479995728, -0.8827004432678223, -0.7519420385360718, -0.6211836338043213, -0.4904252290725708, -0.3596673011779785, -0.22890889644622803, -0.09815049171447754, 0.03260791301727295, 0.16336631774902344, 0.2941247224807739, 0.4248831272125244, 0.5556415319442749, 0.6863999366760254, 0.8171583414077759, 0.9479167461395264, 1.0786751508712769, 1.2094335556030273, 1.3401919603347778, 1.4709503650665283, 1.6017087697982788, 1.7324671745300293, 1.8632255792617798, 1.9939839839935303, 2.1247425079345703, 2.2555007934570312, 2.386259078979492, 2.5170176029205322, 2.6477761268615723, 2.778534412384033, 2.909292697906494, 3.040051221847534, 3.170809745788574, 3.301568031311035, 3.432326316833496, 3.563084840774536, 3.693843364715576, 3.824601650238037]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 9.0, 6.0, 13.0, 12.0, 13.0, 24.0, 25.0, 52.0, 77.0, 147.0, 200.0, 464.0, 1115.0, 3689.0, 18796.0, 280381.0, 697221.0, 37510.0, 5818.0, 1615.0, 637.0, 298.0, 147.0, 97.0, 64.0, 35.0, 26.0, 18.0, 10.0, 8.0, 4.0, 7.0, 10.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.310546875, -3.200775146484375, -3.09100341796875, -2.981231689453125, -2.8714599609375, -2.761688232421875, -2.65191650390625, -2.542144775390625, -2.432373046875, -2.322601318359375, -2.21282958984375, -2.103057861328125, -1.9932861328125, -1.883514404296875, -1.77374267578125, -1.663970947265625, -1.55419921875, -1.444427490234375, -1.33465576171875, -1.224884033203125, -1.1151123046875, -1.005340576171875, -0.89556884765625, -0.785797119140625, -0.676025390625, -0.566253662109375, -0.45648193359375, -0.346710205078125, -0.2369384765625, -0.127166748046875, -0.01739501953125, 0.092376708984375, 0.2021484375, 0.311920166015625, 0.42169189453125, 0.531463623046875, 0.6412353515625, 0.751007080078125, 0.86077880859375, 0.970550537109375, 1.080322265625, 1.190093994140625, 1.29986572265625, 1.409637451171875, 1.5194091796875, 1.629180908203125, 1.73895263671875, 1.848724365234375, 1.95849609375, 2.068267822265625, 2.17803955078125, 2.287811279296875, 2.3975830078125, 2.507354736328125, 2.61712646484375, 2.726898193359375, 2.836669921875, 2.946441650390625, 3.05621337890625, 3.165985107421875, 3.2757568359375, 3.385528564453125, 3.49530029296875, 3.605072021484375, 3.71484375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 4.0, 12.0, 22.0, 41.0, 47.0, 68.0, 85.0, 109.0, 106.0, 108.0, 97.0, 80.0, 61.0, 65.0, 34.0, 23.0, 15.0, 8.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1962890625, -1.1702537536621094, -1.1442184448242188, -1.1181831359863281, -1.0921478271484375, -1.0661125183105469, -1.0400772094726562, -1.0140419006347656, -0.988006591796875, -0.9619712829589844, -0.9359359741210938, -0.9099006652832031, -0.8838653564453125, -0.8578300476074219, -0.8317947387695312, -0.8057594299316406, -0.77972412109375, -0.7536888122558594, -0.7276535034179688, -0.7016181945800781, -0.6755828857421875, -0.6495475769042969, -0.6235122680664062, -0.5974769592285156, -0.571441650390625, -0.5454063415527344, -0.5193710327148438, -0.4933357238769531, -0.4673004150390625, -0.4412651062011719, -0.41522979736328125, -0.3891944885253906, -0.3631591796875, -0.3371238708496094, -0.31108856201171875, -0.2850532531738281, -0.2590179443359375, -0.23298263549804688, -0.20694732666015625, -0.18091201782226562, -0.154876708984375, -0.12884140014648438, -0.10280609130859375, -0.07677078247070312, -0.0507354736328125, -0.024700164794921875, 0.00133514404296875, 0.027370452880859375, 0.05340576171875, 0.07944107055664062, 0.10547637939453125, 0.13151168823242188, 0.1575469970703125, 0.18358230590820312, 0.20961761474609375, 0.23565292358398438, 0.261688232421875, 0.2877235412597656, 0.31375885009765625, 0.3397941589355469, 0.3658294677734375, 0.3918647766113281, 0.41790008544921875, 0.4439353942871094, 0.469970703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 8.0, 10.0, 12.0, 13.0, 25.0, 40.0, 44.0, 81.0, 127.0, 272.0, 451.0, 1087.0, 3072.0, 12329.0, 86973.0, 779392.0, 141198.0, 16986.0, 3969.0, 1242.0, 521.0, 256.0, 176.0, 98.0, 38.0, 35.0, 23.0, 17.0, 10.0, 7.0, 6.0, 9.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.291015625, -3.20574951171875, -3.1204833984375, -3.03521728515625, -2.949951171875, -2.86468505859375, -2.7794189453125, -2.69415283203125, -2.60888671875, -2.52362060546875, -2.4383544921875, -2.35308837890625, -2.267822265625, -2.18255615234375, -2.0972900390625, -2.01202392578125, -1.9267578125, -1.84149169921875, -1.7562255859375, -1.67095947265625, -1.585693359375, -1.50042724609375, -1.4151611328125, -1.32989501953125, -1.24462890625, -1.15936279296875, -1.0740966796875, -0.98883056640625, -0.903564453125, -0.81829833984375, -0.7330322265625, -0.64776611328125, -0.5625, -0.47723388671875, -0.3919677734375, -0.30670166015625, -0.221435546875, -0.13616943359375, -0.0509033203125, 0.03436279296875, 0.11962890625, 0.20489501953125, 0.2901611328125, 0.37542724609375, 0.460693359375, 0.54595947265625, 0.6312255859375, 0.71649169921875, 0.8017578125, 0.88702392578125, 0.9722900390625, 1.05755615234375, 1.142822265625, 1.22808837890625, 1.3133544921875, 1.39862060546875, 1.48388671875, 1.56915283203125, 1.6544189453125, 1.73968505859375, 1.824951171875, 1.91021728515625, 1.9954833984375, 2.08074951171875, 2.166015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 10.0, 3.0, 8.0, 15.0, 18.0, 19.0, 24.0, 28.0, 41.0, 26.0, 58.0, 65.0, 76.0, 63.0, 73.0, 65.0, 80.0, 58.0, 44.0, 40.0, 36.0, 41.0, 27.0, 26.0, 10.0, 9.0, 8.0, 4.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.271484375, -3.188720703125, -3.10595703125, -3.023193359375, -2.9404296875, -2.857666015625, -2.77490234375, -2.692138671875, -2.609375, -2.526611328125, -2.44384765625, -2.361083984375, -2.2783203125, -2.195556640625, -2.11279296875, -2.030029296875, -1.947265625, -1.864501953125, -1.78173828125, -1.698974609375, -1.6162109375, -1.533447265625, -1.45068359375, -1.367919921875, -1.28515625, -1.202392578125, -1.11962890625, -1.036865234375, -0.9541015625, -0.871337890625, -0.78857421875, -0.705810546875, -0.623046875, -0.540283203125, -0.45751953125, -0.374755859375, -0.2919921875, -0.209228515625, -0.12646484375, -0.043701171875, 0.0390625, 0.121826171875, 0.20458984375, 0.287353515625, 0.3701171875, 0.452880859375, 0.53564453125, 0.618408203125, 0.701171875, 0.783935546875, 0.86669921875, 0.949462890625, 1.0322265625, 1.114990234375, 1.19775390625, 1.280517578125, 1.36328125, 1.446044921875, 1.52880859375, 1.611572265625, 1.6943359375, 1.777099609375, 1.85986328125, 1.942626953125, 2.025390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 10.0, 12.0, 10.0, 18.0, 27.0, 43.0, 51.0, 77.0, 120.0, 210.0, 302.0, 561.0, 1022.0, 2001.0, 4225.0, 10243.0, 31312.0, 198128.0, 681930.0, 84579.0, 19785.0, 7228.0, 3189.0, 1452.0, 789.0, 474.0, 259.0, 171.0, 91.0, 74.0, 50.0, 31.0, 27.0, 15.0, 10.0, 7.0, 9.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8251953125, -0.7970428466796875, -0.768890380859375, -0.7407379150390625, -0.71258544921875, -0.6844329833984375, -0.656280517578125, -0.6281280517578125, -0.5999755859375, -0.5718231201171875, -0.543670654296875, -0.5155181884765625, -0.48736572265625, -0.4592132568359375, -0.431060791015625, -0.4029083251953125, -0.374755859375, -0.3466033935546875, -0.318450927734375, -0.2902984619140625, -0.26214599609375, -0.2339935302734375, -0.205841064453125, -0.1776885986328125, -0.1495361328125, -0.1213836669921875, -0.093231201171875, -0.0650787353515625, -0.03692626953125, -0.0087738037109375, 0.019378662109375, 0.0475311279296875, 0.07568359375, 0.1038360595703125, 0.131988525390625, 0.1601409912109375, 0.18829345703125, 0.2164459228515625, 0.244598388671875, 0.2727508544921875, 0.3009033203125, 0.3290557861328125, 0.357208251953125, 0.3853607177734375, 0.41351318359375, 0.4416656494140625, 0.469818115234375, 0.4979705810546875, 0.526123046875, 0.5542755126953125, 0.582427978515625, 0.6105804443359375, 0.63873291015625, 0.6668853759765625, 0.695037841796875, 0.7231903076171875, 0.7513427734375, 0.7794952392578125, 0.807647705078125, 0.8358001708984375, 0.86395263671875, 0.8921051025390625, 0.920257568359375, 0.9484100341796875, 0.9765625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 10.0, 6.0, 7.0, 12.0, 9.0, 12.0, 29.0, 32.0, 42.0, 48.0, 50.0, 52.0, 91.0, 85.0, 110.0, 69.0, 69.0, 57.0, 47.0, 40.0, 19.0, 20.0, 19.0, 16.0, 6.0, 9.0, 8.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00013780593872070312, -0.00013336539268493652, -0.00012892484664916992, -0.00012448430061340332, -0.00012004375457763672, -0.00011560320854187012, -0.00011116266250610352, -0.00010672211647033691, -0.00010228157043457031, -9.784102439880371e-05, -9.340047836303711e-05, -8.895993232727051e-05, -8.45193862915039e-05, -8.00788402557373e-05, -7.56382942199707e-05, -7.11977481842041e-05, -6.67572021484375e-05, -6.23166561126709e-05, -5.78761100769043e-05, -5.3435564041137695e-05, -4.8995018005371094e-05, -4.455447196960449e-05, -4.011392593383789e-05, -3.567337989807129e-05, -3.123283386230469e-05, -2.6792287826538086e-05, -2.2351741790771484e-05, -1.7911195755004883e-05, -1.3470649719238281e-05, -9.03010368347168e-06, -4.589557647705078e-06, -1.4901161193847656e-07, 4.291534423828125e-06, 8.732080459594727e-06, 1.3172626495361328e-05, 1.761317253112793e-05, 2.205371856689453e-05, 2.6494264602661133e-05, 3.0934810638427734e-05, 3.5375356674194336e-05, 3.981590270996094e-05, 4.425644874572754e-05, 4.869699478149414e-05, 5.313754081726074e-05, 5.7578086853027344e-05, 6.201863288879395e-05, 6.645917892456055e-05, 7.089972496032715e-05, 7.534027099609375e-05, 7.978081703186035e-05, 8.422136306762695e-05, 8.866190910339355e-05, 9.310245513916016e-05, 9.754300117492676e-05, 0.00010198354721069336, 0.00010642409324645996, 0.00011086463928222656, 0.00011530518531799316, 0.00011974573135375977, 0.00012418627738952637, 0.00012862682342529297, 0.00013306736946105957, 0.00013750791549682617, 0.00014194846153259277, 0.00014638900756835938]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 2.0, 8.0, 11.0, 20.0, 25.0, 28.0, 44.0, 85.0, 137.0, 225.0, 430.0, 809.0, 1836.0, 5227.0, 21295.0, 322097.0, 652606.0, 32646.0, 6598.0, 2338.0, 960.0, 474.0, 237.0, 141.0, 101.0, 57.0, 38.0, 15.0, 21.0, 12.0, 5.0, 7.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8642578125, -1.81658935546875, -1.7689208984375, -1.72125244140625, -1.673583984375, -1.62591552734375, -1.5782470703125, -1.53057861328125, -1.48291015625, -1.43524169921875, -1.3875732421875, -1.33990478515625, -1.292236328125, -1.24456787109375, -1.1968994140625, -1.14923095703125, -1.1015625, -1.05389404296875, -1.0062255859375, -0.95855712890625, -0.910888671875, -0.86322021484375, -0.8155517578125, -0.76788330078125, -0.72021484375, -0.67254638671875, -0.6248779296875, -0.57720947265625, -0.529541015625, -0.48187255859375, -0.4342041015625, -0.38653564453125, -0.3388671875, -0.29119873046875, -0.2435302734375, -0.19586181640625, -0.148193359375, -0.10052490234375, -0.0528564453125, -0.00518798828125, 0.04248046875, 0.09014892578125, 0.1378173828125, 0.18548583984375, 0.233154296875, 0.28082275390625, 0.3284912109375, 0.37615966796875, 0.423828125, 0.47149658203125, 0.5191650390625, 0.56683349609375, 0.614501953125, 0.66217041015625, 0.7098388671875, 0.75750732421875, 0.80517578125, 0.85284423828125, 0.9005126953125, 0.94818115234375, 0.995849609375, 1.04351806640625, 1.0911865234375, 1.13885498046875, 1.1865234375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 6.0, 9.0, 6.0, 7.0, 15.0, 28.0, 39.0, 65.0, 88.0, 161.0, 178.0, 162.0, 100.0, 44.0, 29.0, 12.0, 15.0, 8.0, 7.0, 9.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.33203125, -1.2973098754882812, -1.2625885009765625, -1.2278671264648438, -1.193145751953125, -1.1584243774414062, -1.1237030029296875, -1.0889816284179688, -1.05426025390625, -1.0195388793945312, -0.9848175048828125, -0.9500961303710938, -0.915374755859375, -0.8806533813476562, -0.8459320068359375, -0.8112106323242188, -0.7764892578125, -0.7417678833007812, -0.7070465087890625, -0.6723251342773438, -0.637603759765625, -0.6028823852539062, -0.5681610107421875, -0.5334396362304688, -0.49871826171875, -0.46399688720703125, -0.4292755126953125, -0.39455413818359375, -0.359832763671875, -0.32511138916015625, -0.2903900146484375, -0.25566864013671875, -0.220947265625, -0.18622589111328125, -0.1515045166015625, -0.11678314208984375, -0.082061767578125, -0.04734039306640625, -0.0126190185546875, 0.02210235595703125, 0.05682373046875, 0.09154510498046875, 0.1262664794921875, 0.16098785400390625, 0.195709228515625, 0.23043060302734375, 0.2651519775390625, 0.29987335205078125, 0.3345947265625, 0.36931610107421875, 0.4040374755859375, 0.43875885009765625, 0.473480224609375, 0.5082015991210938, 0.5429229736328125, 0.5776443481445312, 0.61236572265625, 0.6470870971679688, 0.6818084716796875, 0.7165298461914062, 0.751251220703125, 0.7859725952148438, 0.8206939697265625, 0.8554153442382812, 0.89013671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 12.0, 15.0, 41.0, 121.0, 283.0, 303.0, 135.0, 50.0, 24.0, 6.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.609941482543945, -28.949974060058594, -28.29000473022461, -27.630035400390625, -26.970067977905273, -26.310100555419922, -25.650131225585938, -24.990161895751953, -24.3301944732666, -23.67022705078125, -23.010257720947266, -22.35028839111328, -21.69032096862793, -21.030353546142578, -20.370384216308594, -19.71041488647461, -19.050447463989258, -18.390480041503906, -17.730510711669922, -17.070541381835938, -16.410573959350586, -15.750605583190918, -15.09063720703125, -14.430668830871582, -13.770700454711914, -13.110732078552246, -12.450763702392578, -11.79079532623291, -11.130826950073242, -10.470858573913574, -9.810890197753906, -9.150921821594238, -8.490952491760254, -7.830984115600586, -7.171015739440918, -6.51104736328125, -5.851078987121582, -5.191110610961914, -4.531142234802246, -3.871173858642578, -3.21120548248291, -2.551237106323242, -1.8912687301635742, -1.2313003540039062, -0.5713319778442383, 0.08863639831542969, 0.7486047744750977, 1.4085731506347656, 2.0685415267944336, 2.7285099029541016, 3.3884782791137695, 4.0484466552734375, 4.7084150314331055, 5.368383407592773, 6.028351783752441, 6.688320159912109, 7.348288536071777, 8.008256912231445, 8.668225288391113, 9.328193664550781, 9.98816204071045, 10.648130416870117, 11.308098793029785, 11.968067169189453, 12.628035545349121]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 8.0, 12.0, 6.0, 12.0, 16.0, 11.0, 12.0, 20.0, 24.0, 31.0, 39.0, 34.0, 43.0, 45.0, 37.0, 49.0, 56.0, 48.0, 41.0, 54.0, 39.0, 42.0, 31.0, 48.0, 39.0, 33.0, 20.0, 32.0, 17.0, 15.0, 13.0, 15.0, 9.0, 10.0, 8.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.417352676391602, -11.057940483093262, -10.698528289794922, -10.339116096496582, -9.979703903198242, -9.620291709899902, -9.260879516601562, -8.901466369628906, -8.542055130004883, -8.182642936706543, -7.823230743408203, -7.463818550109863, -7.104406356811523, -6.744994163513184, -6.3855814933776855, -6.026169300079346, -5.666756629943848, -5.307344436645508, -4.947932243347168, -4.588520050048828, -4.229107856750488, -3.8696954250335693, -3.5102829933166504, -3.1508708000183105, -2.7914586067199707, -2.432046413421631, -2.072634220123291, -1.713221788406372, -1.3538095951080322, -0.9943974018096924, -0.6349849700927734, -0.2755727767944336, 0.08383941650390625, 0.44325166940689087, 0.8026639223098755, 1.1620762348175049, 1.5214884281158447, 1.8809006214141846, 2.2403130531311035, 2.5997252464294434, 2.959137439727783, 3.318549633026123, 3.677961826324463, 4.037374496459961, 4.396786689758301, 4.756198883056641, 5.1156110763549805, 5.47502326965332, 5.83443546295166, 6.19384765625, 6.55325984954834, 6.91267204284668, 7.2720842361450195, 7.631496429443359, 7.990909099578857, 8.350320816040039, 8.709733963012695, 9.069146156311035, 9.428558349609375, 9.787970542907715, 10.147382736206055, 10.506794929504395, 10.866207122802734, 11.22562026977539, 11.585031509399414]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 7.0, 16.0, 17.0, 15.0, 25.0, 37.0, 60.0, 69.0, 127.0, 188.0, 347.0, 702.0, 1724.0, 6845.0, 49182.0, 3996598.0, 123314.0, 11210.0, 2412.0, 776.0, 329.0, 126.0, 68.0, 27.0, 18.0, 13.0, 6.0, 1.0, 4.0, 0.0, 3.0], "bins": [-8.5390625, -8.363525390625, -8.18798828125, -8.012451171875, -7.8369140625, -7.661376953125, -7.48583984375, -7.310302734375, -7.134765625, -6.959228515625, -6.78369140625, -6.608154296875, -6.4326171875, -6.257080078125, -6.08154296875, -5.906005859375, -5.73046875, -5.554931640625, -5.37939453125, -5.203857421875, -5.0283203125, -4.852783203125, -4.67724609375, -4.501708984375, -4.326171875, -4.150634765625, -3.97509765625, -3.799560546875, -3.6240234375, -3.448486328125, -3.27294921875, -3.097412109375, -2.921875, -2.746337890625, -2.57080078125, -2.395263671875, -2.2197265625, -2.044189453125, -1.86865234375, -1.693115234375, -1.517578125, -1.342041015625, -1.16650390625, -0.990966796875, -0.8154296875, -0.639892578125, -0.46435546875, -0.288818359375, -0.11328125, 0.062255859375, 0.23779296875, 0.413330078125, 0.5888671875, 0.764404296875, 0.93994140625, 1.115478515625, 1.291015625, 1.466552734375, 1.64208984375, 1.817626953125, 1.9931640625, 2.168701171875, 2.34423828125, 2.519775390625, 2.6953125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 9.0, 13.0, 18.0, 34.0, 47.0, 45.0, 75.0, 106.0, 83.0, 102.0, 99.0, 86.0, 77.0, 65.0, 49.0, 36.0, 22.0, 13.0, 11.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0], "bins": [-1.283203125, -1.2567710876464844, -1.2303390502929688, -1.2039070129394531, -1.1774749755859375, -1.1510429382324219, -1.1246109008789062, -1.0981788635253906, -1.071746826171875, -1.0453147888183594, -1.0188827514648438, -0.9924507141113281, -0.9660186767578125, -0.9395866394042969, -0.9131546020507812, -0.8867225646972656, -0.86029052734375, -0.8338584899902344, -0.8074264526367188, -0.7809944152832031, -0.7545623779296875, -0.7281303405761719, -0.7016983032226562, -0.6752662658691406, -0.648834228515625, -0.6224021911621094, -0.5959701538085938, -0.5695381164550781, -0.5431060791015625, -0.5166740417480469, -0.49024200439453125, -0.4638099670410156, -0.4373779296875, -0.4109458923339844, -0.38451385498046875, -0.3580818176269531, -0.3316497802734375, -0.3052177429199219, -0.27878570556640625, -0.2523536682128906, -0.225921630859375, -0.19948959350585938, -0.17305755615234375, -0.14662551879882812, -0.1201934814453125, -0.09376144409179688, -0.06732940673828125, -0.040897369384765625, -0.01446533203125, 0.011966705322265625, 0.03839874267578125, 0.06483078002929688, 0.0912628173828125, 0.11769485473632812, 0.14412689208984375, 0.17055892944335938, 0.196990966796875, 0.22342300415039062, 0.24985504150390625, 0.2762870788574219, 0.3027191162109375, 0.3291511535644531, 0.35558319091796875, 0.3820152282714844, 0.408447265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 4.0, 9.0, 21.0, 14.0, 32.0, 34.0, 64.0, 90.0, 149.0, 366.0, 1354.0, 9082.0, 4099535.0, 79038.0, 3487.0, 600.0, 205.0, 83.0, 38.0, 25.0, 19.0, 14.0, 11.0, 12.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.78021240234375, -15.4197998046875, -15.05938720703125, -14.698974609375, -14.33856201171875, -13.9781494140625, -13.61773681640625, -13.25732421875, -12.89691162109375, -12.5364990234375, -12.17608642578125, -11.815673828125, -11.45526123046875, -11.0948486328125, -10.73443603515625, -10.3740234375, -10.01361083984375, -9.6531982421875, -9.29278564453125, -8.932373046875, -8.57196044921875, -8.2115478515625, -7.85113525390625, -7.49072265625, -7.13031005859375, -6.7698974609375, -6.40948486328125, -6.049072265625, -5.68865966796875, -5.3282470703125, -4.96783447265625, -4.607421875, -4.24700927734375, -3.8865966796875, -3.52618408203125, -3.165771484375, -2.80535888671875, -2.4449462890625, -2.08453369140625, -1.72412109375, -1.36370849609375, -1.0032958984375, -0.64288330078125, -0.282470703125, 0.07794189453125, 0.4383544921875, 0.79876708984375, 1.1591796875, 1.51959228515625, 1.8800048828125, 2.24041748046875, 2.600830078125, 2.96124267578125, 3.3216552734375, 3.68206787109375, 4.04248046875, 4.40289306640625, 4.7633056640625, 5.12371826171875, 5.484130859375, 5.84454345703125, 6.2049560546875, 6.56536865234375, 6.92578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 13.0, 26.0, 58.0, 160.0, 2984.0, 664.0, 98.0, 27.0, 17.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.34765625, -5.2423553466796875, -5.137054443359375, -5.0317535400390625, -4.92645263671875, -4.8211517333984375, -4.715850830078125, -4.6105499267578125, -4.5052490234375, -4.3999481201171875, -4.294647216796875, -4.1893463134765625, -4.08404541015625, -3.9787445068359375, -3.873443603515625, -3.7681427001953125, -3.662841796875, -3.5575408935546875, -3.452239990234375, -3.3469390869140625, -3.24163818359375, -3.1363372802734375, -3.031036376953125, -2.9257354736328125, -2.8204345703125, -2.7151336669921875, -2.609832763671875, -2.5045318603515625, -2.39923095703125, -2.2939300537109375, -2.188629150390625, -2.0833282470703125, -1.97802734375, -1.8727264404296875, -1.767425537109375, -1.6621246337890625, -1.55682373046875, -1.4515228271484375, -1.346221923828125, -1.2409210205078125, -1.1356201171875, -1.0303192138671875, -0.925018310546875, -0.8197174072265625, -0.71441650390625, -0.6091156005859375, -0.503814697265625, -0.3985137939453125, -0.293212890625, -0.1879119873046875, -0.082611083984375, 0.0226898193359375, 0.12799072265625, 0.2332916259765625, 0.338592529296875, 0.4438934326171875, 0.5491943359375, 0.6544952392578125, 0.759796142578125, 0.8650970458984375, 0.97039794921875, 1.0756988525390625, 1.180999755859375, 1.2863006591796875, 1.3916015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 13.0, 16.0, 27.0, 77.0, 185.0, 294.0, 203.0, 102.0, 37.0, 24.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.662993431091309, -11.335687637329102, -11.008380889892578, -10.681075096130371, -10.353768348693848, -10.02646255493164, -9.699155807495117, -9.37185001373291, -9.044544219970703, -8.717238426208496, -8.389931678771973, -8.062625885009766, -7.735319137573242, -7.408013343811035, -7.08070707321167, -6.753400802612305, -6.426094055175781, -6.098787784576416, -5.771481513977051, -5.4441752433776855, -5.11686897277832, -4.789563179016113, -4.462256908416748, -4.134950637817383, -3.8076443672180176, -3.4803380966186523, -3.153031826019287, -2.825725793838501, -2.4984195232391357, -2.1711132526397705, -1.8438071012496948, -1.5165009498596191, -1.1891937255859375, -0.861887514591217, -0.5345813035964966, -0.20727509260177612, 0.12003111839294434, 0.44733738899230957, 0.7746435403823853, 1.101949691772461, 1.4292559623718262, 1.7565622329711914, 2.0838685035705566, 2.4111745357513428, 2.738480806350708, 3.0657870769500732, 3.3930931091308594, 3.7203993797302246, 4.04770565032959, 4.375011920928955, 4.70231819152832, 5.0296244621276855, 5.356930732727051, 5.684236526489258, 6.011542797088623, 6.338849067687988, 6.6661553382873535, 6.993461608886719, 7.320767879486084, 7.648074150085449, 7.975379943847656, 8.30268669128418, 8.629992485046387, 8.957298278808594, 9.284605026245117]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 14.0, 40.0, 59.0, 71.0, 103.0, 127.0, 154.0, 126.0, 114.0, 83.0, 51.0, 27.0, 18.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.98848819732666, -12.605815887451172, -12.223142623901367, -11.840470314025879, -11.457797050476074, -11.075124740600586, -10.692451477050781, -10.309779167175293, -9.927106857299805, -9.544434547424316, -9.161761283874512, -8.779088973999023, -8.396415710449219, -8.01374340057373, -7.631070613861084, -7.2483978271484375, -6.865724563598633, -6.483051776885986, -6.10037899017334, -5.717706680297852, -5.335033416748047, -4.952361106872559, -4.569688320159912, -4.187015533447266, -3.804342746734619, -3.4216699600219727, -3.038997173309326, -2.656324625015259, -2.2736518383026123, -1.8909790515899658, -1.5083065032958984, -1.125633716583252, -0.7429599761962891, -0.36028724908828735, 0.022385478019714355, 0.4050581455230713, 0.7877309322357178, 1.1704037189483643, 1.5530762672424316, 1.9357490539550781, 2.3184218406677246, 2.701094627380371, 3.0837674140930176, 3.466439962387085, 3.8491127490997314, 4.231785774230957, 4.614458084106445, 4.997130870819092, 5.379803657531738, 5.762476444244385, 6.145149230957031, 6.5278215408325195, 6.910494804382324, 7.2931671142578125, 7.675839900970459, 8.058512687683105, 8.441184997558594, 8.823857307434082, 9.206530570983887, 9.589202880859375, 9.97187614440918, 10.354548454284668, 10.737220764160156, 11.119894027709961, 11.502567291259766]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 7.0, 14.0, 8.0, 16.0, 22.0, 24.0, 45.0, 61.0, 107.0, 158.0, 238.0, 460.0, 946.0, 2851.0, 13529.0, 109013.0, 756723.0, 142450.0, 16247.0, 3388.0, 1077.0, 443.0, 238.0, 132.0, 99.0, 69.0, 51.0, 35.0, 22.0, 11.0, 8.0, 14.0, 10.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.853515625, -2.7569580078125, -2.660400390625, -2.5638427734375, -2.46728515625, -2.3707275390625, -2.274169921875, -2.1776123046875, -2.0810546875, -1.9844970703125, -1.887939453125, -1.7913818359375, -1.69482421875, -1.5982666015625, -1.501708984375, -1.4051513671875, -1.30859375, -1.2120361328125, -1.115478515625, -1.0189208984375, -0.92236328125, -0.8258056640625, -0.729248046875, -0.6326904296875, -0.5361328125, -0.4395751953125, -0.343017578125, -0.2464599609375, -0.14990234375, -0.0533447265625, 0.043212890625, 0.1397705078125, 0.236328125, 0.3328857421875, 0.429443359375, 0.5260009765625, 0.62255859375, 0.7191162109375, 0.815673828125, 0.9122314453125, 1.0087890625, 1.1053466796875, 1.201904296875, 1.2984619140625, 1.39501953125, 1.4915771484375, 1.588134765625, 1.6846923828125, 1.78125, 1.8778076171875, 1.974365234375, 2.0709228515625, 2.16748046875, 2.2640380859375, 2.360595703125, 2.4571533203125, 2.5537109375, 2.6502685546875, 2.746826171875, 2.8433837890625, 2.93994140625, 3.0364990234375, 3.133056640625, 3.2296142578125, 3.326171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 16.0, 39.0, 69.0, 83.0, 96.0, 144.0, 135.0, 110.0, 110.0, 82.0, 57.0, 28.0, 9.0, 14.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.630859375, -1.5941162109375, -1.557373046875, -1.5206298828125, -1.48388671875, -1.4471435546875, -1.410400390625, -1.3736572265625, -1.3369140625, -1.3001708984375, -1.263427734375, -1.2266845703125, -1.18994140625, -1.1531982421875, -1.116455078125, -1.0797119140625, -1.04296875, -1.0062255859375, -0.969482421875, -0.9327392578125, -0.89599609375, -0.8592529296875, -0.822509765625, -0.7857666015625, -0.7490234375, -0.7122802734375, -0.675537109375, -0.6387939453125, -0.60205078125, -0.5653076171875, -0.528564453125, -0.4918212890625, -0.455078125, -0.4183349609375, -0.381591796875, -0.3448486328125, -0.30810546875, -0.2713623046875, -0.234619140625, -0.1978759765625, -0.1611328125, -0.1243896484375, -0.087646484375, -0.0509033203125, -0.01416015625, 0.0225830078125, 0.059326171875, 0.0960693359375, 0.1328125, 0.1695556640625, 0.206298828125, 0.2430419921875, 0.27978515625, 0.3165283203125, 0.353271484375, 0.3900146484375, 0.4267578125, 0.4635009765625, 0.500244140625, 0.5369873046875, 0.57373046875, 0.6104736328125, 0.647216796875, 0.6839599609375, 0.720703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 6.0, 5.0, 6.0, 8.0, 7.0, 14.0, 15.0, 24.0, 21.0, 30.0, 38.0, 48.0, 113.0, 163.0, 317.0, 605.0, 1263.0, 2622.0, 5878.0, 14161.0, 37566.0, 118598.0, 417280.0, 316550.0, 85016.0, 27894.0, 11026.0, 4776.0, 2123.0, 1061.0, 511.0, 286.0, 165.0, 104.0, 67.0, 38.0, 29.0, 24.0, 27.0, 19.0, 10.0, 12.0, 9.0, 8.0, 3.0, 6.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.27734375, -1.2384796142578125, -1.199615478515625, -1.1607513427734375, -1.12188720703125, -1.0830230712890625, -1.044158935546875, -1.0052947998046875, -0.9664306640625, -0.9275665283203125, -0.888702392578125, -0.8498382568359375, -0.81097412109375, -0.7721099853515625, -0.733245849609375, -0.6943817138671875, -0.655517578125, -0.6166534423828125, -0.577789306640625, -0.5389251708984375, -0.50006103515625, -0.4611968994140625, -0.422332763671875, -0.3834686279296875, -0.3446044921875, -0.3057403564453125, -0.266876220703125, -0.2280120849609375, -0.18914794921875, -0.1502838134765625, -0.111419677734375, -0.0725555419921875, -0.03369140625, 0.0051727294921875, 0.044036865234375, 0.0829010009765625, 0.12176513671875, 0.1606292724609375, 0.199493408203125, 0.2383575439453125, 0.2772216796875, 0.3160858154296875, 0.354949951171875, 0.3938140869140625, 0.43267822265625, 0.4715423583984375, 0.510406494140625, 0.5492706298828125, 0.588134765625, 0.6269989013671875, 0.665863037109375, 0.7047271728515625, 0.74359130859375, 0.7824554443359375, 0.821319580078125, 0.8601837158203125, 0.8990478515625, 0.9379119873046875, 0.976776123046875, 1.0156402587890625, 1.05450439453125, 1.0933685302734375, 1.132232666015625, 1.1710968017578125, 1.2099609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 3.0, 5.0, 7.0, 6.0, 13.0, 18.0, 16.0, 36.0, 24.0, 20.0, 24.0, 32.0, 29.0, 46.0, 45.0, 40.0, 47.0, 45.0, 47.0, 52.0, 49.0, 48.0, 38.0, 51.0, 40.0, 28.0, 23.0, 27.0, 21.0, 22.0, 16.0, 14.0, 17.0, 7.0, 7.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83203125, -1.7748565673828125, -1.717681884765625, -1.6605072021484375, -1.60333251953125, -1.5461578369140625, -1.488983154296875, -1.4318084716796875, -1.3746337890625, -1.3174591064453125, -1.260284423828125, -1.2031097412109375, -1.14593505859375, -1.0887603759765625, -1.031585693359375, -0.9744110107421875, -0.917236328125, -0.8600616455078125, -0.802886962890625, -0.7457122802734375, -0.68853759765625, -0.6313629150390625, -0.574188232421875, -0.5170135498046875, -0.4598388671875, -0.4026641845703125, -0.345489501953125, -0.2883148193359375, -0.23114013671875, -0.1739654541015625, -0.116790771484375, -0.0596160888671875, -0.00244140625, 0.0547332763671875, 0.111907958984375, 0.1690826416015625, 0.22625732421875, 0.2834320068359375, 0.340606689453125, 0.3977813720703125, 0.4549560546875, 0.5121307373046875, 0.569305419921875, 0.6264801025390625, 0.68365478515625, 0.7408294677734375, 0.798004150390625, 0.8551788330078125, 0.912353515625, 0.9695281982421875, 1.026702880859375, 1.0838775634765625, 1.14105224609375, 1.1982269287109375, 1.255401611328125, 1.3125762939453125, 1.3697509765625, 1.4269256591796875, 1.484100341796875, 1.5412750244140625, 1.59844970703125, 1.6556243896484375, 1.712799072265625, 1.7699737548828125, 1.8271484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 8.0, 3.0, 9.0, 15.0, 19.0, 18.0, 25.0, 40.0, 56.0, 94.0, 150.0, 215.0, 354.0, 663.0, 1215.0, 2788.0, 6446.0, 18023.0, 71780.0, 481864.0, 381435.0, 57066.0, 15452.0, 5651.0, 2500.0, 1136.0, 617.0, 314.0, 206.0, 107.0, 73.0, 72.0, 44.0, 37.0, 13.0, 15.0, 10.0, 7.0, 6.0, 3.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79345703125, -0.7660293579101562, -0.7386016845703125, -0.7111740112304688, -0.683746337890625, -0.6563186645507812, -0.6288909912109375, -0.6014633178710938, -0.57403564453125, -0.5466079711914062, -0.5191802978515625, -0.49175262451171875, -0.464324951171875, -0.43689727783203125, -0.4094696044921875, -0.38204193115234375, -0.3546142578125, -0.32718658447265625, -0.2997589111328125, -0.27233123779296875, -0.244903564453125, -0.21747589111328125, -0.1900482177734375, -0.16262054443359375, -0.13519287109375, -0.10776519775390625, -0.0803375244140625, -0.05290985107421875, -0.025482177734375, 0.00194549560546875, 0.0293731689453125, 0.05680084228515625, 0.084228515625, 0.11165618896484375, 0.1390838623046875, 0.16651153564453125, 0.193939208984375, 0.22136688232421875, 0.2487945556640625, 0.27622222900390625, 0.30364990234375, 0.33107757568359375, 0.3585052490234375, 0.38593292236328125, 0.413360595703125, 0.44078826904296875, 0.4682159423828125, 0.49564361572265625, 0.5230712890625, 0.5504989624023438, 0.5779266357421875, 0.6053543090820312, 0.632781982421875, 0.6602096557617188, 0.6876373291015625, 0.7150650024414062, 0.74249267578125, 0.7699203491210938, 0.7973480224609375, 0.8247756958007812, 0.852203369140625, 0.8796310424804688, 0.9070587158203125, 0.9344863891601562, 0.9619140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 12.0, 9.0, 31.0, 32.0, 60.0, 88.0, 206.0, 246.0, 135.0, 57.0, 49.0, 19.0, 22.0, 15.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004286766052246094, -0.000416487455368042, -0.0004042983055114746, -0.0003921091556549072, -0.00037992000579833984, -0.00036773085594177246, -0.0003555417060852051, -0.0003433525562286377, -0.0003311634063720703, -0.00031897425651550293, -0.00030678510665893555, -0.00029459595680236816, -0.0002824068069458008, -0.0002702176570892334, -0.000258028507232666, -0.00024583935737609863, -0.00023365020751953125, -0.00022146105766296387, -0.00020927190780639648, -0.0001970827579498291, -0.00018489360809326172, -0.00017270445823669434, -0.00016051530838012695, -0.00014832615852355957, -0.0001361370086669922, -0.0001239478588104248, -0.00011175870895385742, -9.956955909729004e-05, -8.738040924072266e-05, -7.519125938415527e-05, -6.300210952758789e-05, -5.081295967102051e-05, -3.8623809814453125e-05, -2.6434659957885742e-05, -1.424551010131836e-05, -2.0563602447509766e-06, 1.0132789611816406e-05, 2.232193946838379e-05, 3.451108932495117e-05, 4.6700239181518555e-05, 5.888938903808594e-05, 7.107853889465332e-05, 8.32676887512207e-05, 9.545683860778809e-05, 0.00010764598846435547, 0.00011983513832092285, 0.00013202428817749023, 0.00014421343803405762, 0.000156402587890625, 0.00016859173774719238, 0.00018078088760375977, 0.00019297003746032715, 0.00020515918731689453, 0.00021734833717346191, 0.0002295374870300293, 0.00024172663688659668, 0.00025391578674316406, 0.00026610493659973145, 0.00027829408645629883, 0.0002904832363128662, 0.0003026723861694336, 0.000314861536026001, 0.00032705068588256836, 0.00033923983573913574, 0.0003514289855957031]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 5.0, 15.0, 24.0, 42.0, 56.0, 84.0, 185.0, 416.0, 843.0, 2026.0, 5914.0, 25157.0, 253649.0, 686537.0, 57966.0, 10190.0, 3147.0, 1250.0, 511.0, 253.0, 126.0, 56.0, 34.0, 23.0, 15.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.00738525390625, -0.9639892578125, -0.92059326171875, -0.877197265625, -0.83380126953125, -0.7904052734375, -0.74700927734375, -0.70361328125, -0.66021728515625, -0.6168212890625, -0.57342529296875, -0.530029296875, -0.48663330078125, -0.4432373046875, -0.39984130859375, -0.3564453125, -0.31304931640625, -0.2696533203125, -0.22625732421875, -0.182861328125, -0.13946533203125, -0.0960693359375, -0.05267333984375, -0.00927734375, 0.03411865234375, 0.0775146484375, 0.12091064453125, 0.164306640625, 0.20770263671875, 0.2510986328125, 0.29449462890625, 0.337890625, 0.38128662109375, 0.4246826171875, 0.46807861328125, 0.511474609375, 0.55487060546875, 0.5982666015625, 0.64166259765625, 0.68505859375, 0.72845458984375, 0.7718505859375, 0.81524658203125, 0.858642578125, 0.90203857421875, 0.9454345703125, 0.98883056640625, 1.0322265625, 1.07562255859375, 1.1190185546875, 1.16241455078125, 1.205810546875, 1.24920654296875, 1.2926025390625, 1.33599853515625, 1.37939453125, 1.42279052734375, 1.4661865234375, 1.50958251953125, 1.552978515625, 1.59637451171875, 1.6397705078125, 1.68316650390625, 1.7265625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 7.0, 10.0, 12.0, 27.0, 36.0, 67.0, 80.0, 109.0, 144.0, 119.0, 100.0, 82.0, 61.0, 46.0, 25.0, 17.0, 12.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88623046875, -0.8558883666992188, -0.8255462646484375, -0.7952041625976562, -0.764862060546875, -0.7345199584960938, -0.7041778564453125, -0.6738357543945312, -0.64349365234375, -0.6131515502929688, -0.5828094482421875, -0.5524673461914062, -0.522125244140625, -0.49178314208984375, -0.4614410400390625, -0.43109893798828125, -0.4007568359375, -0.37041473388671875, -0.3400726318359375, -0.30973052978515625, -0.279388427734375, -0.24904632568359375, -0.2187042236328125, -0.18836212158203125, -0.15802001953125, -0.12767791748046875, -0.0973358154296875, -0.06699371337890625, -0.036651611328125, -0.00630950927734375, 0.0240325927734375, 0.05437469482421875, 0.084716796875, 0.11505889892578125, 0.1454010009765625, 0.17574310302734375, 0.206085205078125, 0.23642730712890625, 0.2667694091796875, 0.29711151123046875, 0.32745361328125, 0.35779571533203125, 0.3881378173828125, 0.41847991943359375, 0.448822021484375, 0.47916412353515625, 0.5095062255859375, 0.5398483276367188, 0.5701904296875, 0.6005325317382812, 0.6308746337890625, 0.6612167358398438, 0.691558837890625, 0.7219009399414062, 0.7522430419921875, 0.7825851440429688, 0.81292724609375, 0.8432693481445312, 0.8736114501953125, 0.9039535522460938, 0.934295654296875, 0.9646377563476562, 0.9949798583984375, 1.0253219604492188, 1.0556640625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 25.0, 68.0, 235.0, 440.0, 179.0, 43.0, 16.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.55865478515625, -44.59474563598633, -43.630836486816406, -42.666927337646484, -41.70301818847656, -40.73910903930664, -39.77519989013672, -38.8112907409668, -37.847381591796875, -36.88347244262695, -35.91956329345703, -34.95565414428711, -33.99174499511719, -33.027835845947266, -32.063926696777344, -31.100017547607422, -30.1361083984375, -29.172199249267578, -28.208290100097656, -27.244380950927734, -26.280471801757812, -25.31656265258789, -24.35265350341797, -23.388744354248047, -22.424835205078125, -21.460926055908203, -20.49701690673828, -19.53310775756836, -18.569198608398438, -17.605289459228516, -16.641380310058594, -15.677471160888672, -14.713560104370117, -13.749650955200195, -12.785741806030273, -11.821832656860352, -10.85792350769043, -9.894014358520508, -8.930105209350586, -7.966196060180664, -7.002286911010742, -6.03837776184082, -5.074468612670898, -4.110559463500977, -3.1466503143310547, -2.182741165161133, -1.218832015991211, -0.25492286682128906, 0.7089862823486328, 1.6728954315185547, 2.6368045806884766, 3.6007137298583984, 4.56462287902832, 5.528532028198242, 6.492441177368164, 7.456350326538086, 8.420259475708008, 9.38416862487793, 10.348077774047852, 11.311986923217773, 12.275896072387695, 13.239805221557617, 14.203714370727539, 15.167623519897461, 16.131532669067383]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 7.0, 6.0, 8.0, 17.0, 22.0, 19.0, 16.0, 21.0, 24.0, 33.0, 43.0, 28.0, 48.0, 47.0, 40.0, 35.0, 44.0, 46.0, 59.0, 40.0, 56.0, 38.0, 44.0, 32.0, 38.0, 29.0, 30.0, 31.0, 20.0, 9.0, 13.0, 13.0, 12.0, 4.0, 4.0, 7.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.683826446533203, -11.341886520385742, -10.999945640563965, -10.658005714416504, -10.316064834594727, -9.974124908447266, -9.632184982299805, -9.290244102478027, -8.94830322265625, -8.606363296508789, -8.264422416687012, -7.922482490539551, -7.580541610717773, -7.2386016845703125, -6.896661281585693, -6.554720878601074, -6.212780952453613, -5.870840549468994, -5.528900146484375, -5.186960220336914, -4.845019340515137, -4.503079414367676, -4.161139011383057, -3.8191986083984375, -3.4772582054138184, -3.135317802429199, -2.79337739944458, -2.45143723487854, -2.109496831893921, -1.7675564289093018, -1.4256162643432617, -1.0836758613586426, -0.7417354583740234, -0.3997951149940491, -0.05785477161407471, 0.2840855121612549, 0.626025915145874, 0.9679663181304932, 1.3099064826965332, 1.6518468856811523, 1.9937872886657715, 2.3357276916503906, 2.6776680946350098, 3.01960825920105, 3.361548662185669, 3.703489065170288, 4.045429229736328, 4.387369632720947, 4.729310035705566, 5.0712504386901855, 5.413190841674805, 5.755130767822266, 6.097071647644043, 6.439011573791504, 6.780951976776123, 7.122892379760742, 7.464832782745361, 7.8067731857299805, 8.148713111877441, 8.490653991699219, 8.83259391784668, 9.174534797668457, 9.516474723815918, 9.858415603637695, 10.200355529785156]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 7.0, 7.0, 12.0, 14.0, 17.0, 27.0, 29.0, 53.0, 79.0, 115.0, 260.0, 594.0, 2170.0, 10669.0, 196800.0, 3957790.0, 20591.0, 3399.0, 910.0, 333.0, 156.0, 88.0, 48.0, 34.0, 18.0, 9.0, 13.0, 7.0, 4.0, 4.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.72064208984375, -4.5936279296875, -4.46661376953125, -4.339599609375, -4.21258544921875, -4.0855712890625, -3.95855712890625, -3.83154296875, -3.70452880859375, -3.5775146484375, -3.45050048828125, -3.323486328125, -3.19647216796875, -3.0694580078125, -2.94244384765625, -2.8154296875, -2.68841552734375, -2.5614013671875, -2.43438720703125, -2.307373046875, -2.18035888671875, -2.0533447265625, -1.92633056640625, -1.79931640625, -1.67230224609375, -1.5452880859375, -1.41827392578125, -1.291259765625, -1.16424560546875, -1.0372314453125, -0.91021728515625, -0.783203125, -0.65618896484375, -0.5291748046875, -0.40216064453125, -0.275146484375, -0.14813232421875, -0.0211181640625, 0.10589599609375, 0.23291015625, 0.35992431640625, 0.4869384765625, 0.61395263671875, 0.740966796875, 0.86798095703125, 0.9949951171875, 1.12200927734375, 1.2490234375, 1.37603759765625, 1.5030517578125, 1.63006591796875, 1.757080078125, 1.88409423828125, 2.0111083984375, 2.13812255859375, 2.26513671875, 2.39215087890625, 2.5191650390625, 2.64617919921875, 2.773193359375, 2.90020751953125, 3.0272216796875, 3.15423583984375, 3.28125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 16.0, 19.0, 32.0, 59.0, 71.0, 107.0, 119.0, 108.0, 102.0, 111.0, 94.0, 69.0, 47.0, 27.0, 5.0, 5.0, 6.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.625, -1.5894317626953125, -1.553863525390625, -1.5182952880859375, -1.48272705078125, -1.4471588134765625, -1.411590576171875, -1.3760223388671875, -1.3404541015625, -1.3048858642578125, -1.269317626953125, -1.2337493896484375, -1.19818115234375, -1.1626129150390625, -1.127044677734375, -1.0914764404296875, -1.055908203125, -1.0203399658203125, -0.984771728515625, -0.9492034912109375, -0.91363525390625, -0.8780670166015625, -0.842498779296875, -0.8069305419921875, -0.7713623046875, -0.7357940673828125, -0.700225830078125, -0.6646575927734375, -0.62908935546875, -0.5935211181640625, -0.557952880859375, -0.5223846435546875, -0.48681640625, -0.4512481689453125, -0.415679931640625, -0.3801116943359375, -0.34454345703125, -0.3089752197265625, -0.273406982421875, -0.2378387451171875, -0.2022705078125, -0.1667022705078125, -0.131134033203125, -0.0955657958984375, -0.05999755859375, -0.0244293212890625, 0.011138916015625, 0.0467071533203125, 0.082275390625, 0.1178436279296875, 0.153411865234375, 0.1889801025390625, 0.22454833984375, 0.2601165771484375, 0.295684814453125, 0.3312530517578125, 0.3668212890625, 0.4023895263671875, 0.437957763671875, 0.4735260009765625, 0.50909423828125, 0.5446624755859375, 0.580230712890625, 0.6157989501953125, 0.6513671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 4.0, 12.0, 20.0, 25.0, 44.0, 62.0, 103.0, 179.0, 832.0, 10789.0, 4129143.0, 50494.0, 1831.0, 316.0, 150.0, 111.0, 67.0, 40.0, 20.0, 22.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.005035400390625, -2.78546142578125, -2.565887451171875, -2.3463134765625, -2.126739501953125, -1.90716552734375, -1.687591552734375, -1.468017578125, -1.248443603515625, -1.02886962890625, -0.809295654296875, -0.5897216796875, -0.370147705078125, -0.15057373046875, 0.069000244140625, 0.28857421875, 0.508148193359375, 0.72772216796875, 0.947296142578125, 1.1668701171875, 1.386444091796875, 1.60601806640625, 1.825592041015625, 2.045166015625, 2.264739990234375, 2.48431396484375, 2.703887939453125, 2.9234619140625, 3.143035888671875, 3.36260986328125, 3.582183837890625, 3.8017578125, 4.021331787109375, 4.24090576171875, 4.460479736328125, 4.6800537109375, 4.899627685546875, 5.11920166015625, 5.338775634765625, 5.558349609375, 5.777923583984375, 5.99749755859375, 6.217071533203125, 6.4366455078125, 6.656219482421875, 6.87579345703125, 7.095367431640625, 7.31494140625, 7.534515380859375, 7.75408935546875, 7.973663330078125, 8.1932373046875, 8.412811279296875, 8.63238525390625, 8.851959228515625, 9.071533203125, 9.291107177734375, 9.51068115234375, 9.730255126953125, 9.9498291015625, 10.169403076171875, 10.38897705078125, 10.608551025390625, 10.828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 8.0, 10.0, 25.0, 68.0, 229.0, 3060.0, 479.0, 93.0, 42.0, 20.0, 19.0, 10.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68310546875, -0.6365432739257812, -0.5899810791015625, -0.5434188842773438, -0.496856689453125, -0.45029449462890625, -0.4037322998046875, -0.35717010498046875, -0.31060791015625, -0.26404571533203125, -0.2174835205078125, -0.17092132568359375, -0.124359130859375, -0.07779693603515625, -0.0312347412109375, 0.01532745361328125, 0.0618896484375, 0.10845184326171875, 0.1550140380859375, 0.20157623291015625, 0.248138427734375, 0.29470062255859375, 0.3412628173828125, 0.38782501220703125, 0.43438720703125, 0.48094940185546875, 0.5275115966796875, 0.5740737915039062, 0.620635986328125, 0.6671981811523438, 0.7137603759765625, 0.7603225708007812, 0.806884765625, 0.8534469604492188, 0.9000091552734375, 0.9465713500976562, 0.993133544921875, 1.0396957397460938, 1.0862579345703125, 1.1328201293945312, 1.17938232421875, 1.2259445190429688, 1.2725067138671875, 1.3190689086914062, 1.365631103515625, 1.4121932983398438, 1.4587554931640625, 1.5053176879882812, 1.5518798828125, 1.5984420776367188, 1.6450042724609375, 1.6915664672851562, 1.738128662109375, 1.7846908569335938, 1.8312530517578125, 1.8778152465820312, 1.92437744140625, 1.9709396362304688, 2.0175018310546875, 2.0640640258789062, 2.110626220703125, 2.1571884155273438, 2.2037506103515625, 2.2503128051757812, 2.296875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 22.0, 89.0, 305.0, 334.0, 160.0, 62.0, 20.0, 8.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.603825569152832, -6.2742085456848145, -5.944591522216797, -5.614974498748779, -5.285357475280762, -4.955740451812744, -4.626123428344727, -4.296506404876709, -3.9668893814086914, -3.637272357940674, -3.3076553344726562, -2.9780383110046387, -2.648421287536621, -2.3188042640686035, -1.989187240600586, -1.6595702171325684, -1.3299531936645508, -1.0003361701965332, -0.6707191467285156, -0.34110212326049805, -0.011485099792480469, 0.3181319236755371, 0.6477489471435547, 0.9773659706115723, 1.3069829940795898, 1.6366000175476074, 1.966217041015625, 2.2958340644836426, 2.62545108795166, 2.9550681114196777, 3.2846851348876953, 3.614302158355713, 3.943918228149414, 4.273535251617432, 4.603152275085449, 4.932769298553467, 5.262386322021484, 5.592003345489502, 5.9216203689575195, 6.251237392425537, 6.580854415893555, 6.910471439361572, 7.24008846282959, 7.569705486297607, 7.899322509765625, 8.228939056396484, 8.55855655670166, 8.888174057006836, 9.217790603637695, 9.547407150268555, 9.87702465057373, 10.206642150878906, 10.536258697509766, 10.865875244140625, 11.1954927444458, 11.525110244750977, 11.854726791381836, 12.184343338012695, 12.513960838317871, 12.843578338623047, 13.173194885253906, 13.502811431884766, 13.832428932189941, 14.162046432495117, 14.491662979125977]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 3.0, 11.0, 13.0, 14.0, 22.0, 43.0, 42.0, 48.0, 69.0, 65.0, 84.0, 76.0, 75.0, 80.0, 64.0, 64.0, 53.0, 47.0, 31.0, 27.0, 21.0, 21.0, 11.0, 9.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.327057361602783, -3.1848394870758057, -3.042621612548828, -2.9004037380218506, -2.758185863494873, -2.6159679889678955, -2.473750114440918, -2.3315322399139404, -2.189314365386963, -2.0470964908599854, -1.9048786163330078, -1.7626607418060303, -1.6204428672790527, -1.4782249927520752, -1.3360071182250977, -1.1937892436981201, -1.0515713691711426, -0.909353494644165, -0.7671356201171875, -0.62491774559021, -0.4826998710632324, -0.3404819965362549, -0.19826412200927734, -0.056046247482299805, 0.08617162704467773, 0.22838950157165527, 0.3706073760986328, 0.5128252506256104, 0.6550431251525879, 0.7972609996795654, 0.939478874206543, 1.0816967487335205, 1.2239151000976562, 1.3661329746246338, 1.5083508491516113, 1.6505687236785889, 1.7927865982055664, 1.935004472732544, 2.0772223472595215, 2.219440221786499, 2.3616580963134766, 2.503875970840454, 2.6460938453674316, 2.788311719894409, 2.9305295944213867, 3.0727474689483643, 3.214965343475342, 3.3571832180023193, 3.499401092529297, 3.6416189670562744, 3.783836841583252, 3.9260547161102295, 4.068272590637207, 4.2104902267456055, 4.352708339691162, 4.494926452636719, 4.637144088745117, 4.779361724853516, 4.921579837799072, 5.063797950744629, 5.206015586853027, 5.348233222961426, 5.490451335906982, 5.632669448852539, 5.7748870849609375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 9.0, 7.0, 19.0, 17.0, 24.0, 43.0, 83.0, 129.0, 266.0, 696.0, 2266.0, 10709.0, 85363.0, 780939.0, 147612.0, 15814.0, 3022.0, 832.0, 309.0, 153.0, 77.0, 60.0, 28.0, 29.0, 13.0, 9.0, 10.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.471466064453125, -2.36676025390625, -2.262054443359375, -2.1573486328125, -2.052642822265625, -1.94793701171875, -1.843231201171875, -1.738525390625, -1.633819580078125, -1.52911376953125, -1.424407958984375, -1.3197021484375, -1.214996337890625, -1.11029052734375, -1.005584716796875, -0.90087890625, -0.796173095703125, -0.69146728515625, -0.586761474609375, -0.4820556640625, -0.377349853515625, -0.27264404296875, -0.167938232421875, -0.063232421875, 0.041473388671875, 0.14617919921875, 0.250885009765625, 0.3555908203125, 0.460296630859375, 0.56500244140625, 0.669708251953125, 0.7744140625, 0.879119873046875, 0.98382568359375, 1.088531494140625, 1.1932373046875, 1.297943115234375, 1.40264892578125, 1.507354736328125, 1.612060546875, 1.716766357421875, 1.82147216796875, 1.926177978515625, 2.0308837890625, 2.135589599609375, 2.24029541015625, 2.345001220703125, 2.44970703125, 2.554412841796875, 2.65911865234375, 2.763824462890625, 2.8685302734375, 2.973236083984375, 3.07794189453125, 3.182647705078125, 3.287353515625, 3.392059326171875, 3.49676513671875, 3.601470947265625, 3.7061767578125, 3.810882568359375, 3.91558837890625, 4.020294189453125, 4.125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 10.0, 7.0, 25.0, 29.0, 45.0, 64.0, 68.0, 89.0, 99.0, 91.0, 118.0, 81.0, 73.0, 77.0, 46.0, 36.0, 18.0, 11.0, 9.0, 0.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.361328125, -1.3308029174804688, -1.3002777099609375, -1.2697525024414062, -1.239227294921875, -1.2087020874023438, -1.1781768798828125, -1.1476516723632812, -1.11712646484375, -1.0866012573242188, -1.0560760498046875, -1.0255508422851562, -0.995025634765625, -0.9645004272460938, -0.9339752197265625, -0.9034500122070312, -0.8729248046875, -0.8423995971679688, -0.8118743896484375, -0.7813491821289062, -0.750823974609375, -0.7202987670898438, -0.6897735595703125, -0.6592483520507812, -0.62872314453125, -0.5981979370117188, -0.5676727294921875, -0.5371475219726562, -0.506622314453125, -0.47609710693359375, -0.4455718994140625, -0.41504669189453125, -0.384521484375, -0.35399627685546875, -0.3234710693359375, -0.29294586181640625, -0.262420654296875, -0.23189544677734375, -0.2013702392578125, -0.17084503173828125, -0.14031982421875, -0.10979461669921875, -0.0792694091796875, -0.04874420166015625, -0.018218994140625, 0.01230621337890625, 0.0428314208984375, 0.07335662841796875, 0.1038818359375, 0.13440704345703125, 0.1649322509765625, 0.19545745849609375, 0.225982666015625, 0.25650787353515625, 0.2870330810546875, 0.31755828857421875, 0.34808349609375, 0.37860870361328125, 0.4091339111328125, 0.43965911865234375, 0.470184326171875, 0.5007095336914062, 0.5312347412109375, 0.5617599487304688, 0.59228515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 10.0, 9.0, 13.0, 22.0, 22.0, 40.0, 80.0, 143.0, 235.0, 508.0, 1243.0, 3151.0, 8399.0, 26891.0, 124451.0, 644572.0, 186303.0, 35493.0, 10295.0, 3806.0, 1487.0, 607.0, 338.0, 173.0, 84.0, 45.0, 32.0, 23.0, 13.0, 9.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9580078125, -1.8940277099609375, -1.830047607421875, -1.7660675048828125, -1.70208740234375, -1.6381072998046875, -1.574127197265625, -1.5101470947265625, -1.4461669921875, -1.3821868896484375, -1.318206787109375, -1.2542266845703125, -1.19024658203125, -1.1262664794921875, -1.062286376953125, -0.9983062744140625, -0.934326171875, -0.8703460693359375, -0.806365966796875, -0.7423858642578125, -0.67840576171875, -0.6144256591796875, -0.550445556640625, -0.4864654541015625, -0.4224853515625, -0.3585052490234375, -0.294525146484375, -0.2305450439453125, -0.16656494140625, -0.1025848388671875, -0.038604736328125, 0.0253753662109375, 0.08935546875, 0.1533355712890625, 0.217315673828125, 0.2812957763671875, 0.34527587890625, 0.4092559814453125, 0.473236083984375, 0.5372161865234375, 0.6011962890625, 0.6651763916015625, 0.729156494140625, 0.7931365966796875, 0.85711669921875, 0.9210968017578125, 0.985076904296875, 1.0490570068359375, 1.113037109375, 1.1770172119140625, 1.240997314453125, 1.3049774169921875, 1.36895751953125, 1.4329376220703125, 1.496917724609375, 1.5608978271484375, 1.6248779296875, 1.6888580322265625, 1.752838134765625, 1.8168182373046875, 1.88079833984375, 1.9447784423828125, 2.008758544921875, 2.0727386474609375, 2.13671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 10.0, 11.0, 8.0, 11.0, 13.0, 14.0, 30.0, 30.0, 38.0, 47.0, 30.0, 47.0, 49.0, 55.0, 59.0, 70.0, 61.0, 39.0, 55.0, 45.0, 41.0, 50.0, 32.0, 36.0, 24.0, 28.0, 16.0, 15.0, 12.0, 7.0, 2.0, 6.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.96466064453125, -1.8863525390625, -1.80804443359375, -1.729736328125, -1.65142822265625, -1.5731201171875, -1.49481201171875, -1.41650390625, -1.33819580078125, -1.2598876953125, -1.18157958984375, -1.103271484375, -1.02496337890625, -0.9466552734375, -0.86834716796875, -0.7900390625, -0.71173095703125, -0.6334228515625, -0.55511474609375, -0.476806640625, -0.39849853515625, -0.3201904296875, -0.24188232421875, -0.16357421875, -0.08526611328125, -0.0069580078125, 0.07135009765625, 0.149658203125, 0.22796630859375, 0.3062744140625, 0.38458251953125, 0.462890625, 0.54119873046875, 0.6195068359375, 0.69781494140625, 0.776123046875, 0.85443115234375, 0.9327392578125, 1.01104736328125, 1.08935546875, 1.16766357421875, 1.2459716796875, 1.32427978515625, 1.402587890625, 1.48089599609375, 1.5592041015625, 1.63751220703125, 1.7158203125, 1.79412841796875, 1.8724365234375, 1.95074462890625, 2.029052734375, 2.10736083984375, 2.1856689453125, 2.26397705078125, 2.34228515625, 2.42059326171875, 2.4989013671875, 2.57720947265625, 2.655517578125, 2.73382568359375, 2.8121337890625, 2.89044189453125, 2.96875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 3.0, 18.0, 18.0, 28.0, 35.0, 51.0, 79.0, 145.0, 195.0, 292.0, 592.0, 1151.0, 2244.0, 5259.0, 14951.0, 67772.0, 674813.0, 233042.0, 31745.0, 8976.0, 3490.0, 1625.0, 830.0, 441.0, 271.0, 172.0, 93.0, 69.0, 48.0, 21.0, 19.0, 18.0, 15.0, 7.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5732421875, -1.529266357421875, -1.48529052734375, -1.441314697265625, -1.3973388671875, -1.353363037109375, -1.30938720703125, -1.265411376953125, -1.221435546875, -1.177459716796875, -1.13348388671875, -1.089508056640625, -1.0455322265625, -1.001556396484375, -0.95758056640625, -0.913604736328125, -0.86962890625, -0.825653076171875, -0.78167724609375, -0.737701416015625, -0.6937255859375, -0.649749755859375, -0.60577392578125, -0.561798095703125, -0.517822265625, -0.473846435546875, -0.42987060546875, -0.385894775390625, -0.3419189453125, -0.297943115234375, -0.25396728515625, -0.209991455078125, -0.166015625, -0.122039794921875, -0.07806396484375, -0.034088134765625, 0.0098876953125, 0.053863525390625, 0.09783935546875, 0.141815185546875, 0.185791015625, 0.229766845703125, 0.27374267578125, 0.317718505859375, 0.3616943359375, 0.405670166015625, 0.44964599609375, 0.493621826171875, 0.53759765625, 0.581573486328125, 0.62554931640625, 0.669525146484375, 0.7135009765625, 0.757476806640625, 0.80145263671875, 0.845428466796875, 0.889404296875, 0.933380126953125, 0.97735595703125, 1.021331787109375, 1.0653076171875, 1.109283447265625, 1.15325927734375, 1.197235107421875, 1.2412109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 8.0, 8.0, 17.0, 23.0, 26.0, 49.0, 57.0, 96.0, 191.0, 188.0, 89.0, 51.0, 42.0, 42.0, 23.0, 16.0, 18.0, 12.0, 9.0, 5.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00036072731018066406, -0.0003509595990180969, -0.0003411918878555298, -0.00033142417669296265, -0.0003216564655303955, -0.00031188875436782837, -0.00030212104320526123, -0.0002923533320426941, -0.00028258562088012695, -0.0002728179097175598, -0.0002630501985549927, -0.00025328248739242554, -0.0002435147762298584, -0.00023374706506729126, -0.00022397935390472412, -0.00021421164274215698, -0.00020444393157958984, -0.0001946762204170227, -0.00018490850925445557, -0.00017514079809188843, -0.0001653730869293213, -0.00015560537576675415, -0.000145837664604187, -0.00013606995344161987, -0.00012630224227905273, -0.0001165345311164856, -0.00010676681995391846, -9.699910879135132e-05, -8.723139762878418e-05, -7.746368646621704e-05, -6.76959753036499e-05, -5.7928264141082764e-05, -4.8160552978515625e-05, -3.8392841815948486e-05, -2.8625130653381348e-05, -1.885741949081421e-05, -9.08970832824707e-06, 6.780028343200684e-07, 1.0445713996887207e-05, 2.0213425159454346e-05, 2.9981136322021484e-05, 3.974884748458862e-05, 4.951655864715576e-05, 5.92842698097229e-05, 6.905198097229004e-05, 7.881969213485718e-05, 8.858740329742432e-05, 9.835511445999146e-05, 0.0001081228256225586, 0.00011789053678512573, 0.00012765824794769287, 0.00013742595911026, 0.00014719367027282715, 0.0001569613814353943, 0.00016672909259796143, 0.00017649680376052856, 0.0001862645149230957, 0.00019603222608566284, 0.00020579993724822998, 0.00021556764841079712, 0.00022533535957336426, 0.0002351030707359314, 0.00024487078189849854, 0.0002546384930610657, 0.0002644062042236328]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 21.0, 24.0, 41.0, 92.0, 172.0, 336.0, 813.0, 2260.0, 6865.0, 30144.0, 443537.0, 519536.0, 33293.0, 7642.0, 2225.0, 849.0, 333.0, 158.0, 71.0, 53.0, 31.0, 13.0, 9.0, 9.0, 9.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.14208984375, -2.0751953125, -2.00830078125, -1.94140625, -1.87451171875, -1.8076171875, -1.74072265625, -1.673828125, -1.60693359375, -1.5400390625, -1.47314453125, -1.40625, -1.33935546875, -1.2724609375, -1.20556640625, -1.138671875, -1.07177734375, -1.0048828125, -0.93798828125, -0.87109375, -0.80419921875, -0.7373046875, -0.67041015625, -0.603515625, -0.53662109375, -0.4697265625, -0.40283203125, -0.3359375, -0.26904296875, -0.2021484375, -0.13525390625, -0.068359375, -0.00146484375, 0.0654296875, 0.13232421875, 0.19921875, 0.26611328125, 0.3330078125, 0.39990234375, 0.466796875, 0.53369140625, 0.6005859375, 0.66748046875, 0.734375, 0.80126953125, 0.8681640625, 0.93505859375, 1.001953125, 1.06884765625, 1.1357421875, 1.20263671875, 1.26953125, 1.33642578125, 1.4033203125, 1.47021484375, 1.537109375, 1.60400390625, 1.6708984375, 1.73779296875, 1.8046875, 1.87158203125, 1.9384765625, 2.00537109375, 2.072265625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 13.0, 7.0, 13.0, 16.0, 21.0, 32.0, 39.0, 87.0, 92.0, 150.0, 162.0, 109.0, 73.0, 48.0, 40.0, 24.0, 19.0, 12.0, 14.0, 11.0, 7.0, 8.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.611328125, -1.5677490234375, -1.524169921875, -1.4805908203125, -1.43701171875, -1.3934326171875, -1.349853515625, -1.3062744140625, -1.2626953125, -1.2191162109375, -1.175537109375, -1.1319580078125, -1.08837890625, -1.0447998046875, -1.001220703125, -0.9576416015625, -0.9140625, -0.8704833984375, -0.826904296875, -0.7833251953125, -0.73974609375, -0.6961669921875, -0.652587890625, -0.6090087890625, -0.5654296875, -0.5218505859375, -0.478271484375, -0.4346923828125, -0.39111328125, -0.3475341796875, -0.303955078125, -0.2603759765625, -0.216796875, -0.1732177734375, -0.129638671875, -0.0860595703125, -0.04248046875, 0.0010986328125, 0.044677734375, 0.0882568359375, 0.1318359375, 0.1754150390625, 0.218994140625, 0.2625732421875, 0.30615234375, 0.3497314453125, 0.393310546875, 0.4368896484375, 0.48046875, 0.5240478515625, 0.567626953125, 0.6112060546875, 0.65478515625, 0.6983642578125, 0.741943359375, 0.7855224609375, 0.8291015625, 0.8726806640625, 0.916259765625, 0.9598388671875, 1.00341796875, 1.0469970703125, 1.090576171875, 1.1341552734375, 1.177734375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 12.0, 26.0, 39.0, 70.0, 115.0, 199.0, 192.0, 131.0, 89.0, 51.0, 36.0, 22.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.77408504486084, -14.223430633544922, -13.672775268554688, -13.12212085723877, -12.571466445922852, -12.020811080932617, -11.4701566696167, -10.919502258300781, -10.368846893310547, -9.818192481994629, -9.267537117004395, -8.716882705688477, -8.166228294372559, -7.615573406219482, -7.064918518066406, -6.514264106750488, -5.96360969543457, -5.412954807281494, -4.862300395965576, -4.3116455078125, -3.760990858078003, -3.210336208343506, -2.6596813201904297, -2.1090266704559326, -1.5583720207214355, -1.0077173709869385, -0.45706260204315186, 0.09359216690063477, 0.6442468166351318, 1.194901466369629, 1.745556354522705, 2.296211004257202, 2.8468666076660156, 3.3975212574005127, 3.9481759071350098, 4.498830795288086, 5.049485206604004, 5.60014009475708, 6.150794982910156, 6.701449394226074, 7.25210428237915, 7.802759170532227, 8.353413581848145, 8.904067993164062, 9.454723358154297, 10.005377769470215, 10.556032180786133, 11.106687545776367, 11.657341957092285, 12.207996368408203, 12.758651733398438, 13.309306144714355, 13.859960556030273, 14.410615921020508, 14.961270332336426, 15.511924743652344, 16.062580108642578, 16.613235473632812, 17.163888931274414, 17.71454429626465, 18.265199661254883, 18.815853118896484, 19.36650848388672, 19.917163848876953, 20.467817306518555]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 9.0, 13.0, 10.0, 17.0, 24.0, 20.0, 32.0, 27.0, 42.0, 52.0, 64.0, 68.0, 61.0, 63.0, 46.0, 70.0, 56.0, 58.0, 44.0, 36.0, 44.0, 26.0, 29.0, 25.0, 20.0, 12.0, 16.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.967788696289062, -14.452939987182617, -13.938092231750488, -13.423243522644043, -12.908395767211914, -12.393547058105469, -11.878698348999023, -11.363850593566895, -10.849002838134766, -10.33415412902832, -9.819306373596191, -9.304457664489746, -8.789609909057617, -8.274761199951172, -7.759912967681885, -7.245064735412598, -6.730216026306152, -6.215367794036865, -5.700519561767578, -5.185670852661133, -4.670823097229004, -4.155974388122559, -3.6411261558532715, -3.1262779235839844, -2.6114296913146973, -2.09658145904541, -1.5817331075668335, -1.0668847560882568, -0.5520365238189697, -0.03718829154968262, 0.4776601791381836, 0.9925084114074707, 1.5073566436767578, 2.022204875946045, 2.537053108215332, 3.0519015789031982, 3.5667498111724854, 4.081598281860352, 4.596446514129639, 5.111294746398926, 5.626142978668213, 6.1409912109375, 6.655839443206787, 7.170687675476074, 7.6855363845825195, 8.200384140014648, 8.715232849121094, 9.230081558227539, 9.744929313659668, 10.259778022766113, 10.774625778198242, 11.289474487304688, 11.804322242736816, 12.319170951843262, 12.83401870727539, 13.348867416381836, 13.863716125488281, 14.378564834594727, 14.893412590026855, 15.4082612991333, 15.92310905456543, 16.437957763671875, 16.95280647277832, 17.467655181884766, 17.982501983642578]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 12.0, 13.0, 11.0, 26.0, 46.0, 79.0, 155.0, 265.0, 612.0, 1729.0, 6494.0, 54550.0, 4093707.0, 29534.0, 4703.0, 1328.0, 487.0, 257.0, 124.0, 56.0, 30.0, 28.0, 11.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40625, -7.21826171875, -7.0302734375, -6.84228515625, -6.654296875, -6.46630859375, -6.2783203125, -6.09033203125, -5.90234375, -5.71435546875, -5.5263671875, -5.33837890625, -5.150390625, -4.96240234375, -4.7744140625, -4.58642578125, -4.3984375, -4.21044921875, -4.0224609375, -3.83447265625, -3.646484375, -3.45849609375, -3.2705078125, -3.08251953125, -2.89453125, -2.70654296875, -2.5185546875, -2.33056640625, -2.142578125, -1.95458984375, -1.7666015625, -1.57861328125, -1.390625, -1.20263671875, -1.0146484375, -0.82666015625, -0.638671875, -0.45068359375, -0.2626953125, -0.07470703125, 0.11328125, 0.30126953125, 0.4892578125, 0.67724609375, 0.865234375, 1.05322265625, 1.2412109375, 1.42919921875, 1.6171875, 1.80517578125, 1.9931640625, 2.18115234375, 2.369140625, 2.55712890625, 2.7451171875, 2.93310546875, 3.12109375, 3.30908203125, 3.4970703125, 3.68505859375, 3.873046875, 4.06103515625, 4.2490234375, 4.43701171875, 4.625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 16.0, 14.0, 29.0, 31.0, 37.0, 50.0, 67.0, 59.0, 89.0, 84.0, 91.0, 79.0, 73.0, 71.0, 48.0, 43.0, 42.0, 28.0, 20.0, 13.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.353515625, -1.3221664428710938, -1.2908172607421875, -1.2594680786132812, -1.228118896484375, -1.1967697143554688, -1.1654205322265625, -1.1340713500976562, -1.10272216796875, -1.0713729858398438, -1.0400238037109375, -1.0086746215820312, -0.977325439453125, -0.9459762573242188, -0.9146270751953125, -0.8832778930664062, -0.8519287109375, -0.8205795288085938, -0.7892303466796875, -0.7578811645507812, -0.726531982421875, -0.6951828002929688, -0.6638336181640625, -0.6324844360351562, -0.60113525390625, -0.5697860717773438, -0.5384368896484375, -0.5070877075195312, -0.475738525390625, -0.44438934326171875, -0.4130401611328125, -0.38169097900390625, -0.350341796875, -0.31899261474609375, -0.2876434326171875, -0.25629425048828125, -0.224945068359375, -0.19359588623046875, -0.1622467041015625, -0.13089752197265625, -0.09954833984375, -0.06819915771484375, -0.0368499755859375, -0.00550079345703125, 0.025848388671875, 0.05719757080078125, 0.0885467529296875, 0.11989593505859375, 0.1512451171875, 0.18259429931640625, 0.2139434814453125, 0.24529266357421875, 0.276641845703125, 0.30799102783203125, 0.3393402099609375, 0.37068939208984375, 0.40203857421875, 0.43338775634765625, 0.4647369384765625, 0.49608612060546875, 0.527435302734375, 0.5587844848632812, 0.5901336669921875, 0.6214828491210938, 0.65283203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 8.0, 22.0, 41.0, 57.0, 111.0, 282.0, 1603.0, 28359.0, 4147012.0, 15166.0, 1207.0, 224.0, 94.0, 44.0, 26.0, 21.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5546875, -13.2274169921875, -12.900146484375, -12.5728759765625, -12.24560546875, -11.9183349609375, -11.591064453125, -11.2637939453125, -10.9365234375, -10.6092529296875, -10.281982421875, -9.9547119140625, -9.62744140625, -9.3001708984375, -8.972900390625, -8.6456298828125, -8.318359375, -7.9910888671875, -7.663818359375, -7.3365478515625, -7.00927734375, -6.6820068359375, -6.354736328125, -6.0274658203125, -5.7001953125, -5.3729248046875, -5.045654296875, -4.7183837890625, -4.39111328125, -4.0638427734375, -3.736572265625, -3.4093017578125, -3.08203125, -2.7547607421875, -2.427490234375, -2.1002197265625, -1.77294921875, -1.4456787109375, -1.118408203125, -0.7911376953125, -0.4638671875, -0.1365966796875, 0.190673828125, 0.5179443359375, 0.84521484375, 1.1724853515625, 1.499755859375, 1.8270263671875, 2.154296875, 2.4815673828125, 2.808837890625, 3.1361083984375, 3.46337890625, 3.7906494140625, 4.117919921875, 4.4451904296875, 4.7724609375, 5.0997314453125, 5.427001953125, 5.7542724609375, 6.08154296875, 6.4088134765625, 6.736083984375, 7.0633544921875, 7.390625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 12.0, 5.0, 13.0, 36.0, 57.0, 157.0, 2196.0, 1378.0, 120.0, 38.0, 27.0, 15.0, 8.0, 2.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.197265625, -3.1210784912109375, -3.044891357421875, -2.9687042236328125, -2.89251708984375, -2.8163299560546875, -2.740142822265625, -2.6639556884765625, -2.5877685546875, -2.5115814208984375, -2.435394287109375, -2.3592071533203125, -2.28302001953125, -2.2068328857421875, -2.130645751953125, -2.0544586181640625, -1.978271484375, -1.9020843505859375, -1.825897216796875, -1.7497100830078125, -1.67352294921875, -1.5973358154296875, -1.521148681640625, -1.4449615478515625, -1.3687744140625, -1.2925872802734375, -1.216400146484375, -1.1402130126953125, -1.06402587890625, -0.9878387451171875, -0.911651611328125, -0.8354644775390625, -0.75927734375, -0.6830902099609375, -0.606903076171875, -0.5307159423828125, -0.45452880859375, -0.3783416748046875, -0.302154541015625, -0.2259674072265625, -0.1497802734375, -0.0735931396484375, 0.002593994140625, 0.0787811279296875, 0.15496826171875, 0.2311553955078125, 0.307342529296875, 0.3835296630859375, 0.459716796875, 0.5359039306640625, 0.612091064453125, 0.6882781982421875, 0.76446533203125, 0.8406524658203125, 0.916839599609375, 0.9930267333984375, 1.0692138671875, 1.1454010009765625, 1.221588134765625, 1.2977752685546875, 1.37396240234375, 1.4501495361328125, 1.526336669921875, 1.6025238037109375, 1.6787109375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 13.0, 16.0, 25.0, 46.0, 64.0, 95.0, 128.0, 171.0, 154.0, 107.0, 65.0, 34.0, 21.0, 17.0, 6.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3805065155029297, -3.1994922161102295, -3.0184779167175293, -2.837463855743408, -2.656449317932129, -2.475435256958008, -2.2944209575653076, -2.1134066581726074, -1.9323923587799072, -1.751378059387207, -1.5703637599945068, -1.3893495798110962, -1.208335280418396, -1.0273209810256958, -0.8463068008422852, -0.665292501449585, -0.48427820205688477, -0.30326393246650696, -0.12224966287612915, 0.05876457691192627, 0.23977887630462646, 0.42079317569732666, 0.6018073558807373, 0.7828216552734375, 0.9638359546661377, 1.144850254058838, 1.325864553451538, 1.5068787336349487, 1.687893033027649, 1.8689073324203491, 2.0499215126037598, 2.23093581199646, 2.41195011138916, 2.5929644107818604, 2.7739787101745605, 2.9549927711486816, 3.136007308959961, 3.317021369934082, 3.4980356693267822, 3.6790499687194824, 3.8600642681121826, 4.041078567504883, 4.222092628479004, 4.403107166290283, 4.584121227264404, 4.765135765075684, 4.946149826049805, 5.127163887023926, 5.308178424835205, 5.489192485809326, 5.6702070236206055, 5.851221084594727, 6.032235622406006, 6.213249683380127, 6.394264221191406, 6.575278282165527, 6.756292343139648, 6.9373064041137695, 7.118320941925049, 7.29933500289917, 7.480349540710449, 7.66136360168457, 7.842377662658691, 8.023391723632812, 8.20440673828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 11.0, 4.0, 9.0, 14.0, 22.0, 19.0, 26.0, 25.0, 22.0, 28.0, 48.0, 50.0, 45.0, 35.0, 48.0, 49.0, 37.0, 45.0, 64.0, 42.0, 52.0, 34.0, 43.0, 39.0, 30.0, 27.0, 22.0, 21.0, 22.0, 11.0, 14.0, 7.0, 9.0, 6.0, 5.0, 2.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.015883445739746, -2.8940465450286865, -2.772209882736206, -2.6503729820251465, -2.528536319732666, -2.4066994190216064, -2.284862518310547, -2.1630258560180664, -2.041188955307007, -1.9193521738052368, -1.7975153923034668, -1.6756784915924072, -1.5538417100906372, -1.4320049285888672, -1.3101680278778076, -1.1883312463760376, -1.0664944648742676, -0.9446576833724976, -0.8228208422660828, -0.700984001159668, -0.579147219657898, -0.45731043815612793, -0.33547359704971313, -0.21363675594329834, -0.09179997444152832, 0.030036836862564087, 0.1518736481666565, 0.2737104594707489, 0.3955472707748413, 0.5173840522766113, 0.6392208933830261, 0.7610577344894409, 0.8828945159912109, 1.004731297492981, 1.126568078994751, 1.2484049797058105, 1.3702417612075806, 1.4920785427093506, 1.6139154434204102, 1.7357522249221802, 1.8575890064239502, 1.9794257879257202, 2.1012625694274902, 2.22309947013855, 2.3449363708496094, 2.46677303314209, 2.5886099338531494, 2.710446834564209, 2.8322834968566895, 2.954120397567749, 3.0759570598602295, 3.197793960571289, 3.3196306228637695, 3.441467523574829, 3.5633044242858887, 3.685141086578369, 3.8069779872894287, 3.9288148880004883, 4.050651550292969, 4.172488212585449, 4.294325351715088, 4.416162014007568, 4.537998676300049, 4.6598358154296875, 4.781672477722168]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 5.0, 13.0, 29.0, 48.0, 89.0, 183.0, 405.0, 1057.0, 3092.0, 13443.0, 148372.0, 810001.0, 60219.0, 8095.0, 2096.0, 770.0, 326.0, 138.0, 69.0, 44.0, 22.0, 12.0, 9.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.9139404296875, -3.765380859375, -3.6168212890625, -3.46826171875, -3.3197021484375, -3.171142578125, -3.0225830078125, -2.8740234375, -2.7254638671875, -2.576904296875, -2.4283447265625, -2.27978515625, -2.1312255859375, -1.982666015625, -1.8341064453125, -1.685546875, -1.5369873046875, -1.388427734375, -1.2398681640625, -1.09130859375, -0.9427490234375, -0.794189453125, -0.6456298828125, -0.4970703125, -0.3485107421875, -0.199951171875, -0.0513916015625, 0.09716796875, 0.2457275390625, 0.394287109375, 0.5428466796875, 0.69140625, 0.8399658203125, 0.988525390625, 1.1370849609375, 1.28564453125, 1.4342041015625, 1.582763671875, 1.7313232421875, 1.8798828125, 2.0284423828125, 2.177001953125, 2.3255615234375, 2.47412109375, 2.6226806640625, 2.771240234375, 2.9197998046875, 3.068359375, 3.2169189453125, 3.365478515625, 3.5140380859375, 3.66259765625, 3.8111572265625, 3.959716796875, 4.1082763671875, 4.2568359375, 4.4053955078125, 4.553955078125, 4.7025146484375, 4.85107421875, 4.9996337890625, 5.148193359375, 5.2967529296875, 5.4453125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 10.0, 16.0, 23.0, 39.0, 36.0, 53.0, 56.0, 50.0, 70.0, 89.0, 73.0, 80.0, 58.0, 76.0, 72.0, 48.0, 37.0, 40.0, 25.0, 17.0, 6.0, 7.0, 7.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2919921875, -1.2610397338867188, -1.2300872802734375, -1.1991348266601562, -1.168182373046875, -1.1372299194335938, -1.1062774658203125, -1.0753250122070312, -1.04437255859375, -1.0134201049804688, -0.9824676513671875, -0.9515151977539062, -0.920562744140625, -0.8896102905273438, -0.8586578369140625, -0.8277053833007812, -0.7967529296875, -0.7658004760742188, -0.7348480224609375, -0.7038955688476562, -0.672943115234375, -0.6419906616210938, -0.6110382080078125, -0.5800857543945312, -0.54913330078125, -0.5181808471679688, -0.4872283935546875, -0.45627593994140625, -0.425323486328125, -0.39437103271484375, -0.3634185791015625, -0.33246612548828125, -0.301513671875, -0.27056121826171875, -0.2396087646484375, -0.20865631103515625, -0.177703857421875, -0.14675140380859375, -0.1157989501953125, -0.08484649658203125, -0.05389404296875, -0.02294158935546875, 0.0080108642578125, 0.03896331787109375, 0.069915771484375, 0.10086822509765625, 0.1318206787109375, 0.16277313232421875, 0.1937255859375, 0.22467803955078125, 0.2556304931640625, 0.28658294677734375, 0.317535400390625, 0.34848785400390625, 0.3794403076171875, 0.41039276123046875, 0.44134521484375, 0.47229766845703125, 0.5032501220703125, 0.5342025756835938, 0.565155029296875, 0.5961074829101562, 0.6270599365234375, 0.6580123901367188, 0.68896484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 11.0, 28.0, 75.0, 132.0, 293.0, 638.0, 2085.0, 9884.0, 155936.0, 837044.0, 35802.0, 4545.0, 1192.0, 417.0, 208.0, 102.0, 57.0, 26.0, 29.0, 9.0, 9.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.99822998046875, -4.8480224609375, -4.69781494140625, -4.547607421875, -4.39739990234375, -4.2471923828125, -4.09698486328125, -3.94677734375, -3.79656982421875, -3.6463623046875, -3.49615478515625, -3.345947265625, -3.19573974609375, -3.0455322265625, -2.89532470703125, -2.7451171875, -2.59490966796875, -2.4447021484375, -2.29449462890625, -2.144287109375, -1.99407958984375, -1.8438720703125, -1.69366455078125, -1.54345703125, -1.39324951171875, -1.2430419921875, -1.09283447265625, -0.942626953125, -0.79241943359375, -0.6422119140625, -0.49200439453125, -0.341796875, -0.19158935546875, -0.0413818359375, 0.10882568359375, 0.259033203125, 0.40924072265625, 0.5594482421875, 0.70965576171875, 0.85986328125, 1.01007080078125, 1.1602783203125, 1.31048583984375, 1.460693359375, 1.61090087890625, 1.7611083984375, 1.91131591796875, 2.0615234375, 2.21173095703125, 2.3619384765625, 2.51214599609375, 2.662353515625, 2.81256103515625, 2.9627685546875, 3.11297607421875, 3.26318359375, 3.41339111328125, 3.5635986328125, 3.71380615234375, 3.864013671875, 4.01422119140625, 4.1644287109375, 4.31463623046875, 4.46484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 1.0, 5.0, 10.0, 13.0, 13.0, 23.0, 21.0, 34.0, 33.0, 58.0, 55.0, 72.0, 51.0, 69.0, 62.0, 76.0, 62.0, 55.0, 46.0, 48.0, 29.0, 25.0, 30.0, 23.0, 21.0, 10.0, 11.0, 15.0, 6.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.7020263671875, -3.595458984375, -3.4888916015625, -3.38232421875, -3.2757568359375, -3.169189453125, -3.0626220703125, -2.9560546875, -2.8494873046875, -2.742919921875, -2.6363525390625, -2.52978515625, -2.4232177734375, -2.316650390625, -2.2100830078125, -2.103515625, -1.9969482421875, -1.890380859375, -1.7838134765625, -1.67724609375, -1.5706787109375, -1.464111328125, -1.3575439453125, -1.2509765625, -1.1444091796875, -1.037841796875, -0.9312744140625, -0.82470703125, -0.7181396484375, -0.611572265625, -0.5050048828125, -0.3984375, -0.2918701171875, -0.185302734375, -0.0787353515625, 0.02783203125, 0.1343994140625, 0.240966796875, 0.3475341796875, 0.4541015625, 0.5606689453125, 0.667236328125, 0.7738037109375, 0.88037109375, 0.9869384765625, 1.093505859375, 1.2000732421875, 1.306640625, 1.4132080078125, 1.519775390625, 1.6263427734375, 1.73291015625, 1.8394775390625, 1.946044921875, 2.0526123046875, 2.1591796875, 2.2657470703125, 2.372314453125, 2.4788818359375, 2.58544921875, 2.6920166015625, 2.798583984375, 2.9051513671875, 3.01171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 7.0, 18.0, 40.0, 61.0, 178.0, 533.0, 2137.0, 11839.0, 898996.0, 126127.0, 6672.0, 1330.0, 393.0, 103.0, 52.0, 30.0, 18.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.47265625, -5.282958984375, -5.09326171875, -4.903564453125, -4.7138671875, -4.524169921875, -4.33447265625, -4.144775390625, -3.955078125, -3.765380859375, -3.57568359375, -3.385986328125, -3.1962890625, -3.006591796875, -2.81689453125, -2.627197265625, -2.4375, -2.247802734375, -2.05810546875, -1.868408203125, -1.6787109375, -1.489013671875, -1.29931640625, -1.109619140625, -0.919921875, -0.730224609375, -0.54052734375, -0.350830078125, -0.1611328125, 0.028564453125, 0.21826171875, 0.407958984375, 0.59765625, 0.787353515625, 0.97705078125, 1.166748046875, 1.3564453125, 1.546142578125, 1.73583984375, 1.925537109375, 2.115234375, 2.304931640625, 2.49462890625, 2.684326171875, 2.8740234375, 3.063720703125, 3.25341796875, 3.443115234375, 3.6328125, 3.822509765625, 4.01220703125, 4.201904296875, 4.3916015625, 4.581298828125, 4.77099609375, 4.960693359375, 5.150390625, 5.340087890625, 5.52978515625, 5.719482421875, 5.9091796875, 6.098876953125, 6.28857421875, 6.478271484375, 6.66796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 12.0, 19.0, 37.0, 79.0, 192.0, 388.0, 157.0, 60.0, 32.0, 15.0, 3.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007786750793457031, -0.0007607340812683105, -0.000742793083190918, -0.0007248520851135254, -0.0007069110870361328, -0.0006889700889587402, -0.0006710290908813477, -0.0006530880928039551, -0.0006351470947265625, -0.0006172060966491699, -0.0005992650985717773, -0.0005813241004943848, -0.0005633831024169922, -0.0005454421043395996, -0.000527501106262207, -0.0005095601081848145, -0.0004916191101074219, -0.0004736781120300293, -0.0004557371139526367, -0.00043779611587524414, -0.00041985511779785156, -0.000401914119720459, -0.0003839731216430664, -0.00036603212356567383, -0.00034809112548828125, -0.00033015012741088867, -0.0003122091293334961, -0.0002942681312561035, -0.00027632713317871094, -0.00025838613510131836, -0.00024044513702392578, -0.0002225041389465332, -0.00020456314086914062, -0.00018662214279174805, -0.00016868114471435547, -0.0001507401466369629, -0.0001327991485595703, -0.00011485815048217773, -9.691715240478516e-05, -7.897615432739258e-05, -6.103515625e-05, -4.309415817260742e-05, -2.5153160095214844e-05, -7.212162017822266e-06, 1.0728836059570312e-05, 2.866983413696289e-05, 4.661083221435547e-05, 6.455183029174805e-05, 8.249282836914062e-05, 0.0001004338264465332, 0.00011837482452392578, 0.00013631582260131836, 0.00015425682067871094, 0.00017219781875610352, 0.0001901388168334961, 0.00020807981491088867, 0.00022602081298828125, 0.00024396181106567383, 0.0002619028091430664, 0.000279843807220459, 0.00029778480529785156, 0.00031572580337524414, 0.0003336668014526367, 0.0003516077995300293, 0.0003695487976074219]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 15.0, 21.0, 30.0, 68.0, 155.0, 368.0, 1256.0, 9466.0, 959681.0, 72635.0, 3700.0, 717.0, 244.0, 82.0, 40.0, 26.0, 13.0, 11.0, 5.0, 9.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.2890625, -9.05560302734375, -8.8221435546875, -8.58868408203125, -8.355224609375, -8.12176513671875, -7.8883056640625, -7.65484619140625, -7.42138671875, -7.18792724609375, -6.9544677734375, -6.72100830078125, -6.487548828125, -6.25408935546875, -6.0206298828125, -5.78717041015625, -5.5537109375, -5.32025146484375, -5.0867919921875, -4.85333251953125, -4.619873046875, -4.38641357421875, -4.1529541015625, -3.91949462890625, -3.68603515625, -3.45257568359375, -3.2191162109375, -2.98565673828125, -2.752197265625, -2.51873779296875, -2.2852783203125, -2.05181884765625, -1.818359375, -1.58489990234375, -1.3514404296875, -1.11798095703125, -0.884521484375, -0.65106201171875, -0.4176025390625, -0.18414306640625, 0.04931640625, 0.28277587890625, 0.5162353515625, 0.74969482421875, 0.983154296875, 1.21661376953125, 1.4500732421875, 1.68353271484375, 1.9169921875, 2.15045166015625, 2.3839111328125, 2.61737060546875, 2.850830078125, 3.08428955078125, 3.3177490234375, 3.55120849609375, 3.78466796875, 4.01812744140625, 4.2515869140625, 4.48504638671875, 4.718505859375, 4.95196533203125, 5.1854248046875, 5.41888427734375, 5.65234375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 8.0, 6.0, 14.0, 16.0, 74.0, 412.0, 371.0, 51.0, 20.0, 13.0, 10.0, 7.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.1400146484375, -7.936279296875, -7.7325439453125, -7.52880859375, -7.3250732421875, -7.121337890625, -6.9176025390625, -6.7138671875, -6.5101318359375, -6.306396484375, -6.1026611328125, -5.89892578125, -5.6951904296875, -5.491455078125, -5.2877197265625, -5.083984375, -4.8802490234375, -4.676513671875, -4.4727783203125, -4.26904296875, -4.0653076171875, -3.861572265625, -3.6578369140625, -3.4541015625, -3.2503662109375, -3.046630859375, -2.8428955078125, -2.63916015625, -2.4354248046875, -2.231689453125, -2.0279541015625, -1.82421875, -1.6204833984375, -1.416748046875, -1.2130126953125, -1.00927734375, -0.8055419921875, -0.601806640625, -0.3980712890625, -0.1943359375, 0.0093994140625, 0.213134765625, 0.4168701171875, 0.62060546875, 0.8243408203125, 1.028076171875, 1.2318115234375, 1.435546875, 1.6392822265625, 1.843017578125, 2.0467529296875, 2.25048828125, 2.4542236328125, 2.657958984375, 2.8616943359375, 3.0654296875, 3.2691650390625, 3.472900390625, 3.6766357421875, 3.88037109375, 4.0841064453125, 4.287841796875, 4.4915771484375, 4.6953125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 10.0, 3.0, 14.0, 25.0, 61.0, 106.0, 185.0, 266.0, 195.0, 83.0, 36.0, 12.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.32080078125, -40.34654235839844, -39.372283935546875, -38.39802551269531, -37.42376708984375, -36.44950866699219, -35.475250244140625, -34.50099182128906, -33.5267333984375, -32.55247497558594, -31.578216552734375, -30.603958129882812, -29.62969970703125, -28.655441284179688, -27.681182861328125, -26.706924438476562, -25.732666015625, -24.758407592773438, -23.784149169921875, -22.809890747070312, -21.83563232421875, -20.861373901367188, -19.887115478515625, -18.912857055664062, -17.9385986328125, -16.964340209960938, -15.990081787109375, -15.015823364257812, -14.04156494140625, -13.067306518554688, -12.093048095703125, -11.118789672851562, -10.144533157348633, -9.17027473449707, -8.196016311645508, -7.221757888793945, -6.247499465942383, -5.27324104309082, -4.298982620239258, -3.3247241973876953, -2.350465774536133, -1.3762073516845703, -0.4019489288330078, 0.5723094940185547, 1.5465679168701172, 2.5208263397216797, 3.495084762573242, 4.469343185424805, 5.443601608276367, 6.41786003112793, 7.392118453979492, 8.366376876831055, 9.340635299682617, 10.31489372253418, 11.289152145385742, 12.263410568237305, 13.237668991088867, 14.21192741394043, 15.186185836791992, 16.160444259643555, 17.134702682495117, 18.10896110534668, 19.083219528198242, 20.057477951049805, 21.031736373901367]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 8.0, 5.0, 11.0, 9.0, 13.0, 22.0, 20.0, 25.0, 25.0, 25.0, 33.0, 35.0, 35.0, 22.0, 40.0, 35.0, 59.0, 41.0, 39.0, 54.0, 34.0, 42.0, 37.0, 33.0, 35.0, 35.0, 29.0, 24.0, 31.0, 20.0, 19.0, 13.0, 9.0, 13.0, 16.0, 10.0, 8.0, 6.0, 9.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-14.256242752075195, -13.861167907714844, -13.466093063354492, -13.07101821899414, -12.675944328308105, -12.280869483947754, -11.885794639587402, -11.49071979522705, -11.0956449508667, -10.700570106506348, -10.305495262145996, -9.910421371459961, -9.51534652709961, -9.120271682739258, -8.725196838378906, -8.330121994018555, -7.935047626495361, -7.53997278213501, -7.144898414611816, -6.749823570251465, -6.354748725891113, -5.959673881530762, -5.564599514007568, -5.169524669647217, -4.774450302124023, -4.379375457763672, -3.9843008518218994, -3.589226245880127, -3.1941514015197754, -2.799076795578003, -2.4040021896362305, -2.008927345275879, -1.6138525009155273, -1.2187777757644653, -0.8237031102180481, -0.42862844467163086, -0.03355371952056885, 0.36152100563049316, 0.7565956115722656, 1.1516704559326172, 1.5467450618743896, 1.9418197870254517, 2.3368945121765137, 2.731969118118286, 3.1270437240600586, 3.52211856842041, 3.9171931743621826, 4.312268257141113, 4.707342624664307, 5.102417469024658, 5.497491836547852, 5.892566680908203, 6.287641525268555, 6.682716369628906, 7.0777907371521, 7.472865581512451, 7.8679399490356445, 8.263014793395996, 8.658089637756348, 9.053163528442383, 9.448238372802734, 9.843313217163086, 10.238388061523438, 10.633462905883789, 11.02853775024414]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 10.0, 13.0, 14.0, 16.0, 25.0, 31.0, 29.0, 50.0, 81.0, 155.0, 293.0, 882.0, 3727.0, 31740.0, 4126162.0, 26118.0, 3365.0, 826.0, 304.0, 143.0, 90.0, 58.0, 31.0, 28.0, 19.0, 16.0, 9.0, 11.0, 9.0, 8.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.59765625, -7.409912109375, -7.22216796875, -7.034423828125, -6.8466796875, -6.658935546875, -6.47119140625, -6.283447265625, -6.095703125, -5.907958984375, -5.72021484375, -5.532470703125, -5.3447265625, -5.156982421875, -4.96923828125, -4.781494140625, -4.59375, -4.406005859375, -4.21826171875, -4.030517578125, -3.8427734375, -3.655029296875, -3.46728515625, -3.279541015625, -3.091796875, -2.904052734375, -2.71630859375, -2.528564453125, -2.3408203125, -2.153076171875, -1.96533203125, -1.777587890625, -1.58984375, -1.402099609375, -1.21435546875, -1.026611328125, -0.8388671875, -0.651123046875, -0.46337890625, -0.275634765625, -0.087890625, 0.099853515625, 0.28759765625, 0.475341796875, 0.6630859375, 0.850830078125, 1.03857421875, 1.226318359375, 1.4140625, 1.601806640625, 1.78955078125, 1.977294921875, 2.1650390625, 2.352783203125, 2.54052734375, 2.728271484375, 2.916015625, 3.103759765625, 3.29150390625, 3.479248046875, 3.6669921875, 3.854736328125, 4.04248046875, 4.230224609375, 4.41796875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 17.0, 15.0, 17.0, 29.0, 29.0, 59.0, 55.0, 61.0, 74.0, 78.0, 76.0, 86.0, 73.0, 72.0, 64.0, 61.0, 52.0, 23.0, 21.0, 15.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.568359375, -1.5324478149414062, -1.4965362548828125, -1.4606246948242188, -1.424713134765625, -1.3888015747070312, -1.3528900146484375, -1.3169784545898438, -1.28106689453125, -1.2451553344726562, -1.2092437744140625, -1.1733322143554688, -1.137420654296875, -1.1015090942382812, -1.0655975341796875, -1.0296859741210938, -0.9937744140625, -0.9578628540039062, -0.9219512939453125, -0.8860397338867188, -0.850128173828125, -0.8142166137695312, -0.7783050537109375, -0.7423934936523438, -0.70648193359375, -0.6705703735351562, -0.6346588134765625, -0.5987472534179688, -0.562835693359375, -0.5269241333007812, -0.4910125732421875, -0.45510101318359375, -0.419189453125, -0.38327789306640625, -0.3473663330078125, -0.31145477294921875, -0.275543212890625, -0.23963165283203125, -0.2037200927734375, -0.16780853271484375, -0.13189697265625, -0.09598541259765625, -0.0600738525390625, -0.02416229248046875, 0.011749267578125, 0.04766082763671875, 0.0835723876953125, 0.11948394775390625, 0.1553955078125, 0.19130706787109375, 0.2272186279296875, 0.26313018798828125, 0.299041748046875, 0.33495330810546875, 0.3708648681640625, 0.40677642822265625, 0.44268798828125, 0.47859954833984375, 0.5145111083984375, 0.5504226684570312, 0.586334228515625, 0.6222457885742188, 0.6581573486328125, 0.6940689086914062, 0.72998046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 21.0, 30.0, 82.0, 126.0, 292.0, 915.0, 7068.0, 4116433.0, 65471.0, 2908.0, 526.0, 198.0, 95.0, 47.0, 29.0, 15.0, 12.0, 10.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.008544921875, -5.68896484375, -5.369384765625, -5.0498046875, -4.730224609375, -4.41064453125, -4.091064453125, -3.771484375, -3.451904296875, -3.13232421875, -2.812744140625, -2.4931640625, -2.173583984375, -1.85400390625, -1.534423828125, -1.21484375, -0.895263671875, -0.57568359375, -0.256103515625, 0.0634765625, 0.383056640625, 0.70263671875, 1.022216796875, 1.341796875, 1.661376953125, 1.98095703125, 2.300537109375, 2.6201171875, 2.939697265625, 3.25927734375, 3.578857421875, 3.8984375, 4.218017578125, 4.53759765625, 4.857177734375, 5.1767578125, 5.496337890625, 5.81591796875, 6.135498046875, 6.455078125, 6.774658203125, 7.09423828125, 7.413818359375, 7.7333984375, 8.052978515625, 8.37255859375, 8.692138671875, 9.01171875, 9.331298828125, 9.65087890625, 9.970458984375, 10.2900390625, 10.609619140625, 10.92919921875, 11.248779296875, 11.568359375, 11.887939453125, 12.20751953125, 12.527099609375, 12.8466796875, 13.166259765625, 13.48583984375, 13.805419921875, 14.125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 10.0, 29.0, 31.0, 170.0, 3222.0, 498.0, 56.0, 14.0, 15.0, 7.0, 8.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3125, -2.234893798828125, -2.15728759765625, -2.079681396484375, -2.0020751953125, -1.924468994140625, -1.84686279296875, -1.769256591796875, -1.691650390625, -1.614044189453125, -1.53643798828125, -1.458831787109375, -1.3812255859375, -1.303619384765625, -1.22601318359375, -1.148406982421875, -1.07080078125, -0.993194580078125, -0.91558837890625, -0.837982177734375, -0.7603759765625, -0.682769775390625, -0.60516357421875, -0.527557373046875, -0.449951171875, -0.372344970703125, -0.29473876953125, -0.217132568359375, -0.1395263671875, -0.061920166015625, 0.01568603515625, 0.093292236328125, 0.1708984375, 0.248504638671875, 0.32611083984375, 0.403717041015625, 0.4813232421875, 0.558929443359375, 0.63653564453125, 0.714141845703125, 0.791748046875, 0.869354248046875, 0.94696044921875, 1.024566650390625, 1.1021728515625, 1.179779052734375, 1.25738525390625, 1.334991455078125, 1.41259765625, 1.490203857421875, 1.56781005859375, 1.645416259765625, 1.7230224609375, 1.800628662109375, 1.87823486328125, 1.955841064453125, 2.033447265625, 2.111053466796875, 2.18865966796875, 2.266265869140625, 2.3438720703125, 2.421478271484375, 2.49908447265625, 2.576690673828125, 2.654296875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 10.0, 8.0, 13.0, 36.0, 70.0, 119.0, 177.0, 207.0, 140.0, 100.0, 48.0, 29.0, 16.0, 11.0, 6.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.163535118103027, -7.940217971801758, -7.71690034866333, -7.493582725524902, -7.270265579223633, -7.046948432922363, -6.8236308097839355, -6.600313186645508, -6.376996040344238, -6.153678894042969, -5.930361270904541, -5.707043647766113, -5.483726501464844, -5.260409355163574, -5.0370917320251465, -4.813774108886719, -4.590456962585449, -4.36713981628418, -4.143822193145752, -3.9205048084259033, -3.6971874237060547, -3.473870038986206, -3.2505526542663574, -3.027235269546509, -2.80391788482666, -2.5806005001068115, -2.357283115386963, -2.1339657306671143, -1.9106483459472656, -1.687330961227417, -1.4640135765075684, -1.2406961917877197, -1.017378330230713, -0.7940609455108643, -0.5707435607910156, -0.347426176071167, -0.12410879135131836, 0.09920859336853027, 0.3225259780883789, 0.5458433628082275, 0.7691607475280762, 0.9924781322479248, 1.2157955169677734, 1.439112901687622, 1.6624302864074707, 1.8857476711273193, 2.109065055847168, 2.3323824405670166, 2.5556998252868652, 2.779017210006714, 3.0023345947265625, 3.225651979446411, 3.4489693641662598, 3.6722867488861084, 3.895604133605957, 4.118921279907227, 4.342238903045654, 4.565556526184082, 4.788873672485352, 5.012190818786621, 5.235508441925049, 5.458826065063477, 5.682143211364746, 5.905460357666016, 6.128777980804443]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 13.0, 7.0, 2.0, 13.0, 20.0, 17.0, 20.0, 21.0, 30.0, 30.0, 38.0, 40.0, 34.0, 37.0, 57.0, 44.0, 54.0, 43.0, 39.0, 51.0, 40.0, 40.0, 50.0, 32.0, 35.0, 36.0, 26.0, 14.0, 17.0, 15.0, 19.0, 15.0, 14.0, 8.0, 4.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-3.828338384628296, -3.725740432739258, -3.623142719268799, -3.5205447673797607, -3.4179468154907227, -3.3153488636016846, -3.2127509117126465, -3.1101531982421875, -3.0075552463531494, -2.9049572944641113, -2.8023595809936523, -2.6997616291046143, -2.597163677215576, -2.494565725326538, -2.3919677734375, -2.289370059967041, -2.186772108078003, -2.084174156188965, -1.9815763235092163, -1.8789784908294678, -1.7763805389404297, -1.6737825870513916, -1.571184754371643, -1.4685869216918945, -1.3659889698028564, -1.2633910179138184, -1.1607931852340698, -1.0581953525543213, -0.9555974006652832, -0.8529995083808899, -0.7504016160964966, -0.6478037238121033, -0.5452060699462891, -0.44260817766189575, -0.34001028537750244, -0.23741239309310913, -0.13481450080871582, -0.03221660852432251, 0.0703812837600708, 0.1729791760444641, 0.2755770683288574, 0.37817496061325073, 0.48077285289764404, 0.5833707451820374, 0.6859686374664307, 0.788566529750824, 0.8911644220352173, 0.9937623143196106, 1.096360206604004, 1.198958158493042, 1.3015559911727905, 1.404153823852539, 1.5067517757415771, 1.6093497276306152, 1.7119475603103638, 1.8145453929901123, 1.9171433448791504, 2.0197412967681885, 2.1223392486572266, 2.2249369621276855, 2.3275349140167236, 2.4301328659057617, 2.5327305793762207, 2.635328531265259, 2.737926483154297]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 15.0, 2.0, 14.0, 18.0, 37.0, 60.0, 79.0, 213.0, 415.0, 912.0, 2277.0, 5841.0, 18191.0, 75007.0, 503634.0, 363877.0, 55300.0, 14394.0, 4851.0, 1886.0, 815.0, 330.0, 163.0, 72.0, 34.0, 25.0, 16.0, 14.0, 14.0, 11.0, 3.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.876953125, -2.789520263671875, -2.70208740234375, -2.614654541015625, -2.5272216796875, -2.439788818359375, -2.35235595703125, -2.264923095703125, -2.177490234375, -2.090057373046875, -2.00262451171875, -1.915191650390625, -1.8277587890625, -1.740325927734375, -1.65289306640625, -1.565460205078125, -1.47802734375, -1.390594482421875, -1.30316162109375, -1.215728759765625, -1.1282958984375, -1.040863037109375, -0.95343017578125, -0.865997314453125, -0.778564453125, -0.691131591796875, -0.60369873046875, -0.516265869140625, -0.4288330078125, -0.341400146484375, -0.25396728515625, -0.166534423828125, -0.0791015625, 0.008331298828125, 0.09576416015625, 0.183197021484375, 0.2706298828125, 0.358062744140625, 0.44549560546875, 0.532928466796875, 0.620361328125, 0.707794189453125, 0.79522705078125, 0.882659912109375, 0.9700927734375, 1.057525634765625, 1.14495849609375, 1.232391357421875, 1.31982421875, 1.407257080078125, 1.49468994140625, 1.582122802734375, 1.6695556640625, 1.756988525390625, 1.84442138671875, 1.931854248046875, 2.019287109375, 2.106719970703125, 2.19415283203125, 2.281585693359375, 2.3690185546875, 2.456451416015625, 2.54388427734375, 2.631317138671875, 2.71875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 5.0, 14.0, 14.0, 17.0, 28.0, 33.0, 36.0, 56.0, 60.0, 75.0, 65.0, 85.0, 76.0, 76.0, 82.0, 57.0, 69.0, 46.0, 30.0, 31.0, 25.0, 5.0, 7.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.666015625, -1.6298446655273438, -1.5936737060546875, -1.5575027465820312, -1.521331787109375, -1.4851608276367188, -1.4489898681640625, -1.4128189086914062, -1.37664794921875, -1.3404769897460938, -1.3043060302734375, -1.2681350708007812, -1.231964111328125, -1.1957931518554688, -1.1596221923828125, -1.1234512329101562, -1.0872802734375, -1.0511093139648438, -1.0149383544921875, -0.9787673950195312, -0.942596435546875, -0.9064254760742188, -0.8702545166015625, -0.8340835571289062, -0.79791259765625, -0.7617416381835938, -0.7255706787109375, -0.6893997192382812, -0.653228759765625, -0.6170578002929688, -0.5808868408203125, -0.5447158813476562, -0.508544921875, -0.47237396240234375, -0.4362030029296875, -0.40003204345703125, -0.363861083984375, -0.32769012451171875, -0.2915191650390625, -0.25534820556640625, -0.21917724609375, -0.18300628662109375, -0.1468353271484375, -0.11066436767578125, -0.074493408203125, -0.03832244873046875, -0.0021514892578125, 0.03401947021484375, 0.0701904296875, 0.10636138916015625, 0.1425323486328125, 0.17870330810546875, 0.214874267578125, 0.25104522705078125, 0.2872161865234375, 0.32338714599609375, 0.35955810546875, 0.39572906494140625, 0.4319000244140625, 0.46807098388671875, 0.504241943359375, 0.5404129028320312, 0.5765838623046875, 0.6127548217773438, 0.64892578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 7.0, 10.0, 9.0, 11.0, 28.0, 36.0, 91.0, 257.0, 934.0, 4712.0, 39167.0, 841086.0, 149284.0, 10450.0, 1679.0, 477.0, 137.0, 57.0, 29.0, 17.0, 11.0, 10.0, 6.0, 5.0, 8.0, 6.0, 4.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.2021484375, -6.033203125, -5.8642578125, -5.6953125, -5.5263671875, -5.357421875, -5.1884765625, -5.01953125, -4.8505859375, -4.681640625, -4.5126953125, -4.34375, -4.1748046875, -4.005859375, -3.8369140625, -3.66796875, -3.4990234375, -3.330078125, -3.1611328125, -2.9921875, -2.8232421875, -2.654296875, -2.4853515625, -2.31640625, -2.1474609375, -1.978515625, -1.8095703125, -1.640625, -1.4716796875, -1.302734375, -1.1337890625, -0.96484375, -0.7958984375, -0.626953125, -0.4580078125, -0.2890625, -0.1201171875, 0.048828125, 0.2177734375, 0.38671875, 0.5556640625, 0.724609375, 0.8935546875, 1.0625, 1.2314453125, 1.400390625, 1.5693359375, 1.73828125, 1.9072265625, 2.076171875, 2.2451171875, 2.4140625, 2.5830078125, 2.751953125, 2.9208984375, 3.08984375, 3.2587890625, 3.427734375, 3.5966796875, 3.765625, 3.9345703125, 4.103515625, 4.2724609375, 4.44140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 7.0, 3.0, 8.0, 8.0, 12.0, 19.0, 26.0, 28.0, 18.0, 27.0, 32.0, 48.0, 53.0, 50.0, 70.0, 56.0, 58.0, 61.0, 55.0, 46.0, 66.0, 34.0, 31.0, 32.0, 30.0, 20.0, 28.0, 22.0, 11.0, 11.0, 9.0, 15.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-4.5546875, -4.4451904296875, -4.335693359375, -4.2261962890625, -4.11669921875, -4.0072021484375, -3.897705078125, -3.7882080078125, -3.6787109375, -3.5692138671875, -3.459716796875, -3.3502197265625, -3.24072265625, -3.1312255859375, -3.021728515625, -2.9122314453125, -2.802734375, -2.6932373046875, -2.583740234375, -2.4742431640625, -2.36474609375, -2.2552490234375, -2.145751953125, -2.0362548828125, -1.9267578125, -1.8172607421875, -1.707763671875, -1.5982666015625, -1.48876953125, -1.3792724609375, -1.269775390625, -1.1602783203125, -1.05078125, -0.9412841796875, -0.831787109375, -0.7222900390625, -0.61279296875, -0.5032958984375, -0.393798828125, -0.2843017578125, -0.1748046875, -0.0653076171875, 0.044189453125, 0.1536865234375, 0.26318359375, 0.3726806640625, 0.482177734375, 0.5916748046875, 0.701171875, 0.8106689453125, 0.920166015625, 1.0296630859375, 1.13916015625, 1.2486572265625, 1.358154296875, 1.4676513671875, 1.5771484375, 1.6866455078125, 1.796142578125, 1.9056396484375, 2.01513671875, 2.1246337890625, 2.234130859375, 2.3436279296875, 2.453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 11.0, 7.0, 11.0, 16.0, 22.0, 37.0, 48.0, 103.0, 232.0, 571.0, 1850.0, 8409.0, 954097.0, 77241.0, 4003.0, 1124.0, 403.0, 154.0, 76.0, 46.0, 27.0, 20.0, 18.0, 13.0, 6.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-9.0546875, -8.8525390625, -8.650390625, -8.4482421875, -8.24609375, -8.0439453125, -7.841796875, -7.6396484375, -7.4375, -7.2353515625, -7.033203125, -6.8310546875, -6.62890625, -6.4267578125, -6.224609375, -6.0224609375, -5.8203125, -5.6181640625, -5.416015625, -5.2138671875, -5.01171875, -4.8095703125, -4.607421875, -4.4052734375, -4.203125, -4.0009765625, -3.798828125, -3.5966796875, -3.39453125, -3.1923828125, -2.990234375, -2.7880859375, -2.5859375, -2.3837890625, -2.181640625, -1.9794921875, -1.77734375, -1.5751953125, -1.373046875, -1.1708984375, -0.96875, -0.7666015625, -0.564453125, -0.3623046875, -0.16015625, 0.0419921875, 0.244140625, 0.4462890625, 0.6484375, 0.8505859375, 1.052734375, 1.2548828125, 1.45703125, 1.6591796875, 1.861328125, 2.0634765625, 2.265625, 2.4677734375, 2.669921875, 2.8720703125, 3.07421875, 3.2763671875, 3.478515625, 3.6806640625, 3.8828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 2.0, 11.0, 17.0, 28.0, 43.0, 107.0, 234.0, 311.0, 133.0, 46.0, 31.0, 13.0, 4.0, 9.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006165504455566406, -0.0006031878292560577, -0.0005898252129554749, -0.000576462596654892, -0.0005630999803543091, -0.0005497373640537262, -0.0005363747477531433, -0.0005230121314525604, -0.0005096495151519775, -0.0004962868988513947, -0.00048292428255081177, -0.0004695616662502289, -0.000456199049949646, -0.0004428364336490631, -0.0004294738173484802, -0.00041611120104789734, -0.00040274858474731445, -0.00038938596844673157, -0.0003760233521461487, -0.0003626607358455658, -0.0003492981195449829, -0.0003359355032444, -0.00032257288694381714, -0.00030921027064323425, -0.00029584765434265137, -0.0002824850380420685, -0.0002691224217414856, -0.0002557598054409027, -0.00024239718914031982, -0.00022903457283973694, -0.00021567195653915405, -0.00020230934023857117, -0.00018894672393798828, -0.0001755841076374054, -0.0001622214913368225, -0.00014885887503623962, -0.00013549625873565674, -0.00012213364243507385, -0.00010877102613449097, -9.540840983390808e-05, -8.20457935333252e-05, -6.868317723274231e-05, -5.5320560932159424e-05, -4.195794463157654e-05, -2.8595328330993652e-05, -1.5232712030410767e-05, -1.8700957298278809e-06, 1.1492520570755005e-05, 2.485513687133789e-05, 3.8217753171920776e-05, 5.158036947250366e-05, 6.494298577308655e-05, 7.830560207366943e-05, 9.166821837425232e-05, 0.0001050308346748352, 0.00011839345097541809, 0.00013175606727600098, 0.00014511868357658386, 0.00015848129987716675, 0.00017184391617774963, 0.00018520653247833252, 0.0001985691487789154, 0.0002119317650794983, 0.00022529438138008118, 0.00023865699768066406]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 10.0, 10.0, 45.0, 88.0, 307.0, 934.0, 3448.0, 58840.0, 974307.0, 8035.0, 1730.0, 521.0, 180.0, 50.0, 25.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8125, -5.60662841796875, -5.4007568359375, -5.19488525390625, -4.989013671875, -4.78314208984375, -4.5772705078125, -4.37139892578125, -4.16552734375, -3.95965576171875, -3.7537841796875, -3.54791259765625, -3.342041015625, -3.13616943359375, -2.9302978515625, -2.72442626953125, -2.5185546875, -2.31268310546875, -2.1068115234375, -1.90093994140625, -1.695068359375, -1.48919677734375, -1.2833251953125, -1.07745361328125, -0.87158203125, -0.66571044921875, -0.4598388671875, -0.25396728515625, -0.048095703125, 0.15777587890625, 0.3636474609375, 0.56951904296875, 0.775390625, 0.98126220703125, 1.1871337890625, 1.39300537109375, 1.598876953125, 1.80474853515625, 2.0106201171875, 2.21649169921875, 2.42236328125, 2.62823486328125, 2.8341064453125, 3.03997802734375, 3.245849609375, 3.45172119140625, 3.6575927734375, 3.86346435546875, 4.0693359375, 4.27520751953125, 4.4810791015625, 4.68695068359375, 4.892822265625, 5.09869384765625, 5.3045654296875, 5.51043701171875, 5.71630859375, 5.92218017578125, 6.1280517578125, 6.33392333984375, 6.539794921875, 6.74566650390625, 6.9515380859375, 7.15740966796875, 7.36328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 12.0, 13.0, 31.0, 91.0, 170.0, 256.0, 194.0, 87.0, 48.0, 27.0, 23.0, 11.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.130859375, -2.053802490234375, -1.97674560546875, -1.899688720703125, -1.8226318359375, -1.745574951171875, -1.66851806640625, -1.591461181640625, -1.514404296875, -1.437347412109375, -1.36029052734375, -1.283233642578125, -1.2061767578125, -1.129119873046875, -1.05206298828125, -0.975006103515625, -0.89794921875, -0.820892333984375, -0.74383544921875, -0.666778564453125, -0.5897216796875, -0.512664794921875, -0.43560791015625, -0.358551025390625, -0.281494140625, -0.204437255859375, -0.12738037109375, -0.050323486328125, 0.0267333984375, 0.103790283203125, 0.18084716796875, 0.257904052734375, 0.3349609375, 0.412017822265625, 0.48907470703125, 0.566131591796875, 0.6431884765625, 0.720245361328125, 0.79730224609375, 0.874359130859375, 0.951416015625, 1.028472900390625, 1.10552978515625, 1.182586669921875, 1.2596435546875, 1.336700439453125, 1.41375732421875, 1.490814208984375, 1.56787109375, 1.644927978515625, 1.72198486328125, 1.799041748046875, 1.8760986328125, 1.953155517578125, 2.03021240234375, 2.107269287109375, 2.184326171875, 2.261383056640625, 2.33843994140625, 2.415496826171875, 2.4925537109375, 2.569610595703125, 2.64666748046875, 2.723724365234375, 2.80078125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 12.0, 33.0, 109.0, 317.0, 324.0, 155.0, 36.0, 14.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.81879806518555, -32.27683639526367, -30.734874725341797, -29.192913055419922, -27.650951385498047, -26.108989715576172, -24.56702995300293, -23.025068283081055, -21.48310661315918, -19.941144943237305, -18.39918327331543, -16.857223510742188, -15.315260887145996, -13.773299217224121, -12.231338500976562, -10.689376831054688, -9.147415161132812, -7.6054534912109375, -6.063492298126221, -4.521531105041504, -2.979569435119629, -1.437607765197754, 0.10435295104980469, 1.6463146209716797, 3.1882762908935547, 4.73023796081543, 6.2721991539001465, 7.814160346984863, 9.356122016906738, 10.898083686828613, 12.440044403076172, 13.982006072998047, 15.523971557617188, 17.065933227539062, 18.607894897460938, 20.149856567382812, 21.691818237304688, 23.233779907226562, 24.775739669799805, 26.31770133972168, 27.859663009643555, 29.40162467956543, 30.943586349487305, 32.48554611206055, 34.02750778198242, 35.5694694519043, 37.11143112182617, 38.65339279174805, 40.19535446166992, 41.7373161315918, 43.27927780151367, 44.82123947143555, 46.36320114135742, 47.9051628112793, 49.447120666503906, 50.98908233642578, 52.531044006347656, 54.07300567626953, 55.614967346191406, 57.15692901611328, 58.698890686035156, 60.24085235595703, 61.782814025878906, 63.32477569580078, 64.86673736572266]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 9.0, 10.0, 9.0, 20.0, 20.0, 14.0, 15.0, 18.0, 34.0, 36.0, 32.0, 49.0, 43.0, 41.0, 34.0, 47.0, 56.0, 59.0, 44.0, 46.0, 36.0, 51.0, 30.0, 36.0, 35.0, 34.0, 24.0, 16.0, 17.0, 19.0, 11.0, 11.0, 11.0, 11.0, 7.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.812686920166016, -12.33586597442627, -11.859044075012207, -11.382223129272461, -10.905401229858398, -10.428580284118652, -9.951759338378906, -9.474937438964844, -8.998116493225098, -8.521295547485352, -8.044473648071289, -7.567652702331543, -7.090831279754639, -6.614009857177734, -6.137188911437988, -5.660367488861084, -5.18354606628418, -4.706724643707275, -4.229903221130371, -3.753082275390625, -3.2762608528137207, -2.7994394302368164, -2.322618246078491, -1.845797061920166, -1.3689756393432617, -0.892154335975647, -0.4153330326080322, 0.06148827075958252, 0.5383095741271973, 1.0151309967041016, 1.4919521808624268, 1.968773365020752, 2.4455947875976562, 2.9224162101745605, 3.3992373943328857, 3.876058578491211, 4.352880001068115, 4.8297014236450195, 5.306522369384766, 5.78334379196167, 6.260165214538574, 6.7369866371154785, 7.213808059692383, 7.690629005432129, 8.167449951171875, 8.644271850585938, 9.121092796325684, 9.59791374206543, 10.074735641479492, 10.551556587219238, 11.0283784866333, 11.505199432373047, 11.98202133178711, 12.458842277526855, 12.935663223266602, 13.412485122680664, 13.88930606842041, 14.366127014160156, 14.842948913574219, 15.319769859313965, 15.796590805053711, 16.273412704467773, 16.750234603881836, 17.227054595947266, 17.703876495361328]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 7.0, 5.0, 10.0, 17.0, 24.0, 45.0, 61.0, 66.0, 109.0, 198.0, 278.0, 383.0, 662.0, 1093.0, 1973.0, 3533.0, 7884.0, 24721.0, 419602.0, 3684803.0, 30691.0, 8811.0, 3821.0, 2090.0, 1262.0, 703.0, 489.0, 321.0, 216.0, 121.0, 87.0, 61.0, 32.0, 21.0, 23.0, 17.0, 10.0, 11.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.59375, -4.4698486328125, -4.345947265625, -4.2220458984375, -4.09814453125, -3.9742431640625, -3.850341796875, -3.7264404296875, -3.6025390625, -3.4786376953125, -3.354736328125, -3.2308349609375, -3.10693359375, -2.9830322265625, -2.859130859375, -2.7352294921875, -2.611328125, -2.4874267578125, -2.363525390625, -2.2396240234375, -2.11572265625, -1.9918212890625, -1.867919921875, -1.7440185546875, -1.6201171875, -1.4962158203125, -1.372314453125, -1.2484130859375, -1.12451171875, -1.0006103515625, -0.876708984375, -0.7528076171875, -0.62890625, -0.5050048828125, -0.381103515625, -0.2572021484375, -0.13330078125, -0.0093994140625, 0.114501953125, 0.2384033203125, 0.3623046875, 0.4862060546875, 0.610107421875, 0.7340087890625, 0.85791015625, 0.9818115234375, 1.105712890625, 1.2296142578125, 1.353515625, 1.4774169921875, 1.601318359375, 1.7252197265625, 1.84912109375, 1.9730224609375, 2.096923828125, 2.2208251953125, 2.3447265625, 2.4686279296875, 2.592529296875, 2.7164306640625, 2.84033203125, 2.9642333984375, 3.088134765625, 3.2120361328125, 3.3359375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 4.0, 6.0, 6.0, 10.0, 9.0, 30.0, 27.0, 36.0, 46.0, 58.0, 44.0, 63.0, 62.0, 64.0, 66.0, 50.0, 73.0, 61.0, 40.0, 50.0, 46.0, 34.0, 26.0, 25.0, 21.0, 10.0, 17.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.3984375, -1.3647994995117188, -1.3311614990234375, -1.2975234985351562, -1.263885498046875, -1.2302474975585938, -1.1966094970703125, -1.1629714965820312, -1.12933349609375, -1.0956954956054688, -1.0620574951171875, -1.0284194946289062, -0.994781494140625, -0.9611434936523438, -0.9275054931640625, -0.8938674926757812, -0.8602294921875, -0.8265914916992188, -0.7929534912109375, -0.7593154907226562, -0.725677490234375, -0.6920394897460938, -0.6584014892578125, -0.6247634887695312, -0.59112548828125, -0.5574874877929688, -0.5238494873046875, -0.49021148681640625, -0.456573486328125, -0.42293548583984375, -0.3892974853515625, -0.35565948486328125, -0.322021484375, -0.28838348388671875, -0.2547454833984375, -0.22110748291015625, -0.187469482421875, -0.15383148193359375, -0.1201934814453125, -0.08655548095703125, -0.05291748046875, -0.01927947998046875, 0.0143585205078125, 0.04799652099609375, 0.081634521484375, 0.11527252197265625, 0.1489105224609375, 0.18254852294921875, 0.2161865234375, 0.24982452392578125, 0.2834625244140625, 0.31710052490234375, 0.350738525390625, 0.38437652587890625, 0.4180145263671875, 0.45165252685546875, 0.48529052734375, 0.5189285278320312, 0.5525665283203125, 0.5862045288085938, 0.619842529296875, 0.6534805297851562, 0.6871185302734375, 0.7207565307617188, 0.75439453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 19.0, 40.0, 51.0, 89.0, 201.0, 453.0, 1223.0, 4012.0, 20497.0, 4088218.0, 69242.0, 6974.0, 1959.0, 686.0, 271.0, 143.0, 85.0, 42.0, 30.0, 17.0, 7.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.21875, -5.9564208984375, -5.694091796875, -5.4317626953125, -5.16943359375, -4.9071044921875, -4.644775390625, -4.3824462890625, -4.1201171875, -3.8577880859375, -3.595458984375, -3.3331298828125, -3.07080078125, -2.8084716796875, -2.546142578125, -2.2838134765625, -2.021484375, -1.7591552734375, -1.496826171875, -1.2344970703125, -0.97216796875, -0.7098388671875, -0.447509765625, -0.1851806640625, 0.0771484375, 0.3394775390625, 0.601806640625, 0.8641357421875, 1.12646484375, 1.3887939453125, 1.651123046875, 1.9134521484375, 2.17578125, 2.4381103515625, 2.700439453125, 2.9627685546875, 3.22509765625, 3.4874267578125, 3.749755859375, 4.0120849609375, 4.2744140625, 4.5367431640625, 4.799072265625, 5.0614013671875, 5.32373046875, 5.5860595703125, 5.848388671875, 6.1107177734375, 6.373046875, 6.6353759765625, 6.897705078125, 7.1600341796875, 7.42236328125, 7.6846923828125, 7.947021484375, 8.2093505859375, 8.4716796875, 8.7340087890625, 8.996337890625, 9.2586669921875, 9.52099609375, 9.7833251953125, 10.045654296875, 10.3079833984375, 10.5703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 5.0, 1.0, 6.0, 10.0, 15.0, 24.0, 47.0, 171.0, 3415.0, 243.0, 70.0, 21.0, 14.0, 9.0, 10.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.22265625, -1.13897705078125, -1.0552978515625, -0.97161865234375, -0.887939453125, -0.80426025390625, -0.7205810546875, -0.63690185546875, -0.55322265625, -0.46954345703125, -0.3858642578125, -0.30218505859375, -0.218505859375, -0.13482666015625, -0.0511474609375, 0.03253173828125, 0.1162109375, 0.19989013671875, 0.2835693359375, 0.36724853515625, 0.450927734375, 0.53460693359375, 0.6182861328125, 0.70196533203125, 0.78564453125, 0.86932373046875, 0.9530029296875, 1.03668212890625, 1.120361328125, 1.20404052734375, 1.2877197265625, 1.37139892578125, 1.455078125, 1.53875732421875, 1.6224365234375, 1.70611572265625, 1.789794921875, 1.87347412109375, 1.9571533203125, 2.04083251953125, 2.12451171875, 2.20819091796875, 2.2918701171875, 2.37554931640625, 2.459228515625, 2.54290771484375, 2.6265869140625, 2.71026611328125, 2.7939453125, 2.87762451171875, 2.9613037109375, 3.04498291015625, 3.128662109375, 3.21234130859375, 3.2960205078125, 3.37969970703125, 3.46337890625, 3.54705810546875, 3.6307373046875, 3.71441650390625, 3.798095703125, 3.88177490234375, 3.9654541015625, 4.04913330078125, 4.1328125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 7.0, 4.0, 3.0, 7.0, 21.0, 48.0, 100.0, 172.0, 239.0, 190.0, 106.0, 45.0, 20.0, 14.0, 8.0, 6.0, 4.0, 5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.624087810516357, -5.3508381843566895, -5.077588081359863, -4.804338455200195, -4.531088352203369, -4.257838726043701, -3.984588861465454, -3.711338996887207, -3.43808913230896, -3.164839267730713, -2.891589403152466, -2.6183395385742188, -2.345089912414551, -2.0718398094177246, -1.7985901832580566, -1.5253403186798096, -1.2520904541015625, -0.9788405895233154, -0.7055907845497131, -0.43234097957611084, -0.15909111499786377, 0.1141587495803833, 0.3874084949493408, 0.6606583595275879, 0.933908224105835, 1.207158088684082, 1.480407953262329, 1.7536576986312866, 2.026907444000244, 2.3001575469970703, 2.5734071731567383, 2.8466570377349854, 3.119906425476074, 3.3931562900543213, 3.6664061546325684, 3.9396557807922363, 4.2129058837890625, 4.4861555099487305, 4.759405136108398, 5.032655239105225, 5.305905342102051, 5.579154968261719, 5.852405071258545, 6.125654697418213, 6.398904800415039, 6.672154426574707, 6.945404052734375, 7.218654155731201, 7.491903781890869, 7.765153408050537, 8.038403511047363, 8.311653137207031, 8.5849027633667, 8.858153343200684, 9.131402969360352, 9.40465259552002, 9.677902221679688, 9.951151847839355, 10.224401473999023, 10.497652053833008, 10.770901679992676, 11.044151306152344, 11.317400932312012, 11.59065055847168, 11.863901138305664]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 12.0, 16.0, 14.0, 21.0, 29.0, 30.0, 28.0, 30.0, 33.0, 53.0, 60.0, 73.0, 57.0, 62.0, 61.0, 58.0, 52.0, 41.0, 39.0, 48.0, 36.0, 29.0, 29.0, 26.0, 15.0, 8.0, 12.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.688807487487793, -4.528800964355469, -4.3687944412231445, -4.208787441253662, -4.048780918121338, -3.8887743949890137, -3.7287676334381104, -3.568760871887207, -3.408754348754883, -3.2487478256225586, -3.0887410640716553, -2.928734302520752, -2.7687277793884277, -2.6087212562561035, -2.4487144947052, -2.288707733154297, -2.1287012100219727, -1.9686945676803589, -1.8086879253387451, -1.6486812829971313, -1.4886746406555176, -1.3286679983139038, -1.16866135597229, -1.0086547136306763, -0.8486480712890625, -0.6886414289474487, -0.528634786605835, -0.3686281442642212, -0.20862150192260742, -0.04861485958099365, 0.11139178276062012, 0.2713984251022339, 0.43140506744384766, 0.5914117097854614, 0.7514183521270752, 0.911424994468689, 1.0714316368103027, 1.2314382791519165, 1.3914449214935303, 1.551451563835144, 1.7114582061767578, 1.8714648485183716, 2.0314714908599854, 2.1914782524108887, 2.351484775543213, 2.511491298675537, 2.6714980602264404, 2.8315048217773438, 2.991511344909668, 3.151517868041992, 3.3115246295928955, 3.471531391143799, 3.631537914276123, 3.7915444374084473, 3.9515511989593506, 4.111557960510254, 4.271564483642578, 4.431571006774902, 4.591577529907227, 4.751584529876709, 4.911591053009033, 5.071597576141357, 5.23160457611084, 5.391611099243164, 5.551617622375488]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 8.0, 17.0, 23.0, 34.0, 66.0, 87.0, 167.0, 261.0, 569.0, 1177.0, 2296.0, 5013.0, 11864.0, 29687.0, 82193.0, 241705.0, 401015.0, 174228.0, 59538.0, 21735.0, 9007.0, 3980.0, 1838.0, 981.0, 466.0, 232.0, 132.0, 79.0, 50.0, 40.0, 28.0, 16.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7763671875, -1.7158355712890625, -1.655303955078125, -1.5947723388671875, -1.53424072265625, -1.4737091064453125, -1.413177490234375, -1.3526458740234375, -1.2921142578125, -1.2315826416015625, -1.171051025390625, -1.1105194091796875, -1.04998779296875, -0.9894561767578125, -0.928924560546875, -0.8683929443359375, -0.807861328125, -0.7473297119140625, -0.686798095703125, -0.6262664794921875, -0.56573486328125, -0.5052032470703125, -0.444671630859375, -0.3841400146484375, -0.3236083984375, -0.2630767822265625, -0.202545166015625, -0.1420135498046875, -0.08148193359375, -0.0209503173828125, 0.039581298828125, 0.1001129150390625, 0.16064453125, 0.2211761474609375, 0.281707763671875, 0.3422393798828125, 0.40277099609375, 0.4633026123046875, 0.523834228515625, 0.5843658447265625, 0.6448974609375, 0.7054290771484375, 0.765960693359375, 0.8264923095703125, 0.88702392578125, 0.9475555419921875, 1.008087158203125, 1.0686187744140625, 1.129150390625, 1.1896820068359375, 1.250213623046875, 1.3107452392578125, 1.37127685546875, 1.4318084716796875, 1.492340087890625, 1.5528717041015625, 1.6134033203125, 1.6739349365234375, 1.734466552734375, 1.7949981689453125, 1.85552978515625, 1.9160614013671875, 1.976593017578125, 2.0371246337890625, 2.09765625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 7.0, 1.0, 10.0, 13.0, 19.0, 20.0, 26.0, 30.0, 25.0, 29.0, 39.0, 46.0, 61.0, 63.0, 52.0, 77.0, 60.0, 56.0, 47.0, 41.0, 50.0, 32.0, 38.0, 30.0, 19.0, 36.0, 20.0, 18.0, 10.0, 11.0, 6.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3525390625, -1.3187103271484375, -1.284881591796875, -1.2510528564453125, -1.21722412109375, -1.1833953857421875, -1.149566650390625, -1.1157379150390625, -1.0819091796875, -1.0480804443359375, -1.014251708984375, -0.9804229736328125, -0.94659423828125, -0.9127655029296875, -0.878936767578125, -0.8451080322265625, -0.811279296875, -0.7774505615234375, -0.743621826171875, -0.7097930908203125, -0.67596435546875, -0.6421356201171875, -0.608306884765625, -0.5744781494140625, -0.5406494140625, -0.5068206787109375, -0.472991943359375, -0.4391632080078125, -0.40533447265625, -0.3715057373046875, -0.337677001953125, -0.3038482666015625, -0.27001953125, -0.2361907958984375, -0.202362060546875, -0.1685333251953125, -0.13470458984375, -0.1008758544921875, -0.067047119140625, -0.0332183837890625, 0.0006103515625, 0.0344390869140625, 0.068267822265625, 0.1020965576171875, 0.13592529296875, 0.1697540283203125, 0.203582763671875, 0.2374114990234375, 0.271240234375, 0.3050689697265625, 0.338897705078125, 0.3727264404296875, 0.40655517578125, 0.4403839111328125, 0.474212646484375, 0.5080413818359375, 0.5418701171875, 0.5756988525390625, 0.609527587890625, 0.6433563232421875, 0.67718505859375, 0.7110137939453125, 0.744842529296875, 0.7786712646484375, 0.8125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 7.0, 1.0, 3.0, 6.0, 9.0, 6.0, 21.0, 16.0, 26.0, 33.0, 46.0, 69.0, 102.0, 167.0, 337.0, 644.0, 1817.0, 7729.0, 48830.0, 562887.0, 382283.0, 34749.0, 5966.0, 1455.0, 579.0, 251.0, 168.0, 117.0, 62.0, 43.0, 29.0, 18.0, 15.0, 15.0, 11.0, 11.0, 10.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.9453125, -3.81768798828125, -3.6900634765625, -3.56243896484375, -3.434814453125, -3.30718994140625, -3.1795654296875, -3.05194091796875, -2.92431640625, -2.79669189453125, -2.6690673828125, -2.54144287109375, -2.413818359375, -2.28619384765625, -2.1585693359375, -2.03094482421875, -1.9033203125, -1.77569580078125, -1.6480712890625, -1.52044677734375, -1.392822265625, -1.26519775390625, -1.1375732421875, -1.00994873046875, -0.88232421875, -0.75469970703125, -0.6270751953125, -0.49945068359375, -0.371826171875, -0.24420166015625, -0.1165771484375, 0.01104736328125, 0.138671875, 0.26629638671875, 0.3939208984375, 0.52154541015625, 0.649169921875, 0.77679443359375, 0.9044189453125, 1.03204345703125, 1.15966796875, 1.28729248046875, 1.4149169921875, 1.54254150390625, 1.670166015625, 1.79779052734375, 1.9254150390625, 2.05303955078125, 2.1806640625, 2.30828857421875, 2.4359130859375, 2.56353759765625, 2.691162109375, 2.81878662109375, 2.9464111328125, 3.07403564453125, 3.20166015625, 3.32928466796875, 3.4569091796875, 3.58453369140625, 3.712158203125, 3.83978271484375, 3.9674072265625, 4.09503173828125, 4.22265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 9.0, 12.0, 15.0, 11.0, 12.0, 20.0, 21.0, 27.0, 31.0, 42.0, 32.0, 46.0, 41.0, 57.0, 42.0, 54.0, 50.0, 45.0, 53.0, 42.0, 37.0, 42.0, 37.0, 33.0, 25.0, 40.0, 14.0, 18.0, 18.0, 14.0, 13.0, 11.0, 7.0, 8.0, 10.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.794921875, -3.656402587890625, -3.51788330078125, -3.379364013671875, -3.2408447265625, -3.102325439453125, -2.96380615234375, -2.825286865234375, -2.686767578125, -2.548248291015625, -2.40972900390625, -2.271209716796875, -2.1326904296875, -1.994171142578125, -1.85565185546875, -1.717132568359375, -1.57861328125, -1.440093994140625, -1.30157470703125, -1.163055419921875, -1.0245361328125, -0.886016845703125, -0.74749755859375, -0.608978271484375, -0.470458984375, -0.331939697265625, -0.19342041015625, -0.054901123046875, 0.0836181640625, 0.222137451171875, 0.36065673828125, 0.499176025390625, 0.6376953125, 0.776214599609375, 0.91473388671875, 1.053253173828125, 1.1917724609375, 1.330291748046875, 1.46881103515625, 1.607330322265625, 1.745849609375, 1.884368896484375, 2.02288818359375, 2.161407470703125, 2.2999267578125, 2.438446044921875, 2.57696533203125, 2.715484619140625, 2.85400390625, 2.992523193359375, 3.13104248046875, 3.269561767578125, 3.4080810546875, 3.546600341796875, 3.68511962890625, 3.823638916015625, 3.962158203125, 4.100677490234375, 4.23919677734375, 4.377716064453125, 4.5162353515625, 4.654754638671875, 4.79327392578125, 4.931793212890625, 5.0703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 12.0, 26.0, 41.0, 72.0, 169.0, 434.0, 1826.0, 13867.0, 883879.0, 140612.0, 6078.0, 1019.0, 256.0, 108.0, 68.0, 40.0, 17.0, 8.0, 5.0, 0.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.82769775390625, -4.6710205078125, -4.51434326171875, -4.357666015625, -4.20098876953125, -4.0443115234375, -3.88763427734375, -3.73095703125, -3.57427978515625, -3.4176025390625, -3.26092529296875, -3.104248046875, -2.94757080078125, -2.7908935546875, -2.63421630859375, -2.4775390625, -2.32086181640625, -2.1641845703125, -2.00750732421875, -1.850830078125, -1.69415283203125, -1.5374755859375, -1.38079833984375, -1.22412109375, -1.06744384765625, -0.9107666015625, -0.75408935546875, -0.597412109375, -0.44073486328125, -0.2840576171875, -0.12738037109375, 0.029296875, 0.18597412109375, 0.3426513671875, 0.49932861328125, 0.656005859375, 0.81268310546875, 0.9693603515625, 1.12603759765625, 1.28271484375, 1.43939208984375, 1.5960693359375, 1.75274658203125, 1.909423828125, 2.06610107421875, 2.2227783203125, 2.37945556640625, 2.5361328125, 2.69281005859375, 2.8494873046875, 3.00616455078125, 3.162841796875, 3.31951904296875, 3.4761962890625, 3.63287353515625, 3.78955078125, 3.94622802734375, 4.1029052734375, 4.25958251953125, 4.416259765625, 4.57293701171875, 4.7296142578125, 4.88629150390625, 5.04296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 8.0, 14.0, 13.0, 17.0, 26.0, 33.0, 55.0, 63.0, 120.0, 152.0, 148.0, 95.0, 70.0, 42.0, 41.0, 21.0, 16.0, 10.0, 13.0, 12.0, 3.0, 3.0, 0.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00032210350036621094, -0.00031422078609466553, -0.0003063380718231201, -0.0002984553575515747, -0.0002905726432800293, -0.0002826899290084839, -0.0002748072147369385, -0.00026692450046539307, -0.00025904178619384766, -0.00025115907192230225, -0.00024327635765075684, -0.00023539364337921143, -0.00022751092910766602, -0.0002196282148361206, -0.0002117455005645752, -0.00020386278629302979, -0.00019598007202148438, -0.00018809735774993896, -0.00018021464347839355, -0.00017233192920684814, -0.00016444921493530273, -0.00015656650066375732, -0.00014868378639221191, -0.0001408010721206665, -0.0001329183578491211, -0.00012503564357757568, -0.00011715292930603027, -0.00010927021503448486, -0.00010138750076293945, -9.350478649139404e-05, -8.562207221984863e-05, -7.773935794830322e-05, -6.985664367675781e-05, -6.19739294052124e-05, -5.409121513366699e-05, -4.620850086212158e-05, -3.832578659057617e-05, -3.0443072319030762e-05, -2.256035804748535e-05, -1.4677643775939941e-05, -6.794929504394531e-06, 1.087784767150879e-06, 8.970499038696289e-06, 1.68532133102417e-05, 2.473592758178711e-05, 3.261864185333252e-05, 4.050135612487793e-05, 4.838407039642334e-05, 5.626678466796875e-05, 6.414949893951416e-05, 7.203221321105957e-05, 7.991492748260498e-05, 8.779764175415039e-05, 9.56803560256958e-05, 0.00010356307029724121, 0.00011144578456878662, 0.00011932849884033203, 0.00012721121311187744, 0.00013509392738342285, 0.00014297664165496826, 0.00015085935592651367, 0.00015874207019805908, 0.0001666247844696045, 0.0001745074987411499, 0.0001823902130126953]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 10.0, 7.0, 16.0, 12.0, 33.0, 35.0, 51.0, 82.0, 211.0, 518.0, 1596.0, 6964.0, 59822.0, 868570.0, 98293.0, 9159.0, 2024.0, 608.0, 257.0, 122.0, 45.0, 33.0, 18.0, 19.0, 19.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83984375, -2.71942138671875, -2.5989990234375, -2.47857666015625, -2.358154296875, -2.23773193359375, -2.1173095703125, -1.99688720703125, -1.87646484375, -1.75604248046875, -1.6356201171875, -1.51519775390625, -1.394775390625, -1.27435302734375, -1.1539306640625, -1.03350830078125, -0.9130859375, -0.79266357421875, -0.6722412109375, -0.55181884765625, -0.431396484375, -0.31097412109375, -0.1905517578125, -0.07012939453125, 0.05029296875, 0.17071533203125, 0.2911376953125, 0.41156005859375, 0.531982421875, 0.65240478515625, 0.7728271484375, 0.89324951171875, 1.013671875, 1.13409423828125, 1.2545166015625, 1.37493896484375, 1.495361328125, 1.61578369140625, 1.7362060546875, 1.85662841796875, 1.97705078125, 2.09747314453125, 2.2178955078125, 2.33831787109375, 2.458740234375, 2.57916259765625, 2.6995849609375, 2.82000732421875, 2.9404296875, 3.06085205078125, 3.1812744140625, 3.30169677734375, 3.422119140625, 3.54254150390625, 3.6629638671875, 3.78338623046875, 3.90380859375, 4.02423095703125, 4.1446533203125, 4.26507568359375, 4.385498046875, 4.50592041015625, 4.6263427734375, 4.74676513671875, 4.8671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 8.0, 12.0, 15.0, 16.0, 16.0, 20.0, 37.0, 44.0, 56.0, 56.0, 62.0, 97.0, 98.0, 71.0, 78.0, 71.0, 38.0, 34.0, 34.0, 30.0, 22.0, 10.0, 15.0, 9.0, 10.0, 1.0, 3.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4931640625, -1.438690185546875, -1.38421630859375, -1.329742431640625, -1.2752685546875, -1.220794677734375, -1.16632080078125, -1.111846923828125, -1.057373046875, -1.002899169921875, -0.94842529296875, -0.893951416015625, -0.8394775390625, -0.785003662109375, -0.73052978515625, -0.676055908203125, -0.62158203125, -0.567108154296875, -0.51263427734375, -0.458160400390625, -0.4036865234375, -0.349212646484375, -0.29473876953125, -0.240264892578125, -0.185791015625, -0.131317138671875, -0.07684326171875, -0.022369384765625, 0.0321044921875, 0.086578369140625, 0.14105224609375, 0.195526123046875, 0.25, 0.304473876953125, 0.35894775390625, 0.413421630859375, 0.4678955078125, 0.522369384765625, 0.57684326171875, 0.631317138671875, 0.685791015625, 0.740264892578125, 0.79473876953125, 0.849212646484375, 0.9036865234375, 0.958160400390625, 1.01263427734375, 1.067108154296875, 1.12158203125, 1.176055908203125, 1.23052978515625, 1.285003662109375, 1.3394775390625, 1.393951416015625, 1.44842529296875, 1.502899169921875, 1.557373046875, 1.611846923828125, 1.66632080078125, 1.720794677734375, 1.7752685546875, 1.829742431640625, 1.88421630859375, 1.938690185546875, 1.9931640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 13.0, 52.0, 268.0, 458.0, 171.0, 37.0, 9.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.21356201171875, -79.81673431396484, -77.41991424560547, -75.02308654785156, -72.62626647949219, -70.22943878173828, -67.83261108398438, -65.435791015625, -63.038963317871094, -60.64213943481445, -58.24531555175781, -55.848487854003906, -53.451663970947266, -51.054840087890625, -48.65801239013672, -46.26118850708008, -43.86436462402344, -41.4675407409668, -39.070716857910156, -36.67388916015625, -34.27706527709961, -31.88024139404297, -29.483415603637695, -27.086589813232422, -24.68976593017578, -22.29294204711914, -19.896116256713867, -17.499290466308594, -15.102466583251953, -12.705641746520996, -10.308816909790039, -7.911991119384766, -5.515174865722656, -3.118350028991699, -0.7215251922607422, 1.6752996444702148, 4.072124481201172, 6.468949317932129, 8.865774154663086, 11.26259994506836, 13.659423828125, 16.05624771118164, 18.453073501586914, 20.849899291992188, 23.246723175048828, 25.64354705810547, 28.040372848510742, 30.437198638916016, 32.834022521972656, 35.2308464050293, 37.62767028808594, 40.024497985839844, 42.421321868896484, 44.818145751953125, 47.21497344970703, 49.61179733276367, 52.00862121582031, 54.40544509887695, 56.802268981933594, 59.1990966796875, 61.59592056274414, 63.99274444580078, 66.38957214355469, 68.78639221191406, 71.18321990966797]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 10.0, 5.0, 11.0, 18.0, 13.0, 23.0, 16.0, 19.0, 36.0, 24.0, 27.0, 40.0, 27.0, 35.0, 40.0, 45.0, 35.0, 49.0, 46.0, 51.0, 42.0, 42.0, 36.0, 35.0, 38.0, 25.0, 37.0, 23.0, 27.0, 20.0, 14.0, 19.0, 9.0, 14.0, 9.0, 7.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.294517517089844, -18.607702255249023, -17.920886993408203, -17.234071731567383, -16.547256469726562, -15.860441207885742, -15.173625946044922, -14.486810684204102, -13.799995422363281, -13.113180160522461, -12.42636489868164, -11.73954963684082, -11.052734375, -10.36591911315918, -9.67910385131836, -8.992288589477539, -8.305474281311035, -7.618659019470215, -6.9318437576293945, -6.245028495788574, -5.558213233947754, -4.871397972106934, -4.1845831871032715, -3.497767925262451, -2.810952663421631, -2.1241374015808105, -1.4373222589492798, -0.750507116317749, -0.06369185447692871, 0.6231234073638916, 1.3099384307861328, 1.9967536926269531, 2.6835689544677734, 3.3703842163085938, 4.057199478149414, 4.744014739990234, 5.430830001831055, 6.117645263671875, 6.804460048675537, 7.491275310516357, 8.178091049194336, 8.864906311035156, 9.551721572875977, 10.238536834716797, 10.925352096557617, 11.612167358398438, 12.298982620239258, 12.985797882080078, 13.672612190246582, 14.359427452087402, 15.046242713928223, 15.733057975769043, 16.419872283935547, 17.106687545776367, 17.793502807617188, 18.480318069458008, 19.167133331298828, 19.85394859313965, 20.54076385498047, 21.22757911682129, 21.91439437866211, 22.60120964050293, 23.28802490234375, 23.97484016418457, 24.66165542602539]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 10.0, 13.0, 17.0, 28.0, 37.0, 66.0, 86.0, 160.0, 244.0, 440.0, 888.0, 1721.0, 3717.0, 9080.0, 33498.0, 2874147.0, 1222851.0, 31664.0, 8592.0, 3391.0, 1614.0, 829.0, 457.0, 278.0, 160.0, 94.0, 77.0, 43.0, 28.0, 16.0, 8.0, 11.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.015625, -3.900848388671875, -3.78607177734375, -3.671295166015625, -3.5565185546875, -3.441741943359375, -3.32696533203125, -3.212188720703125, -3.097412109375, -2.982635498046875, -2.86785888671875, -2.753082275390625, -2.6383056640625, -2.523529052734375, -2.40875244140625, -2.293975830078125, -2.17919921875, -2.064422607421875, -1.94964599609375, -1.834869384765625, -1.7200927734375, -1.605316162109375, -1.49053955078125, -1.375762939453125, -1.260986328125, -1.146209716796875, -1.03143310546875, -0.916656494140625, -0.8018798828125, -0.687103271484375, -0.57232666015625, -0.457550048828125, -0.3427734375, -0.227996826171875, -0.11322021484375, 0.001556396484375, 0.1163330078125, 0.231109619140625, 0.34588623046875, 0.460662841796875, 0.575439453125, 0.690216064453125, 0.80499267578125, 0.919769287109375, 1.0345458984375, 1.149322509765625, 1.26409912109375, 1.378875732421875, 1.49365234375, 1.608428955078125, 1.72320556640625, 1.837982177734375, 1.9527587890625, 2.067535400390625, 2.18231201171875, 2.297088623046875, 2.411865234375, 2.526641845703125, 2.64141845703125, 2.756195068359375, 2.8709716796875, 2.985748291015625, 3.10052490234375, 3.215301513671875, 3.330078125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 10.0, 10.0, 12.0, 16.0, 18.0, 24.0, 31.0, 20.0, 37.0, 29.0, 41.0, 46.0, 47.0, 40.0, 52.0, 61.0, 59.0, 47.0, 47.0, 40.0, 51.0, 41.0, 37.0, 27.0, 27.0, 20.0, 21.0, 11.0, 17.0, 15.0, 16.0, 11.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1884765625, -1.151519775390625, -1.11456298828125, -1.077606201171875, -1.0406494140625, -1.003692626953125, -0.96673583984375, -0.929779052734375, -0.892822265625, -0.855865478515625, -0.81890869140625, -0.781951904296875, -0.7449951171875, -0.708038330078125, -0.67108154296875, -0.634124755859375, -0.59716796875, -0.560211181640625, -0.52325439453125, -0.486297607421875, -0.4493408203125, -0.412384033203125, -0.37542724609375, -0.338470458984375, -0.301513671875, -0.264556884765625, -0.22760009765625, -0.190643310546875, -0.1536865234375, -0.116729736328125, -0.07977294921875, -0.042816162109375, -0.005859375, 0.031097412109375, 0.06805419921875, 0.105010986328125, 0.1419677734375, 0.178924560546875, 0.21588134765625, 0.252838134765625, 0.289794921875, 0.326751708984375, 0.36370849609375, 0.400665283203125, 0.4376220703125, 0.474578857421875, 0.51153564453125, 0.548492431640625, 0.58544921875, 0.622406005859375, 0.65936279296875, 0.696319580078125, 0.7332763671875, 0.770233154296875, 0.80718994140625, 0.844146728515625, 0.881103515625, 0.918060302734375, 0.95501708984375, 0.991973876953125, 1.0289306640625, 1.065887451171875, 1.10284423828125, 1.139801025390625, 1.1767578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 19.0, 20.0, 27.0, 66.0, 102.0, 234.0, 501.0, 1402.0, 4923.0, 55906.0, 4102352.0, 23654.0, 3261.0, 1037.0, 402.0, 162.0, 99.0, 52.0, 29.0, 17.0, 3.0, 9.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.5787353515625, -8.313720703125, -8.0487060546875, -7.78369140625, -7.5186767578125, -7.253662109375, -6.9886474609375, -6.7236328125, -6.4586181640625, -6.193603515625, -5.9285888671875, -5.66357421875, -5.3985595703125, -5.133544921875, -4.8685302734375, -4.603515625, -4.3385009765625, -4.073486328125, -3.8084716796875, -3.54345703125, -3.2784423828125, -3.013427734375, -2.7484130859375, -2.4833984375, -2.2183837890625, -1.953369140625, -1.6883544921875, -1.42333984375, -1.1583251953125, -0.893310546875, -0.6282958984375, -0.36328125, -0.0982666015625, 0.166748046875, 0.4317626953125, 0.69677734375, 0.9617919921875, 1.226806640625, 1.4918212890625, 1.7568359375, 2.0218505859375, 2.286865234375, 2.5518798828125, 2.81689453125, 3.0819091796875, 3.346923828125, 3.6119384765625, 3.876953125, 4.1419677734375, 4.406982421875, 4.6719970703125, 4.93701171875, 5.2020263671875, 5.467041015625, 5.7320556640625, 5.9970703125, 6.2620849609375, 6.527099609375, 6.7921142578125, 7.05712890625, 7.3221435546875, 7.587158203125, 7.8521728515625, 8.1171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 16.0, 17.0, 38.0, 52.0, 104.0, 1047.0, 2517.0, 112.0, 61.0, 26.0, 26.0, 11.0, 10.0, 5.0, 9.0, 0.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.816436767578125, -2.72857666015625, -2.640716552734375, -2.5528564453125, -2.464996337890625, -2.37713623046875, -2.289276123046875, -2.201416015625, -2.113555908203125, -2.02569580078125, -1.937835693359375, -1.8499755859375, -1.762115478515625, -1.67425537109375, -1.586395263671875, -1.49853515625, -1.410675048828125, -1.32281494140625, -1.234954833984375, -1.1470947265625, -1.059234619140625, -0.97137451171875, -0.883514404296875, -0.795654296875, -0.707794189453125, -0.61993408203125, -0.532073974609375, -0.4442138671875, -0.356353759765625, -0.26849365234375, -0.180633544921875, -0.0927734375, -0.004913330078125, 0.08294677734375, 0.170806884765625, 0.2586669921875, 0.346527099609375, 0.43438720703125, 0.522247314453125, 0.610107421875, 0.697967529296875, 0.78582763671875, 0.873687744140625, 0.9615478515625, 1.049407958984375, 1.13726806640625, 1.225128173828125, 1.31298828125, 1.400848388671875, 1.48870849609375, 1.576568603515625, 1.6644287109375, 1.752288818359375, 1.84014892578125, 1.928009033203125, 2.015869140625, 2.103729248046875, 2.19158935546875, 2.279449462890625, 2.3673095703125, 2.455169677734375, 2.54302978515625, 2.630889892578125, 2.71875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 15.0, 30.0, 130.0, 366.0, 306.0, 104.0, 26.0, 10.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.114532470703125, -26.49797821044922, -25.881423950195312, -25.26487159729004, -24.648317337036133, -24.031763076782227, -23.41520881652832, -22.798654556274414, -22.18210220336914, -21.565547943115234, -20.948993682861328, -20.332441329956055, -19.71588706970215, -19.099332809448242, -18.482778549194336, -17.86622428894043, -17.249670028686523, -16.633115768432617, -16.01656150817871, -15.400008201599121, -14.783454895019531, -14.166900634765625, -13.550346374511719, -12.933792114257812, -12.317238807678223, -11.700684547424316, -11.084131240844727, -10.46757698059082, -9.851022720336914, -9.234469413757324, -8.617915153503418, -8.001361846923828, -7.384807586669922, -6.768253803253174, -6.151700019836426, -5.5351457595825195, -4.9185919761657715, -4.302038192749023, -3.6854841709136963, -3.068930149078369, -2.452376365661621, -1.8358224630355835, -1.219268560409546, -0.6027146577835083, 0.013839244842529297, 0.6303930282592773, 1.2469470500946045, 1.8635010719299316, 2.4800548553466797, 3.0966086387634277, 3.713162660598755, 4.329716682434082, 4.94627046585083, 5.562824249267578, 6.179378509521484, 6.795932292938232, 7.4124860763549805, 8.029040336608887, 8.645593643188477, 9.262147903442383, 9.878702163696289, 10.495255470275879, 11.111809730529785, 11.728363037109375, 12.344917297363281]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 1.0, 5.0, 7.0, 3.0, 7.0, 11.0, 17.0, 12.0, 24.0, 22.0, 15.0, 34.0, 39.0, 24.0, 31.0, 44.0, 47.0, 53.0, 44.0, 31.0, 55.0, 44.0, 52.0, 57.0, 55.0, 50.0, 26.0, 21.0, 27.0, 28.0, 16.0, 17.0, 23.0, 14.0, 12.0, 10.0, 6.0, 5.0, 2.0, 0.0, 6.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-5.83771276473999, -5.674121379852295, -5.5105299949646, -5.346938610076904, -5.183347225189209, -5.019755840301514, -4.856164455413818, -4.692573070526123, -4.528981685638428, -4.365390300750732, -4.201798915863037, -4.038207530975342, -3.8746161460876465, -3.711024761199951, -3.547433376312256, -3.3838419914245605, -3.2202506065368652, -3.05665922164917, -2.8930678367614746, -2.7294764518737793, -2.565885066986084, -2.4022936820983887, -2.2387022972106934, -2.075110912322998, -1.9115195274353027, -1.7479281425476074, -1.584336757659912, -1.4207453727722168, -1.2571539878845215, -1.0935626029968262, -0.9299712181091309, -0.7663798332214355, -0.6027884483337402, -0.4391970634460449, -0.2756056785583496, -0.1120142936706543, 0.051577091217041016, 0.21516847610473633, 0.37875986099243164, 0.542351245880127, 0.7059426307678223, 0.8695340156555176, 1.033125400543213, 1.1967167854309082, 1.3603081703186035, 1.5238995552062988, 1.6874909400939941, 1.8510823249816895, 2.0146737098693848, 2.17826509475708, 2.3418564796447754, 2.5054478645324707, 2.669039249420166, 2.8326306343078613, 2.9962220191955566, 3.159813404083252, 3.3234047889709473, 3.4869961738586426, 3.650587558746338, 3.814178943634033, 3.9777703285217285, 4.141361713409424, 4.304953098297119, 4.4685444831848145, 4.63213586807251]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 3.0, 3.0, 10.0, 21.0, 19.0, 21.0, 23.0, 43.0, 52.0, 68.0, 134.0, 290.0, 652.0, 1614.0, 4202.0, 13513.0, 52453.0, 260075.0, 537779.0, 133871.0, 30123.0, 8629.0, 2800.0, 1107.0, 471.0, 257.0, 86.0, 73.0, 35.0, 29.0, 20.0, 20.0, 9.0, 7.0, 11.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.51953125, -2.430511474609375, -2.34149169921875, -2.252471923828125, -2.1634521484375, -2.074432373046875, -1.98541259765625, -1.896392822265625, -1.807373046875, -1.718353271484375, -1.62933349609375, -1.540313720703125, -1.4512939453125, -1.362274169921875, -1.27325439453125, -1.184234619140625, -1.09521484375, -1.006195068359375, -0.91717529296875, -0.828155517578125, -0.7391357421875, -0.650115966796875, -0.56109619140625, -0.472076416015625, -0.383056640625, -0.294036865234375, -0.20501708984375, -0.115997314453125, -0.0269775390625, 0.062042236328125, 0.15106201171875, 0.240081787109375, 0.3291015625, 0.418121337890625, 0.50714111328125, 0.596160888671875, 0.6851806640625, 0.774200439453125, 0.86322021484375, 0.952239990234375, 1.041259765625, 1.130279541015625, 1.21929931640625, 1.308319091796875, 1.3973388671875, 1.486358642578125, 1.57537841796875, 1.664398193359375, 1.75341796875, 1.842437744140625, 1.93145751953125, 2.020477294921875, 2.1094970703125, 2.198516845703125, 2.28753662109375, 2.376556396484375, 2.465576171875, 2.554595947265625, 2.64361572265625, 2.732635498046875, 2.8216552734375, 2.910675048828125, 2.99969482421875, 3.088714599609375, 3.177734375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 4.0, 4.0, 13.0, 14.0, 13.0, 19.0, 22.0, 22.0, 29.0, 31.0, 45.0, 35.0, 51.0, 47.0, 50.0, 50.0, 63.0, 52.0, 52.0, 49.0, 51.0, 31.0, 40.0, 40.0, 28.0, 18.0, 28.0, 20.0, 15.0, 14.0, 15.0, 7.0, 7.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.263671875, -1.2228240966796875, -1.181976318359375, -1.1411285400390625, -1.10028076171875, -1.0594329833984375, -1.018585205078125, -0.9777374267578125, -0.9368896484375, -0.8960418701171875, -0.855194091796875, -0.8143463134765625, -0.77349853515625, -0.7326507568359375, -0.691802978515625, -0.6509552001953125, -0.610107421875, -0.5692596435546875, -0.528411865234375, -0.4875640869140625, -0.44671630859375, -0.4058685302734375, -0.365020751953125, -0.3241729736328125, -0.2833251953125, -0.2424774169921875, -0.201629638671875, -0.1607818603515625, -0.11993408203125, -0.0790863037109375, -0.038238525390625, 0.0026092529296875, 0.04345703125, 0.0843048095703125, 0.125152587890625, 0.1660003662109375, 0.20684814453125, 0.2476959228515625, 0.288543701171875, 0.3293914794921875, 0.3702392578125, 0.4110870361328125, 0.451934814453125, 0.4927825927734375, 0.53363037109375, 0.5744781494140625, 0.615325927734375, 0.6561737060546875, 0.697021484375, 0.7378692626953125, 0.778717041015625, 0.8195648193359375, 0.86041259765625, 0.9012603759765625, 0.942108154296875, 0.9829559326171875, 1.0238037109375, 1.0646514892578125, 1.105499267578125, 1.1463470458984375, 1.18719482421875, 1.2280426025390625, 1.268890380859375, 1.3097381591796875, 1.3505859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 6.0, 10.0, 19.0, 21.0, 27.0, 47.0, 52.0, 97.0, 135.0, 185.0, 306.0, 573.0, 1812.0, 8194.0, 68654.0, 815204.0, 136474.0, 12598.0, 2336.0, 763.0, 361.0, 198.0, 130.0, 89.0, 67.0, 42.0, 41.0, 13.0, 23.0, 21.0, 9.0, 9.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0625, -4.91192626953125, -4.7613525390625, -4.61077880859375, -4.460205078125, -4.30963134765625, -4.1590576171875, -4.00848388671875, -3.85791015625, -3.70733642578125, -3.5567626953125, -3.40618896484375, -3.255615234375, -3.10504150390625, -2.9544677734375, -2.80389404296875, -2.6533203125, -2.50274658203125, -2.3521728515625, -2.20159912109375, -2.051025390625, -1.90045166015625, -1.7498779296875, -1.59930419921875, -1.44873046875, -1.29815673828125, -1.1475830078125, -0.99700927734375, -0.846435546875, -0.69586181640625, -0.5452880859375, -0.39471435546875, -0.244140625, -0.09356689453125, 0.0570068359375, 0.20758056640625, 0.358154296875, 0.50872802734375, 0.6593017578125, 0.80987548828125, 0.96044921875, 1.11102294921875, 1.2615966796875, 1.41217041015625, 1.562744140625, 1.71331787109375, 1.8638916015625, 2.01446533203125, 2.1650390625, 2.31561279296875, 2.4661865234375, 2.61676025390625, 2.767333984375, 2.91790771484375, 3.0684814453125, 3.21905517578125, 3.36962890625, 3.52020263671875, 3.6707763671875, 3.82135009765625, 3.971923828125, 4.12249755859375, 4.2730712890625, 4.42364501953125, 4.57421875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 12.0, 3.0, 6.0, 7.0, 10.0, 10.0, 21.0, 31.0, 29.0, 36.0, 42.0, 34.0, 38.0, 40.0, 58.0, 48.0, 59.0, 63.0, 67.0, 62.0, 57.0, 46.0, 53.0, 34.0, 30.0, 15.0, 20.0, 20.0, 12.0, 10.0, 13.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.484375, -8.27679443359375, -8.0692138671875, -7.86163330078125, -7.654052734375, -7.44647216796875, -7.2388916015625, -7.03131103515625, -6.82373046875, -6.61614990234375, -6.4085693359375, -6.20098876953125, -5.993408203125, -5.78582763671875, -5.5782470703125, -5.37066650390625, -5.1630859375, -4.95550537109375, -4.7479248046875, -4.54034423828125, -4.332763671875, -4.12518310546875, -3.9176025390625, -3.71002197265625, -3.50244140625, -3.29486083984375, -3.0872802734375, -2.87969970703125, -2.672119140625, -2.46453857421875, -2.2569580078125, -2.04937744140625, -1.841796875, -1.63421630859375, -1.4266357421875, -1.21905517578125, -1.011474609375, -0.80389404296875, -0.5963134765625, -0.38873291015625, -0.18115234375, 0.02642822265625, 0.2340087890625, 0.44158935546875, 0.649169921875, 0.85675048828125, 1.0643310546875, 1.27191162109375, 1.4794921875, 1.68707275390625, 1.8946533203125, 2.10223388671875, 2.309814453125, 2.51739501953125, 2.7249755859375, 2.93255615234375, 3.14013671875, 3.34771728515625, 3.5552978515625, 3.76287841796875, 3.970458984375, 4.17803955078125, 4.3856201171875, 4.59320068359375, 4.80078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 2.0, 11.0, 10.0, 15.0, 31.0, 33.0, 54.0, 119.0, 164.0, 341.0, 666.0, 1302.0, 3120.0, 8257.0, 34987.0, 576962.0, 381984.0, 27929.0, 7191.0, 2808.0, 1244.0, 601.0, 327.0, 143.0, 79.0, 58.0, 40.0, 25.0, 12.0, 12.0, 7.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.951629638671875, -1.88177490234375, -1.811920166015625, -1.7420654296875, -1.672210693359375, -1.60235595703125, -1.532501220703125, -1.462646484375, -1.392791748046875, -1.32293701171875, -1.253082275390625, -1.1832275390625, -1.113372802734375, -1.04351806640625, -0.973663330078125, -0.90380859375, -0.833953857421875, -0.76409912109375, -0.694244384765625, -0.6243896484375, -0.554534912109375, -0.48468017578125, -0.414825439453125, -0.344970703125, -0.275115966796875, -0.20526123046875, -0.135406494140625, -0.0655517578125, 0.004302978515625, 0.07415771484375, 0.144012451171875, 0.2138671875, 0.283721923828125, 0.35357666015625, 0.423431396484375, 0.4932861328125, 0.563140869140625, 0.63299560546875, 0.702850341796875, 0.772705078125, 0.842559814453125, 0.91241455078125, 0.982269287109375, 1.0521240234375, 1.121978759765625, 1.19183349609375, 1.261688232421875, 1.33154296875, 1.401397705078125, 1.47125244140625, 1.541107177734375, 1.6109619140625, 1.680816650390625, 1.75067138671875, 1.820526123046875, 1.890380859375, 1.960235595703125, 2.03009033203125, 2.099945068359375, 2.1697998046875, 2.239654541015625, 2.30950927734375, 2.379364013671875, 2.44921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 10.0, 13.0, 22.0, 74.0, 200.0, 346.0, 189.0, 75.0, 28.0, 15.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033783912658691406, -0.00032046064734458923, -0.0003030821681022644, -0.0002857036888599396, -0.00026832520961761475, -0.0002509467303752899, -0.0002335682511329651, -0.00021618977189064026, -0.00019881129264831543, -0.0001814328134059906, -0.00016405433416366577, -0.00014667585492134094, -0.0001292973756790161, -0.00011191889643669128, -9.454041719436646e-05, -7.716193795204163e-05, -5.97834587097168e-05, -4.240497946739197e-05, -2.502650022506714e-05, -7.64802098274231e-06, 9.73045825958252e-06, 2.710893750190735e-05, 4.448741674423218e-05, 6.186589598655701e-05, 7.924437522888184e-05, 9.662285447120667e-05, 0.0001140013337135315, 0.00013137981295585632, 0.00014875829219818115, 0.00016613677144050598, 0.0001835152506828308, 0.00020089372992515564, 0.00021827220916748047, 0.0002356506884098053, 0.0002530291676521301, 0.00027040764689445496, 0.0002877861261367798, 0.0003051646053791046, 0.00032254308462142944, 0.00033992156386375427, 0.0003573000431060791, 0.00037467852234840393, 0.00039205700159072876, 0.0004094354808330536, 0.0004268139600753784, 0.00044419243931770325, 0.0004615709185600281, 0.0004789493978023529, 0.0004963278770446777, 0.0005137063562870026, 0.0005310848355293274, 0.0005484633147716522, 0.000565841794013977, 0.0005832202732563019, 0.0006005987524986267, 0.0006179772317409515, 0.0006353557109832764, 0.0006527341902256012, 0.000670112669467926, 0.0006874911487102509, 0.0007048696279525757, 0.0007222481071949005, 0.0007396265864372253, 0.0007570050656795502, 0.000774383544921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 6.0, 5.0, 7.0, 10.0, 22.0, 22.0, 30.0, 41.0, 54.0, 83.0, 160.0, 334.0, 673.0, 1256.0, 2620.0, 6390.0, 20361.0, 183399.0, 752431.0, 60560.0, 11849.0, 4306.0, 1891.0, 941.0, 443.0, 268.0, 130.0, 74.0, 54.0, 40.0, 28.0, 19.0, 17.0, 11.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1484375, -2.0775146484375, -2.006591796875, -1.9356689453125, -1.86474609375, -1.7938232421875, -1.722900390625, -1.6519775390625, -1.5810546875, -1.5101318359375, -1.439208984375, -1.3682861328125, -1.29736328125, -1.2264404296875, -1.155517578125, -1.0845947265625, -1.013671875, -0.9427490234375, -0.871826171875, -0.8009033203125, -0.72998046875, -0.6590576171875, -0.588134765625, -0.5172119140625, -0.4462890625, -0.3753662109375, -0.304443359375, -0.2335205078125, -0.16259765625, -0.0916748046875, -0.020751953125, 0.0501708984375, 0.12109375, 0.1920166015625, 0.262939453125, 0.3338623046875, 0.40478515625, 0.4757080078125, 0.546630859375, 0.6175537109375, 0.6884765625, 0.7593994140625, 0.830322265625, 0.9012451171875, 0.97216796875, 1.0430908203125, 1.114013671875, 1.1849365234375, 1.255859375, 1.3267822265625, 1.397705078125, 1.4686279296875, 1.53955078125, 1.6104736328125, 1.681396484375, 1.7523193359375, 1.8232421875, 1.8941650390625, 1.965087890625, 2.0360107421875, 2.10693359375, 2.1778564453125, 2.248779296875, 2.3197021484375, 2.390625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 1.0, 2.0, 5.0, 16.0, 8.0, 16.0, 21.0, 44.0, 61.0, 96.0, 139.0, 211.0, 129.0, 76.0, 43.0, 37.0, 32.0, 16.0, 23.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.724609375, -3.63677978515625, -3.5489501953125, -3.46112060546875, -3.373291015625, -3.28546142578125, -3.1976318359375, -3.10980224609375, -3.02197265625, -2.93414306640625, -2.8463134765625, -2.75848388671875, -2.670654296875, -2.58282470703125, -2.4949951171875, -2.40716552734375, -2.3193359375, -2.23150634765625, -2.1436767578125, -2.05584716796875, -1.968017578125, -1.88018798828125, -1.7923583984375, -1.70452880859375, -1.61669921875, -1.52886962890625, -1.4410400390625, -1.35321044921875, -1.265380859375, -1.17755126953125, -1.0897216796875, -1.00189208984375, -0.9140625, -0.82623291015625, -0.7384033203125, -0.65057373046875, -0.562744140625, -0.47491455078125, -0.3870849609375, -0.29925537109375, -0.21142578125, -0.12359619140625, -0.0357666015625, 0.05206298828125, 0.139892578125, 0.22772216796875, 0.3155517578125, 0.40338134765625, 0.4912109375, 0.57904052734375, 0.6668701171875, 0.75469970703125, 0.842529296875, 0.93035888671875, 1.0181884765625, 1.10601806640625, 1.19384765625, 1.28167724609375, 1.3695068359375, 1.45733642578125, 1.545166015625, 1.63299560546875, 1.7208251953125, 1.80865478515625, 1.896484375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 91.0, 445.0, 366.0, 73.0, 12.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.65074157714844, -34.00177764892578, -31.352811813354492, -28.703847885131836, -26.054882049560547, -23.40591812133789, -20.756954193115234, -18.107988357543945, -15.459024429321289, -12.810059547424316, -10.161094665527344, -7.5121307373046875, -4.863165855407715, -2.214200973510742, 0.43476295471191406, 3.083728790283203, 5.732692718505859, 8.381657600402832, 11.030622482299805, 13.679586410522461, 16.32855224609375, 18.977516174316406, 21.626480102539062, 24.27544593811035, 26.924409866333008, 29.573373794555664, 32.22233963012695, 34.87130355834961, 37.520267486572266, 40.16923522949219, 42.818199157714844, 45.4671630859375, 48.116127014160156, 50.76509094238281, 53.41405487060547, 56.063018798828125, 58.71198654174805, 61.3609504699707, 64.00991821289062, 66.65888214111328, 69.30784606933594, 71.9568099975586, 74.60577392578125, 77.2547378540039, 79.90370178222656, 82.55267333984375, 85.20162963867188, 87.85060119628906, 90.49955749511719, 93.14852142333984, 95.7974853515625, 98.44644927978516, 101.09541320800781, 103.744384765625, 106.39334106445312, 109.04231262207031, 111.69127655029297, 114.34024047851562, 116.98920440673828, 119.63816833496094, 122.2871322631836, 124.93609619140625, 127.58506774902344, 130.23402404785156, 132.88299560546875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 15.0, 22.0, 21.0, 20.0, 21.0, 28.0, 30.0, 34.0, 31.0, 43.0, 51.0, 42.0, 42.0, 58.0, 41.0, 42.0, 50.0, 53.0, 44.0, 36.0, 31.0, 33.0, 27.0, 27.0, 35.0, 30.0, 21.0, 11.0, 6.0, 8.0, 4.0, 3.0, 8.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.014636993408203, -26.159589767456055, -25.30454444885254, -24.44949722290039, -23.594451904296875, -22.739404678344727, -21.884357452392578, -21.029312133789062, -20.174264907836914, -19.319217681884766, -18.46417236328125, -17.6091251373291, -16.754077911376953, -15.899032592773438, -15.043985366821289, -14.188939094543457, -13.333892822265625, -12.478846549987793, -11.623800277709961, -10.768753051757812, -9.91370677947998, -9.058660507202148, -8.20361328125, -7.348567008972168, -6.493520736694336, -5.638474464416504, -4.783427715301514, -3.9283812046051025, -3.0733346939086914, -2.2182884216308594, -1.3632416725158691, -0.5081949234008789, 0.3468494415283203, 1.2018959522247314, 2.0569424629211426, 2.9119889736175537, 3.767035484313965, 4.622081756591797, 5.477128505706787, 6.332175254821777, 7.187221527099609, 8.042267799377441, 8.897314071655273, 9.752361297607422, 10.607407569885254, 11.462453842163086, 12.317501068115234, 13.172547340393066, 14.027593612670898, 14.88263988494873, 15.737686157226562, 16.59273338317871, 17.44778060913086, 18.302825927734375, 19.157873153686523, 20.012920379638672, 20.867965698242188, 21.723012924194336, 22.57805824279785, 23.43310546875, 24.288150787353516, 25.143198013305664, 25.998245239257812, 26.853290557861328, 27.708337783813477]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 7.0, 6.0, 12.0, 18.0, 14.0, 19.0, 23.0, 32.0, 31.0, 32.0, 47.0, 51.0, 67.0, 97.0, 134.0, 265.0, 618.0, 1880.0, 7617.0, 3979910.0, 193902.0, 6394.0, 1720.0, 538.0, 260.0, 135.0, 79.0, 60.0, 49.0, 50.0, 40.0, 30.0, 26.0, 24.0, 17.0, 18.0, 10.0, 10.0, 10.0, 6.0, 6.0, 1.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7265625, -4.56329345703125, -4.4000244140625, -4.23675537109375, -4.073486328125, -3.91021728515625, -3.7469482421875, -3.58367919921875, -3.42041015625, -3.25714111328125, -3.0938720703125, -2.93060302734375, -2.767333984375, -2.60406494140625, -2.4407958984375, -2.27752685546875, -2.1142578125, -1.95098876953125, -1.7877197265625, -1.62445068359375, -1.461181640625, -1.29791259765625, -1.1346435546875, -0.97137451171875, -0.80810546875, -0.64483642578125, -0.4815673828125, -0.31829833984375, -0.155029296875, 0.00823974609375, 0.1715087890625, 0.33477783203125, 0.498046875, 0.66131591796875, 0.8245849609375, 0.98785400390625, 1.151123046875, 1.31439208984375, 1.4776611328125, 1.64093017578125, 1.80419921875, 1.96746826171875, 2.1307373046875, 2.29400634765625, 2.457275390625, 2.62054443359375, 2.7838134765625, 2.94708251953125, 3.1103515625, 3.27362060546875, 3.4368896484375, 3.60015869140625, 3.763427734375, 3.92669677734375, 4.0899658203125, 4.25323486328125, 4.41650390625, 4.57977294921875, 4.7430419921875, 4.90631103515625, 5.069580078125, 5.23284912109375, 5.3961181640625, 5.55938720703125, 5.72265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 0.0, 0.0, 5.0, 3.0, 2.0, 8.0, 7.0, 7.0, 8.0, 8.0, 14.0, 8.0, 18.0, 23.0, 29.0, 30.0, 34.0, 43.0, 44.0, 41.0, 34.0, 41.0, 37.0, 40.0, 43.0, 52.0, 51.0, 37.0, 42.0, 26.0, 32.0, 32.0, 20.0, 28.0, 35.0, 15.0, 20.0, 21.0, 14.0, 13.0, 10.0, 13.0, 5.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1826171875, -1.1425018310546875, -1.102386474609375, -1.0622711181640625, -1.02215576171875, -0.9820404052734375, -0.941925048828125, -0.9018096923828125, -0.8616943359375, -0.8215789794921875, -0.781463623046875, -0.7413482666015625, -0.70123291015625, -0.6611175537109375, -0.621002197265625, -0.5808868408203125, -0.540771484375, -0.5006561279296875, -0.460540771484375, -0.4204254150390625, -0.38031005859375, -0.3401947021484375, -0.300079345703125, -0.2599639892578125, -0.2198486328125, -0.1797332763671875, -0.139617919921875, -0.0995025634765625, -0.05938720703125, -0.0192718505859375, 0.020843505859375, 0.0609588623046875, 0.10107421875, 0.1411895751953125, 0.181304931640625, 0.2214202880859375, 0.26153564453125, 0.3016510009765625, 0.341766357421875, 0.3818817138671875, 0.4219970703125, 0.4621124267578125, 0.502227783203125, 0.5423431396484375, 0.58245849609375, 0.6225738525390625, 0.662689208984375, 0.7028045654296875, 0.742919921875, 0.7830352783203125, 0.823150634765625, 0.8632659912109375, 0.90338134765625, 0.9434967041015625, 0.983612060546875, 1.0237274169921875, 1.0638427734375, 1.1039581298828125, 1.144073486328125, 1.1841888427734375, 1.22430419921875, 1.2644195556640625, 1.304534912109375, 1.3446502685546875, 1.384765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 11.0, 8.0, 15.0, 29.0, 34.0, 36.0, 49.0, 75.0, 141.0, 269.0, 684.0, 2846.0, 4069245.0, 116796.0, 2552.0, 743.0, 265.0, 145.0, 87.0, 73.0, 47.0, 38.0, 16.0, 15.0, 15.0, 14.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.359375, -8.96875, -8.578125, -8.1875, -7.796875, -7.40625, -7.015625, -6.625, -6.234375, -5.84375, -5.453125, -5.0625, -4.671875, -4.28125, -3.890625, -3.5, -3.109375, -2.71875, -2.328125, -1.9375, -1.546875, -1.15625, -0.765625, -0.375, 0.015625, 0.40625, 0.796875, 1.1875, 1.578125, 1.96875, 2.359375, 2.75, 3.140625, 3.53125, 3.921875, 4.3125, 4.703125, 5.09375, 5.484375, 5.875, 6.265625, 6.65625, 7.046875, 7.4375, 7.828125, 8.21875, 8.609375, 9.0, 9.390625, 9.78125, 10.171875, 10.5625, 10.953125, 11.34375, 11.734375, 12.125, 12.515625, 12.90625, 13.296875, 13.6875, 14.078125, 14.46875, 14.859375, 15.25, 15.640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 29.0, 3911.0, 105.0, 13.0, 3.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.4595794677734375, -1.367401123046875, -1.2752227783203125, -1.18304443359375, -1.0908660888671875, -0.998687744140625, -0.9065093994140625, -0.8143310546875, -0.7221527099609375, -0.629974365234375, -0.5377960205078125, -0.44561767578125, -0.3534393310546875, -0.261260986328125, -0.1690826416015625, -0.076904296875, 0.0152740478515625, 0.107452392578125, 0.1996307373046875, 0.29180908203125, 0.3839874267578125, 0.476165771484375, 0.5683441162109375, 0.6605224609375, 0.7527008056640625, 0.844879150390625, 0.9370574951171875, 1.02923583984375, 1.1214141845703125, 1.213592529296875, 1.3057708740234375, 1.39794921875, 1.4901275634765625, 1.582305908203125, 1.6744842529296875, 1.76666259765625, 1.8588409423828125, 1.951019287109375, 2.0431976318359375, 2.1353759765625, 2.2275543212890625, 2.319732666015625, 2.4119110107421875, 2.50408935546875, 2.5962677001953125, 2.688446044921875, 2.7806243896484375, 2.872802734375, 2.9649810791015625, 3.057159423828125, 3.1493377685546875, 3.24151611328125, 3.3336944580078125, 3.425872802734375, 3.5180511474609375, 3.6102294921875, 3.7024078369140625, 3.794586181640625, 3.8867645263671875, 3.97894287109375, 4.0711212158203125, 4.163299560546875, 4.2554779052734375, 4.34765625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 4.0, 17.0, 33.0, 69.0, 203.0, 252.0, 205.0, 107.0, 45.0, 32.0, 13.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4273147583007812, -3.2193522453308105, -3.01138973236084, -2.80342698097229, -2.5954644680023193, -2.3875019550323486, -2.179539203643799, -1.9715766906738281, -1.7636141777038574, -1.5556516647338867, -1.3476890325546265, -1.1397264003753662, -0.9317638874053955, -0.7238013744354248, -0.5158387422561646, -0.3078761100769043, -0.0999135971069336, 0.10804897546768188, 0.31601154804229736, 0.5239741206169128, 0.7319366931915283, 0.939899206161499, 1.1478618383407593, 1.3558244705200195, 1.5637869834899902, 1.771749496459961, 1.9797121286392212, 2.1876747608184814, 2.395637273788452, 2.603599786758423, 2.8115625381469727, 3.0195250511169434, 3.227487564086914, 3.4354500770568848, 3.6434125900268555, 3.8513753414154053, 4.059337615966797, 4.267300605773926, 4.4752631187438965, 4.683225631713867, 4.891188144683838, 5.099150657653809, 5.307113170623779, 5.51507568359375, 5.723038673400879, 5.931000709533691, 6.13896369934082, 6.346926212310791, 6.554888725280762, 6.762851238250732, 6.970813751220703, 7.178776264190674, 7.3867387771606445, 7.594701766967773, 7.802664279937744, 8.010626792907715, 8.218589782714844, 8.426552772521973, 8.634514808654785, 8.842477798461914, 9.050439834594727, 9.258402824401855, 9.466364860534668, 9.674327850341797, 9.88228988647461]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 5.0, 11.0, 12.0, 6.0, 14.0, 21.0, 18.0, 21.0, 32.0, 21.0, 29.0, 32.0, 38.0, 47.0, 38.0, 56.0, 55.0, 48.0, 46.0, 58.0, 41.0, 38.0, 35.0, 44.0, 37.0, 32.0, 24.0, 21.0, 22.0, 16.0, 17.0, 12.0, 8.0, 13.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.9107766151428223, -3.8045763969421387, -3.698376178741455, -3.5921757221221924, -3.485975503921509, -3.379775285720825, -3.2735750675201416, -3.167374610900879, -3.0611743927001953, -2.9549741744995117, -2.848773956298828, -2.7425734996795654, -2.636373281478882, -2.5301730632781982, -2.4239728450775146, -2.317772388458252, -2.2115721702575684, -2.1053719520568848, -1.9991716146469116, -1.892971396446228, -1.7867710590362549, -1.6805708408355713, -1.5743706226348877, -1.4681702852249146, -1.3619701862335205, -1.255769968032837, -1.1495696306228638, -1.0433694124221802, -0.937169075012207, -0.8309688568115234, -0.7247685790061951, -0.6185683012008667, -0.5123679637908936, -0.4061676859855652, -0.2999674081802368, -0.19376716017723083, -0.08756688237190247, 0.018633365631103516, 0.12483364343643188, 0.23103392124176025, 0.3372341990470886, 0.443434476852417, 0.5496347546577454, 0.6558350324630737, 0.7620352506637573, 0.8682355284690857, 0.9744358062744141, 1.0806360244750977, 1.1868363618850708, 1.2930365800857544, 1.3992369174957275, 1.5054371356964111, 1.6116374731063843, 1.7178376913070679, 1.824038028717041, 1.9302382469177246, 2.036438465118408, 2.142638683319092, 2.2488389015197754, 2.355039358139038, 2.4612395763397217, 2.5674397945404053, 2.673640012741089, 2.7798404693603516, 2.886040687561035]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 5.0, 11.0, 8.0, 11.0, 6.0, 15.0, 14.0, 13.0, 19.0, 30.0, 31.0, 45.0, 59.0, 80.0, 131.0, 243.0, 480.0, 973.0, 2007.0, 4522.0, 10643.0, 27504.0, 77509.0, 234945.0, 401447.0, 187374.0, 61734.0, 22371.0, 8877.0, 3754.0, 1762.0, 806.0, 436.0, 232.0, 143.0, 70.0, 43.0, 44.0, 22.0, 25.0, 23.0, 22.0, 10.0, 13.0, 10.0, 7.0, 4.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0], "bins": [-2.341796875, -2.273712158203125, -2.20562744140625, -2.137542724609375, -2.0694580078125, -2.001373291015625, -1.93328857421875, -1.865203857421875, -1.797119140625, -1.729034423828125, -1.66094970703125, -1.592864990234375, -1.5247802734375, -1.456695556640625, -1.38861083984375, -1.320526123046875, -1.25244140625, -1.184356689453125, -1.11627197265625, -1.048187255859375, -0.9801025390625, -0.912017822265625, -0.84393310546875, -0.775848388671875, -0.707763671875, -0.639678955078125, -0.57159423828125, -0.503509521484375, -0.4354248046875, -0.367340087890625, -0.29925537109375, -0.231170654296875, -0.1630859375, -0.095001220703125, -0.02691650390625, 0.041168212890625, 0.1092529296875, 0.177337646484375, 0.24542236328125, 0.313507080078125, 0.381591796875, 0.449676513671875, 0.51776123046875, 0.585845947265625, 0.6539306640625, 0.722015380859375, 0.79010009765625, 0.858184814453125, 0.92626953125, 0.994354248046875, 1.06243896484375, 1.130523681640625, 1.1986083984375, 1.266693115234375, 1.33477783203125, 1.402862548828125, 1.470947265625, 1.539031982421875, 1.60711669921875, 1.675201416015625, 1.7432861328125, 1.811370849609375, 1.87945556640625, 1.947540283203125, 2.015625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 7.0, 9.0, 10.0, 11.0, 10.0, 17.0, 14.0, 12.0, 19.0, 23.0, 35.0, 32.0, 25.0, 34.0, 36.0, 36.0, 39.0, 55.0, 37.0, 31.0, 39.0, 51.0, 45.0, 36.0, 41.0, 37.0, 24.0, 31.0, 19.0, 29.0, 29.0, 17.0, 18.0, 19.0, 10.0, 13.0, 8.0, 5.0, 8.0, 9.0, 7.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.390625, -1.343994140625, -1.29736328125, -1.250732421875, -1.2041015625, -1.157470703125, -1.11083984375, -1.064208984375, -1.017578125, -0.970947265625, -0.92431640625, -0.877685546875, -0.8310546875, -0.784423828125, -0.73779296875, -0.691162109375, -0.64453125, -0.597900390625, -0.55126953125, -0.504638671875, -0.4580078125, -0.411376953125, -0.36474609375, -0.318115234375, -0.271484375, -0.224853515625, -0.17822265625, -0.131591796875, -0.0849609375, -0.038330078125, 0.00830078125, 0.054931640625, 0.1015625, 0.148193359375, 0.19482421875, 0.241455078125, 0.2880859375, 0.334716796875, 0.38134765625, 0.427978515625, 0.474609375, 0.521240234375, 0.56787109375, 0.614501953125, 0.6611328125, 0.707763671875, 0.75439453125, 0.801025390625, 0.84765625, 0.894287109375, 0.94091796875, 0.987548828125, 1.0341796875, 1.080810546875, 1.12744140625, 1.174072265625, 1.220703125, 1.267333984375, 1.31396484375, 1.360595703125, 1.4072265625, 1.453857421875, 1.50048828125, 1.547119140625, 1.59375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 1.0, 6.0, 4.0, 6.0, 10.0, 9.0, 20.0, 18.0, 26.0, 43.0, 62.0, 91.0, 124.0, 183.0, 270.0, 565.0, 1372.0, 5665.0, 49725.0, 800144.0, 174153.0, 11964.0, 2267.0, 742.0, 368.0, 235.0, 129.0, 89.0, 65.0, 50.0, 34.0, 26.0, 24.0, 18.0, 12.0, 10.0, 2.0, 7.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.67578125, -6.493896484375, -6.31201171875, -6.130126953125, -5.9482421875, -5.766357421875, -5.58447265625, -5.402587890625, -5.220703125, -5.038818359375, -4.85693359375, -4.675048828125, -4.4931640625, -4.311279296875, -4.12939453125, -3.947509765625, -3.765625, -3.583740234375, -3.40185546875, -3.219970703125, -3.0380859375, -2.856201171875, -2.67431640625, -2.492431640625, -2.310546875, -2.128662109375, -1.94677734375, -1.764892578125, -1.5830078125, -1.401123046875, -1.21923828125, -1.037353515625, -0.85546875, -0.673583984375, -0.49169921875, -0.309814453125, -0.1279296875, 0.053955078125, 0.23583984375, 0.417724609375, 0.599609375, 0.781494140625, 0.96337890625, 1.145263671875, 1.3271484375, 1.509033203125, 1.69091796875, 1.872802734375, 2.0546875, 2.236572265625, 2.41845703125, 2.600341796875, 2.7822265625, 2.964111328125, 3.14599609375, 3.327880859375, 3.509765625, 3.691650390625, 3.87353515625, 4.055419921875, 4.2373046875, 4.419189453125, 4.60107421875, 4.782958984375, 4.96484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 8.0, 9.0, 4.0, 11.0, 13.0, 13.0, 14.0, 26.0, 26.0, 23.0, 35.0, 32.0, 31.0, 30.0, 36.0, 40.0, 43.0, 42.0, 53.0, 49.0, 43.0, 55.0, 38.0, 48.0, 29.0, 39.0, 23.0, 13.0, 31.0, 21.0, 18.0, 14.0, 19.0, 20.0, 10.0, 8.0, 9.0, 2.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.93359375, -5.70587158203125, -5.4781494140625, -5.25042724609375, -5.022705078125, -4.79498291015625, -4.5672607421875, -4.33953857421875, -4.11181640625, -3.88409423828125, -3.6563720703125, -3.42864990234375, -3.200927734375, -2.97320556640625, -2.7454833984375, -2.51776123046875, -2.2900390625, -2.06231689453125, -1.8345947265625, -1.60687255859375, -1.379150390625, -1.15142822265625, -0.9237060546875, -0.69598388671875, -0.46826171875, -0.24053955078125, -0.0128173828125, 0.21490478515625, 0.442626953125, 0.67034912109375, 0.8980712890625, 1.12579345703125, 1.353515625, 1.58123779296875, 1.8089599609375, 2.03668212890625, 2.264404296875, 2.49212646484375, 2.7198486328125, 2.94757080078125, 3.17529296875, 3.40301513671875, 3.6307373046875, 3.85845947265625, 4.086181640625, 4.31390380859375, 4.5416259765625, 4.76934814453125, 4.9970703125, 5.22479248046875, 5.4525146484375, 5.68023681640625, 5.907958984375, 6.13568115234375, 6.3634033203125, 6.59112548828125, 6.81884765625, 7.04656982421875, 7.2742919921875, 7.50201416015625, 7.729736328125, 7.95745849609375, 8.1851806640625, 8.41290283203125, 8.640625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 11.0, 17.0, 16.0, 28.0, 43.0, 82.0, 155.0, 355.0, 868.0, 2958.0, 14288.0, 280541.0, 719706.0, 23390.0, 4096.0, 1175.0, 401.0, 167.0, 101.0, 50.0, 40.0, 23.0, 12.0, 12.0, 1.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.142578125, -3.05047607421875, -2.9583740234375, -2.86627197265625, -2.774169921875, -2.68206787109375, -2.5899658203125, -2.49786376953125, -2.40576171875, -2.31365966796875, -2.2215576171875, -2.12945556640625, -2.037353515625, -1.94525146484375, -1.8531494140625, -1.76104736328125, -1.6689453125, -1.57684326171875, -1.4847412109375, -1.39263916015625, -1.300537109375, -1.20843505859375, -1.1163330078125, -1.02423095703125, -0.93212890625, -0.84002685546875, -0.7479248046875, -0.65582275390625, -0.563720703125, -0.47161865234375, -0.3795166015625, -0.28741455078125, -0.1953125, -0.10321044921875, -0.0111083984375, 0.08099365234375, 0.173095703125, 0.26519775390625, 0.3572998046875, 0.44940185546875, 0.54150390625, 0.63360595703125, 0.7257080078125, 0.81781005859375, 0.909912109375, 1.00201416015625, 1.0941162109375, 1.18621826171875, 1.2783203125, 1.37042236328125, 1.4625244140625, 1.55462646484375, 1.646728515625, 1.73883056640625, 1.8309326171875, 1.92303466796875, 2.01513671875, 2.10723876953125, 2.1993408203125, 2.29144287109375, 2.383544921875, 2.47564697265625, 2.5677490234375, 2.65985107421875, 2.751953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 8.0, 8.0, 14.0, 19.0, 34.0, 44.0, 107.0, 164.0, 191.0, 151.0, 108.0, 61.0, 26.0, 20.0, 17.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001786947250366211, -0.000169483944773674, -0.00016027316451072693, -0.00015106238424777985, -0.00014185160398483276, -0.00013264082372188568, -0.0001234300434589386, -0.00011421926319599152, -0.00010500848293304443, -9.579770267009735e-05, -8.658692240715027e-05, -7.737614214420319e-05, -6.81653618812561e-05, -5.895458161830902e-05, -4.974380135536194e-05, -4.0533021092414856e-05, -3.1322240829467773e-05, -2.211146056652069e-05, -1.2900680303573608e-05, -3.689900040626526e-06, 5.520880222320557e-06, 1.473166048526764e-05, 2.394244074821472e-05, 3.3153221011161804e-05, 4.236400127410889e-05, 5.157478153705597e-05, 6.078556180000305e-05, 6.999634206295013e-05, 7.920712232589722e-05, 8.84179025888443e-05, 9.762868285179138e-05, 0.00010683946311473846, 0.00011605024337768555, 0.00012526102364063263, 0.0001344718039035797, 0.0001436825841665268, 0.00015289336442947388, 0.00016210414469242096, 0.00017131492495536804, 0.00018052570521831512, 0.0001897364854812622, 0.0001989472657442093, 0.00020815804600715637, 0.00021736882627010345, 0.00022657960653305054, 0.00023579038679599762, 0.0002450011670589447, 0.0002542119473218918, 0.00026342272758483887, 0.00027263350784778595, 0.00028184428811073303, 0.0002910550683736801, 0.0003002658486366272, 0.0003094766288995743, 0.00031868740916252136, 0.00032789818942546844, 0.00033710896968841553, 0.0003463197499513626, 0.0003555305302143097, 0.0003647413104772568, 0.00037395209074020386, 0.00038316287100315094, 0.000392373651266098, 0.0004015844315290451, 0.0004107952117919922]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 11.0, 12.0, 33.0, 25.0, 71.0, 124.0, 370.0, 1174.0, 6035.0, 106597.0, 904899.0, 24966.0, 3051.0, 722.0, 229.0, 96.0, 47.0, 29.0, 25.0, 10.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01953125, -2.895263671875, -2.77099609375, -2.646728515625, -2.5224609375, -2.398193359375, -2.27392578125, -2.149658203125, -2.025390625, -1.901123046875, -1.77685546875, -1.652587890625, -1.5283203125, -1.404052734375, -1.27978515625, -1.155517578125, -1.03125, -0.906982421875, -0.78271484375, -0.658447265625, -0.5341796875, -0.409912109375, -0.28564453125, -0.161376953125, -0.037109375, 0.087158203125, 0.21142578125, 0.335693359375, 0.4599609375, 0.584228515625, 0.70849609375, 0.832763671875, 0.95703125, 1.081298828125, 1.20556640625, 1.329833984375, 1.4541015625, 1.578369140625, 1.70263671875, 1.826904296875, 1.951171875, 2.075439453125, 2.19970703125, 2.323974609375, 2.4482421875, 2.572509765625, 2.69677734375, 2.821044921875, 2.9453125, 3.069580078125, 3.19384765625, 3.318115234375, 3.4423828125, 3.566650390625, 3.69091796875, 3.815185546875, 3.939453125, 4.063720703125, 4.18798828125, 4.312255859375, 4.4365234375, 4.560791015625, 4.68505859375, 4.809326171875, 4.93359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 6.0, 13.0, 16.0, 29.0, 43.0, 68.0, 105.0, 150.0, 148.0, 159.0, 84.0, 56.0, 40.0, 19.0, 14.0, 17.0, 7.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.603515625, -2.50115966796875, -2.3988037109375, -2.29644775390625, -2.194091796875, -2.09173583984375, -1.9893798828125, -1.88702392578125, -1.78466796875, -1.68231201171875, -1.5799560546875, -1.47760009765625, -1.375244140625, -1.27288818359375, -1.1705322265625, -1.06817626953125, -0.9658203125, -0.86346435546875, -0.7611083984375, -0.65875244140625, -0.556396484375, -0.45404052734375, -0.3516845703125, -0.24932861328125, -0.14697265625, -0.04461669921875, 0.0577392578125, 0.16009521484375, 0.262451171875, 0.36480712890625, 0.4671630859375, 0.56951904296875, 0.671875, 0.77423095703125, 0.8765869140625, 0.97894287109375, 1.081298828125, 1.18365478515625, 1.2860107421875, 1.38836669921875, 1.49072265625, 1.59307861328125, 1.6954345703125, 1.79779052734375, 1.900146484375, 2.00250244140625, 2.1048583984375, 2.20721435546875, 2.3095703125, 2.41192626953125, 2.5142822265625, 2.61663818359375, 2.718994140625, 2.82135009765625, 2.9237060546875, 3.02606201171875, 3.12841796875, 3.23077392578125, 3.3331298828125, 3.43548583984375, 3.537841796875, 3.64019775390625, 3.7425537109375, 3.84490966796875, 3.947265625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 35.0, 81.0, 162.0, 253.0, 204.0, 135.0, 66.0, 42.0, 9.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-75.76907348632812, -74.25141906738281, -72.7337646484375, -71.21611022949219, -69.69845581054688, -68.18080139160156, -66.66314697265625, -65.14550018310547, -63.627845764160156, -62.110191345214844, -60.59253692626953, -59.07488250732422, -57.55723190307617, -56.03957748413086, -54.52192306518555, -53.004268646240234, -51.48661422729492, -49.96895980834961, -48.4513053894043, -46.93365478515625, -45.41600036621094, -43.898345947265625, -42.38069152832031, -40.863037109375, -39.34538269042969, -37.827728271484375, -36.31007385253906, -34.79241943359375, -33.2747688293457, -31.75711441040039, -30.239459991455078, -28.721805572509766, -27.204158782958984, -25.686504364013672, -24.168851852416992, -22.65119743347168, -21.133544921875, -19.615890502929688, -18.098236083984375, -16.580581665039062, -15.062929153442383, -13.545275688171387, -12.02762222290039, -10.509967803955078, -8.992314338684082, -7.474660873413086, -5.957006454467773, -4.439352989196777, -2.9216995239257812, -1.404045820236206, 0.11360788345336914, 1.6312618255615234, 3.1489152908325195, 4.666568756103516, 6.184223175048828, 7.701876640319824, 9.21953010559082, 10.737183570861816, 12.254837036132812, 13.772491455078125, 15.290144920349121, 16.807798385620117, 18.32545280456543, 19.84310531616211, 21.360759735107422]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 6.0, 6.0, 12.0, 7.0, 7.0, 15.0, 18.0, 14.0, 27.0, 20.0, 20.0, 23.0, 39.0, 38.0, 51.0, 39.0, 52.0, 41.0, 59.0, 55.0, 47.0, 51.0, 44.0, 47.0, 32.0, 29.0, 29.0, 16.0, 26.0, 32.0, 16.0, 20.0, 5.0, 12.0, 8.0, 13.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.92325210571289, -31.663043975830078, -30.402835845947266, -29.142629623413086, -27.882421493530273, -26.62221336364746, -25.36200714111328, -24.10179901123047, -22.841590881347656, -21.581382751464844, -20.32117462158203, -19.06096839904785, -17.80076026916504, -16.540552139282227, -15.28034496307373, -14.020137786865234, -12.759929656982422, -11.49972152709961, -10.239514350891113, -8.979307174682617, -7.719099044799805, -6.45889139175415, -5.198683738708496, -3.9384765625, -2.6782684326171875, -1.4180607795715332, -0.1578531265258789, 1.1023545265197754, 2.3625621795654297, 3.622769832611084, 4.882977485656738, 6.143184661865234, 7.4033966064453125, 8.663604736328125, 9.923811912536621, 11.184019088745117, 12.44422721862793, 13.704435348510742, 14.964642524719238, 16.224849700927734, 17.485057830810547, 18.74526596069336, 20.005474090576172, 21.26568031311035, 22.525888442993164, 23.786096572875977, 25.046302795410156, 26.30651092529297, 27.56671905517578, 28.826927185058594, 30.087135314941406, 31.347341537475586, 32.60755157470703, 33.86775588989258, 35.12796401977539, 36.3881721496582, 37.648380279541016, 38.90858840942383, 40.16879653930664, 41.42900466918945, 42.689208984375, 43.94941711425781, 45.209625244140625, 46.46983337402344, 47.73004150390625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 7.0, 18.0, 23.0, 21.0, 25.0, 34.0, 42.0, 52.0, 79.0, 98.0, 208.0, 334.0, 635.0, 1418.0, 3683.0, 18747.0, 4100149.0, 58710.0, 6192.0, 1910.0, 825.0, 393.0, 209.0, 124.0, 80.0, 64.0, 44.0, 33.0, 27.0, 19.0, 15.0, 9.0, 15.0, 10.0, 4.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.814453125, -2.71282958984375, -2.6112060546875, -2.50958251953125, -2.407958984375, -2.30633544921875, -2.2047119140625, -2.10308837890625, -2.00146484375, -1.89984130859375, -1.7982177734375, -1.69659423828125, -1.594970703125, -1.49334716796875, -1.3917236328125, -1.29010009765625, -1.1884765625, -1.08685302734375, -0.9852294921875, -0.88360595703125, -0.781982421875, -0.68035888671875, -0.5787353515625, -0.47711181640625, -0.37548828125, -0.27386474609375, -0.1722412109375, -0.07061767578125, 0.031005859375, 0.13262939453125, 0.2342529296875, 0.33587646484375, 0.4375, 0.53912353515625, 0.6407470703125, 0.74237060546875, 0.843994140625, 0.94561767578125, 1.0472412109375, 1.14886474609375, 1.25048828125, 1.35211181640625, 1.4537353515625, 1.55535888671875, 1.656982421875, 1.75860595703125, 1.8602294921875, 1.96185302734375, 2.0634765625, 2.16510009765625, 2.2667236328125, 2.36834716796875, 2.469970703125, 2.57159423828125, 2.6732177734375, 2.77484130859375, 2.87646484375, 2.97808837890625, 3.0797119140625, 3.18133544921875, 3.282958984375, 3.38458251953125, 3.4862060546875, 3.58782958984375, 3.689453125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 2.0, 12.0, 9.0, 8.0, 12.0, 17.0, 19.0, 18.0, 28.0, 36.0, 25.0, 31.0, 35.0, 41.0, 50.0, 35.0, 51.0, 44.0, 48.0, 48.0, 43.0, 29.0, 46.0, 42.0, 27.0, 30.0, 33.0, 27.0, 20.0, 23.0, 28.0, 11.0, 15.0, 8.0, 16.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6650390625, -1.611846923828125, -1.55865478515625, -1.505462646484375, -1.4522705078125, -1.399078369140625, -1.34588623046875, -1.292694091796875, -1.239501953125, -1.186309814453125, -1.13311767578125, -1.079925537109375, -1.0267333984375, -0.973541259765625, -0.92034912109375, -0.867156982421875, -0.81396484375, -0.760772705078125, -0.70758056640625, -0.654388427734375, -0.6011962890625, -0.548004150390625, -0.49481201171875, -0.441619873046875, -0.388427734375, -0.335235595703125, -0.28204345703125, -0.228851318359375, -0.1756591796875, -0.122467041015625, -0.06927490234375, -0.016082763671875, 0.037109375, 0.090301513671875, 0.14349365234375, 0.196685791015625, 0.2498779296875, 0.303070068359375, 0.35626220703125, 0.409454345703125, 0.462646484375, 0.515838623046875, 0.56903076171875, 0.622222900390625, 0.6754150390625, 0.728607177734375, 0.78179931640625, 0.834991455078125, 0.88818359375, 0.941375732421875, 0.99456787109375, 1.047760009765625, 1.1009521484375, 1.154144287109375, 1.20733642578125, 1.260528564453125, 1.313720703125, 1.366912841796875, 1.42010498046875, 1.473297119140625, 1.5264892578125, 1.579681396484375, 1.63287353515625, 1.686065673828125, 1.7392578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 10.0, 9.0, 8.0, 18.0, 19.0, 20.0, 23.0, 21.0, 26.0, 27.0, 35.0, 42.0, 38.0, 45.0, 135.0, 493.0, 9253.0, 4181518.0, 1860.0, 256.0, 80.0, 58.0, 40.0, 37.0, 37.0, 32.0, 27.0, 24.0, 22.0, 14.0, 20.0, 8.0, 6.0, 6.0, 7.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.34375, -15.837890625, -15.33203125, -14.826171875, -14.3203125, -13.814453125, -13.30859375, -12.802734375, -12.296875, -11.791015625, -11.28515625, -10.779296875, -10.2734375, -9.767578125, -9.26171875, -8.755859375, -8.25, -7.744140625, -7.23828125, -6.732421875, -6.2265625, -5.720703125, -5.21484375, -4.708984375, -4.203125, -3.697265625, -3.19140625, -2.685546875, -2.1796875, -1.673828125, -1.16796875, -0.662109375, -0.15625, 0.349609375, 0.85546875, 1.361328125, 1.8671875, 2.373046875, 2.87890625, 3.384765625, 3.890625, 4.396484375, 4.90234375, 5.408203125, 5.9140625, 6.419921875, 6.92578125, 7.431640625, 7.9375, 8.443359375, 8.94921875, 9.455078125, 9.9609375, 10.466796875, 10.97265625, 11.478515625, 11.984375, 12.490234375, 12.99609375, 13.501953125, 14.0078125, 14.513671875, 15.01953125, 15.525390625, 16.03125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 21.0, 180.0, 3855.0, 21.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80859375, -0.67779541015625, -0.5469970703125, -0.41619873046875, -0.285400390625, -0.15460205078125, -0.0238037109375, 0.10699462890625, 0.23779296875, 0.36859130859375, 0.4993896484375, 0.63018798828125, 0.760986328125, 0.89178466796875, 1.0225830078125, 1.15338134765625, 1.2841796875, 1.41497802734375, 1.5457763671875, 1.67657470703125, 1.807373046875, 1.93817138671875, 2.0689697265625, 2.19976806640625, 2.33056640625, 2.46136474609375, 2.5921630859375, 2.72296142578125, 2.853759765625, 2.98455810546875, 3.1153564453125, 3.24615478515625, 3.376953125, 3.50775146484375, 3.6385498046875, 3.76934814453125, 3.900146484375, 4.03094482421875, 4.1617431640625, 4.29254150390625, 4.42333984375, 4.55413818359375, 4.6849365234375, 4.81573486328125, 4.946533203125, 5.07733154296875, 5.2081298828125, 5.33892822265625, 5.4697265625, 5.60052490234375, 5.7313232421875, 5.86212158203125, 5.992919921875, 6.12371826171875, 6.2545166015625, 6.38531494140625, 6.51611328125, 6.64691162109375, 6.7777099609375, 6.90850830078125, 7.039306640625, 7.17010498046875, 7.3009033203125, 7.43170166015625, 7.5625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 8.0, 20.0, 70.0, 414.0, 346.0, 103.0, 26.0, 20.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.981804847717285, -2.3991165161132812, -1.8164284229278564, -1.233740210533142, -0.6510519981384277, -0.06836366653442383, 0.514324426651001, 1.0970125198364258, 1.6797008514404297, 2.2623891830444336, 2.8450772762298584, 3.427765369415283, 4.010453701019287, 4.593142032623291, 5.175829887390137, 5.758518218994141, 6.3412065505981445, 6.923894882202148, 7.506583213806152, 8.089271545410156, 8.671958923339844, 9.254648208618164, 9.837335586547852, 10.420023918151855, 11.00271224975586, 11.585400581359863, 12.168088912963867, 12.750777244567871, 13.333465576171875, 13.916152954101562, 14.498841285705566, 15.08152961730957, 15.66421890258789, 16.246906280517578, 16.8295955657959, 17.412282943725586, 17.994972229003906, 18.577659606933594, 19.160348892211914, 19.7430362701416, 20.325725555419922, 20.90841293334961, 21.49110221862793, 22.073789596557617, 22.656478881835938, 23.239166259765625, 23.821855545043945, 24.404542922973633, 24.98723030090332, 25.569917678833008, 26.152606964111328, 26.735294342041016, 27.317983627319336, 27.900671005249023, 28.483360290527344, 29.06604766845703, 29.64873504638672, 30.231422424316406, 30.814111709594727, 31.396799087524414, 31.979488372802734, 32.56217575073242, 33.14486312866211, 33.72755432128906, 34.31024169921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 11.0, 12.0, 10.0, 13.0, 12.0, 26.0, 16.0, 21.0, 28.0, 36.0, 28.0, 39.0, 44.0, 35.0, 39.0, 55.0, 51.0, 49.0, 40.0, 30.0, 52.0, 40.0, 42.0, 36.0, 36.0, 28.0, 22.0, 23.0, 17.0, 18.0, 14.0, 11.0, 13.0, 10.0, 8.0, 4.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.090295314788818, -3.941415786743164, -3.792536497116089, -3.6436569690704346, -3.4947776794433594, -3.345898151397705, -3.197018623352051, -3.0481393337249756, -2.8992600440979004, -2.750380516052246, -2.601501226425171, -2.4526216983795166, -2.3037424087524414, -2.154862880706787, -2.005983352661133, -1.8571040630340576, -1.7082245349884033, -1.5593451261520386, -1.4104657173156738, -1.2615861892700195, -1.1127068996429443, -0.9638274312019348, -0.8149479627609253, -0.6660685539245605, -0.5171891450881958, -0.36830973625183105, -0.21943029761314392, -0.07055085897445679, 0.07832854986190796, 0.2272079586982727, 0.3760874271392822, 0.524966835975647, 0.6738462448120117, 0.8227256536483765, 0.9716050624847412, 1.1204845905303955, 1.2693638801574707, 1.418243408203125, 1.5671228170394897, 1.7160022258758545, 1.8648816347122192, 2.013761043548584, 2.1626405715942383, 2.3115198612213135, 2.4603993892669678, 2.609278678894043, 2.7581582069396973, 2.9070377349853516, 3.0559170246124268, 3.204796552658081, 3.3536758422851562, 3.5025553703308105, 3.6514346599578857, 3.80031418800354, 3.9491934776306152, 4.0980730056762695, 4.246952533721924, 4.395832061767578, 4.544711589813232, 4.6935906410217285, 4.842470169067383, 4.991349697113037, 5.140229225158691, 5.2891082763671875, 5.437987804412842]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 7.0, 15.0, 12.0, 14.0, 24.0, 34.0, 22.0, 48.0, 72.0, 91.0, 105.0, 208.0, 325.0, 632.0, 1167.0, 2668.0, 6301.0, 16624.0, 46503.0, 144732.0, 390998.0, 292608.0, 94042.0, 31108.0, 11496.0, 4458.0, 2019.0, 897.0, 470.0, 262.0, 165.0, 105.0, 83.0, 72.0, 27.0, 25.0, 22.0, 17.0, 18.0, 19.0, 10.0, 4.0, 8.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.06256103515625, -1.9884033203125, -1.91424560546875, -1.840087890625, -1.76593017578125, -1.6917724609375, -1.61761474609375, -1.54345703125, -1.46929931640625, -1.3951416015625, -1.32098388671875, -1.246826171875, -1.17266845703125, -1.0985107421875, -1.02435302734375, -0.9501953125, -0.87603759765625, -0.8018798828125, -0.72772216796875, -0.653564453125, -0.57940673828125, -0.5052490234375, -0.43109130859375, -0.35693359375, -0.28277587890625, -0.2086181640625, -0.13446044921875, -0.060302734375, 0.01385498046875, 0.0880126953125, 0.16217041015625, 0.236328125, 0.31048583984375, 0.3846435546875, 0.45880126953125, 0.532958984375, 0.60711669921875, 0.6812744140625, 0.75543212890625, 0.82958984375, 0.90374755859375, 0.9779052734375, 1.05206298828125, 1.126220703125, 1.20037841796875, 1.2745361328125, 1.34869384765625, 1.4228515625, 1.49700927734375, 1.5711669921875, 1.64532470703125, 1.719482421875, 1.79364013671875, 1.8677978515625, 1.94195556640625, 2.01611328125, 2.09027099609375, 2.1644287109375, 2.23858642578125, 2.312744140625, 2.38690185546875, 2.4610595703125, 2.53521728515625, 2.609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 12.0, 13.0, 8.0, 19.0, 27.0, 21.0, 32.0, 33.0, 32.0, 30.0, 42.0, 40.0, 46.0, 48.0, 50.0, 45.0, 50.0, 39.0, 46.0, 47.0, 34.0, 30.0, 28.0, 34.0, 27.0, 25.0, 27.0, 14.0, 15.0, 18.0, 16.0, 4.0, 10.0, 4.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.380859375, -2.3139495849609375, -2.247039794921875, -2.1801300048828125, -2.11322021484375, -2.0463104248046875, -1.979400634765625, -1.9124908447265625, -1.8455810546875, -1.7786712646484375, -1.711761474609375, -1.6448516845703125, -1.57794189453125, -1.5110321044921875, -1.444122314453125, -1.3772125244140625, -1.310302734375, -1.2433929443359375, -1.176483154296875, -1.1095733642578125, -1.04266357421875, -0.9757537841796875, -0.908843994140625, -0.8419342041015625, -0.7750244140625, -0.7081146240234375, -0.641204833984375, -0.5742950439453125, -0.50738525390625, -0.4404754638671875, -0.373565673828125, -0.3066558837890625, -0.23974609375, -0.1728363037109375, -0.105926513671875, -0.0390167236328125, 0.02789306640625, 0.0948028564453125, 0.161712646484375, 0.2286224365234375, 0.2955322265625, 0.3624420166015625, 0.429351806640625, 0.4962615966796875, 0.56317138671875, 0.6300811767578125, 0.696990966796875, 0.7639007568359375, 0.830810546875, 0.8977203369140625, 0.964630126953125, 1.0315399169921875, 1.09844970703125, 1.1653594970703125, 1.232269287109375, 1.2991790771484375, 1.3660888671875, 1.4329986572265625, 1.499908447265625, 1.5668182373046875, 1.63372802734375, 1.7006378173828125, 1.767547607421875, 1.8344573974609375, 1.9013671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 6.0, 7.0, 8.0, 13.0, 13.0, 20.0, 32.0, 34.0, 55.0, 65.0, 85.0, 146.0, 227.0, 449.0, 1015.0, 3452.0, 30894.0, 798764.0, 199535.0, 10250.0, 1883.0, 637.0, 313.0, 201.0, 129.0, 79.0, 57.0, 45.0, 28.0, 19.0, 22.0, 13.0, 17.0, 8.0, 11.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9765625, -6.7498779296875, -6.523193359375, -6.2965087890625, -6.06982421875, -5.8431396484375, -5.616455078125, -5.3897705078125, -5.1630859375, -4.9364013671875, -4.709716796875, -4.4830322265625, -4.25634765625, -4.0296630859375, -3.802978515625, -3.5762939453125, -3.349609375, -3.1229248046875, -2.896240234375, -2.6695556640625, -2.44287109375, -2.2161865234375, -1.989501953125, -1.7628173828125, -1.5361328125, -1.3094482421875, -1.082763671875, -0.8560791015625, -0.62939453125, -0.4027099609375, -0.176025390625, 0.0506591796875, 0.27734375, 0.5040283203125, 0.730712890625, 0.9573974609375, 1.18408203125, 1.4107666015625, 1.637451171875, 1.8641357421875, 2.0908203125, 2.3175048828125, 2.544189453125, 2.7708740234375, 2.99755859375, 3.2242431640625, 3.450927734375, 3.6776123046875, 3.904296875, 4.1309814453125, 4.357666015625, 4.5843505859375, 4.81103515625, 5.0377197265625, 5.264404296875, 5.4910888671875, 5.7177734375, 5.9444580078125, 6.171142578125, 6.3978271484375, 6.62451171875, 6.8511962890625, 7.077880859375, 7.3045654296875, 7.53125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 12.0, 15.0, 16.0, 29.0, 25.0, 31.0, 49.0, 43.0, 58.0, 66.0, 82.0, 60.0, 61.0, 82.0, 74.0, 53.0, 53.0, 45.0, 33.0, 31.0, 19.0, 14.0, 10.0, 6.0, 5.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.6640625, -15.224609375, -14.78515625, -14.345703125, -13.90625, -13.466796875, -13.02734375, -12.587890625, -12.1484375, -11.708984375, -11.26953125, -10.830078125, -10.390625, -9.951171875, -9.51171875, -9.072265625, -8.6328125, -8.193359375, -7.75390625, -7.314453125, -6.875, -6.435546875, -5.99609375, -5.556640625, -5.1171875, -4.677734375, -4.23828125, -3.798828125, -3.359375, -2.919921875, -2.48046875, -2.041015625, -1.6015625, -1.162109375, -0.72265625, -0.283203125, 0.15625, 0.595703125, 1.03515625, 1.474609375, 1.9140625, 2.353515625, 2.79296875, 3.232421875, 3.671875, 4.111328125, 4.55078125, 4.990234375, 5.4296875, 5.869140625, 6.30859375, 6.748046875, 7.1875, 7.626953125, 8.06640625, 8.505859375, 8.9453125, 9.384765625, 9.82421875, 10.263671875, 10.703125, 11.142578125, 11.58203125, 12.021484375, 12.4609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 9.0, 25.0, 60.0, 224.0, 3422.0, 1040811.0, 3625.0, 263.0, 62.0, 23.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.984375, -19.5546875, -19.125, -18.6953125, -18.265625, -17.8359375, -17.40625, -16.9765625, -16.546875, -16.1171875, -15.6875, -15.2578125, -14.828125, -14.3984375, -13.96875, -13.5390625, -13.109375, -12.6796875, -12.25, -11.8203125, -11.390625, -10.9609375, -10.53125, -10.1015625, -9.671875, -9.2421875, -8.8125, -8.3828125, -7.953125, -7.5234375, -7.09375, -6.6640625, -6.234375, -5.8046875, -5.375, -4.9453125, -4.515625, -4.0859375, -3.65625, -3.2265625, -2.796875, -2.3671875, -1.9375, -1.5078125, -1.078125, -0.6484375, -0.21875, 0.2109375, 0.640625, 1.0703125, 1.5, 1.9296875, 2.359375, 2.7890625, 3.21875, 3.6484375, 4.078125, 4.5078125, 4.9375, 5.3671875, 5.796875, 6.2265625, 6.65625, 7.0859375, 7.515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 16.0, 23.0, 28.0, 54.0, 103.0, 128.0, 185.0, 183.0, 102.0, 59.0, 44.0, 12.0, 14.0, 12.0, 8.0, 4.0, 1.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031447410583496094, -0.0003067515790462494, -0.00029902905225753784, -0.0002913065254688263, -0.00028358399868011475, -0.0002758614718914032, -0.00026813894510269165, -0.0002604164183139801, -0.00025269389152526855, -0.000244971364736557, -0.00023724883794784546, -0.0002295263111591339, -0.00022180378437042236, -0.00021408125758171082, -0.00020635873079299927, -0.00019863620400428772, -0.00019091367721557617, -0.00018319115042686462, -0.00017546862363815308, -0.00016774609684944153, -0.00016002357006072998, -0.00015230104327201843, -0.00014457851648330688, -0.00013685598969459534, -0.0001291334629058838, -0.00012141093611717224, -0.0001136884093284607, -0.00010596588253974915, -9.82433557510376e-05, -9.052082896232605e-05, -8.27983021736145e-05, -7.507577538490295e-05, -6.73532485961914e-05, -5.963072180747986e-05, -5.190819501876831e-05, -4.418566823005676e-05, -3.6463141441345215e-05, -2.8740614652633667e-05, -2.101808786392212e-05, -1.3295561075210571e-05, -5.5730342864990234e-06, 2.1494925022125244e-06, 9.872019290924072e-06, 1.759454607963562e-05, 2.5317072868347168e-05, 3.3039599657058716e-05, 4.0762126445770264e-05, 4.848465323448181e-05, 5.620718002319336e-05, 6.392970681190491e-05, 7.165223360061646e-05, 7.9374760389328e-05, 8.709728717803955e-05, 9.48198139667511e-05, 0.00010254234075546265, 0.0001102648675441742, 0.00011798739433288574, 0.0001257099211215973, 0.00013343244791030884, 0.00014115497469902039, 0.00014887750148773193, 0.00015660002827644348, 0.00016432255506515503, 0.00017204508185386658, 0.00017976760864257812]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 11.0, 18.0, 46.0, 105.0, 362.0, 1217.0, 46448.0, 995563.0, 3885.0, 560.0, 180.0, 82.0, 25.0, 19.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.50390625, -6.2813720703125, -6.058837890625, -5.8363037109375, -5.61376953125, -5.3912353515625, -5.168701171875, -4.9461669921875, -4.7236328125, -4.5010986328125, -4.278564453125, -4.0560302734375, -3.83349609375, -3.6109619140625, -3.388427734375, -3.1658935546875, -2.943359375, -2.7208251953125, -2.498291015625, -2.2757568359375, -2.05322265625, -1.8306884765625, -1.608154296875, -1.3856201171875, -1.1630859375, -0.9405517578125, -0.718017578125, -0.4954833984375, -0.27294921875, -0.0504150390625, 0.172119140625, 0.3946533203125, 0.6171875, 0.8397216796875, 1.062255859375, 1.2847900390625, 1.50732421875, 1.7298583984375, 1.952392578125, 2.1749267578125, 2.3974609375, 2.6199951171875, 2.842529296875, 3.0650634765625, 3.28759765625, 3.5101318359375, 3.732666015625, 3.9552001953125, 4.177734375, 4.4002685546875, 4.622802734375, 4.8453369140625, 5.06787109375, 5.2904052734375, 5.512939453125, 5.7354736328125, 5.9580078125, 6.1805419921875, 6.403076171875, 6.6256103515625, 6.84814453125, 7.0706787109375, 7.293212890625, 7.5157470703125, 7.73828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 8.0, 18.0, 63.0, 232.0, 471.0, 154.0, 35.0, 14.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -2.964324951171875, -2.67669677734375, -2.389068603515625, -2.1014404296875, -1.813812255859375, -1.52618408203125, -1.238555908203125, -0.950927734375, -0.663299560546875, -0.37567138671875, -0.088043212890625, 0.1995849609375, 0.487213134765625, 0.77484130859375, 1.062469482421875, 1.35009765625, 1.637725830078125, 1.92535400390625, 2.212982177734375, 2.5006103515625, 2.788238525390625, 3.07586669921875, 3.363494873046875, 3.651123046875, 3.938751220703125, 4.22637939453125, 4.514007568359375, 4.8016357421875, 5.089263916015625, 5.37689208984375, 5.664520263671875, 5.9521484375, 6.239776611328125, 6.52740478515625, 6.815032958984375, 7.1026611328125, 7.390289306640625, 7.67791748046875, 7.965545654296875, 8.253173828125, 8.540802001953125, 8.82843017578125, 9.116058349609375, 9.4036865234375, 9.691314697265625, 9.97894287109375, 10.266571044921875, 10.55419921875, 10.841827392578125, 11.12945556640625, 11.417083740234375, 11.7047119140625, 11.992340087890625, 12.27996826171875, 12.567596435546875, 12.855224609375, 13.142852783203125, 13.43048095703125, 13.718109130859375, 14.0057373046875, 14.293365478515625, 14.58099365234375, 14.868621826171875, 15.15625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 44.0, 571.0, 327.0, 38.0, 10.0, 9.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.04873657226562, -164.12355041503906, -158.19834899902344, -152.27316284179688, -146.34796142578125, -140.4227752685547, -134.49758911132812, -128.5723876953125, -122.6471939086914, -116.72200012207031, -110.79680633544922, -104.87161254882812, -98.94642639160156, -93.02122497558594, -87.09603881835938, -81.17084503173828, -75.24565124511719, -69.3204574584961, -63.395263671875, -57.47007369995117, -51.54487991333008, -45.619686126708984, -39.694496154785156, -33.76930236816406, -27.84410858154297, -21.918914794921875, -15.993722915649414, -10.068531036376953, -4.143337249755859, 1.7818565368652344, 7.7070465087890625, 13.632240295410156, 19.55743408203125, 25.482627868652344, 31.407819747924805, 37.333011627197266, 43.25820541381836, 49.18339920043945, 55.10858917236328, 61.033782958984375, 66.95897674560547, 72.88417053222656, 78.80936431884766, 84.73455810546875, 90.65974426269531, 96.58494567871094, 102.5101318359375, 108.4353256225586, 114.36051940917969, 120.28571319580078, 126.21090698242188, 132.13609313964844, 138.06129455566406, 143.98648071289062, 149.91168212890625, 155.8368682861328, 161.76205444335938, 167.68724060058594, 173.61244201660156, 179.53762817382812, 185.46282958984375, 191.3880157470703, 197.31320190429688, 203.2384033203125, 209.16360473632812]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 9.0, 12.0, 16.0, 11.0, 15.0, 12.0, 19.0, 21.0, 23.0, 38.0, 44.0, 36.0, 36.0, 52.0, 52.0, 47.0, 52.0, 47.0, 45.0, 60.0, 43.0, 43.0, 37.0, 37.0, 31.0, 13.0, 25.0, 25.0, 19.0, 12.0, 11.0, 8.0, 7.0, 11.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.665367126464844, -42.15768814086914, -40.6500129699707, -39.142333984375, -37.6346549987793, -36.126976013183594, -34.619300842285156, -33.11162185668945, -31.60394287109375, -30.09626579284668, -28.588586807250977, -27.080909729003906, -25.573230743408203, -24.065553665161133, -22.557876586914062, -21.05019760131836, -19.54252052307129, -18.03484344482422, -16.527164459228516, -15.019487380981445, -13.511808395385742, -12.004131317138672, -10.496453285217285, -8.988775253295898, -7.481097221374512, -5.973419189453125, -4.465741157531738, -2.9580636024475098, -1.450385570526123, 0.05729246139526367, 1.5649700164794922, 3.072648048400879, 4.580326080322266, 6.088004112243652, 7.595682144165039, 9.10335922241211, 10.611038208007812, 12.118715286254883, 13.62639331817627, 15.134071350097656, 16.64175033569336, 18.14942741394043, 19.657106399536133, 21.164783477783203, 22.672462463378906, 24.180139541625977, 25.687816619873047, 27.19549560546875, 28.70317268371582, 30.21084976196289, 31.718528747558594, 33.2262077331543, 34.733882904052734, 36.24156188964844, 37.74924087524414, 39.256919860839844, 40.76459503173828, 42.272274017333984, 43.77994918823242, 45.287628173828125, 46.79530715942383, 48.30298614501953, 49.81066131591797, 51.31834030151367, 52.826019287109375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 9.0, 12.0, 15.0, 13.0, 29.0, 20.0, 42.0, 53.0, 70.0, 89.0, 125.0, 175.0, 213.0, 254.0, 372.0, 528.0, 1039.0, 2122.0, 8154.0, 179746.0, 3985410.0, 10103.0, 2487.0, 1067.0, 563.0, 367.0, 276.0, 222.0, 156.0, 134.0, 116.0, 80.0, 67.0, 30.0, 35.0, 27.0, 21.0, 15.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.548828125, -3.43817138671875, -3.3275146484375, -3.21685791015625, -3.106201171875, -2.99554443359375, -2.8848876953125, -2.77423095703125, -2.66357421875, -2.55291748046875, -2.4422607421875, -2.33160400390625, -2.220947265625, -2.11029052734375, -1.9996337890625, -1.88897705078125, -1.7783203125, -1.66766357421875, -1.5570068359375, -1.44635009765625, -1.335693359375, -1.22503662109375, -1.1143798828125, -1.00372314453125, -0.89306640625, -0.78240966796875, -0.6717529296875, -0.56109619140625, -0.450439453125, -0.33978271484375, -0.2291259765625, -0.11846923828125, -0.0078125, 0.10284423828125, 0.2135009765625, 0.32415771484375, 0.434814453125, 0.54547119140625, 0.6561279296875, 0.76678466796875, 0.87744140625, 0.98809814453125, 1.0987548828125, 1.20941162109375, 1.320068359375, 1.43072509765625, 1.5413818359375, 1.65203857421875, 1.7626953125, 1.87335205078125, 1.9840087890625, 2.09466552734375, 2.205322265625, 2.31597900390625, 2.4266357421875, 2.53729248046875, 2.64794921875, 2.75860595703125, 2.8692626953125, 2.97991943359375, 3.090576171875, 3.20123291015625, 3.3118896484375, 3.42254638671875, 3.533203125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 7.0, 8.0, 8.0, 8.0, 10.0, 14.0, 12.0, 15.0, 20.0, 22.0, 32.0, 26.0, 32.0, 44.0, 50.0, 60.0, 57.0, 56.0, 52.0, 67.0, 48.0, 44.0, 31.0, 35.0, 28.0, 30.0, 41.0, 26.0, 23.0, 28.0, 16.0, 12.0, 9.0, 6.0, 6.0, 7.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.598236083984375, -2.51287841796875, -2.427520751953125, -2.3421630859375, -2.256805419921875, -2.17144775390625, -2.086090087890625, -2.000732421875, -1.915374755859375, -1.83001708984375, -1.744659423828125, -1.6593017578125, -1.573944091796875, -1.48858642578125, -1.403228759765625, -1.31787109375, -1.232513427734375, -1.14715576171875, -1.061798095703125, -0.9764404296875, -0.891082763671875, -0.80572509765625, -0.720367431640625, -0.635009765625, -0.549652099609375, -0.46429443359375, -0.378936767578125, -0.2935791015625, -0.208221435546875, -0.12286376953125, -0.037506103515625, 0.0478515625, 0.133209228515625, 0.21856689453125, 0.303924560546875, 0.3892822265625, 0.474639892578125, 0.55999755859375, 0.645355224609375, 0.730712890625, 0.816070556640625, 0.90142822265625, 0.986785888671875, 1.0721435546875, 1.157501220703125, 1.24285888671875, 1.328216552734375, 1.41357421875, 1.498931884765625, 1.58428955078125, 1.669647216796875, 1.7550048828125, 1.840362548828125, 1.92572021484375, 2.011077880859375, 2.096435546875, 2.181793212890625, 2.26715087890625, 2.352508544921875, 2.4378662109375, 2.523223876953125, 2.60858154296875, 2.693939208984375, 2.779296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 9.0, 5.0, 9.0, 17.0, 10.0, 23.0, 38.0, 56.0, 62.0, 86.0, 122.0, 128.0, 160.0, 226.0, 420.0, 1589.0, 20497.0, 4164701.0, 4233.0, 811.0, 292.0, 195.0, 136.0, 98.0, 101.0, 72.0, 54.0, 46.0, 32.0, 19.0, 12.0, 11.0, 12.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1484375, -11.8133544921875, -11.478271484375, -11.1431884765625, -10.80810546875, -10.4730224609375, -10.137939453125, -9.8028564453125, -9.4677734375, -9.1326904296875, -8.797607421875, -8.4625244140625, -8.12744140625, -7.7923583984375, -7.457275390625, -7.1221923828125, -6.787109375, -6.4520263671875, -6.116943359375, -5.7818603515625, -5.44677734375, -5.1116943359375, -4.776611328125, -4.4415283203125, -4.1064453125, -3.7713623046875, -3.436279296875, -3.1011962890625, -2.76611328125, -2.4310302734375, -2.095947265625, -1.7608642578125, -1.42578125, -1.0906982421875, -0.755615234375, -0.4205322265625, -0.08544921875, 0.2496337890625, 0.584716796875, 0.9197998046875, 1.2548828125, 1.5899658203125, 1.925048828125, 2.2601318359375, 2.59521484375, 2.9302978515625, 3.265380859375, 3.6004638671875, 3.935546875, 4.2706298828125, 4.605712890625, 4.9407958984375, 5.27587890625, 5.6109619140625, 5.946044921875, 6.2811279296875, 6.6162109375, 6.9512939453125, 7.286376953125, 7.6214599609375, 7.95654296875, 8.2916259765625, 8.626708984375, 8.9617919921875, 9.296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 43.0, 3993.0, 28.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.3468017578125, -4.220947265625, -4.0950927734375, -3.96923828125, -3.8433837890625, -3.717529296875, -3.5916748046875, -3.4658203125, -3.3399658203125, -3.214111328125, -3.0882568359375, -2.96240234375, -2.8365478515625, -2.710693359375, -2.5848388671875, -2.458984375, -2.3331298828125, -2.207275390625, -2.0814208984375, -1.95556640625, -1.8297119140625, -1.703857421875, -1.5780029296875, -1.4521484375, -1.3262939453125, -1.200439453125, -1.0745849609375, -0.94873046875, -0.8228759765625, -0.697021484375, -0.5711669921875, -0.4453125, -0.3194580078125, -0.193603515625, -0.0677490234375, 0.05810546875, 0.1839599609375, 0.309814453125, 0.4356689453125, 0.5615234375, 0.6873779296875, 0.813232421875, 0.9390869140625, 1.06494140625, 1.1907958984375, 1.316650390625, 1.4425048828125, 1.568359375, 1.6942138671875, 1.820068359375, 1.9459228515625, 2.07177734375, 2.1976318359375, 2.323486328125, 2.4493408203125, 2.5751953125, 2.7010498046875, 2.826904296875, 2.9527587890625, 3.07861328125, 3.2044677734375, 3.330322265625, 3.4561767578125, 3.58203125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 28.0, 87.0, 306.0, 435.0, 119.0, 20.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.674741744995117, -13.319316864013672, -12.963892936706543, -12.608469009399414, -12.253044128417969, -11.897619247436523, -11.542195320129395, -11.186771392822266, -10.83134651184082, -10.475921630859375, -10.120497703552246, -9.765073776245117, -9.409648895263672, -9.054224014282227, -8.698800086975098, -8.343376159667969, -7.987951278686523, -7.632526874542236, -7.277102470397949, -6.921678066253662, -6.566253662109375, -6.210829257965088, -5.855404853820801, -5.499980449676514, -5.144556045532227, -4.7891316413879395, -4.433707237243652, -4.078282833099365, -3.722858428955078, -3.367434024810791, -3.012009620666504, -2.656585216522217, -2.301161766052246, -1.945737361907959, -1.5903129577636719, -1.2348885536193848, -0.8794641494750977, -0.5240397453308105, -0.16861534118652344, 0.18680906295776367, 0.5422334671020508, 0.8976578712463379, 1.253082275390625, 1.608506679534912, 1.9639310836791992, 2.3193554878234863, 2.6747798919677734, 3.0302042961120605, 3.3856287002563477, 3.7410531044006348, 4.096477508544922, 4.451901912689209, 4.807326316833496, 5.162750720977783, 5.51817512512207, 5.873599529266357, 6.2290239334106445, 6.584448337554932, 6.939872741699219, 7.295297145843506, 7.650721549987793, 8.006145477294922, 8.361570358276367, 8.716995239257812, 9.072419166564941]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 7.0, 13.0, 7.0, 7.0, 19.0, 15.0, 19.0, 22.0, 16.0, 25.0, 31.0, 26.0, 26.0, 33.0, 38.0, 28.0, 34.0, 31.0, 40.0, 37.0, 50.0, 41.0, 33.0, 46.0, 43.0, 41.0, 35.0, 26.0, 26.0, 29.0, 24.0, 23.0, 15.0, 15.0, 12.0, 12.0, 9.0, 10.0, 3.0, 5.0, 5.0, 7.0, 2.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5065388679504395, -2.421565294265747, -2.3365917205810547, -2.251617908477783, -2.166644334793091, -2.0816707611083984, -1.996697187423706, -1.9117236137390137, -1.8267499208450317, -1.7417763471603394, -1.6568026542663574, -1.571829080581665, -1.4868555068969727, -1.4018818140029907, -1.3169082403182983, -1.2319345474243164, -1.146960973739624, -1.0619874000549316, -0.9770137071609497, -0.8920401334762573, -0.8070665001869202, -0.722092866897583, -0.6371192932128906, -0.5521456599235535, -0.4671720266342163, -0.38219839334487915, -0.2972247898578644, -0.2122511863708496, -0.12727755308151245, -0.04230391979217529, 0.04266965389251709, 0.12764328718185425, 0.2126169204711914, 0.29759055376052856, 0.38256415724754333, 0.4675377607345581, 0.5525113940238953, 0.6374850273132324, 0.7224586009979248, 0.807432234287262, 0.8924058675765991, 0.9773795008659363, 1.0623531341552734, 1.1473267078399658, 1.2323002815246582, 1.3172739744186401, 1.4022475481033325, 1.4872212409973145, 1.5721948146820068, 1.6571683883666992, 1.7421420812606812, 1.8271156549453735, 1.9120893478393555, 1.9970629215240479, 2.0820364952087402, 2.1670100688934326, 2.251983642578125, 2.3369572162628174, 2.4219307899475098, 2.5069046020507812, 2.5918781757354736, 2.676851749420166, 2.7618253231048584, 2.846798896789551, 2.9317727088928223]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 17.0, 20.0, 27.0, 33.0, 61.0, 98.0, 174.0, 274.0, 440.0, 719.0, 1354.0, 2441.0, 4501.0, 8541.0, 16709.0, 35764.0, 83154.0, 212828.0, 356388.0, 186964.0, 73723.0, 32120.0, 15018.0, 7821.0, 4161.0, 2214.0, 1285.0, 665.0, 389.0, 226.0, 141.0, 92.0, 53.0, 37.0, 30.0, 22.0, 11.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.939453125, -1.87774658203125, -1.8160400390625, -1.75433349609375, -1.692626953125, -1.63092041015625, -1.5692138671875, -1.50750732421875, -1.44580078125, -1.38409423828125, -1.3223876953125, -1.26068115234375, -1.198974609375, -1.13726806640625, -1.0755615234375, -1.01385498046875, -0.9521484375, -0.89044189453125, -0.8287353515625, -0.76702880859375, -0.705322265625, -0.64361572265625, -0.5819091796875, -0.52020263671875, -0.45849609375, -0.39678955078125, -0.3350830078125, -0.27337646484375, -0.211669921875, -0.14996337890625, -0.0882568359375, -0.02655029296875, 0.03515625, 0.09686279296875, 0.1585693359375, 0.22027587890625, 0.281982421875, 0.34368896484375, 0.4053955078125, 0.46710205078125, 0.52880859375, 0.59051513671875, 0.6522216796875, 0.71392822265625, 0.775634765625, 0.83734130859375, 0.8990478515625, 0.96075439453125, 1.0224609375, 1.08416748046875, 1.1458740234375, 1.20758056640625, 1.269287109375, 1.33099365234375, 1.3927001953125, 1.45440673828125, 1.51611328125, 1.57781982421875, 1.6395263671875, 1.70123291015625, 1.762939453125, 1.82464599609375, 1.8863525390625, 1.94805908203125, 2.009765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 10.0, 7.0, 11.0, 8.0, 10.0, 16.0, 15.0, 25.0, 26.0, 31.0, 32.0, 26.0, 47.0, 43.0, 54.0, 61.0, 61.0, 53.0, 51.0, 52.0, 42.0, 34.0, 40.0, 27.0, 24.0, 31.0, 25.0, 23.0, 28.0, 20.0, 17.0, 8.0, 15.0, 6.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.12786865234375, -2.0467529296875, -1.96563720703125, -1.884521484375, -1.80340576171875, -1.7222900390625, -1.64117431640625, -1.56005859375, -1.47894287109375, -1.3978271484375, -1.31671142578125, -1.235595703125, -1.15447998046875, -1.0733642578125, -0.99224853515625, -0.9111328125, -0.83001708984375, -0.7489013671875, -0.66778564453125, -0.586669921875, -0.50555419921875, -0.4244384765625, -0.34332275390625, -0.26220703125, -0.18109130859375, -0.0999755859375, -0.01885986328125, 0.062255859375, 0.14337158203125, 0.2244873046875, 0.30560302734375, 0.38671875, 0.46783447265625, 0.5489501953125, 0.63006591796875, 0.711181640625, 0.79229736328125, 0.8734130859375, 0.95452880859375, 1.03564453125, 1.11676025390625, 1.1978759765625, 1.27899169921875, 1.360107421875, 1.44122314453125, 1.5223388671875, 1.60345458984375, 1.6845703125, 1.76568603515625, 1.8468017578125, 1.92791748046875, 2.009033203125, 2.09014892578125, 2.1712646484375, 2.25238037109375, 2.33349609375, 2.41461181640625, 2.4957275390625, 2.57684326171875, 2.657958984375, 2.73907470703125, 2.8201904296875, 2.90130615234375, 2.982421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 12.0, 6.0, 7.0, 10.0, 11.0, 14.0, 19.0, 23.0, 37.0, 47.0, 60.0, 73.0, 114.0, 155.0, 245.0, 617.0, 1275.0, 3655.0, 17394.0, 190536.0, 762252.0, 59248.0, 8367.0, 2325.0, 873.0, 398.0, 238.0, 153.0, 93.0, 69.0, 49.0, 50.0, 27.0, 23.0, 14.0, 14.0, 8.0, 14.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.99609375, -5.81597900390625, -5.6358642578125, -5.45574951171875, -5.275634765625, -5.09552001953125, -4.9154052734375, -4.73529052734375, -4.55517578125, -4.37506103515625, -4.1949462890625, -4.01483154296875, -3.834716796875, -3.65460205078125, -3.4744873046875, -3.29437255859375, -3.1142578125, -2.93414306640625, -2.7540283203125, -2.57391357421875, -2.393798828125, -2.21368408203125, -2.0335693359375, -1.85345458984375, -1.67333984375, -1.49322509765625, -1.3131103515625, -1.13299560546875, -0.952880859375, -0.77276611328125, -0.5926513671875, -0.41253662109375, -0.232421875, -0.05230712890625, 0.1278076171875, 0.30792236328125, 0.488037109375, 0.66815185546875, 0.8482666015625, 1.02838134765625, 1.20849609375, 1.38861083984375, 1.5687255859375, 1.74884033203125, 1.928955078125, 2.10906982421875, 2.2891845703125, 2.46929931640625, 2.6494140625, 2.82952880859375, 3.0096435546875, 3.18975830078125, 3.369873046875, 3.54998779296875, 3.7301025390625, 3.91021728515625, 4.09033203125, 4.27044677734375, 4.4505615234375, 4.63067626953125, 4.810791015625, 4.99090576171875, 5.1710205078125, 5.35113525390625, 5.53125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 7.0, 3.0, 9.0, 7.0, 9.0, 14.0, 20.0, 22.0, 29.0, 42.0, 40.0, 44.0, 54.0, 72.0, 56.0, 64.0, 75.0, 55.0, 59.0, 50.0, 49.0, 47.0, 36.0, 26.0, 26.0, 23.0, 22.0, 13.0, 7.0, 7.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.25, -16.7860107421875, -16.322021484375, -15.8580322265625, -15.39404296875, -14.9300537109375, -14.466064453125, -14.0020751953125, -13.5380859375, -13.0740966796875, -12.610107421875, -12.1461181640625, -11.68212890625, -11.2181396484375, -10.754150390625, -10.2901611328125, -9.826171875, -9.3621826171875, -8.898193359375, -8.4342041015625, -7.97021484375, -7.5062255859375, -7.042236328125, -6.5782470703125, -6.1142578125, -5.6502685546875, -5.186279296875, -4.7222900390625, -4.25830078125, -3.7943115234375, -3.330322265625, -2.8663330078125, -2.40234375, -1.9383544921875, -1.474365234375, -1.0103759765625, -0.54638671875, -0.0823974609375, 0.381591796875, 0.8455810546875, 1.3095703125, 1.7735595703125, 2.237548828125, 2.7015380859375, 3.16552734375, 3.6295166015625, 4.093505859375, 4.5574951171875, 5.021484375, 5.4854736328125, 5.949462890625, 6.4134521484375, 6.87744140625, 7.3414306640625, 7.805419921875, 8.2694091796875, 8.7333984375, 9.1973876953125, 9.661376953125, 10.1253662109375, 10.58935546875, 11.0533447265625, 11.517333984375, 11.9813232421875, 12.4453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 10.0, 7.0, 41.0, 180.0, 2551.0, 1043661.0, 1847.0, 168.0, 44.0, 17.0, 4.0, 8.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.1893310546875, -7.745849609375, -7.3023681640625, -6.85888671875, -6.4154052734375, -5.971923828125, -5.5284423828125, -5.0849609375, -4.6414794921875, -4.197998046875, -3.7545166015625, -3.31103515625, -2.8675537109375, -2.424072265625, -1.9805908203125, -1.537109375, -1.0936279296875, -0.650146484375, -0.2066650390625, 0.23681640625, 0.6802978515625, 1.123779296875, 1.5672607421875, 2.0107421875, 2.4542236328125, 2.897705078125, 3.3411865234375, 3.78466796875, 4.2281494140625, 4.671630859375, 5.1151123046875, 5.55859375, 6.0020751953125, 6.445556640625, 6.8890380859375, 7.33251953125, 7.7760009765625, 8.219482421875, 8.6629638671875, 9.1064453125, 9.5499267578125, 9.993408203125, 10.4368896484375, 10.88037109375, 11.3238525390625, 11.767333984375, 12.2108154296875, 12.654296875, 13.0977783203125, 13.541259765625, 13.9847412109375, 14.42822265625, 14.8717041015625, 15.315185546875, 15.7586669921875, 16.2021484375, 16.6456298828125, 17.089111328125, 17.5325927734375, 17.97607421875, 18.4195556640625, 18.863037109375, 19.3065185546875, 19.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 11.0, 11.0, 17.0, 17.0, 31.0, 33.0, 61.0, 80.0, 91.0, 104.0, 111.0, 97.0, 81.0, 62.0, 49.0, 30.0, 32.0, 23.0, 13.0, 11.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00016427040100097656, -0.00015943869948387146, -0.00015460699796676636, -0.00014977529644966125, -0.00014494359493255615, -0.00014011189341545105, -0.00013528019189834595, -0.00013044849038124084, -0.00012561678886413574, -0.00012078508734703064, -0.00011595338582992554, -0.00011112168431282043, -0.00010628998279571533, -0.00010145828127861023, -9.662657976150513e-05, -9.179487824440002e-05, -8.696317672729492e-05, -8.213147521018982e-05, -7.729977369308472e-05, -7.246807217597961e-05, -6.763637065887451e-05, -6.280466914176941e-05, -5.797296762466431e-05, -5.3141266107559204e-05, -4.83095645904541e-05, -4.3477863073349e-05, -3.8646161556243896e-05, -3.3814460039138794e-05, -2.898275852203369e-05, -2.415105700492859e-05, -1.9319355487823486e-05, -1.4487653970718384e-05, -9.655952453613281e-06, -4.824250936508179e-06, 7.450580596923828e-09, 4.839152097702026e-06, 9.670853614807129e-06, 1.4502555131912231e-05, 1.9334256649017334e-05, 2.4165958166122437e-05, 2.899765968322754e-05, 3.382936120033264e-05, 3.8661062717437744e-05, 4.349276423454285e-05, 4.832446575164795e-05, 5.315616726875305e-05, 5.7987868785858154e-05, 6.281957030296326e-05, 6.765127182006836e-05, 7.248297333717346e-05, 7.731467485427856e-05, 8.214637637138367e-05, 8.697807788848877e-05, 9.180977940559387e-05, 9.664148092269897e-05, 0.00010147318243980408, 0.00010630488395690918, 0.00011113658547401428, 0.00011596828699111938, 0.00012079998850822449, 0.0001256316900253296, 0.0001304633915424347, 0.0001352950930595398, 0.0001401267945766449, 0.00014495849609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 10.0, 15.0, 28.0, 57.0, 87.0, 218.0, 586.0, 2440.0, 29598.0, 979641.0, 32280.0, 2520.0, 607.0, 218.0, 106.0, 49.0, 24.0, 22.0, 14.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.79608154296875, -2.6820068359375, -2.56793212890625, -2.453857421875, -2.33978271484375, -2.2257080078125, -2.11163330078125, -1.99755859375, -1.88348388671875, -1.7694091796875, -1.65533447265625, -1.541259765625, -1.42718505859375, -1.3131103515625, -1.19903564453125, -1.0849609375, -0.97088623046875, -0.8568115234375, -0.74273681640625, -0.628662109375, -0.51458740234375, -0.4005126953125, -0.28643798828125, -0.17236328125, -0.05828857421875, 0.0557861328125, 0.16986083984375, 0.283935546875, 0.39801025390625, 0.5120849609375, 0.62615966796875, 0.740234375, 0.85430908203125, 0.9683837890625, 1.08245849609375, 1.196533203125, 1.31060791015625, 1.4246826171875, 1.53875732421875, 1.65283203125, 1.76690673828125, 1.8809814453125, 1.99505615234375, 2.109130859375, 2.22320556640625, 2.3372802734375, 2.45135498046875, 2.5654296875, 2.67950439453125, 2.7935791015625, 2.90765380859375, 3.021728515625, 3.13580322265625, 3.2498779296875, 3.36395263671875, 3.47802734375, 3.59210205078125, 3.7061767578125, 3.82025146484375, 3.934326171875, 4.04840087890625, 4.1624755859375, 4.27655029296875, 4.390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 15.0, 18.0, 97.0, 186.0, 268.0, 217.0, 107.0, 44.0, 12.0, 12.0, 1.0, 7.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.951171875, -3.750518798828125, -3.54986572265625, -3.349212646484375, -3.1485595703125, -2.947906494140625, -2.74725341796875, -2.546600341796875, -2.345947265625, -2.145294189453125, -1.94464111328125, -1.743988037109375, -1.5433349609375, -1.342681884765625, -1.14202880859375, -0.941375732421875, -0.74072265625, -0.540069580078125, -0.33941650390625, -0.138763427734375, 0.0618896484375, 0.262542724609375, 0.46319580078125, 0.663848876953125, 0.864501953125, 1.065155029296875, 1.26580810546875, 1.466461181640625, 1.6671142578125, 1.867767333984375, 2.06842041015625, 2.269073486328125, 2.4697265625, 2.670379638671875, 2.87103271484375, 3.071685791015625, 3.2723388671875, 3.472991943359375, 3.67364501953125, 3.874298095703125, 4.074951171875, 4.275604248046875, 4.47625732421875, 4.676910400390625, 4.8775634765625, 5.078216552734375, 5.27886962890625, 5.479522705078125, 5.68017578125, 5.880828857421875, 6.08148193359375, 6.282135009765625, 6.4827880859375, 6.683441162109375, 6.88409423828125, 7.084747314453125, 7.285400390625, 7.486053466796875, 7.68670654296875, 7.887359619140625, 8.0880126953125, 8.288665771484375, 8.48931884765625, 8.689971923828125, 8.890625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 21.0, 83.0, 296.0, 448.0, 114.0, 26.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.44511413574219, -82.52705383300781, -79.60899353027344, -76.69093322753906, -73.77287292480469, -70.85481262207031, -67.93675231933594, -65.01869201660156, -62.10062789916992, -59.18256759643555, -56.26450729370117, -53.34644317626953, -50.428382873535156, -47.51032257080078, -44.592262268066406, -41.67420196533203, -38.756141662597656, -35.83808135986328, -32.920021057128906, -30.0019588470459, -27.083898544311523, -24.16583824157715, -21.24777603149414, -18.329715728759766, -15.41165542602539, -12.493595123291016, -9.575533866882324, -6.657472610473633, -3.739412307739258, -0.8213520050048828, 2.096710205078125, 5.0147705078125, 7.932823181152344, 10.850883483886719, 13.76894474029541, 16.6870059967041, 19.605066299438477, 22.52312660217285, 25.44118881225586, 28.359249114990234, 31.27730941772461, 34.195369720458984, 37.11343002319336, 40.031494140625, 42.949554443359375, 45.86761474609375, 48.785675048828125, 51.7037353515625, 54.621795654296875, 57.53985595703125, 60.457916259765625, 63.3759765625, 66.29403686523438, 69.21209716796875, 72.13015747070312, 75.0482177734375, 77.96627807617188, 80.88433837890625, 83.80239868164062, 86.720458984375, 89.63851928710938, 92.55657958984375, 95.47463989257812, 98.3927001953125, 101.3107681274414]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 9.0, 9.0, 8.0, 11.0, 15.0, 15.0, 11.0, 10.0, 27.0, 31.0, 26.0, 20.0, 33.0, 48.0, 41.0, 42.0, 46.0, 53.0, 47.0, 58.0, 43.0, 48.0, 41.0, 27.0, 30.0, 19.0, 37.0, 31.0, 19.0, 21.0, 23.0, 15.0, 17.0, 8.0, 7.0, 11.0, 7.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-48.65369415283203, -47.24525451660156, -45.83681106567383, -44.42837142944336, -43.019927978515625, -41.611488342285156, -40.20304870605469, -38.79460525512695, -37.386165618896484, -35.977725982666016, -34.56928253173828, -33.16084289550781, -31.75240135192871, -30.34395980834961, -28.935518264770508, -27.527076721191406, -26.118635177612305, -24.710193634033203, -23.3017520904541, -21.893310546875, -20.48487091064453, -19.07642936706543, -17.667987823486328, -16.25954818725586, -14.851105690002441, -13.44266414642334, -12.034223556518555, -10.625782012939453, -9.217340469360352, -7.808899879455566, -6.400458335876465, -4.99201774597168, -3.583576202392578, -2.1751351356506348, -0.7666938304901123, 0.6417474746704102, 2.0501885414123535, 3.458629608154297, 4.867071151733398, 6.275511741638184, 7.683953285217285, 9.092394828796387, 10.500835418701172, 11.909276962280273, 13.317718505859375, 14.72615909576416, 16.134601593017578, 17.543041229248047, 18.95148277282715, 20.35992431640625, 21.76836585998535, 23.176807403564453, 24.585247039794922, 25.993688583374023, 27.402130126953125, 28.810569763183594, 30.219013214111328, 31.62745475769043, 33.03589630126953, 34.4443359375, 35.852779388427734, 37.2612190246582, 38.66966247558594, 40.078102111816406, 41.486541748046875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 4.0, 6.0, 21.0, 17.0, 31.0, 43.0, 69.0, 86.0, 118.0, 187.0, 252.0, 520.0, 1177.0, 3758.0, 50091.0, 4120692.0, 13294.0, 2058.0, 732.0, 376.0, 238.0, 163.0, 100.0, 64.0, 52.0, 36.0, 26.0, 18.0, 11.0, 9.0, 10.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8671875, -6.68316650390625, -6.4991455078125, -6.31512451171875, -6.131103515625, -5.94708251953125, -5.7630615234375, -5.57904052734375, -5.39501953125, -5.21099853515625, -5.0269775390625, -4.84295654296875, -4.658935546875, -4.47491455078125, -4.2908935546875, -4.10687255859375, -3.9228515625, -3.73883056640625, -3.5548095703125, -3.37078857421875, -3.186767578125, -3.00274658203125, -2.8187255859375, -2.63470458984375, -2.45068359375, -2.26666259765625, -2.0826416015625, -1.89862060546875, -1.714599609375, -1.53057861328125, -1.3465576171875, -1.16253662109375, -0.978515625, -0.79449462890625, -0.6104736328125, -0.42645263671875, -0.242431640625, -0.05841064453125, 0.1256103515625, 0.30963134765625, 0.49365234375, 0.67767333984375, 0.8616943359375, 1.04571533203125, 1.229736328125, 1.41375732421875, 1.5977783203125, 1.78179931640625, 1.9658203125, 2.14984130859375, 2.3338623046875, 2.51788330078125, 2.701904296875, 2.88592529296875, 3.0699462890625, 3.25396728515625, 3.43798828125, 3.62200927734375, 3.8060302734375, 3.99005126953125, 4.174072265625, 4.35809326171875, 4.5421142578125, 4.72613525390625, 4.91015625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 7.0, 4.0, 7.0, 16.0, 16.0, 14.0, 20.0, 21.0, 22.0, 27.0, 36.0, 48.0, 28.0, 45.0, 60.0, 55.0, 55.0, 53.0, 60.0, 49.0, 54.0, 42.0, 28.0, 27.0, 28.0, 36.0, 32.0, 21.0, 17.0, 16.0, 9.0, 8.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.1640625, -3.08050537109375, -2.9969482421875, -2.91339111328125, -2.829833984375, -2.74627685546875, -2.6627197265625, -2.57916259765625, -2.49560546875, -2.41204833984375, -2.3284912109375, -2.24493408203125, -2.161376953125, -2.07781982421875, -1.9942626953125, -1.91070556640625, -1.8271484375, -1.74359130859375, -1.6600341796875, -1.57647705078125, -1.492919921875, -1.40936279296875, -1.3258056640625, -1.24224853515625, -1.15869140625, -1.07513427734375, -0.9915771484375, -0.90802001953125, -0.824462890625, -0.74090576171875, -0.6573486328125, -0.57379150390625, -0.490234375, -0.40667724609375, -0.3231201171875, -0.23956298828125, -0.156005859375, -0.07244873046875, 0.0111083984375, 0.09466552734375, 0.17822265625, 0.26177978515625, 0.3453369140625, 0.42889404296875, 0.512451171875, 0.59600830078125, 0.6795654296875, 0.76312255859375, 0.8466796875, 0.93023681640625, 1.0137939453125, 1.09735107421875, 1.180908203125, 1.26446533203125, 1.3480224609375, 1.43157958984375, 1.51513671875, 1.59869384765625, 1.6822509765625, 1.76580810546875, 1.849365234375, 1.93292236328125, 2.0164794921875, 2.10003662109375, 2.18359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 6.0, 6.0, 9.0, 11.0, 20.0, 22.0, 17.0, 15.0, 18.0, 20.0, 31.0, 23.0, 36.0, 39.0, 49.0, 74.0, 125.0, 181.0, 309.0, 1046.0, 4165054.0, 25504.0, 653.0, 283.0, 182.0, 131.0, 71.0, 48.0, 33.0, 35.0, 20.0, 33.0, 24.0, 23.0, 15.0, 18.0, 14.0, 15.0, 20.0, 8.0, 7.0, 5.0, 7.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.515625, -25.597412109375, -24.67919921875, -23.760986328125, -22.8427734375, -21.924560546875, -21.00634765625, -20.088134765625, -19.169921875, -18.251708984375, -17.33349609375, -16.415283203125, -15.4970703125, -14.578857421875, -13.66064453125, -12.742431640625, -11.82421875, -10.906005859375, -9.98779296875, -9.069580078125, -8.1513671875, -7.233154296875, -6.31494140625, -5.396728515625, -4.478515625, -3.560302734375, -2.64208984375, -1.723876953125, -0.8056640625, 0.112548828125, 1.03076171875, 1.948974609375, 2.8671875, 3.785400390625, 4.70361328125, 5.621826171875, 6.5400390625, 7.458251953125, 8.37646484375, 9.294677734375, 10.212890625, 11.131103515625, 12.04931640625, 12.967529296875, 13.8857421875, 14.803955078125, 15.72216796875, 16.640380859375, 17.55859375, 18.476806640625, 19.39501953125, 20.313232421875, 21.2314453125, 22.149658203125, 23.06787109375, 23.986083984375, 24.904296875, 25.822509765625, 26.74072265625, 27.658935546875, 28.5771484375, 29.495361328125, 30.41357421875, 31.331787109375, 32.25]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 3.0, 21.0, 4040.0, 22.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.654296875, -1.910675048828125, -1.16705322265625, -0.423431396484375, 0.3201904296875, 1.063812255859375, 1.80743408203125, 2.551055908203125, 3.294677734375, 4.038299560546875, 4.78192138671875, 5.525543212890625, 6.2691650390625, 7.012786865234375, 7.75640869140625, 8.500030517578125, 9.24365234375, 9.987274169921875, 10.73089599609375, 11.474517822265625, 12.2181396484375, 12.961761474609375, 13.70538330078125, 14.449005126953125, 15.192626953125, 15.936248779296875, 16.67987060546875, 17.423492431640625, 18.1671142578125, 18.910736083984375, 19.65435791015625, 20.397979736328125, 21.1416015625, 21.885223388671875, 22.62884521484375, 23.372467041015625, 24.1160888671875, 24.859710693359375, 25.60333251953125, 26.346954345703125, 27.090576171875, 27.834197998046875, 28.57781982421875, 29.321441650390625, 30.0650634765625, 30.808685302734375, 31.55230712890625, 32.295928955078125, 33.03955078125, 33.783172607421875, 34.52679443359375, 35.270416259765625, 36.0140380859375, 36.757659912109375, 37.50128173828125, 38.244903564453125, 38.988525390625, 39.732147216796875, 40.47576904296875, 41.219390869140625, 41.9630126953125, 42.706634521484375, 43.45025634765625, 44.193878173828125, 44.9375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 46.0, 727.0, 216.0, 15.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.04730224609375, -60.826637268066406, -57.60597229003906, -54.38530731201172, -51.164642333984375, -47.94397735595703, -44.72331619262695, -41.50265121459961, -38.281986236572266, -35.06132125854492, -31.840656280517578, -28.619993209838867, -25.399328231811523, -22.17866325378418, -18.95800018310547, -15.737335205078125, -12.516670227050781, -9.296005249023438, -6.07534122467041, -2.854677200317383, 0.36598777770996094, 3.5866527557373047, 6.807315826416016, 10.02798080444336, 13.248645782470703, 16.469310760498047, 19.68997573852539, 22.9106388092041, 26.131303787231445, 29.35196876525879, 32.5726318359375, 35.793296813964844, 39.01396179199219, 42.23462677001953, 45.455291748046875, 48.67595672607422, 51.89662170410156, 55.117286682128906, 58.337947845458984, 61.55861282348633, 64.77928161621094, 67.99994659423828, 71.22061157226562, 74.44127655029297, 77.66194152832031, 80.88260650634766, 84.103271484375, 87.32392883300781, 90.54459381103516, 93.7652587890625, 96.98592376708984, 100.20658874511719, 103.42725372314453, 106.64791870117188, 109.86857604980469, 113.08924865722656, 116.30990600585938, 119.53057098388672, 122.75123596191406, 125.9719009399414, 129.19256591796875, 132.41322326660156, 135.63389587402344, 138.85455322265625, 142.07522583007812]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 12.0, 26.0, 23.0, 35.0, 79.0, 135.0, 169.0, 185.0, 141.0, 80.0, 51.0, 29.0, 18.0, 8.0, 10.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.52603149414062, -87.03592681884766, -84.54582214355469, -82.05570983886719, -79.56560516357422, -77.07550048828125, -74.58539581298828, -72.09529113769531, -69.60518646240234, -67.11508178710938, -64.6249771118164, -62.13486862182617, -59.6447639465332, -57.15465545654297, -54.66455078125, -52.17444610595703, -49.6843376159668, -47.19423294067383, -44.704124450683594, -42.214019775390625, -39.723915100097656, -37.23381042480469, -34.74370193481445, -32.253597259521484, -29.763490676879883, -27.27338409423828, -24.783279418945312, -22.29317283630371, -19.80306625366211, -17.31296157836914, -14.822854995727539, -12.33275032043457, -9.842643737792969, -7.352538108825684, -4.86243200302124, -2.372325897216797, 0.11777973175048828, 2.6078853607177734, 5.097991943359375, 7.588096618652344, 10.078203201293945, 12.56830883026123, 15.058414459228516, 17.548521041870117, 20.03862762451172, 22.528732299804688, 25.01883888244629, 27.508943557739258, 29.99905014038086, 32.48915481567383, 34.97926330566406, 37.46936798095703, 39.95947265625, 42.44957733154297, 44.9396858215332, 47.42979049682617, 49.919898986816406, 52.410003662109375, 54.90011215209961, 57.39021682739258, 59.88032150268555, 62.37042999267578, 64.86053466796875, 67.35063934326172, 69.84074401855469]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 12.0, 15.0, 16.0, 17.0, 22.0, 41.0, 69.0, 109.0, 182.0, 339.0, 737.0, 1844.0, 5381.0, 21508.0, 148840.0, 727702.0, 115812.0, 18130.0, 4617.0, 1610.0, 706.0, 356.0, 173.0, 106.0, 69.0, 41.0, 29.0, 20.0, 15.0, 5.0, 10.0, 6.0, 4.0, 7.0, 2.0, 0.0, 2.0], "bins": [-8.5, -8.29974365234375, -8.0994873046875, -7.89923095703125, -7.698974609375, -7.49871826171875, -7.2984619140625, -7.09820556640625, -6.89794921875, -6.69769287109375, -6.4974365234375, -6.29718017578125, -6.096923828125, -5.89666748046875, -5.6964111328125, -5.49615478515625, -5.2958984375, -5.09564208984375, -4.8953857421875, -4.69512939453125, -4.494873046875, -4.29461669921875, -4.0943603515625, -3.89410400390625, -3.69384765625, -3.49359130859375, -3.2933349609375, -3.09307861328125, -2.892822265625, -2.69256591796875, -2.4923095703125, -2.29205322265625, -2.091796875, -1.89154052734375, -1.6912841796875, -1.49102783203125, -1.290771484375, -1.09051513671875, -0.8902587890625, -0.69000244140625, -0.48974609375, -0.28948974609375, -0.0892333984375, 0.11102294921875, 0.311279296875, 0.51153564453125, 0.7117919921875, 0.91204833984375, 1.1123046875, 1.31256103515625, 1.5128173828125, 1.71307373046875, 1.913330078125, 2.11358642578125, 2.3138427734375, 2.51409912109375, 2.71435546875, 2.91461181640625, 3.1148681640625, 3.31512451171875, 3.515380859375, 3.71563720703125, 3.9158935546875, 4.11614990234375, 4.31640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 1.0, 10.0, 12.0, 11.0, 16.0, 28.0, 39.0, 37.0, 55.0, 54.0, 83.0, 68.0, 90.0, 92.0, 73.0, 56.0, 74.0, 43.0, 42.0, 31.0, 16.0, 14.0, 8.0, 11.0, 5.0, 9.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 4.0], "bins": [-6.8828125, -6.72552490234375, -6.5682373046875, -6.41094970703125, -6.253662109375, -6.09637451171875, -5.9390869140625, -5.78179931640625, -5.62451171875, -5.46722412109375, -5.3099365234375, -5.15264892578125, -4.995361328125, -4.83807373046875, -4.6807861328125, -4.52349853515625, -4.3662109375, -4.20892333984375, -4.0516357421875, -3.89434814453125, -3.737060546875, -3.57977294921875, -3.4224853515625, -3.26519775390625, -3.10791015625, -2.95062255859375, -2.7933349609375, -2.63604736328125, -2.478759765625, -2.32147216796875, -2.1641845703125, -2.00689697265625, -1.849609375, -1.69232177734375, -1.5350341796875, -1.37774658203125, -1.220458984375, -1.06317138671875, -0.9058837890625, -0.74859619140625, -0.59130859375, -0.43402099609375, -0.2767333984375, -0.11944580078125, 0.037841796875, 0.19512939453125, 0.3524169921875, 0.50970458984375, 0.6669921875, 0.82427978515625, 0.9815673828125, 1.13885498046875, 1.296142578125, 1.45343017578125, 1.6107177734375, 1.76800537109375, 1.92529296875, 2.08258056640625, 2.2398681640625, 2.39715576171875, 2.554443359375, 2.71173095703125, 2.8690185546875, 3.02630615234375, 3.18359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 11.0, 20.0, 34.0, 73.0, 149.0, 445.0, 1560.0, 360419.0, 683267.0, 1840.0, 437.0, 148.0, 71.0, 29.0, 21.0, 11.0, 7.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.234375, -25.33056640625, -24.4267578125, -23.52294921875, -22.619140625, -21.71533203125, -20.8115234375, -19.90771484375, -19.00390625, -18.10009765625, -17.1962890625, -16.29248046875, -15.388671875, -14.48486328125, -13.5810546875, -12.67724609375, -11.7734375, -10.86962890625, -9.9658203125, -9.06201171875, -8.158203125, -7.25439453125, -6.3505859375, -5.44677734375, -4.54296875, -3.63916015625, -2.7353515625, -1.83154296875, -0.927734375, -0.02392578125, 0.8798828125, 1.78369140625, 2.6875, 3.59130859375, 4.4951171875, 5.39892578125, 6.302734375, 7.20654296875, 8.1103515625, 9.01416015625, 9.91796875, 10.82177734375, 11.7255859375, 12.62939453125, 13.533203125, 14.43701171875, 15.3408203125, 16.24462890625, 17.1484375, 18.05224609375, 18.9560546875, 19.85986328125, 20.763671875, 21.66748046875, 22.5712890625, 23.47509765625, 24.37890625, 25.28271484375, 26.1865234375, 27.09033203125, 27.994140625, 28.89794921875, 29.8017578125, 30.70556640625, 31.609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 14.0, 38.0, 133.0, 226.0, 255.0, 197.0, 94.0, 36.0, 9.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.40625, -33.47802734375, -31.5498046875, -29.62158203125, -27.693359375, -25.76513671875, -23.8369140625, -21.90869140625, -19.98046875, -18.05224609375, -16.1240234375, -14.19580078125, -12.267578125, -10.33935546875, -8.4111328125, -6.48291015625, -4.5546875, -2.62646484375, -0.6982421875, 1.22998046875, 3.158203125, 5.08642578125, 7.0146484375, 8.94287109375, 10.87109375, 12.79931640625, 14.7275390625, 16.65576171875, 18.583984375, 20.51220703125, 22.4404296875, 24.36865234375, 26.296875, 28.22509765625, 30.1533203125, 32.08154296875, 34.009765625, 35.93798828125, 37.8662109375, 39.79443359375, 41.72265625, 43.65087890625, 45.5791015625, 47.50732421875, 49.435546875, 51.36376953125, 53.2919921875, 55.22021484375, 57.1484375, 59.07666015625, 61.0048828125, 62.93310546875, 64.861328125, 66.78955078125, 68.7177734375, 70.64599609375, 72.57421875, 74.50244140625, 76.4306640625, 78.35888671875, 80.287109375, 82.21533203125, 84.1435546875, 86.07177734375, 88.0]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 12.0, 20.0, 41.0, 142.0, 931.0, 1033163.0, 13737.0, 382.0, 79.0, 31.0, 11.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.495849609375, -9.03857421875, -8.581298828125, -8.1240234375, -7.666748046875, -7.20947265625, -6.752197265625, -6.294921875, -5.837646484375, -5.38037109375, -4.923095703125, -4.4658203125, -4.008544921875, -3.55126953125, -3.093994140625, -2.63671875, -2.179443359375, -1.72216796875, -1.264892578125, -0.8076171875, -0.350341796875, 0.10693359375, 0.564208984375, 1.021484375, 1.478759765625, 1.93603515625, 2.393310546875, 2.8505859375, 3.307861328125, 3.76513671875, 4.222412109375, 4.6796875, 5.136962890625, 5.59423828125, 6.051513671875, 6.5087890625, 6.966064453125, 7.42333984375, 7.880615234375, 8.337890625, 8.795166015625, 9.25244140625, 9.709716796875, 10.1669921875, 10.624267578125, 11.08154296875, 11.538818359375, 11.99609375, 12.453369140625, 12.91064453125, 13.367919921875, 13.8251953125, 14.282470703125, 14.73974609375, 15.197021484375, 15.654296875, 16.111572265625, 16.56884765625, 17.026123046875, 17.4833984375, 17.940673828125, 18.39794921875, 18.855224609375, 19.3125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 8.0, 9.0, 17.0, 14.0, 31.0, 29.0, 53.0, 77.0, 114.0, 149.0, 146.0, 93.0, 73.0, 45.0, 35.0, 22.0, 12.0, 13.0, 8.0, 11.0, 6.0, 6.0, 3.0, 2.0, 7.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001894235610961914, -0.00018262676894664764, -0.00017582997679710388, -0.00016903318464756012, -0.00016223639249801636, -0.0001554396003484726, -0.00014864280819892883, -0.00014184601604938507, -0.0001350492238998413, -0.00012825243175029755, -0.00012145563960075378, -0.00011465884745121002, -0.00010786205530166626, -0.0001010652631521225, -9.426847100257874e-05, -8.747167885303497e-05, -8.067488670349121e-05, -7.387809455394745e-05, -6.708130240440369e-05, -6.0284510254859924e-05, -5.348771810531616e-05, -4.66909259557724e-05, -3.989413380622864e-05, -3.3097341656684875e-05, -2.6300549507141113e-05, -1.950375735759735e-05, -1.2706965208053589e-05, -5.910173058509827e-06, 8.866190910339355e-07, 7.683411240577698e-06, 1.448020339012146e-05, 2.1276995539665222e-05, 2.8073787689208984e-05, 3.4870579838752747e-05, 4.166737198829651e-05, 4.846416413784027e-05, 5.526095628738403e-05, 6.20577484369278e-05, 6.885454058647156e-05, 7.565133273601532e-05, 8.244812488555908e-05, 8.924491703510284e-05, 9.60417091846466e-05, 0.00010283850133419037, 0.00010963529348373413, 0.00011643208563327789, 0.00012322887778282166, 0.00013002566993236542, 0.00013682246208190918, 0.00014361925423145294, 0.0001504160463809967, 0.00015721283853054047, 0.00016400963068008423, 0.000170806422829628, 0.00017760321497917175, 0.00018440000712871552, 0.00019119679927825928, 0.00019799359142780304, 0.0002047903835773468, 0.00021158717572689056, 0.00021838396787643433, 0.0002251807600259781, 0.00023197755217552185, 0.0002387743443250656, 0.0002455711364746094]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 7.0, 24.0, 48.0, 166.0, 642.0, 35337.0, 1010495.0, 1487.0, 231.0, 58.0, 32.0, 14.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.28125, -15.8951416015625, -15.509033203125, -15.1229248046875, -14.73681640625, -14.3507080078125, -13.964599609375, -13.5784912109375, -13.1923828125, -12.8062744140625, -12.420166015625, -12.0340576171875, -11.64794921875, -11.2618408203125, -10.875732421875, -10.4896240234375, -10.103515625, -9.7174072265625, -9.331298828125, -8.9451904296875, -8.55908203125, -8.1729736328125, -7.786865234375, -7.4007568359375, -7.0146484375, -6.6285400390625, -6.242431640625, -5.8563232421875, -5.47021484375, -5.0841064453125, -4.697998046875, -4.3118896484375, -3.92578125, -3.5396728515625, -3.153564453125, -2.7674560546875, -2.38134765625, -1.9952392578125, -1.609130859375, -1.2230224609375, -0.8369140625, -0.4508056640625, -0.064697265625, 0.3214111328125, 0.70751953125, 1.0936279296875, 1.479736328125, 1.8658447265625, 2.251953125, 2.6380615234375, 3.024169921875, 3.4102783203125, 3.79638671875, 4.1824951171875, 4.568603515625, 4.9547119140625, 5.3408203125, 5.7269287109375, 6.113037109375, 6.4991455078125, 6.88525390625, 7.2713623046875, 7.657470703125, 8.0435791015625, 8.4296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 28.0, 76.0, 421.0, 367.0, 64.0, 17.0, 12.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -16.0970458984375, -15.694091796875, -15.2911376953125, -14.88818359375, -14.4852294921875, -14.082275390625, -13.6793212890625, -13.2763671875, -12.8734130859375, -12.470458984375, -12.0675048828125, -11.66455078125, -11.2615966796875, -10.858642578125, -10.4556884765625, -10.052734375, -9.6497802734375, -9.246826171875, -8.8438720703125, -8.44091796875, -8.0379638671875, -7.635009765625, -7.2320556640625, -6.8291015625, -6.4261474609375, -6.023193359375, -5.6202392578125, -5.21728515625, -4.8143310546875, -4.411376953125, -4.0084228515625, -3.60546875, -3.2025146484375, -2.799560546875, -2.3966064453125, -1.99365234375, -1.5906982421875, -1.187744140625, -0.7847900390625, -0.3818359375, 0.0211181640625, 0.424072265625, 0.8270263671875, 1.22998046875, 1.6329345703125, 2.035888671875, 2.4388427734375, 2.841796875, 3.2447509765625, 3.647705078125, 4.0506591796875, 4.45361328125, 4.8565673828125, 5.259521484375, 5.6624755859375, 6.0654296875, 6.4683837890625, 6.871337890625, 7.2742919921875, 7.67724609375, 8.0802001953125, 8.483154296875, 8.8861083984375, 9.2890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 7.0, 5.0, 28.0, 156.0, 492.0, 222.0, 60.0, 17.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-256.1046447753906, -250.3303985595703, -244.55615234375, -238.7819061279297, -233.00765991210938, -227.23341369628906, -221.45916748046875, -215.6849365234375, -209.91067504882812, -204.1364288330078, -198.3621826171875, -192.5879364013672, -186.81369018554688, -181.03944396972656, -175.26519775390625, -169.490966796875, -163.7167205810547, -157.94247436523438, -152.16822814941406, -146.39398193359375, -140.61973571777344, -134.84548950195312, -129.07125854492188, -123.29700469970703, -117.52275848388672, -111.7485122680664, -105.9742660522461, -100.20002746582031, -94.42578125, -88.65153503417969, -82.87728881835938, -77.10304260253906, -71.32878875732422, -65.5545425415039, -59.780296325683594, -54.00605392456055, -48.231807708740234, -42.45756149291992, -36.683319091796875, -30.909072875976562, -25.13482666015625, -19.360580444335938, -13.586336135864258, -7.812091827392578, -2.0378456115722656, 3.736400604248047, 9.510643005371094, 15.284889221191406, 21.05913543701172, 26.83338165283203, 32.607627868652344, 38.38187026977539, 44.1561164855957, 49.930362701416016, 55.70460510253906, 61.478851318359375, 67.25309753417969, 73.02734375, 78.80158996582031, 84.57583618164062, 90.35008239746094, 96.12432861328125, 101.89856719970703, 107.67281341552734, 113.44705963134766]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 10.0, 13.0, 13.0, 15.0, 21.0, 25.0, 34.0, 33.0, 44.0, 46.0, 60.0, 72.0, 82.0, 76.0, 66.0, 71.0, 64.0, 43.0, 45.0, 48.0, 31.0, 24.0, 11.0, 17.0, 13.0, 10.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.9471435546875, -77.71564483642578, -73.48414611816406, -69.25264739990234, -65.02114868164062, -60.789649963378906, -56.55815505981445, -52.326656341552734, -48.095157623291016, -43.8636589050293, -39.63216018676758, -35.400665283203125, -31.169164657592773, -26.937665939331055, -22.70616912841797, -18.47467041015625, -14.243171691894531, -10.011672973632812, -5.78017520904541, -1.5486774444580078, 2.682821273803711, 6.91431999206543, 11.145816802978516, 15.377315521240234, 19.608814239501953, 23.840312957763672, 28.07181167602539, 32.303306579589844, 36.53480529785156, 40.76630401611328, 44.997802734375, 49.22930145263672, 53.46080017089844, 57.692298889160156, 61.923797607421875, 66.1552963256836, 70.38679504394531, 74.61829376220703, 78.84979248046875, 83.08128356933594, 87.31278991699219, 91.5442886352539, 95.77578735351562, 100.00728607177734, 104.23878479003906, 108.47028350830078, 112.7017822265625, 116.93327331542969, 121.1647720336914, 125.39627075195312, 129.6277618408203, 133.85926818847656, 138.09075927734375, 142.322265625, 146.5537567138672, 150.78526306152344, 155.01675415039062, 159.2482452392578, 163.47975158691406, 167.71124267578125, 171.9427490234375, 176.1742401123047, 180.40574645996094, 184.63723754882812, 188.86874389648438]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 11.0, 9.0, 7.0, 26.0, 27.0, 47.0, 79.0, 91.0, 144.0, 252.0, 404.0, 733.0, 1210.0, 2190.0, 4264.0, 8955.0, 27393.0, 210128.0, 3373499.0, 496189.0, 44862.0, 12310.0, 5392.0, 2725.0, 1405.0, 796.0, 464.0, 260.0, 147.0, 99.0, 47.0, 34.0, 21.0, 23.0, 9.0, 11.0, 7.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.759765625, -2.66668701171875, -2.5736083984375, -2.48052978515625, -2.387451171875, -2.29437255859375, -2.2012939453125, -2.10821533203125, -2.01513671875, -1.92205810546875, -1.8289794921875, -1.73590087890625, -1.642822265625, -1.54974365234375, -1.4566650390625, -1.36358642578125, -1.2705078125, -1.17742919921875, -1.0843505859375, -0.99127197265625, -0.898193359375, -0.80511474609375, -0.7120361328125, -0.61895751953125, -0.52587890625, -0.43280029296875, -0.3397216796875, -0.24664306640625, -0.153564453125, -0.06048583984375, 0.0325927734375, 0.12567138671875, 0.21875, 0.31182861328125, 0.4049072265625, 0.49798583984375, 0.591064453125, 0.68414306640625, 0.7772216796875, 0.87030029296875, 0.96337890625, 1.05645751953125, 1.1495361328125, 1.24261474609375, 1.335693359375, 1.42877197265625, 1.5218505859375, 1.61492919921875, 1.7080078125, 1.80108642578125, 1.8941650390625, 1.98724365234375, 2.080322265625, 2.17340087890625, 2.2664794921875, 2.35955810546875, 2.45263671875, 2.54571533203125, 2.6387939453125, 2.73187255859375, 2.824951171875, 2.91802978515625, 3.0111083984375, 3.10418701171875, 3.197265625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 6.0, 7.0, 9.0, 11.0, 8.0, 10.0, 16.0, 12.0, 27.0, 34.0, 33.0, 24.0, 44.0, 39.0, 46.0, 53.0, 59.0, 56.0, 57.0, 58.0, 60.0, 46.0, 38.0, 45.0, 32.0, 27.0, 19.0, 23.0, 14.0, 11.0, 16.0, 14.0, 14.0, 6.0, 4.0, 4.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.873046875, -2.78851318359375, -2.7039794921875, -2.61944580078125, -2.534912109375, -2.45037841796875, -2.3658447265625, -2.28131103515625, -2.19677734375, -2.11224365234375, -2.0277099609375, -1.94317626953125, -1.858642578125, -1.77410888671875, -1.6895751953125, -1.60504150390625, -1.5205078125, -1.43597412109375, -1.3514404296875, -1.26690673828125, -1.182373046875, -1.09783935546875, -1.0133056640625, -0.92877197265625, -0.84423828125, -0.75970458984375, -0.6751708984375, -0.59063720703125, -0.506103515625, -0.42156982421875, -0.3370361328125, -0.25250244140625, -0.16796875, -0.08343505859375, 0.0010986328125, 0.08563232421875, 0.170166015625, 0.25469970703125, 0.3392333984375, 0.42376708984375, 0.50830078125, 0.59283447265625, 0.6773681640625, 0.76190185546875, 0.846435546875, 0.93096923828125, 1.0155029296875, 1.10003662109375, 1.1845703125, 1.26910400390625, 1.3536376953125, 1.43817138671875, 1.522705078125, 1.60723876953125, 1.6917724609375, 1.77630615234375, 1.86083984375, 1.94537353515625, 2.0299072265625, 2.11444091796875, 2.198974609375, 2.28350830078125, 2.3680419921875, 2.45257568359375, 2.537109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 25.0, 55.0, 142.0, 600.0, 49322.0, 4141759.0, 1955.0, 240.0, 91.0, 44.0, 23.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.625, -26.766845703125, -25.90869140625, -25.050537109375, -24.1923828125, -23.334228515625, -22.47607421875, -21.617919921875, -20.759765625, -19.901611328125, -19.04345703125, -18.185302734375, -17.3271484375, -16.468994140625, -15.61083984375, -14.752685546875, -13.89453125, -13.036376953125, -12.17822265625, -11.320068359375, -10.4619140625, -9.603759765625, -8.74560546875, -7.887451171875, -7.029296875, -6.171142578125, -5.31298828125, -4.454833984375, -3.5966796875, -2.738525390625, -1.88037109375, -1.022216796875, -0.1640625, 0.694091796875, 1.55224609375, 2.410400390625, 3.2685546875, 4.126708984375, 4.98486328125, 5.843017578125, 6.701171875, 7.559326171875, 8.41748046875, 9.275634765625, 10.1337890625, 10.991943359375, 11.85009765625, 12.708251953125, 13.56640625, 14.424560546875, 15.28271484375, 16.140869140625, 16.9990234375, 17.857177734375, 18.71533203125, 19.573486328125, 20.431640625, 21.289794921875, 22.14794921875, 23.006103515625, 23.8642578125, 24.722412109375, 25.58056640625, 26.438720703125, 27.296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 13.0, 6.0, 12.0, 26.0, 38.0, 73.0, 239.0, 2233.0, 1199.0, 114.0, 40.0, 24.0, 22.0, 13.0, 6.0, 4.0, 7.0, 2.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.33203125, -6.98052978515625, -6.6290283203125, -6.27752685546875, -5.926025390625, -5.57452392578125, -5.2230224609375, -4.87152099609375, -4.52001953125, -4.16851806640625, -3.8170166015625, -3.46551513671875, -3.114013671875, -2.76251220703125, -2.4110107421875, -2.05950927734375, -1.7080078125, -1.35650634765625, -1.0050048828125, -0.65350341796875, -0.302001953125, 0.04949951171875, 0.4010009765625, 0.75250244140625, 1.10400390625, 1.45550537109375, 1.8070068359375, 2.15850830078125, 2.510009765625, 2.86151123046875, 3.2130126953125, 3.56451416015625, 3.916015625, 4.26751708984375, 4.6190185546875, 4.97052001953125, 5.322021484375, 5.67352294921875, 6.0250244140625, 6.37652587890625, 6.72802734375, 7.07952880859375, 7.4310302734375, 7.78253173828125, 8.134033203125, 8.48553466796875, 8.8370361328125, 9.18853759765625, 9.5400390625, 9.89154052734375, 10.2430419921875, 10.59454345703125, 10.946044921875, 11.29754638671875, 11.6490478515625, 12.00054931640625, 12.35205078125, 12.70355224609375, 13.0550537109375, 13.40655517578125, 13.758056640625, 14.10955810546875, 14.4610595703125, 14.81256103515625, 15.1640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 8.0, 10.0, 13.0, 14.0, 33.0, 74.0, 158.0, 280.0, 220.0, 120.0, 35.0, 12.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.198890686035156, -51.682254791259766, -50.165618896484375, -48.648983001708984, -47.132347106933594, -45.6157112121582, -44.09907531738281, -42.582435607910156, -41.06580352783203, -39.54916763305664, -38.03253173828125, -36.51589584350586, -34.99925994873047, -33.48262405395508, -31.965986251831055, -30.449350357055664, -28.93271255493164, -27.41607666015625, -25.89944076538086, -24.38280487060547, -22.866168975830078, -21.349533081054688, -19.832895278930664, -18.316259384155273, -16.799623489379883, -15.282987594604492, -13.766351699829102, -12.249714851379395, -10.733078956604004, -9.216443061828613, -7.699806213378906, -6.183170318603516, -4.666538238525391, -3.149902105331421, -1.6332659721374512, -0.11662960052490234, 1.4000062942504883, 2.916642189025879, 4.433279037475586, 5.949914932250977, 7.466550827026367, 8.983186721801758, 10.499822616577148, 12.016459465026855, 13.533095359802246, 15.049731254577637, 16.566368103027344, 18.083003997802734, 19.599639892578125, 21.116275787353516, 22.632911682128906, 24.149547576904297, 25.666183471679688, 27.182819366455078, 28.6994571685791, 30.216093063354492, 31.732728958129883, 33.249366760253906, 34.7660026550293, 36.28263854980469, 37.79927444458008, 39.31591033935547, 40.83254623413086, 42.34918212890625, 43.86581802368164]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 12.0, 11.0, 13.0, 12.0, 27.0, 27.0, 27.0, 43.0, 40.0, 48.0, 36.0, 50.0, 53.0, 56.0, 56.0, 42.0, 55.0, 49.0, 40.0, 43.0, 44.0, 38.0, 34.0, 19.0, 22.0, 12.0, 11.0, 10.0, 6.0, 8.0, 10.0, 4.0, 7.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.131750106811523, -24.353090286254883, -23.574432373046875, -22.795772552490234, -22.017112731933594, -21.238452911376953, -20.459794998168945, -19.681135177612305, -18.902477264404297, -18.123817443847656, -17.34515953063965, -16.566499710083008, -15.787839889526367, -15.009181022644043, -14.230522155761719, -13.451862335205078, -12.673202514648438, -11.894543647766113, -11.115883827209473, -10.337224960327148, -9.558565139770508, -8.779906272888184, -8.00124740600586, -7.222588062286377, -6.4439287185668945, -5.665269374847412, -4.88661003112793, -4.1079511642456055, -3.329291820526123, -2.5506324768066406, -1.7719736099243164, -0.993314266204834, -0.21465301513671875, 0.5640062093734741, 1.342665433883667, 2.1213245391845703, 2.8999838829040527, 3.678643226623535, 4.457302093505859, 5.235961437225342, 6.014620780944824, 6.793280124664307, 7.571939468383789, 8.350598335266113, 9.129257202148438, 9.907917022705078, 10.686575889587402, 11.465234756469727, 12.243894577026367, 13.022553443908691, 13.801213264465332, 14.579872131347656, 15.358531951904297, 16.137191772460938, 16.915849685668945, 17.694509506225586, 18.473167419433594, 19.251827239990234, 20.030485153198242, 20.809144973754883, 21.587804794311523, 22.36646270751953, 23.145122528076172, 23.923782348632812, 24.702442169189453]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 7.0, 8.0, 14.0, 21.0, 44.0, 46.0, 54.0, 95.0, 153.0, 244.0, 376.0, 544.0, 991.0, 1625.0, 2797.0, 4769.0, 9001.0, 16655.0, 34067.0, 74287.0, 170938.0, 323030.0, 222401.0, 96970.0, 43443.0, 21037.0, 10959.0, 5844.0, 3223.0, 1899.0, 1070.0, 652.0, 435.0, 291.0, 206.0, 114.0, 82.0, 41.0, 28.0, 27.0, 19.0, 8.0, 8.0, 7.0, 5.0, 5.0, 1.0, 5.0, 3.0, 3.0], "bins": [-2.12109375, -2.061614990234375, -2.00213623046875, -1.942657470703125, -1.8831787109375, -1.823699951171875, -1.76422119140625, -1.704742431640625, -1.645263671875, -1.585784912109375, -1.52630615234375, -1.466827392578125, -1.4073486328125, -1.347869873046875, -1.28839111328125, -1.228912353515625, -1.16943359375, -1.109954833984375, -1.05047607421875, -0.990997314453125, -0.9315185546875, -0.872039794921875, -0.81256103515625, -0.753082275390625, -0.693603515625, -0.634124755859375, -0.57464599609375, -0.515167236328125, -0.4556884765625, -0.396209716796875, -0.33673095703125, -0.277252197265625, -0.2177734375, -0.158294677734375, -0.09881591796875, -0.039337158203125, 0.0201416015625, 0.079620361328125, 0.13909912109375, 0.198577880859375, 0.258056640625, 0.317535400390625, 0.37701416015625, 0.436492919921875, 0.4959716796875, 0.555450439453125, 0.61492919921875, 0.674407958984375, 0.73388671875, 0.793365478515625, 0.85284423828125, 0.912322998046875, 0.9718017578125, 1.031280517578125, 1.09075927734375, 1.150238037109375, 1.209716796875, 1.269195556640625, 1.32867431640625, 1.388153076171875, 1.4476318359375, 1.507110595703125, 1.56658935546875, 1.626068115234375, 1.685546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 5.0, 2.0, 8.0, 11.0, 12.0, 16.0, 8.0, 17.0, 10.0, 26.0, 26.0, 20.0, 20.0, 37.0, 39.0, 46.0, 45.0, 31.0, 37.0, 53.0, 41.0, 46.0, 55.0, 40.0, 43.0, 40.0, 42.0, 26.0, 31.0, 26.0, 15.0, 17.0, 20.0, 11.0, 15.0, 12.0, 8.0, 4.0, 4.0, 10.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-2.265625, -2.19573974609375, -2.1258544921875, -2.05596923828125, -1.986083984375, -1.91619873046875, -1.8463134765625, -1.77642822265625, -1.70654296875, -1.63665771484375, -1.5667724609375, -1.49688720703125, -1.427001953125, -1.35711669921875, -1.2872314453125, -1.21734619140625, -1.1474609375, -1.07757568359375, -1.0076904296875, -0.93780517578125, -0.867919921875, -0.79803466796875, -0.7281494140625, -0.65826416015625, -0.58837890625, -0.51849365234375, -0.4486083984375, -0.37872314453125, -0.308837890625, -0.23895263671875, -0.1690673828125, -0.09918212890625, -0.029296875, 0.04058837890625, 0.1104736328125, 0.18035888671875, 0.250244140625, 0.32012939453125, 0.3900146484375, 0.45989990234375, 0.52978515625, 0.59967041015625, 0.6695556640625, 0.73944091796875, 0.809326171875, 0.87921142578125, 0.9490966796875, 1.01898193359375, 1.0888671875, 1.15875244140625, 1.2286376953125, 1.29852294921875, 1.368408203125, 1.43829345703125, 1.5081787109375, 1.57806396484375, 1.64794921875, 1.71783447265625, 1.7877197265625, 1.85760498046875, 1.927490234375, 1.99737548828125, 2.0672607421875, 2.13714599609375, 2.20703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 11.0, 12.0, 9.0, 25.0, 40.0, 67.0, 81.0, 135.0, 213.0, 388.0, 730.0, 1928.0, 9508.0, 412215.0, 607978.0, 11285.0, 2070.0, 807.0, 438.0, 243.0, 136.0, 79.0, 45.0, 36.0, 22.0, 17.0, 10.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0], "bins": [-13.6484375, -13.32373046875, -12.9990234375, -12.67431640625, -12.349609375, -12.02490234375, -11.7001953125, -11.37548828125, -11.05078125, -10.72607421875, -10.4013671875, -10.07666015625, -9.751953125, -9.42724609375, -9.1025390625, -8.77783203125, -8.453125, -8.12841796875, -7.8037109375, -7.47900390625, -7.154296875, -6.82958984375, -6.5048828125, -6.18017578125, -5.85546875, -5.53076171875, -5.2060546875, -4.88134765625, -4.556640625, -4.23193359375, -3.9072265625, -3.58251953125, -3.2578125, -2.93310546875, -2.6083984375, -2.28369140625, -1.958984375, -1.63427734375, -1.3095703125, -0.98486328125, -0.66015625, -0.33544921875, -0.0107421875, 0.31396484375, 0.638671875, 0.96337890625, 1.2880859375, 1.61279296875, 1.9375, 2.26220703125, 2.5869140625, 2.91162109375, 3.236328125, 3.56103515625, 3.8857421875, 4.21044921875, 4.53515625, 4.85986328125, 5.1845703125, 5.50927734375, 5.833984375, 6.15869140625, 6.4833984375, 6.80810546875, 7.1328125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 6.0, 12.0, 6.0, 11.0, 8.0, 4.0, 17.0, 26.0, 27.0, 32.0, 42.0, 46.0, 56.0, 60.0, 63.0, 52.0, 57.0, 58.0, 56.0, 57.0, 64.0, 42.0, 40.0, 40.0, 24.0, 24.0, 18.0, 15.0, 9.0, 8.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.1484375, -14.7421875, -14.3359375, -13.9296875, -13.5234375, -13.1171875, -12.7109375, -12.3046875, -11.8984375, -11.4921875, -11.0859375, -10.6796875, -10.2734375, -9.8671875, -9.4609375, -9.0546875, -8.6484375, -8.2421875, -7.8359375, -7.4296875, -7.0234375, -6.6171875, -6.2109375, -5.8046875, -5.3984375, -4.9921875, -4.5859375, -4.1796875, -3.7734375, -3.3671875, -2.9609375, -2.5546875, -2.1484375, -1.7421875, -1.3359375, -0.9296875, -0.5234375, -0.1171875, 0.2890625, 0.6953125, 1.1015625, 1.5078125, 1.9140625, 2.3203125, 2.7265625, 3.1328125, 3.5390625, 3.9453125, 4.3515625, 4.7578125, 5.1640625, 5.5703125, 5.9765625, 6.3828125, 6.7890625, 7.1953125, 7.6015625, 8.0078125, 8.4140625, 8.8203125, 9.2265625, 9.6328125, 10.0390625, 10.4453125, 10.8515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 9.0, 18.0, 20.0, 23.0, 35.0, 47.0, 97.0, 179.0, 347.0, 1081.0, 4270.0, 40886.0, 945830.0, 49286.0, 4503.0, 1054.0, 403.0, 189.0, 89.0, 55.0, 47.0, 22.0, 6.0, 14.0, 6.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.896484375, -2.812591552734375, -2.72869873046875, -2.644805908203125, -2.5609130859375, -2.477020263671875, -2.39312744140625, -2.309234619140625, -2.225341796875, -2.141448974609375, -2.05755615234375, -1.973663330078125, -1.8897705078125, -1.805877685546875, -1.72198486328125, -1.638092041015625, -1.55419921875, -1.470306396484375, -1.38641357421875, -1.302520751953125, -1.2186279296875, -1.134735107421875, -1.05084228515625, -0.966949462890625, -0.883056640625, -0.799163818359375, -0.71527099609375, -0.631378173828125, -0.5474853515625, -0.463592529296875, -0.37969970703125, -0.295806884765625, -0.2119140625, -0.128021240234375, -0.04412841796875, 0.039764404296875, 0.1236572265625, 0.207550048828125, 0.29144287109375, 0.375335693359375, 0.459228515625, 0.543121337890625, 0.62701416015625, 0.710906982421875, 0.7947998046875, 0.878692626953125, 0.96258544921875, 1.046478271484375, 1.13037109375, 1.214263916015625, 1.29815673828125, 1.382049560546875, 1.4659423828125, 1.549835205078125, 1.63372802734375, 1.717620849609375, 1.801513671875, 1.885406494140625, 1.96929931640625, 2.053192138671875, 2.1370849609375, 2.220977783203125, 2.30487060546875, 2.388763427734375, 2.47265625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 12.0, 12.0, 16.0, 24.0, 32.0, 46.0, 49.0, 110.0, 125.0, 146.0, 120.0, 76.0, 77.0, 48.0, 19.0, 26.0, 18.0, 9.0, 8.0, 8.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028324127197265625, -0.00027640722692012787, -0.0002695731818675995, -0.0002627391368150711, -0.0002559050917625427, -0.00024907104671001434, -0.00024223700165748596, -0.00023540295660495758, -0.0002285689115524292, -0.00022173486649990082, -0.00021490082144737244, -0.00020806677639484406, -0.00020123273134231567, -0.0001943986862897873, -0.0001875646412372589, -0.00018073059618473053, -0.00017389655113220215, -0.00016706250607967377, -0.00016022846102714539, -0.000153394415974617, -0.00014656037092208862, -0.00013972632586956024, -0.00013289228081703186, -0.00012605823576450348, -0.0001192241907119751, -0.00011239014565944672, -0.00010555610060691833, -9.872205555438995e-05, -9.188801050186157e-05, -8.505396544933319e-05, -7.821992039680481e-05, -7.138587534427643e-05, -6.455183029174805e-05, -5.7717785239219666e-05, -5.0883740186691284e-05, -4.40496951341629e-05, -3.721565008163452e-05, -3.038160502910614e-05, -2.354755997657776e-05, -1.6713514924049377e-05, -9.879469871520996e-06, -3.0454248189926147e-06, 3.7886202335357666e-06, 1.0622665286064148e-05, 1.745671033859253e-05, 2.429075539112091e-05, 3.112480044364929e-05, 3.795884549617767e-05, 4.4792890548706055e-05, 5.1626935601234436e-05, 5.846098065376282e-05, 6.52950257062912e-05, 7.212907075881958e-05, 7.896311581134796e-05, 8.579716086387634e-05, 9.263120591640472e-05, 9.94652509689331e-05, 0.00010629929602146149, 0.00011313334107398987, 0.00011996738612651825, 0.00012680143117904663, 0.000133635476231575, 0.0001404695212841034, 0.00014730356633663177, 0.00015413761138916016]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 13.0, 27.0, 27.0, 50.0, 85.0, 178.0, 379.0, 871.0, 3369.0, 31457.0, 954189.0, 51844.0, 4097.0, 1115.0, 408.0, 189.0, 116.0, 43.0, 27.0, 20.0, 11.0, 11.0, 6.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.330078125, -3.233734130859375, -3.13739013671875, -3.041046142578125, -2.9447021484375, -2.848358154296875, -2.75201416015625, -2.655670166015625, -2.559326171875, -2.462982177734375, -2.36663818359375, -2.270294189453125, -2.1739501953125, -2.077606201171875, -1.98126220703125, -1.884918212890625, -1.78857421875, -1.692230224609375, -1.59588623046875, -1.499542236328125, -1.4031982421875, -1.306854248046875, -1.21051025390625, -1.114166259765625, -1.017822265625, -0.921478271484375, -0.82513427734375, -0.728790283203125, -0.6324462890625, -0.536102294921875, -0.43975830078125, -0.343414306640625, -0.2470703125, -0.150726318359375, -0.05438232421875, 0.041961669921875, 0.1383056640625, 0.234649658203125, 0.33099365234375, 0.427337646484375, 0.523681640625, 0.620025634765625, 0.71636962890625, 0.812713623046875, 0.9090576171875, 1.005401611328125, 1.10174560546875, 1.198089599609375, 1.29443359375, 1.390777587890625, 1.48712158203125, 1.583465576171875, 1.6798095703125, 1.776153564453125, 1.87249755859375, 1.968841552734375, 2.065185546875, 2.161529541015625, 2.25787353515625, 2.354217529296875, 2.4505615234375, 2.546905517578125, 2.64324951171875, 2.739593505859375, 2.8359375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 13.0, 14.0, 15.0, 23.0, 36.0, 45.0, 51.0, 67.0, 72.0, 81.0, 81.0, 76.0, 76.0, 71.0, 59.0, 49.0, 35.0, 28.0, 28.0, 14.0, 13.0, 7.0, 4.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8017578125, -1.7408905029296875, -1.680023193359375, -1.6191558837890625, -1.55828857421875, -1.4974212646484375, -1.436553955078125, -1.3756866455078125, -1.3148193359375, -1.2539520263671875, -1.193084716796875, -1.1322174072265625, -1.07135009765625, -1.0104827880859375, -0.949615478515625, -0.8887481689453125, -0.827880859375, -0.7670135498046875, -0.706146240234375, -0.6452789306640625, -0.58441162109375, -0.5235443115234375, -0.462677001953125, -0.4018096923828125, -0.3409423828125, -0.2800750732421875, -0.219207763671875, -0.1583404541015625, -0.09747314453125, -0.0366058349609375, 0.024261474609375, 0.0851287841796875, 0.14599609375, 0.2068634033203125, 0.267730712890625, 0.3285980224609375, 0.38946533203125, 0.4503326416015625, 0.511199951171875, 0.5720672607421875, 0.6329345703125, 0.6938018798828125, 0.754669189453125, 0.8155364990234375, 0.87640380859375, 0.9372711181640625, 0.998138427734375, 1.0590057373046875, 1.119873046875, 1.1807403564453125, 1.241607666015625, 1.3024749755859375, 1.36334228515625, 1.4242095947265625, 1.485076904296875, 1.5459442138671875, 1.6068115234375, 1.6676788330078125, 1.728546142578125, 1.7894134521484375, 1.85028076171875, 1.9111480712890625, 1.972015380859375, 2.0328826904296875, 2.09375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 21.0, 141.0, 650.0, 170.0, 14.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.50665283203125, -45.238956451416016, -40.97126007080078, -36.70356369018555, -32.43586730957031, -28.168170928955078, -23.900474548339844, -19.63277816772461, -15.365081787109375, -11.09738540649414, -6.829689025878906, -2.561992645263672, 1.7057037353515625, 5.973400115966797, 10.241096496582031, 14.508792877197266, 18.7764892578125, 23.044185638427734, 27.31188201904297, 31.579578399658203, 35.84727478027344, 40.11497116088867, 44.382667541503906, 48.65036392211914, 52.918060302734375, 57.18575668334961, 61.453453063964844, 65.72114562988281, 69.98884582519531, 74.25654602050781, 78.52423858642578, 82.79193115234375, 87.05961608886719, 91.32731628417969, 95.59500885009766, 99.86270141601562, 104.13040161132812, 108.39810180664062, 112.6657943725586, 116.93348693847656, 121.20118713378906, 125.46888732910156, 129.736572265625, 134.0042724609375, 138.27197265625, 142.5396728515625, 146.807373046875, 151.07505798339844, 155.34275817871094, 159.61045837402344, 163.87814331054688, 168.14584350585938, 172.41354370117188, 176.68124389648438, 180.94894409179688, 185.2166290283203, 189.4843292236328, 193.7520294189453, 198.01971435546875, 202.28741455078125, 206.55511474609375, 210.82281494140625, 215.09051513671875, 219.3582000732422, 223.6259002685547]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 12.0, 17.0, 20.0, 27.0, 31.0, 31.0, 40.0, 53.0, 56.0, 62.0, 77.0, 81.0, 73.0, 59.0, 54.0, 64.0, 54.0, 35.0, 22.0, 29.0, 16.0, 7.0, 13.0, 13.0, 9.0, 10.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.91963195800781, -62.166988372802734, -60.41434860229492, -58.661705017089844, -56.909061431884766, -55.15641784667969, -53.403778076171875, -51.6511344909668, -49.89849090576172, -48.14584732055664, -46.39320755004883, -44.64056396484375, -42.88792037963867, -41.135276794433594, -39.38263702392578, -37.6299934387207, -35.87735366821289, -34.12471008300781, -32.3720703125, -30.619426727294922, -28.866783142089844, -27.1141414642334, -25.361499786376953, -23.608856201171875, -21.85621452331543, -20.103572845458984, -18.350929260253906, -16.59828758239746, -14.8456449508667, -13.093002319335938, -11.340360641479492, -9.58771800994873, -7.835079193115234, -6.082436561584473, -4.329794406890869, -2.5771522521972656, -0.8245096206665039, 0.9281330108642578, 2.680774688720703, 4.433417320251465, 6.186059951782227, 7.938702583312988, 9.69134521484375, 11.443986892700195, 13.196629524230957, 14.949272155761719, 16.701913833618164, 18.45455551147461, 20.207199096679688, 21.959840774536133, 23.71248435974121, 25.465126037597656, 27.217769622802734, 28.97041130065918, 30.723052978515625, 32.4756965637207, 34.22834014892578, 35.98098373413086, 37.73362350463867, 39.48626708984375, 41.23891067504883, 42.991554260253906, 44.74419403076172, 46.4968376159668, 48.24947738647461]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 8.0, 4.0, 12.0, 14.0, 9.0, 15.0, 27.0, 45.0, 47.0, 63.0, 94.0, 132.0, 185.0, 476.0, 3225.0, 2468854.0, 1716041.0, 3918.0, 510.0, 190.0, 119.0, 74.0, 55.0, 45.0, 31.0, 18.0, 23.0, 13.0, 9.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.75, -13.3201904296875, -12.890380859375, -12.4605712890625, -12.03076171875, -11.6009521484375, -11.171142578125, -10.7413330078125, -10.3115234375, -9.8817138671875, -9.451904296875, -9.0220947265625, -8.59228515625, -8.1624755859375, -7.732666015625, -7.3028564453125, -6.873046875, -6.4432373046875, -6.013427734375, -5.5836181640625, -5.15380859375, -4.7239990234375, -4.294189453125, -3.8643798828125, -3.4345703125, -3.0047607421875, -2.574951171875, -2.1451416015625, -1.71533203125, -1.2855224609375, -0.855712890625, -0.4259033203125, 0.00390625, 0.4337158203125, 0.863525390625, 1.2933349609375, 1.72314453125, 2.1529541015625, 2.582763671875, 3.0125732421875, 3.4423828125, 3.8721923828125, 4.302001953125, 4.7318115234375, 5.16162109375, 5.5914306640625, 6.021240234375, 6.4510498046875, 6.880859375, 7.3106689453125, 7.740478515625, 8.1702880859375, 8.60009765625, 9.0299072265625, 9.459716796875, 9.8895263671875, 10.3193359375, 10.7491455078125, 11.178955078125, 11.6087646484375, 12.03857421875, 12.4683837890625, 12.898193359375, 13.3280029296875, 13.7578125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 15.0, 34.0, 43.0, 56.0, 104.0, 125.0, 136.0, 150.0, 118.0, 71.0, 60.0, 41.0, 24.0, 11.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -9.1396484375, -8.935546875, -8.7314453125, -8.52734375, -8.3232421875, -8.119140625, -7.9150390625, -7.7109375, -7.5068359375, -7.302734375, -7.0986328125, -6.89453125, -6.6904296875, -6.486328125, -6.2822265625, -6.078125, -5.8740234375, -5.669921875, -5.4658203125, -5.26171875, -5.0576171875, -4.853515625, -4.6494140625, -4.4453125, -4.2412109375, -4.037109375, -3.8330078125, -3.62890625, -3.4248046875, -3.220703125, -3.0166015625, -2.8125, -2.6083984375, -2.404296875, -2.2001953125, -1.99609375, -1.7919921875, -1.587890625, -1.3837890625, -1.1796875, -0.9755859375, -0.771484375, -0.5673828125, -0.36328125, -0.1591796875, 0.044921875, 0.2490234375, 0.453125, 0.6572265625, 0.861328125, 1.0654296875, 1.26953125, 1.4736328125, 1.677734375, 1.8818359375, 2.0859375, 2.2900390625, 2.494140625, 2.6982421875, 2.90234375, 3.1064453125, 3.310546875, 3.5146484375, 3.71875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 14.0, 25.0, 47.0, 58.0, 77.0, 315.0, 61885.0, 4131003.0, 472.0, 137.0, 89.0, 75.0, 43.0, 21.0, 12.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.518798828125, -29.30322265625, -28.087646484375, -26.8720703125, -25.656494140625, -24.44091796875, -23.225341796875, -22.009765625, -20.794189453125, -19.57861328125, -18.363037109375, -17.1474609375, -15.931884765625, -14.71630859375, -13.500732421875, -12.28515625, -11.069580078125, -9.85400390625, -8.638427734375, -7.4228515625, -6.207275390625, -4.99169921875, -3.776123046875, -2.560546875, -1.344970703125, -0.12939453125, 1.086181640625, 2.3017578125, 3.517333984375, 4.73291015625, 5.948486328125, 7.1640625, 8.379638671875, 9.59521484375, 10.810791015625, 12.0263671875, 13.241943359375, 14.45751953125, 15.673095703125, 16.888671875, 18.104248046875, 19.31982421875, 20.535400390625, 21.7509765625, 22.966552734375, 24.18212890625, 25.397705078125, 26.61328125, 27.828857421875, 29.04443359375, 30.260009765625, 31.4755859375, 32.691162109375, 33.90673828125, 35.122314453125, 36.337890625, 37.553466796875, 38.76904296875, 39.984619140625, 41.2001953125, 42.415771484375, 43.63134765625, 44.846923828125, 46.0625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 14.0, 20.0, 88.0, 3067.0, 805.0, 59.0, 12.0, 11.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.260498046875, -9.56787109375, -8.875244140625, -8.1826171875, -7.489990234375, -6.79736328125, -6.104736328125, -5.412109375, -4.719482421875, -4.02685546875, -3.334228515625, -2.6416015625, -1.948974609375, -1.25634765625, -0.563720703125, 0.12890625, 0.821533203125, 1.51416015625, 2.206787109375, 2.8994140625, 3.592041015625, 4.28466796875, 4.977294921875, 5.669921875, 6.362548828125, 7.05517578125, 7.747802734375, 8.4404296875, 9.133056640625, 9.82568359375, 10.518310546875, 11.2109375, 11.903564453125, 12.59619140625, 13.288818359375, 13.9814453125, 14.674072265625, 15.36669921875, 16.059326171875, 16.751953125, 17.444580078125, 18.13720703125, 18.829833984375, 19.5224609375, 20.215087890625, 20.90771484375, 21.600341796875, 22.29296875, 22.985595703125, 23.67822265625, 24.370849609375, 25.0634765625, 25.756103515625, 26.44873046875, 27.141357421875, 27.833984375, 28.526611328125, 29.21923828125, 29.911865234375, 30.6044921875, 31.297119140625, 31.98974609375, 32.682373046875, 33.375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 13.0, 21.0, 47.0, 148.0, 332.0, 260.0, 103.0, 39.0, 19.0, 8.0, 5.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.54374313354492, -59.61746597290039, -57.69118881225586, -55.764915466308594, -53.83863830566406, -51.91236114501953, -49.986083984375, -48.05980682373047, -46.13352966308594, -44.207252502441406, -42.280975341796875, -40.354698181152344, -38.42842483520508, -36.50214767456055, -34.575870513916016, -32.649593353271484, -30.723318099975586, -28.797040939331055, -26.870765686035156, -24.944488525390625, -23.018211364746094, -21.091934204101562, -19.165658950805664, -17.239381790161133, -15.313105583190918, -13.386829376220703, -11.460552215576172, -9.534276008605957, -7.607999324798584, -5.681722640991211, -3.755446434020996, -1.8291692733764648, 0.09710693359375, 2.023383617401123, 3.949660062789917, 5.875936508178711, 7.802213191986084, 9.728489875793457, 11.654766082763672, 13.581043243408203, 15.507319450378418, 17.433595657348633, 19.359872817993164, 21.286148071289062, 23.212425231933594, 25.138702392578125, 27.064979553222656, 28.991256713867188, 30.917531967163086, 32.843807220458984, 34.770084381103516, 36.69636154174805, 38.62263870239258, 40.54891586303711, 42.475189208984375, 44.401466369628906, 46.32774353027344, 48.25402069091797, 50.1802978515625, 52.10657501220703, 54.0328483581543, 55.95912551879883, 57.88540267944336, 59.81167984008789, 61.73795700073242]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 8.0, 14.0, 8.0, 12.0, 13.0, 30.0, 40.0, 48.0, 58.0, 47.0, 56.0, 69.0, 69.0, 84.0, 65.0, 57.0, 49.0, 53.0, 44.0, 35.0, 30.0, 19.0, 24.0, 21.0, 11.0, 12.0, 8.0, 3.0, 6.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.435894012451172, -25.313499450683594, -24.19110679626465, -23.06871223449707, -21.946319580078125, -20.823925018310547, -19.70153045654297, -18.57913589477539, -17.456743240356445, -16.334348678588867, -15.211956024169922, -14.089561462402344, -12.967167854309082, -11.84477424621582, -10.722379684448242, -9.59998607635498, -8.477592468261719, -7.355198860168457, -6.232804775238037, -5.110410690307617, -3.9880170822143555, -2.8656234741210938, -1.7432293891906738, -0.6208353042602539, 0.5015583038330078, 1.6239521503448486, 2.7463459968566895, 3.8687398433685303, 4.991133689880371, 6.113527297973633, 7.235921382904053, 8.358315467834473, 9.480705261230469, 10.60309886932373, 11.725492477416992, 12.84788703918457, 13.970280647277832, 15.092674255371094, 16.215068817138672, 17.33746337890625, 18.459856033325195, 19.582250595092773, 20.70464324951172, 21.827037811279297, 22.949432373046875, 24.07182502746582, 25.1942195892334, 26.316612243652344, 27.439006805419922, 28.5614013671875, 29.683794021606445, 30.806188583374023, 31.92858123779297, 33.05097579956055, 34.173370361328125, 35.2957649230957, 36.41815948486328, 37.54055404663086, 38.66294860839844, 39.78533935546875, 40.90773391723633, 42.030128479003906, 43.152523040771484, 44.27491760253906, 45.397308349609375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 12.0, 14.0, 26.0, 21.0, 57.0, 65.0, 101.0, 158.0, 224.0, 343.0, 583.0, 953.0, 1637.0, 2937.0, 5598.0, 12571.0, 30210.0, 82537.0, 258010.0, 413011.0, 150723.0, 50925.0, 19540.0, 8673.0, 4078.0, 2194.0, 1261.0, 789.0, 424.0, 303.0, 171.0, 121.0, 88.0, 67.0, 41.0, 27.0, 20.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.8392333984375, -2.735107421875, -2.6309814453125, -2.52685546875, -2.4227294921875, -2.318603515625, -2.2144775390625, -2.1103515625, -2.0062255859375, -1.902099609375, -1.7979736328125, -1.69384765625, -1.5897216796875, -1.485595703125, -1.3814697265625, -1.27734375, -1.1732177734375, -1.069091796875, -0.9649658203125, -0.86083984375, -0.7567138671875, -0.652587890625, -0.5484619140625, -0.4443359375, -0.3402099609375, -0.236083984375, -0.1319580078125, -0.02783203125, 0.0762939453125, 0.180419921875, 0.2845458984375, 0.388671875, 0.4927978515625, 0.596923828125, 0.7010498046875, 0.80517578125, 0.9093017578125, 1.013427734375, 1.1175537109375, 1.2216796875, 1.3258056640625, 1.429931640625, 1.5340576171875, 1.63818359375, 1.7423095703125, 1.846435546875, 1.9505615234375, 2.0546875, 2.1588134765625, 2.262939453125, 2.3670654296875, 2.47119140625, 2.5753173828125, 2.679443359375, 2.7835693359375, 2.8876953125, 2.9918212890625, 3.095947265625, 3.2000732421875, 3.30419921875, 3.4083251953125, 3.512451171875, 3.6165771484375, 3.720703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 9.0, 4.0, 4.0, 10.0, 12.0, 14.0, 14.0, 19.0, 29.0, 22.0, 46.0, 41.0, 50.0, 53.0, 57.0, 61.0, 60.0, 69.0, 59.0, 47.0, 49.0, 46.0, 41.0, 39.0, 46.0, 26.0, 21.0, 13.0, 14.0, 4.0, 7.0, 10.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69140625, -3.58258056640625, -3.4737548828125, -3.36492919921875, -3.256103515625, -3.14727783203125, -3.0384521484375, -2.92962646484375, -2.82080078125, -2.71197509765625, -2.6031494140625, -2.49432373046875, -2.385498046875, -2.27667236328125, -2.1678466796875, -2.05902099609375, -1.9501953125, -1.84136962890625, -1.7325439453125, -1.62371826171875, -1.514892578125, -1.40606689453125, -1.2972412109375, -1.18841552734375, -1.07958984375, -0.97076416015625, -0.8619384765625, -0.75311279296875, -0.644287109375, -0.53546142578125, -0.4266357421875, -0.31781005859375, -0.208984375, -0.10015869140625, 0.0086669921875, 0.11749267578125, 0.226318359375, 0.33514404296875, 0.4439697265625, 0.55279541015625, 0.66162109375, 0.77044677734375, 0.8792724609375, 0.98809814453125, 1.096923828125, 1.20574951171875, 1.3145751953125, 1.42340087890625, 1.5322265625, 1.64105224609375, 1.7498779296875, 1.85870361328125, 1.967529296875, 2.07635498046875, 2.1851806640625, 2.29400634765625, 2.40283203125, 2.51165771484375, 2.6204833984375, 2.72930908203125, 2.838134765625, 2.94696044921875, 3.0557861328125, 3.16461181640625, 3.2734375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 16.0, 17.0, 21.0, 41.0, 72.0, 127.0, 206.0, 413.0, 931.0, 2729.0, 18301.0, 764250.0, 247872.0, 9950.0, 2011.0, 766.0, 319.0, 176.0, 111.0, 68.0, 44.0, 30.0, 12.0, 20.0, 10.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.3203125, -11.9337158203125, -11.547119140625, -11.1605224609375, -10.77392578125, -10.3873291015625, -10.000732421875, -9.6141357421875, -9.2275390625, -8.8409423828125, -8.454345703125, -8.0677490234375, -7.68115234375, -7.2945556640625, -6.907958984375, -6.5213623046875, -6.134765625, -5.7481689453125, -5.361572265625, -4.9749755859375, -4.58837890625, -4.2017822265625, -3.815185546875, -3.4285888671875, -3.0419921875, -2.6553955078125, -2.268798828125, -1.8822021484375, -1.49560546875, -1.1090087890625, -0.722412109375, -0.3358154296875, 0.05078125, 0.4373779296875, 0.823974609375, 1.2105712890625, 1.59716796875, 1.9837646484375, 2.370361328125, 2.7569580078125, 3.1435546875, 3.5301513671875, 3.916748046875, 4.3033447265625, 4.68994140625, 5.0765380859375, 5.463134765625, 5.8497314453125, 6.236328125, 6.6229248046875, 7.009521484375, 7.3961181640625, 7.78271484375, 8.1693115234375, 8.555908203125, 8.9425048828125, 9.3291015625, 9.7156982421875, 10.102294921875, 10.4888916015625, 10.87548828125, 11.2620849609375, 11.648681640625, 12.0352783203125, 12.421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 10.0, 21.0, 21.0, 36.0, 48.0, 67.0, 74.0, 114.0, 109.0, 107.0, 98.0, 76.0, 72.0, 54.0, 26.0, 28.0, 10.0, 8.0, 7.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.763916015625, -15.04345703125, -14.322998046875, -13.6025390625, -12.882080078125, -12.16162109375, -11.441162109375, -10.720703125, -10.000244140625, -9.27978515625, -8.559326171875, -7.8388671875, -7.118408203125, -6.39794921875, -5.677490234375, -4.95703125, -4.236572265625, -3.51611328125, -2.795654296875, -2.0751953125, -1.354736328125, -0.63427734375, 0.086181640625, 0.806640625, 1.527099609375, 2.24755859375, 2.968017578125, 3.6884765625, 4.408935546875, 5.12939453125, 5.849853515625, 6.5703125, 7.290771484375, 8.01123046875, 8.731689453125, 9.4521484375, 10.172607421875, 10.89306640625, 11.613525390625, 12.333984375, 13.054443359375, 13.77490234375, 14.495361328125, 15.2158203125, 15.936279296875, 16.65673828125, 17.377197265625, 18.09765625, 18.818115234375, 19.53857421875, 20.259033203125, 20.9794921875, 21.699951171875, 22.42041015625, 23.140869140625, 23.861328125, 24.581787109375, 25.30224609375, 26.022705078125, 26.7431640625, 27.463623046875, 28.18408203125, 28.904541015625, 29.625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 14.0, 7.0, 16.0, 17.0, 36.0, 79.0, 123.0, 245.0, 781.0, 3413.0, 35880.0, 928791.0, 72393.0, 5046.0, 1028.0, 314.0, 149.0, 69.0, 46.0, 26.0, 18.0, 15.0, 8.0, 4.0, 5.0, 6.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.956756591796875, -3.83538818359375, -3.714019775390625, -3.5926513671875, -3.471282958984375, -3.34991455078125, -3.228546142578125, -3.107177734375, -2.985809326171875, -2.86444091796875, -2.743072509765625, -2.6217041015625, -2.500335693359375, -2.37896728515625, -2.257598876953125, -2.13623046875, -2.014862060546875, -1.89349365234375, -1.772125244140625, -1.6507568359375, -1.529388427734375, -1.40802001953125, -1.286651611328125, -1.165283203125, -1.043914794921875, -0.92254638671875, -0.801177978515625, -0.6798095703125, -0.558441162109375, -0.43707275390625, -0.315704345703125, -0.1943359375, -0.072967529296875, 0.04840087890625, 0.169769287109375, 0.2911376953125, 0.412506103515625, 0.53387451171875, 0.655242919921875, 0.776611328125, 0.897979736328125, 1.01934814453125, 1.140716552734375, 1.2620849609375, 1.383453369140625, 1.50482177734375, 1.626190185546875, 1.74755859375, 1.868927001953125, 1.99029541015625, 2.111663818359375, 2.2330322265625, 2.354400634765625, 2.47576904296875, 2.597137451171875, 2.718505859375, 2.839874267578125, 2.96124267578125, 3.082611083984375, 3.2039794921875, 3.325347900390625, 3.44671630859375, 3.568084716796875, 3.689453125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 5.0, 12.0, 13.0, 15.0, 15.0, 39.0, 61.0, 83.0, 131.0, 168.0, 141.0, 98.0, 53.0, 45.0, 29.0, 23.0, 16.0, 10.0, 6.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00042366981506347656, -0.00041301921010017395, -0.00040236860513687134, -0.0003917180001735687, -0.0003810673952102661, -0.0003704167902469635, -0.0003597661852836609, -0.0003491155803203583, -0.00033846497535705566, -0.00032781437039375305, -0.00031716376543045044, -0.00030651316046714783, -0.0002958625555038452, -0.0002852119505405426, -0.00027456134557724, -0.0002639107406139374, -0.00025326013565063477, -0.00024260953068733215, -0.00023195892572402954, -0.00022130832076072693, -0.00021065771579742432, -0.0002000071108341217, -0.0001893565058708191, -0.00017870590090751648, -0.00016805529594421387, -0.00015740469098091125, -0.00014675408601760864, -0.00013610348105430603, -0.00012545287609100342, -0.0001148022711277008, -0.0001041516661643982, -9.350106120109558e-05, -8.285045623779297e-05, -7.219985127449036e-05, -6.154924631118774e-05, -5.089864134788513e-05, -4.024803638458252e-05, -2.9597431421279907e-05, -1.8946826457977295e-05, -8.296221494674683e-06, 2.3543834686279297e-06, 1.3004988431930542e-05, 2.3655593395233154e-05, 3.4306198358535767e-05, 4.495680332183838e-05, 5.560740828514099e-05, 6.62580132484436e-05, 7.690861821174622e-05, 8.755922317504883e-05, 9.820982813835144e-05, 0.00010886043310165405, 0.00011951103806495667, 0.00013016164302825928, 0.0001408122479915619, 0.0001514628529548645, 0.00016211345791816711, 0.00017276406288146973, 0.00018341466784477234, 0.00019406527280807495, 0.00020471587777137756, 0.00021536648273468018, 0.0002260170876979828, 0.0002366676926612854, 0.000247318297624588, 0.0002579689025878906]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 3.0, 6.0, 6.0, 9.0, 6.0, 9.0, 25.0, 25.0, 31.0, 54.0, 94.0, 137.0, 225.0, 455.0, 1015.0, 2460.0, 8382.0, 56525.0, 775435.0, 179849.0, 17096.0, 3909.0, 1398.0, 599.0, 271.0, 167.0, 104.0, 77.0, 42.0, 38.0, 19.0, 25.0, 17.0, 10.0, 9.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.744140625, -2.66729736328125, -2.5904541015625, -2.51361083984375, -2.436767578125, -2.35992431640625, -2.2830810546875, -2.20623779296875, -2.12939453125, -2.05255126953125, -1.9757080078125, -1.89886474609375, -1.822021484375, -1.74517822265625, -1.6683349609375, -1.59149169921875, -1.5146484375, -1.43780517578125, -1.3609619140625, -1.28411865234375, -1.207275390625, -1.13043212890625, -1.0535888671875, -0.97674560546875, -0.89990234375, -0.82305908203125, -0.7462158203125, -0.66937255859375, -0.592529296875, -0.51568603515625, -0.4388427734375, -0.36199951171875, -0.28515625, -0.20831298828125, -0.1314697265625, -0.05462646484375, 0.022216796875, 0.09906005859375, 0.1759033203125, 0.25274658203125, 0.32958984375, 0.40643310546875, 0.4832763671875, 0.56011962890625, 0.636962890625, 0.71380615234375, 0.7906494140625, 0.86749267578125, 0.9443359375, 1.02117919921875, 1.0980224609375, 1.17486572265625, 1.251708984375, 1.32855224609375, 1.4053955078125, 1.48223876953125, 1.55908203125, 1.63592529296875, 1.7127685546875, 1.78961181640625, 1.866455078125, 1.94329833984375, 2.0201416015625, 2.09698486328125, 2.173828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 17.0, 12.0, 12.0, 27.0, 27.0, 29.0, 36.0, 52.0, 52.0, 71.0, 78.0, 86.0, 90.0, 65.0, 69.0, 42.0, 41.0, 32.0, 27.0, 24.0, 18.0, 20.0, 10.0, 14.0, 4.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.044921875, -1.98590087890625, -1.9268798828125, -1.86785888671875, -1.808837890625, -1.74981689453125, -1.6907958984375, -1.63177490234375, -1.57275390625, -1.51373291015625, -1.4547119140625, -1.39569091796875, -1.336669921875, -1.27764892578125, -1.2186279296875, -1.15960693359375, -1.1005859375, -1.04156494140625, -0.9825439453125, -0.92352294921875, -0.864501953125, -0.80548095703125, -0.7464599609375, -0.68743896484375, -0.62841796875, -0.56939697265625, -0.5103759765625, -0.45135498046875, -0.392333984375, -0.33331298828125, -0.2742919921875, -0.21527099609375, -0.15625, -0.09722900390625, -0.0382080078125, 0.02081298828125, 0.079833984375, 0.13885498046875, 0.1978759765625, 0.25689697265625, 0.31591796875, 0.37493896484375, 0.4339599609375, 0.49298095703125, 0.552001953125, 0.61102294921875, 0.6700439453125, 0.72906494140625, 0.7880859375, 0.84710693359375, 0.9061279296875, 0.96514892578125, 1.024169921875, 1.08319091796875, 1.1422119140625, 1.20123291015625, 1.26025390625, 1.31927490234375, 1.3782958984375, 1.43731689453125, 1.496337890625, 1.55535888671875, 1.6143798828125, 1.67340087890625, 1.732421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 29.0, 156.0, 594.0, 168.0, 37.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.571998596191406, -44.29484939575195, -40.017696380615234, -35.74054718017578, -31.463396072387695, -27.18624496459961, -22.909095764160156, -18.63194465637207, -14.354793548583984, -10.077642440795898, -5.800492286682129, -1.5233421325683594, 2.7538089752197266, 7.0309600830078125, 11.308109283447266, 15.585260391235352, 19.862411499023438, 24.139562606811523, 28.41671371459961, 32.69386291503906, 36.97101593017578, 41.248165130615234, 45.52531433105469, 49.802467346191406, 54.07961654663086, 58.35676574707031, 62.63391876220703, 66.91107177734375, 71.18821716308594, 75.46537017822266, 79.74252319335938, 84.01966857910156, 88.29682922363281, 92.57398223876953, 96.85112762451172, 101.12828063964844, 105.40543365478516, 109.68258666992188, 113.95973205566406, 118.23688507080078, 122.5140380859375, 126.79119110107422, 131.06834411621094, 135.34548950195312, 139.6226348876953, 143.89979553222656, 148.17694091796875, 152.45408630371094, 156.73123168945312, 161.0083770751953, 165.28553771972656, 169.56268310546875, 173.83982849121094, 178.1169891357422, 182.39413452148438, 186.67127990722656, 190.9484405517578, 195.2255859375, 199.50274658203125, 203.77989196777344, 208.05703735351562, 212.33419799804688, 216.61134338378906, 220.88848876953125, 225.1656494140625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 7.0, 13.0, 12.0, 25.0, 26.0, 37.0, 35.0, 51.0, 51.0, 61.0, 78.0, 87.0, 89.0, 87.0, 53.0, 53.0, 57.0, 43.0, 31.0, 30.0, 22.0, 17.0, 12.0, 5.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.364501953125, -78.12635803222656, -75.88821411132812, -73.65007019042969, -71.41192626953125, -69.17378234863281, -66.93563842773438, -64.69750213623047, -62.45935821533203, -60.221214294433594, -57.983070373535156, -55.74492645263672, -53.50678634643555, -51.26864242553711, -49.03049850463867, -46.792354583740234, -44.5542106628418, -42.31606674194336, -40.07792282104492, -37.83978271484375, -35.60163879394531, -33.363494873046875, -31.125350952148438, -28.88720703125, -26.649065017700195, -24.410921096801758, -22.172779083251953, -19.934635162353516, -17.696491241455078, -15.458349227905273, -13.220205307006836, -10.982062339782715, -8.743919372558594, -6.505776405334473, -4.267632961273193, -2.029489517211914, 0.20865345001220703, 2.446796417236328, 4.684940338134766, 6.923083305358887, 9.161226272583008, 11.399369239807129, 13.63751220703125, 15.875656127929688, 18.113800048828125, 20.35194206237793, 22.590085983276367, 24.828227996826172, 27.06637191772461, 29.304515838623047, 31.54265785217285, 33.780799865722656, 36.018943786621094, 38.25708770751953, 40.49523162841797, 42.733375549316406, 44.971519470214844, 47.20966339111328, 49.44780731201172, 51.685951232910156, 53.92409133911133, 56.162235260009766, 58.4003791809082, 60.63852310180664, 62.87666320800781]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 3.0, 6.0, 6.0, 13.0, 21.0, 19.0, 30.0, 55.0, 83.0, 117.0, 219.0, 470.0, 976.0, 2348.0, 5781.0, 19803.0, 185796.0, 3316025.0, 608068.0, 38834.0, 9233.0, 3658.0, 1452.0, 604.0, 282.0, 140.0, 96.0, 54.0, 40.0, 16.0, 15.0, 10.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.44921875, -5.315277099609375, -5.18133544921875, -5.047393798828125, -4.9134521484375, -4.779510498046875, -4.64556884765625, -4.511627197265625, -4.377685546875, -4.243743896484375, -4.10980224609375, -3.975860595703125, -3.8419189453125, -3.707977294921875, -3.57403564453125, -3.440093994140625, -3.30615234375, -3.172210693359375, -3.03826904296875, -2.904327392578125, -2.7703857421875, -2.636444091796875, -2.50250244140625, -2.368560791015625, -2.234619140625, -2.100677490234375, -1.96673583984375, -1.832794189453125, -1.6988525390625, -1.564910888671875, -1.43096923828125, -1.297027587890625, -1.1630859375, -1.029144287109375, -0.89520263671875, -0.761260986328125, -0.6273193359375, -0.493377685546875, -0.35943603515625, -0.225494384765625, -0.091552734375, 0.042388916015625, 0.17633056640625, 0.310272216796875, 0.4442138671875, 0.578155517578125, 0.71209716796875, 0.846038818359375, 0.97998046875, 1.113922119140625, 1.24786376953125, 1.381805419921875, 1.5157470703125, 1.649688720703125, 1.78363037109375, 1.917572021484375, 2.051513671875, 2.185455322265625, 2.31939697265625, 2.453338623046875, 2.5872802734375, 2.721221923828125, 2.85516357421875, 2.989105224609375, 3.123046875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 13.0, 14.0, 28.0, 27.0, 26.0, 42.0, 57.0, 61.0, 74.0, 72.0, 71.0, 72.0, 70.0, 77.0, 72.0, 53.0, 44.0, 38.0, 36.0, 9.0, 16.0, 6.0, 9.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-5.83984375, -5.713043212890625, -5.58624267578125, -5.459442138671875, -5.3326416015625, -5.205841064453125, -5.07904052734375, -4.952239990234375, -4.825439453125, -4.698638916015625, -4.57183837890625, -4.445037841796875, -4.3182373046875, -4.191436767578125, -4.06463623046875, -3.937835693359375, -3.81103515625, -3.684234619140625, -3.55743408203125, -3.430633544921875, -3.3038330078125, -3.177032470703125, -3.05023193359375, -2.923431396484375, -2.796630859375, -2.669830322265625, -2.54302978515625, -2.416229248046875, -2.2894287109375, -2.162628173828125, -2.03582763671875, -1.909027099609375, -1.7822265625, -1.655426025390625, -1.52862548828125, -1.401824951171875, -1.2750244140625, -1.148223876953125, -1.02142333984375, -0.894622802734375, -0.767822265625, -0.641021728515625, -0.51422119140625, -0.387420654296875, -0.2606201171875, -0.133819580078125, -0.00701904296875, 0.119781494140625, 0.24658203125, 0.373382568359375, 0.50018310546875, 0.626983642578125, 0.7537841796875, 0.880584716796875, 1.00738525390625, 1.134185791015625, 1.260986328125, 1.387786865234375, 1.51458740234375, 1.641387939453125, 1.7681884765625, 1.894989013671875, 2.02178955078125, 2.148590087890625, 2.275390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 4.0, 8.0, 9.0, 12.0, 23.0, 31.0, 43.0, 114.0, 220.0, 640.0, 1967.0, 9382.0, 108312.0, 4013312.0, 52378.0, 5723.0, 1299.0, 435.0, 170.0, 78.0, 43.0, 20.0, 14.0, 12.0, 11.0, 7.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.859375, -10.5435791015625, -10.227783203125, -9.9119873046875, -9.59619140625, -9.2803955078125, -8.964599609375, -8.6488037109375, -8.3330078125, -8.0172119140625, -7.701416015625, -7.3856201171875, -7.06982421875, -6.7540283203125, -6.438232421875, -6.1224365234375, -5.806640625, -5.4908447265625, -5.175048828125, -4.8592529296875, -4.54345703125, -4.2276611328125, -3.911865234375, -3.5960693359375, -3.2802734375, -2.9644775390625, -2.648681640625, -2.3328857421875, -2.01708984375, -1.7012939453125, -1.385498046875, -1.0697021484375, -0.75390625, -0.4381103515625, -0.122314453125, 0.1934814453125, 0.50927734375, 0.8250732421875, 1.140869140625, 1.4566650390625, 1.7724609375, 2.0882568359375, 2.404052734375, 2.7198486328125, 3.03564453125, 3.3514404296875, 3.667236328125, 3.9830322265625, 4.298828125, 4.6146240234375, 4.930419921875, 5.2462158203125, 5.56201171875, 5.8778076171875, 6.193603515625, 6.5093994140625, 6.8251953125, 7.1409912109375, 7.456787109375, 7.7725830078125, 8.08837890625, 8.4041748046875, 8.719970703125, 9.0357666015625, 9.3515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 9.0, 6.0, 8.0, 6.0, 15.0, 9.0, 13.0, 33.0, 41.0, 58.0, 86.0, 214.0, 560.0, 1224.0, 978.0, 388.0, 139.0, 69.0, 42.0, 32.0, 33.0, 28.0, 15.0, 11.0, 9.0, 4.0, 4.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.30859375, -6.1220703125, -5.935546875, -5.7490234375, -5.5625, -5.3759765625, -5.189453125, -5.0029296875, -4.81640625, -4.6298828125, -4.443359375, -4.2568359375, -4.0703125, -3.8837890625, -3.697265625, -3.5107421875, -3.32421875, -3.1376953125, -2.951171875, -2.7646484375, -2.578125, -2.3916015625, -2.205078125, -2.0185546875, -1.83203125, -1.6455078125, -1.458984375, -1.2724609375, -1.0859375, -0.8994140625, -0.712890625, -0.5263671875, -0.33984375, -0.1533203125, 0.033203125, 0.2197265625, 0.40625, 0.5927734375, 0.779296875, 0.9658203125, 1.15234375, 1.3388671875, 1.525390625, 1.7119140625, 1.8984375, 2.0849609375, 2.271484375, 2.4580078125, 2.64453125, 2.8310546875, 3.017578125, 3.2041015625, 3.390625, 3.5771484375, 3.763671875, 3.9501953125, 4.13671875, 4.3232421875, 4.509765625, 4.6962890625, 4.8828125, 5.0693359375, 5.255859375, 5.4423828125, 5.62890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 11.0, 34.0, 63.0, 175.0, 380.0, 219.0, 73.0, 25.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.22975158691406, -105.90928649902344, -103.58881378173828, -101.26834106445312, -98.9478759765625, -96.62741088867188, -94.30693817138672, -91.98646545410156, -89.66600036621094, -87.34553527832031, -85.02506256103516, -82.70458984375, -80.38412475585938, -78.06365966796875, -75.7431869506836, -73.42271423339844, -71.10224914550781, -68.78178405761719, -66.46131134033203, -64.14083862304688, -61.82037353515625, -59.49990463256836, -57.17943572998047, -54.85896682739258, -52.53849792480469, -50.2180290222168, -47.897560119628906, -45.577091217041016, -43.256622314453125, -40.936153411865234, -38.615684509277344, -36.29521560668945, -33.97475051879883, -31.654281616210938, -29.333812713623047, -27.013343811035156, -24.692874908447266, -22.372406005859375, -20.051937103271484, -17.731468200683594, -15.410999298095703, -13.090530395507812, -10.770061492919922, -8.449592590332031, -6.129123687744141, -3.80865478515625, -1.4881858825683594, 0.8322830200195312, 3.152751922607422, 5.4732208251953125, 7.793689727783203, 10.114158630371094, 12.434627532958984, 14.755096435546875, 17.075565338134766, 19.396034240722656, 21.716503143310547, 24.036972045898438, 26.357440948486328, 28.67790985107422, 30.99837875366211, 33.31884765625, 35.63931655883789, 37.95978546142578, 40.28025436401367]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 5.0, 5.0, 10.0, 12.0, 9.0, 17.0, 23.0, 19.0, 43.0, 38.0, 50.0, 52.0, 50.0, 72.0, 72.0, 51.0, 65.0, 53.0, 68.0, 54.0, 34.0, 42.0, 30.0, 25.0, 22.0, 19.0, 9.0, 18.0, 11.0, 7.0, 7.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.516937255859375, -22.50958824157715, -21.502241134643555, -20.494892120361328, -19.487545013427734, -18.480195999145508, -17.47284698486328, -16.465499877929688, -15.458151817321777, -14.450803756713867, -13.443455696105957, -12.436107635498047, -11.42875862121582, -10.421411514282227, -9.4140625, -8.40671443939209, -7.39936637878418, -6.3920183181762695, -5.384670257568359, -4.377321720123291, -3.369973659515381, -2.3626255989074707, -1.3552770614624023, -0.3479290008544922, 0.659419059753418, 1.6667672395706177, 2.6741154193878174, 3.6814637184143066, 4.688811779022217, 5.696159839630127, 6.703508377075195, 7.7108564376831055, 8.718204498291016, 9.725552558898926, 10.732900619506836, 11.740249633789062, 12.747596740722656, 13.754945755004883, 14.762293815612793, 15.769641876220703, 16.776988983154297, 17.784337997436523, 18.791685104370117, 19.799034118652344, 20.806381225585938, 21.813730239868164, 22.82107925415039, 23.828426361083984, 24.83577537536621, 25.843124389648438, 26.85047149658203, 27.857820510864258, 28.86516761779785, 29.872516632080078, 30.879863739013672, 31.8872127532959, 32.894561767578125, 33.90190887451172, 34.90925979614258, 35.91660690307617, 36.923954010009766, 37.93130111694336, 38.93865203857422, 39.94599914550781, 40.953346252441406]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 18.0, 18.0, 25.0, 36.0, 48.0, 60.0, 84.0, 109.0, 176.0, 280.0, 464.0, 709.0, 1200.0, 2166.0, 3887.0, 7362.0, 14148.0, 29520.0, 67191.0, 163588.0, 330653.0, 241782.0, 100400.0, 42805.0, 19809.0, 9854.0, 5179.0, 2842.0, 1559.0, 945.0, 570.0, 338.0, 225.0, 141.0, 115.0, 67.0, 66.0, 28.0, 24.0, 15.0, 15.0, 5.0, 9.0, 1.0, 9.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.68359375, -2.6063232421875, -2.529052734375, -2.4517822265625, -2.37451171875, -2.2972412109375, -2.219970703125, -2.1427001953125, -2.0654296875, -1.9881591796875, -1.910888671875, -1.8336181640625, -1.75634765625, -1.6790771484375, -1.601806640625, -1.5245361328125, -1.447265625, -1.3699951171875, -1.292724609375, -1.2154541015625, -1.13818359375, -1.0609130859375, -0.983642578125, -0.9063720703125, -0.8291015625, -0.7518310546875, -0.674560546875, -0.5972900390625, -0.52001953125, -0.4427490234375, -0.365478515625, -0.2882080078125, -0.2109375, -0.1336669921875, -0.056396484375, 0.0208740234375, 0.09814453125, 0.1754150390625, 0.252685546875, 0.3299560546875, 0.4072265625, 0.4844970703125, 0.561767578125, 0.6390380859375, 0.71630859375, 0.7935791015625, 0.870849609375, 0.9481201171875, 1.025390625, 1.1026611328125, 1.179931640625, 1.2572021484375, 1.33447265625, 1.4117431640625, 1.489013671875, 1.5662841796875, 1.6435546875, 1.7208251953125, 1.798095703125, 1.8753662109375, 1.95263671875, 2.0299072265625, 2.107177734375, 2.1844482421875, 2.26171875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 5.0, 2.0, 3.0, 12.0, 8.0, 14.0, 14.0, 6.0, 22.0, 22.0, 20.0, 35.0, 25.0, 38.0, 32.0, 33.0, 43.0, 44.0, 40.0, 50.0, 41.0, 54.0, 34.0, 55.0, 45.0, 48.0, 43.0, 34.0, 25.0, 27.0, 29.0, 17.0, 14.0, 23.0, 12.0, 7.0, 6.0, 10.0, 4.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.524078369140625, -2.44659423828125, -2.369110107421875, -2.2916259765625, -2.214141845703125, -2.13665771484375, -2.059173583984375, -1.981689453125, -1.904205322265625, -1.82672119140625, -1.749237060546875, -1.6717529296875, -1.594268798828125, -1.51678466796875, -1.439300537109375, -1.36181640625, -1.284332275390625, -1.20684814453125, -1.129364013671875, -1.0518798828125, -0.974395751953125, -0.89691162109375, -0.819427490234375, -0.741943359375, -0.664459228515625, -0.58697509765625, -0.509490966796875, -0.4320068359375, -0.354522705078125, -0.27703857421875, -0.199554443359375, -0.1220703125, -0.044586181640625, 0.03289794921875, 0.110382080078125, 0.1878662109375, 0.265350341796875, 0.34283447265625, 0.420318603515625, 0.497802734375, 0.575286865234375, 0.65277099609375, 0.730255126953125, 0.8077392578125, 0.885223388671875, 0.96270751953125, 1.040191650390625, 1.11767578125, 1.195159912109375, 1.27264404296875, 1.350128173828125, 1.4276123046875, 1.505096435546875, 1.58258056640625, 1.660064697265625, 1.737548828125, 1.815032958984375, 1.89251708984375, 1.970001220703125, 2.0474853515625, 2.124969482421875, 2.20245361328125, 2.279937744140625, 2.357421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 10.0, 12.0, 7.0, 9.0, 24.0, 25.0, 29.0, 45.0, 52.0, 82.0, 104.0, 159.0, 217.0, 317.0, 438.0, 653.0, 1116.0, 2666.0, 10656.0, 111091.0, 840115.0, 67500.0, 8048.0, 2179.0, 987.0, 607.0, 380.0, 294.0, 179.0, 150.0, 109.0, 79.0, 65.0, 35.0, 33.0, 24.0, 12.0, 13.0, 5.0, 12.0, 3.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.820068359375, -7.55419921875, -7.288330078125, -7.0224609375, -6.756591796875, -6.49072265625, -6.224853515625, -5.958984375, -5.693115234375, -5.42724609375, -5.161376953125, -4.8955078125, -4.629638671875, -4.36376953125, -4.097900390625, -3.83203125, -3.566162109375, -3.30029296875, -3.034423828125, -2.7685546875, -2.502685546875, -2.23681640625, -1.970947265625, -1.705078125, -1.439208984375, -1.17333984375, -0.907470703125, -0.6416015625, -0.375732421875, -0.10986328125, 0.156005859375, 0.421875, 0.687744140625, 0.95361328125, 1.219482421875, 1.4853515625, 1.751220703125, 2.01708984375, 2.282958984375, 2.548828125, 2.814697265625, 3.08056640625, 3.346435546875, 3.6123046875, 3.878173828125, 4.14404296875, 4.409912109375, 4.67578125, 4.941650390625, 5.20751953125, 5.473388671875, 5.7392578125, 6.005126953125, 6.27099609375, 6.536865234375, 6.802734375, 7.068603515625, 7.33447265625, 7.600341796875, 7.8662109375, 8.132080078125, 8.39794921875, 8.663818359375, 8.9296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 6.0, 10.0, 14.0, 18.0, 20.0, 25.0, 28.0, 28.0, 30.0, 39.0, 47.0, 39.0, 51.0, 53.0, 48.0, 59.0, 50.0, 51.0, 48.0, 56.0, 35.0, 39.0, 33.0, 25.0, 23.0, 25.0, 21.0, 12.0, 13.0, 8.0, 4.0, 5.0, 12.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.6796875, -12.3231201171875, -11.966552734375, -11.6099853515625, -11.25341796875, -10.8968505859375, -10.540283203125, -10.1837158203125, -9.8271484375, -9.4705810546875, -9.114013671875, -8.7574462890625, -8.40087890625, -8.0443115234375, -7.687744140625, -7.3311767578125, -6.974609375, -6.6180419921875, -6.261474609375, -5.9049072265625, -5.54833984375, -5.1917724609375, -4.835205078125, -4.4786376953125, -4.1220703125, -3.7655029296875, -3.408935546875, -3.0523681640625, -2.69580078125, -2.3392333984375, -1.982666015625, -1.6260986328125, -1.26953125, -0.9129638671875, -0.556396484375, -0.1998291015625, 0.15673828125, 0.5133056640625, 0.869873046875, 1.2264404296875, 1.5830078125, 1.9395751953125, 2.296142578125, 2.6527099609375, 3.00927734375, 3.3658447265625, 3.722412109375, 4.0789794921875, 4.435546875, 4.7921142578125, 5.148681640625, 5.5052490234375, 5.86181640625, 6.2183837890625, 6.574951171875, 6.9315185546875, 7.2880859375, 7.6446533203125, 8.001220703125, 8.3577880859375, 8.71435546875, 9.0709228515625, 9.427490234375, 9.7840576171875, 10.140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 15.0, 17.0, 21.0, 57.0, 108.0, 200.0, 587.0, 2048.0, 13204.0, 250180.0, 754201.0, 23415.0, 3120.0, 798.0, 304.0, 126.0, 70.0, 31.0, 15.0, 15.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.142578125, -3.047698974609375, -2.95281982421875, -2.857940673828125, -2.7630615234375, -2.668182373046875, -2.57330322265625, -2.478424072265625, -2.383544921875, -2.288665771484375, -2.19378662109375, -2.098907470703125, -2.0040283203125, -1.909149169921875, -1.81427001953125, -1.719390869140625, -1.62451171875, -1.529632568359375, -1.43475341796875, -1.339874267578125, -1.2449951171875, -1.150115966796875, -1.05523681640625, -0.960357666015625, -0.865478515625, -0.770599365234375, -0.67572021484375, -0.580841064453125, -0.4859619140625, -0.391082763671875, -0.29620361328125, -0.201324462890625, -0.1064453125, -0.011566162109375, 0.08331298828125, 0.178192138671875, 0.2730712890625, 0.367950439453125, 0.46282958984375, 0.557708740234375, 0.652587890625, 0.747467041015625, 0.84234619140625, 0.937225341796875, 1.0321044921875, 1.126983642578125, 1.22186279296875, 1.316741943359375, 1.41162109375, 1.506500244140625, 1.60137939453125, 1.696258544921875, 1.7911376953125, 1.886016845703125, 1.98089599609375, 2.075775146484375, 2.170654296875, 2.265533447265625, 2.36041259765625, 2.455291748046875, 2.5501708984375, 2.645050048828125, 2.73992919921875, 2.834808349609375, 2.9296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 8.0, 15.0, 13.0, 27.0, 37.0, 43.0, 97.0, 178.0, 202.0, 142.0, 70.0, 46.0, 34.0, 28.0, 17.0, 15.0, 10.0, 2.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0007724761962890625, -0.0007554627954959869, -0.0007384493947029114, -0.0007214359939098358, -0.0007044225931167603, -0.0006874091923236847, -0.0006703957915306091, -0.0006533823907375336, -0.000636368989944458, -0.0006193555891513824, -0.0006023421883583069, -0.0005853287875652313, -0.0005683153867721558, -0.0005513019859790802, -0.0005342885851860046, -0.0005172751843929291, -0.0005002617835998535, -0.00048324838280677795, -0.0004662349820137024, -0.00044922158122062683, -0.00043220818042755127, -0.0004151947796344757, -0.00039818137884140015, -0.0003811679780483246, -0.000364154577255249, -0.00034714117646217346, -0.0003301277756690979, -0.00031311437487602234, -0.0002961009740829468, -0.0002790875732898712, -0.00026207417249679565, -0.0002450607717037201, -0.00022804737091064453, -0.00021103397011756897, -0.0001940205693244934, -0.00017700716853141785, -0.00015999376773834229, -0.00014298036694526672, -0.00012596696615219116, -0.0001089535653591156, -9.194016456604004e-05, -7.492676377296448e-05, -5.7913362979888916e-05, -4.0899962186813354e-05, -2.3886561393737793e-05, -6.8731606006622314e-06, 1.014024019241333e-05, 2.715364098548889e-05, 4.416704177856445e-05, 6.118044257164001e-05, 7.819384336471558e-05, 9.520724415779114e-05, 0.0001122206449508667, 0.00012923404574394226, 0.00014624744653701782, 0.00016326084733009338, 0.00018027424812316895, 0.0001972876489162445, 0.00021430104970932007, 0.00023131445050239563, 0.0002483278512954712, 0.00026534125208854675, 0.0002823546528816223, 0.0002993680536746979, 0.00031638145446777344]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 9.0, 10.0, 14.0, 6.0, 26.0, 22.0, 37.0, 87.0, 77.0, 120.0, 161.0, 324.0, 566.0, 1122.0, 2865.0, 10519.0, 77504.0, 819816.0, 115360.0, 13569.0, 3407.0, 1331.0, 614.0, 360.0, 167.0, 152.0, 89.0, 52.0, 46.0, 28.0, 21.0, 21.0, 6.0, 10.0, 11.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.490234375, -2.4239654541015625, -2.357696533203125, -2.2914276123046875, -2.22515869140625, -2.1588897705078125, -2.092620849609375, -2.0263519287109375, -1.9600830078125, -1.8938140869140625, -1.827545166015625, -1.7612762451171875, -1.69500732421875, -1.6287384033203125, -1.562469482421875, -1.4962005615234375, -1.429931640625, -1.3636627197265625, -1.297393798828125, -1.2311248779296875, -1.16485595703125, -1.0985870361328125, -1.032318115234375, -0.9660491943359375, -0.8997802734375, -0.8335113525390625, -0.767242431640625, -0.7009735107421875, -0.63470458984375, -0.5684356689453125, -0.502166748046875, -0.4358978271484375, -0.36962890625, -0.3033599853515625, -0.237091064453125, -0.1708221435546875, -0.10455322265625, -0.0382843017578125, 0.027984619140625, 0.0942535400390625, 0.1605224609375, 0.2267913818359375, 0.293060302734375, 0.3593292236328125, 0.42559814453125, 0.4918670654296875, 0.558135986328125, 0.6244049072265625, 0.690673828125, 0.7569427490234375, 0.823211669921875, 0.8894805908203125, 0.95574951171875, 1.0220184326171875, 1.088287353515625, 1.1545562744140625, 1.2208251953125, 1.2870941162109375, 1.353363037109375, 1.4196319580078125, 1.48590087890625, 1.5521697998046875, 1.618438720703125, 1.6847076416015625, 1.7509765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 4.0, 8.0, 9.0, 4.0, 12.0, 13.0, 19.0, 23.0, 33.0, 21.0, 36.0, 44.0, 63.0, 58.0, 79.0, 77.0, 75.0, 74.0, 67.0, 53.0, 38.0, 40.0, 30.0, 17.0, 21.0, 9.0, 17.0, 8.0, 10.0, 9.0, 5.0, 5.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8720703125, -1.8163909912109375, -1.760711669921875, -1.7050323486328125, -1.64935302734375, -1.5936737060546875, -1.537994384765625, -1.4823150634765625, -1.4266357421875, -1.3709564208984375, -1.315277099609375, -1.2595977783203125, -1.20391845703125, -1.1482391357421875, -1.092559814453125, -1.0368804931640625, -0.981201171875, -0.9255218505859375, -0.869842529296875, -0.8141632080078125, -0.75848388671875, -0.7028045654296875, -0.647125244140625, -0.5914459228515625, -0.5357666015625, -0.4800872802734375, -0.424407958984375, -0.3687286376953125, -0.31304931640625, -0.2573699951171875, -0.201690673828125, -0.1460113525390625, -0.09033203125, -0.0346527099609375, 0.021026611328125, 0.0767059326171875, 0.13238525390625, 0.1880645751953125, 0.243743896484375, 0.2994232177734375, 0.3551025390625, 0.4107818603515625, 0.466461181640625, 0.5221405029296875, 0.57781982421875, 0.6334991455078125, 0.689178466796875, 0.7448577880859375, 0.800537109375, 0.8562164306640625, 0.911895751953125, 0.9675750732421875, 1.02325439453125, 1.0789337158203125, 1.134613037109375, 1.1902923583984375, 1.2459716796875, 1.3016510009765625, 1.357330322265625, 1.4130096435546875, 1.46868896484375, 1.5243682861328125, 1.580047607421875, 1.6357269287109375, 1.69140625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 7.0, 2.0, 1.0, 4.0, 9.0, 18.0, 39.0, 96.0, 213.0, 393.0, 146.0, 49.0, 21.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.24934387207031, -101.89994812011719, -99.55055236816406, -97.20115661621094, -94.85176086425781, -92.50237274169922, -90.1529769897461, -87.80358123779297, -85.45418548583984, -83.10478973388672, -80.7553939819336, -78.40599822998047, -76.05661010742188, -73.70721435546875, -71.35781860351562, -69.0084228515625, -66.65902709960938, -64.30963134765625, -61.960235595703125, -59.610843658447266, -57.26144790649414, -54.912052154541016, -52.562660217285156, -50.21326446533203, -47.863868713378906, -45.51447296142578, -43.165077209472656, -40.8156852722168, -38.46628952026367, -36.11689376831055, -33.76750183105469, -31.418106079101562, -29.06871795654297, -26.719322204589844, -24.36992835998535, -22.02053451538086, -19.671138763427734, -17.32174301147461, -14.972349166870117, -12.622955322265625, -10.2735595703125, -7.924164772033691, -5.574769973754883, -3.225375175476074, -0.8759803771972656, 1.473414421081543, 3.8228092193603516, 6.172203063964844, 8.521598815917969, 10.870993614196777, 13.220388412475586, 15.569783210754395, 17.919178009033203, 20.268573760986328, 22.61796760559082, 24.967361450195312, 27.316757202148438, 29.666152954101562, 32.01554870605469, 34.36494064331055, 36.71433639526367, 39.0637321472168, 41.413124084472656, 43.76251983642578, 46.111915588378906]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 7.0, 10.0, 7.0, 13.0, 21.0, 22.0, 21.0, 17.0, 23.0, 28.0, 31.0, 29.0, 41.0, 36.0, 45.0, 46.0, 87.0, 62.0, 70.0, 44.0, 35.0, 27.0, 39.0, 28.0, 27.0, 28.0, 27.0, 19.0, 11.0, 21.0, 12.0, 9.0, 7.0, 5.0, 3.0, 9.0, 5.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.66759490966797, -40.36654281616211, -39.06549072265625, -37.764434814453125, -36.463382720947266, -35.162330627441406, -33.86127853393555, -32.56022644042969, -31.259172439575195, -29.958120346069336, -28.657066345214844, -27.356014251708984, -26.054962158203125, -24.753908157348633, -23.452856063842773, -22.15180206298828, -20.850749969482422, -19.549697875976562, -18.24864387512207, -16.94759178161621, -15.646538734436035, -14.34548568725586, -13.04443359375, -11.743380546569824, -10.442327499389648, -9.141274452209473, -7.840221881866455, -6.5391693115234375, -5.238116264343262, -3.937063217163086, -2.6360106468200684, -1.3349580764770508, -0.033901214599609375, 1.2671515941619873, 2.568204402923584, 3.8692572116851807, 5.170310020446777, 6.471363067626953, 7.772415637969971, 9.073468208312988, 10.374521255493164, 11.67557430267334, 12.976627349853516, 14.277679443359375, 15.57873249053955, 16.879785537719727, 18.180837631225586, 19.481891632080078, 20.782943725585938, 22.083995819091797, 23.38504981994629, 24.68610191345215, 25.98715591430664, 27.2882080078125, 28.58926010131836, 29.89031219482422, 31.19136619567871, 32.4924201965332, 33.79347229003906, 35.09452438354492, 36.39557647705078, 37.696632385253906, 38.997684478759766, 40.298736572265625, 41.599788665771484]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 9.0, 15.0, 11.0, 17.0, 26.0, 49.0, 38.0, 65.0, 98.0, 110.0, 150.0, 185.0, 302.0, 466.0, 687.0, 1165.0, 2221.0, 4368.0, 10617.0, 39666.0, 229933.0, 1908455.0, 1721703.0, 217115.0, 37598.0, 9783.0, 4026.0, 2074.0, 1141.0, 729.0, 400.0, 297.0, 186.0, 130.0, 118.0, 82.0, 65.0, 40.0, 37.0, 26.0, 18.0, 15.0, 16.0, 9.0, 9.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.275390625, -2.201934814453125, -2.12847900390625, -2.055023193359375, -1.9815673828125, -1.908111572265625, -1.83465576171875, -1.761199951171875, -1.687744140625, -1.614288330078125, -1.54083251953125, -1.467376708984375, -1.3939208984375, -1.320465087890625, -1.24700927734375, -1.173553466796875, -1.10009765625, -1.026641845703125, -0.95318603515625, -0.879730224609375, -0.8062744140625, -0.732818603515625, -0.65936279296875, -0.585906982421875, -0.512451171875, -0.438995361328125, -0.36553955078125, -0.292083740234375, -0.2186279296875, -0.145172119140625, -0.07171630859375, 0.001739501953125, 0.0751953125, 0.148651123046875, 0.22210693359375, 0.295562744140625, 0.3690185546875, 0.442474365234375, 0.51593017578125, 0.589385986328125, 0.662841796875, 0.736297607421875, 0.80975341796875, 0.883209228515625, 0.9566650390625, 1.030120849609375, 1.10357666015625, 1.177032470703125, 1.25048828125, 1.323944091796875, 1.39739990234375, 1.470855712890625, 1.5443115234375, 1.617767333984375, 1.69122314453125, 1.764678955078125, 1.838134765625, 1.911590576171875, 1.98504638671875, 2.058502197265625, 2.1319580078125, 2.205413818359375, 2.27886962890625, 2.352325439453125, 2.42578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 10.0, 12.0, 7.0, 15.0, 20.0, 26.0, 26.0, 33.0, 38.0, 36.0, 36.0, 52.0, 63.0, 46.0, 64.0, 66.0, 59.0, 58.0, 53.0, 44.0, 37.0, 35.0, 46.0, 22.0, 18.0, 13.0, 17.0, 16.0, 11.0, 12.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.177734375, -2.09381103515625, -2.0098876953125, -1.92596435546875, -1.842041015625, -1.75811767578125, -1.6741943359375, -1.59027099609375, -1.50634765625, -1.42242431640625, -1.3385009765625, -1.25457763671875, -1.170654296875, -1.08673095703125, -1.0028076171875, -0.91888427734375, -0.8349609375, -0.75103759765625, -0.6671142578125, -0.58319091796875, -0.499267578125, -0.41534423828125, -0.3314208984375, -0.24749755859375, -0.16357421875, -0.07965087890625, 0.0042724609375, 0.08819580078125, 0.172119140625, 0.25604248046875, 0.3399658203125, 0.42388916015625, 0.5078125, 0.59173583984375, 0.6756591796875, 0.75958251953125, 0.843505859375, 0.92742919921875, 1.0113525390625, 1.09527587890625, 1.17919921875, 1.26312255859375, 1.3470458984375, 1.43096923828125, 1.514892578125, 1.59881591796875, 1.6827392578125, 1.76666259765625, 1.8505859375, 1.93450927734375, 2.0184326171875, 2.10235595703125, 2.186279296875, 2.27020263671875, 2.3541259765625, 2.43804931640625, 2.52197265625, 2.60589599609375, 2.6898193359375, 2.77374267578125, 2.857666015625, 2.94158935546875, 3.0255126953125, 3.10943603515625, 3.193359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 12.0, 10.0, 30.0, 44.0, 56.0, 121.0, 261.0, 529.0, 1341.0, 4761.0, 45941.0, 4003990.0, 125818.0, 8080.0, 1747.0, 705.0, 315.0, 207.0, 98.0, 58.0, 52.0, 32.0, 15.0, 15.0, 12.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.94140625, -6.65972900390625, -6.3780517578125, -6.09637451171875, -5.814697265625, -5.53302001953125, -5.2513427734375, -4.96966552734375, -4.68798828125, -4.40631103515625, -4.1246337890625, -3.84295654296875, -3.561279296875, -3.27960205078125, -2.9979248046875, -2.71624755859375, -2.4345703125, -2.15289306640625, -1.8712158203125, -1.58953857421875, -1.307861328125, -1.02618408203125, -0.7445068359375, -0.46282958984375, -0.18115234375, 0.10052490234375, 0.3822021484375, 0.66387939453125, 0.945556640625, 1.22723388671875, 1.5089111328125, 1.79058837890625, 2.072265625, 2.35394287109375, 2.6356201171875, 2.91729736328125, 3.198974609375, 3.48065185546875, 3.7623291015625, 4.04400634765625, 4.32568359375, 4.60736083984375, 4.8890380859375, 5.17071533203125, 5.452392578125, 5.73406982421875, 6.0157470703125, 6.29742431640625, 6.5791015625, 6.86077880859375, 7.1424560546875, 7.42413330078125, 7.705810546875, 7.98748779296875, 8.2691650390625, 8.55084228515625, 8.83251953125, 9.11419677734375, 9.3958740234375, 9.67755126953125, 9.959228515625, 10.24090576171875, 10.5225830078125, 10.80426025390625, 11.0859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 19.0, 19.0, 34.0, 78.0, 136.0, 544.0, 1962.0, 919.0, 185.0, 64.0, 38.0, 26.0, 13.0, 16.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.5123291015625, -8.204345703125, -7.8963623046875, -7.58837890625, -7.2803955078125, -6.972412109375, -6.6644287109375, -6.3564453125, -6.0484619140625, -5.740478515625, -5.4324951171875, -5.12451171875, -4.8165283203125, -4.508544921875, -4.2005615234375, -3.892578125, -3.5845947265625, -3.276611328125, -2.9686279296875, -2.66064453125, -2.3526611328125, -2.044677734375, -1.7366943359375, -1.4287109375, -1.1207275390625, -0.812744140625, -0.5047607421875, -0.19677734375, 0.1112060546875, 0.419189453125, 0.7271728515625, 1.03515625, 1.3431396484375, 1.651123046875, 1.9591064453125, 2.26708984375, 2.5750732421875, 2.883056640625, 3.1910400390625, 3.4990234375, 3.8070068359375, 4.114990234375, 4.4229736328125, 4.73095703125, 5.0389404296875, 5.346923828125, 5.6549072265625, 5.962890625, 6.2708740234375, 6.578857421875, 6.8868408203125, 7.19482421875, 7.5028076171875, 7.810791015625, 8.1187744140625, 8.4267578125, 8.7347412109375, 9.042724609375, 9.3507080078125, 9.65869140625, 9.9666748046875, 10.274658203125, 10.5826416015625, 10.890625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 8.0, 23.0, 53.0, 175.0, 322.0, 267.0, 96.0, 28.0, 12.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-67.02936553955078, -65.0513687133789, -63.0733642578125, -61.09536361694336, -59.11736297607422, -57.13936233520508, -55.16136169433594, -53.18336486816406, -51.205360412597656, -49.227359771728516, -47.249359130859375, -45.271358489990234, -43.293357849121094, -41.31535720825195, -39.33735656738281, -37.35935974121094, -35.3813591003418, -33.403358459472656, -31.425357818603516, -29.447357177734375, -27.469356536865234, -25.491355895996094, -23.513357162475586, -21.535356521606445, -19.557355880737305, -17.579355239868164, -15.601354598999023, -13.6233549118042, -11.645354270935059, -9.667353630065918, -7.689353942871094, -5.711353302001953, -3.733348846435547, -1.7553484439849854, 0.22265195846557617, 2.2006521224975586, 4.178652763366699, 6.15665340423584, 8.134653091430664, 10.112653732299805, 12.090654373168945, 14.068655014038086, 16.046655654907227, 18.024654388427734, 20.002655029296875, 21.980655670166016, 23.958656311035156, 25.936656951904297, 27.914657592773438, 29.892658233642578, 31.87065887451172, 33.84865951538086, 35.82666015625, 37.80466079711914, 39.78266143798828, 41.760658264160156, 43.73866271972656, 45.7166633605957, 47.694664001464844, 49.672664642333984, 51.650665283203125, 53.628665924072266, 55.606666564941406, 57.58466339111328, 59.56266403198242]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 2.0, 2.0, 8.0, 16.0, 10.0, 11.0, 17.0, 24.0, 18.0, 38.0, 25.0, 36.0, 45.0, 35.0, 56.0, 48.0, 44.0, 47.0, 45.0, 52.0, 60.0, 41.0, 28.0, 40.0, 47.0, 29.0, 25.0, 23.0, 28.0, 18.0, 13.0, 16.0, 16.0, 8.0, 7.0, 4.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.314449310302734, -22.59934425354004, -21.884241104125977, -21.16913604736328, -20.45403289794922, -19.738927841186523, -19.023822784423828, -18.308719635009766, -17.59361457824707, -16.878509521484375, -16.163406372070312, -15.448301315307617, -14.733197212219238, -14.01809310913086, -13.302988052368164, -12.587883949279785, -11.872779846191406, -11.157675743103027, -10.442571640014648, -9.727466583251953, -9.012362480163574, -8.297258377075195, -7.582153797149658, -6.867049217224121, -6.151945114135742, -5.436841011047363, -4.721736431121826, -4.006631851196289, -3.29152774810791, -2.576423406600952, -1.8613190650939941, -1.146214485168457, -0.4311103820800781, 0.2839939594268799, 0.9990983009338379, 1.714202642440796, 2.429306983947754, 3.144411325454712, 3.85951566696167, 4.574620246887207, 5.289724349975586, 6.004828453063965, 6.719933032989502, 7.435037612915039, 8.150141716003418, 8.865245819091797, 9.580350875854492, 10.295454978942871, 11.01055908203125, 11.725663185119629, 12.440767288208008, 13.155872344970703, 13.870976448059082, 14.586080551147461, 15.301185607910156, 16.01628875732422, 16.731393814086914, 17.44649887084961, 18.161602020263672, 18.876707077026367, 19.591812133789062, 20.306915283203125, 21.02202033996582, 21.737125396728516, 22.452228546142578]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 11.0, 7.0, 7.0, 20.0, 39.0, 43.0, 78.0, 99.0, 141.0, 206.0, 311.0, 450.0, 665.0, 1088.0, 1704.0, 2717.0, 4793.0, 8983.0, 18398.0, 41313.0, 105249.0, 292736.0, 343680.0, 130103.0, 49712.0, 21614.0, 10455.0, 5541.0, 3044.0, 1849.0, 1180.0, 730.0, 526.0, 330.0, 222.0, 165.0, 86.0, 74.0, 52.0, 47.0, 26.0, 24.0, 13.0, 7.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.04296875, -2.9510498046875, -2.859130859375, -2.7672119140625, -2.67529296875, -2.5833740234375, -2.491455078125, -2.3995361328125, -2.3076171875, -2.2156982421875, -2.123779296875, -2.0318603515625, -1.93994140625, -1.8480224609375, -1.756103515625, -1.6641845703125, -1.572265625, -1.4803466796875, -1.388427734375, -1.2965087890625, -1.20458984375, -1.1126708984375, -1.020751953125, -0.9288330078125, -0.8369140625, -0.7449951171875, -0.653076171875, -0.5611572265625, -0.46923828125, -0.3773193359375, -0.285400390625, -0.1934814453125, -0.1015625, -0.0096435546875, 0.082275390625, 0.1741943359375, 0.26611328125, 0.3580322265625, 0.449951171875, 0.5418701171875, 0.6337890625, 0.7257080078125, 0.817626953125, 0.9095458984375, 1.00146484375, 1.0933837890625, 1.185302734375, 1.2772216796875, 1.369140625, 1.4610595703125, 1.552978515625, 1.6448974609375, 1.73681640625, 1.8287353515625, 1.920654296875, 2.0125732421875, 2.1044921875, 2.1964111328125, 2.288330078125, 2.3802490234375, 2.47216796875, 2.5640869140625, 2.656005859375, 2.7479248046875, 2.83984375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 14.0, 6.0, 9.0, 13.0, 15.0, 14.0, 11.0, 18.0, 28.0, 31.0, 29.0, 31.0, 32.0, 34.0, 38.0, 39.0, 43.0, 42.0, 37.0, 42.0, 46.0, 35.0, 36.0, 43.0, 33.0, 37.0, 37.0, 24.0, 23.0, 18.0, 21.0, 16.0, 15.0, 16.0, 11.0, 13.0, 6.0, 7.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.0859375, -2.0243988037109375, -1.962860107421875, -1.9013214111328125, -1.83978271484375, -1.7782440185546875, -1.716705322265625, -1.6551666259765625, -1.5936279296875, -1.5320892333984375, -1.470550537109375, -1.4090118408203125, -1.34747314453125, -1.2859344482421875, -1.224395751953125, -1.1628570556640625, -1.101318359375, -1.0397796630859375, -0.978240966796875, -0.9167022705078125, -0.85516357421875, -0.7936248779296875, -0.732086181640625, -0.6705474853515625, -0.6090087890625, -0.5474700927734375, -0.485931396484375, -0.4243927001953125, -0.36285400390625, -0.3013153076171875, -0.239776611328125, -0.1782379150390625, -0.11669921875, -0.0551605224609375, 0.006378173828125, 0.0679168701171875, 0.12945556640625, 0.1909942626953125, 0.252532958984375, 0.3140716552734375, 0.3756103515625, 0.4371490478515625, 0.498687744140625, 0.5602264404296875, 0.62176513671875, 0.6833038330078125, 0.744842529296875, 0.8063812255859375, 0.867919921875, 0.9294586181640625, 0.990997314453125, 1.0525360107421875, 1.11407470703125, 1.1756134033203125, 1.237152099609375, 1.2986907958984375, 1.3602294921875, 1.4217681884765625, 1.483306884765625, 1.5448455810546875, 1.60638427734375, 1.6679229736328125, 1.729461669921875, 1.7910003662109375, 1.8525390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 13.0, 14.0, 17.0, 37.0, 40.0, 52.0, 91.0, 166.0, 245.0, 388.0, 622.0, 1172.0, 3225.0, 15422.0, 276710.0, 718270.0, 24328.0, 4349.0, 1467.0, 662.0, 441.0, 257.0, 195.0, 105.0, 76.0, 73.0, 33.0, 26.0, 18.0, 10.0, 9.0, 4.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.40625, -12.0806884765625, -11.755126953125, -11.4295654296875, -11.10400390625, -10.7784423828125, -10.452880859375, -10.1273193359375, -9.8017578125, -9.4761962890625, -9.150634765625, -8.8250732421875, -8.49951171875, -8.1739501953125, -7.848388671875, -7.5228271484375, -7.197265625, -6.8717041015625, -6.546142578125, -6.2205810546875, -5.89501953125, -5.5694580078125, -5.243896484375, -4.9183349609375, -4.5927734375, -4.2672119140625, -3.941650390625, -3.6160888671875, -3.29052734375, -2.9649658203125, -2.639404296875, -2.3138427734375, -1.98828125, -1.6627197265625, -1.337158203125, -1.0115966796875, -0.68603515625, -0.3604736328125, -0.034912109375, 0.2906494140625, 0.6162109375, 0.9417724609375, 1.267333984375, 1.5928955078125, 1.91845703125, 2.2440185546875, 2.569580078125, 2.8951416015625, 3.220703125, 3.5462646484375, 3.871826171875, 4.1973876953125, 4.52294921875, 4.8485107421875, 5.174072265625, 5.4996337890625, 5.8251953125, 6.1507568359375, 6.476318359375, 6.8018798828125, 7.12744140625, 7.4530029296875, 7.778564453125, 8.1041259765625, 8.4296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 5.0, 5.0, 1.0, 7.0, 18.0, 10.0, 13.0, 24.0, 23.0, 34.0, 32.0, 37.0, 41.0, 58.0, 44.0, 50.0, 52.0, 59.0, 49.0, 45.0, 64.0, 31.0, 40.0, 55.0, 38.0, 30.0, 23.0, 23.0, 23.0, 18.0, 13.0, 9.0, 6.0, 8.0, 2.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5390625, -9.2264404296875, -8.913818359375, -8.6011962890625, -8.28857421875, -7.9759521484375, -7.663330078125, -7.3507080078125, -7.0380859375, -6.7254638671875, -6.412841796875, -6.1002197265625, -5.78759765625, -5.4749755859375, -5.162353515625, -4.8497314453125, -4.537109375, -4.2244873046875, -3.911865234375, -3.5992431640625, -3.28662109375, -2.9739990234375, -2.661376953125, -2.3487548828125, -2.0361328125, -1.7235107421875, -1.410888671875, -1.0982666015625, -0.78564453125, -0.4730224609375, -0.160400390625, 0.1522216796875, 0.46484375, 0.7774658203125, 1.090087890625, 1.4027099609375, 1.71533203125, 2.0279541015625, 2.340576171875, 2.6531982421875, 2.9658203125, 3.2784423828125, 3.591064453125, 3.9036865234375, 4.21630859375, 4.5289306640625, 4.841552734375, 5.1541748046875, 5.466796875, 5.7794189453125, 6.092041015625, 6.4046630859375, 6.71728515625, 7.0299072265625, 7.342529296875, 7.6551513671875, 7.9677734375, 8.2803955078125, 8.593017578125, 8.9056396484375, 9.21826171875, 9.5308837890625, 9.843505859375, 10.1561279296875, 10.46875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 11.0, 5.0, 6.0, 8.0, 10.0, 17.0, 16.0, 21.0, 30.0, 41.0, 89.0, 147.0, 254.0, 696.0, 1848.0, 6453.0, 36541.0, 712886.0, 261128.0, 21321.0, 4548.0, 1336.0, 537.0, 232.0, 125.0, 81.0, 39.0, 23.0, 18.0, 16.0, 14.0, 10.0, 5.0, 4.0, 5.0, 5.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-2.53125, -2.458648681640625, -2.38604736328125, -2.313446044921875, -2.2408447265625, -2.168243408203125, -2.09564208984375, -2.023040771484375, -1.950439453125, -1.877838134765625, -1.80523681640625, -1.732635498046875, -1.6600341796875, -1.587432861328125, -1.51483154296875, -1.442230224609375, -1.36962890625, -1.297027587890625, -1.22442626953125, -1.151824951171875, -1.0792236328125, -1.006622314453125, -0.93402099609375, -0.861419677734375, -0.788818359375, -0.716217041015625, -0.64361572265625, -0.571014404296875, -0.4984130859375, -0.425811767578125, -0.35321044921875, -0.280609130859375, -0.2080078125, -0.135406494140625, -0.06280517578125, 0.009796142578125, 0.0823974609375, 0.154998779296875, 0.22760009765625, 0.300201416015625, 0.372802734375, 0.445404052734375, 0.51800537109375, 0.590606689453125, 0.6632080078125, 0.735809326171875, 0.80841064453125, 0.881011962890625, 0.95361328125, 1.026214599609375, 1.09881591796875, 1.171417236328125, 1.2440185546875, 1.316619873046875, 1.38922119140625, 1.461822509765625, 1.534423828125, 1.607025146484375, 1.67962646484375, 1.752227783203125, 1.8248291015625, 1.897430419921875, 1.97003173828125, 2.042633056640625, 2.115234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 7.0, 6.0, 13.0, 8.0, 21.0, 28.0, 39.0, 47.0, 86.0, 132.0, 165.0, 141.0, 90.0, 55.0, 49.0, 17.0, 24.0, 11.0, 10.0, 15.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004911422729492188, -0.000477377325296402, -0.0004636123776435852, -0.00044984742999076843, -0.00043608248233795166, -0.0004223175346851349, -0.0004085525870323181, -0.00039478763937950134, -0.00038102269172668457, -0.0003672577440738678, -0.000353492796421051, -0.00033972784876823425, -0.0003259629011154175, -0.0003121979534626007, -0.00029843300580978394, -0.00028466805815696716, -0.0002709031105041504, -0.0002571381628513336, -0.00024337321519851685, -0.00022960826754570007, -0.0002158433198928833, -0.00020207837224006653, -0.00018831342458724976, -0.00017454847693443298, -0.0001607835292816162, -0.00014701858162879944, -0.00013325363397598267, -0.0001194886863231659, -0.00010572373867034912, -9.195879101753235e-05, -7.819384336471558e-05, -6.44288957118988e-05, -5.066394805908203e-05, -3.689900040626526e-05, -2.3134052753448486e-05, -9.369105100631714e-06, 4.395842552185059e-06, 1.816079020500183e-05, 3.1925737857818604e-05, 4.5690685510635376e-05, 5.945563316345215e-05, 7.322058081626892e-05, 8.69855284690857e-05, 0.00010075047612190247, 0.00011451542377471924, 0.000128280371427536, 0.00014204531908035278, 0.00015581026673316956, 0.00016957521438598633, 0.0001833401620388031, 0.00019710510969161987, 0.00021087005734443665, 0.00022463500499725342, 0.0002383999526500702, 0.00025216490030288696, 0.00026592984795570374, 0.0002796947956085205, 0.0002934597432613373, 0.00030722469091415405, 0.0003209896385669708, 0.0003347545862197876, 0.00034851953387260437, 0.00036228448152542114, 0.0003760494291782379, 0.0003898143768310547]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 4.0, 5.0, 10.0, 12.0, 23.0, 35.0, 54.0, 78.0, 162.0, 379.0, 1024.0, 4208.0, 47216.0, 944927.0, 44560.0, 4029.0, 1053.0, 373.0, 183.0, 76.0, 46.0, 26.0, 19.0, 15.0, 11.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0078125, -2.898406982421875, -2.78900146484375, -2.679595947265625, -2.5701904296875, -2.460784912109375, -2.35137939453125, -2.241973876953125, -2.132568359375, -2.023162841796875, -1.91375732421875, -1.804351806640625, -1.6949462890625, -1.585540771484375, -1.47613525390625, -1.366729736328125, -1.25732421875, -1.147918701171875, -1.03851318359375, -0.929107666015625, -0.8197021484375, -0.710296630859375, -0.60089111328125, -0.491485595703125, -0.382080078125, -0.272674560546875, -0.16326904296875, -0.053863525390625, 0.0555419921875, 0.164947509765625, 0.27435302734375, 0.383758544921875, 0.4931640625, 0.602569580078125, 0.71197509765625, 0.821380615234375, 0.9307861328125, 1.040191650390625, 1.14959716796875, 1.259002685546875, 1.368408203125, 1.477813720703125, 1.58721923828125, 1.696624755859375, 1.8060302734375, 1.915435791015625, 2.02484130859375, 2.134246826171875, 2.24365234375, 2.353057861328125, 2.46246337890625, 2.571868896484375, 2.6812744140625, 2.790679931640625, 2.90008544921875, 3.009490966796875, 3.118896484375, 3.228302001953125, 3.33770751953125, 3.447113037109375, 3.5565185546875, 3.665924072265625, 3.77532958984375, 3.884735107421875, 3.994140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 8.0, 9.0, 9.0, 13.0, 16.0, 23.0, 37.0, 58.0, 62.0, 78.0, 113.0, 99.0, 87.0, 96.0, 72.0, 69.0, 47.0, 22.0, 26.0, 16.0, 13.0, 8.0, 3.0, 9.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84765625, -1.784027099609375, -1.72039794921875, -1.656768798828125, -1.5931396484375, -1.529510498046875, -1.46588134765625, -1.402252197265625, -1.338623046875, -1.274993896484375, -1.21136474609375, -1.147735595703125, -1.0841064453125, -1.020477294921875, -0.95684814453125, -0.893218994140625, -0.82958984375, -0.765960693359375, -0.70233154296875, -0.638702392578125, -0.5750732421875, -0.511444091796875, -0.44781494140625, -0.384185791015625, -0.320556640625, -0.256927490234375, -0.19329833984375, -0.129669189453125, -0.0660400390625, -0.002410888671875, 0.06121826171875, 0.124847412109375, 0.1884765625, 0.252105712890625, 0.31573486328125, 0.379364013671875, 0.4429931640625, 0.506622314453125, 0.57025146484375, 0.633880615234375, 0.697509765625, 0.761138916015625, 0.82476806640625, 0.888397216796875, 0.9520263671875, 1.015655517578125, 1.07928466796875, 1.142913818359375, 1.20654296875, 1.270172119140625, 1.33380126953125, 1.397430419921875, 1.4610595703125, 1.524688720703125, 1.58831787109375, 1.651947021484375, 1.715576171875, 1.779205322265625, 1.84283447265625, 1.906463623046875, 1.9700927734375, 2.033721923828125, 2.09735107421875, 2.160980224609375, 2.224609375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 15.0, 19.0, 53.0, 135.0, 314.0, 253.0, 118.0, 55.0, 15.0, 16.0, 8.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.48570251464844, -93.44749450683594, -91.40928649902344, -89.37107849121094, -87.3328628540039, -85.2946548461914, -83.2564468383789, -81.2182388305664, -79.1800308227539, -77.1418228149414, -75.1036148071289, -73.06539916992188, -71.02719116210938, -68.98898315429688, -66.95077514648438, -64.91256713867188, -62.87435531616211, -60.83614730834961, -58.797935485839844, -56.759727478027344, -54.721519470214844, -52.683311462402344, -50.64509963989258, -48.60689163208008, -46.56867980957031, -44.53047180175781, -42.49225997924805, -40.45405197143555, -38.41584396362305, -36.37763214111328, -34.33942413330078, -32.30121612548828, -30.26300811767578, -28.22479820251465, -26.18659019470215, -24.148380279541016, -22.110172271728516, -20.071962356567383, -18.03375244140625, -15.995543479919434, -13.957334518432617, -11.9191255569458, -9.880916595458984, -7.842706680297852, -5.804497718811035, -3.7662887573242188, -1.728078842163086, 0.31013011932373047, 2.348339080810547, 4.386548042297363, 6.424757480621338, 8.462966918945312, 10.501175880432129, 12.539384841918945, 14.577594757080078, 16.615802764892578, 18.65401268005371, 20.692222595214844, 22.730430603027344, 24.768640518188477, 26.80685043334961, 28.84505844116211, 30.883268356323242, 32.921478271484375, 34.959686279296875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 5.0, 4.0, 4.0, 10.0, 5.0, 14.0, 17.0, 17.0, 23.0, 18.0, 28.0, 24.0, 18.0, 23.0, 30.0, 27.0, 39.0, 43.0, 51.0, 70.0, 62.0, 60.0, 65.0, 40.0, 33.0, 27.0, 32.0, 30.0, 25.0, 25.0, 32.0, 18.0, 16.0, 16.0, 9.0, 12.0, 14.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-42.14063262939453, -41.03972625732422, -39.93881607055664, -38.83790588378906, -37.73699951171875, -36.63609313964844, -35.53518295288086, -34.43427276611328, -33.33336639404297, -32.232460021972656, -31.131549835205078, -30.030641555786133, -28.929733276367188, -27.828824996948242, -26.727916717529297, -25.62700843811035, -24.526100158691406, -23.42519187927246, -22.324283599853516, -21.22337532043457, -20.122467041015625, -19.02155876159668, -17.920650482177734, -16.81974220275879, -15.718833923339844, -14.617925643920898, -13.517017364501953, -12.416109085083008, -11.315200805664062, -10.214292526245117, -9.113384246826172, -8.012475967407227, -6.911571502685547, -5.810663223266602, -4.709754943847656, -3.608846664428711, -2.5079383850097656, -1.4070301055908203, -0.306121826171875, 0.7947864532470703, 1.8956947326660156, 2.996603012084961, 4.097511291503906, 5.198419570922852, 6.299327850341797, 7.400236129760742, 8.501144409179688, 9.602052688598633, 10.702960968017578, 11.803869247436523, 12.904777526855469, 14.005685806274414, 15.10659408569336, 16.207502365112305, 17.30841064453125, 18.409318923950195, 19.51022720336914, 20.611135482788086, 21.71204376220703, 22.812952041625977, 23.913860321044922, 25.014768600463867, 26.115676879882812, 27.216585159301758, 28.317493438720703]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 7.0, 7.0, 11.0, 10.0, 13.0, 15.0, 27.0, 53.0, 59.0, 92.0, 136.0, 168.0, 278.0, 420.0, 581.0, 1110.0, 1988.0, 4219.0, 10944.0, 57172.0, 583740.0, 2982275.0, 481912.0, 50001.0, 10367.0, 3802.0, 1856.0, 1076.0, 607.0, 406.0, 258.0, 198.0, 140.0, 98.0, 63.0, 48.0, 24.0, 23.0, 19.0, 14.0, 12.0, 9.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.65625, -2.569061279296875, -2.48187255859375, -2.394683837890625, -2.3074951171875, -2.220306396484375, -2.13311767578125, -2.045928955078125, -1.958740234375, -1.871551513671875, -1.78436279296875, -1.697174072265625, -1.6099853515625, -1.522796630859375, -1.43560791015625, -1.348419189453125, -1.26123046875, -1.174041748046875, -1.08685302734375, -0.999664306640625, -0.9124755859375, -0.825286865234375, -0.73809814453125, -0.650909423828125, -0.563720703125, -0.476531982421875, -0.38934326171875, -0.302154541015625, -0.2149658203125, -0.127777099609375, -0.04058837890625, 0.046600341796875, 0.1337890625, 0.220977783203125, 0.30816650390625, 0.395355224609375, 0.4825439453125, 0.569732666015625, 0.65692138671875, 0.744110107421875, 0.831298828125, 0.918487548828125, 1.00567626953125, 1.092864990234375, 1.1800537109375, 1.267242431640625, 1.35443115234375, 1.441619873046875, 1.52880859375, 1.615997314453125, 1.70318603515625, 1.790374755859375, 1.8775634765625, 1.964752197265625, 2.05194091796875, 2.139129638671875, 2.226318359375, 2.313507080078125, 2.40069580078125, 2.487884521484375, 2.5750732421875, 2.662261962890625, 2.74945068359375, 2.836639404296875, 2.923828125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 7.0, 8.0, 8.0, 7.0, 12.0, 11.0, 10.0, 9.0, 19.0, 18.0, 22.0, 21.0, 18.0, 29.0, 38.0, 36.0, 38.0, 40.0, 44.0, 42.0, 56.0, 43.0, 34.0, 40.0, 40.0, 44.0, 33.0, 37.0, 35.0, 20.0, 23.0, 20.0, 19.0, 30.0, 11.0, 21.0, 12.0, 7.0, 10.0, 10.0, 13.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.044921875, -1.9871978759765625, -1.929473876953125, -1.8717498779296875, -1.81402587890625, -1.7563018798828125, -1.698577880859375, -1.6408538818359375, -1.5831298828125, -1.5254058837890625, -1.467681884765625, -1.4099578857421875, -1.35223388671875, -1.2945098876953125, -1.236785888671875, -1.1790618896484375, -1.121337890625, -1.0636138916015625, -1.005889892578125, -0.9481658935546875, -0.89044189453125, -0.8327178955078125, -0.774993896484375, -0.7172698974609375, -0.6595458984375, -0.6018218994140625, -0.544097900390625, -0.4863739013671875, -0.42864990234375, -0.3709259033203125, -0.313201904296875, -0.2554779052734375, -0.19775390625, -0.1400299072265625, -0.082305908203125, -0.0245819091796875, 0.03314208984375, 0.0908660888671875, 0.148590087890625, 0.2063140869140625, 0.2640380859375, 0.3217620849609375, 0.379486083984375, 0.4372100830078125, 0.49493408203125, 0.5526580810546875, 0.610382080078125, 0.6681060791015625, 0.725830078125, 0.7835540771484375, 0.841278076171875, 0.8990020751953125, 0.95672607421875, 1.0144500732421875, 1.072174072265625, 1.1298980712890625, 1.1876220703125, 1.2453460693359375, 1.303070068359375, 1.3607940673828125, 1.41851806640625, 1.4762420654296875, 1.533966064453125, 1.5916900634765625, 1.6494140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 3.0, 6.0, 16.0, 15.0, 31.0, 42.0, 93.0, 147.0, 341.0, 789.0, 2153.0, 8058.0, 71334.0, 4018471.0, 80266.0, 8740.0, 2220.0, 785.0, 369.0, 166.0, 93.0, 38.0, 28.0, 23.0, 8.0, 11.0, 8.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.3203125, -9.0650634765625, -8.809814453125, -8.5545654296875, -8.29931640625, -8.0440673828125, -7.788818359375, -7.5335693359375, -7.2783203125, -7.0230712890625, -6.767822265625, -6.5125732421875, -6.25732421875, -6.0020751953125, -5.746826171875, -5.4915771484375, -5.236328125, -4.9810791015625, -4.725830078125, -4.4705810546875, -4.21533203125, -3.9600830078125, -3.704833984375, -3.4495849609375, -3.1943359375, -2.9390869140625, -2.683837890625, -2.4285888671875, -2.17333984375, -1.9180908203125, -1.662841796875, -1.4075927734375, -1.15234375, -0.8970947265625, -0.641845703125, -0.3865966796875, -0.13134765625, 0.1239013671875, 0.379150390625, 0.6343994140625, 0.8896484375, 1.1448974609375, 1.400146484375, 1.6553955078125, 1.91064453125, 2.1658935546875, 2.421142578125, 2.6763916015625, 2.931640625, 3.1868896484375, 3.442138671875, 3.6973876953125, 3.95263671875, 4.2078857421875, 4.463134765625, 4.7183837890625, 4.9736328125, 5.2288818359375, 5.484130859375, 5.7393798828125, 5.99462890625, 6.2498779296875, 6.505126953125, 6.7603759765625, 7.015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 3.0, 3.0, 2.0, 10.0, 7.0, 10.0, 18.0, 32.0, 38.0, 75.0, 201.0, 574.0, 1329.0, 1079.0, 363.0, 139.0, 65.0, 36.0, 23.0, 16.0, 12.0, 8.0, 10.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.8828125, -6.6905517578125, -6.498291015625, -6.3060302734375, -6.11376953125, -5.9215087890625, -5.729248046875, -5.5369873046875, -5.3447265625, -5.1524658203125, -4.960205078125, -4.7679443359375, -4.57568359375, -4.3834228515625, -4.191162109375, -3.9989013671875, -3.806640625, -3.6143798828125, -3.422119140625, -3.2298583984375, -3.03759765625, -2.8453369140625, -2.653076171875, -2.4608154296875, -2.2685546875, -2.0762939453125, -1.884033203125, -1.6917724609375, -1.49951171875, -1.3072509765625, -1.114990234375, -0.9227294921875, -0.73046875, -0.5382080078125, -0.345947265625, -0.1536865234375, 0.03857421875, 0.2308349609375, 0.423095703125, 0.6153564453125, 0.8076171875, 0.9998779296875, 1.192138671875, 1.3843994140625, 1.57666015625, 1.7689208984375, 1.961181640625, 2.1534423828125, 2.345703125, 2.5379638671875, 2.730224609375, 2.9224853515625, 3.11474609375, 3.3070068359375, 3.499267578125, 3.6915283203125, 3.8837890625, 4.0760498046875, 4.268310546875, 4.4605712890625, 4.65283203125, 4.8450927734375, 5.037353515625, 5.2296142578125, 5.421875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 6.0, 13.0, 30.0, 77.0, 185.0, 293.0, 231.0, 94.0, 36.0, 19.0, 10.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-81.15202331542969, -79.45350646972656, -77.75498962402344, -76.05647277832031, -74.35795593261719, -72.65943908691406, -70.96092224121094, -69.26241302490234, -67.56389617919922, -65.8653793334961, -64.16686248779297, -62.468345642089844, -60.769832611083984, -59.07131576538086, -57.372798919677734, -55.67428207397461, -53.975765228271484, -52.27724838256836, -50.578731536865234, -48.880218505859375, -47.18170166015625, -45.483184814453125, -43.78466796875, -42.086151123046875, -40.38763427734375, -38.689117431640625, -36.9906005859375, -35.292083740234375, -33.593570709228516, -31.89505386352539, -30.196537017822266, -28.49802017211914, -26.799510955810547, -25.100994110107422, -23.40247917175293, -21.703962326049805, -20.005447387695312, -18.306930541992188, -16.608413696289062, -14.909897804260254, -13.211381912231445, -11.512866020202637, -9.814350128173828, -8.115833282470703, -6.4173173904418945, -4.718801498413086, -3.020284652709961, -1.3217687606811523, 0.37674713134765625, 2.075263261795044, 3.7737793922424316, 5.472295761108398, 7.170811653137207, 8.869327545166016, 10.56784439086914, 12.26636028289795, 13.964876174926758, 15.663392066955566, 17.361907958984375, 19.0604248046875, 20.758941650390625, 22.457456588745117, 24.155973434448242, 25.854488372802734, 27.55300521850586]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 7.0, 5.0, 7.0, 16.0, 18.0, 20.0, 18.0, 22.0, 24.0, 25.0, 34.0, 32.0, 38.0, 49.0, 43.0, 43.0, 51.0, 44.0, 36.0, 43.0, 36.0, 32.0, 33.0, 48.0, 34.0, 31.0, 28.0, 26.0, 18.0, 19.0, 16.0, 18.0, 17.0, 11.0, 7.0, 9.0, 9.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.52326774597168, -16.01232147216797, -15.501375198364258, -14.990428924560547, -14.479482650756836, -13.968536376953125, -13.457590103149414, -12.946643829345703, -12.435697555541992, -11.924751281738281, -11.41380500793457, -10.90285873413086, -10.391912460327148, -9.880966186523438, -9.370019912719727, -8.859073638916016, -8.348127365112305, -7.837181091308594, -7.326234817504883, -6.815288543701172, -6.304342269897461, -5.79339599609375, -5.282449722290039, -4.771503448486328, -4.260557174682617, -3.7496109008789062, -3.2386646270751953, -2.7277183532714844, -2.2167720794677734, -1.7058258056640625, -1.1948795318603516, -0.6839332580566406, -0.1729888916015625, 0.33795738220214844, 0.8489036560058594, 1.3598499298095703, 1.8707962036132812, 2.381742477416992, 2.892688751220703, 3.403635025024414, 3.914581298828125, 4.425527572631836, 4.936473846435547, 5.447420120239258, 5.958366394042969, 6.46931266784668, 6.980258941650391, 7.491205215454102, 8.002151489257812, 8.513097763061523, 9.024044036865234, 9.534990310668945, 10.045936584472656, 10.556882858276367, 11.067829132080078, 11.578775405883789, 12.0897216796875, 12.600667953491211, 13.111614227294922, 13.622560501098633, 14.133506774902344, 14.644453048706055, 15.155399322509766, 15.666345596313477, 16.177291870117188]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 2.0, 14.0, 16.0, 36.0, 27.0, 71.0, 96.0, 126.0, 174.0, 319.0, 459.0, 742.0, 1061.0, 1837.0, 2861.0, 4902.0, 9090.0, 16730.0, 33995.0, 76467.0, 181675.0, 329842.0, 214747.0, 89926.0, 39608.0, 19241.0, 10118.0, 5734.0, 3248.0, 2013.0, 1215.0, 699.0, 554.0, 340.0, 211.0, 117.0, 79.0, 59.0, 32.0, 26.0, 16.0, 9.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.078125, -2.012359619140625, -1.94659423828125, -1.880828857421875, -1.8150634765625, -1.749298095703125, -1.68353271484375, -1.617767333984375, -1.552001953125, -1.486236572265625, -1.42047119140625, -1.354705810546875, -1.2889404296875, -1.223175048828125, -1.15740966796875, -1.091644287109375, -1.02587890625, -0.960113525390625, -0.89434814453125, -0.828582763671875, -0.7628173828125, -0.697052001953125, -0.63128662109375, -0.565521240234375, -0.499755859375, -0.433990478515625, -0.36822509765625, -0.302459716796875, -0.2366943359375, -0.170928955078125, -0.10516357421875, -0.039398193359375, 0.0263671875, 0.092132568359375, 0.15789794921875, 0.223663330078125, 0.2894287109375, 0.355194091796875, 0.42095947265625, 0.486724853515625, 0.552490234375, 0.618255615234375, 0.68402099609375, 0.749786376953125, 0.8155517578125, 0.881317138671875, 0.94708251953125, 1.012847900390625, 1.07861328125, 1.144378662109375, 1.21014404296875, 1.275909423828125, 1.3416748046875, 1.407440185546875, 1.47320556640625, 1.538970947265625, 1.604736328125, 1.670501708984375, 1.73626708984375, 1.802032470703125, 1.8677978515625, 1.933563232421875, 1.99932861328125, 2.065093994140625, 2.130859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 5.0, 14.0, 14.0, 18.0, 16.0, 17.0, 19.0, 18.0, 26.0, 19.0, 38.0, 29.0, 42.0, 30.0, 41.0, 50.0, 43.0, 51.0, 42.0, 46.0, 40.0, 42.0, 33.0, 41.0, 29.0, 34.0, 22.0, 27.0, 33.0, 21.0, 17.0, 18.0, 5.0, 11.0, 9.0, 10.0, 7.0, 4.0, 7.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.248046875, -2.1855010986328125, -2.122955322265625, -2.0604095458984375, -1.99786376953125, -1.9353179931640625, -1.872772216796875, -1.8102264404296875, -1.7476806640625, -1.6851348876953125, -1.622589111328125, -1.5600433349609375, -1.49749755859375, -1.4349517822265625, -1.372406005859375, -1.3098602294921875, -1.247314453125, -1.1847686767578125, -1.122222900390625, -1.0596771240234375, -0.99713134765625, -0.9345855712890625, -0.872039794921875, -0.8094940185546875, -0.7469482421875, -0.6844024658203125, -0.621856689453125, -0.5593109130859375, -0.49676513671875, -0.4342193603515625, -0.371673583984375, -0.3091278076171875, -0.24658203125, -0.1840362548828125, -0.121490478515625, -0.0589447021484375, 0.00360107421875, 0.0661468505859375, 0.128692626953125, 0.1912384033203125, 0.2537841796875, 0.3163299560546875, 0.378875732421875, 0.4414215087890625, 0.50396728515625, 0.5665130615234375, 0.629058837890625, 0.6916046142578125, 0.754150390625, 0.8166961669921875, 0.879241943359375, 0.9417877197265625, 1.00433349609375, 1.0668792724609375, 1.129425048828125, 1.1919708251953125, 1.2545166015625, 1.3170623779296875, 1.379608154296875, 1.4421539306640625, 1.50469970703125, 1.5672454833984375, 1.629791259765625, 1.6923370361328125, 1.7548828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 0.0, 4.0, 5.0, 6.0, 11.0, 9.0, 10.0, 15.0, 16.0, 26.0, 27.0, 50.0, 45.0, 64.0, 110.0, 192.0, 322.0, 587.0, 1388.0, 3988.0, 16974.0, 113776.0, 758383.0, 126857.0, 18557.0, 4199.0, 1397.0, 619.0, 312.0, 186.0, 105.0, 88.0, 40.0, 46.0, 27.0, 29.0, 15.0, 17.0, 10.0, 10.0, 5.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.58984375, -5.4005126953125, -5.211181640625, -5.0218505859375, -4.83251953125, -4.6431884765625, -4.453857421875, -4.2645263671875, -4.0751953125, -3.8858642578125, -3.696533203125, -3.5072021484375, -3.31787109375, -3.1285400390625, -2.939208984375, -2.7498779296875, -2.560546875, -2.3712158203125, -2.181884765625, -1.9925537109375, -1.80322265625, -1.6138916015625, -1.424560546875, -1.2352294921875, -1.0458984375, -0.8565673828125, -0.667236328125, -0.4779052734375, -0.28857421875, -0.0992431640625, 0.090087890625, 0.2794189453125, 0.46875, 0.6580810546875, 0.847412109375, 1.0367431640625, 1.22607421875, 1.4154052734375, 1.604736328125, 1.7940673828125, 1.9833984375, 2.1727294921875, 2.362060546875, 2.5513916015625, 2.74072265625, 2.9300537109375, 3.119384765625, 3.3087158203125, 3.498046875, 3.6873779296875, 3.876708984375, 4.0660400390625, 4.25537109375, 4.4447021484375, 4.634033203125, 4.8233642578125, 5.0126953125, 5.2020263671875, 5.391357421875, 5.5806884765625, 5.77001953125, 5.9593505859375, 6.148681640625, 6.3380126953125, 6.52734375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 9.0, 9.0, 7.0, 16.0, 15.0, 17.0, 12.0, 22.0, 17.0, 19.0, 24.0, 24.0, 27.0, 47.0, 32.0, 37.0, 40.0, 41.0, 32.0, 35.0, 35.0, 51.0, 38.0, 36.0, 49.0, 30.0, 34.0, 30.0, 20.0, 21.0, 27.0, 24.0, 16.0, 13.0, 13.0, 17.0, 14.0, 6.0, 13.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-6.640625, -6.44354248046875, -6.2464599609375, -6.04937744140625, -5.852294921875, -5.65521240234375, -5.4581298828125, -5.26104736328125, -5.06396484375, -4.86688232421875, -4.6697998046875, -4.47271728515625, -4.275634765625, -4.07855224609375, -3.8814697265625, -3.68438720703125, -3.4873046875, -3.29022216796875, -3.0931396484375, -2.89605712890625, -2.698974609375, -2.50189208984375, -2.3048095703125, -2.10772705078125, -1.91064453125, -1.71356201171875, -1.5164794921875, -1.31939697265625, -1.122314453125, -0.92523193359375, -0.7281494140625, -0.53106689453125, -0.333984375, -0.13690185546875, 0.0601806640625, 0.25726318359375, 0.454345703125, 0.65142822265625, 0.8485107421875, 1.04559326171875, 1.24267578125, 1.43975830078125, 1.6368408203125, 1.83392333984375, 2.031005859375, 2.22808837890625, 2.4251708984375, 2.62225341796875, 2.8193359375, 3.01641845703125, 3.2135009765625, 3.41058349609375, 3.607666015625, 3.80474853515625, 4.0018310546875, 4.19891357421875, 4.39599609375, 4.59307861328125, 4.7901611328125, 4.98724365234375, 5.184326171875, 5.38140869140625, 5.5784912109375, 5.77557373046875, 5.97265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 5.0, 11.0, 10.0, 15.0, 17.0, 23.0, 41.0, 66.0, 80.0, 126.0, 267.0, 412.0, 839.0, 1952.0, 5140.0, 16675.0, 72800.0, 619060.0, 267654.0, 45069.0, 11442.0, 3737.0, 1524.0, 664.0, 340.0, 214.0, 120.0, 74.0, 46.0, 29.0, 22.0, 16.0, 14.0, 6.0, 11.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.580078125, -1.5334014892578125, -1.486724853515625, -1.4400482177734375, -1.39337158203125, -1.3466949462890625, -1.300018310546875, -1.2533416748046875, -1.2066650390625, -1.1599884033203125, -1.113311767578125, -1.0666351318359375, -1.01995849609375, -0.9732818603515625, -0.926605224609375, -0.8799285888671875, -0.833251953125, -0.7865753173828125, -0.739898681640625, -0.6932220458984375, -0.64654541015625, -0.5998687744140625, -0.553192138671875, -0.5065155029296875, -0.4598388671875, -0.4131622314453125, -0.366485595703125, -0.3198089599609375, -0.27313232421875, -0.2264556884765625, -0.179779052734375, -0.1331024169921875, -0.08642578125, -0.0397491455078125, 0.006927490234375, 0.0536041259765625, 0.10028076171875, 0.1469573974609375, 0.193634033203125, 0.2403106689453125, 0.2869873046875, 0.3336639404296875, 0.380340576171875, 0.4270172119140625, 0.47369384765625, 0.5203704833984375, 0.567047119140625, 0.6137237548828125, 0.660400390625, 0.7070770263671875, 0.753753662109375, 0.8004302978515625, 0.84710693359375, 0.8937835693359375, 0.940460205078125, 0.9871368408203125, 1.0338134765625, 1.0804901123046875, 1.127166748046875, 1.1738433837890625, 1.22052001953125, 1.2671966552734375, 1.313873291015625, 1.3605499267578125, 1.4072265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 5.0, 22.0, 22.0, 35.0, 53.0, 71.0, 95.0, 148.0, 149.0, 108.0, 73.0, 65.0, 39.0, 31.0, 18.0, 16.0, 12.0, 11.0, 8.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004520416259765625, -0.0004402250051498413, -0.0004284083843231201, -0.0004165917634963989, -0.00040477514266967773, -0.00039295852184295654, -0.00038114190101623535, -0.00036932528018951416, -0.00035750865936279297, -0.0003456920385360718, -0.0003338754177093506, -0.0003220587968826294, -0.0003102421760559082, -0.000298425555229187, -0.0002866089344024658, -0.00027479231357574463, -0.00026297569274902344, -0.00025115907192230225, -0.00023934245109558105, -0.00022752583026885986, -0.00021570920944213867, -0.00020389258861541748, -0.0001920759677886963, -0.0001802593469619751, -0.0001684427261352539, -0.00015662610530853271, -0.00014480948448181152, -0.00013299286365509033, -0.00012117624282836914, -0.00010935962200164795, -9.754300117492676e-05, -8.572638034820557e-05, -7.390975952148438e-05, -6.209313869476318e-05, -5.027651786804199e-05, -3.84598970413208e-05, -2.664327621459961e-05, -1.4826655387878418e-05, -3.0100345611572266e-06, 8.806586265563965e-06, 2.0623207092285156e-05, 3.243982791900635e-05, 4.425644874572754e-05, 5.607306957244873e-05, 6.788969039916992e-05, 7.970631122589111e-05, 9.15229320526123e-05, 0.0001033395528793335, 0.00011515617370605469, 0.00012697279453277588, 0.00013878941535949707, 0.00015060603618621826, 0.00016242265701293945, 0.00017423927783966064, 0.00018605589866638184, 0.00019787251949310303, 0.00020968914031982422, 0.0002215057611465454, 0.0002333223819732666, 0.0002451390027999878, 0.000256955623626709, 0.0002687722444534302, 0.00028058886528015137, 0.00029240548610687256, 0.00030422210693359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 10.0, 12.0, 19.0, 24.0, 35.0, 67.0, 112.0, 164.0, 311.0, 633.0, 1489.0, 4663.0, 19040.0, 149140.0, 779518.0, 75398.0, 12371.0, 3218.0, 1162.0, 509.0, 248.0, 134.0, 91.0, 68.0, 39.0, 19.0, 16.0, 16.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.931640625, -1.863525390625, -1.79541015625, -1.727294921875, -1.6591796875, -1.591064453125, -1.52294921875, -1.454833984375, -1.38671875, -1.318603515625, -1.25048828125, -1.182373046875, -1.1142578125, -1.046142578125, -0.97802734375, -0.909912109375, -0.841796875, -0.773681640625, -0.70556640625, -0.637451171875, -0.5693359375, -0.501220703125, -0.43310546875, -0.364990234375, -0.296875, -0.228759765625, -0.16064453125, -0.092529296875, -0.0244140625, 0.043701171875, 0.11181640625, 0.179931640625, 0.248046875, 0.316162109375, 0.38427734375, 0.452392578125, 0.5205078125, 0.588623046875, 0.65673828125, 0.724853515625, 0.79296875, 0.861083984375, 0.92919921875, 0.997314453125, 1.0654296875, 1.133544921875, 1.20166015625, 1.269775390625, 1.337890625, 1.406005859375, 1.47412109375, 1.542236328125, 1.6103515625, 1.678466796875, 1.74658203125, 1.814697265625, 1.8828125, 1.950927734375, 2.01904296875, 2.087158203125, 2.1552734375, 2.223388671875, 2.29150390625, 2.359619140625, 2.427734375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 6.0, 12.0, 14.0, 33.0, 24.0, 35.0, 24.0, 45.0, 54.0, 65.0, 108.0, 101.0, 100.0, 86.0, 65.0, 53.0, 34.0, 29.0, 29.0, 22.0, 11.0, 9.0, 11.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.548828125, -1.4963531494140625, -1.443878173828125, -1.3914031982421875, -1.33892822265625, -1.2864532470703125, -1.233978271484375, -1.1815032958984375, -1.1290283203125, -1.0765533447265625, -1.024078369140625, -0.9716033935546875, -0.91912841796875, -0.8666534423828125, -0.814178466796875, -0.7617034912109375, -0.709228515625, -0.6567535400390625, -0.604278564453125, -0.5518035888671875, -0.49932861328125, -0.4468536376953125, -0.394378662109375, -0.3419036865234375, -0.2894287109375, -0.2369537353515625, -0.184478759765625, -0.1320037841796875, -0.07952880859375, -0.0270538330078125, 0.025421142578125, 0.0778961181640625, 0.13037109375, 0.1828460693359375, 0.235321044921875, 0.2877960205078125, 0.34027099609375, 0.3927459716796875, 0.445220947265625, 0.4976959228515625, 0.5501708984375, 0.6026458740234375, 0.655120849609375, 0.7075958251953125, 0.76007080078125, 0.8125457763671875, 0.865020751953125, 0.9174957275390625, 0.969970703125, 1.0224456787109375, 1.074920654296875, 1.1273956298828125, 1.17987060546875, 1.2323455810546875, 1.284820556640625, 1.3372955322265625, 1.3897705078125, 1.4422454833984375, 1.494720458984375, 1.5471954345703125, 1.59967041015625, 1.6521453857421875, 1.704620361328125, 1.7570953369140625, 1.8095703125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 10.0, 13.0, 21.0, 73.0, 143.0, 341.0, 188.0, 108.0, 43.0, 23.0, 12.0, 9.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.65494155883789, -26.091903686523438, -24.528865814208984, -22.96582794189453, -21.402790069580078, -19.839752197265625, -18.276716232299805, -16.71367835998535, -15.150640487670898, -13.587602615356445, -12.024564743041992, -10.461527824401855, -8.898489952087402, -7.335452079772949, -5.7724151611328125, -4.209377288818359, -2.6463394165039062, -1.0833017826080322, 0.4797358512878418, 2.0427732467651367, 3.60581111907959, 5.168848991394043, 6.73188591003418, 8.294923782348633, 9.857961654663086, 11.420999526977539, 12.984037399291992, 14.547074317932129, 16.110111236572266, 17.67314910888672, 19.236186981201172, 20.799224853515625, 22.362258911132812, 23.925296783447266, 25.48833465576172, 27.051372528076172, 28.614410400390625, 30.177448272705078, 31.7404842376709, 33.30352020263672, 34.86656188964844, 36.42959976196289, 37.992637634277344, 39.5556755065918, 41.11871337890625, 42.6817512512207, 44.244789123535156, 45.807823181152344, 47.3708610534668, 48.93389892578125, 50.4969367980957, 52.059974670410156, 53.62301254272461, 55.18605041503906, 56.74908447265625, 58.31212615966797, 59.875160217285156, 61.43819808959961, 63.00123596191406, 64.56427001953125, 66.12731170654297, 67.69034576416016, 69.25338745117188, 70.81642150878906, 72.37946319580078]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 6.0, 10.0, 9.0, 10.0, 12.0, 13.0, 18.0, 15.0, 14.0, 20.0, 27.0, 27.0, 26.0, 29.0, 43.0, 34.0, 40.0, 48.0, 67.0, 65.0, 75.0, 53.0, 38.0, 30.0, 31.0, 25.0, 29.0, 25.0, 23.0, 20.0, 18.0, 16.0, 10.0, 9.0, 13.0, 10.0, 8.0, 2.0, 8.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.214447021484375, -22.41911506652832, -21.623783111572266, -20.82845115661621, -20.033119201660156, -19.2377872467041, -18.442455291748047, -17.647123336791992, -16.851791381835938, -16.056459426879883, -15.261127471923828, -14.465795516967773, -13.670463562011719, -12.875131607055664, -12.07979965209961, -11.284467697143555, -10.4891357421875, -9.693803787231445, -8.89847183227539, -8.103139877319336, -7.307807922363281, -6.512475967407227, -5.717144012451172, -4.921812057495117, -4.1264801025390625, -3.331148147583008, -2.535816192626953, -1.7404842376708984, -0.9451522827148438, -0.14982032775878906, 0.6455116271972656, 1.4408435821533203, 2.236173629760742, 3.031505584716797, 3.8268375396728516, 4.622169494628906, 5.417501449584961, 6.212833404541016, 7.00816535949707, 7.803497314453125, 8.59882926940918, 9.394161224365234, 10.189493179321289, 10.984825134277344, 11.780157089233398, 12.575489044189453, 13.370820999145508, 14.166152954101562, 14.961484909057617, 15.756816864013672, 16.552148818969727, 17.34748077392578, 18.142812728881836, 18.93814468383789, 19.733476638793945, 20.52880859375, 21.324140548706055, 22.11947250366211, 22.914804458618164, 23.71013641357422, 24.505468368530273, 25.300800323486328, 26.096132278442383, 26.891464233398438, 27.686796188354492]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 12.0, 9.0, 7.0, 18.0, 28.0, 54.0, 57.0, 83.0, 159.0, 182.0, 262.0, 368.0, 534.0, 951.0, 1308.0, 2236.0, 4040.0, 8803.0, 26296.0, 98901.0, 473016.0, 2012369.0, 1226519.0, 247187.0, 58714.0, 17474.0, 6334.0, 3180.0, 1777.0, 1071.0, 724.0, 482.0, 337.0, 229.0, 157.0, 129.0, 93.0, 49.0, 37.0, 30.0, 18.0, 15.0, 13.0, 8.0, 10.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.7392578125, -1.690673828125, -1.64208984375, -1.593505859375, -1.544921875, -1.496337890625, -1.44775390625, -1.399169921875, -1.3505859375, -1.302001953125, -1.25341796875, -1.204833984375, -1.15625, -1.107666015625, -1.05908203125, -1.010498046875, -0.9619140625, -0.913330078125, -0.86474609375, -0.816162109375, -0.767578125, -0.718994140625, -0.67041015625, -0.621826171875, -0.5732421875, -0.524658203125, -0.47607421875, -0.427490234375, -0.37890625, -0.330322265625, -0.28173828125, -0.233154296875, -0.1845703125, -0.135986328125, -0.08740234375, -0.038818359375, 0.009765625, 0.058349609375, 0.10693359375, 0.155517578125, 0.2041015625, 0.252685546875, 0.30126953125, 0.349853515625, 0.3984375, 0.447021484375, 0.49560546875, 0.544189453125, 0.5927734375, 0.641357421875, 0.68994140625, 0.738525390625, 0.787109375, 0.835693359375, 0.88427734375, 0.932861328125, 0.9814453125, 1.030029296875, 1.07861328125, 1.127197265625, 1.17578125, 1.224365234375, 1.27294921875, 1.321533203125, 1.3701171875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 8.0, 10.0, 16.0, 17.0, 16.0, 13.0, 20.0, 23.0, 13.0, 26.0, 36.0, 33.0, 39.0, 43.0, 49.0, 47.0, 62.0, 44.0, 46.0, 38.0, 45.0, 37.0, 38.0, 35.0, 39.0, 31.0, 32.0, 27.0, 30.0, 12.0, 19.0, 11.0, 8.0, 8.0, 7.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.046234130859375, -1.98504638671875, -1.923858642578125, -1.8626708984375, -1.801483154296875, -1.74029541015625, -1.679107666015625, -1.617919921875, -1.556732177734375, -1.49554443359375, -1.434356689453125, -1.3731689453125, -1.311981201171875, -1.25079345703125, -1.189605712890625, -1.12841796875, -1.067230224609375, -1.00604248046875, -0.944854736328125, -0.8836669921875, -0.822479248046875, -0.76129150390625, -0.700103759765625, -0.638916015625, -0.577728271484375, -0.51654052734375, -0.455352783203125, -0.3941650390625, -0.332977294921875, -0.27178955078125, -0.210601806640625, -0.1494140625, -0.088226318359375, -0.02703857421875, 0.034149169921875, 0.0953369140625, 0.156524658203125, 0.21771240234375, 0.278900146484375, 0.340087890625, 0.401275634765625, 0.46246337890625, 0.523651123046875, 0.5848388671875, 0.646026611328125, 0.70721435546875, 0.768402099609375, 0.82958984375, 0.890777587890625, 0.95196533203125, 1.013153076171875, 1.0743408203125, 1.135528564453125, 1.19671630859375, 1.257904052734375, 1.319091796875, 1.380279541015625, 1.44146728515625, 1.502655029296875, 1.5638427734375, 1.625030517578125, 1.68621826171875, 1.747406005859375, 1.80859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 9.0, 5.0, 11.0, 18.0, 34.0, 56.0, 121.0, 299.0, 1305.0, 26377.0, 4142510.0, 21632.0, 1345.0, 280.0, 122.0, 70.0, 47.0, 25.0, 14.0, 3.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1796875, -10.7728271484375, -10.365966796875, -9.9591064453125, -9.55224609375, -9.1453857421875, -8.738525390625, -8.3316650390625, -7.9248046875, -7.5179443359375, -7.111083984375, -6.7042236328125, -6.29736328125, -5.8905029296875, -5.483642578125, -5.0767822265625, -4.669921875, -4.2630615234375, -3.856201171875, -3.4493408203125, -3.04248046875, -2.6356201171875, -2.228759765625, -1.8218994140625, -1.4150390625, -1.0081787109375, -0.601318359375, -0.1944580078125, 0.21240234375, 0.6192626953125, 1.026123046875, 1.4329833984375, 1.83984375, 2.2467041015625, 2.653564453125, 3.0604248046875, 3.46728515625, 3.8741455078125, 4.281005859375, 4.6878662109375, 5.0947265625, 5.5015869140625, 5.908447265625, 6.3153076171875, 6.72216796875, 7.1290283203125, 7.535888671875, 7.9427490234375, 8.349609375, 8.7564697265625, 9.163330078125, 9.5701904296875, 9.97705078125, 10.3839111328125, 10.790771484375, 11.1976318359375, 11.6044921875, 12.0113525390625, 12.418212890625, 12.8250732421875, 13.23193359375, 13.6387939453125, 14.045654296875, 14.4525146484375, 14.859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 7.0, 10.0, 15.0, 21.0, 43.0, 78.0, 197.0, 513.0, 1290.0, 1131.0, 440.0, 160.0, 74.0, 30.0, 25.0, 13.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.826171875, -3.643341064453125, -3.46051025390625, -3.277679443359375, -3.0948486328125, -2.912017822265625, -2.72918701171875, -2.546356201171875, -2.363525390625, -2.180694580078125, -1.99786376953125, -1.815032958984375, -1.6322021484375, -1.449371337890625, -1.26654052734375, -1.083709716796875, -0.90087890625, -0.718048095703125, -0.53521728515625, -0.352386474609375, -0.1695556640625, 0.013275146484375, 0.19610595703125, 0.378936767578125, 0.561767578125, 0.744598388671875, 0.92742919921875, 1.110260009765625, 1.2930908203125, 1.475921630859375, 1.65875244140625, 1.841583251953125, 2.0244140625, 2.207244873046875, 2.39007568359375, 2.572906494140625, 2.7557373046875, 2.938568115234375, 3.12139892578125, 3.304229736328125, 3.487060546875, 3.669891357421875, 3.85272216796875, 4.035552978515625, 4.2183837890625, 4.401214599609375, 4.58404541015625, 4.766876220703125, 4.94970703125, 5.132537841796875, 5.31536865234375, 5.498199462890625, 5.6810302734375, 5.863861083984375, 6.04669189453125, 6.229522705078125, 6.412353515625, 6.595184326171875, 6.77801513671875, 6.960845947265625, 7.1436767578125, 7.326507568359375, 7.50933837890625, 7.692169189453125, 7.875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 10.0, 20.0, 65.0, 162.0, 355.0, 251.0, 98.0, 27.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.03592681884766, -69.33355712890625, -67.63119506835938, -65.92882537841797, -64.2264633178711, -62.52409744262695, -60.82173156738281, -59.11936569213867, -57.41699981689453, -55.71463394165039, -54.01226806640625, -52.30990219116211, -50.60753631591797, -48.90517044067383, -47.20280456542969, -45.50043869018555, -43.798072814941406, -42.095706939697266, -40.393341064453125, -38.690975189208984, -36.988609313964844, -35.2862434387207, -33.58387756347656, -31.881511688232422, -30.179141998291016, -28.476776123046875, -26.774410247802734, -25.072044372558594, -23.369678497314453, -21.667312622070312, -19.964946746826172, -18.26258087158203, -16.56021499633789, -14.85784912109375, -13.15548324584961, -11.453117370605469, -9.750751495361328, -8.048384666442871, -6.3460187911987305, -4.64365291595459, -2.941287040710449, -1.238921046257019, 0.46344494819641113, 2.165811061859131, 3.8681769371032715, 5.57054328918457, 7.272909164428711, 8.975275039672852, 10.677640914916992, 12.380006790161133, 14.082372665405273, 15.784738540649414, 17.487104415893555, 19.189472198486328, 20.89183807373047, 22.59420394897461, 24.29656982421875, 25.99893569946289, 27.70130157470703, 29.403667449951172, 31.106033325195312, 32.80839920043945, 34.510765075683594, 36.213130950927734, 37.915496826171875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 6.0, 9.0, 7.0, 5.0, 8.0, 12.0, 11.0, 14.0, 23.0, 18.0, 28.0, 33.0, 36.0, 29.0, 38.0, 50.0, 32.0, 47.0, 32.0, 38.0, 38.0, 49.0, 32.0, 43.0, 31.0, 37.0, 33.0, 38.0, 25.0, 29.0, 28.0, 25.0, 19.0, 13.0, 10.0, 13.0, 12.0, 5.0, 6.0, 9.0, 4.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-14.523801803588867, -14.1176176071167, -13.711434364318848, -13.30525016784668, -12.899065971374512, -12.492881774902344, -12.086698532104492, -11.680514335632324, -11.274330139160156, -10.868145942687988, -10.461962699890137, -10.055778503417969, -9.6495943069458, -9.243410110473633, -8.837226867675781, -8.431042671203613, -8.024859428405762, -7.618675708770752, -7.212491512298584, -6.806307792663574, -6.400123596191406, -5.9939398765563965, -5.587756156921387, -5.181571960449219, -4.775388240814209, -4.369204521179199, -3.9630203247070312, -3.5568366050720215, -3.1506526470184326, -2.7444686889648438, -2.338284969329834, -1.9321010112762451, -1.5259160995483398, -1.119732141494751, -0.7135483026504517, -0.30736446380615234, 0.09881949424743652, 0.5050034523010254, 0.9111871719360352, 1.317371129989624, 1.723555088043213, 2.1297390460968018, 2.5359230041503906, 2.9421067237854004, 3.3482906818389893, 3.754474639892578, 4.160658359527588, 4.566842079162598, 4.973026275634766, 5.379209995269775, 5.785394191741943, 6.191577911376953, 6.597762107849121, 7.003945827484131, 7.410129547119141, 7.816313743591309, 8.222497940063477, 8.628682136535645, 9.034865379333496, 9.441049575805664, 9.847233772277832, 10.25341796875, 10.659601211547852, 11.06578540802002, 11.471968650817871]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 9.0, 3.0, 6.0, 5.0, 11.0, 8.0, 18.0, 31.0, 37.0, 47.0, 68.0, 86.0, 167.0, 209.0, 300.0, 491.0, 808.0, 1279.0, 2249.0, 4080.0, 7837.0, 15612.0, 33644.0, 78697.0, 204745.0, 378786.0, 185222.0, 71700.0, 30972.0, 14520.0, 7443.0, 3924.0, 2126.0, 1230.0, 758.0, 473.0, 302.0, 182.0, 123.0, 103.0, 69.0, 48.0, 43.0, 31.0, 14.0, 16.0, 11.0, 8.0, 5.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.234375, -2.163330078125, -2.09228515625, -2.021240234375, -1.9501953125, -1.879150390625, -1.80810546875, -1.737060546875, -1.666015625, -1.594970703125, -1.52392578125, -1.452880859375, -1.3818359375, -1.310791015625, -1.23974609375, -1.168701171875, -1.09765625, -1.026611328125, -0.95556640625, -0.884521484375, -0.8134765625, -0.742431640625, -0.67138671875, -0.600341796875, -0.529296875, -0.458251953125, -0.38720703125, -0.316162109375, -0.2451171875, -0.174072265625, -0.10302734375, -0.031982421875, 0.0390625, 0.110107421875, 0.18115234375, 0.252197265625, 0.3232421875, 0.394287109375, 0.46533203125, 0.536376953125, 0.607421875, 0.678466796875, 0.74951171875, 0.820556640625, 0.8916015625, 0.962646484375, 1.03369140625, 1.104736328125, 1.17578125, 1.246826171875, 1.31787109375, 1.388916015625, 1.4599609375, 1.531005859375, 1.60205078125, 1.673095703125, 1.744140625, 1.815185546875, 1.88623046875, 1.957275390625, 2.0283203125, 2.099365234375, 2.17041015625, 2.241455078125, 2.3125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 8.0, 10.0, 12.0, 9.0, 10.0, 17.0, 14.0, 13.0, 16.0, 35.0, 26.0, 21.0, 31.0, 28.0, 37.0, 38.0, 51.0, 47.0, 47.0, 46.0, 35.0, 52.0, 36.0, 40.0, 42.0, 27.0, 32.0, 36.0, 27.0, 22.0, 24.0, 22.0, 16.0, 12.0, 11.0, 8.0, 9.0, 7.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.07421875, -2.015533447265625, -1.95684814453125, -1.898162841796875, -1.8394775390625, -1.780792236328125, -1.72210693359375, -1.663421630859375, -1.604736328125, -1.546051025390625, -1.48736572265625, -1.428680419921875, -1.3699951171875, -1.311309814453125, -1.25262451171875, -1.193939208984375, -1.13525390625, -1.076568603515625, -1.01788330078125, -0.959197998046875, -0.9005126953125, -0.841827392578125, -0.78314208984375, -0.724456787109375, -0.665771484375, -0.607086181640625, -0.54840087890625, -0.489715576171875, -0.4310302734375, -0.372344970703125, -0.31365966796875, -0.254974365234375, -0.1962890625, -0.137603759765625, -0.07891845703125, -0.020233154296875, 0.0384521484375, 0.097137451171875, 0.15582275390625, 0.214508056640625, 0.273193359375, 0.331878662109375, 0.39056396484375, 0.449249267578125, 0.5079345703125, 0.566619873046875, 0.62530517578125, 0.683990478515625, 0.74267578125, 0.801361083984375, 0.86004638671875, 0.918731689453125, 0.9774169921875, 1.036102294921875, 1.09478759765625, 1.153472900390625, 1.212158203125, 1.270843505859375, 1.32952880859375, 1.388214111328125, 1.4468994140625, 1.505584716796875, 1.56427001953125, 1.622955322265625, 1.681640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 0.0, 4.0, 3.0, 2.0, 6.0, 8.0, 16.0, 8.0, 16.0, 25.0, 29.0, 36.0, 50.0, 72.0, 107.0, 155.0, 189.0, 304.0, 532.0, 1212.0, 3262.0, 14097.0, 116343.0, 824770.0, 71858.0, 10237.0, 2655.0, 1030.0, 520.0, 303.0, 183.0, 154.0, 101.0, 63.0, 55.0, 43.0, 28.0, 14.0, 9.0, 15.0, 10.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.3984375, -6.20098876953125, -6.0035400390625, -5.80609130859375, -5.608642578125, -5.41119384765625, -5.2137451171875, -5.01629638671875, -4.81884765625, -4.62139892578125, -4.4239501953125, -4.22650146484375, -4.029052734375, -3.83160400390625, -3.6341552734375, -3.43670654296875, -3.2392578125, -3.04180908203125, -2.8443603515625, -2.64691162109375, -2.449462890625, -2.25201416015625, -2.0545654296875, -1.85711669921875, -1.65966796875, -1.46221923828125, -1.2647705078125, -1.06732177734375, -0.869873046875, -0.67242431640625, -0.4749755859375, -0.27752685546875, -0.080078125, 0.11737060546875, 0.3148193359375, 0.51226806640625, 0.709716796875, 0.90716552734375, 1.1046142578125, 1.30206298828125, 1.49951171875, 1.69696044921875, 1.8944091796875, 2.09185791015625, 2.289306640625, 2.48675537109375, 2.6842041015625, 2.88165283203125, 3.0791015625, 3.27655029296875, 3.4739990234375, 3.67144775390625, 3.868896484375, 4.06634521484375, 4.2637939453125, 4.46124267578125, 4.65869140625, 4.85614013671875, 5.0535888671875, 5.25103759765625, 5.448486328125, 5.64593505859375, 5.8433837890625, 6.04083251953125, 6.23828125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 17.0, 21.0, 19.0, 22.0, 23.0, 29.0, 32.0, 38.0, 44.0, 54.0, 56.0, 76.0, 66.0, 58.0, 68.0, 51.0, 60.0, 42.0, 39.0, 32.0, 23.0, 24.0, 18.0, 12.0, 18.0, 12.0, 11.0, 6.0, 7.0, 2.0, 6.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.953125, -8.67236328125, -8.3916015625, -8.11083984375, -7.830078125, -7.54931640625, -7.2685546875, -6.98779296875, -6.70703125, -6.42626953125, -6.1455078125, -5.86474609375, -5.583984375, -5.30322265625, -5.0224609375, -4.74169921875, -4.4609375, -4.18017578125, -3.8994140625, -3.61865234375, -3.337890625, -3.05712890625, -2.7763671875, -2.49560546875, -2.21484375, -1.93408203125, -1.6533203125, -1.37255859375, -1.091796875, -0.81103515625, -0.5302734375, -0.24951171875, 0.03125, 0.31201171875, 0.5927734375, 0.87353515625, 1.154296875, 1.43505859375, 1.7158203125, 1.99658203125, 2.27734375, 2.55810546875, 2.8388671875, 3.11962890625, 3.400390625, 3.68115234375, 3.9619140625, 4.24267578125, 4.5234375, 4.80419921875, 5.0849609375, 5.36572265625, 5.646484375, 5.92724609375, 6.2080078125, 6.48876953125, 6.76953125, 7.05029296875, 7.3310546875, 7.61181640625, 7.892578125, 8.17333984375, 8.4541015625, 8.73486328125, 9.015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 9.0, 19.0, 51.0, 72.0, 115.0, 315.0, 838.0, 2913.0, 13064.0, 123833.0, 858595.0, 39501.0, 6606.0, 1616.0, 556.0, 198.0, 90.0, 45.0, 36.0, 22.0, 7.0, 5.0, 5.0, 7.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.29296875, -3.19964599609375, -3.1063232421875, -3.01300048828125, -2.919677734375, -2.82635498046875, -2.7330322265625, -2.63970947265625, -2.54638671875, -2.45306396484375, -2.3597412109375, -2.26641845703125, -2.173095703125, -2.07977294921875, -1.9864501953125, -1.89312744140625, -1.7998046875, -1.70648193359375, -1.6131591796875, -1.51983642578125, -1.426513671875, -1.33319091796875, -1.2398681640625, -1.14654541015625, -1.05322265625, -0.95989990234375, -0.8665771484375, -0.77325439453125, -0.679931640625, -0.58660888671875, -0.4932861328125, -0.39996337890625, -0.306640625, -0.21331787109375, -0.1199951171875, -0.02667236328125, 0.066650390625, 0.15997314453125, 0.2532958984375, 0.34661865234375, 0.43994140625, 0.53326416015625, 0.6265869140625, 0.71990966796875, 0.813232421875, 0.90655517578125, 0.9998779296875, 1.09320068359375, 1.1865234375, 1.27984619140625, 1.3731689453125, 1.46649169921875, 1.559814453125, 1.65313720703125, 1.7464599609375, 1.83978271484375, 1.93310546875, 2.02642822265625, 2.1197509765625, 2.21307373046875, 2.306396484375, 2.39971923828125, 2.4930419921875, 2.58636474609375, 2.6796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 6.0, 3.0, 12.0, 12.0, 24.0, 29.0, 51.0, 110.0, 225.0, 217.0, 124.0, 65.0, 40.0, 18.0, 15.0, 11.0, 10.0, 5.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006418228149414062, -0.0006218254566192627, -0.0006018280982971191, -0.0005818307399749756, -0.000561833381652832, -0.0005418360233306885, -0.0005218386650085449, -0.0005018413066864014, -0.0004818439483642578, -0.00046184659004211426, -0.0004418492317199707, -0.00042185187339782715, -0.0004018545150756836, -0.00038185715675354004, -0.0003618597984313965, -0.00034186244010925293, -0.0003218650817871094, -0.0003018677234649658, -0.00028187036514282227, -0.0002618730068206787, -0.00024187564849853516, -0.0002218782901763916, -0.00020188093185424805, -0.0001818835735321045, -0.00016188621520996094, -0.00014188885688781738, -0.00012189149856567383, -0.00010189414024353027, -8.189678192138672e-05, -6.189942359924316e-05, -4.190206527709961e-05, -2.1904706954956055e-05, -1.9073486328125e-06, 1.8090009689331055e-05, 3.808736801147461e-05, 5.8084726333618164e-05, 7.808208465576172e-05, 9.807944297790527e-05, 0.00011807680130004883, 0.00013807415962219238, 0.00015807151794433594, 0.0001780688762664795, 0.00019806623458862305, 0.0002180635929107666, 0.00023806095123291016, 0.0002580583095550537, 0.00027805566787719727, 0.0002980530261993408, 0.0003180503845214844, 0.00033804774284362793, 0.0003580451011657715, 0.00037804245948791504, 0.0003980398178100586, 0.00041803717613220215, 0.0004380345344543457, 0.00045803189277648926, 0.0004780292510986328, 0.0004980266094207764, 0.0005180239677429199, 0.0005380213260650635, 0.000558018684387207, 0.0005780160427093506, 0.0005980134010314941, 0.0006180107593536377, 0.0006380081176757812]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 7.0, 7.0, 8.0, 10.0, 11.0, 35.0, 62.0, 126.0, 386.0, 1863.0, 33641.0, 997700.0, 13011.0, 1158.0, 288.0, 110.0, 39.0, 35.0, 19.0, 10.0, 12.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265625, -5.07330322265625, -4.8809814453125, -4.68865966796875, -4.496337890625, -4.30401611328125, -4.1116943359375, -3.91937255859375, -3.72705078125, -3.53472900390625, -3.3424072265625, -3.15008544921875, -2.957763671875, -2.76544189453125, -2.5731201171875, -2.38079833984375, -2.1884765625, -1.99615478515625, -1.8038330078125, -1.61151123046875, -1.419189453125, -1.22686767578125, -1.0345458984375, -0.84222412109375, -0.64990234375, -0.45758056640625, -0.2652587890625, -0.07293701171875, 0.119384765625, 0.31170654296875, 0.5040283203125, 0.69635009765625, 0.888671875, 1.08099365234375, 1.2733154296875, 1.46563720703125, 1.657958984375, 1.85028076171875, 2.0426025390625, 2.23492431640625, 2.42724609375, 2.61956787109375, 2.8118896484375, 3.00421142578125, 3.196533203125, 3.38885498046875, 3.5811767578125, 3.77349853515625, 3.9658203125, 4.15814208984375, 4.3504638671875, 4.54278564453125, 4.735107421875, 4.92742919921875, 5.1197509765625, 5.31207275390625, 5.50439453125, 5.69671630859375, 5.8890380859375, 6.08135986328125, 6.273681640625, 6.46600341796875, 6.6583251953125, 6.85064697265625, 7.04296875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 8.0, 16.0, 20.0, 46.0, 83.0, 146.0, 239.0, 205.0, 79.0, 52.0, 33.0, 28.0, 14.0, 7.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.615234375, -3.508087158203125, -3.40093994140625, -3.293792724609375, -3.1866455078125, -3.079498291015625, -2.97235107421875, -2.865203857421875, -2.758056640625, -2.650909423828125, -2.54376220703125, -2.436614990234375, -2.3294677734375, -2.222320556640625, -2.11517333984375, -2.008026123046875, -1.90087890625, -1.793731689453125, -1.68658447265625, -1.579437255859375, -1.4722900390625, -1.365142822265625, -1.25799560546875, -1.150848388671875, -1.043701171875, -0.936553955078125, -0.82940673828125, -0.722259521484375, -0.6151123046875, -0.507965087890625, -0.40081787109375, -0.293670654296875, -0.1865234375, -0.079376220703125, 0.02777099609375, 0.134918212890625, 0.2420654296875, 0.349212646484375, 0.45635986328125, 0.563507080078125, 0.670654296875, 0.777801513671875, 0.88494873046875, 0.992095947265625, 1.0992431640625, 1.206390380859375, 1.31353759765625, 1.420684814453125, 1.52783203125, 1.634979248046875, 1.74212646484375, 1.849273681640625, 1.9564208984375, 2.063568115234375, 2.17071533203125, 2.277862548828125, 2.385009765625, 2.492156982421875, 2.59930419921875, 2.706451416015625, 2.8135986328125, 2.920745849609375, 3.02789306640625, 3.135040283203125, 3.2421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 11.0, 16.0, 35.0, 49.0, 112.0, 258.0, 253.0, 130.0, 67.0, 30.0, 13.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.383201599121094, -34.07194519042969, -32.76069259643555, -31.44943618774414, -30.138181686401367, -28.826927185058594, -27.515670776367188, -26.204416275024414, -24.89316177368164, -23.581907272338867, -22.270652770996094, -20.959396362304688, -19.648141860961914, -18.33688735961914, -17.025630950927734, -15.714376449584961, -14.403121948242188, -13.091867446899414, -11.780611991882324, -10.469356536865234, -9.158102035522461, -7.846847057342529, -6.535592079162598, -5.224336624145508, -3.9130821228027344, -2.6018271446228027, -1.290572166442871, 0.020682811737060547, 1.3319377899169922, 2.643192768096924, 3.9544477462768555, 5.265703201293945, 6.576953887939453, 7.888208866119385, 9.199463844299316, 10.510719299316406, 11.82197380065918, 13.133228302001953, 14.444483757019043, 15.755739212036133, 17.066993713378906, 18.37824821472168, 19.689502716064453, 21.00075912475586, 22.312013626098633, 23.623268127441406, 24.934524536132812, 26.245779037475586, 27.55703353881836, 28.868288040161133, 30.179542541503906, 31.490798950195312, 32.80205535888672, 34.11330795288086, 35.424564361572266, 36.735816955566406, 38.04707336425781, 39.35832977294922, 40.66958236694336, 41.980838775634766, 43.292091369628906, 44.60334777832031, 45.91460418701172, 47.225860595703125, 48.537113189697266]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 2.0, 4.0, 4.0, 9.0, 2.0, 12.0, 11.0, 13.0, 8.0, 11.0, 15.0, 16.0, 16.0, 26.0, 35.0, 34.0, 37.0, 44.0, 62.0, 60.0, 94.0, 96.0, 60.0, 40.0, 38.0, 34.0, 25.0, 25.0, 15.0, 34.0, 17.0, 20.0, 16.0, 11.0, 11.0, 6.0, 11.0, 2.0, 9.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.35497283935547, -22.480236053466797, -21.605499267578125, -20.730762481689453, -19.856027603149414, -18.981290817260742, -18.10655403137207, -17.2318172454834, -16.35708236694336, -15.482345581054688, -14.607609748840332, -13.73287296295166, -12.858137130737305, -11.983400344848633, -11.108663558959961, -10.233926773071289, -9.359189987182617, -8.484453201293945, -7.60971736907959, -6.734980583190918, -5.860244274139404, -4.985507965087891, -4.110771179199219, -3.236034870147705, -2.3612985610961914, -1.4865621328353882, -0.611825704574585, 0.2629108428955078, 1.1376471519470215, 2.012383460998535, 2.887120246887207, 3.7618565559387207, 4.636592864990234, 5.511329174041748, 6.386065483093262, 7.260802268981934, 8.135538101196289, 9.010274887084961, 9.885011672973633, 10.759748458862305, 11.63448429107666, 12.509221076965332, 13.383956909179688, 14.25869369506836, 15.133430480957031, 16.008167266845703, 16.882904052734375, 17.757638931274414, 18.632375717163086, 19.507112503051758, 20.38184928894043, 21.25658416748047, 22.13132095336914, 23.006057739257812, 23.880794525146484, 24.755531311035156, 25.630268096923828, 26.5050048828125, 27.379741668701172, 28.254478454589844, 29.129213333129883, 30.003950119018555, 30.878686904907227, 31.7534236907959, 32.62815856933594]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 10.0, 9.0, 12.0, 16.0, 33.0, 33.0, 39.0, 63.0, 102.0, 124.0, 195.0, 286.0, 430.0, 806.0, 1367.0, 2509.0, 5398.0, 15743.0, 114157.0, 1818787.0, 2070663.0, 133683.0, 17650.0, 5709.0, 2667.0, 1451.0, 823.0, 534.0, 334.0, 183.0, 134.0, 85.0, 58.0, 50.0, 30.0, 36.0, 13.0, 19.0, 9.0, 12.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09765625, -2.9945068359375, -2.891357421875, -2.7882080078125, -2.68505859375, -2.5819091796875, -2.478759765625, -2.3756103515625, -2.2724609375, -2.1693115234375, -2.066162109375, -1.9630126953125, -1.85986328125, -1.7567138671875, -1.653564453125, -1.5504150390625, -1.447265625, -1.3441162109375, -1.240966796875, -1.1378173828125, -1.03466796875, -0.9315185546875, -0.828369140625, -0.7252197265625, -0.6220703125, -0.5189208984375, -0.415771484375, -0.3126220703125, -0.20947265625, -0.1063232421875, -0.003173828125, 0.0999755859375, 0.203125, 0.3062744140625, 0.409423828125, 0.5125732421875, 0.61572265625, 0.7188720703125, 0.822021484375, 0.9251708984375, 1.0283203125, 1.1314697265625, 1.234619140625, 1.3377685546875, 1.44091796875, 1.5440673828125, 1.647216796875, 1.7503662109375, 1.853515625, 1.9566650390625, 2.059814453125, 2.1629638671875, 2.26611328125, 2.3692626953125, 2.472412109375, 2.5755615234375, 2.6787109375, 2.7818603515625, 2.885009765625, 2.9881591796875, 3.09130859375, 3.1944580078125, 3.297607421875, 3.4007568359375, 3.50390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 15.0, 20.0, 11.0, 17.0, 19.0, 22.0, 27.0, 24.0, 25.0, 29.0, 40.0, 40.0, 50.0, 35.0, 56.0, 57.0, 31.0, 42.0, 48.0, 61.0, 36.0, 42.0, 33.0, 36.0, 31.0, 25.0, 23.0, 14.0, 10.0, 8.0, 10.0, 12.0, 9.0, 4.0, 4.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.07421875, -2.0109405517578125, -1.947662353515625, -1.8843841552734375, -1.82110595703125, -1.7578277587890625, -1.694549560546875, -1.6312713623046875, -1.5679931640625, -1.5047149658203125, -1.441436767578125, -1.3781585693359375, -1.31488037109375, -1.2516021728515625, -1.188323974609375, -1.1250457763671875, -1.061767578125, -0.9984893798828125, -0.935211181640625, -0.8719329833984375, -0.80865478515625, -0.7453765869140625, -0.682098388671875, -0.6188201904296875, -0.5555419921875, -0.4922637939453125, -0.428985595703125, -0.3657073974609375, -0.30242919921875, -0.2391510009765625, -0.175872802734375, -0.1125946044921875, -0.04931640625, 0.0139617919921875, 0.077239990234375, 0.1405181884765625, 0.20379638671875, 0.2670745849609375, 0.330352783203125, 0.3936309814453125, 0.4569091796875, 0.5201873779296875, 0.583465576171875, 0.6467437744140625, 0.71002197265625, 0.7733001708984375, 0.836578369140625, 0.8998565673828125, 0.963134765625, 1.0264129638671875, 1.089691162109375, 1.1529693603515625, 1.21624755859375, 1.2795257568359375, 1.342803955078125, 1.4060821533203125, 1.4693603515625, 1.5326385498046875, 1.595916748046875, 1.6591949462890625, 1.72247314453125, 1.7857513427734375, 1.849029541015625, 1.9123077392578125, 1.9755859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 13.0, 12.0, 16.0, 20.0, 32.0, 54.0, 118.0, 277.0, 939.0, 3303.0, 28301.0, 4079854.0, 74315.0, 5089.0, 1245.0, 385.0, 142.0, 56.0, 29.0, 24.0, 17.0, 7.0, 10.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-12.2421875, -11.8985595703125, -11.554931640625, -11.2113037109375, -10.86767578125, -10.5240478515625, -10.180419921875, -9.8367919921875, -9.4931640625, -9.1495361328125, -8.805908203125, -8.4622802734375, -8.11865234375, -7.7750244140625, -7.431396484375, -7.0877685546875, -6.744140625, -6.4005126953125, -6.056884765625, -5.7132568359375, -5.36962890625, -5.0260009765625, -4.682373046875, -4.3387451171875, -3.9951171875, -3.6514892578125, -3.307861328125, -2.9642333984375, -2.62060546875, -2.2769775390625, -1.933349609375, -1.5897216796875, -1.24609375, -0.9024658203125, -0.558837890625, -0.2152099609375, 0.12841796875, 0.4720458984375, 0.815673828125, 1.1593017578125, 1.5029296875, 1.8465576171875, 2.190185546875, 2.5338134765625, 2.87744140625, 3.2210693359375, 3.564697265625, 3.9083251953125, 4.251953125, 4.5955810546875, 4.939208984375, 5.2828369140625, 5.62646484375, 5.9700927734375, 6.313720703125, 6.6573486328125, 7.0009765625, 7.3446044921875, 7.688232421875, 8.0318603515625, 8.37548828125, 8.7191162109375, 9.062744140625, 9.4063720703125, 9.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 14.0, 19.0, 30.0, 45.0, 70.0, 176.0, 463.0, 1066.0, 1175.0, 550.0, 225.0, 87.0, 46.0, 36.0, 16.0, 8.0, 5.0, 2.0, 4.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.21875, -7.01318359375, -6.8076171875, -6.60205078125, -6.396484375, -6.19091796875, -5.9853515625, -5.77978515625, -5.57421875, -5.36865234375, -5.1630859375, -4.95751953125, -4.751953125, -4.54638671875, -4.3408203125, -4.13525390625, -3.9296875, -3.72412109375, -3.5185546875, -3.31298828125, -3.107421875, -2.90185546875, -2.6962890625, -2.49072265625, -2.28515625, -2.07958984375, -1.8740234375, -1.66845703125, -1.462890625, -1.25732421875, -1.0517578125, -0.84619140625, -0.640625, -0.43505859375, -0.2294921875, -0.02392578125, 0.181640625, 0.38720703125, 0.5927734375, 0.79833984375, 1.00390625, 1.20947265625, 1.4150390625, 1.62060546875, 1.826171875, 2.03173828125, 2.2373046875, 2.44287109375, 2.6484375, 2.85400390625, 3.0595703125, 3.26513671875, 3.470703125, 3.67626953125, 3.8818359375, 4.08740234375, 4.29296875, 4.49853515625, 4.7041015625, 4.90966796875, 5.115234375, 5.32080078125, 5.5263671875, 5.73193359375, 5.9375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 15.0, 14.0, 25.0, 60.0, 115.0, 198.0, 216.0, 178.0, 81.0, 47.0, 22.0, 9.0, 2.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.022735595703125, -39.759361267089844, -38.49598693847656, -37.23261260986328, -35.969242095947266, -34.705867767333984, -33.4424934387207, -32.17911911010742, -30.91574478149414, -29.65237045288086, -28.38899803161621, -27.12562370300293, -25.86224937438965, -24.598876953125, -23.33550262451172, -22.072128295898438, -20.80875587463379, -19.545381546020508, -18.28200912475586, -17.018634796142578, -15.755260467529297, -14.491887092590332, -13.228513717651367, -11.965139389038086, -10.701766014099121, -9.438392639160156, -8.175018310546875, -6.91164493560791, -5.648271083831787, -4.384897232055664, -3.121523857116699, -1.858149528503418, -0.5947761535644531, 0.6685975790023804, 1.9319713115692139, 3.195344924926758, 4.458718776702881, 5.722092628479004, 6.985466003417969, 8.24884033203125, 9.512213706970215, 10.77558708190918, 12.038961410522461, 13.302334785461426, 14.56570816040039, 15.829082489013672, 17.092456817626953, 18.355831146240234, 19.619203567504883, 20.882577896118164, 22.145950317382812, 23.409324645996094, 24.672698974609375, 25.936073303222656, 27.199445724487305, 28.462820053100586, 29.726192474365234, 30.989566802978516, 32.2529411315918, 33.51631164550781, 34.779685974121094, 36.043060302734375, 37.306434631347656, 38.56980895996094, 39.83318328857422]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 2.0, 8.0, 4.0, 14.0, 9.0, 20.0, 18.0, 21.0, 25.0, 28.0, 35.0, 54.0, 41.0, 51.0, 57.0, 59.0, 64.0, 63.0, 54.0, 66.0, 47.0, 41.0, 28.0, 36.0, 27.0, 27.0, 27.0, 23.0, 13.0, 12.0, 10.0, 9.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.63462257385254, -22.92302894592285, -22.211435317993164, -21.499841690063477, -20.78824806213379, -20.076656341552734, -19.365062713623047, -18.65346908569336, -17.941875457763672, -17.230281829833984, -16.518688201904297, -15.80709457397461, -15.095501899719238, -14.38390827178955, -13.672314643859863, -12.960721969604492, -12.249127388000488, -11.5375337600708, -10.825940132141113, -10.114347457885742, -9.402753829956055, -8.691160202026367, -7.97956657409668, -7.26797342300415, -6.556379795074463, -5.844786167144775, -5.133193016052246, -4.421599388122559, -3.71000599861145, -2.998412609100342, -2.2868189811706543, -1.575225830078125, -0.8636322021484375, -0.15203875303268433, 0.5595546960830688, 1.2711482048034668, 1.9827415943145752, 2.6943349838256836, 3.405928611755371, 4.1175217628479, 4.829115390777588, 5.540709018707275, 6.252302169799805, 6.963895797729492, 7.67548942565918, 8.387083053588867, 9.098676681518555, 9.810269355773926, 10.521862983703613, 11.2334566116333, 11.945050239562988, 12.65664291381836, 13.368236541748047, 14.079830169677734, 14.791423797607422, 15.50301742553711, 16.214611053466797, 16.926204681396484, 17.637798309326172, 18.34939193725586, 19.060985565185547, 19.772579193115234, 20.484172821044922, 21.195764541625977, 21.907358169555664]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 9.0, 12.0, 11.0, 28.0, 39.0, 49.0, 57.0, 110.0, 158.0, 237.0, 323.0, 493.0, 818.0, 1394.0, 2210.0, 4003.0, 7215.0, 14233.0, 32509.0, 92184.0, 335651.0, 382829.0, 104260.0, 35990.0, 15409.0, 7735.0, 4280.0, 2365.0, 1470.0, 856.0, 531.0, 341.0, 262.0, 147.0, 110.0, 75.0, 51.0, 22.0, 21.0, 24.0, 10.0, 4.0, 7.0, 8.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.564453125, -3.4627685546875, -3.361083984375, -3.2593994140625, -3.15771484375, -3.0560302734375, -2.954345703125, -2.8526611328125, -2.7509765625, -2.6492919921875, -2.547607421875, -2.4459228515625, -2.34423828125, -2.2425537109375, -2.140869140625, -2.0391845703125, -1.9375, -1.8358154296875, -1.734130859375, -1.6324462890625, -1.53076171875, -1.4290771484375, -1.327392578125, -1.2257080078125, -1.1240234375, -1.0223388671875, -0.920654296875, -0.8189697265625, -0.71728515625, -0.6156005859375, -0.513916015625, -0.4122314453125, -0.310546875, -0.2088623046875, -0.107177734375, -0.0054931640625, 0.09619140625, 0.1978759765625, 0.299560546875, 0.4012451171875, 0.5029296875, 0.6046142578125, 0.706298828125, 0.8079833984375, 0.90966796875, 1.0113525390625, 1.113037109375, 1.2147216796875, 1.31640625, 1.4180908203125, 1.519775390625, 1.6214599609375, 1.72314453125, 1.8248291015625, 1.926513671875, 2.0281982421875, 2.1298828125, 2.2315673828125, 2.333251953125, 2.4349365234375, 2.53662109375, 2.6383056640625, 2.739990234375, 2.8416748046875, 2.943359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 6.0, 14.0, 18.0, 12.0, 15.0, 27.0, 28.0, 28.0, 46.0, 23.0, 28.0, 34.0, 41.0, 44.0, 41.0, 71.0, 46.0, 53.0, 53.0, 45.0, 49.0, 42.0, 32.0, 30.0, 32.0, 22.0, 26.0, 19.0, 11.0, 15.0, 11.0, 6.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.359375, -2.288238525390625, -2.21710205078125, -2.145965576171875, -2.0748291015625, -2.003692626953125, -1.93255615234375, -1.861419677734375, -1.790283203125, -1.719146728515625, -1.64801025390625, -1.576873779296875, -1.5057373046875, -1.434600830078125, -1.36346435546875, -1.292327880859375, -1.22119140625, -1.150054931640625, -1.07891845703125, -1.007781982421875, -0.9366455078125, -0.865509033203125, -0.79437255859375, -0.723236083984375, -0.652099609375, -0.580963134765625, -0.50982666015625, -0.438690185546875, -0.3675537109375, -0.296417236328125, -0.22528076171875, -0.154144287109375, -0.0830078125, -0.011871337890625, 0.05926513671875, 0.130401611328125, 0.2015380859375, 0.272674560546875, 0.34381103515625, 0.414947509765625, 0.486083984375, 0.557220458984375, 0.62835693359375, 0.699493408203125, 0.7706298828125, 0.841766357421875, 0.91290283203125, 0.984039306640625, 1.05517578125, 1.126312255859375, 1.19744873046875, 1.268585205078125, 1.3397216796875, 1.410858154296875, 1.48199462890625, 1.553131103515625, 1.624267578125, 1.695404052734375, 1.76654052734375, 1.837677001953125, 1.9088134765625, 1.979949951171875, 2.05108642578125, 2.122222900390625, 2.193359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 11.0, 5.0, 11.0, 16.0, 21.0, 25.0, 32.0, 39.0, 48.0, 81.0, 91.0, 157.0, 219.0, 236.0, 484.0, 724.0, 1518.0, 4794.0, 37224.0, 909881.0, 81230.0, 7232.0, 1928.0, 929.0, 526.0, 310.0, 218.0, 138.0, 134.0, 60.0, 57.0, 43.0, 38.0, 19.0, 17.0, 17.0, 13.0, 5.0, 2.0, 8.0, 2.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.09375, -7.820556640625, -7.54736328125, -7.274169921875, -7.0009765625, -6.727783203125, -6.45458984375, -6.181396484375, -5.908203125, -5.635009765625, -5.36181640625, -5.088623046875, -4.8154296875, -4.542236328125, -4.26904296875, -3.995849609375, -3.72265625, -3.449462890625, -3.17626953125, -2.903076171875, -2.6298828125, -2.356689453125, -2.08349609375, -1.810302734375, -1.537109375, -1.263916015625, -0.99072265625, -0.717529296875, -0.4443359375, -0.171142578125, 0.10205078125, 0.375244140625, 0.6484375, 0.921630859375, 1.19482421875, 1.468017578125, 1.7412109375, 2.014404296875, 2.28759765625, 2.560791015625, 2.833984375, 3.107177734375, 3.38037109375, 3.653564453125, 3.9267578125, 4.199951171875, 4.47314453125, 4.746337890625, 5.01953125, 5.292724609375, 5.56591796875, 5.839111328125, 6.1123046875, 6.385498046875, 6.65869140625, 6.931884765625, 7.205078125, 7.478271484375, 7.75146484375, 8.024658203125, 8.2978515625, 8.571044921875, 8.84423828125, 9.117431640625, 9.390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 14.0, 9.0, 8.0, 15.0, 17.0, 18.0, 15.0, 37.0, 41.0, 44.0, 59.0, 67.0, 69.0, 52.0, 66.0, 54.0, 70.0, 49.0, 47.0, 38.0, 40.0, 31.0, 28.0, 19.0, 19.0, 21.0, 11.0, 4.0, 10.0, 4.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-10.9921875, -10.68994140625, -10.3876953125, -10.08544921875, -9.783203125, -9.48095703125, -9.1787109375, -8.87646484375, -8.57421875, -8.27197265625, -7.9697265625, -7.66748046875, -7.365234375, -7.06298828125, -6.7607421875, -6.45849609375, -6.15625, -5.85400390625, -5.5517578125, -5.24951171875, -4.947265625, -4.64501953125, -4.3427734375, -4.04052734375, -3.73828125, -3.43603515625, -3.1337890625, -2.83154296875, -2.529296875, -2.22705078125, -1.9248046875, -1.62255859375, -1.3203125, -1.01806640625, -0.7158203125, -0.41357421875, -0.111328125, 0.19091796875, 0.4931640625, 0.79541015625, 1.09765625, 1.39990234375, 1.7021484375, 2.00439453125, 2.306640625, 2.60888671875, 2.9111328125, 3.21337890625, 3.515625, 3.81787109375, 4.1201171875, 4.42236328125, 4.724609375, 5.02685546875, 5.3291015625, 5.63134765625, 5.93359375, 6.23583984375, 6.5380859375, 6.84033203125, 7.142578125, 7.44482421875, 7.7470703125, 8.04931640625, 8.3515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 3.0, 2.0, 5.0, 5.0, 13.0, 12.0, 11.0, 22.0, 37.0, 50.0, 52.0, 74.0, 137.0, 225.0, 447.0, 889.0, 2170.0, 6268.0, 23531.0, 166804.0, 772259.0, 57083.0, 11949.0, 3596.0, 1403.0, 661.0, 286.0, 154.0, 122.0, 76.0, 63.0, 31.0, 22.0, 8.0, 10.0, 9.0, 7.0, 14.0, 11.0, 8.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2216796875, -1.183807373046875, -1.14593505859375, -1.108062744140625, -1.0701904296875, -1.032318115234375, -0.99444580078125, -0.956573486328125, -0.918701171875, -0.880828857421875, -0.84295654296875, -0.805084228515625, -0.7672119140625, -0.729339599609375, -0.69146728515625, -0.653594970703125, -0.61572265625, -0.577850341796875, -0.53997802734375, -0.502105712890625, -0.4642333984375, -0.426361083984375, -0.38848876953125, -0.350616455078125, -0.312744140625, -0.274871826171875, -0.23699951171875, -0.199127197265625, -0.1612548828125, -0.123382568359375, -0.08551025390625, -0.047637939453125, -0.009765625, 0.028106689453125, 0.06597900390625, 0.103851318359375, 0.1417236328125, 0.179595947265625, 0.21746826171875, 0.255340576171875, 0.293212890625, 0.331085205078125, 0.36895751953125, 0.406829833984375, 0.4447021484375, 0.482574462890625, 0.52044677734375, 0.558319091796875, 0.59619140625, 0.634063720703125, 0.67193603515625, 0.709808349609375, 0.7476806640625, 0.785552978515625, 0.82342529296875, 0.861297607421875, 0.899169921875, 0.937042236328125, 0.97491455078125, 1.012786865234375, 1.0506591796875, 1.088531494140625, 1.12640380859375, 1.164276123046875, 1.2021484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 15.0, 14.0, 26.0, 44.0, 89.0, 152.0, 257.0, 171.0, 96.0, 51.0, 29.0, 16.0, 12.0, 6.0, 2.0, 0.0, 6.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043272972106933594, -0.0004170127213001251, -0.0004012957215309143, -0.0003855787217617035, -0.0003698617219924927, -0.00035414472222328186, -0.00033842772245407104, -0.00032271072268486023, -0.0003069937229156494, -0.0002912767231464386, -0.0002755597233772278, -0.00025984272360801697, -0.00024412572383880615, -0.00022840872406959534, -0.00021269172430038452, -0.0001969747245311737, -0.0001812577247619629, -0.00016554072499275208, -0.00014982372522354126, -0.00013410672545433044, -0.00011838972568511963, -0.00010267272591590881, -8.6955726146698e-05, -7.123872637748718e-05, -5.552172660827637e-05, -3.980472683906555e-05, -2.4087727069854736e-05, -8.370727300643921e-06, 7.3462724685668945e-06, 2.306327223777771e-05, 3.8780272006988525e-05, 5.449727177619934e-05, 7.021427154541016e-05, 8.593127131462097e-05, 0.00010164827108383179, 0.0001173652708530426, 0.00013308227062225342, 0.00014879927039146423, 0.00016451627016067505, 0.00018023326992988586, 0.00019595026969909668, 0.0002116672694683075, 0.0002273842692375183, 0.00024310126900672913, 0.00025881826877593994, 0.00027453526854515076, 0.00029025226831436157, 0.0003059692680835724, 0.0003216862678527832, 0.000337403267621994, 0.00035312026739120483, 0.00036883726716041565, 0.00038455426692962646, 0.0004002712666988373, 0.0004159882664680481, 0.0004317052662372589, 0.0004474222660064697, 0.00046313926577568054, 0.00047885626554489136, 0.0004945732653141022, 0.000510290265083313, 0.0005260072648525238, 0.0005417242646217346, 0.0005574412643909454, 0.0005731582641601562]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 9.0, 4.0, 11.0, 19.0, 22.0, 27.0, 27.0, 45.0, 76.0, 104.0, 141.0, 239.0, 408.0, 801.0, 1970.0, 6436.0, 43362.0, 812947.0, 160779.0, 15013.0, 3360.0, 1269.0, 586.0, 291.0, 189.0, 143.0, 69.0, 49.0, 48.0, 28.0, 19.0, 15.0, 8.0, 6.0, 9.0, 4.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4140625, -1.3695220947265625, -1.324981689453125, -1.2804412841796875, -1.23590087890625, -1.1913604736328125, -1.146820068359375, -1.1022796630859375, -1.0577392578125, -1.0131988525390625, -0.968658447265625, -0.9241180419921875, -0.87957763671875, -0.8350372314453125, -0.790496826171875, -0.7459564208984375, -0.701416015625, -0.6568756103515625, -0.612335205078125, -0.5677947998046875, -0.52325439453125, -0.4787139892578125, -0.434173583984375, -0.3896331787109375, -0.3450927734375, -0.3005523681640625, -0.256011962890625, -0.2114715576171875, -0.16693115234375, -0.1223907470703125, -0.077850341796875, -0.0333099365234375, 0.01123046875, 0.0557708740234375, 0.100311279296875, 0.1448516845703125, 0.18939208984375, 0.2339324951171875, 0.278472900390625, 0.3230133056640625, 0.3675537109375, 0.4120941162109375, 0.456634521484375, 0.5011749267578125, 0.54571533203125, 0.5902557373046875, 0.634796142578125, 0.6793365478515625, 0.723876953125, 0.7684173583984375, 0.812957763671875, 0.8574981689453125, 0.90203857421875, 0.9465789794921875, 0.991119384765625, 1.0356597900390625, 1.0802001953125, 1.1247406005859375, 1.169281005859375, 1.2138214111328125, 1.25836181640625, 1.3029022216796875, 1.347442626953125, 1.3919830322265625, 1.4365234375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 5.0, 8.0, 8.0, 15.0, 19.0, 18.0, 21.0, 25.0, 35.0, 45.0, 56.0, 64.0, 73.0, 75.0, 89.0, 81.0, 66.0, 55.0, 37.0, 43.0, 31.0, 30.0, 17.0, 17.0, 14.0, 9.0, 10.0, 6.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.025390625, -0.9953994750976562, -0.9654083251953125, -0.9354171752929688, -0.905426025390625, -0.8754348754882812, -0.8454437255859375, -0.8154525756835938, -0.78546142578125, -0.7554702758789062, -0.7254791259765625, -0.6954879760742188, -0.665496826171875, -0.6355056762695312, -0.6055145263671875, -0.5755233764648438, -0.5455322265625, -0.5155410766601562, -0.4855499267578125, -0.45555877685546875, -0.425567626953125, -0.39557647705078125, -0.3655853271484375, -0.33559417724609375, -0.30560302734375, -0.27561187744140625, -0.2456207275390625, -0.21562957763671875, -0.185638427734375, -0.15564727783203125, -0.1256561279296875, -0.09566497802734375, -0.065673828125, -0.03568267822265625, -0.0056915283203125, 0.02429962158203125, 0.054290771484375, 0.08428192138671875, 0.1142730712890625, 0.14426422119140625, 0.17425537109375, 0.20424652099609375, 0.2342376708984375, 0.26422882080078125, 0.294219970703125, 0.32421112060546875, 0.3542022705078125, 0.38419342041015625, 0.4141845703125, 0.44417572021484375, 0.4741668701171875, 0.5041580200195312, 0.534149169921875, 0.5641403198242188, 0.5941314697265625, 0.6241226196289062, 0.65411376953125, 0.6841049194335938, 0.7140960693359375, 0.7440872192382812, 0.774078369140625, 0.8040695190429688, 0.8340606689453125, 0.8640518188476562, 0.89404296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 11.0, 22.0, 40.0, 94.0, 352.0, 208.0, 113.0, 73.0, 29.0, 17.0, 16.0, 14.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.13120651245117, -41.9272346496582, -40.723262786865234, -39.519290924072266, -38.31532287597656, -37.111351013183594, -35.907379150390625, -34.703407287597656, -33.49943542480469, -32.29546356201172, -31.09149169921875, -29.887521743774414, -28.683549880981445, -27.479578018188477, -26.27560806274414, -25.071636199951172, -23.867664337158203, -22.663692474365234, -21.459720611572266, -20.25575065612793, -19.05177879333496, -17.847806930541992, -16.643836975097656, -15.439865112304688, -14.235893249511719, -13.03192138671875, -11.827950477600098, -10.623979568481445, -9.420007705688477, -8.216035842895508, -7.0120649337768555, -5.808094024658203, -4.6041259765625, -3.4001545906066895, -2.196183204650879, -0.9922118186950684, 0.2117595672607422, 1.4157309532165527, 2.6197023391723633, 3.8236732482910156, 5.027645111083984, 6.231616497039795, 7.4355878829956055, 8.639558792114258, 9.843530654907227, 11.047502517700195, 12.251473426818848, 13.4554443359375, 14.659416198730469, 15.863388061523438, 17.067359924316406, 18.271329879760742, 19.47530174255371, 20.67927360534668, 21.883243560791016, 23.087215423583984, 24.291187286376953, 25.495159149169922, 26.69913101196289, 27.903100967407227, 29.107072830200195, 30.311044692993164, 31.5150146484375, 32.71898651123047, 33.92295837402344]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 8.0, 6.0, 6.0, 13.0, 8.0, 15.0, 14.0, 15.0, 28.0, 18.0, 28.0, 34.0, 46.0, 29.0, 51.0, 77.0, 175.0, 112.0, 54.0, 30.0, 20.0, 26.0, 26.0, 31.0, 26.0, 17.0, 14.0, 12.0, 6.0, 13.0, 6.0, 5.0, 3.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-33.129966735839844, -32.083683013916016, -31.037399291992188, -29.991113662719727, -28.9448299407959, -27.89854621887207, -26.85226058959961, -25.80597686767578, -24.759693145751953, -23.713409423828125, -22.667125701904297, -21.620840072631836, -20.574556350708008, -19.52827262878418, -18.48198699951172, -17.43570327758789, -16.389419555664062, -15.343135833740234, -14.29685115814209, -13.250566482543945, -12.204282760620117, -11.157999038696289, -10.111714363098145, -9.0654296875, -8.019145965576172, -6.9728617668151855, -5.926577568054199, -4.880293369293213, -3.8340091705322266, -2.7877249717712402, -1.741440773010254, -0.6951565742492676, 0.35112762451171875, 1.397411823272705, 2.4436960220336914, 3.4899802207946777, 4.536264419555664, 5.58254861831665, 6.628832817077637, 7.675117015838623, 8.72140121459961, 9.767684936523438, 10.813969612121582, 11.860254287719727, 12.906538009643555, 13.952821731567383, 14.999106407165527, 16.045391082763672, 17.0916748046875, 18.137958526611328, 19.184242248535156, 20.230527877807617, 21.276811599731445, 22.323095321655273, 23.369380950927734, 24.415664672851562, 25.46194839477539, 26.50823211669922, 27.554515838623047, 28.600801467895508, 29.647085189819336, 30.693368911743164, 31.739654541015625, 32.78593826293945, 33.83222198486328]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 26.0, 25.0, 41.0, 51.0, 65.0, 88.0, 116.0, 146.0, 235.0, 366.0, 557.0, 897.0, 1623.0, 3174.0, 7105.0, 22003.0, 142993.0, 1277523.0, 2300143.0, 373849.0, 42865.0, 10699.0, 4436.0, 2108.0, 1134.0, 677.0, 422.0, 246.0, 176.0, 141.0, 90.0, 54.0, 53.0, 43.0, 34.0, 22.0, 10.0, 10.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37109375, -3.259490966796875, -3.14788818359375, -3.036285400390625, -2.9246826171875, -2.813079833984375, -2.70147705078125, -2.589874267578125, -2.478271484375, -2.366668701171875, -2.25506591796875, -2.143463134765625, -2.0318603515625, -1.920257568359375, -1.80865478515625, -1.697052001953125, -1.58544921875, -1.473846435546875, -1.36224365234375, -1.250640869140625, -1.1390380859375, -1.027435302734375, -0.91583251953125, -0.804229736328125, -0.692626953125, -0.581024169921875, -0.46942138671875, -0.357818603515625, -0.2462158203125, -0.134613037109375, -0.02301025390625, 0.088592529296875, 0.2001953125, 0.311798095703125, 0.42340087890625, 0.535003662109375, 0.6466064453125, 0.758209228515625, 0.86981201171875, 0.981414794921875, 1.093017578125, 1.204620361328125, 1.31622314453125, 1.427825927734375, 1.5394287109375, 1.651031494140625, 1.76263427734375, 1.874237060546875, 1.98583984375, 2.097442626953125, 2.20904541015625, 2.320648193359375, 2.4322509765625, 2.543853759765625, 2.65545654296875, 2.767059326171875, 2.878662109375, 2.990264892578125, 3.10186767578125, 3.213470458984375, 3.3250732421875, 3.436676025390625, 3.54827880859375, 3.659881591796875, 3.771484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 5.0, 7.0, 15.0, 15.0, 25.0, 28.0, 30.0, 31.0, 26.0, 36.0, 39.0, 40.0, 53.0, 47.0, 59.0, 59.0, 51.0, 47.0, 47.0, 54.0, 53.0, 35.0, 27.0, 26.0, 15.0, 16.0, 32.0, 16.0, 16.0, 11.0, 10.0, 4.0, 4.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33984375, -2.269866943359375, -2.19989013671875, -2.129913330078125, -2.0599365234375, -1.989959716796875, -1.91998291015625, -1.850006103515625, -1.780029296875, -1.710052490234375, -1.64007568359375, -1.570098876953125, -1.5001220703125, -1.430145263671875, -1.36016845703125, -1.290191650390625, -1.22021484375, -1.150238037109375, -1.08026123046875, -1.010284423828125, -0.9403076171875, -0.870330810546875, -0.80035400390625, -0.730377197265625, -0.660400390625, -0.590423583984375, -0.52044677734375, -0.450469970703125, -0.3804931640625, -0.310516357421875, -0.24053955078125, -0.170562744140625, -0.1005859375, -0.030609130859375, 0.03936767578125, 0.109344482421875, 0.1793212890625, 0.249298095703125, 0.31927490234375, 0.389251708984375, 0.459228515625, 0.529205322265625, 0.59918212890625, 0.669158935546875, 0.7391357421875, 0.809112548828125, 0.87908935546875, 0.949066162109375, 1.01904296875, 1.089019775390625, 1.15899658203125, 1.228973388671875, 1.2989501953125, 1.368927001953125, 1.43890380859375, 1.508880615234375, 1.578857421875, 1.648834228515625, 1.71881103515625, 1.788787841796875, 1.8587646484375, 1.928741455078125, 1.99871826171875, 2.068695068359375, 2.138671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 10.0, 14.0, 12.0, 21.0, 27.0, 46.0, 96.0, 146.0, 249.0, 397.0, 917.0, 2339.0, 11238.0, 1075574.0, 3086019.0, 13149.0, 2251.0, 815.0, 358.0, 210.0, 129.0, 88.0, 43.0, 36.0, 24.0, 21.0, 8.0, 8.0, 7.0, 12.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2421875, -10.8680419921875, -10.493896484375, -10.1197509765625, -9.74560546875, -9.3714599609375, -8.997314453125, -8.6231689453125, -8.2490234375, -7.8748779296875, -7.500732421875, -7.1265869140625, -6.75244140625, -6.3782958984375, -6.004150390625, -5.6300048828125, -5.255859375, -4.8817138671875, -4.507568359375, -4.1334228515625, -3.75927734375, -3.3851318359375, -3.010986328125, -2.6368408203125, -2.2626953125, -1.8885498046875, -1.514404296875, -1.1402587890625, -0.76611328125, -0.3919677734375, -0.017822265625, 0.3563232421875, 0.73046875, 1.1046142578125, 1.478759765625, 1.8529052734375, 2.22705078125, 2.6011962890625, 2.975341796875, 3.3494873046875, 3.7236328125, 4.0977783203125, 4.471923828125, 4.8460693359375, 5.22021484375, 5.5943603515625, 5.968505859375, 6.3426513671875, 6.716796875, 7.0909423828125, 7.465087890625, 7.8392333984375, 8.21337890625, 8.5875244140625, 8.961669921875, 9.3358154296875, 9.7099609375, 10.0841064453125, 10.458251953125, 10.8323974609375, 11.20654296875, 11.5806884765625, 11.954833984375, 12.3289794921875, 12.703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 8.0, 4.0, 6.0, 9.0, 17.0, 28.0, 31.0, 38.0, 55.0, 78.0, 92.0, 154.0, 266.0, 479.0, 729.0, 729.0, 530.0, 307.0, 182.0, 98.0, 79.0, 50.0, 35.0, 30.0, 9.0, 5.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.078125, -6.87115478515625, -6.6641845703125, -6.45721435546875, -6.250244140625, -6.04327392578125, -5.8363037109375, -5.62933349609375, -5.42236328125, -5.21539306640625, -5.0084228515625, -4.80145263671875, -4.594482421875, -4.38751220703125, -4.1805419921875, -3.97357177734375, -3.7666015625, -3.55963134765625, -3.3526611328125, -3.14569091796875, -2.938720703125, -2.73175048828125, -2.5247802734375, -2.31781005859375, -2.11083984375, -1.90386962890625, -1.6968994140625, -1.48992919921875, -1.282958984375, -1.07598876953125, -0.8690185546875, -0.66204833984375, -0.455078125, -0.24810791015625, -0.0411376953125, 0.16583251953125, 0.372802734375, 0.57977294921875, 0.7867431640625, 0.99371337890625, 1.20068359375, 1.40765380859375, 1.6146240234375, 1.82159423828125, 2.028564453125, 2.23553466796875, 2.4425048828125, 2.64947509765625, 2.8564453125, 3.06341552734375, 3.2703857421875, 3.47735595703125, 3.684326171875, 3.89129638671875, 4.0982666015625, 4.30523681640625, 4.51220703125, 4.71917724609375, 4.9261474609375, 5.13311767578125, 5.340087890625, 5.54705810546875, 5.7540283203125, 5.96099853515625, 6.16796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 13.0, 35.0, 54.0, 111.0, 201.0, 255.0, 179.0, 77.0, 41.0, 14.0, 6.0, 4.0, 7.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-134.59930419921875, -131.98284912109375, -129.3664093017578, -126.74996185302734, -124.13351440429688, -121.5170669555664, -118.90061950683594, -116.28417205810547, -113.667724609375, -111.05127716064453, -108.43482971191406, -105.8183822631836, -103.20193481445312, -100.58548736572266, -97.96903991699219, -95.35259246826172, -92.73614501953125, -90.11969757080078, -87.50325012207031, -84.88680267333984, -82.27035522460938, -79.6539077758789, -77.03746032714844, -74.42101287841797, -71.80455780029297, -69.1881103515625, -66.57166290283203, -63.95521545410156, -61.338768005371094, -58.722320556640625, -56.105873107910156, -53.48942565917969, -50.87297821044922, -48.25653076171875, -45.64008331298828, -43.02363586425781, -40.407188415527344, -37.790740966796875, -35.174293518066406, -32.55784606933594, -29.941396713256836, -27.324949264526367, -24.7085018157959, -22.092052459716797, -19.475605010986328, -16.85915756225586, -14.24271011352539, -11.626262664794922, -9.009815216064453, -6.393367767333984, -3.7769198417663574, -1.1604719161987305, 1.4559755325317383, 4.072422981262207, 6.688871383666992, 9.305318832397461, 11.92176628112793, 14.538213729858398, 17.154661178588867, 19.77111053466797, 22.387557983398438, 25.004005432128906, 27.620452880859375, 30.236900329589844, 32.85334777832031]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 9.0, 10.0, 19.0, 14.0, 25.0, 27.0, 30.0, 31.0, 42.0, 49.0, 42.0, 45.0, 63.0, 75.0, 57.0, 57.0, 47.0, 46.0, 53.0, 38.0, 43.0, 34.0, 23.0, 23.0, 14.0, 15.0, 23.0, 13.0, 6.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.91107177734375, -30.740110397338867, -29.569149017333984, -28.398189544677734, -27.22722816467285, -26.05626678466797, -24.88530731201172, -23.714345932006836, -22.543384552001953, -21.37242317199707, -20.201461791992188, -19.030502319335938, -17.859540939331055, -16.688579559326172, -15.517619132995605, -14.346658706665039, -13.175697326660156, -12.004735946655273, -10.833775520324707, -9.66281509399414, -8.491853713989258, -7.320892810821533, -6.149931907653809, -4.978971481323242, -3.8080101013183594, -2.6370491981506348, -1.4660882949829102, -0.29512739181518555, 0.8758335113525391, 2.0467944145202637, 3.2177553176879883, 4.388715744018555, 5.559680938720703, 6.730641841888428, 7.901602745056152, 9.072563171386719, 10.243524551391602, 11.414485931396484, 12.58544635772705, 13.756406784057617, 14.9273681640625, 16.098329544067383, 17.269290924072266, 18.440250396728516, 19.6112117767334, 20.78217315673828, 21.95313262939453, 23.124094009399414, 24.295055389404297, 25.46601676940918, 26.636978149414062, 27.807937622070312, 28.978899002075195, 30.149860382080078, 31.320819854736328, 32.491783142089844, 33.662742614746094, 34.833702087402344, 36.00466537475586, 37.17562484741211, 38.346588134765625, 39.517547607421875, 40.688507080078125, 41.859466552734375, 43.03042984008789]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 11.0, 21.0, 24.0, 33.0, 34.0, 87.0, 130.0, 247.0, 444.0, 864.0, 1677.0, 3853.0, 8613.0, 21944.0, 75806.0, 629409.0, 235798.0, 43270.0, 14577.0, 6162.0, 2736.0, 1261.0, 622.0, 353.0, 201.0, 87.0, 81.0, 56.0, 44.0, 24.0, 17.0, 10.0, 8.0, 7.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.71875, -3.6148681640625, -3.510986328125, -3.4071044921875, -3.30322265625, -3.1993408203125, -3.095458984375, -2.9915771484375, -2.8876953125, -2.7838134765625, -2.679931640625, -2.5760498046875, -2.47216796875, -2.3682861328125, -2.264404296875, -2.1605224609375, -2.056640625, -1.9527587890625, -1.848876953125, -1.7449951171875, -1.64111328125, -1.5372314453125, -1.433349609375, -1.3294677734375, -1.2255859375, -1.1217041015625, -1.017822265625, -0.9139404296875, -0.81005859375, -0.7061767578125, -0.602294921875, -0.4984130859375, -0.39453125, -0.2906494140625, -0.186767578125, -0.0828857421875, 0.02099609375, 0.1248779296875, 0.228759765625, 0.3326416015625, 0.4365234375, 0.5404052734375, 0.644287109375, 0.7481689453125, 0.85205078125, 0.9559326171875, 1.059814453125, 1.1636962890625, 1.267578125, 1.3714599609375, 1.475341796875, 1.5792236328125, 1.68310546875, 1.7869873046875, 1.890869140625, 1.9947509765625, 2.0986328125, 2.2025146484375, 2.306396484375, 2.4102783203125, 2.51416015625, 2.6180419921875, 2.721923828125, 2.8258056640625, 2.9296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 6.0, 10.0, 14.0, 24.0, 22.0, 37.0, 24.0, 44.0, 53.0, 75.0, 75.0, 80.0, 76.0, 59.0, 79.0, 60.0, 67.0, 47.0, 45.0, 31.0, 23.0, 15.0, 14.0, 12.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.957305908203125, -2.84234619140625, -2.727386474609375, -2.6124267578125, -2.497467041015625, -2.38250732421875, -2.267547607421875, -2.152587890625, -2.037628173828125, -1.92266845703125, -1.807708740234375, -1.6927490234375, -1.577789306640625, -1.46282958984375, -1.347869873046875, -1.23291015625, -1.117950439453125, -1.00299072265625, -0.888031005859375, -0.7730712890625, -0.658111572265625, -0.54315185546875, -0.428192138671875, -0.313232421875, -0.198272705078125, -0.08331298828125, 0.031646728515625, 0.1466064453125, 0.261566162109375, 0.37652587890625, 0.491485595703125, 0.6064453125, 0.721405029296875, 0.83636474609375, 0.951324462890625, 1.0662841796875, 1.181243896484375, 1.29620361328125, 1.411163330078125, 1.526123046875, 1.641082763671875, 1.75604248046875, 1.871002197265625, 1.9859619140625, 2.100921630859375, 2.21588134765625, 2.330841064453125, 2.44580078125, 2.560760498046875, 2.67572021484375, 2.790679931640625, 2.9056396484375, 3.020599365234375, 3.13555908203125, 3.250518798828125, 3.365478515625, 3.480438232421875, 3.59539794921875, 3.710357666015625, 3.8253173828125, 3.940277099609375, 4.05523681640625, 4.170196533203125, 4.28515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 3.0, 10.0, 17.0, 15.0, 24.0, 38.0, 55.0, 79.0, 133.0, 212.0, 365.0, 777.0, 2146.0, 12351.0, 885701.0, 136510.0, 7125.0, 1572.0, 620.0, 306.0, 163.0, 130.0, 73.0, 37.0, 29.0, 10.0, 22.0, 6.0, 12.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.48828125, -7.2672119140625, -7.046142578125, -6.8250732421875, -6.60400390625, -6.3829345703125, -6.161865234375, -5.9407958984375, -5.7197265625, -5.4986572265625, -5.277587890625, -5.0565185546875, -4.83544921875, -4.6143798828125, -4.393310546875, -4.1722412109375, -3.951171875, -3.7301025390625, -3.509033203125, -3.2879638671875, -3.06689453125, -2.8458251953125, -2.624755859375, -2.4036865234375, -2.1826171875, -1.9615478515625, -1.740478515625, -1.5194091796875, -1.29833984375, -1.0772705078125, -0.856201171875, -0.6351318359375, -0.4140625, -0.1929931640625, 0.028076171875, 0.2491455078125, 0.47021484375, 0.6912841796875, 0.912353515625, 1.1334228515625, 1.3544921875, 1.5755615234375, 1.796630859375, 2.0177001953125, 2.23876953125, 2.4598388671875, 2.680908203125, 2.9019775390625, 3.123046875, 3.3441162109375, 3.565185546875, 3.7862548828125, 4.00732421875, 4.2283935546875, 4.449462890625, 4.6705322265625, 4.8916015625, 5.1126708984375, 5.333740234375, 5.5548095703125, 5.77587890625, 5.9969482421875, 6.218017578125, 6.4390869140625, 6.66015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 14.0, 20.0, 18.0, 14.0, 36.0, 33.0, 48.0, 51.0, 63.0, 94.0, 96.0, 101.0, 84.0, 63.0, 47.0, 45.0, 48.0, 27.0, 23.0, 22.0, 10.0, 10.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.40625, -13.983642578125, -13.56103515625, -13.138427734375, -12.7158203125, -12.293212890625, -11.87060546875, -11.447998046875, -11.025390625, -10.602783203125, -10.18017578125, -9.757568359375, -9.3349609375, -8.912353515625, -8.48974609375, -8.067138671875, -7.64453125, -7.221923828125, -6.79931640625, -6.376708984375, -5.9541015625, -5.531494140625, -5.10888671875, -4.686279296875, -4.263671875, -3.841064453125, -3.41845703125, -2.995849609375, -2.5732421875, -2.150634765625, -1.72802734375, -1.305419921875, -0.8828125, -0.460205078125, -0.03759765625, 0.385009765625, 0.8076171875, 1.230224609375, 1.65283203125, 2.075439453125, 2.498046875, 2.920654296875, 3.34326171875, 3.765869140625, 4.1884765625, 4.611083984375, 5.03369140625, 5.456298828125, 5.87890625, 6.301513671875, 6.72412109375, 7.146728515625, 7.5693359375, 7.991943359375, 8.41455078125, 8.837158203125, 9.259765625, 9.682373046875, 10.10498046875, 10.527587890625, 10.9501953125, 11.372802734375, 11.79541015625, 12.218017578125, 12.640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 2.0, 7.0, 8.0, 15.0, 16.0, 24.0, 30.0, 58.0, 83.0, 116.0, 211.0, 379.0, 814.0, 2289.0, 8471.0, 69601.0, 927399.0, 30512.0, 5402.0, 1621.0, 644.0, 327.0, 185.0, 111.0, 68.0, 56.0, 25.0, 22.0, 15.0, 14.0, 6.0, 9.0, 7.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.1396484375, -1.1082916259765625, -1.076934814453125, -1.0455780029296875, -1.01422119140625, -0.9828643798828125, -0.951507568359375, -0.9201507568359375, -0.8887939453125, -0.8574371337890625, -0.826080322265625, -0.7947235107421875, -0.76336669921875, -0.7320098876953125, -0.700653076171875, -0.6692962646484375, -0.637939453125, -0.6065826416015625, -0.575225830078125, -0.5438690185546875, -0.51251220703125, -0.4811553955078125, -0.449798583984375, -0.4184417724609375, -0.3870849609375, -0.3557281494140625, -0.324371337890625, -0.2930145263671875, -0.26165771484375, -0.2303009033203125, -0.198944091796875, -0.1675872802734375, -0.13623046875, -0.1048736572265625, -0.073516845703125, -0.0421600341796875, -0.01080322265625, 0.0205535888671875, 0.051910400390625, 0.0832672119140625, 0.1146240234375, 0.1459808349609375, 0.177337646484375, 0.2086944580078125, 0.24005126953125, 0.2714080810546875, 0.302764892578125, 0.3341217041015625, 0.365478515625, 0.3968353271484375, 0.428192138671875, 0.4595489501953125, 0.49090576171875, 0.5222625732421875, 0.553619384765625, 0.5849761962890625, 0.6163330078125, 0.6476898193359375, 0.679046630859375, 0.7104034423828125, 0.74176025390625, 0.7731170654296875, 0.804473876953125, 0.8358306884765625, 0.8671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 7.0, 8.0, 13.0, 13.0, 28.0, 31.0, 41.0, 73.0, 107.0, 180.0, 139.0, 109.0, 65.0, 38.0, 31.0, 18.0, 21.0, 14.0, 7.0, 8.0, 3.0, 1.0, 5.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020122528076171875, -0.0001951083540916443, -0.00018899142742156982, -0.00018287450075149536, -0.0001767575740814209, -0.00017064064741134644, -0.00016452372074127197, -0.0001584067940711975, -0.00015228986740112305, -0.00014617294073104858, -0.00014005601406097412, -0.00013393908739089966, -0.0001278221607208252, -0.00012170523405075073, -0.00011558830738067627, -0.0001094713807106018, -0.00010335445404052734, -9.723752737045288e-05, -9.112060070037842e-05, -8.500367403030396e-05, -7.888674736022949e-05, -7.276982069015503e-05, -6.665289402008057e-05, -6.0535967350006104e-05, -5.441904067993164e-05, -4.830211400985718e-05, -4.2185187339782715e-05, -3.606826066970825e-05, -2.995133399963379e-05, -2.3834407329559326e-05, -1.7717480659484863e-05, -1.16005539894104e-05, -5.4836273193359375e-06, 6.332993507385254e-07, 6.750226020812988e-06, 1.2867152690887451e-05, 1.8984079360961914e-05, 2.5101006031036377e-05, 3.121793270111084e-05, 3.73348593711853e-05, 4.3451786041259766e-05, 4.956871271133423e-05, 5.568563938140869e-05, 6.180256605148315e-05, 6.791949272155762e-05, 7.403641939163208e-05, 8.015334606170654e-05, 8.6270272731781e-05, 9.238719940185547e-05, 9.850412607192993e-05, 0.0001046210527420044, 0.00011073797941207886, 0.00011685490608215332, 0.00012297183275222778, 0.00012908875942230225, 0.0001352056860923767, 0.00014132261276245117, 0.00014743953943252563, 0.0001535564661026001, 0.00015967339277267456, 0.00016579031944274902, 0.00017190724611282349, 0.00017802417278289795, 0.0001841410994529724, 0.00019025802612304688]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 13.0, 11.0, 18.0, 20.0, 27.0, 63.0, 81.0, 156.0, 388.0, 1019.0, 3483.0, 19167.0, 897338.0, 113720.0, 9529.0, 2098.0, 683.0, 322.0, 152.0, 83.0, 38.0, 38.0, 17.0, 17.0, 11.0, 12.0, 5.0, 9.0, 7.0, 5.0, 5.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.779296875, -0.7435760498046875, -0.707855224609375, -0.6721343994140625, -0.63641357421875, -0.6006927490234375, -0.564971923828125, -0.5292510986328125, -0.4935302734375, -0.4578094482421875, -0.422088623046875, -0.3863677978515625, -0.35064697265625, -0.3149261474609375, -0.279205322265625, -0.2434844970703125, -0.207763671875, -0.1720428466796875, -0.136322021484375, -0.1006011962890625, -0.06488037109375, -0.0291595458984375, 0.006561279296875, 0.0422821044921875, 0.0780029296875, 0.1137237548828125, 0.149444580078125, 0.1851654052734375, 0.22088623046875, 0.2566070556640625, 0.292327880859375, 0.3280487060546875, 0.36376953125, 0.3994903564453125, 0.435211181640625, 0.4709320068359375, 0.50665283203125, 0.5423736572265625, 0.578094482421875, 0.6138153076171875, 0.6495361328125, 0.6852569580078125, 0.720977783203125, 0.7566986083984375, 0.79241943359375, 0.8281402587890625, 0.863861083984375, 0.8995819091796875, 0.935302734375, 0.9710235595703125, 1.006744384765625, 1.0424652099609375, 1.07818603515625, 1.1139068603515625, 1.149627685546875, 1.1853485107421875, 1.2210693359375, 1.2567901611328125, 1.292510986328125, 1.3282318115234375, 1.36395263671875, 1.3996734619140625, 1.435394287109375, 1.4711151123046875, 1.5068359375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 4.0, 15.0, 15.0, 17.0, 22.0, 42.0, 36.0, 72.0, 110.0, 181.0, 145.0, 108.0, 67.0, 41.0, 28.0, 23.0, 20.0, 17.0, 7.0, 10.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.685546875, -0.65277099609375, -0.6199951171875, -0.58721923828125, -0.554443359375, -0.52166748046875, -0.4888916015625, -0.45611572265625, -0.42333984375, -0.39056396484375, -0.3577880859375, -0.32501220703125, -0.292236328125, -0.25946044921875, -0.2266845703125, -0.19390869140625, -0.1611328125, -0.12835693359375, -0.0955810546875, -0.06280517578125, -0.030029296875, 0.00274658203125, 0.0355224609375, 0.06829833984375, 0.10107421875, 0.13385009765625, 0.1666259765625, 0.19940185546875, 0.232177734375, 0.26495361328125, 0.2977294921875, 0.33050537109375, 0.36328125, 0.39605712890625, 0.4288330078125, 0.46160888671875, 0.494384765625, 0.52716064453125, 0.5599365234375, 0.59271240234375, 0.62548828125, 0.65826416015625, 0.6910400390625, 0.72381591796875, 0.756591796875, 0.78936767578125, 0.8221435546875, 0.85491943359375, 0.8876953125, 0.92047119140625, 0.9532470703125, 0.98602294921875, 1.018798828125, 1.05157470703125, 1.0843505859375, 1.11712646484375, 1.14990234375, 1.18267822265625, 1.2154541015625, 1.24822998046875, 1.281005859375, 1.31378173828125, 1.3465576171875, 1.37933349609375, 1.412109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 14.0, 37.0, 83.0, 631.0, 163.0, 41.0, 22.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5894775390625, -42.42793273925781, -40.26639175415039, -38.10485076904297, -35.94330596923828, -33.781761169433594, -31.620220184326172, -29.458677291870117, -27.297134399414062, -25.135591506958008, -22.974048614501953, -20.8125057220459, -18.650962829589844, -16.48941993713379, -14.327877044677734, -12.16633415222168, -10.004791259765625, -7.84324836730957, -5.681705474853516, -3.520162582397461, -1.3586196899414062, 0.8029232025146484, 2.964466094970703, 5.126008987426758, 7.2875518798828125, 9.449094772338867, 11.610637664794922, 13.772180557250977, 15.933723449707031, 18.095266342163086, 20.25680923461914, 22.418352127075195, 24.57988739013672, 26.741430282592773, 28.902973175048828, 31.064516067504883, 33.22605895996094, 35.387603759765625, 37.54914474487305, 39.71068572998047, 41.872230529785156, 44.033775329589844, 46.195316314697266, 48.35685729980469, 50.518402099609375, 52.67994689941406, 54.841487884521484, 57.003028869628906, 59.164573669433594, 61.32611846923828, 63.4876594543457, 65.64920043945312, 67.81074523925781, 69.9722900390625, 72.13383483886719, 74.29537200927734, 76.45691680908203, 78.61846160888672, 80.77999877929688, 82.94154357910156, 85.10308837890625, 87.26463317871094, 89.42617797851562, 91.58771514892578, 93.74925994873047]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 7.0, 7.0, 10.0, 11.0, 15.0, 14.0, 8.0, 17.0, 21.0, 26.0, 22.0, 22.0, 24.0, 30.0, 96.0, 323.0, 92.0, 38.0, 28.0, 34.0, 19.0, 25.0, 15.0, 17.0, 18.0, 17.0, 3.0, 8.0, 6.0, 8.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.01758575439453, -29.12090301513672, -28.224220275878906, -27.32753562927246, -26.43085289001465, -25.534170150756836, -24.63748550415039, -23.740802764892578, -22.844120025634766, -21.947437286376953, -21.05075454711914, -20.154069900512695, -19.257387161254883, -18.36070442199707, -17.464019775390625, -16.567337036132812, -15.670654296875, -14.773971557617188, -13.877287864685059, -12.98060417175293, -12.083921432495117, -11.187238693237305, -10.290555000305176, -9.393871307373047, -8.497188568115234, -7.600505352020264, -6.703822135925293, -5.807138919830322, -4.910455703735352, -4.013772487640381, -3.11708927154541, -2.2204060554504395, -1.3237247467041016, -0.42704153060913086, 0.46964168548583984, 1.3663249015808105, 2.2630081176757812, 3.159691333770752, 4.056374549865723, 4.953057765960693, 5.849740982055664, 6.746424198150635, 7.6431074142456055, 8.539791107177734, 9.436473846435547, 10.33315658569336, 11.229840278625488, 12.126523971557617, 13.02320671081543, 13.919889450073242, 14.816573143005371, 15.7132568359375, 16.609939575195312, 17.506622314453125, 18.403305053710938, 19.299989700317383, 20.196672439575195, 21.093355178833008, 21.990039825439453, 22.886722564697266, 23.783405303955078, 24.68008804321289, 25.576770782470703, 26.47345542907715, 27.37013816833496]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 4.0, 10.0, 8.0, 6.0, 12.0, 8.0, 15.0, 16.0, 15.0, 16.0, 28.0, 26.0, 34.0, 25.0, 38.0, 111.0, 229.0, 95.0, 48.0, 28.0, 32.0, 30.0, 19.0, 21.0, 20.0, 13.0, 16.0, 7.0, 9.0, 14.0, 11.0, 3.0, 6.0, 6.0, 2.0, 8.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.05859375, -1.994842529296875, -1.93109130859375, -1.867340087890625, -1.8035888671875, -1.739837646484375, -1.67608642578125, -1.612335205078125, -1.548583984375, -1.484832763671875, -1.42108154296875, -1.357330322265625, -1.2935791015625, -1.229827880859375, -1.16607666015625, -1.102325439453125, -1.03857421875, -0.974822998046875, -0.91107177734375, -0.847320556640625, -0.7835693359375, -0.719818115234375, -0.65606689453125, -0.592315673828125, -0.528564453125, -0.464813232421875, -0.40106201171875, -0.337310791015625, -0.2735595703125, -0.209808349609375, -0.14605712890625, -0.082305908203125, -0.0185546875, 0.045196533203125, 0.10894775390625, 0.172698974609375, 0.2364501953125, 0.300201416015625, 0.36395263671875, 0.427703857421875, 0.491455078125, 0.555206298828125, 0.61895751953125, 0.682708740234375, 0.7464599609375, 0.810211181640625, 0.87396240234375, 0.937713623046875, 1.00146484375, 1.065216064453125, 1.12896728515625, 1.192718505859375, 1.2564697265625, 1.320220947265625, 1.38397216796875, 1.447723388671875, 1.511474609375, 1.575225830078125, 1.63897705078125, 1.702728271484375, 1.7664794921875, 1.830230712890625, 1.89398193359375, 1.957733154296875, 2.021484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 1.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 6.0, 4.0, 10.0, 29.0, 15.0, 31.0, 34.0, 52.0, 72.0, 152.0, 287.0, 766.0, 2809.0, 24296.0, 8348573.0, 8645.0, 1647.0, 513.0, 200.0, 138.0, 77.0, 50.0, 38.0, 19.0, 4.0, 12.0, 8.0, 3.0, 15.0, 1.0, 3.0, 8.0, 9.0, 3.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0], "bins": [-25.266550064086914, -24.57072639465332, -23.874900817871094, -23.1790771484375, -22.483253479003906, -21.78742790222168, -21.091604232788086, -20.39577865600586, -19.699954986572266, -19.004131317138672, -18.308305740356445, -17.61248207092285, -16.916658401489258, -16.22083282470703, -15.525009155273438, -14.829184532165527, -14.133360862731934, -13.437536239624023, -12.74171257019043, -12.04588794708252, -11.35006332397461, -10.654239654541016, -9.958415031433105, -9.262590408325195, -8.566766738891602, -7.87094259262085, -7.1751179695129395, -6.4792938232421875, -5.783469200134277, -5.087645053863525, -4.391820907592773, -3.6959962844848633, -3.000171661376953, -2.304347276687622, -1.6085230112075806, -0.9126987457275391, -0.216874361038208, 0.47895002365112305, 1.174774169921875, 1.8705987930297852, 2.566422939300537, 3.262247323989868, 3.958071708679199, 4.653895854949951, 5.349720001220703, 6.045544624328613, 6.741368770599365, 7.437193393707275, 8.133017539978027, 8.828842163085938, 9.524665832519531, 10.220490455627441, 10.916315078735352, 11.612138748168945, 12.307963371276855, 13.003787994384766, 13.69961166381836, 14.39543628692627, 15.091259956359863, 15.787084579467773, 16.482908248901367, 17.178733825683594, 17.874557495117188, 18.57038116455078, 19.266206741333008]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 2.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.274808406829834, -6.750971794128418, -6.227134704589844, -5.7032976150512695, -5.1794610023498535, -4.6556243896484375, -4.131787300109863, -3.607950448989868, -3.084113597869873, -2.560276746749878, -2.036439895629883, -1.5126030445098877, -0.9887661933898926, -0.46492934226989746, 0.058907508850097656, 0.5827443599700928, 1.106581211090088, 1.630418062210083, 2.154254913330078, 2.6780917644500732, 3.2019286155700684, 3.7257654666900635, 4.249602317810059, 4.773439407348633, 5.297276020050049, 5.821112632751465, 6.344949722290039, 6.868786811828613, 7.392623424530029, 7.916460037231445, 8.44029712677002, 8.964134216308594, 9.487972259521484, 10.011809349060059, 10.535646438598633, 11.05948257446289, 11.583319664001465, 12.107156753540039, 12.630992889404297, 13.154829978942871, 13.678667068481445, 14.20250415802002, 14.726341247558594, 15.250177383422852, 15.774014472961426, 16.2978515625, 16.821687698364258, 17.34552574157715, 17.869361877441406, 18.393198013305664, 18.917036056518555, 19.440872192382812, 19.964710235595703, 20.48854637145996, 21.01238250732422, 21.53622055053711, 22.060056686401367, 22.583892822265625, 23.107730865478516, 23.631567001342773, 24.15540313720703, 24.679241180419922, 25.20307731628418, 25.72691535949707, 26.250751495361328]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 8.0, 12.0, 21.0, 39.0, 68.0, 105.0, 201.0, 438.0, 1033.0, 3259.0, 14337.0, 114720.0, 335215.0, 44581.0, 7056.0, 1803.0, 675.0, 291.0, 156.0, 85.0, 51.0, 38.0, 18.0, 21.0, 6.0, 8.0, 1.0, 6.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.078125, -22.128173828125, -21.17822265625, -20.228271484375, -19.2783203125, -18.328369140625, -17.37841796875, -16.428466796875, -15.478515625, -14.528564453125, -13.57861328125, -12.628662109375, -11.6787109375, -10.728759765625, -9.77880859375, -8.828857421875, -7.87890625, -6.928955078125, -5.97900390625, -5.029052734375, -4.0791015625, -3.129150390625, -2.17919921875, -1.229248046875, -0.279296875, 0.670654296875, 1.62060546875, 2.570556640625, 3.5205078125, 4.470458984375, 5.42041015625, 6.370361328125, 7.3203125, 8.270263671875, 9.22021484375, 10.170166015625, 11.1201171875, 12.070068359375, 13.02001953125, 13.969970703125, 14.919921875, 15.869873046875, 16.81982421875, 17.769775390625, 18.7197265625, 19.669677734375, 20.61962890625, 21.569580078125, 22.51953125, 23.469482421875, 24.41943359375, 25.369384765625, 26.3193359375, 27.269287109375, 28.21923828125, 29.169189453125, 30.119140625, 31.069091796875, 32.01904296875, 32.968994140625, 33.9189453125, 34.868896484375, 35.81884765625, 36.768798828125, 37.71875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 13.0, 13.0, 17.0, 17.0, 22.0, 23.0, 27.0, 35.0, 54.0, 55.0, 63.0, 71.0, 62.0, 83.0, 64.0, 54.0, 59.0, 53.0, 44.0, 37.0, 29.0, 20.0, 22.0, 7.0, 13.0, 10.0, 3.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.060546875, -1.975677490234375, -1.89080810546875, -1.805938720703125, -1.7210693359375, -1.636199951171875, -1.55133056640625, -1.466461181640625, -1.381591796875, -1.296722412109375, -1.21185302734375, -1.126983642578125, -1.0421142578125, -0.957244873046875, -0.87237548828125, -0.787506103515625, -0.70263671875, -0.617767333984375, -0.53289794921875, -0.448028564453125, -0.3631591796875, -0.278289794921875, -0.19342041015625, -0.108551025390625, -0.023681640625, 0.061187744140625, 0.14605712890625, 0.230926513671875, 0.3157958984375, 0.400665283203125, 0.48553466796875, 0.570404052734375, 0.6552734375, 0.740142822265625, 0.82501220703125, 0.909881591796875, 0.9947509765625, 1.079620361328125, 1.16448974609375, 1.249359130859375, 1.334228515625, 1.419097900390625, 1.50396728515625, 1.588836669921875, 1.6737060546875, 1.758575439453125, 1.84344482421875, 1.928314208984375, 2.01318359375, 2.098052978515625, 2.18292236328125, 2.267791748046875, 2.3526611328125, 2.437530517578125, 2.52239990234375, 2.607269287109375, 2.692138671875, 2.777008056640625, 2.86187744140625, 2.946746826171875, 3.0316162109375, 3.116485595703125, 3.20135498046875, 3.286224365234375, 3.37109375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 24.0, 69.0, 119.0, 118.0, 52.0, 28.0, 17.0, 11.0, 5.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-36.02106857299805, -35.294490814208984, -34.567909240722656, -33.841331481933594, -33.11475372314453, -32.3881721496582, -31.66159439086914, -30.935014724731445, -30.20843505859375, -29.481855392456055, -28.755277633666992, -28.028697967529297, -27.3021183013916, -26.575538635253906, -25.848960876464844, -25.12238121032715, -24.395803451538086, -23.66922378540039, -22.942646026611328, -22.216066360473633, -21.489486694335938, -20.762908935546875, -20.03632926940918, -19.309749603271484, -18.583171844482422, -17.856592178344727, -17.130014419555664, -16.40343475341797, -15.676855087280273, -14.950276374816895, -14.223697662353516, -13.49711799621582, -12.770537376403809, -12.04395866394043, -11.317378997802734, -10.590800285339355, -9.864221572875977, -9.137641906738281, -8.411063194274902, -7.684484004974365, -6.957904815673828, -6.231325626373291, -5.504746437072754, -4.778167724609375, -4.051588535308838, -3.325009346008301, -2.598430633544922, -1.8718514442443848, -1.1452722549438477, -0.4186931848526001, 0.30788588523864746, 1.0344648361206055, 1.7610440254211426, 2.4876232147216797, 3.2142019271850586, 3.9407811164855957, 4.667360305786133, 5.39393949508667, 6.120518684387207, 6.847097396850586, 7.573676586151123, 8.30025577545166, 9.026834487915039, 9.753414154052734, 10.479992866516113]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 6.0, 12.0, 13.0, 38.0, 73.0, 116.0, 75.0, 48.0, 30.0, 14.0, 9.0, 11.0, 1.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.470895767211914, -10.993066787719727, -10.515237808227539, -10.037407875061035, -9.559578895568848, -9.08174991607666, -8.603920936584473, -8.126091003417969, -7.648262023925781, -7.170433044433594, -6.692603588104248, -6.2147746086120605, -5.736945152282715, -5.259116172790527, -4.78128719329834, -4.303457736968994, -3.8256287574768066, -3.34779953956604, -2.8699703216552734, -2.392141342163086, -1.9143120050430298, -1.4364829063415527, -0.9586536884307861, -0.48082447052001953, -0.0029952526092529297, 0.4748339354991913, 0.9526631236076355, 1.4304922819137573, 1.908321499824524, 2.386150598526001, 2.8639798164367676, 3.341809034347534, 3.819638252258301, 4.297467231750488, 4.775296688079834, 5.2531256675720215, 5.730955123901367, 6.208784103393555, 6.686613082885742, 7.164442539215088, 7.642271995544434, 8.120100975036621, 8.597929954528809, 9.075759887695312, 9.5535888671875, 10.031417846679688, 10.509246826171875, 10.987075805664062, 11.46490478515625, 11.942733764648438, 12.420562744140625, 12.898392677307129, 13.376221656799316, 13.854050636291504, 14.331879615783691, 14.809709548950195, 15.287538528442383, 15.76536750793457, 16.243196487426758, 16.721025466918945, 17.198854446411133, 17.676685333251953, 18.15451431274414, 18.632343292236328, 19.110172271728516]}, "train/train_runtime": 4813.5869, "train/train_samples_per_second": 5.929, "train/train_steps_per_second": 0.062, "train/total_flos": 0.0, "train/train_loss": 4.3407110846805255, "eval/loss": 4.175893783569336, "eval/wer": 2.4477588258627527, "eval/runtime": 935.1251, "eval/samples_per_second": 2.825, "eval/steps_per_second": 0.236} \ No newline at end of file +{"train/loss": 4.4712, "train/learning_rate": 1.776e-05, "train/epoch": 1.0, "train/global_step": 297, "_runtime": 6038, "_timestamp": 1646144049, "_step": 298, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 80.0, 454.0, 412.0, 63.0, 7.0], "bins": [-318.0708923339844, -312.8525390625, -307.6341552734375, -302.4158020019531, -297.19744873046875, -291.97906494140625, -286.7607116699219, -281.5423583984375, -276.323974609375, -271.1056213378906, -265.8872375488281, -260.66888427734375, -255.45053100585938, -250.23216247558594, -245.0137939453125, -239.79544067382812, -234.57708740234375, -229.3587188720703, -224.14036560058594, -218.9219970703125, -213.70364379882812, -208.4852752685547, -203.26690673828125, -198.04855346679688, -192.83018493652344, -187.61181640625, -182.39346313476562, -177.1750946044922, -171.95672607421875, -166.73837280273438, -161.52000427246094, -156.3016357421875, -151.0832977294922, -145.86492919921875, -140.64657592773438, -135.42820739746094, -130.2098388671875, -124.99148559570312, -119.77311706542969, -114.55475616455078, -109.33639526367188, -104.11803436279297, -98.89967346191406, -93.68130493164062, -88.46294403076172, -83.24458312988281, -78.02621459960938, -72.80785369873047, -67.58949279785156, -62.371131896972656, -57.152767181396484, -51.93440246582031, -46.716041564941406, -41.4976806640625, -36.27931594848633, -31.060951232910156, -25.842588424682617, -20.624225616455078, -15.405862808227539, -10.1875, -4.969137191772461, 0.24922561645507812, 5.467588424682617, 10.685953140258789, 15.904314041137695]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 6.0, 7.0, 3.0, 10.0, 11.0, 9.0, 19.0, 15.0, 18.0, 23.0, 24.0, 31.0, 39.0, 35.0, 50.0, 48.0, 32.0, 32.0, 55.0, 49.0, 46.0, 44.0, 40.0, 48.0, 49.0, 35.0, 35.0, 17.0, 25.0, 20.0, 24.0, 21.0, 10.0, 11.0, 17.0, 12.0, 11.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-53.798095703125, -52.326568603515625, -50.855045318603516, -49.38351821899414, -47.911991119384766, -46.440467834472656, -44.96894073486328, -43.497413635253906, -42.0258903503418, -40.55436325073242, -39.08283996582031, -37.61131286621094, -36.13978576660156, -34.66826248168945, -33.19673538208008, -31.725210189819336, -30.25368309020996, -28.78215789794922, -27.310630798339844, -25.8391056060791, -24.36758041381836, -22.896053314208984, -21.424528121948242, -19.9530029296875, -18.481475830078125, -17.009950637817383, -15.538424491882324, -14.066898345947266, -12.595373153686523, -11.123847007751465, -9.652320861816406, -8.180795669555664, -6.709270477294922, -5.2377448081970215, -3.766218900680542, -2.2946929931640625, -0.8231673240661621, 0.6483583450317383, 2.119884490966797, 3.591409683227539, 5.062935829162598, 6.534461498260498, 8.005987167358398, 9.477513313293457, 10.949039459228516, 12.420564651489258, 13.892090797424316, 15.363615989685059, 16.835142135620117, 18.30666732788086, 19.778194427490234, 21.249719619750977, 22.72124481201172, 24.192771911621094, 25.664297103881836, 27.135822296142578, 28.607349395751953, 30.078874588012695, 31.55040168762207, 33.02192687988281, 34.49345397949219, 35.9649772644043, 37.43650436401367, 38.90802764892578, 40.379554748535156]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 9.0, 4.0, 11.0, 7.0, 11.0, 16.0, 21.0, 21.0, 19.0, 34.0, 36.0, 43.0, 53.0, 50.0, 49.0, 59.0, 40.0, 65.0, 44.0, 51.0, 36.0, 53.0, 32.0, 36.0, 40.0, 33.0, 17.0, 18.0, 20.0, 20.0, 15.0, 8.0, 7.0, 6.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.6640625, -2.56243896484375, -2.4608154296875, -2.35919189453125, -2.257568359375, -2.15594482421875, -2.0543212890625, -1.95269775390625, -1.85107421875, -1.74945068359375, -1.6478271484375, -1.54620361328125, -1.444580078125, -1.34295654296875, -1.2413330078125, -1.13970947265625, -1.0380859375, -0.93646240234375, -0.8348388671875, -0.73321533203125, -0.631591796875, -0.52996826171875, -0.4283447265625, -0.32672119140625, -0.22509765625, -0.12347412109375, -0.0218505859375, 0.07977294921875, 0.181396484375, 0.28302001953125, 0.3846435546875, 0.48626708984375, 0.587890625, 0.68951416015625, 0.7911376953125, 0.89276123046875, 0.994384765625, 1.09600830078125, 1.1976318359375, 1.29925537109375, 1.40087890625, 1.50250244140625, 1.6041259765625, 1.70574951171875, 1.807373046875, 1.90899658203125, 2.0106201171875, 2.11224365234375, 2.2138671875, 2.31549072265625, 2.4171142578125, 2.51873779296875, 2.620361328125, 2.72198486328125, 2.8236083984375, 2.92523193359375, 3.02685546875, 3.12847900390625, 3.2301025390625, 3.33172607421875, 3.433349609375, 3.53497314453125, 3.6365966796875, 3.73822021484375, 3.83984375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 6.0, 14.0, 15.0, 31.0, 36.0, 71.0, 96.0, 141.0, 272.0, 431.0, 785.0, 1472.0, 3077.0, 8438.0, 35158.0, 282709.0, 2640571.0, 1102198.0, 91797.0, 16868.0, 5230.0, 2197.0, 1143.0, 627.0, 311.0, 223.0, 139.0, 83.0, 62.0, 28.0, 16.0, 12.0, 8.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-13.3515625, -13.0157470703125, -12.679931640625, -12.3441162109375, -12.00830078125, -11.6724853515625, -11.336669921875, -11.0008544921875, -10.6650390625, -10.3292236328125, -9.993408203125, -9.6575927734375, -9.32177734375, -8.9859619140625, -8.650146484375, -8.3143310546875, -7.978515625, -7.6427001953125, -7.306884765625, -6.9710693359375, -6.63525390625, -6.2994384765625, -5.963623046875, -5.6278076171875, -5.2919921875, -4.9561767578125, -4.620361328125, -4.2845458984375, -3.94873046875, -3.6129150390625, -3.277099609375, -2.9412841796875, -2.60546875, -2.2696533203125, -1.933837890625, -1.5980224609375, -1.26220703125, -0.9263916015625, -0.590576171875, -0.2547607421875, 0.0810546875, 0.4168701171875, 0.752685546875, 1.0885009765625, 1.42431640625, 1.7601318359375, 2.095947265625, 2.4317626953125, 2.767578125, 3.1033935546875, 3.439208984375, 3.7750244140625, 4.11083984375, 4.4466552734375, 4.782470703125, 5.1182861328125, 5.4541015625, 5.7899169921875, 6.125732421875, 6.4615478515625, 6.79736328125, 7.1331787109375, 7.468994140625, 7.8048095703125, 8.140625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 12.0, 5.0, 9.0, 21.0, 15.0, 35.0, 44.0, 46.0, 61.0, 90.0, 149.0, 188.0, 275.0, 374.0, 517.0, 519.0, 462.0, 355.0, 266.0, 194.0, 133.0, 86.0, 68.0, 41.0, 32.0, 21.0, 15.0, 11.0, 8.0, 8.0, 2.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.4921875, -11.1356201171875, -10.779052734375, -10.4224853515625, -10.06591796875, -9.7093505859375, -9.352783203125, -8.9962158203125, -8.6396484375, -8.2830810546875, -7.926513671875, -7.5699462890625, -7.21337890625, -6.8568115234375, -6.500244140625, -6.1436767578125, -5.787109375, -5.4305419921875, -5.073974609375, -4.7174072265625, -4.36083984375, -4.0042724609375, -3.647705078125, -3.2911376953125, -2.9345703125, -2.5780029296875, -2.221435546875, -1.8648681640625, -1.50830078125, -1.1517333984375, -0.795166015625, -0.4385986328125, -0.08203125, 0.2745361328125, 0.631103515625, 0.9876708984375, 1.34423828125, 1.7008056640625, 2.057373046875, 2.4139404296875, 2.7705078125, 3.1270751953125, 3.483642578125, 3.8402099609375, 4.19677734375, 4.5533447265625, 4.909912109375, 5.2664794921875, 5.623046875, 5.9796142578125, 6.336181640625, 6.6927490234375, 7.04931640625, 7.4058837890625, 7.762451171875, 8.1190185546875, 8.4755859375, 8.8321533203125, 9.188720703125, 9.5452880859375, 9.90185546875, 10.2584228515625, 10.614990234375, 10.9715576171875, 11.328125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 5.0, 6.0, 12.0, 17.0, 24.0, 41.0, 55.0, 88.0, 124.0, 161.0, 314.0, 490.0, 991.0, 2279.0, 8063.0, 299143.0, 3807389.0, 66341.0, 5035.0, 1750.0, 788.0, 416.0, 246.0, 162.0, 112.0, 60.0, 56.0, 30.0, 19.0, 17.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.59375, -34.380859375, -33.16796875, -31.955078125, -30.7421875, -29.529296875, -28.31640625, -27.103515625, -25.890625, -24.677734375, -23.46484375, -22.251953125, -21.0390625, -19.826171875, -18.61328125, -17.400390625, -16.1875, -14.974609375, -13.76171875, -12.548828125, -11.3359375, -10.123046875, -8.91015625, -7.697265625, -6.484375, -5.271484375, -4.05859375, -2.845703125, -1.6328125, -0.419921875, 0.79296875, 2.005859375, 3.21875, 4.431640625, 5.64453125, 6.857421875, 8.0703125, 9.283203125, 10.49609375, 11.708984375, 12.921875, 14.134765625, 15.34765625, 16.560546875, 17.7734375, 18.986328125, 20.19921875, 21.412109375, 22.625, 23.837890625, 25.05078125, 26.263671875, 27.4765625, 28.689453125, 29.90234375, 31.115234375, 32.328125, 33.541015625, 34.75390625, 35.966796875, 37.1796875, 38.392578125, 39.60546875, 40.818359375, 42.03125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 10.0, 40.0, 97.0, 209.0, 276.0, 201.0, 117.0, 37.0, 14.0, 6.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.43179321289062, -77.31104278564453, -75.19029235839844, -73.06954956054688, -70.94879913330078, -68.82804870605469, -66.7072982788086, -64.5865478515625, -62.46580505371094, -60.345054626464844, -58.224308013916016, -56.10355758666992, -53.982810974121094, -51.862060546875, -49.741310119628906, -47.62056350708008, -45.499813079833984, -43.37906265258789, -41.25831604003906, -39.13756561279297, -37.01681900024414, -34.89606857299805, -32.77532196044922, -30.654571533203125, -28.533823013305664, -26.413074493408203, -24.292325973510742, -22.17157745361328, -20.050827026367188, -17.93008041381836, -15.809329986572266, -13.688581466674805, -11.567832946777344, -9.447084426879883, -7.326335430145264, -5.2055864334106445, -3.0848379135131836, -0.9640893936157227, 1.1566600799560547, 3.2774085998535156, 5.398157119750977, 7.5189056396484375, 9.639654159545898, 11.760403633117676, 13.881152153015137, 16.00189971923828, 18.122650146484375, 20.243398666381836, 22.364147186279297, 24.484895706176758, 26.60564422607422, 28.726394653320312, 30.84714126586914, 32.967891693115234, 35.08863830566406, 37.209388732910156, 39.33013916015625, 41.450889587402344, 43.57163619995117, 45.692386627197266, 47.813133239746094, 49.93388366699219, 52.05463409423828, 54.17538070678711, 56.29612731933594]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 6.0, 6.0, 10.0, 6.0, 7.0, 9.0, 12.0, 11.0, 14.0, 7.0, 22.0, 14.0, 23.0, 29.0, 20.0, 27.0, 26.0, 42.0, 30.0, 37.0, 39.0, 45.0, 31.0, 35.0, 29.0, 38.0, 23.0, 44.0, 30.0, 33.0, 32.0, 49.0, 35.0, 20.0, 28.0, 18.0, 14.0, 18.0, 25.0, 15.0, 12.0, 10.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-35.123512268066406, -34.12685012817383, -33.13018798828125, -32.13352584838867, -31.136863708496094, -30.140201568603516, -29.143539428710938, -28.14687728881836, -27.15021514892578, -26.153553009033203, -25.156890869140625, -24.160228729248047, -23.16356658935547, -22.16690444946289, -21.170242309570312, -20.173580169677734, -19.176916122436523, -18.180253982543945, -17.183591842651367, -16.18692970275879, -15.190267562866211, -14.193605422973633, -13.196942329406738, -12.20028018951416, -11.203618049621582, -10.206955909729004, -9.210293769836426, -8.213630676269531, -7.216969013214111, -6.220306873321533, -5.223644256591797, -4.226982116699219, -3.230318069458008, -2.2336559295654297, -1.2369935512542725, -0.24033117294311523, 0.7563309669494629, 1.752993106842041, 2.7496557235717773, 3.7463178634643555, 4.742980003356934, 5.739642143249512, 6.73630428314209, 7.732966899871826, 8.729629516601562, 9.72629165649414, 10.722953796386719, 11.719615936279297, 12.716278076171875, 13.712940216064453, 14.709602355957031, 15.70626449584961, 16.702926635742188, 17.699588775634766, 18.696250915527344, 19.692913055419922, 20.6895751953125, 21.686237335205078, 22.682899475097656, 23.679561614990234, 24.676223754882812, 25.67288589477539, 26.66954803466797, 27.666210174560547, 28.662874221801758]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 10.0, 10.0, 12.0, 19.0, 18.0, 22.0, 22.0, 27.0, 25.0, 23.0, 34.0, 50.0, 36.0, 34.0, 39.0, 42.0, 66.0, 37.0, 48.0, 46.0, 34.0, 28.0, 39.0, 30.0, 28.0, 35.0, 19.0, 24.0, 19.0, 23.0, 20.0, 12.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.703125, -2.61004638671875, -2.5169677734375, -2.42388916015625, -2.330810546875, -2.23773193359375, -2.1446533203125, -2.05157470703125, -1.95849609375, -1.86541748046875, -1.7723388671875, -1.67926025390625, -1.586181640625, -1.49310302734375, -1.4000244140625, -1.30694580078125, -1.2138671875, -1.12078857421875, -1.0277099609375, -0.93463134765625, -0.841552734375, -0.74847412109375, -0.6553955078125, -0.56231689453125, -0.46923828125, -0.37615966796875, -0.2830810546875, -0.19000244140625, -0.096923828125, -0.00384521484375, 0.0892333984375, 0.18231201171875, 0.275390625, 0.36846923828125, 0.4615478515625, 0.55462646484375, 0.647705078125, 0.74078369140625, 0.8338623046875, 0.92694091796875, 1.02001953125, 1.11309814453125, 1.2061767578125, 1.29925537109375, 1.392333984375, 1.48541259765625, 1.5784912109375, 1.67156982421875, 1.7646484375, 1.85772705078125, 1.9508056640625, 2.04388427734375, 2.136962890625, 2.23004150390625, 2.3231201171875, 2.41619873046875, 2.50927734375, 2.60235595703125, 2.6954345703125, 2.78851318359375, 2.881591796875, 2.97467041015625, 3.0677490234375, 3.16082763671875, 3.25390625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 4.0, 3.0, 14.0, 15.0, 23.0, 30.0, 52.0, 64.0, 113.0, 133.0, 196.0, 287.0, 462.0, 679.0, 1058.0, 1498.0, 2315.0, 3654.0, 5690.0, 9052.0, 14721.0, 24835.0, 41765.0, 73576.0, 141417.0, 293402.0, 199972.0, 97923.0, 54501.0, 31077.0, 18649.0, 11343.0, 7104.0, 4453.0, 2967.0, 1758.0, 1260.0, 808.0, 543.0, 360.0, 231.0, 166.0, 109.0, 95.0, 53.0, 43.0, 25.0, 18.0, 12.0, 9.0, 7.0, 3.0, 5.0, 2.0, 3.0, 2.0], "bins": [-0.60888671875, -0.5908355712890625, -0.572784423828125, -0.5547332763671875, -0.53668212890625, -0.5186309814453125, -0.500579833984375, -0.4825286865234375, -0.4644775390625, -0.4464263916015625, -0.428375244140625, -0.4103240966796875, -0.39227294921875, -0.3742218017578125, -0.356170654296875, -0.3381195068359375, -0.320068359375, -0.3020172119140625, -0.283966064453125, -0.2659149169921875, -0.24786376953125, -0.2298126220703125, -0.211761474609375, -0.1937103271484375, -0.1756591796875, -0.1576080322265625, -0.139556884765625, -0.1215057373046875, -0.10345458984375, -0.0854034423828125, -0.067352294921875, -0.0493011474609375, -0.03125, -0.0131988525390625, 0.004852294921875, 0.0229034423828125, 0.04095458984375, 0.0590057373046875, 0.077056884765625, 0.0951080322265625, 0.1131591796875, 0.1312103271484375, 0.149261474609375, 0.1673126220703125, 0.18536376953125, 0.2034149169921875, 0.221466064453125, 0.2395172119140625, 0.257568359375, 0.2756195068359375, 0.293670654296875, 0.3117218017578125, 0.32977294921875, 0.3478240966796875, 0.365875244140625, 0.3839263916015625, 0.4019775390625, 0.4200286865234375, 0.438079833984375, 0.4561309814453125, 0.47418212890625, 0.4922332763671875, 0.510284423828125, 0.5283355712890625, 0.54638671875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 7.0, 13.0, 10.0, 11.0, 11.0, 6.0, 17.0, 20.0, 22.0, 21.0, 28.0, 27.0, 29.0, 48.0, 39.0, 36.0, 33.0, 34.0, 53.0, 41.0, 1065.0, 39.0, 31.0, 37.0, 29.0, 41.0, 34.0, 25.0, 21.0, 21.0, 17.0, 21.0, 19.0, 26.0, 17.0, 7.0, 3.0, 10.0, 10.0, 12.0, 4.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.71875, -1.6635589599609375, -1.608367919921875, -1.5531768798828125, -1.49798583984375, -1.4427947998046875, -1.387603759765625, -1.3324127197265625, -1.2772216796875, -1.2220306396484375, -1.166839599609375, -1.1116485595703125, -1.05645751953125, -1.0012664794921875, -0.946075439453125, -0.8908843994140625, -0.835693359375, -0.7805023193359375, -0.725311279296875, -0.6701202392578125, -0.61492919921875, -0.5597381591796875, -0.504547119140625, -0.4493560791015625, -0.3941650390625, -0.3389739990234375, -0.283782958984375, -0.2285919189453125, -0.17340087890625, -0.1182098388671875, -0.063018798828125, -0.0078277587890625, 0.04736328125, 0.1025543212890625, 0.157745361328125, 0.2129364013671875, 0.26812744140625, 0.3233184814453125, 0.378509521484375, 0.4337005615234375, 0.4888916015625, 0.5440826416015625, 0.599273681640625, 0.6544647216796875, 0.70965576171875, 0.7648468017578125, 0.820037841796875, 0.8752288818359375, 0.930419921875, 0.9856109619140625, 1.040802001953125, 1.0959930419921875, 1.15118408203125, 1.2063751220703125, 1.261566162109375, 1.3167572021484375, 1.3719482421875, 1.4271392822265625, 1.482330322265625, 1.5375213623046875, 1.59271240234375, 1.6479034423828125, 1.703094482421875, 1.7582855224609375, 1.8134765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 16.0, 18.0, 23.0, 31.0, 40.0, 61.0, 75.0, 134.0, 165.0, 257.0, 337.0, 500.0, 768.0, 1104.0, 1613.0, 2353.0, 3652.0, 5617.0, 8786.0, 14016.0, 21586.0, 35538.0, 59947.0, 109962.0, 217283.0, 1306879.0, 129964.0, 68845.0, 39267.0, 24056.0, 15183.0, 9893.0, 6430.0, 4139.0, 2755.0, 1840.0, 1223.0, 899.0, 608.0, 365.0, 263.0, 194.0, 123.0, 97.0, 70.0, 42.0, 39.0, 27.0, 11.0, 11.0, 12.0, 5.0, 2.0, 5.0, 0.0, 2.0], "bins": [-0.52783203125, -0.5118980407714844, -0.49596405029296875, -0.4800300598144531, -0.4640960693359375, -0.4481620788574219, -0.43222808837890625, -0.4162940979003906, -0.400360107421875, -0.3844261169433594, -0.36849212646484375, -0.3525581359863281, -0.3366241455078125, -0.3206901550292969, -0.30475616455078125, -0.2888221740722656, -0.27288818359375, -0.2569541931152344, -0.24102020263671875, -0.22508621215820312, -0.2091522216796875, -0.19321823120117188, -0.17728424072265625, -0.16135025024414062, -0.145416259765625, -0.12948226928710938, -0.11354827880859375, -0.09761428833007812, -0.0816802978515625, -0.06574630737304688, -0.04981231689453125, -0.033878326416015625, -0.0179443359375, -0.002010345458984375, 0.01392364501953125, 0.029857635498046875, 0.0457916259765625, 0.061725616455078125, 0.07765960693359375, 0.09359359741210938, 0.109527587890625, 0.12546157836914062, 0.14139556884765625, 0.15732955932617188, 0.1732635498046875, 0.18919754028320312, 0.20513153076171875, 0.22106552124023438, 0.23699951171875, 0.2529335021972656, 0.26886749267578125, 0.2848014831542969, 0.3007354736328125, 0.3166694641113281, 0.33260345458984375, 0.3485374450683594, 0.364471435546875, 0.3804054260253906, 0.39633941650390625, 0.4122734069824219, 0.4282073974609375, 0.4441413879394531, 0.46007537841796875, 0.4760093688964844, 0.491943359375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 7.0, 3.0, 10.0, 11.0, 13.0, 11.0, 16.0, 22.0, 32.0, 43.0, 19.0, 50.0, 45.0, 59.0, 53.0, 59.0, 65.0, 64.0, 53.0, 46.0, 44.0, 40.0, 41.0, 26.0, 31.0, 22.0, 20.0, 16.0, 19.0, 14.0, 8.0, 6.0, 8.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0003750324249267578, -0.00036242231726646423, -0.00034981220960617065, -0.0003372021019458771, -0.0003245919942855835, -0.0003119818866252899, -0.00029937177896499634, -0.00028676167130470276, -0.0002741515636444092, -0.0002615414559841156, -0.000248931348323822, -0.00023632124066352844, -0.00022371113300323486, -0.00021110102534294128, -0.0001984909176826477, -0.00018588081002235413, -0.00017327070236206055, -0.00016066059470176697, -0.0001480504870414734, -0.0001354403793811798, -0.00012283027172088623, -0.00011022016406059265, -9.761005640029907e-05, -8.499994874000549e-05, -7.238984107971191e-05, -5.9779733419418335e-05, -4.7169625759124756e-05, -3.455951809883118e-05, -2.1949410438537598e-05, -9.339302778244019e-06, 3.2708048820495605e-06, 1.588091254234314e-05, 2.849102020263672e-05, 4.11011278629303e-05, 5.371123552322388e-05, 6.632134318351746e-05, 7.893145084381104e-05, 9.154155850410461e-05, 0.0001041516661643982, 0.00011676177382469177, 0.00012937188148498535, 0.00014198198914527893, 0.0001545920968055725, 0.0001672022044658661, 0.00017981231212615967, 0.00019242241978645325, 0.00020503252744674683, 0.0002176426351070404, 0.00023025274276733398, 0.00024286285042762756, 0.00025547295808792114, 0.0002680830657482147, 0.0002806931734085083, 0.0002933032810688019, 0.00030591338872909546, 0.00031852349638938904, 0.0003311336040496826, 0.0003437437117099762, 0.0003563538193702698, 0.00036896392703056335, 0.00038157403469085693, 0.0003941841423511505, 0.0004067942500114441, 0.00041940435767173767, 0.00043201446533203125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 8.0, 6.0, 14.0, 9.0, 19.0, 27.0, 21.0, 32.0, 31.0, 41.0, 55.0, 74.0, 87.0, 136.0, 139.0, 224.0, 276.0, 429.0, 641.0, 1682.0, 740219.0, 301040.0, 1208.0, 556.0, 402.0, 285.0, 199.0, 170.0, 90.0, 93.0, 59.0, 60.0, 36.0, 52.0, 37.0, 25.0, 20.0, 14.0, 7.0, 3.0, 2.0, 6.0, 8.0, 1.0, 1.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.006404876708984375, -0.006190836429595947, -0.0059767961502075195, -0.005762755870819092, -0.005548715591430664, -0.005334675312042236, -0.005120635032653809, -0.004906594753265381, -0.004692554473876953, -0.004478514194488525, -0.004264473915100098, -0.00405043363571167, -0.003836393356323242, -0.0036223530769348145, -0.0034083127975463867, -0.003194272518157959, -0.0029802322387695312, -0.0027661919593811035, -0.0025521516799926758, -0.002338111400604248, -0.0021240711212158203, -0.0019100308418273926, -0.0016959905624389648, -0.0014819502830505371, -0.0012679100036621094, -0.0010538697242736816, -0.0008398294448852539, -0.0006257891654968262, -0.00041174888610839844, -0.0001977086067199707, 1.633167266845703e-05, 0.00023037195205688477, 0.0004444122314453125, 0.0006584525108337402, 0.000872492790222168, 0.0010865330696105957, 0.0013005733489990234, 0.0015146136283874512, 0.001728653907775879, 0.0019426941871643066, 0.0021567344665527344, 0.002370774745941162, 0.00258481502532959, 0.0027988553047180176, 0.0030128955841064453, 0.003226935863494873, 0.0034409761428833008, 0.0036550164222717285, 0.0038690567016601562, 0.004083096981048584, 0.004297137260437012, 0.0045111775398254395, 0.004725217819213867, 0.004939258098602295, 0.005153298377990723, 0.00536733865737915, 0.005581378936767578, 0.005795419216156006, 0.006009459495544434, 0.006223499774932861, 0.006437540054321289, 0.006651580333709717, 0.0068656206130981445, 0.007079660892486572, 0.007293701171875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 14.0, 109.0, 338.0, 352.0, 153.0, 40.0, 7.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008666588691994548, -0.0008439445518888533, -0.0008212301763705909, -0.0007985158590599895, -0.0007758014835417271, -0.0007530871662311256, -0.0007303728489205241, -0.0007076584734022617, -0.0006849440978839993, -0.0006622297805733979, -0.0006395154050551355, -0.000616801087744534, -0.0005940867122262716, -0.0005713723949156702, -0.0005486580776050687, -0.0005259437020868063, -0.0005032293847762048, -0.0004805150383617729, -0.00045780069194734097, -0.0004350863746367395, -0.0004123719991184771, -0.00038965768180787563, -0.0003669433353934437, -0.0003442289889790118, -0.00032151464256457984, -0.0002988002961501479, -0.000276085949735716, -0.00025337160332128406, -0.00023065727145876735, -0.00020794292504433542, -0.00018522859318181872, -0.0001625142467673868, -0.00013979995856061578, -0.00011708561214618385, -9.437127300770953e-05, -7.165693386923522e-05, -4.894258745480329e-05, -2.622824104037136e-05, -3.513909177854657e-06, 1.9200437236577272e-05, 4.19147836510092e-05, 6.462913006544113e-05, 8.734346920391545e-05, 0.00011005780834238976, 0.0001327721547568217, 0.00015548650117125362, 0.00017820083303377032, 0.00020091517944820225, 0.00022362952586263418, 0.0002463438722770661, 0.00026905821869149804, 0.0002917725360020995, 0.0003144869115203619, 0.0003372012288309634, 0.0003599155752453953, 0.00038262992165982723, 0.00040534426807425916, 0.0004280586144886911, 0.000450772960903123, 0.00047348730731755495, 0.0004962016246281564, 0.0005189160001464188, 0.0005416303174570203, 0.0005643446929752827, 0.0005870590102858841]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 12.0, 10.0, 11.0, 16.0, 16.0, 19.0, 22.0, 23.0, 29.0, 34.0, 35.0, 31.0, 42.0, 34.0, 32.0, 39.0, 37.0, 45.0, 36.0, 46.0, 40.0, 34.0, 48.0, 35.0, 34.0, 28.0, 29.0, 24.0, 23.0, 17.0, 12.0, 17.0, 16.0, 13.0, 8.0, 9.0, 5.0, 5.0, 3.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0002161264419555664, -0.00020975247025489807, -0.00020337849855422974, -0.0001970045268535614, -0.00019063055515289307, -0.00018425658345222473, -0.0001778826117515564, -0.00017150864005088806, -0.00016513466835021973, -0.0001587606966495514, -0.00015238672494888306, -0.00014601275324821472, -0.0001396387815475464, -0.00013326480984687805, -0.00012689083814620972, -0.00012051686644554138, -0.00011414289474487305, -0.00010776892304420471, -0.00010139495134353638, -9.502097964286804e-05, -8.864700794219971e-05, -8.227303624153137e-05, -7.589906454086304e-05, -6.95250928401947e-05, -6.315112113952637e-05, -5.677714943885803e-05, -5.04031777381897e-05, -4.402920603752136e-05, -3.765523433685303e-05, -3.128126263618469e-05, -2.4907290935516357e-05, -1.8533319234848022e-05, -1.2159347534179688e-05, -5.7853758335113525e-06, 5.885958671569824e-07, 6.962567567825317e-06, 1.3336539268493652e-05, 1.9710510969161987e-05, 2.6084482669830322e-05, 3.245845437049866e-05, 3.883242607116699e-05, 4.520639777183533e-05, 5.158036947250366e-05, 5.7954341173172e-05, 6.432831287384033e-05, 7.070228457450867e-05, 7.7076256275177e-05, 8.345022797584534e-05, 8.982419967651367e-05, 9.619817137718201e-05, 0.00010257214307785034, 0.00010894611477851868, 0.00011532008647918701, 0.00012169405817985535, 0.00012806802988052368, 0.00013444200158119202, 0.00014081597328186035, 0.0001471899449825287, 0.00015356391668319702, 0.00015993788838386536, 0.0001663118600845337, 0.00017268583178520203, 0.00017905980348587036, 0.0001854337751865387, 0.00019180774688720703]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 5.0, 6.0, 10.0, 10.0, 12.0, 19.0, 18.0, 22.0, 22.0, 27.0, 25.0, 23.0, 34.0, 50.0, 36.0, 34.0, 39.0, 42.0, 66.0, 37.0, 48.0, 46.0, 34.0, 28.0, 39.0, 30.0, 28.0, 35.0, 19.0, 24.0, 19.0, 23.0, 20.0, 12.0, 9.0, 7.0, 6.0, 8.0, 4.0, 2.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.703125, -2.61004638671875, -2.5169677734375, -2.42388916015625, -2.330810546875, -2.23773193359375, -2.1446533203125, -2.05157470703125, -1.95849609375, -1.86541748046875, -1.7723388671875, -1.67926025390625, -1.586181640625, -1.49310302734375, -1.4000244140625, -1.30694580078125, -1.2138671875, -1.12078857421875, -1.0277099609375, -0.93463134765625, -0.841552734375, -0.74847412109375, -0.6553955078125, -0.56231689453125, -0.46923828125, -0.37615966796875, -0.2830810546875, -0.19000244140625, -0.096923828125, -0.00384521484375, 0.0892333984375, 0.18231201171875, 0.275390625, 0.36846923828125, 0.4615478515625, 0.55462646484375, 0.647705078125, 0.74078369140625, 0.8338623046875, 0.92694091796875, 1.02001953125, 1.11309814453125, 1.2061767578125, 1.29925537109375, 1.392333984375, 1.48541259765625, 1.5784912109375, 1.67156982421875, 1.7646484375, 1.85772705078125, 1.9508056640625, 2.04388427734375, 2.136962890625, 2.23004150390625, 2.3231201171875, 2.41619873046875, 2.50927734375, 2.60235595703125, 2.6954345703125, 2.78851318359375, 2.881591796875, 2.97467041015625, 3.0677490234375, 3.16082763671875, 3.25390625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 15.0, 7.0, 6.0, 15.0, 22.0, 27.0, 42.0, 49.0, 77.0, 80.0, 118.0, 158.0, 216.0, 287.0, 391.0, 525.0, 690.0, 959.0, 1416.0, 1998.0, 2914.0, 4560.0, 8134.0, 18683.0, 74228.0, 524615.0, 328589.0, 45808.0, 14245.0, 6803.0, 3938.0, 2528.0, 1769.0, 1258.0, 875.0, 686.0, 433.0, 372.0, 259.0, 207.0, 137.0, 104.0, 73.0, 59.0, 49.0, 34.0, 30.0, 23.0, 16.0, 9.0, 7.0, 9.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0], "bins": [-12.0859375, -11.70654296875, -11.3271484375, -10.94775390625, -10.568359375, -10.18896484375, -9.8095703125, -9.43017578125, -9.05078125, -8.67138671875, -8.2919921875, -7.91259765625, -7.533203125, -7.15380859375, -6.7744140625, -6.39501953125, -6.015625, -5.63623046875, -5.2568359375, -4.87744140625, -4.498046875, -4.11865234375, -3.7392578125, -3.35986328125, -2.98046875, -2.60107421875, -2.2216796875, -1.84228515625, -1.462890625, -1.08349609375, -0.7041015625, -0.32470703125, 0.0546875, 0.43408203125, 0.8134765625, 1.19287109375, 1.572265625, 1.95166015625, 2.3310546875, 2.71044921875, 3.08984375, 3.46923828125, 3.8486328125, 4.22802734375, 4.607421875, 4.98681640625, 5.3662109375, 5.74560546875, 6.125, 6.50439453125, 6.8837890625, 7.26318359375, 7.642578125, 8.02197265625, 8.4013671875, 8.78076171875, 9.16015625, 9.53955078125, 9.9189453125, 10.29833984375, 10.677734375, 11.05712890625, 11.4365234375, 11.81591796875, 12.1953125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 8.0, 4.0, 8.0, 8.0, 15.0, 6.0, 15.0, 19.0, 17.0, 17.0, 12.0, 29.0, 31.0, 26.0, 27.0, 28.0, 42.0, 51.0, 79.0, 126.0, 216.0, 1334.0, 254.0, 169.0, 81.0, 69.0, 54.0, 44.0, 33.0, 34.0, 25.0, 32.0, 17.0, 25.0, 16.0, 14.0, 12.0, 8.0, 10.0, 8.0, 3.0, 4.0, 8.0, 0.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-10.0078125, -9.73602294921875, -9.4642333984375, -9.19244384765625, -8.920654296875, -8.64886474609375, -8.3770751953125, -8.10528564453125, -7.83349609375, -7.56170654296875, -7.2899169921875, -7.01812744140625, -6.746337890625, -6.47454833984375, -6.2027587890625, -5.93096923828125, -5.6591796875, -5.38739013671875, -5.1156005859375, -4.84381103515625, -4.572021484375, -4.30023193359375, -4.0284423828125, -3.75665283203125, -3.48486328125, -3.21307373046875, -2.9412841796875, -2.66949462890625, -2.397705078125, -2.12591552734375, -1.8541259765625, -1.58233642578125, -1.310546875, -1.03875732421875, -0.7669677734375, -0.49517822265625, -0.223388671875, 0.04840087890625, 0.3201904296875, 0.59197998046875, 0.86376953125, 1.13555908203125, 1.4073486328125, 1.67913818359375, 1.950927734375, 2.22271728515625, 2.4945068359375, 2.76629638671875, 3.0380859375, 3.30987548828125, 3.5816650390625, 3.85345458984375, 4.125244140625, 4.39703369140625, 4.6688232421875, 4.94061279296875, 5.21240234375, 5.48419189453125, 5.7559814453125, 6.02777099609375, 6.299560546875, 6.57135009765625, 6.8431396484375, 7.11492919921875, 7.38671875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 1.0, 11.0, 12.0, 9.0, 20.0, 29.0, 21.0, 24.0, 27.0, 40.0, 46.0, 74.0, 145.0, 273.0, 705.0, 3459.0, 1715582.0, 1420627.0, 3054.0, 738.0, 287.0, 121.0, 79.0, 51.0, 33.0, 36.0, 29.0, 22.0, 31.0, 17.0, 14.0, 12.0, 10.0, 12.0, 6.0, 4.0, 7.0, 7.0, 2.0, 3.0, 3.0, 4.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.515625, -29.385009765625, -28.25439453125, -27.123779296875, -25.9931640625, -24.862548828125, -23.73193359375, -22.601318359375, -21.470703125, -20.340087890625, -19.20947265625, -18.078857421875, -16.9482421875, -15.817626953125, -14.68701171875, -13.556396484375, -12.42578125, -11.295166015625, -10.16455078125, -9.033935546875, -7.9033203125, -6.772705078125, -5.64208984375, -4.511474609375, -3.380859375, -2.250244140625, -1.11962890625, 0.010986328125, 1.1416015625, 2.272216796875, 3.40283203125, 4.533447265625, 5.6640625, 6.794677734375, 7.92529296875, 9.055908203125, 10.1865234375, 11.317138671875, 12.44775390625, 13.578369140625, 14.708984375, 15.839599609375, 16.97021484375, 18.100830078125, 19.2314453125, 20.362060546875, 21.49267578125, 22.623291015625, 23.75390625, 24.884521484375, 26.01513671875, 27.145751953125, 28.2763671875, 29.406982421875, 30.53759765625, 31.668212890625, 32.798828125, 33.929443359375, 35.06005859375, 36.190673828125, 37.3212890625, 38.451904296875, 39.58251953125, 40.713134765625, 41.84375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 7.0, 995.0, 14.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-165.60826110839844, -154.34991455078125, -143.09158325195312, -131.83323669433594, -120.57490539550781, -109.31655883789062, -98.05821990966797, -86.79988098144531, -75.54154205322266, -64.283203125, -53.024864196777344, -41.76652145385742, -30.508182525634766, -19.24984359741211, -7.9915008544921875, 3.2668380737304688, 14.525177001953125, 25.78351593017578, 37.04185485839844, 48.30019760131836, 59.558536529541016, 70.81687927246094, 82.0752182006836, 93.33355712890625, 104.5918960571289, 115.85023498535156, 127.10857391357422, 138.36691284179688, 149.62525939941406, 160.8835906982422, 172.14193725585938, 183.4002685546875, 194.65859985351562, 205.9169464111328, 217.17527770996094, 228.43362426757812, 239.69195556640625, 250.95030212402344, 262.2086486816406, 273.46697998046875, 284.7253112792969, 295.983642578125, 307.24200439453125, 318.5003356933594, 329.7586669921875, 341.0169982910156, 352.2753601074219, 363.53369140625, 374.79205322265625, 386.0503845214844, 397.3087463378906, 408.56707763671875, 419.8254089355469, 431.083740234375, 442.34210205078125, 453.6004333496094, 464.8587646484375, 476.1170959472656, 487.3754577636719, 498.6337890625, 509.8921203613281, 521.1504516601562, 532.4088134765625, 543.6671142578125, 554.9254760742188]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 9.0, 6.0, 6.0, 13.0, 12.0, 15.0, 22.0, 21.0, 23.0, 25.0, 16.0, 26.0, 27.0, 32.0, 41.0, 23.0, 42.0, 40.0, 51.0, 31.0, 37.0, 46.0, 48.0, 36.0, 36.0, 38.0, 39.0, 34.0, 29.0, 15.0, 25.0, 24.0, 13.0, 14.0, 13.0, 13.0, 15.0, 11.0, 6.0, 6.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.403093338012695, -29.32271385192871, -28.242334365844727, -27.161954879760742, -26.081575393676758, -25.001195907592773, -23.92081642150879, -22.840436935424805, -21.76005744934082, -20.679677963256836, -19.59929847717285, -18.518918991088867, -17.438539505004883, -16.3581600189209, -15.277780532836914, -14.19740104675293, -13.117021560668945, -12.036642074584961, -10.956262588500977, -9.875883102416992, -8.795503616333008, -7.715124130249023, -6.634744644165039, -5.554365158081055, -4.47398567199707, -3.393606185913086, -2.3132266998291016, -1.2328472137451172, -0.1524677276611328, 0.9279117584228516, 2.008291244506836, 3.0886707305908203, 4.1690521240234375, 5.249431610107422, 6.329811096191406, 7.410190582275391, 8.490570068359375, 9.57094955444336, 10.651329040527344, 11.731708526611328, 12.812088012695312, 13.892467498779297, 14.972846984863281, 16.053226470947266, 17.13360595703125, 18.213985443115234, 19.29436492919922, 20.374744415283203, 21.455123901367188, 22.535503387451172, 23.615882873535156, 24.69626235961914, 25.776641845703125, 26.85702133178711, 27.937400817871094, 29.017780303955078, 30.098159790039062, 31.178539276123047, 32.25891876220703, 33.339298248291016, 34.419677734375, 35.500057220458984, 36.58043670654297, 37.66081619262695, 38.74119567871094]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 7.0, 4.0, 6.0, 4.0, 6.0, 9.0, 7.0, 19.0, 14.0, 19.0, 19.0, 31.0, 27.0, 20.0, 35.0, 38.0, 36.0, 41.0, 51.0, 43.0, 45.0, 55.0, 40.0, 31.0, 50.0, 35.0, 33.0, 36.0, 33.0, 43.0, 19.0, 26.0, 20.0, 23.0, 16.0, 15.0, 5.0, 14.0, 8.0, 1.0, 6.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.98828125, -2.883819580078125, -2.77935791015625, -2.674896240234375, -2.5704345703125, -2.465972900390625, -2.36151123046875, -2.257049560546875, -2.152587890625, -2.048126220703125, -1.94366455078125, -1.839202880859375, -1.7347412109375, -1.630279541015625, -1.52581787109375, -1.421356201171875, -1.31689453125, -1.212432861328125, -1.10797119140625, -1.003509521484375, -0.8990478515625, -0.794586181640625, -0.69012451171875, -0.585662841796875, -0.481201171875, -0.376739501953125, -0.27227783203125, -0.167816162109375, -0.0633544921875, 0.041107177734375, 0.14556884765625, 0.250030517578125, 0.3544921875, 0.458953857421875, 0.56341552734375, 0.667877197265625, 0.7723388671875, 0.876800537109375, 0.98126220703125, 1.085723876953125, 1.190185546875, 1.294647216796875, 1.39910888671875, 1.503570556640625, 1.6080322265625, 1.712493896484375, 1.81695556640625, 1.921417236328125, 2.02587890625, 2.130340576171875, 2.23480224609375, 2.339263916015625, 2.4437255859375, 2.548187255859375, 2.65264892578125, 2.757110595703125, 2.861572265625, 2.966033935546875, 3.07049560546875, 3.174957275390625, 3.2794189453125, 3.383880615234375, 3.48834228515625, 3.592803955078125, 3.697265625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 8.0, 14.0, 20.0, 22.0, 24.0, 25.0, 36.0, 62.0, 85.0, 113.0, 152.0, 223.0, 379.0, 545.0, 939.0, 1706.0, 3381.0, 7613.0, 20143.0, 80579.0, 767996.0, 2834246.0, 392817.0, 54125.0, 15548.0, 6358.0, 2947.0, 1597.0, 865.0, 552.0, 338.0, 223.0, 161.0, 120.0, 76.0, 59.0, 38.0, 41.0, 24.0, 15.0, 16.0, 10.0, 15.0, 5.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-12.7890625, -12.39404296875, -11.9990234375, -11.60400390625, -11.208984375, -10.81396484375, -10.4189453125, -10.02392578125, -9.62890625, -9.23388671875, -8.8388671875, -8.44384765625, -8.048828125, -7.65380859375, -7.2587890625, -6.86376953125, -6.46875, -6.07373046875, -5.6787109375, -5.28369140625, -4.888671875, -4.49365234375, -4.0986328125, -3.70361328125, -3.30859375, -2.91357421875, -2.5185546875, -2.12353515625, -1.728515625, -1.33349609375, -0.9384765625, -0.54345703125, -0.1484375, 0.24658203125, 0.6416015625, 1.03662109375, 1.431640625, 1.82666015625, 2.2216796875, 2.61669921875, 3.01171875, 3.40673828125, 3.8017578125, 4.19677734375, 4.591796875, 4.98681640625, 5.3818359375, 5.77685546875, 6.171875, 6.56689453125, 6.9619140625, 7.35693359375, 7.751953125, 8.14697265625, 8.5419921875, 8.93701171875, 9.33203125, 9.72705078125, 10.1220703125, 10.51708984375, 10.912109375, 11.30712890625, 11.7021484375, 12.09716796875, 12.4921875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 10.0, 17.0, 19.0, 34.0, 38.0, 53.0, 92.0, 115.0, 157.0, 254.0, 329.0, 441.0, 575.0, 510.0, 425.0, 325.0, 223.0, 112.0, 107.0, 82.0, 47.0, 34.0, 21.0, 15.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.4375, -17.96337890625, -17.4892578125, -17.01513671875, -16.541015625, -16.06689453125, -15.5927734375, -15.11865234375, -14.64453125, -14.17041015625, -13.6962890625, -13.22216796875, -12.748046875, -12.27392578125, -11.7998046875, -11.32568359375, -10.8515625, -10.37744140625, -9.9033203125, -9.42919921875, -8.955078125, -8.48095703125, -8.0068359375, -7.53271484375, -7.05859375, -6.58447265625, -6.1103515625, -5.63623046875, -5.162109375, -4.68798828125, -4.2138671875, -3.73974609375, -3.265625, -2.79150390625, -2.3173828125, -1.84326171875, -1.369140625, -0.89501953125, -0.4208984375, 0.05322265625, 0.52734375, 1.00146484375, 1.4755859375, 1.94970703125, 2.423828125, 2.89794921875, 3.3720703125, 3.84619140625, 4.3203125, 4.79443359375, 5.2685546875, 5.74267578125, 6.216796875, 6.69091796875, 7.1650390625, 7.63916015625, 8.11328125, 8.58740234375, 9.0615234375, 9.53564453125, 10.009765625, 10.48388671875, 10.9580078125, 11.43212890625, 11.90625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 8.0, 2.0, 5.0, 10.0, 18.0, 11.0, 15.0, 36.0, 28.0, 48.0, 57.0, 84.0, 135.0, 223.0, 462.0, 1715.0, 30783.0, 3972984.0, 183463.0, 2806.0, 617.0, 275.0, 167.0, 91.0, 78.0, 46.0, 39.0, 22.0, 13.0, 10.0, 13.0, 3.0, 5.0, 6.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -33.919921875, -32.27734375, -30.634765625, -28.9921875, -27.349609375, -25.70703125, -24.064453125, -22.421875, -20.779296875, -19.13671875, -17.494140625, -15.8515625, -14.208984375, -12.56640625, -10.923828125, -9.28125, -7.638671875, -5.99609375, -4.353515625, -2.7109375, -1.068359375, 0.57421875, 2.216796875, 3.859375, 5.501953125, 7.14453125, 8.787109375, 10.4296875, 12.072265625, 13.71484375, 15.357421875, 17.0, 18.642578125, 20.28515625, 21.927734375, 23.5703125, 25.212890625, 26.85546875, 28.498046875, 30.140625, 31.783203125, 33.42578125, 35.068359375, 36.7109375, 38.353515625, 39.99609375, 41.638671875, 43.28125, 44.923828125, 46.56640625, 48.208984375, 49.8515625, 51.494140625, 53.13671875, 54.779296875, 56.421875, 58.064453125, 59.70703125, 61.349609375, 62.9921875, 64.634765625, 66.27734375, 67.919921875, 69.5625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 212.0, 719.0, 81.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.40779876708984, -74.5325927734375, -65.65739440917969, -56.78219223022461, -47.90699005126953, -39.03178787231445, -30.156585693359375, -21.281383514404297, -12.406181335449219, -3.5309791564941406, 5.3442230224609375, 14.219425201416016, 23.094627380371094, 31.969829559326172, 40.84503173828125, 49.72023391723633, 58.595436096191406, 67.47064208984375, 76.34584045410156, 85.22103881835938, 94.09624481201172, 102.97145080566406, 111.84664916992188, 120.72184753417969, 129.5970458984375, 138.4722442626953, 147.34744262695312, 156.22265625, 165.0978546142578, 173.97305297851562, 182.8482666015625, 191.7234649658203, 200.59866333007812, 209.47386169433594, 218.34906005859375, 227.22427368164062, 236.09947204589844, 244.97467041015625, 253.84988403320312, 262.7250671386719, 271.60028076171875, 280.4754943847656, 289.3506774902344, 298.22589111328125, 307.10107421875, 315.9762878417969, 324.85150146484375, 333.7266845703125, 342.6018981933594, 351.47711181640625, 360.352294921875, 369.2275085449219, 378.10272216796875, 386.9779052734375, 395.8531188964844, 404.7283020019531, 413.603515625, 422.4787292480469, 431.3539123535156, 440.2291259765625, 449.10430908203125, 457.9795227050781, 466.854736328125, 475.72991943359375, 484.6051330566406]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 1.0, 6.0, 10.0, 12.0, 14.0, 7.0, 14.0, 17.0, 18.0, 22.0, 24.0, 24.0, 27.0, 35.0, 36.0, 36.0, 39.0, 45.0, 37.0, 31.0, 37.0, 41.0, 26.0, 29.0, 37.0, 44.0, 43.0, 28.0, 28.0, 30.0, 31.0, 22.0, 21.0, 20.0, 22.0, 12.0, 12.0, 13.0, 6.0, 11.0, 6.0, 7.0, 7.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.00556182861328, -37.77153396606445, -36.53750228881836, -35.30347442626953, -34.06944274902344, -32.83541488647461, -31.60138511657715, -30.367355346679688, -29.133325576782227, -27.899295806884766, -26.665266036987305, -25.431236267089844, -24.197208404541016, -22.963176727294922, -21.729148864746094, -20.495119094848633, -19.261089324951172, -18.02705955505371, -16.79302978515625, -15.559000968933105, -14.324971199035645, -13.090941429138184, -11.856912612915039, -10.622882843017578, -9.388853073120117, -8.154823303222656, -6.9207940101623535, -5.686764717102051, -4.45273494720459, -3.218705177307129, -1.9846758842468262, -0.7506465911865234, 0.4833831787109375, 1.7174127101898193, 2.951442241668701, 4.185471534729004, 5.419501304626465, 6.653531074523926, 7.8875603675842285, 9.121589660644531, 10.355619430541992, 11.589649200439453, 12.823678970336914, 14.057707786560059, 15.29173755645752, 16.525768280029297, 17.759796142578125, 18.993825912475586, 20.227855682373047, 21.461885452270508, 22.69591522216797, 23.92994499206543, 25.16397476196289, 26.39800262451172, 27.63203239440918, 28.86606216430664, 30.1000919342041, 31.334121704101562, 32.56814956665039, 33.802181243896484, 35.03620910644531, 36.270240783691406, 37.504268646240234, 38.73829650878906, 39.972328186035156]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 7.0, 10.0, 13.0, 16.0, 17.0, 14.0, 18.0, 33.0, 18.0, 20.0, 31.0, 29.0, 22.0, 35.0, 45.0, 50.0, 40.0, 45.0, 42.0, 36.0, 41.0, 24.0, 34.0, 23.0, 35.0, 28.0, 36.0, 29.0, 32.0, 22.0, 15.0, 24.0, 12.0, 13.0, 9.0, 12.0, 9.0, 10.0, 7.0, 5.0, 3.0, 0.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.115234375, -3.020172119140625, -2.92510986328125, -2.830047607421875, -2.7349853515625, -2.639923095703125, -2.54486083984375, -2.449798583984375, -2.354736328125, -2.259674072265625, -2.16461181640625, -2.069549560546875, -1.9744873046875, -1.879425048828125, -1.78436279296875, -1.689300537109375, -1.59423828125, -1.499176025390625, -1.40411376953125, -1.309051513671875, -1.2139892578125, -1.118927001953125, -1.02386474609375, -0.928802490234375, -0.833740234375, -0.738677978515625, -0.64361572265625, -0.548553466796875, -0.4534912109375, -0.358428955078125, -0.26336669921875, -0.168304443359375, -0.0732421875, 0.021820068359375, 0.11688232421875, 0.211944580078125, 0.3070068359375, 0.402069091796875, 0.49713134765625, 0.592193603515625, 0.687255859375, 0.782318115234375, 0.87738037109375, 0.972442626953125, 1.0675048828125, 1.162567138671875, 1.25762939453125, 1.352691650390625, 1.44775390625, 1.542816162109375, 1.63787841796875, 1.732940673828125, 1.8280029296875, 1.923065185546875, 2.01812744140625, 2.113189697265625, 2.208251953125, 2.303314208984375, 2.39837646484375, 2.493438720703125, 2.5885009765625, 2.683563232421875, 2.77862548828125, 2.873687744140625, 2.96875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 6.0, 11.0, 23.0, 24.0, 39.0, 60.0, 61.0, 90.0, 144.0, 177.0, 305.0, 364.0, 604.0, 820.0, 1177.0, 1616.0, 2455.0, 3547.0, 5150.0, 7467.0, 11074.0, 16508.0, 24536.0, 37284.0, 60119.0, 101381.0, 196629.0, 246265.0, 126017.0, 72019.0, 44424.0, 28772.0, 19034.0, 12721.0, 8665.0, 5893.0, 3987.0, 2762.0, 1908.0, 1372.0, 913.0, 657.0, 431.0, 342.0, 207.0, 156.0, 105.0, 73.0, 51.0, 29.0, 30.0, 21.0, 16.0, 11.0, 4.0, 4.0, 2.0, 3.0], "bins": [-0.57568359375, -0.5583343505859375, -0.540985107421875, -0.5236358642578125, -0.50628662109375, -0.4889373779296875, -0.471588134765625, -0.4542388916015625, -0.4368896484375, -0.4195404052734375, -0.402191162109375, -0.3848419189453125, -0.36749267578125, -0.3501434326171875, -0.332794189453125, -0.3154449462890625, -0.298095703125, -0.2807464599609375, -0.263397216796875, -0.2460479736328125, -0.22869873046875, -0.2113494873046875, -0.194000244140625, -0.1766510009765625, -0.1593017578125, -0.1419525146484375, -0.124603271484375, -0.1072540283203125, -0.08990478515625, -0.0725555419921875, -0.055206298828125, -0.0378570556640625, -0.0205078125, -0.0031585693359375, 0.014190673828125, 0.0315399169921875, 0.04888916015625, 0.0662384033203125, 0.083587646484375, 0.1009368896484375, 0.1182861328125, 0.1356353759765625, 0.152984619140625, 0.1703338623046875, 0.18768310546875, 0.2050323486328125, 0.222381591796875, 0.2397308349609375, 0.257080078125, 0.2744293212890625, 0.291778564453125, 0.3091278076171875, 0.32647705078125, 0.3438262939453125, 0.361175537109375, 0.3785247802734375, 0.3958740234375, 0.4132232666015625, 0.430572509765625, 0.4479217529296875, 0.46527099609375, 0.4826202392578125, 0.499969482421875, 0.5173187255859375, 0.53466796875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 2.0, 4.0, 8.0, 11.0, 9.0, 9.0, 12.0, 17.0, 18.0, 26.0, 12.0, 22.0, 26.0, 32.0, 32.0, 31.0, 32.0, 37.0, 36.0, 45.0, 43.0, 1069.0, 34.0, 46.0, 35.0, 32.0, 40.0, 44.0, 20.0, 30.0, 25.0, 29.0, 24.0, 22.0, 18.0, 21.0, 11.0, 13.0, 11.0, 8.0, 9.0, 7.0, 7.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.115234375, -2.048980712890625, -1.98272705078125, -1.916473388671875, -1.8502197265625, -1.783966064453125, -1.71771240234375, -1.651458740234375, -1.585205078125, -1.518951416015625, -1.45269775390625, -1.386444091796875, -1.3201904296875, -1.253936767578125, -1.18768310546875, -1.121429443359375, -1.05517578125, -0.988922119140625, -0.92266845703125, -0.856414794921875, -0.7901611328125, -0.723907470703125, -0.65765380859375, -0.591400146484375, -0.525146484375, -0.458892822265625, -0.39263916015625, -0.326385498046875, -0.2601318359375, -0.193878173828125, -0.12762451171875, -0.061370849609375, 0.0048828125, 0.071136474609375, 0.13739013671875, 0.203643798828125, 0.2698974609375, 0.336151123046875, 0.40240478515625, 0.468658447265625, 0.534912109375, 0.601165771484375, 0.66741943359375, 0.733673095703125, 0.7999267578125, 0.866180419921875, 0.93243408203125, 0.998687744140625, 1.06494140625, 1.131195068359375, 1.19744873046875, 1.263702392578125, 1.3299560546875, 1.396209716796875, 1.46246337890625, 1.528717041015625, 1.594970703125, 1.661224365234375, 1.72747802734375, 1.793731689453125, 1.8599853515625, 1.926239013671875, 1.99249267578125, 2.058746337890625, 2.125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 12.0, 14.0, 20.0, 36.0, 43.0, 57.0, 97.0, 103.0, 161.0, 238.0, 297.0, 508.0, 679.0, 1033.0, 1518.0, 2183.0, 3437.0, 5009.0, 7887.0, 12434.0, 19109.0, 31127.0, 50550.0, 87443.0, 171097.0, 1331590.0, 158034.0, 82435.0, 47741.0, 29323.0, 18852.0, 11526.0, 7760.0, 4825.0, 3181.0, 2178.0, 1412.0, 982.0, 652.0, 463.0, 332.0, 232.0, 154.0, 105.0, 64.0, 59.0, 43.0, 32.0, 20.0, 15.0, 10.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-0.56982421875, -0.5517044067382812, -0.5335845947265625, -0.5154647827148438, -0.497344970703125, -0.47922515869140625, -0.4611053466796875, -0.44298553466796875, -0.42486572265625, -0.40674591064453125, -0.3886260986328125, -0.37050628662109375, -0.352386474609375, -0.33426666259765625, -0.3161468505859375, -0.29802703857421875, -0.2799072265625, -0.26178741455078125, -0.2436676025390625, -0.22554779052734375, -0.207427978515625, -0.18930816650390625, -0.1711883544921875, -0.15306854248046875, -0.13494873046875, -0.11682891845703125, -0.0987091064453125, -0.08058929443359375, -0.062469482421875, -0.04434967041015625, -0.0262298583984375, -0.00811004638671875, 0.010009765625, 0.02812957763671875, 0.0462493896484375, 0.06436920166015625, 0.082489013671875, 0.10060882568359375, 0.1187286376953125, 0.13684844970703125, 0.15496826171875, 0.17308807373046875, 0.1912078857421875, 0.20932769775390625, 0.227447509765625, 0.24556732177734375, 0.2636871337890625, 0.28180694580078125, 0.2999267578125, 0.31804656982421875, 0.3361663818359375, 0.35428619384765625, 0.372406005859375, 0.39052581787109375, 0.4086456298828125, 0.42676544189453125, 0.44488525390625, 0.46300506591796875, 0.4811248779296875, 0.49924468994140625, 0.517364501953125, 0.5354843139648438, 0.5536041259765625, 0.5717239379882812, 0.58984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 4.0, 2.0, 4.0, 6.0, 2.0, 7.0, 3.0, 10.0, 10.0, 7.0, 23.0, 13.0, 19.0, 17.0, 17.0, 32.0, 22.0, 41.0, 41.0, 52.0, 57.0, 67.0, 57.0, 70.0, 61.0, 58.0, 38.0, 48.0, 36.0, 30.0, 23.0, 28.0, 17.0, 11.0, 15.0, 11.0, 10.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004892349243164062, -0.00047062337398529053, -0.0004520118236541748, -0.0004334002733230591, -0.00041478872299194336, -0.00039617717266082764, -0.0003775656223297119, -0.0003589540719985962, -0.00034034252166748047, -0.00032173097133636475, -0.000303119421005249, -0.0002845078706741333, -0.0002658963203430176, -0.00024728477001190186, -0.00022867321968078613, -0.0002100616693496704, -0.0001914501190185547, -0.00017283856868743896, -0.00015422701835632324, -0.00013561546802520752, -0.0001170039176940918, -9.839236736297607e-05, -7.978081703186035e-05, -6.116926670074463e-05, -4.2557716369628906e-05, -2.3946166038513184e-05, -5.334615707397461e-06, 1.3276934623718262e-05, 3.1888484954833984e-05, 5.050003528594971e-05, 6.911158561706543e-05, 8.772313594818115e-05, 0.00010633468627929688, 0.0001249462366104126, 0.00014355778694152832, 0.00016216933727264404, 0.00018078088760375977, 0.0001993924379348755, 0.0002180039882659912, 0.00023661553859710693, 0.00025522708892822266, 0.0002738386392593384, 0.0002924501895904541, 0.0003110617399215698, 0.00032967329025268555, 0.00034828484058380127, 0.000366896390914917, 0.0003855079412460327, 0.00040411949157714844, 0.00042273104190826416, 0.0004413425922393799, 0.0004599541425704956, 0.00047856569290161133, 0.000497177243232727, 0.0005157887935638428, 0.0005344003438949585, 0.0005530118942260742, 0.0005716234445571899, 0.0005902349948883057, 0.0006088465452194214, 0.0006274580955505371, 0.0006460696458816528, 0.0006646811962127686, 0.0006832927465438843, 0.000701904296875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 2.0, 10.0, 8.0, 18.0, 16.0, 16.0, 21.0, 23.0, 61.0, 51.0, 79.0, 98.0, 107.0, 175.0, 289.0, 534.0, 1547.0, 982296.0, 61093.0, 845.0, 421.0, 245.0, 125.0, 118.0, 55.0, 69.0, 46.0, 28.0, 19.0, 24.0, 31.0, 16.0, 10.0, 15.0, 9.0, 6.0, 2.0, 5.0, 5.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.01442718505859375, -0.014024138450622559, -0.013621091842651367, -0.013218045234680176, -0.012814998626708984, -0.012411952018737793, -0.012008905410766602, -0.01160585880279541, -0.011202812194824219, -0.010799765586853027, -0.010396718978881836, -0.009993672370910645, -0.009590625762939453, -0.009187579154968262, -0.00878453254699707, -0.008381485939025879, -0.007978439331054688, -0.007575392723083496, -0.007172346115112305, -0.006769299507141113, -0.006366252899169922, -0.0059632062911987305, -0.005560159683227539, -0.005157113075256348, -0.004754066467285156, -0.004351019859313965, -0.0039479732513427734, -0.003544926643371582, -0.0031418800354003906, -0.0027388334274291992, -0.002335786819458008, -0.0019327402114868164, -0.001529693603515625, -0.0011266469955444336, -0.0007236003875732422, -0.0003205537796020508, 8.249282836914062e-05, 0.00048553943634033203, 0.0008885860443115234, 0.0012916326522827148, 0.0016946792602539062, 0.0020977258682250977, 0.002500772476196289, 0.0029038190841674805, 0.003306865692138672, 0.0037099123001098633, 0.004112958908081055, 0.004516005516052246, 0.0049190521240234375, 0.005322098731994629, 0.00572514533996582, 0.006128191947937012, 0.006531238555908203, 0.0069342851638793945, 0.007337331771850586, 0.007740378379821777, 0.008143424987792969, 0.00854647159576416, 0.008949518203735352, 0.009352564811706543, 0.009755611419677734, 0.010158658027648926, 0.010561704635620117, 0.010964751243591309, 0.0113677978515625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 19.0, 223.0, 586.0, 175.0, 12.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001708584139123559, -0.001652475562877953, -0.001596366986632347, -0.0015402584103867412, -0.0014841498341411352, -0.0014280412578955293, -0.0013719326816499233, -0.0013158239889889956, -0.0012597155291587114, -0.0012036069529131055, -0.0011474983766674995, -0.0010913898004218936, -0.0010352812241762877, -0.0009791726479306817, -0.0009230640134774148, -0.0008669554372318089, -0.000810846802778542, -0.0007547382265329361, -0.0006986296502873302, -0.0006425210740417242, -0.0005864124977961183, -0.0005303039215505123, -0.00047419528709724545, -0.0004180867108516395, -0.00036197813460603356, -0.0003058695583604276, -0.00024976098211482167, -0.00019365237676538527, -0.00013754380051977932, -8.143522427417338e-05, -2.5326618924736977e-05, 3.078195732086897e-05, 8.689064998179674e-05, 0.0001429992262274027, 0.00019910781702492386, 0.00025521640782244503, 0.000311324984068051, 0.0003674335603136569, 0.00042354216566309333, 0.0004796507419086993, 0.0005357593181543052, 0.0005918678943999112, 0.0006479764706455171, 0.000704085105098784, 0.0007601936813443899, 0.0008163022575899959, 0.0008724108338356018, 0.0009285194100812078, 0.0009846279863268137, 0.0010407365625724196, 0.0010968451388180256, 0.0011529537150636315, 0.0012090622913092375, 0.0012651708675548434, 0.0013212794438004494, 0.0013773881364613771, 0.0014334965962916613, 0.0014896051725372672, 0.0015457137487828732, 0.001601822325028479, 0.001657930901274085, 0.001714039477519691, 0.001770148053765297, 0.0018262567464262247, 0.0018823653226718307]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 3.0, 4.0, 4.0, 3.0, 7.0, 12.0, 11.0, 17.0, 14.0, 14.0, 16.0, 25.0, 19.0, 21.0, 27.0, 40.0, 39.0, 35.0, 35.0, 39.0, 50.0, 41.0, 54.0, 38.0, 40.0, 47.0, 36.0, 30.0, 45.0, 39.0, 31.0, 31.0, 21.0, 25.0, 13.0, 16.0, 12.0, 8.0, 10.0, 9.0, 6.0, 4.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003325939178466797, -0.0003217337653040886, -0.0003108736127614975, -0.0003000134602189064, -0.0002891533076763153, -0.0002782931551337242, -0.0002674330025911331, -0.000256572850048542, -0.00024571269750595093, -0.00023485254496335983, -0.00022399239242076874, -0.00021313223987817764, -0.00020227208733558655, -0.00019141193479299545, -0.00018055178225040436, -0.00016969162970781326, -0.00015883147716522217, -0.00014797132462263107, -0.00013711117208003998, -0.00012625101953744888, -0.00011539086699485779, -0.00010453071445226669, -9.36705619096756e-05, -8.28104093670845e-05, -7.195025682449341e-05, -6.109010428190231e-05, -5.022995173931122e-05, -3.936979919672012e-05, -2.850964665412903e-05, -1.7649494111537933e-05, -6.789341568946838e-06, 4.070810973644257e-06, 1.4930963516235352e-05, 2.5791116058826447e-05, 3.665126860141754e-05, 4.7511421144008636e-05, 5.837157368659973e-05, 6.923172622919083e-05, 8.009187877178192e-05, 9.095203131437302e-05, 0.00010181218385696411, 0.0001126723363995552, 0.0001235324889421463, 0.0001343926414847374, 0.0001452527940273285, 0.00015611294656991959, 0.00016697309911251068, 0.00017783325165510178, 0.00018869340419769287, 0.00019955355674028397, 0.00021041370928287506, 0.00022127386182546616, 0.00023213401436805725, 0.00024299416691064835, 0.00025385431945323944, 0.00026471447199583054, 0.00027557462453842163, 0.0002864347770810127, 0.0002972949296236038, 0.0003081550821661949, 0.000319015234708786, 0.0003298753872513771, 0.0003407355397939682, 0.0003515956923365593, 0.0003624558448791504]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 3.0, 6.0, 7.0, 7.0, 10.0, 13.0, 16.0, 17.0, 14.0, 18.0, 33.0, 18.0, 20.0, 31.0, 29.0, 22.0, 35.0, 45.0, 50.0, 40.0, 45.0, 42.0, 36.0, 41.0, 24.0, 34.0, 23.0, 35.0, 28.0, 36.0, 29.0, 32.0, 22.0, 15.0, 24.0, 12.0, 13.0, 9.0, 12.0, 9.0, 10.0, 7.0, 5.0, 3.0, 0.0, 8.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.115234375, -3.020172119140625, -2.92510986328125, -2.830047607421875, -2.7349853515625, -2.639923095703125, -2.54486083984375, -2.449798583984375, -2.354736328125, -2.259674072265625, -2.16461181640625, -2.069549560546875, -1.9744873046875, -1.879425048828125, -1.78436279296875, -1.689300537109375, -1.59423828125, -1.499176025390625, -1.40411376953125, -1.309051513671875, -1.2139892578125, -1.118927001953125, -1.02386474609375, -0.928802490234375, -0.833740234375, -0.738677978515625, -0.64361572265625, -0.548553466796875, -0.4534912109375, -0.358428955078125, -0.26336669921875, -0.168304443359375, -0.0732421875, 0.021820068359375, 0.11688232421875, 0.211944580078125, 0.3070068359375, 0.402069091796875, 0.49713134765625, 0.592193603515625, 0.687255859375, 0.782318115234375, 0.87738037109375, 0.972442626953125, 1.0675048828125, 1.162567138671875, 1.25762939453125, 1.352691650390625, 1.44775390625, 1.542816162109375, 1.63787841796875, 1.732940673828125, 1.8280029296875, 1.923065185546875, 2.01812744140625, 2.113189697265625, 2.208251953125, 2.303314208984375, 2.39837646484375, 2.493438720703125, 2.5885009765625, 2.683563232421875, 2.77862548828125, 2.873687744140625, 2.96875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 10.0, 6.0, 20.0, 16.0, 22.0, 28.0, 48.0, 74.0, 85.0, 128.0, 157.0, 251.0, 379.0, 579.0, 961.0, 1875.0, 3658.0, 7435.0, 17442.0, 42929.0, 110882.0, 245322.0, 312772.0, 178958.0, 72906.0, 28247.0, 11685.0, 5381.0, 2575.0, 1360.0, 794.0, 488.0, 332.0, 221.0, 147.0, 109.0, 72.0, 52.0, 41.0, 39.0, 21.0, 13.0, 6.0, 8.0, 9.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.1328125, -4.012237548828125, -3.89166259765625, -3.771087646484375, -3.6505126953125, -3.529937744140625, -3.40936279296875, -3.288787841796875, -3.168212890625, -3.047637939453125, -2.92706298828125, -2.806488037109375, -2.6859130859375, -2.565338134765625, -2.44476318359375, -2.324188232421875, -2.20361328125, -2.083038330078125, -1.96246337890625, -1.841888427734375, -1.7213134765625, -1.600738525390625, -1.48016357421875, -1.359588623046875, -1.239013671875, -1.118438720703125, -0.99786376953125, -0.877288818359375, -0.7567138671875, -0.636138916015625, -0.51556396484375, -0.394989013671875, -0.2744140625, -0.153839111328125, -0.03326416015625, 0.087310791015625, 0.2078857421875, 0.328460693359375, 0.44903564453125, 0.569610595703125, 0.690185546875, 0.810760498046875, 0.93133544921875, 1.051910400390625, 1.1724853515625, 1.293060302734375, 1.41363525390625, 1.534210205078125, 1.65478515625, 1.775360107421875, 1.89593505859375, 2.016510009765625, 2.1370849609375, 2.257659912109375, 2.37823486328125, 2.498809814453125, 2.619384765625, 2.739959716796875, 2.86053466796875, 2.981109619140625, 3.1016845703125, 3.222259521484375, 3.34283447265625, 3.463409423828125, 3.583984375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 13.0, 10.0, 6.0, 6.0, 16.0, 14.0, 18.0, 18.0, 19.0, 32.0, 26.0, 23.0, 45.0, 40.0, 35.0, 52.0, 75.0, 159.0, 304.0, 1391.0, 205.0, 102.0, 66.0, 41.0, 52.0, 45.0, 34.0, 30.0, 27.0, 26.0, 17.0, 14.0, 16.0, 10.0, 16.0, 9.0, 7.0, 6.0, 8.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.046875, -11.68359375, -11.3203125, -10.95703125, -10.59375, -10.23046875, -9.8671875, -9.50390625, -9.140625, -8.77734375, -8.4140625, -8.05078125, -7.6875, -7.32421875, -6.9609375, -6.59765625, -6.234375, -5.87109375, -5.5078125, -5.14453125, -4.78125, -4.41796875, -4.0546875, -3.69140625, -3.328125, -2.96484375, -2.6015625, -2.23828125, -1.875, -1.51171875, -1.1484375, -0.78515625, -0.421875, -0.05859375, 0.3046875, 0.66796875, 1.03125, 1.39453125, 1.7578125, 2.12109375, 2.484375, 2.84765625, 3.2109375, 3.57421875, 3.9375, 4.30078125, 4.6640625, 5.02734375, 5.390625, 5.75390625, 6.1171875, 6.48046875, 6.84375, 7.20703125, 7.5703125, 7.93359375, 8.296875, 8.66015625, 9.0234375, 9.38671875, 9.75, 10.11328125, 10.4765625, 10.83984375, 11.203125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 5.0, 7.0, 6.0, 8.0, 10.0, 7.0, 12.0, 16.0, 16.0, 23.0, 30.0, 36.0, 44.0, 53.0, 84.0, 131.0, 205.0, 425.0, 1163.0, 10357.0, 2282929.0, 842446.0, 5776.0, 949.0, 339.0, 184.0, 129.0, 56.0, 39.0, 39.0, 39.0, 25.0, 17.0, 17.0, 17.0, 12.0, 17.0, 6.0, 7.0, 11.0, 5.0, 3.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.921875, -22.155517578125, -21.38916015625, -20.622802734375, -19.8564453125, -19.090087890625, -18.32373046875, -17.557373046875, -16.791015625, -16.024658203125, -15.25830078125, -14.491943359375, -13.7255859375, -12.959228515625, -12.19287109375, -11.426513671875, -10.66015625, -9.893798828125, -9.12744140625, -8.361083984375, -7.5947265625, -6.828369140625, -6.06201171875, -5.295654296875, -4.529296875, -3.762939453125, -2.99658203125, -2.230224609375, -1.4638671875, -0.697509765625, 0.06884765625, 0.835205078125, 1.6015625, 2.367919921875, 3.13427734375, 3.900634765625, 4.6669921875, 5.433349609375, 6.19970703125, 6.966064453125, 7.732421875, 8.498779296875, 9.26513671875, 10.031494140625, 10.7978515625, 11.564208984375, 12.33056640625, 13.096923828125, 13.86328125, 14.629638671875, 15.39599609375, 16.162353515625, 16.9287109375, 17.695068359375, 18.46142578125, 19.227783203125, 19.994140625, 20.760498046875, 21.52685546875, 22.293212890625, 23.0595703125, 23.825927734375, 24.59228515625, 25.358642578125, 26.125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 186.0, 782.0, 43.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-208.3084716796875, -204.4712677001953, -200.6340789794922, -196.796875, -192.95968627929688, -189.1224822998047, -185.2852783203125, -181.44808959960938, -177.6108856201172, -173.773681640625, -169.93649291992188, -166.0992889404297, -162.2620849609375, -158.42489624023438, -154.5876922607422, -150.75050354003906, -146.91329956054688, -143.0760955810547, -139.23890686035156, -135.40170288085938, -131.56451416015625, -127.72731018066406, -123.89010620117188, -120.05290985107422, -116.21571350097656, -112.3785171508789, -108.54132080078125, -104.70411682128906, -100.8669204711914, -97.02972412109375, -93.19252014160156, -89.3553237915039, -85.51812744140625, -81.6809310913086, -77.84373474121094, -74.00653076171875, -70.1693344116211, -66.33213806152344, -62.494937896728516, -58.657737731933594, -54.82053756713867, -50.98333740234375, -47.146141052246094, -43.30894470214844, -39.471744537353516, -35.634544372558594, -31.797348022460938, -27.96014976501465, -24.12295150756836, -20.28575325012207, -16.44855499267578, -12.611356735229492, -8.774158477783203, -4.936960220336914, -1.099761962890625, 2.737436294555664, 6.574634552001953, 10.411832809448242, 14.249031066894531, 18.08622932434082, 21.92342758178711, 25.7606258392334, 29.597824096679688, 33.435020446777344, 37.272220611572266]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 1.0, 4.0, 6.0, 13.0, 10.0, 11.0, 17.0, 11.0, 15.0, 22.0, 19.0, 35.0, 17.0, 30.0, 21.0, 39.0, 48.0, 42.0, 48.0, 39.0, 39.0, 40.0, 28.0, 35.0, 38.0, 29.0, 45.0, 44.0, 31.0, 20.0, 28.0, 25.0, 30.0, 12.0, 15.0, 14.0, 15.0, 17.0, 7.0, 6.0, 7.0, 6.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.04179382324219, -32.95559310913086, -31.86939239501953, -30.783191680908203, -29.696990966796875, -28.610790252685547, -27.524587631225586, -26.438386917114258, -25.35218620300293, -24.2659854888916, -23.179784774780273, -22.093584060668945, -21.007381439208984, -19.921180725097656, -18.834980010986328, -17.748779296875, -16.662578582763672, -15.576377868652344, -14.490177154541016, -13.403975486755371, -12.317774772644043, -11.231574058532715, -10.14537239074707, -9.059171676635742, -7.972970962524414, -6.886770248413086, -5.8005690574646, -4.714367866516113, -3.628167152404785, -2.541966438293457, -1.4557652473449707, -0.3695640563964844, 0.7166366577148438, 1.802837610244751, 2.889038562774658, 3.9752395153045654, 5.061440467834473, 6.147641181945801, 7.233842372894287, 8.320043563842773, 9.406244277954102, 10.49244499206543, 11.578645706176758, 12.664847373962402, 13.75104808807373, 14.837248802185059, 15.923450469970703, 17.00965118408203, 18.09585189819336, 19.182052612304688, 20.268253326416016, 21.354454040527344, 22.440654754638672, 23.52685546875, 24.61305809020996, 25.69925880432129, 26.785459518432617, 27.871660232543945, 28.957860946655273, 30.0440616607666, 31.130264282226562, 32.21646499633789, 33.30266571044922, 34.38886642456055, 35.475067138671875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 3.0, 5.0, 5.0, 13.0, 4.0, 11.0, 13.0, 18.0, 16.0, 17.0, 16.0, 20.0, 27.0, 19.0, 22.0, 40.0, 27.0, 32.0, 36.0, 44.0, 34.0, 44.0, 37.0, 30.0, 48.0, 44.0, 24.0, 35.0, 33.0, 33.0, 29.0, 26.0, 34.0, 17.0, 19.0, 25.0, 15.0, 12.0, 12.0, 11.0, 8.0, 10.0, 3.0, 6.0, 6.0, 3.0, 5.0, 5.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0], "bins": [-3.234375, -3.136474609375, -3.03857421875, -2.940673828125, -2.8427734375, -2.744873046875, -2.64697265625, -2.549072265625, -2.451171875, -2.353271484375, -2.25537109375, -2.157470703125, -2.0595703125, -1.961669921875, -1.86376953125, -1.765869140625, -1.66796875, -1.570068359375, -1.47216796875, -1.374267578125, -1.2763671875, -1.178466796875, -1.08056640625, -0.982666015625, -0.884765625, -0.786865234375, -0.68896484375, -0.591064453125, -0.4931640625, -0.395263671875, -0.29736328125, -0.199462890625, -0.1015625, -0.003662109375, 0.09423828125, 0.192138671875, 0.2900390625, 0.387939453125, 0.48583984375, 0.583740234375, 0.681640625, 0.779541015625, 0.87744140625, 0.975341796875, 1.0732421875, 1.171142578125, 1.26904296875, 1.366943359375, 1.46484375, 1.562744140625, 1.66064453125, 1.758544921875, 1.8564453125, 1.954345703125, 2.05224609375, 2.150146484375, 2.248046875, 2.345947265625, 2.44384765625, 2.541748046875, 2.6396484375, 2.737548828125, 2.83544921875, 2.933349609375, 3.03125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 9.0, 7.0, 16.0, 19.0, 17.0, 31.0, 22.0, 35.0, 48.0, 51.0, 81.0, 127.0, 264.0, 516.0, 1364.0, 5472.0, 39460.0, 615001.0, 3007817.0, 483944.0, 32840.0, 4686.0, 1257.0, 477.0, 220.0, 105.0, 79.0, 58.0, 47.0, 52.0, 29.0, 22.0, 20.0, 20.0, 10.0, 10.0, 13.0, 9.0, 3.0, 2.0, 5.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-12.7109375, -12.3310546875, -11.951171875, -11.5712890625, -11.19140625, -10.8115234375, -10.431640625, -10.0517578125, -9.671875, -9.2919921875, -8.912109375, -8.5322265625, -8.15234375, -7.7724609375, -7.392578125, -7.0126953125, -6.6328125, -6.2529296875, -5.873046875, -5.4931640625, -5.11328125, -4.7333984375, -4.353515625, -3.9736328125, -3.59375, -3.2138671875, -2.833984375, -2.4541015625, -2.07421875, -1.6943359375, -1.314453125, -0.9345703125, -0.5546875, -0.1748046875, 0.205078125, 0.5849609375, 0.96484375, 1.3447265625, 1.724609375, 2.1044921875, 2.484375, 2.8642578125, 3.244140625, 3.6240234375, 4.00390625, 4.3837890625, 4.763671875, 5.1435546875, 5.5234375, 5.9033203125, 6.283203125, 6.6630859375, 7.04296875, 7.4228515625, 7.802734375, 8.1826171875, 8.5625, 8.9423828125, 9.322265625, 9.7021484375, 10.08203125, 10.4619140625, 10.841796875, 11.2216796875, 11.6015625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 10.0, 7.0, 21.0, 31.0, 36.0, 52.0, 83.0, 125.0, 142.0, 216.0, 281.0, 379.0, 484.0, 496.0, 472.0, 354.0, 240.0, 195.0, 128.0, 93.0, 69.0, 48.0, 33.0, 21.0, 24.0, 8.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.1328125, -12.72607421875, -12.3193359375, -11.91259765625, -11.505859375, -11.09912109375, -10.6923828125, -10.28564453125, -9.87890625, -9.47216796875, -9.0654296875, -8.65869140625, -8.251953125, -7.84521484375, -7.4384765625, -7.03173828125, -6.625, -6.21826171875, -5.8115234375, -5.40478515625, -4.998046875, -4.59130859375, -4.1845703125, -3.77783203125, -3.37109375, -2.96435546875, -2.5576171875, -2.15087890625, -1.744140625, -1.33740234375, -0.9306640625, -0.52392578125, -0.1171875, 0.28955078125, 0.6962890625, 1.10302734375, 1.509765625, 1.91650390625, 2.3232421875, 2.72998046875, 3.13671875, 3.54345703125, 3.9501953125, 4.35693359375, 4.763671875, 5.17041015625, 5.5771484375, 5.98388671875, 6.390625, 6.79736328125, 7.2041015625, 7.61083984375, 8.017578125, 8.42431640625, 8.8310546875, 9.23779296875, 9.64453125, 10.05126953125, 10.4580078125, 10.86474609375, 11.271484375, 11.67822265625, 12.0849609375, 12.49169921875, 12.8984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 8.0, 9.0, 12.0, 21.0, 26.0, 45.0, 63.0, 113.0, 177.0, 331.0, 816.0, 2709.0, 41766.0, 3241195.0, 891954.0, 12133.0, 1623.0, 592.0, 270.0, 144.0, 88.0, 61.0, 41.0, 23.0, 22.0, 11.0, 10.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.03125, -22.87744140625, -21.7236328125, -20.56982421875, -19.416015625, -18.26220703125, -17.1083984375, -15.95458984375, -14.80078125, -13.64697265625, -12.4931640625, -11.33935546875, -10.185546875, -9.03173828125, -7.8779296875, -6.72412109375, -5.5703125, -4.41650390625, -3.2626953125, -2.10888671875, -0.955078125, 0.19873046875, 1.3525390625, 2.50634765625, 3.66015625, 4.81396484375, 5.9677734375, 7.12158203125, 8.275390625, 9.42919921875, 10.5830078125, 11.73681640625, 12.890625, 14.04443359375, 15.1982421875, 16.35205078125, 17.505859375, 18.65966796875, 19.8134765625, 20.96728515625, 22.12109375, 23.27490234375, 24.4287109375, 25.58251953125, 26.736328125, 27.89013671875, 29.0439453125, 30.19775390625, 31.3515625, 32.50537109375, 33.6591796875, 34.81298828125, 35.966796875, 37.12060546875, 38.2744140625, 39.42822265625, 40.58203125, 41.73583984375, 42.8896484375, 44.04345703125, 45.197265625, 46.35107421875, 47.5048828125, 48.65869140625, 49.8125]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 8.0, 12.0, 16.0, 19.0, 27.0, 47.0, 56.0, 79.0, 87.0, 80.0, 103.0, 81.0, 80.0, 85.0, 77.0, 44.0, 40.0, 29.0, 13.0, 10.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.093761444091797, -29.010303497314453, -27.926847457885742, -26.84339141845703, -25.759933471679688, -24.676475524902344, -23.593019485473633, -22.509563446044922, -21.426105499267578, -20.342647552490234, -19.259191513061523, -18.175735473632812, -17.09227752685547, -16.008819580078125, -14.925363540649414, -13.841906547546387, -12.75844955444336, -11.674992561340332, -10.591535568237305, -9.508078575134277, -8.42462158203125, -7.341164588928223, -6.257707595825195, -5.174250602722168, -4.090793609619141, -3.0073366165161133, -1.923879623413086, -0.8404226303100586, 0.24303436279296875, 1.326491355895996, 2.4099483489990234, 3.493405342102051, 4.5768585205078125, 5.66031551361084, 6.743772506713867, 7.8272294998168945, 8.910686492919922, 9.99414348602295, 11.077600479125977, 12.161057472229004, 13.244514465332031, 14.327971458435059, 15.411428451538086, 16.494884490966797, 17.57834243774414, 18.661800384521484, 19.745256423950195, 20.828712463378906, 21.91217041015625, 22.995628356933594, 24.079084396362305, 25.162540435791016, 26.24599838256836, 27.329456329345703, 28.412912368774414, 29.496368408203125, 30.57982635498047, 31.663284301757812, 32.746742248535156, 33.830196380615234, 34.91365432739258, 35.99711227416992, 37.08056640625, 38.164024353027344, 39.24748229980469]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 6.0, 17.0, 12.0, 30.0, 23.0, 19.0, 14.0, 34.0, 31.0, 24.0, 41.0, 41.0, 32.0, 53.0, 46.0, 44.0, 43.0, 36.0, 35.0, 50.0, 33.0, 44.0, 47.0, 42.0, 28.0, 25.0, 21.0, 23.0, 20.0, 11.0, 13.0, 10.0, 10.0, 6.0, 8.0, 5.0, 2.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.70399856567383, -38.40064239501953, -37.0972900390625, -35.79393768310547, -34.49058151245117, -33.187225341796875, -31.883872985839844, -30.58051872253418, -29.277164459228516, -27.97381019592285, -26.670455932617188, -25.367101669311523, -24.06374740600586, -22.760393142700195, -21.45703887939453, -20.153684616088867, -18.850330352783203, -17.54697608947754, -16.243621826171875, -14.940267562866211, -13.636913299560547, -12.333559036254883, -11.030204772949219, -9.726850509643555, -8.42349624633789, -7.120141983032227, -5.8167877197265625, -4.513433456420898, -3.2100791931152344, -1.9067249298095703, -0.6033706665039062, 0.6999835968017578, 2.0033416748046875, 3.3066959381103516, 4.610050201416016, 5.91340446472168, 7.216758728027344, 8.520112991333008, 9.823467254638672, 11.126821517944336, 12.43017578125, 13.733530044555664, 15.036884307861328, 16.340238571166992, 17.643592834472656, 18.94694709777832, 20.250301361083984, 21.55365562438965, 22.857009887695312, 24.160364151000977, 25.46371841430664, 26.767072677612305, 28.07042694091797, 29.373781204223633, 30.677135467529297, 31.98048973083496, 33.283843994140625, 34.587196350097656, 35.89055252075195, 37.19390869140625, 38.49726104736328, 39.80061340332031, 41.10396957397461, 42.407325744628906, 43.71067810058594]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 14.0, 9.0, 11.0, 6.0, 13.0, 17.0, 9.0, 21.0, 16.0, 26.0, 34.0, 35.0, 28.0, 30.0, 38.0, 49.0, 35.0, 46.0, 35.0, 57.0, 40.0, 39.0, 35.0, 31.0, 38.0, 33.0, 25.0, 40.0, 22.0, 23.0, 22.0, 14.0, 17.0, 18.0, 9.0, 12.0, 14.0, 7.0, 5.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.63671875, -3.527374267578125, -3.41802978515625, -3.308685302734375, -3.1993408203125, -3.089996337890625, -2.98065185546875, -2.871307373046875, -2.761962890625, -2.652618408203125, -2.54327392578125, -2.433929443359375, -2.3245849609375, -2.215240478515625, -2.10589599609375, -1.996551513671875, -1.88720703125, -1.777862548828125, -1.66851806640625, -1.559173583984375, -1.4498291015625, -1.340484619140625, -1.23114013671875, -1.121795654296875, -1.012451171875, -0.903106689453125, -0.79376220703125, -0.684417724609375, -0.5750732421875, -0.465728759765625, -0.35638427734375, -0.247039794921875, -0.1376953125, -0.028350830078125, 0.08099365234375, 0.190338134765625, 0.2996826171875, 0.409027099609375, 0.51837158203125, 0.627716064453125, 0.737060546875, 0.846405029296875, 0.95574951171875, 1.065093994140625, 1.1744384765625, 1.283782958984375, 1.39312744140625, 1.502471923828125, 1.61181640625, 1.721160888671875, 1.83050537109375, 1.939849853515625, 2.0491943359375, 2.158538818359375, 2.26788330078125, 2.377227783203125, 2.486572265625, 2.595916748046875, 2.70526123046875, 2.814605712890625, 2.9239501953125, 3.033294677734375, 3.14263916015625, 3.251983642578125, 3.361328125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 2.0, 6.0, 12.0, 21.0, 22.0, 36.0, 49.0, 90.0, 100.0, 177.0, 259.0, 374.0, 536.0, 894.0, 1226.0, 1856.0, 2699.0, 4196.0, 6244.0, 9652.0, 15100.0, 23787.0, 39069.0, 64498.0, 112860.0, 229184.0, 241661.0, 117787.0, 66710.0, 39930.0, 24642.0, 15441.0, 9920.0, 6585.0, 4295.0, 2818.0, 1891.0, 1304.0, 863.0, 595.0, 380.0, 264.0, 188.0, 106.0, 73.0, 54.0, 32.0, 22.0, 21.0, 12.0, 11.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.64794921875, -0.6283340454101562, -0.6087188720703125, -0.5891036987304688, -0.569488525390625, -0.5498733520507812, -0.5302581787109375, -0.5106430053710938, -0.49102783203125, -0.47141265869140625, -0.4517974853515625, -0.43218231201171875, -0.412567138671875, -0.39295196533203125, -0.3733367919921875, -0.35372161865234375, -0.3341064453125, -0.31449127197265625, -0.2948760986328125, -0.27526092529296875, -0.255645751953125, -0.23603057861328125, -0.2164154052734375, -0.19680023193359375, -0.17718505859375, -0.15756988525390625, -0.1379547119140625, -0.11833953857421875, -0.098724365234375, -0.07910919189453125, -0.0594940185546875, -0.03987884521484375, -0.020263671875, -0.00064849853515625, 0.0189666748046875, 0.03858184814453125, 0.058197021484375, 0.07781219482421875, 0.0974273681640625, 0.11704254150390625, 0.13665771484375, 0.15627288818359375, 0.1758880615234375, 0.19550323486328125, 0.215118408203125, 0.23473358154296875, 0.2543487548828125, 0.27396392822265625, 0.2935791015625, 0.31319427490234375, 0.3328094482421875, 0.35242462158203125, 0.372039794921875, 0.39165496826171875, 0.4112701416015625, 0.43088531494140625, 0.45050048828125, 0.47011566162109375, 0.4897308349609375, 0.5093460083007812, 0.528961181640625, 0.5485763549804688, 0.5681915283203125, 0.5878067016601562, 0.607421875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 8.0, 11.0, 14.0, 24.0, 19.0, 19.0, 25.0, 26.0, 26.0, 37.0, 33.0, 39.0, 31.0, 42.0, 29.0, 35.0, 37.0, 1070.0, 42.0, 36.0, 39.0, 39.0, 36.0, 36.0, 33.0, 30.0, 19.0, 22.0, 23.0, 24.0, 10.0, 22.0, 12.0, 13.0, 12.0, 6.0, 10.0, 6.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9853515625, -1.9157257080078125, -1.846099853515625, -1.7764739990234375, -1.70684814453125, -1.6372222900390625, -1.567596435546875, -1.4979705810546875, -1.4283447265625, -1.3587188720703125, -1.289093017578125, -1.2194671630859375, -1.14984130859375, -1.0802154541015625, -1.010589599609375, -0.9409637451171875, -0.871337890625, -0.8017120361328125, -0.732086181640625, -0.6624603271484375, -0.59283447265625, -0.5232086181640625, -0.453582763671875, -0.3839569091796875, -0.3143310546875, -0.2447052001953125, -0.175079345703125, -0.1054534912109375, -0.03582763671875, 0.0337982177734375, 0.103424072265625, 0.1730499267578125, 0.24267578125, 0.3123016357421875, 0.381927490234375, 0.4515533447265625, 0.52117919921875, 0.5908050537109375, 0.660430908203125, 0.7300567626953125, 0.7996826171875, 0.8693084716796875, 0.938934326171875, 1.0085601806640625, 1.07818603515625, 1.1478118896484375, 1.217437744140625, 1.2870635986328125, 1.356689453125, 1.4263153076171875, 1.495941162109375, 1.5655670166015625, 1.63519287109375, 1.7048187255859375, 1.774444580078125, 1.8440704345703125, 1.9136962890625, 1.9833221435546875, 2.052947998046875, 2.1225738525390625, 2.19219970703125, 2.2618255615234375, 2.331451416015625, 2.4010772705078125, 2.470703125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 13.0, 18.0, 20.0, 37.0, 53.0, 75.0, 93.0, 143.0, 227.0, 273.0, 382.0, 589.0, 843.0, 1326.0, 1922.0, 3134.0, 4580.0, 7405.0, 11706.0, 18316.0, 29523.0, 48210.0, 82799.0, 154961.0, 1326831.0, 173230.0, 90536.0, 52598.0, 32044.0, 19851.0, 12383.0, 8040.0, 5119.0, 3244.0, 2130.0, 1384.0, 949.0, 694.0, 476.0, 323.0, 191.0, 134.0, 89.0, 68.0, 37.0, 32.0, 27.0, 22.0, 9.0, 14.0, 11.0, 4.0, 3.0, 2.0, 5.0], "bins": [-0.6376953125, -0.6187057495117188, -0.5997161865234375, -0.5807266235351562, -0.561737060546875, -0.5427474975585938, -0.5237579345703125, -0.5047683715820312, -0.48577880859375, -0.46678924560546875, -0.4477996826171875, -0.42881011962890625, -0.409820556640625, -0.39083099365234375, -0.3718414306640625, -0.35285186767578125, -0.3338623046875, -0.31487274169921875, -0.2958831787109375, -0.27689361572265625, -0.257904052734375, -0.23891448974609375, -0.2199249267578125, -0.20093536376953125, -0.18194580078125, -0.16295623779296875, -0.1439666748046875, -0.12497711181640625, -0.105987548828125, -0.08699798583984375, -0.0680084228515625, -0.04901885986328125, -0.030029296875, -0.01103973388671875, 0.0079498291015625, 0.02693939208984375, 0.045928955078125, 0.06491851806640625, 0.0839080810546875, 0.10289764404296875, 0.12188720703125, 0.14087677001953125, 0.1598663330078125, 0.17885589599609375, 0.197845458984375, 0.21683502197265625, 0.2358245849609375, 0.25481414794921875, 0.2738037109375, 0.29279327392578125, 0.3117828369140625, 0.33077239990234375, 0.349761962890625, 0.36875152587890625, 0.3877410888671875, 0.40673065185546875, 0.42572021484375, 0.44470977783203125, 0.4636993408203125, 0.48268890380859375, 0.501678466796875, 0.5206680297851562, 0.5396575927734375, 0.5586471557617188, 0.57763671875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 3.0, 4.0, 2.0, 8.0, 7.0, 8.0, 10.0, 9.0, 9.0, 19.0, 25.0, 14.0, 20.0, 16.0, 28.0, 34.0, 43.0, 43.0, 46.0, 56.0, 53.0, 57.0, 59.0, 50.0, 46.0, 48.0, 34.0, 41.0, 50.0, 33.0, 17.0, 23.0, 20.0, 17.0, 8.0, 14.0, 8.0, 7.0, 4.0, 3.0, 4.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00048160552978515625, -0.00046490877866744995, -0.00044821202754974365, -0.00043151527643203735, -0.00041481852531433105, -0.00039812177419662476, -0.00038142502307891846, -0.00036472827196121216, -0.00034803152084350586, -0.00033133476972579956, -0.00031463801860809326, -0.00029794126749038696, -0.00028124451637268066, -0.00026454776525497437, -0.00024785101413726807, -0.00023115426301956177, -0.00021445751190185547, -0.00019776076078414917, -0.00018106400966644287, -0.00016436725854873657, -0.00014767050743103027, -0.00013097375631332397, -0.00011427700519561768, -9.758025407791138e-05, -8.088350296020508e-05, -6.418675184249878e-05, -4.749000072479248e-05, -3.079324960708618e-05, -1.4096498489379883e-05, 2.600252628326416e-06, 1.9297003746032715e-05, 3.5993754863739014e-05, 5.269050598144531e-05, 6.938725709915161e-05, 8.608400821685791e-05, 0.00010278075933456421, 0.00011947751045227051, 0.0001361742615699768, 0.0001528710126876831, 0.0001695677638053894, 0.0001862645149230957, 0.000202961266040802, 0.0002196580171585083, 0.0002363547682762146, 0.0002530515193939209, 0.0002697482705116272, 0.0002864450216293335, 0.0003031417727470398, 0.0003198385238647461, 0.0003365352749824524, 0.0003532320261001587, 0.000369928777217865, 0.0003866255283355713, 0.0004033222794532776, 0.0004200190305709839, 0.0004367157816886902, 0.0004534125328063965, 0.0004701092839241028, 0.0004868060350418091, 0.0005035027861595154, 0.0005201995372772217, 0.000536896288394928, 0.0005535930395126343, 0.0005702897906303406, 0.0005869865417480469]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 9.0, 5.0, 9.0, 10.0, 19.0, 21.0, 29.0, 57.0, 59.0, 62.0, 98.0, 120.0, 170.0, 222.0, 324.0, 628.0, 10185.0, 1016701.0, 17866.0, 709.0, 322.0, 252.0, 174.0, 134.0, 82.0, 68.0, 48.0, 46.0, 23.0, 32.0, 15.0, 20.0, 8.0, 11.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01288604736328125, -0.012533426284790039, -0.012180805206298828, -0.011828184127807617, -0.011475563049316406, -0.011122941970825195, -0.010770320892333984, -0.010417699813842773, -0.010065078735351562, -0.009712457656860352, -0.00935983657836914, -0.00900721549987793, -0.008654594421386719, -0.008301973342895508, -0.007949352264404297, -0.007596731185913086, -0.007244110107421875, -0.006891489028930664, -0.006538867950439453, -0.006186246871948242, -0.005833625793457031, -0.00548100471496582, -0.005128383636474609, -0.0047757625579833984, -0.0044231414794921875, -0.0040705204010009766, -0.0037178993225097656, -0.0033652782440185547, -0.0030126571655273438, -0.002660036087036133, -0.002307415008544922, -0.001954793930053711, -0.0016021728515625, -0.001249551773071289, -0.0008969306945800781, -0.0005443096160888672, -0.00019168853759765625, 0.0001609325408935547, 0.0005135536193847656, 0.0008661746978759766, 0.0012187957763671875, 0.0015714168548583984, 0.0019240379333496094, 0.0022766590118408203, 0.0026292800903320312, 0.002981901168823242, 0.003334522247314453, 0.003687143325805664, 0.004039764404296875, 0.004392385482788086, 0.004745006561279297, 0.005097627639770508, 0.005450248718261719, 0.00580286979675293, 0.006155490875244141, 0.0065081119537353516, 0.0068607330322265625, 0.0072133541107177734, 0.007565975189208984, 0.007918596267700195, 0.008271217346191406, 0.008623838424682617, 0.008976459503173828, 0.009329080581665039, 0.00968170166015625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 26.0, 180.0, 363.0, 333.0, 93.0, 18.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008653370314277709, -0.0008216529386118054, -0.0007779689040035009, -0.0007342848111875355, -0.0006906007183715701, -0.0006469166837632656, -0.0006032325909473002, -0.0005595484981313348, -0.0005158644635230303, -0.0004721803998108953, -0.0004284963069949299, -0.00038481224328279495, -0.00034112815046682954, -0.0002974440867546946, -0.0002537600230425596, -0.0002100759302265942, -0.0001663918374106288, -0.0001227077591465786, -7.902368815848604e-05, -3.533961717039347e-05, 8.344461093656719e-06, 5.2028539357706904e-05, 9.571260306984186e-05, 0.00013939669588580728, 0.00018308075959794223, 0.00022676483786199242, 0.0002704489161260426, 0.00031413297983817756, 0.0003578170435503125, 0.00040150113636627793, 0.0004451852000784129, 0.0004888692637905478, 0.0005325532983988523, 0.0005762373912148178, 0.0006199214258231223, 0.0006636055186390877, 0.0007072896114550531, 0.0007509737042710185, 0.000794657738879323, 0.0008383418316952884, 0.0008820259245112538, 0.0009257100173272192, 0.0009693940519355237, 0.0010130781447514892, 0.0010567621793597937, 0.00110044633038342, 0.0011441303649917245, 0.001187814399600029, 0.0012314985506236553, 0.0012751825852319598, 0.0013188667362555861, 0.0013625507708638906, 0.0014062348054721951, 0.0014499189564958215, 0.001493602991104126, 0.0015372871421277523, 0.001580971060320735, 0.0016246550949290395, 0.0016683392459526658, 0.0017120232805609703, 0.0017557073151692748, 0.0017993914661929011, 0.0018430755008012056, 0.001886759651824832, 0.0019304436864331365]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 7.0, 15.0, 17.0, 18.0, 16.0, 8.0, 13.0, 23.0, 23.0, 22.0, 27.0, 33.0, 40.0, 34.0, 33.0, 30.0, 31.0, 41.0, 38.0, 43.0, 51.0, 35.0, 36.0, 32.0, 35.0, 32.0, 41.0, 23.0, 18.0, 23.0, 27.0, 25.0, 15.0, 14.0, 8.0, 8.0, 9.0, 10.0, 9.0, 3.0, 10.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025898218154907227, -0.00025032833218574524, -0.0002416744828224182, -0.0002330206334590912, -0.00022436678409576416, -0.00021571293473243713, -0.0002070590853691101, -0.00019840523600578308, -0.00018975138664245605, -0.00018109753727912903, -0.000172443687915802, -0.00016378983855247498, -0.00015513598918914795, -0.00014648213982582092, -0.0001378282904624939, -0.00012917444109916687, -0.00012052059173583984, -0.00011186674237251282, -0.00010321289300918579, -9.455904364585876e-05, -8.590519428253174e-05, -7.725134491920471e-05, -6.859749555587769e-05, -5.994364619255066e-05, -5.128979682922363e-05, -4.2635947465896606e-05, -3.398209810256958e-05, -2.5328248739242554e-05, -1.6674399375915527e-05, -8.020550012588501e-06, 6.332993507385254e-07, 9.287148714065552e-06, 1.7940998077392578e-05, 2.6594847440719604e-05, 3.524869680404663e-05, 4.390254616737366e-05, 5.2556395530700684e-05, 6.121024489402771e-05, 6.986409425735474e-05, 7.851794362068176e-05, 8.717179298400879e-05, 9.582564234733582e-05, 0.00010447949171066284, 0.00011313334107398987, 0.0001217871904373169, 0.00013044103980064392, 0.00013909488916397095, 0.00014774873852729797, 0.000156402587890625, 0.00016505643725395203, 0.00017371028661727905, 0.00018236413598060608, 0.0001910179853439331, 0.00019967183470726013, 0.00020832568407058716, 0.00021697953343391418, 0.0002256333827972412, 0.00023428723216056824, 0.00024294108152389526, 0.0002515949308872223, 0.0002602487802505493, 0.00026890262961387634, 0.00027755647897720337, 0.0002862103283405304, 0.0002948641777038574]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 14.0, 9.0, 11.0, 6.0, 13.0, 17.0, 9.0, 21.0, 16.0, 26.0, 34.0, 35.0, 28.0, 30.0, 38.0, 49.0, 35.0, 46.0, 35.0, 57.0, 40.0, 39.0, 35.0, 31.0, 38.0, 33.0, 25.0, 40.0, 22.0, 23.0, 22.0, 14.0, 17.0, 18.0, 9.0, 12.0, 14.0, 7.0, 5.0, 7.0, 3.0, 1.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.63671875, -3.527374267578125, -3.41802978515625, -3.308685302734375, -3.1993408203125, -3.089996337890625, -2.98065185546875, -2.871307373046875, -2.761962890625, -2.652618408203125, -2.54327392578125, -2.433929443359375, -2.3245849609375, -2.215240478515625, -2.10589599609375, -1.996551513671875, -1.88720703125, -1.777862548828125, -1.66851806640625, -1.559173583984375, -1.4498291015625, -1.340484619140625, -1.23114013671875, -1.121795654296875, -1.012451171875, -0.903106689453125, -0.79376220703125, -0.684417724609375, -0.5750732421875, -0.465728759765625, -0.35638427734375, -0.247039794921875, -0.1376953125, -0.028350830078125, 0.08099365234375, 0.190338134765625, 0.2996826171875, 0.409027099609375, 0.51837158203125, 0.627716064453125, 0.737060546875, 0.846405029296875, 0.95574951171875, 1.065093994140625, 1.1744384765625, 1.283782958984375, 1.39312744140625, 1.502471923828125, 1.61181640625, 1.721160888671875, 1.83050537109375, 1.939849853515625, 2.0491943359375, 2.158538818359375, 2.26788330078125, 2.377227783203125, 2.486572265625, 2.595916748046875, 2.70526123046875, 2.814605712890625, 2.9239501953125, 3.033294677734375, 3.14263916015625, 3.251983642578125, 3.361328125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 4.0, 8.0, 16.0, 11.0, 19.0, 18.0, 28.0, 52.0, 76.0, 103.0, 147.0, 205.0, 277.0, 405.0, 671.0, 1104.0, 1987.0, 3438.0, 6572.0, 12804.0, 28685.0, 72579.0, 210682.0, 403633.0, 187600.0, 65042.0, 26127.0, 12116.0, 6104.0, 3194.0, 1865.0, 1028.0, 661.0, 375.0, 259.0, 179.0, 140.0, 101.0, 68.0, 53.0, 40.0, 31.0, 14.0, 16.0, 14.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-3.9765625, -3.857666015625, -3.73876953125, -3.619873046875, -3.5009765625, -3.382080078125, -3.26318359375, -3.144287109375, -3.025390625, -2.906494140625, -2.78759765625, -2.668701171875, -2.5498046875, -2.430908203125, -2.31201171875, -2.193115234375, -2.07421875, -1.955322265625, -1.83642578125, -1.717529296875, -1.5986328125, -1.479736328125, -1.36083984375, -1.241943359375, -1.123046875, -1.004150390625, -0.88525390625, -0.766357421875, -0.6474609375, -0.528564453125, -0.40966796875, -0.290771484375, -0.171875, -0.052978515625, 0.06591796875, 0.184814453125, 0.3037109375, 0.422607421875, 0.54150390625, 0.660400390625, 0.779296875, 0.898193359375, 1.01708984375, 1.135986328125, 1.2548828125, 1.373779296875, 1.49267578125, 1.611572265625, 1.73046875, 1.849365234375, 1.96826171875, 2.087158203125, 2.2060546875, 2.324951171875, 2.44384765625, 2.562744140625, 2.681640625, 2.800537109375, 2.91943359375, 3.038330078125, 3.1572265625, 3.276123046875, 3.39501953125, 3.513916015625, 3.6328125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 6.0, 11.0, 9.0, 3.0, 4.0, 16.0, 17.0, 23.0, 24.0, 24.0, 38.0, 34.0, 35.0, 32.0, 34.0, 57.0, 75.0, 160.0, 1545.0, 375.0, 106.0, 55.0, 47.0, 30.0, 48.0, 38.0, 38.0, 32.0, 24.0, 18.0, 14.0, 11.0, 19.0, 11.0, 11.0, 10.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.9453125, -12.511962890625, -12.07861328125, -11.645263671875, -11.2119140625, -10.778564453125, -10.34521484375, -9.911865234375, -9.478515625, -9.045166015625, -8.61181640625, -8.178466796875, -7.7451171875, -7.311767578125, -6.87841796875, -6.445068359375, -6.01171875, -5.578369140625, -5.14501953125, -4.711669921875, -4.2783203125, -3.844970703125, -3.41162109375, -2.978271484375, -2.544921875, -2.111572265625, -1.67822265625, -1.244873046875, -0.8115234375, -0.378173828125, 0.05517578125, 0.488525390625, 0.921875, 1.355224609375, 1.78857421875, 2.221923828125, 2.6552734375, 3.088623046875, 3.52197265625, 3.955322265625, 4.388671875, 4.822021484375, 5.25537109375, 5.688720703125, 6.1220703125, 6.555419921875, 6.98876953125, 7.422119140625, 7.85546875, 8.288818359375, 8.72216796875, 9.155517578125, 9.5888671875, 10.022216796875, 10.45556640625, 10.888916015625, 11.322265625, 11.755615234375, 12.18896484375, 12.622314453125, 13.0556640625, 13.489013671875, 13.92236328125, 14.355712890625, 14.7890625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 10.0, 6.0, 13.0, 14.0, 20.0, 16.0, 22.0, 27.0, 28.0, 47.0, 59.0, 82.0, 111.0, 203.0, 366.0, 1046.0, 8161.0, 595224.0, 2522478.0, 15036.0, 1564.0, 470.0, 214.0, 136.0, 66.0, 63.0, 51.0, 41.0, 30.0, 19.0, 18.0, 14.0, 7.0, 8.0, 10.0, 17.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.765625, -24.017578125, -23.26953125, -22.521484375, -21.7734375, -21.025390625, -20.27734375, -19.529296875, -18.78125, -18.033203125, -17.28515625, -16.537109375, -15.7890625, -15.041015625, -14.29296875, -13.544921875, -12.796875, -12.048828125, -11.30078125, -10.552734375, -9.8046875, -9.056640625, -8.30859375, -7.560546875, -6.8125, -6.064453125, -5.31640625, -4.568359375, -3.8203125, -3.072265625, -2.32421875, -1.576171875, -0.828125, -0.080078125, 0.66796875, 1.416015625, 2.1640625, 2.912109375, 3.66015625, 4.408203125, 5.15625, 5.904296875, 6.65234375, 7.400390625, 8.1484375, 8.896484375, 9.64453125, 10.392578125, 11.140625, 11.888671875, 12.63671875, 13.384765625, 14.1328125, 14.880859375, 15.62890625, 16.376953125, 17.125, 17.873046875, 18.62109375, 19.369140625, 20.1171875, 20.865234375, 21.61328125, 22.361328125, 23.109375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 16.0, 22.0, 64.0, 141.0, 173.0, 204.0, 170.0, 118.0, 42.0, 29.0, 13.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0806245803833, -10.249979019165039, -9.419332504272461, -8.588685989379883, -7.758040428161621, -6.927394390106201, -6.096748352050781, -5.266102313995361, -4.435456275939941, -3.6048102378845215, -2.7741641998291016, -1.9435181617736816, -1.1128721237182617, -0.2822260856628418, 0.5484199523925781, 1.379065990447998, 2.209712028503418, 3.040358066558838, 3.871004104614258, 4.701650142669678, 5.532296180725098, 6.362942218780518, 7.1935882568359375, 8.024234771728516, 8.854880332946777, 9.685525894165039, 10.516172409057617, 11.346818923950195, 12.177464485168457, 13.008110046386719, 13.838756561279297, 14.669403076171875, 15.500049591064453, 16.33069610595703, 17.16134262084961, 17.991987228393555, 18.822633743286133, 19.65328025817871, 20.483924865722656, 21.314571380615234, 22.145217895507812, 22.97586441040039, 23.80651092529297, 24.637155532836914, 25.467802047729492, 26.29844856262207, 27.129093170166016, 27.959739685058594, 28.790386199951172, 29.62103271484375, 30.451679229736328, 31.282323837280273, 32.11296844482422, 32.9436149597168, 33.774261474609375, 34.60490798950195, 35.43555450439453, 36.26620101928711, 37.09684753417969, 37.927494049072266, 38.758140563964844, 39.588783264160156, 40.419429779052734, 41.25007629394531, 42.08072280883789]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 7.0, 6.0, 14.0, 9.0, 12.0, 12.0, 14.0, 11.0, 19.0, 29.0, 35.0, 32.0, 40.0, 32.0, 34.0, 32.0, 46.0, 41.0, 41.0, 26.0, 46.0, 35.0, 42.0, 36.0, 36.0, 41.0, 33.0, 30.0, 26.0, 30.0, 26.0, 24.0, 27.0, 9.0, 15.0, 11.0, 7.0, 5.0, 7.0, 3.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-41.49871063232422, -40.227928161621094, -38.957149505615234, -37.68636703491211, -36.415584564208984, -35.144805908203125, -33.8740234375, -32.603240966796875, -31.332460403442383, -30.06167984008789, -28.790897369384766, -27.520116806030273, -26.24933624267578, -24.978553771972656, -23.707773208618164, -22.436992645263672, -21.166210174560547, -19.895429611206055, -18.62464714050293, -17.353866577148438, -16.083084106445312, -14.81230354309082, -13.541522979736328, -12.27074146270752, -10.999959945678711, -9.729178428649902, -8.458396911621094, -7.187616348266602, -5.916834831237793, -4.646053314208984, -3.375272274017334, -2.1044912338256836, -0.833709716796875, 0.4370715618133545, 1.707852840423584, 2.9786341190338135, 4.249415397644043, 5.520196914672852, 6.790977954864502, 8.061758995056152, 9.332540512084961, 10.60332202911377, 11.874103546142578, 13.14488410949707, 14.415665626525879, 15.686447143554688, 16.95722770690918, 18.228008270263672, 19.498790740966797, 20.76957130432129, 22.040353775024414, 23.311134338378906, 24.58191680908203, 25.852697372436523, 27.123477935791016, 28.39426040649414, 29.665040969848633, 30.935821533203125, 32.20660400390625, 33.477386474609375, 34.748165130615234, 36.01894760131836, 37.289730072021484, 38.560508728027344, 39.83129119873047]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 8.0, 6.0, 9.0, 12.0, 13.0, 14.0, 11.0, 18.0, 22.0, 20.0, 35.0, 31.0, 34.0, 39.0, 31.0, 44.0, 50.0, 37.0, 55.0, 43.0, 40.0, 37.0, 45.0, 27.0, 34.0, 47.0, 31.0, 30.0, 21.0, 30.0, 24.0, 9.0, 16.0, 17.0, 11.0, 7.0, 9.0, 10.0, 2.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.917449951171875, -3.79583740234375, -3.674224853515625, -3.5526123046875, -3.430999755859375, -3.30938720703125, -3.187774658203125, -3.066162109375, -2.944549560546875, -2.82293701171875, -2.701324462890625, -2.5797119140625, -2.458099365234375, -2.33648681640625, -2.214874267578125, -2.09326171875, -1.971649169921875, -1.85003662109375, -1.728424072265625, -1.6068115234375, -1.485198974609375, -1.36358642578125, -1.241973876953125, -1.120361328125, -0.998748779296875, -0.87713623046875, -0.755523681640625, -0.6339111328125, -0.512298583984375, -0.39068603515625, -0.269073486328125, -0.1474609375, -0.025848388671875, 0.09576416015625, 0.217376708984375, 0.3389892578125, 0.460601806640625, 0.58221435546875, 0.703826904296875, 0.825439453125, 0.947052001953125, 1.06866455078125, 1.190277099609375, 1.3118896484375, 1.433502197265625, 1.55511474609375, 1.676727294921875, 1.79833984375, 1.919952392578125, 2.04156494140625, 2.163177490234375, 2.2847900390625, 2.406402587890625, 2.52801513671875, 2.649627685546875, 2.771240234375, 2.892852783203125, 3.01446533203125, 3.136077880859375, 3.2576904296875, 3.379302978515625, 3.50091552734375, 3.622528076171875, 3.744140625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 4.0, 14.0, 5.0, 10.0, 9.0, 13.0, 18.0, 21.0, 23.0, 26.0, 25.0, 42.0, 48.0, 60.0, 122.0, 374.0, 2239.0, 40712.0, 2666215.0, 1462002.0, 20156.0, 1442.0, 280.0, 94.0, 46.0, 40.0, 33.0, 34.0, 23.0, 20.0, 16.0, 22.0, 19.0, 10.0, 5.0, 9.0, 7.0, 6.0, 5.0, 6.0, 6.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.71875, -21.078125, -20.4375, -19.796875, -19.15625, -18.515625, -17.875, -17.234375, -16.59375, -15.953125, -15.3125, -14.671875, -14.03125, -13.390625, -12.75, -12.109375, -11.46875, -10.828125, -10.1875, -9.546875, -8.90625, -8.265625, -7.625, -6.984375, -6.34375, -5.703125, -5.0625, -4.421875, -3.78125, -3.140625, -2.5, -1.859375, -1.21875, -0.578125, 0.0625, 0.703125, 1.34375, 1.984375, 2.625, 3.265625, 3.90625, 4.546875, 5.1875, 5.828125, 6.46875, 7.109375, 7.75, 8.390625, 9.03125, 9.671875, 10.3125, 10.953125, 11.59375, 12.234375, 12.875, 13.515625, 14.15625, 14.796875, 15.4375, 16.078125, 16.71875, 17.359375, 18.0, 18.640625, 19.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 6.0, 9.0, 12.0, 19.0, 27.0, 34.0, 58.0, 84.0, 127.0, 152.0, 209.0, 330.0, 433.0, 488.0, 499.0, 384.0, 353.0, 271.0, 175.0, 109.0, 87.0, 61.0, 48.0, 32.0, 19.0, 14.0, 4.0, 8.0, 7.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-15.5625, -15.173828125, -14.78515625, -14.396484375, -14.0078125, -13.619140625, -13.23046875, -12.841796875, -12.453125, -12.064453125, -11.67578125, -11.287109375, -10.8984375, -10.509765625, -10.12109375, -9.732421875, -9.34375, -8.955078125, -8.56640625, -8.177734375, -7.7890625, -7.400390625, -7.01171875, -6.623046875, -6.234375, -5.845703125, -5.45703125, -5.068359375, -4.6796875, -4.291015625, -3.90234375, -3.513671875, -3.125, -2.736328125, -2.34765625, -1.958984375, -1.5703125, -1.181640625, -0.79296875, -0.404296875, -0.015625, 0.373046875, 0.76171875, 1.150390625, 1.5390625, 1.927734375, 2.31640625, 2.705078125, 3.09375, 3.482421875, 3.87109375, 4.259765625, 4.6484375, 5.037109375, 5.42578125, 5.814453125, 6.203125, 6.591796875, 6.98046875, 7.369140625, 7.7578125, 8.146484375, 8.53515625, 8.923828125, 9.3125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 3.0, 10.0, 14.0, 10.0, 21.0, 28.0, 53.0, 79.0, 138.0, 201.0, 392.0, 1303.0, 18019.0, 3197142.0, 968322.0, 6944.0, 790.0, 329.0, 182.0, 113.0, 73.0, 44.0, 30.0, 13.0, 5.0, 7.0, 6.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.3125, -33.892578125, -32.47265625, -31.052734375, -29.6328125, -28.212890625, -26.79296875, -25.373046875, -23.953125, -22.533203125, -21.11328125, -19.693359375, -18.2734375, -16.853515625, -15.43359375, -14.013671875, -12.59375, -11.173828125, -9.75390625, -8.333984375, -6.9140625, -5.494140625, -4.07421875, -2.654296875, -1.234375, 0.185546875, 1.60546875, 3.025390625, 4.4453125, 5.865234375, 7.28515625, 8.705078125, 10.125, 11.544921875, 12.96484375, 14.384765625, 15.8046875, 17.224609375, 18.64453125, 20.064453125, 21.484375, 22.904296875, 24.32421875, 25.744140625, 27.1640625, 28.583984375, 30.00390625, 31.423828125, 32.84375, 34.263671875, 35.68359375, 37.103515625, 38.5234375, 39.943359375, 41.36328125, 42.783203125, 44.203125, 45.623046875, 47.04296875, 48.462890625, 49.8828125, 51.302734375, 52.72265625, 54.142578125, 55.5625]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 19.0, 97.0, 301.0, 376.0, 183.0, 33.0, 5.0, 2.0], "bins": [-292.83917236328125, -287.89251708984375, -282.9458312988281, -277.9991760253906, -273.0525207519531, -268.1058349609375, -263.1591796875, -258.2125244140625, -253.26583862304688, -248.3191680908203, -243.3725128173828, -238.42584228515625, -233.4791717529297, -228.53250122070312, -223.58584594726562, -218.63917541503906, -213.69252014160156, -208.745849609375, -203.7991943359375, -198.85252380371094, -193.90585327148438, -188.95919799804688, -184.0125274658203, -179.06585693359375, -174.11920166015625, -169.1725311279297, -164.2258758544922, -159.27920532226562, -154.33253479003906, -149.3858642578125, -144.439208984375, -139.49253845214844, -134.54586791992188, -129.5991973876953, -124.65253448486328, -119.70587158203125, -114.75920104980469, -109.81253814697266, -104.86587524414062, -99.91920471191406, -94.97254180908203, -90.02587890625, -85.07920837402344, -80.1325454711914, -75.18588256835938, -70.23921203613281, -65.29254913330078, -60.345882415771484, -55.39921569824219, -50.45254898071289, -45.505882263183594, -40.55921936035156, -35.612552642822266, -30.66588592529297, -25.719221115112305, -20.77255630493164, -15.825891494750977, -10.879225730895996, -5.932559967041016, -0.9858942031860352, 3.9607715606689453, 8.907438278198242, 13.854103088378906, 18.80076789855957, 23.747434616088867]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 9.0, 6.0, 13.0, 11.0, 17.0, 29.0, 16.0, 17.0, 19.0, 27.0, 30.0, 34.0, 36.0, 43.0, 45.0, 56.0, 42.0, 51.0, 34.0, 42.0, 48.0, 44.0, 38.0, 57.0, 39.0, 30.0, 34.0, 26.0, 18.0, 24.0, 18.0, 13.0, 9.0, 9.0, 3.0, 4.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.424598693847656, -40.11902618408203, -38.81345748901367, -37.50788879394531, -36.20231628417969, -34.89674377441406, -33.5911750793457, -32.285606384277344, -30.98003387451172, -29.674463272094727, -28.368892669677734, -27.063322067260742, -25.75775146484375, -24.452180862426758, -23.146610260009766, -21.841039657592773, -20.53546905517578, -19.22989845275879, -17.924327850341797, -16.618757247924805, -15.313186645507812, -14.00761604309082, -12.702045440673828, -11.396474838256836, -10.090904235839844, -8.785333633422852, -7.479763031005859, -6.174192428588867, -4.868621826171875, -3.563051223754883, -2.2574806213378906, -0.9519100189208984, 0.3536567687988281, 1.6592273712158203, 2.9647979736328125, 4.270368576049805, 5.575939178466797, 6.881509780883789, 8.187080383300781, 9.492650985717773, 10.798221588134766, 12.103792190551758, 13.40936279296875, 14.714933395385742, 16.020503997802734, 17.326074600219727, 18.63164520263672, 19.93721580505371, 21.242786407470703, 22.548357009887695, 23.853927612304688, 25.15949821472168, 26.465068817138672, 27.770639419555664, 29.076210021972656, 30.38178062438965, 31.68735122680664, 32.992919921875, 34.298492431640625, 35.60406494140625, 36.90963363647461, 38.21520233154297, 39.520774841308594, 40.82634735107422, 42.13191604614258]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 5.0, 6.0, 13.0, 7.0, 14.0, 18.0, 17.0, 21.0, 21.0, 19.0, 34.0, 30.0, 26.0, 48.0, 39.0, 38.0, 51.0, 61.0, 39.0, 39.0, 58.0, 40.0, 44.0, 37.0, 41.0, 37.0, 30.0, 31.0, 18.0, 21.0, 22.0, 13.0, 10.0, 11.0, 11.0, 8.0, 5.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.260009765625, -4.12548828125, -3.990966796875, -3.8564453125, -3.721923828125, -3.58740234375, -3.452880859375, -3.318359375, -3.183837890625, -3.04931640625, -2.914794921875, -2.7802734375, -2.645751953125, -2.51123046875, -2.376708984375, -2.2421875, -2.107666015625, -1.97314453125, -1.838623046875, -1.7041015625, -1.569580078125, -1.43505859375, -1.300537109375, -1.166015625, -1.031494140625, -0.89697265625, -0.762451171875, -0.6279296875, -0.493408203125, -0.35888671875, -0.224365234375, -0.08984375, 0.044677734375, 0.17919921875, 0.313720703125, 0.4482421875, 0.582763671875, 0.71728515625, 0.851806640625, 0.986328125, 1.120849609375, 1.25537109375, 1.389892578125, 1.5244140625, 1.658935546875, 1.79345703125, 1.927978515625, 2.0625, 2.197021484375, 2.33154296875, 2.466064453125, 2.6005859375, 2.735107421875, 2.86962890625, 3.004150390625, 3.138671875, 3.273193359375, 3.40771484375, 3.542236328125, 3.6767578125, 3.811279296875, 3.94580078125, 4.080322265625, 4.21484375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 6.0, 12.0, 13.0, 11.0, 20.0, 30.0, 40.0, 53.0, 86.0, 140.0, 179.0, 239.0, 397.0, 528.0, 740.0, 1073.0, 1662.0, 2321.0, 3690.0, 5372.0, 8074.0, 12768.0, 20133.0, 31849.0, 51988.0, 87530.0, 159905.0, 267367.0, 161531.0, 88306.0, 52637.0, 32099.0, 20016.0, 12765.0, 8359.0, 5351.0, 3647.0, 2311.0, 1662.0, 1100.0, 795.0, 552.0, 352.0, 257.0, 168.0, 136.0, 83.0, 52.0, 55.0, 41.0, 24.0, 12.0, 15.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.65576171875, -0.63494873046875, -0.6141357421875, -0.59332275390625, -0.572509765625, -0.55169677734375, -0.5308837890625, -0.51007080078125, -0.4892578125, -0.46844482421875, -0.4476318359375, -0.42681884765625, -0.406005859375, -0.38519287109375, -0.3643798828125, -0.34356689453125, -0.32275390625, -0.30194091796875, -0.2811279296875, -0.26031494140625, -0.239501953125, -0.21868896484375, -0.1978759765625, -0.17706298828125, -0.15625, -0.13543701171875, -0.1146240234375, -0.09381103515625, -0.072998046875, -0.05218505859375, -0.0313720703125, -0.01055908203125, 0.01025390625, 0.03106689453125, 0.0518798828125, 0.07269287109375, 0.093505859375, 0.11431884765625, 0.1351318359375, 0.15594482421875, 0.1767578125, 0.19757080078125, 0.2183837890625, 0.23919677734375, 0.260009765625, 0.28082275390625, 0.3016357421875, 0.32244873046875, 0.34326171875, 0.36407470703125, 0.3848876953125, 0.40570068359375, 0.426513671875, 0.44732666015625, 0.4681396484375, 0.48895263671875, 0.509765625, 0.53057861328125, 0.5513916015625, 0.57220458984375, 0.593017578125, 0.61383056640625, 0.6346435546875, 0.65545654296875, 0.67626953125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 9.0, 2.0, 6.0, 8.0, 7.0, 10.0, 8.0, 13.0, 6.0, 21.0, 21.0, 24.0, 33.0, 22.0, 26.0, 35.0, 35.0, 39.0, 33.0, 39.0, 36.0, 42.0, 1065.0, 43.0, 35.0, 38.0, 31.0, 40.0, 27.0, 41.0, 32.0, 20.0, 27.0, 16.0, 21.0, 18.0, 19.0, 10.0, 6.0, 13.0, 9.0, 6.0, 6.0, 5.0, 3.0, 4.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.310546875, -2.239654541015625, -2.16876220703125, -2.097869873046875, -2.0269775390625, -1.956085205078125, -1.88519287109375, -1.814300537109375, -1.743408203125, -1.672515869140625, -1.60162353515625, -1.530731201171875, -1.4598388671875, -1.388946533203125, -1.31805419921875, -1.247161865234375, -1.17626953125, -1.105377197265625, -1.03448486328125, -0.963592529296875, -0.8927001953125, -0.821807861328125, -0.75091552734375, -0.680023193359375, -0.609130859375, -0.538238525390625, -0.46734619140625, -0.396453857421875, -0.3255615234375, -0.254669189453125, -0.18377685546875, -0.112884521484375, -0.0419921875, 0.028900146484375, 0.09979248046875, 0.170684814453125, 0.2415771484375, 0.312469482421875, 0.38336181640625, 0.454254150390625, 0.525146484375, 0.596038818359375, 0.66693115234375, 0.737823486328125, 0.8087158203125, 0.879608154296875, 0.95050048828125, 1.021392822265625, 1.09228515625, 1.163177490234375, 1.23406982421875, 1.304962158203125, 1.3758544921875, 1.446746826171875, 1.51763916015625, 1.588531494140625, 1.659423828125, 1.730316162109375, 1.80120849609375, 1.872100830078125, 1.9429931640625, 2.013885498046875, 2.08477783203125, 2.155670166015625, 2.2265625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 12.0, 10.0, 6.0, 15.0, 26.0, 41.0, 53.0, 51.0, 77.0, 122.0, 141.0, 194.0, 252.0, 352.0, 548.0, 804.0, 1135.0, 1577.0, 2130.0, 3282.0, 4800.0, 7059.0, 10416.0, 15803.0, 24657.0, 39918.0, 66745.0, 121156.0, 1286974.0, 224085.0, 113427.0, 62937.0, 37638.0, 23513.0, 15081.0, 10039.0, 6728.0, 4596.0, 3159.0, 2217.0, 1575.0, 1092.0, 722.0, 543.0, 406.0, 267.0, 216.0, 152.0, 107.0, 82.0, 79.0, 41.0, 23.0, 27.0, 12.0, 9.0, 3.0, 5.0, 2.0, 3.0, 3.0], "bins": [-0.61328125, -0.594085693359375, -0.57489013671875, -0.555694580078125, -0.5364990234375, -0.517303466796875, -0.49810791015625, -0.478912353515625, -0.459716796875, -0.440521240234375, -0.42132568359375, -0.402130126953125, -0.3829345703125, -0.363739013671875, -0.34454345703125, -0.325347900390625, -0.30615234375, -0.286956787109375, -0.26776123046875, -0.248565673828125, -0.2293701171875, -0.210174560546875, -0.19097900390625, -0.171783447265625, -0.152587890625, -0.133392333984375, -0.11419677734375, -0.095001220703125, -0.0758056640625, -0.056610107421875, -0.03741455078125, -0.018218994140625, 0.0009765625, 0.020172119140625, 0.03936767578125, 0.058563232421875, 0.0777587890625, 0.096954345703125, 0.11614990234375, 0.135345458984375, 0.154541015625, 0.173736572265625, 0.19293212890625, 0.212127685546875, 0.2313232421875, 0.250518798828125, 0.26971435546875, 0.288909912109375, 0.30810546875, 0.327301025390625, 0.34649658203125, 0.365692138671875, 0.3848876953125, 0.404083251953125, 0.42327880859375, 0.442474365234375, 0.461669921875, 0.480865478515625, 0.50006103515625, 0.519256591796875, 0.5384521484375, 0.557647705078125, 0.57684326171875, 0.596038818359375, 0.615234375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 6.0, 6.0, 5.0, 5.0, 17.0, 10.0, 16.0, 20.0, 26.0, 26.0, 42.0, 37.0, 48.0, 40.0, 47.0, 62.0, 63.0, 62.0, 52.0, 35.0, 49.0, 42.0, 36.0, 44.0, 30.0, 42.0, 18.0, 22.0, 17.0, 11.0, 8.0, 11.0, 3.0, 7.0, 2.0, 5.0, 8.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005731582641601562, -0.0005535483360290527, -0.0005339384078979492, -0.0005143284797668457, -0.0004947185516357422, -0.00047510862350463867, -0.00045549869537353516, -0.00043588876724243164, -0.0004162788391113281, -0.0003966689109802246, -0.0003770589828491211, -0.0003574490547180176, -0.00033783912658691406, -0.00031822919845581055, -0.00029861927032470703, -0.0002790093421936035, -0.0002593994140625, -0.00023978948593139648, -0.00022017955780029297, -0.00020056962966918945, -0.00018095970153808594, -0.00016134977340698242, -0.0001417398452758789, -0.0001221299171447754, -0.00010251998901367188, -8.291006088256836e-05, -6.330013275146484e-05, -4.369020462036133e-05, -2.4080276489257812e-05, -4.470348358154297e-06, 1.5139579772949219e-05, 3.4749507904052734e-05, 5.435943603515625e-05, 7.396936416625977e-05, 9.357929229736328e-05, 0.0001131892204284668, 0.0001327991485595703, 0.00015240907669067383, 0.00017201900482177734, 0.00019162893295288086, 0.00021123886108398438, 0.0002308487892150879, 0.0002504587173461914, 0.0002700686454772949, 0.00028967857360839844, 0.00030928850173950195, 0.00032889842987060547, 0.000348508358001709, 0.0003681182861328125, 0.000387728214263916, 0.00040733814239501953, 0.00042694807052612305, 0.00044655799865722656, 0.0004661679267883301, 0.0004857778549194336, 0.0005053877830505371, 0.0005249977111816406, 0.0005446076393127441, 0.0005642175674438477, 0.0005838274955749512, 0.0006034374237060547, 0.0006230473518371582, 0.0006426572799682617, 0.0006622672080993652, 0.0006818771362304688]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 9.0, 5.0, 13.0, 8.0, 10.0, 26.0, 28.0, 42.0, 50.0, 68.0, 98.0, 141.0, 229.0, 322.0, 784.0, 48709.0, 993817.0, 2773.0, 505.0, 256.0, 195.0, 117.0, 90.0, 60.0, 46.0, 32.0, 25.0, 18.0, 14.0, 13.0, 15.0, 7.0, 5.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.0171051025390625, -0.016646265983581543, -0.016187429428100586, -0.01572859287261963, -0.015269756317138672, -0.014810919761657715, -0.014352083206176758, -0.0138932466506958, -0.013434410095214844, -0.012975573539733887, -0.01251673698425293, -0.012057900428771973, -0.011599063873291016, -0.011140227317810059, -0.010681390762329102, -0.010222554206848145, -0.009763717651367188, -0.00930488109588623, -0.008846044540405273, -0.008387207984924316, -0.00792837142944336, -0.007469534873962402, -0.007010698318481445, -0.006551861763000488, -0.006093025207519531, -0.005634188652038574, -0.005175352096557617, -0.00471651554107666, -0.004257678985595703, -0.003798842430114746, -0.003340005874633789, -0.002881169319152832, -0.002422332763671875, -0.001963496208190918, -0.001504659652709961, -0.001045823097229004, -0.0005869865417480469, -0.00012814998626708984, 0.0003306865692138672, 0.0007895231246948242, 0.0012483596801757812, 0.0017071962356567383, 0.0021660327911376953, 0.0026248693466186523, 0.0030837059020996094, 0.0035425424575805664, 0.0040013790130615234, 0.0044602155685424805, 0.0049190521240234375, 0.0053778886795043945, 0.0058367252349853516, 0.006295561790466309, 0.006754398345947266, 0.007213234901428223, 0.00767207145690918, 0.008130908012390137, 0.008589744567871094, 0.00904858112335205, 0.009507417678833008, 0.009966254234313965, 0.010425090789794922, 0.010883927345275879, 0.011342763900756836, 0.011801600456237793, 0.01226043701171875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 45.0, 117.0, 264.0, 302.0, 180.0, 69.0, 14.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004487147962208837, -0.0004120715311728418, -0.0003754282952286303, -0.00033878503018058836, -0.0003021417651325464, -0.00026549852918833494, -0.000228855264140293, -0.00019221202819608152, -0.00015556876314803958, -0.00011892551265191287, -8.228225487982854e-05, -4.563899710774422e-05, -8.995746611617506e-06, 2.7647503884509206e-05, 6.429076893255115e-05, 0.00010093400487676263, 0.00013757726992480457, 0.00017422052042093128, 0.000210863770917058, 0.00024750703596509993, 0.00028415030101314187, 0.00032079353695735335, 0.0003574368020053953, 0.0003940800379496068, 0.0004307233029976487, 0.00046736656804569066, 0.0005040098330937326, 0.0005406530690379441, 0.0005772963049821556, 0.000613939599134028, 0.0006505828350782394, 0.0006872260710224509, 0.0007238693069666624, 0.0007605125429108739, 0.0007971558370627463, 0.0008337990730069578, 0.0008704423089511693, 0.0009070856031030416, 0.0009437288390472531, 0.0009803720749914646, 0.001017015310935676, 0.0010536585468798876, 0.001090301782824099, 0.0011269450187683105, 0.0011635883711278439, 0.0012002316070720553, 0.0012368748430162668, 0.0012735180789604783, 0.0013101613149046898, 0.0013468045508489013, 0.0013834477867931128, 0.001420091139152646, 0.0014567343750968575, 0.001493377611041069, 0.0015300208469852805, 0.001566664082929492, 0.0016033074352890253, 0.0016399506712332368, 0.0016765939071774483, 0.0017132372595369816, 0.001749880495481193, 0.0017865237314254045, 0.001823166967369616, 0.0018598102033138275, 0.001896453439258039]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 6.0, 13.0, 7.0, 12.0, 10.0, 17.0, 21.0, 14.0, 24.0, 22.0, 18.0, 26.0, 28.0, 50.0, 43.0, 41.0, 32.0, 34.0, 33.0, 43.0, 53.0, 38.0, 35.0, 43.0, 33.0, 44.0, 37.0, 18.0, 29.0, 22.0, 26.0, 21.0, 15.0, 17.0, 15.0, 12.0, 9.0, 6.0, 8.0, 8.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00034630298614501953, -0.0003356989473104477, -0.00032509490847587585, -0.000314490869641304, -0.0003038868308067322, -0.00029328279197216034, -0.0002826787531375885, -0.00027207471430301666, -0.0002614706754684448, -0.000250866636633873, -0.00024026259779930115, -0.0002296585589647293, -0.00021905452013015747, -0.00020845048129558563, -0.0001978464424610138, -0.00018724240362644196, -0.00017663836479187012, -0.00016603432595729828, -0.00015543028712272644, -0.0001448262482881546, -0.00013422220945358276, -0.00012361817061901093, -0.00011301413178443909, -0.00010241009294986725, -9.180605411529541e-05, -8.120201528072357e-05, -7.059797644615173e-05, -5.9993937611579895e-05, -4.938989877700806e-05, -3.878585994243622e-05, -2.818182110786438e-05, -1.757778227329254e-05, -6.973743438720703e-06, 3.6302953958511353e-06, 1.4234334230422974e-05, 2.4838373064994812e-05, 3.544241189956665e-05, 4.604645073413849e-05, 5.665048956871033e-05, 6.725452840328217e-05, 7.7858567237854e-05, 8.846260607242584e-05, 9.906664490699768e-05, 0.00010967068374156952, 0.00012027472257614136, 0.0001308787614107132, 0.00014148280024528503, 0.00015208683907985687, 0.0001626908779144287, 0.00017329491674900055, 0.0001838989555835724, 0.00019450299441814423, 0.00020510703325271606, 0.0002157110720872879, 0.00022631511092185974, 0.00023691914975643158, 0.0002475231885910034, 0.00025812722742557526, 0.0002687312662601471, 0.00027933530509471893, 0.00028993934392929077, 0.0003005433827638626, 0.00031114742159843445, 0.0003217514604330063, 0.0003323554992675781]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 5.0, 6.0, 13.0, 7.0, 14.0, 18.0, 17.0, 21.0, 21.0, 19.0, 34.0, 30.0, 26.0, 48.0, 39.0, 38.0, 51.0, 61.0, 39.0, 39.0, 58.0, 40.0, 43.0, 38.0, 41.0, 37.0, 30.0, 31.0, 18.0, 21.0, 22.0, 13.0, 10.0, 11.0, 11.0, 8.0, 5.0, 6.0, 1.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.260009765625, -4.12548828125, -3.990966796875, -3.8564453125, -3.721923828125, -3.58740234375, -3.452880859375, -3.318359375, -3.183837890625, -3.04931640625, -2.914794921875, -2.7802734375, -2.645751953125, -2.51123046875, -2.376708984375, -2.2421875, -2.107666015625, -1.97314453125, -1.838623046875, -1.7041015625, -1.569580078125, -1.43505859375, -1.300537109375, -1.166015625, -1.031494140625, -0.89697265625, -0.762451171875, -0.6279296875, -0.493408203125, -0.35888671875, -0.224365234375, -0.08984375, 0.044677734375, 0.17919921875, 0.313720703125, 0.4482421875, 0.582763671875, 0.71728515625, 0.851806640625, 0.986328125, 1.120849609375, 1.25537109375, 1.389892578125, 1.5244140625, 1.658935546875, 1.79345703125, 1.927978515625, 2.0625, 2.197021484375, 2.33154296875, 2.466064453125, 2.6005859375, 2.735107421875, 2.86962890625, 3.004150390625, 3.138671875, 3.273193359375, 3.40771484375, 3.542236328125, 3.6767578125, 3.811279296875, 3.94580078125, 4.080322265625, 4.21484375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 7.0, 6.0, 14.0, 18.0, 18.0, 23.0, 37.0, 64.0, 85.0, 87.0, 148.0, 246.0, 330.0, 548.0, 916.0, 1572.0, 3210.0, 7417.0, 19190.0, 66203.0, 297208.0, 472643.0, 125747.0, 32002.0, 11133.0, 4562.0, 2022.0, 1099.0, 677.0, 408.0, 276.0, 198.0, 121.0, 86.0, 60.0, 44.0, 31.0, 17.0, 24.0, 18.0, 10.0, 7.0, 7.0, 6.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.76531982421875, -4.6126708984375, -4.46002197265625, -4.307373046875, -4.15472412109375, -4.0020751953125, -3.84942626953125, -3.69677734375, -3.54412841796875, -3.3914794921875, -3.23883056640625, -3.086181640625, -2.93353271484375, -2.7808837890625, -2.62823486328125, -2.4755859375, -2.32293701171875, -2.1702880859375, -2.01763916015625, -1.864990234375, -1.71234130859375, -1.5596923828125, -1.40704345703125, -1.25439453125, -1.10174560546875, -0.9490966796875, -0.79644775390625, -0.643798828125, -0.49114990234375, -0.3385009765625, -0.18585205078125, -0.033203125, 0.11944580078125, 0.2720947265625, 0.42474365234375, 0.577392578125, 0.73004150390625, 0.8826904296875, 1.03533935546875, 1.18798828125, 1.34063720703125, 1.4932861328125, 1.64593505859375, 1.798583984375, 1.95123291015625, 2.1038818359375, 2.25653076171875, 2.4091796875, 2.56182861328125, 2.7144775390625, 2.86712646484375, 3.019775390625, 3.17242431640625, 3.3250732421875, 3.47772216796875, 3.63037109375, 3.78302001953125, 3.9356689453125, 4.08831787109375, 4.240966796875, 4.39361572265625, 4.5462646484375, 4.69891357421875, 4.8515625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 4.0, 12.0, 7.0, 15.0, 19.0, 20.0, 20.0, 28.0, 26.0, 34.0, 44.0, 51.0, 60.0, 84.0, 147.0, 1750.0, 255.0, 78.0, 57.0, 50.0, 53.0, 43.0, 28.0, 29.0, 23.0, 23.0, 23.0, 19.0, 13.0, 9.0, 10.0, 12.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.28125, -18.72509765625, -18.1689453125, -17.61279296875, -17.056640625, -16.50048828125, -15.9443359375, -15.38818359375, -14.83203125, -14.27587890625, -13.7197265625, -13.16357421875, -12.607421875, -12.05126953125, -11.4951171875, -10.93896484375, -10.3828125, -9.82666015625, -9.2705078125, -8.71435546875, -8.158203125, -7.60205078125, -7.0458984375, -6.48974609375, -5.93359375, -5.37744140625, -4.8212890625, -4.26513671875, -3.708984375, -3.15283203125, -2.5966796875, -2.04052734375, -1.484375, -0.92822265625, -0.3720703125, 0.18408203125, 0.740234375, 1.29638671875, 1.8525390625, 2.40869140625, 2.96484375, 3.52099609375, 4.0771484375, 4.63330078125, 5.189453125, 5.74560546875, 6.3017578125, 6.85791015625, 7.4140625, 7.97021484375, 8.5263671875, 9.08251953125, 9.638671875, 10.19482421875, 10.7509765625, 11.30712890625, 11.86328125, 12.41943359375, 12.9755859375, 13.53173828125, 14.087890625, 14.64404296875, 15.2001953125, 15.75634765625, 16.3125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 11.0, 10.0, 15.0, 12.0, 18.0, 30.0, 20.0, 38.0, 32.0, 63.0, 84.0, 112.0, 216.0, 508.0, 1619.0, 19757.0, 3011601.0, 106662.0, 3446.0, 680.0, 278.0, 144.0, 79.0, 68.0, 38.0, 34.0, 14.0, 30.0, 17.0, 17.0, 11.0, 12.0, 8.0, 4.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.984375, -22.154296875, -21.32421875, -20.494140625, -19.6640625, -18.833984375, -18.00390625, -17.173828125, -16.34375, -15.513671875, -14.68359375, -13.853515625, -13.0234375, -12.193359375, -11.36328125, -10.533203125, -9.703125, -8.873046875, -8.04296875, -7.212890625, -6.3828125, -5.552734375, -4.72265625, -3.892578125, -3.0625, -2.232421875, -1.40234375, -0.572265625, 0.2578125, 1.087890625, 1.91796875, 2.748046875, 3.578125, 4.408203125, 5.23828125, 6.068359375, 6.8984375, 7.728515625, 8.55859375, 9.388671875, 10.21875, 11.048828125, 11.87890625, 12.708984375, 13.5390625, 14.369140625, 15.19921875, 16.029296875, 16.859375, 17.689453125, 18.51953125, 19.349609375, 20.1796875, 21.009765625, 21.83984375, 22.669921875, 23.5, 24.330078125, 25.16015625, 25.990234375, 26.8203125, 27.650390625, 28.48046875, 29.310546875, 30.140625]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 39.0, 667.0, 306.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.59774780273438, -166.70021057128906, -162.8026580810547, -158.90512084960938, -155.007568359375, -151.1100311279297, -147.21249389648438, -143.31494140625, -139.4174041748047, -135.51986694335938, -131.622314453125, -127.72477722167969, -123.82723236083984, -119.9296875, -116.03215026855469, -112.13460540771484, -108.237060546875, -104.33951568603516, -100.44197082519531, -96.54443359375, -92.64688873291016, -88.74934387207031, -84.851806640625, -80.95426177978516, -77.05671691894531, -73.15917205810547, -69.26162719726562, -65.36408996582031, -61.46654510498047, -57.569000244140625, -53.67145919799805, -49.77391815185547, -45.876365661621094, -41.97882080078125, -38.08127975463867, -34.183738708496094, -30.28619384765625, -26.38865089416504, -22.491107940673828, -18.593564987182617, -14.696022033691406, -10.798479080200195, -6.900936126708984, -3.0033931732177734, 0.8941497802734375, 4.791692733764648, 8.68923568725586, 12.58677864074707, 16.48432159423828, 20.381864547729492, 24.279407501220703, 28.176950454711914, 32.074493408203125, 35.97203826904297, 39.86957931518555, 43.767120361328125, 47.66466522216797, 51.56221008300781, 55.45975112915039, 59.35729217529297, 63.25483703613281, 67.15238189697266, 71.0499267578125, 74.94746398925781, 78.84500885009766]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 8.0, 5.0, 11.0, 18.0, 14.0, 14.0, 27.0, 21.0, 16.0, 33.0, 30.0, 42.0, 40.0, 35.0, 27.0, 43.0, 50.0, 49.0, 45.0, 41.0, 40.0, 44.0, 41.0, 36.0, 32.0, 19.0, 34.0, 18.0, 31.0, 18.0, 18.0, 16.0, 12.0, 11.0, 10.0, 8.0, 6.0, 7.0, 10.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.91804504394531, -43.481300354003906, -42.0445556640625, -40.607810974121094, -39.17106628417969, -37.73432159423828, -36.297576904296875, -34.8608283996582, -33.4240837097168, -31.98733901977539, -30.550594329833984, -29.113849639892578, -27.67710304260254, -26.240358352661133, -24.803613662719727, -23.366867065429688, -21.930124282836914, -20.493379592895508, -19.0566349029541, -17.619888305664062, -16.183143615722656, -14.74639892578125, -13.309654235839844, -11.872908592224121, -10.436163902282715, -8.999419212341309, -7.562673568725586, -6.12592887878418, -4.689183712005615, -3.252438545227051, -1.8156938552856445, -0.3789482116699219, 1.0577964782714844, 2.494541645050049, 3.931286573410034, 5.3680315017700195, 6.804776668548584, 8.241521835327148, 9.678266525268555, 11.115012168884277, 12.551756858825684, 13.98850154876709, 15.425247192382812, 16.86199188232422, 18.298736572265625, 19.73548126220703, 21.172225952148438, 22.608972549438477, 24.045717239379883, 25.48246192932129, 26.919206619262695, 28.355953216552734, 29.79269790649414, 31.229442596435547, 32.66618728637695, 34.10293197631836, 35.539676666259766, 36.97642135620117, 38.41316604614258, 39.849910736083984, 41.28665542602539, 42.72340393066406, 44.16014862060547, 45.596893310546875, 47.03363800048828]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 8.0, 12.0, 9.0, 10.0, 23.0, 19.0, 14.0, 33.0, 26.0, 20.0, 34.0, 38.0, 52.0, 31.0, 55.0, 44.0, 51.0, 54.0, 50.0, 39.0, 44.0, 37.0, 34.0, 46.0, 32.0, 26.0, 25.0, 17.0, 23.0, 18.0, 6.0, 16.0, 7.0, 11.0, 6.0, 4.0, 6.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.34765625, -4.2071533203125, -4.066650390625, -3.9261474609375, -3.78564453125, -3.6451416015625, -3.504638671875, -3.3641357421875, -3.2236328125, -3.0831298828125, -2.942626953125, -2.8021240234375, -2.66162109375, -2.5211181640625, -2.380615234375, -2.2401123046875, -2.099609375, -1.9591064453125, -1.818603515625, -1.6781005859375, -1.53759765625, -1.3970947265625, -1.256591796875, -1.1160888671875, -0.9755859375, -0.8350830078125, -0.694580078125, -0.5540771484375, -0.41357421875, -0.2730712890625, -0.132568359375, 0.0079345703125, 0.1484375, 0.2889404296875, 0.429443359375, 0.5699462890625, 0.71044921875, 0.8509521484375, 0.991455078125, 1.1319580078125, 1.2724609375, 1.4129638671875, 1.553466796875, 1.6939697265625, 1.83447265625, 1.9749755859375, 2.115478515625, 2.2559814453125, 2.396484375, 2.5369873046875, 2.677490234375, 2.8179931640625, 2.95849609375, 3.0989990234375, 3.239501953125, 3.3800048828125, 3.5205078125, 3.6610107421875, 3.801513671875, 3.9420166015625, 4.08251953125, 4.2230224609375, 4.363525390625, 4.5040283203125, 4.64453125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 3.0, 9.0, 11.0, 13.0, 13.0, 20.0, 11.0, 16.0, 26.0, 53.0, 64.0, 116.0, 157.0, 360.0, 816.0, 2204.0, 7053.0, 28023.0, 150380.0, 940200.0, 2169895.0, 746740.0, 116278.0, 22547.0, 5909.0, 1868.0, 735.0, 292.0, 140.0, 78.0, 49.0, 37.0, 39.0, 23.0, 24.0, 19.0, 9.0, 4.0, 9.0, 6.0, 9.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.9765625, -7.7227783203125, -7.468994140625, -7.2152099609375, -6.96142578125, -6.7076416015625, -6.453857421875, -6.2000732421875, -5.9462890625, -5.6925048828125, -5.438720703125, -5.1849365234375, -4.93115234375, -4.6773681640625, -4.423583984375, -4.1697998046875, -3.916015625, -3.6622314453125, -3.408447265625, -3.1546630859375, -2.90087890625, -2.6470947265625, -2.393310546875, -2.1395263671875, -1.8857421875, -1.6319580078125, -1.378173828125, -1.1243896484375, -0.87060546875, -0.6168212890625, -0.363037109375, -0.1092529296875, 0.14453125, 0.3983154296875, 0.652099609375, 0.9058837890625, 1.15966796875, 1.4134521484375, 1.667236328125, 1.9210205078125, 2.1748046875, 2.4285888671875, 2.682373046875, 2.9361572265625, 3.18994140625, 3.4437255859375, 3.697509765625, 3.9512939453125, 4.205078125, 4.4588623046875, 4.712646484375, 4.9664306640625, 5.22021484375, 5.4739990234375, 5.727783203125, 5.9815673828125, 6.2353515625, 6.4891357421875, 6.742919921875, 6.9967041015625, 7.25048828125, 7.5042724609375, 7.758056640625, 8.0118408203125, 8.265625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 8.0, 15.0, 13.0, 20.0, 51.0, 65.0, 120.0, 165.0, 266.0, 356.0, 526.0, 593.0, 567.0, 410.0, 336.0, 187.0, 144.0, 84.0, 59.0, 37.0, 15.0, 18.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.234375, -13.756103515625, -13.27783203125, -12.799560546875, -12.3212890625, -11.843017578125, -11.36474609375, -10.886474609375, -10.408203125, -9.929931640625, -9.45166015625, -8.973388671875, -8.4951171875, -8.016845703125, -7.53857421875, -7.060302734375, -6.58203125, -6.103759765625, -5.62548828125, -5.147216796875, -4.6689453125, -4.190673828125, -3.71240234375, -3.234130859375, -2.755859375, -2.277587890625, -1.79931640625, -1.321044921875, -0.8427734375, -0.364501953125, 0.11376953125, 0.592041015625, 1.0703125, 1.548583984375, 2.02685546875, 2.505126953125, 2.9833984375, 3.461669921875, 3.93994140625, 4.418212890625, 4.896484375, 5.374755859375, 5.85302734375, 6.331298828125, 6.8095703125, 7.287841796875, 7.76611328125, 8.244384765625, 8.72265625, 9.200927734375, 9.67919921875, 10.157470703125, 10.6357421875, 11.114013671875, 11.59228515625, 12.070556640625, 12.548828125, 13.027099609375, 13.50537109375, 13.983642578125, 14.4619140625, 14.940185546875, 15.41845703125, 15.896728515625, 16.375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 8.0, 10.0, 21.0, 26.0, 40.0, 59.0, 120.0, 212.0, 487.0, 2019.0, 72222.0, 3976119.0, 139182.0, 2608.0, 576.0, 259.0, 110.0, 72.0, 57.0, 25.0, 12.0, 19.0, 8.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.625, -52.158203125, -50.69140625, -49.224609375, -47.7578125, -46.291015625, -44.82421875, -43.357421875, -41.890625, -40.423828125, -38.95703125, -37.490234375, -36.0234375, -34.556640625, -33.08984375, -31.623046875, -30.15625, -28.689453125, -27.22265625, -25.755859375, -24.2890625, -22.822265625, -21.35546875, -19.888671875, -18.421875, -16.955078125, -15.48828125, -14.021484375, -12.5546875, -11.087890625, -9.62109375, -8.154296875, -6.6875, -5.220703125, -3.75390625, -2.287109375, -0.8203125, 0.646484375, 2.11328125, 3.580078125, 5.046875, 6.513671875, 7.98046875, 9.447265625, 10.9140625, 12.380859375, 13.84765625, 15.314453125, 16.78125, 18.248046875, 19.71484375, 21.181640625, 22.6484375, 24.115234375, 25.58203125, 27.048828125, 28.515625, 29.982421875, 31.44921875, 32.916015625, 34.3828125, 35.849609375, 37.31640625, 38.783203125, 40.25]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 25.0, 136.0, 276.0, 333.0, 190.0, 47.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.8176727294922, -194.96788024902344, -190.11810302734375, -185.268310546875, -180.4185333251953, -175.56874084472656, -170.71896362304688, -165.86917114257812, -161.01937866210938, -156.16958618164062, -151.31980895996094, -146.4700164794922, -141.6202392578125, -136.77044677734375, -131.92066955566406, -127.07087707519531, -122.22109985351562, -117.3713150024414, -112.52153015136719, -107.67174530029297, -102.82196044921875, -97.97216796875, -93.12238311767578, -88.27259826660156, -83.42281341552734, -78.57302856445312, -73.7232437133789, -68.87345886230469, -64.02366638183594, -59.173885345458984, -54.3240966796875, -49.47431182861328, -44.62451934814453, -39.77473449707031, -34.924949645996094, -30.07516098022461, -25.22537612915039, -20.375591278076172, -15.52580451965332, -10.676017761230469, -5.82623291015625, -0.9764471054077148, 3.8733386993408203, 8.723124504089355, 13.57291030883789, 18.42269515991211, 23.27248191833496, 28.122268676757812, 32.97205352783203, 37.82183837890625, 42.67162322998047, 47.52141189575195, 52.37119674682617, 57.22098159790039, 62.070770263671875, 66.9205551147461, 71.77033996582031, 76.62012481689453, 81.46990966796875, 86.31969451904297, 91.16947937011719, 96.01927185058594, 100.86905670166016, 105.71884155273438, 110.5686264038086]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 1.0, 5.0, 6.0, 6.0, 14.0, 12.0, 12.0, 19.0, 17.0, 21.0, 19.0, 31.0, 36.0, 30.0, 48.0, 31.0, 34.0, 39.0, 50.0, 50.0, 41.0, 47.0, 42.0, 37.0, 27.0, 45.0, 34.0, 42.0, 33.0, 23.0, 25.0, 24.0, 13.0, 16.0, 11.0, 11.0, 13.0, 7.0, 7.0, 7.0, 3.0, 1.0, 5.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.596866607666016, -37.36635208129883, -36.13583755493164, -34.90532302856445, -33.6748046875, -32.44429016113281, -31.213775634765625, -29.983261108398438, -28.75274658203125, -27.522232055664062, -26.291717529296875, -25.061201095581055, -23.830686569213867, -22.60017204284668, -21.36965560913086, -20.139141082763672, -18.908626556396484, -17.678112030029297, -16.44759750366211, -15.217081069946289, -13.986566543579102, -12.756052017211914, -11.52553653717041, -10.295021057128906, -9.064506530761719, -7.833991527557373, -6.603476524353027, -5.372961521148682, -4.142446517944336, -2.9119315147399902, -1.6814165115356445, -0.4509010314941406, 0.7796134948730469, 2.0101284980773926, 3.2406435012817383, 4.471158504486084, 5.70167350769043, 6.932188510894775, 8.162703514099121, 9.393218994140625, 10.623733520507812, 11.854248046875, 13.084763526916504, 14.315279006958008, 15.545793533325195, 16.776308059692383, 18.006824493408203, 19.23733901977539, 20.467853546142578, 21.698368072509766, 22.928882598876953, 24.159399032592773, 25.38991355895996, 26.62042808532715, 27.85094451904297, 29.081459045410156, 30.311973571777344, 31.54248809814453, 32.77300262451172, 34.003517150878906, 35.234031677246094, 36.46455001831055, 37.695064544677734, 38.92557907104492, 40.15609359741211]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 15.0, 11.0, 11.0, 12.0, 13.0, 19.0, 22.0, 31.0, 30.0, 27.0, 41.0, 31.0, 36.0, 48.0, 44.0, 56.0, 40.0, 43.0, 49.0, 48.0, 45.0, 36.0, 29.0, 40.0, 35.0, 21.0, 30.0, 20.0, 15.0, 16.0, 20.0, 9.0, 8.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.3885498046875, -4.249755859375, -4.1109619140625, -3.97216796875, -3.8333740234375, -3.694580078125, -3.5557861328125, -3.4169921875, -3.2781982421875, -3.139404296875, -3.0006103515625, -2.86181640625, -2.7230224609375, -2.584228515625, -2.4454345703125, -2.306640625, -2.1678466796875, -2.029052734375, -1.8902587890625, -1.75146484375, -1.6126708984375, -1.473876953125, -1.3350830078125, -1.1962890625, -1.0574951171875, -0.918701171875, -0.7799072265625, -0.64111328125, -0.5023193359375, -0.363525390625, -0.2247314453125, -0.0859375, 0.0528564453125, 0.191650390625, 0.3304443359375, 0.46923828125, 0.6080322265625, 0.746826171875, 0.8856201171875, 1.0244140625, 1.1632080078125, 1.302001953125, 1.4407958984375, 1.57958984375, 1.7183837890625, 1.857177734375, 1.9959716796875, 2.134765625, 2.2735595703125, 2.412353515625, 2.5511474609375, 2.68994140625, 2.8287353515625, 2.967529296875, 3.1063232421875, 3.2451171875, 3.3839111328125, 3.522705078125, 3.6614990234375, 3.80029296875, 3.9390869140625, 4.077880859375, 4.2166748046875, 4.35546875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 11.0, 15.0, 17.0, 25.0, 31.0, 55.0, 77.0, 101.0, 172.0, 222.0, 357.0, 449.0, 682.0, 966.0, 1342.0, 1944.0, 2771.0, 3979.0, 5896.0, 8884.0, 13148.0, 20479.0, 31892.0, 50750.0, 83655.0, 152756.0, 261514.0, 165777.0, 89258.0, 53420.0, 33345.0, 21375.0, 13971.0, 9249.0, 6161.0, 4180.0, 2898.0, 2069.0, 1461.0, 961.0, 674.0, 466.0, 344.0, 248.0, 153.0, 117.0, 75.0, 57.0, 35.0, 19.0, 24.0, 13.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0], "bins": [-0.68603515625, -0.6649627685546875, -0.643890380859375, -0.6228179931640625, -0.60174560546875, -0.5806732177734375, -0.559600830078125, -0.5385284423828125, -0.5174560546875, -0.4963836669921875, -0.475311279296875, -0.4542388916015625, -0.43316650390625, -0.4120941162109375, -0.391021728515625, -0.3699493408203125, -0.348876953125, -0.3278045654296875, -0.306732177734375, -0.2856597900390625, -0.26458740234375, -0.2435150146484375, -0.222442626953125, -0.2013702392578125, -0.1802978515625, -0.1592254638671875, -0.138153076171875, -0.1170806884765625, -0.09600830078125, -0.0749359130859375, -0.053863525390625, -0.0327911376953125, -0.01171875, 0.0093536376953125, 0.030426025390625, 0.0514984130859375, 0.07257080078125, 0.0936431884765625, 0.114715576171875, 0.1357879638671875, 0.1568603515625, 0.1779327392578125, 0.199005126953125, 0.2200775146484375, 0.24114990234375, 0.2622222900390625, 0.283294677734375, 0.3043670654296875, 0.325439453125, 0.3465118408203125, 0.367584228515625, 0.3886566162109375, 0.40972900390625, 0.4308013916015625, 0.451873779296875, 0.4729461669921875, 0.4940185546875, 0.5150909423828125, 0.536163330078125, 0.5572357177734375, 0.57830810546875, 0.5993804931640625, 0.620452880859375, 0.6415252685546875, 0.66259765625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 6.0, 1.0, 4.0, 7.0, 5.0, 4.0, 12.0, 12.0, 5.0, 12.0, 8.0, 22.0, 15.0, 17.0, 29.0, 20.0, 34.0, 33.0, 41.0, 34.0, 36.0, 42.0, 36.0, 36.0, 36.0, 1055.0, 43.0, 35.0, 32.0, 41.0, 38.0, 28.0, 33.0, 26.0, 29.0, 21.0, 10.0, 23.0, 12.0, 18.0, 19.0, 4.0, 9.0, 11.0, 12.0, 4.0, 7.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0], "bins": [-2.4140625, -2.34368896484375, -2.2733154296875, -2.20294189453125, -2.132568359375, -2.06219482421875, -1.9918212890625, -1.92144775390625, -1.85107421875, -1.78070068359375, -1.7103271484375, -1.63995361328125, -1.569580078125, -1.49920654296875, -1.4288330078125, -1.35845947265625, -1.2880859375, -1.21771240234375, -1.1473388671875, -1.07696533203125, -1.006591796875, -0.93621826171875, -0.8658447265625, -0.79547119140625, -0.72509765625, -0.65472412109375, -0.5843505859375, -0.51397705078125, -0.443603515625, -0.37322998046875, -0.3028564453125, -0.23248291015625, -0.162109375, -0.09173583984375, -0.0213623046875, 0.04901123046875, 0.119384765625, 0.18975830078125, 0.2601318359375, 0.33050537109375, 0.40087890625, 0.47125244140625, 0.5416259765625, 0.61199951171875, 0.682373046875, 0.75274658203125, 0.8231201171875, 0.89349365234375, 0.9638671875, 1.03424072265625, 1.1046142578125, 1.17498779296875, 1.245361328125, 1.31573486328125, 1.3861083984375, 1.45648193359375, 1.52685546875, 1.59722900390625, 1.6676025390625, 1.73797607421875, 1.808349609375, 1.87872314453125, 1.9490966796875, 2.01947021484375, 2.08984375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 4.0, 8.0, 11.0, 15.0, 23.0, 42.0, 61.0, 76.0, 108.0, 135.0, 197.0, 312.0, 408.0, 627.0, 907.0, 1315.0, 2076.0, 3131.0, 4688.0, 7144.0, 11218.0, 17549.0, 27913.0, 47361.0, 84362.0, 159364.0, 1323471.0, 177516.0, 92408.0, 51186.0, 29930.0, 18976.0, 11729.0, 7625.0, 5211.0, 3297.0, 2192.0, 1418.0, 970.0, 673.0, 447.0, 333.0, 230.0, 154.0, 101.0, 74.0, 49.0, 25.0, 28.0, 7.0, 15.0, 5.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.61767578125, -0.5967941284179688, -0.5759124755859375, -0.5550308227539062, -0.534149169921875, -0.5132675170898438, -0.4923858642578125, -0.47150421142578125, -0.45062255859375, -0.42974090576171875, -0.4088592529296875, -0.38797760009765625, -0.367095947265625, -0.34621429443359375, -0.3253326416015625, -0.30445098876953125, -0.2835693359375, -0.26268768310546875, -0.2418060302734375, -0.22092437744140625, -0.200042724609375, -0.17916107177734375, -0.1582794189453125, -0.13739776611328125, -0.11651611328125, -0.09563446044921875, -0.0747528076171875, -0.05387115478515625, -0.032989501953125, -0.01210784912109375, 0.0087738037109375, 0.02965545654296875, 0.050537109375, 0.07141876220703125, 0.0923004150390625, 0.11318206787109375, 0.134063720703125, 0.15494537353515625, 0.1758270263671875, 0.19670867919921875, 0.21759033203125, 0.23847198486328125, 0.2593536376953125, 0.28023529052734375, 0.301116943359375, 0.32199859619140625, 0.3428802490234375, 0.36376190185546875, 0.3846435546875, 0.40552520751953125, 0.4264068603515625, 0.44728851318359375, 0.468170166015625, 0.48905181884765625, 0.5099334716796875, 0.5308151245117188, 0.55169677734375, 0.5725784301757812, 0.5934600830078125, 0.6143417358398438, 0.635223388671875, 0.6561050415039062, 0.6769866943359375, 0.6978683471679688, 0.71875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 7.0, 4.0, 11.0, 18.0, 18.0, 18.0, 29.0, 22.0, 36.0, 26.0, 38.0, 38.0, 51.0, 54.0, 70.0, 57.0, 59.0, 57.0, 62.0, 61.0, 50.0, 33.0, 32.0, 25.0, 20.0, 15.0, 19.0, 11.0, 12.0, 10.0, 7.0, 4.0, 5.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0], "bins": [-0.0009784698486328125, -0.0009520649909973145, -0.0009256601333618164, -0.0008992552757263184, -0.0008728504180908203, -0.0008464455604553223, -0.0008200407028198242, -0.0007936358451843262, -0.0007672309875488281, -0.0007408261299133301, -0.000714421272277832, -0.000688016414642334, -0.0006616115570068359, -0.0006352066993713379, -0.0006088018417358398, -0.0005823969841003418, -0.0005559921264648438, -0.0005295872688293457, -0.0005031824111938477, -0.0004767775535583496, -0.00045037269592285156, -0.0004239678382873535, -0.00039756298065185547, -0.0003711581230163574, -0.0003447532653808594, -0.00031834840774536133, -0.0002919435501098633, -0.00026553869247436523, -0.0002391338348388672, -0.00021272897720336914, -0.0001863241195678711, -0.00015991926193237305, -0.000133514404296875, -0.00010710954666137695, -8.07046890258789e-05, -5.429983139038086e-05, -2.7894973754882812e-05, -1.4901161193847656e-06, 2.491474151611328e-05, 5.131959915161133e-05, 7.772445678710938e-05, 0.00010412931442260742, 0.00013053417205810547, 0.00015693902969360352, 0.00018334388732910156, 0.0002097487449645996, 0.00023615360260009766, 0.0002625584602355957, 0.00028896331787109375, 0.0003153681755065918, 0.00034177303314208984, 0.0003681778907775879, 0.00039458274841308594, 0.000420987606048584, 0.00044739246368408203, 0.0004737973213195801, 0.0005002021789550781, 0.0005266070365905762, 0.0005530118942260742, 0.0005794167518615723, 0.0006058216094970703, 0.0006322264671325684, 0.0006586313247680664, 0.0006850361824035645, 0.0007114410400390625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 9.0, 8.0, 5.0, 13.0, 12.0, 15.0, 20.0, 30.0, 40.0, 50.0, 67.0, 98.0, 155.0, 210.0, 339.0, 585.0, 6858.0, 1023200.0, 15065.0, 699.0, 337.0, 207.0, 124.0, 95.0, 78.0, 42.0, 45.0, 30.0, 29.0, 18.0, 21.0, 16.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.015625, -0.015096426010131836, -0.014567852020263672, -0.014039278030395508, -0.013510704040527344, -0.01298213005065918, -0.012453556060791016, -0.011924982070922852, -0.011396408081054688, -0.010867834091186523, -0.01033926010131836, -0.009810686111450195, -0.009282112121582031, -0.008753538131713867, -0.008224964141845703, -0.007696390151977539, -0.007167816162109375, -0.006639242172241211, -0.006110668182373047, -0.005582094192504883, -0.005053520202636719, -0.004524946212768555, -0.003996372222900391, -0.0034677982330322266, -0.0029392242431640625, -0.0024106502532958984, -0.0018820762634277344, -0.0013535022735595703, -0.0008249282836914062, -0.0002963542938232422, 0.00023221969604492188, 0.0007607936859130859, 0.00128936767578125, 0.001817941665649414, 0.002346515655517578, 0.002875089645385742, 0.0034036636352539062, 0.00393223762512207, 0.004460811614990234, 0.0049893856048583984, 0.0055179595947265625, 0.0060465335845947266, 0.006575107574462891, 0.007103681564331055, 0.007632255554199219, 0.008160829544067383, 0.008689403533935547, 0.009217977523803711, 0.009746551513671875, 0.010275125503540039, 0.010803699493408203, 0.011332273483276367, 0.011860847473144531, 0.012389421463012695, 0.01291799545288086, 0.013446569442749023, 0.013975143432617188, 0.014503717422485352, 0.015032291412353516, 0.01556086540222168, 0.016089439392089844, 0.016618013381958008, 0.017146587371826172, 0.017675161361694336, 0.0182037353515625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 46.0, 427.0, 464.0, 72.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004102547187358141, -0.004011508077383041, -0.003920468967407942, -0.0038294296246021986, -0.003738390514627099, -0.0036473514046519995, -0.0035563122946769, -0.0034652729518711567, -0.003374233841896057, -0.0032831947319209576, -0.003192155621945858, -0.003101116279140115, -0.0030100771691650152, -0.0029190380591899157, -0.002827998949214816, -0.002736959606409073, -0.0026459204964339733, -0.0025548813864588737, -0.002463842276483774, -0.002372802933678031, -0.0022817638237029314, -0.002190724713727832, -0.0020996856037527323, -0.002008646260946989, -0.0019176073838025331, -0.0018265682738274336, -0.0017355290474370122, -0.0016444899374619126, -0.0015534507110714912, -0.0014624116010963917, -0.0013713724911212921, -0.0012803332647308707, -0.0011892941547557712, -0.0010982550447806716, -0.0010072158183902502, -0.0009161767084151506, -0.0008251374820247293, -0.0007340983720496297, -0.0006430592038668692, -0.0005520200356841087, -0.00046098086750134826, -0.0003699416993185878, -0.0002789025311358273, -0.00018786339205689728, -9.68242238741368e-05, -5.7850556913763285e-06, 8.525408338755369e-05, 0.00017629325157031417, 0.00026733241975307465, 0.0003583715879358351, 0.0004494107561185956, 0.0005404498660936952, 0.0006314890924841166, 0.0007225282024592161, 0.0008135673706419766, 0.0009046065388247371, 0.0009956457652151585, 0.001086684875190258, 0.0011777241015806794, 0.001268763211555779, 0.0013598024379462004, 0.0014508415479213, 0.0015418806578963995, 0.0016329198842868209, 0.0017239589942619205]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 7.0, 7.0, 5.0, 8.0, 12.0, 12.0, 17.0, 14.0, 16.0, 21.0, 23.0, 19.0, 24.0, 24.0, 29.0, 30.0, 28.0, 33.0, 34.0, 43.0, 34.0, 41.0, 42.0, 38.0, 43.0, 35.0, 34.0, 26.0, 31.0, 35.0, 25.0, 21.0, 20.0, 34.0, 18.0, 14.0, 16.0, 15.0, 10.0, 11.0, 8.0, 11.0, 7.0, 8.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0], "bins": [-0.00044333934783935547, -0.0004308093339204788, -0.00041827932000160217, -0.0004057493060827255, -0.0003932192921638489, -0.00038068927824497223, -0.0003681592643260956, -0.00035562925040721893, -0.0003430992364883423, -0.00033056922256946564, -0.000318039208650589, -0.00030550919473171234, -0.0002929791808128357, -0.00028044916689395905, -0.0002679191529750824, -0.00025538913905620575, -0.0002428591251373291, -0.00023032911121845245, -0.0002177990972995758, -0.00020526908338069916, -0.0001927390694618225, -0.00018020905554294586, -0.00016767904162406921, -0.00015514902770519257, -0.00014261901378631592, -0.00013008899986743927, -0.00011755898594856262, -0.00010502897202968597, -9.249895811080933e-05, -7.996894419193268e-05, -6.743893027305603e-05, -5.490891635417938e-05, -4.2378902435302734e-05, -2.9848888516426086e-05, -1.731887459754944e-05, -4.7888606786727905e-06, 7.741153240203857e-06, 2.0271167159080505e-05, 3.280118107795715e-05, 4.53311949968338e-05, 5.786120891571045e-05, 7.03912228345871e-05, 8.292123675346375e-05, 9.545125067234039e-05, 0.00010798126459121704, 0.00012051127851009369, 0.00013304129242897034, 0.00014557130634784698, 0.00015810132026672363, 0.00017063133418560028, 0.00018316134810447693, 0.00019569136202335358, 0.00020822137594223022, 0.00022075138986110687, 0.00023328140377998352, 0.00024581141769886017, 0.0002583414316177368, 0.00027087144553661346, 0.0002834014594554901, 0.00029593147337436676, 0.0003084614872932434, 0.00032099150121212006, 0.0003335215151309967, 0.00034605152904987335, 0.00035858154296875]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 6.0, 7.0, 11.0, 15.0, 11.0, 11.0, 12.0, 13.0, 19.0, 22.0, 31.0, 30.0, 27.0, 41.0, 31.0, 36.0, 48.0, 44.0, 56.0, 40.0, 43.0, 49.0, 48.0, 45.0, 36.0, 29.0, 40.0, 35.0, 21.0, 30.0, 20.0, 15.0, 16.0, 20.0, 9.0, 8.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.52734375, -4.3885498046875, -4.249755859375, -4.1109619140625, -3.97216796875, -3.8333740234375, -3.694580078125, -3.5557861328125, -3.4169921875, -3.2781982421875, -3.139404296875, -3.0006103515625, -2.86181640625, -2.7230224609375, -2.584228515625, -2.4454345703125, -2.306640625, -2.1678466796875, -2.029052734375, -1.8902587890625, -1.75146484375, -1.6126708984375, -1.473876953125, -1.3350830078125, -1.1962890625, -1.0574951171875, -0.918701171875, -0.7799072265625, -0.64111328125, -0.5023193359375, -0.363525390625, -0.2247314453125, -0.0859375, 0.0528564453125, 0.191650390625, 0.3304443359375, 0.46923828125, 0.6080322265625, 0.746826171875, 0.8856201171875, 1.0244140625, 1.1632080078125, 1.302001953125, 1.4407958984375, 1.57958984375, 1.7183837890625, 1.857177734375, 1.9959716796875, 2.134765625, 2.2735595703125, 2.412353515625, 2.5511474609375, 2.68994140625, 2.8287353515625, 2.967529296875, 3.1063232421875, 3.2451171875, 3.3839111328125, 3.522705078125, 3.6614990234375, 3.80029296875, 3.9390869140625, 4.077880859375, 4.2166748046875, 4.35546875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 13.0, 18.0, 17.0, 38.0, 50.0, 56.0, 87.0, 145.0, 228.0, 408.0, 713.0, 1306.0, 2415.0, 4483.0, 8833.0, 18108.0, 40124.0, 92758.0, 200576.0, 292924.0, 207771.0, 97064.0, 42126.0, 18870.0, 9072.0, 4581.0, 2476.0, 1363.0, 769.0, 439.0, 256.0, 149.0, 91.0, 65.0, 53.0, 38.0, 20.0, 14.0, 8.0, 9.0, 4.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.74114990234375, -2.6483154296875, -2.55548095703125, -2.462646484375, -2.36981201171875, -2.2769775390625, -2.18414306640625, -2.09130859375, -1.99847412109375, -1.9056396484375, -1.81280517578125, -1.719970703125, -1.62713623046875, -1.5343017578125, -1.44146728515625, -1.3486328125, -1.25579833984375, -1.1629638671875, -1.07012939453125, -0.977294921875, -0.88446044921875, -0.7916259765625, -0.69879150390625, -0.60595703125, -0.51312255859375, -0.4202880859375, -0.32745361328125, -0.234619140625, -0.14178466796875, -0.0489501953125, 0.04388427734375, 0.13671875, 0.22955322265625, 0.3223876953125, 0.41522216796875, 0.508056640625, 0.60089111328125, 0.6937255859375, 0.78656005859375, 0.87939453125, 0.97222900390625, 1.0650634765625, 1.15789794921875, 1.250732421875, 1.34356689453125, 1.4364013671875, 1.52923583984375, 1.6220703125, 1.71490478515625, 1.8077392578125, 1.90057373046875, 1.993408203125, 2.08624267578125, 2.1790771484375, 2.27191162109375, 2.36474609375, 2.45758056640625, 2.5504150390625, 2.64324951171875, 2.736083984375, 2.82891845703125, 2.9217529296875, 3.01458740234375, 3.107421875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 4.0, 7.0, 5.0, 13.0, 12.0, 13.0, 12.0, 20.0, 15.0, 25.0, 24.0, 32.0, 26.0, 37.0, 26.0, 39.0, 47.0, 74.0, 162.0, 1556.0, 362.0, 109.0, 67.0, 39.0, 34.0, 31.0, 36.0, 21.0, 24.0, 21.0, 27.0, 22.0, 25.0, 17.0, 11.0, 11.0, 7.0, 7.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-16.84375, -16.3731689453125, -15.902587890625, -15.4320068359375, -14.96142578125, -14.4908447265625, -14.020263671875, -13.5496826171875, -13.0791015625, -12.6085205078125, -12.137939453125, -11.6673583984375, -11.19677734375, -10.7261962890625, -10.255615234375, -9.7850341796875, -9.314453125, -8.8438720703125, -8.373291015625, -7.9027099609375, -7.43212890625, -6.9615478515625, -6.490966796875, -6.0203857421875, -5.5498046875, -5.0792236328125, -4.608642578125, -4.1380615234375, -3.66748046875, -3.1968994140625, -2.726318359375, -2.2557373046875, -1.78515625, -1.3145751953125, -0.843994140625, -0.3734130859375, 0.09716796875, 0.5677490234375, 1.038330078125, 1.5089111328125, 1.9794921875, 2.4500732421875, 2.920654296875, 3.3912353515625, 3.86181640625, 4.3323974609375, 4.802978515625, 5.2735595703125, 5.744140625, 6.2147216796875, 6.685302734375, 7.1558837890625, 7.62646484375, 8.0970458984375, 8.567626953125, 9.0382080078125, 9.5087890625, 9.9793701171875, 10.449951171875, 10.9205322265625, 11.39111328125, 11.8616943359375, 12.332275390625, 12.8028564453125, 13.2734375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 5.0, 5.0, 8.0, 10.0, 6.0, 9.0, 18.0, 19.0, 29.0, 24.0, 28.0, 35.0, 45.0, 44.0, 66.0, 107.0, 164.0, 260.0, 550.0, 2204.0, 39632.0, 2971873.0, 125280.0, 3614.0, 674.0, 319.0, 172.0, 126.0, 87.0, 51.0, 46.0, 37.0, 26.0, 31.0, 20.0, 12.0, 6.0, 14.0, 15.0, 9.0, 5.0, 5.0, 6.0, 7.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.78125, -21.0458984375, -20.310546875, -19.5751953125, -18.83984375, -18.1044921875, -17.369140625, -16.6337890625, -15.8984375, -15.1630859375, -14.427734375, -13.6923828125, -12.95703125, -12.2216796875, -11.486328125, -10.7509765625, -10.015625, -9.2802734375, -8.544921875, -7.8095703125, -7.07421875, -6.3388671875, -5.603515625, -4.8681640625, -4.1328125, -3.3974609375, -2.662109375, -1.9267578125, -1.19140625, -0.4560546875, 0.279296875, 1.0146484375, 1.75, 2.4853515625, 3.220703125, 3.9560546875, 4.69140625, 5.4267578125, 6.162109375, 6.8974609375, 7.6328125, 8.3681640625, 9.103515625, 9.8388671875, 10.57421875, 11.3095703125, 12.044921875, 12.7802734375, 13.515625, 14.2509765625, 14.986328125, 15.7216796875, 16.45703125, 17.1923828125, 17.927734375, 18.6630859375, 19.3984375, 20.1337890625, 20.869140625, 21.6044921875, 22.33984375, 23.0751953125, 23.810546875, 24.5458984375, 25.28125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 6.0, 33.0, 75.0, 138.0, 183.0, 210.0, 185.0, 102.0, 52.0, 20.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6102876663208, -7.580400466918945, -6.55051326751709, -5.520625591278076, -4.490738391876221, -3.4608511924743652, -2.4309635162353516, -1.401076316833496, -0.3711891174316406, 0.6586982011795044, 1.6885855197906494, 2.718472957611084, 3.7483601570129395, 4.778247356414795, 5.808135032653809, 6.838022232055664, 7.8679094314575195, 8.897796630859375, 9.92768383026123, 10.957571029663086, 11.987459182739258, 13.017345428466797, 14.047233581542969, 15.077120780944824, 16.10700798034668, 17.13689613342285, 18.16678237915039, 19.196670532226562, 20.2265567779541, 21.256444931030273, 22.286331176757812, 23.316219329833984, 24.346107482910156, 25.375995635986328, 26.405881881713867, 27.43577003479004, 28.465656280517578, 29.49554443359375, 30.525432586669922, 31.55531883239746, 32.585205078125, 33.61509323120117, 34.644981384277344, 35.67486572265625, 36.70475387573242, 37.734642028808594, 38.764530181884766, 39.79441833496094, 40.824302673339844, 41.854190826416016, 42.88407897949219, 43.913963317871094, 44.943851470947266, 45.97373962402344, 47.00362777709961, 48.03351593017578, 49.06340408325195, 50.093292236328125, 51.1231803894043, 52.1530647277832, 53.182952880859375, 54.21284103393555, 55.24272918701172, 56.272613525390625, 57.3025016784668]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 7.0, 7.0, 8.0, 5.0, 11.0, 15.0, 18.0, 24.0, 26.0, 23.0, 30.0, 41.0, 36.0, 48.0, 44.0, 41.0, 41.0, 56.0, 43.0, 56.0, 49.0, 41.0, 48.0, 33.0, 35.0, 30.0, 26.0, 20.0, 22.0, 19.0, 19.0, 21.0, 15.0, 6.0, 13.0, 10.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.10160827636719, -49.47425842285156, -47.84690475463867, -46.21955490112305, -44.592201232910156, -42.96485137939453, -41.337501525878906, -39.71015167236328, -38.08279800415039, -36.455448150634766, -34.828094482421875, -33.20074462890625, -31.573392868041992, -29.946041107177734, -28.31869125366211, -26.69133949279785, -25.063987731933594, -23.436635971069336, -21.809284210205078, -20.181934356689453, -18.554582595825195, -16.927230834960938, -15.299880027770996, -13.672529220581055, -12.045177459716797, -10.417825698852539, -8.790474891662598, -7.163123607635498, -5.535772323608398, -3.9084205627441406, -2.281069755554199, -0.6537189483642578, 0.9736366271972656, 2.6009879112243652, 4.228339195251465, 5.8556904792785645, 7.483041763305664, 9.110393524169922, 10.737744331359863, 12.365095138549805, 13.992446899414062, 15.61979866027832, 17.247150421142578, 18.874500274658203, 20.50185203552246, 22.12920379638672, 23.756553649902344, 25.3839054107666, 27.01125717163086, 28.638608932495117, 30.265960693359375, 31.893310546875, 33.520660400390625, 35.148014068603516, 36.77536392211914, 38.40271759033203, 40.030067443847656, 41.65741729736328, 43.28477096557617, 44.9121208190918, 46.53947448730469, 48.16682434082031, 49.79417419433594, 51.42152404785156, 53.04887771606445]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 9.0, 10.0, 6.0, 8.0, 8.0, 10.0, 12.0, 17.0, 19.0, 12.0, 23.0, 25.0, 24.0, 33.0, 34.0, 32.0, 38.0, 45.0, 41.0, 42.0, 63.0, 33.0, 40.0, 37.0, 44.0, 43.0, 45.0, 36.0, 30.0, 32.0, 26.0, 14.0, 23.0, 23.0, 10.0, 11.0, 11.0, 7.0, 9.0, 9.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.46875, -4.3291015625, -4.189453125, -4.0498046875, -3.91015625, -3.7705078125, -3.630859375, -3.4912109375, -3.3515625, -3.2119140625, -3.072265625, -2.9326171875, -2.79296875, -2.6533203125, -2.513671875, -2.3740234375, -2.234375, -2.0947265625, -1.955078125, -1.8154296875, -1.67578125, -1.5361328125, -1.396484375, -1.2568359375, -1.1171875, -0.9775390625, -0.837890625, -0.6982421875, -0.55859375, -0.4189453125, -0.279296875, -0.1396484375, 0.0, 0.1396484375, 0.279296875, 0.4189453125, 0.55859375, 0.6982421875, 0.837890625, 0.9775390625, 1.1171875, 1.2568359375, 1.396484375, 1.5361328125, 1.67578125, 1.8154296875, 1.955078125, 2.0947265625, 2.234375, 2.3740234375, 2.513671875, 2.6533203125, 2.79296875, 2.9326171875, 3.072265625, 3.2119140625, 3.3515625, 3.4912109375, 3.630859375, 3.7705078125, 3.91015625, 4.0498046875, 4.189453125, 4.3291015625, 4.46875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 6.0, 9.0, 9.0, 6.0, 6.0, 9.0, 14.0, 16.0, 21.0, 17.0, 30.0, 33.0, 37.0, 46.0, 67.0, 118.0, 200.0, 442.0, 1239.0, 5177.0, 29756.0, 263242.0, 2004466.0, 1666313.0, 193830.0, 23032.0, 4175.0, 1010.0, 358.0, 192.0, 98.0, 58.0, 49.0, 38.0, 30.0, 25.0, 20.0, 12.0, 16.0, 12.0, 3.0, 7.0, 13.0, 5.0, 8.0, 3.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.0234375, -10.688720703125, -10.35400390625, -10.019287109375, -9.6845703125, -9.349853515625, -9.01513671875, -8.680419921875, -8.345703125, -8.010986328125, -7.67626953125, -7.341552734375, -7.0068359375, -6.672119140625, -6.33740234375, -6.002685546875, -5.66796875, -5.333251953125, -4.99853515625, -4.663818359375, -4.3291015625, -3.994384765625, -3.65966796875, -3.324951171875, -2.990234375, -2.655517578125, -2.32080078125, -1.986083984375, -1.6513671875, -1.316650390625, -0.98193359375, -0.647216796875, -0.3125, 0.022216796875, 0.35693359375, 0.691650390625, 1.0263671875, 1.361083984375, 1.69580078125, 2.030517578125, 2.365234375, 2.699951171875, 3.03466796875, 3.369384765625, 3.7041015625, 4.038818359375, 4.37353515625, 4.708251953125, 5.04296875, 5.377685546875, 5.71240234375, 6.047119140625, 6.3818359375, 6.716552734375, 7.05126953125, 7.385986328125, 7.720703125, 8.055419921875, 8.39013671875, 8.724853515625, 9.0595703125, 9.394287109375, 9.72900390625, 10.063720703125, 10.3984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 6.0, 5.0, 5.0, 7.0, 20.0, 18.0, 22.0, 39.0, 38.0, 39.0, 60.0, 86.0, 107.0, 148.0, 188.0, 195.0, 267.0, 346.0, 336.0, 341.0, 330.0, 320.0, 261.0, 201.0, 131.0, 139.0, 91.0, 81.0, 61.0, 43.0, 40.0, 29.0, 11.0, 17.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -8.1461181640625, -7.846923828125, -7.5477294921875, -7.24853515625, -6.9493408203125, -6.650146484375, -6.3509521484375, -6.0517578125, -5.7525634765625, -5.453369140625, -5.1541748046875, -4.85498046875, -4.5557861328125, -4.256591796875, -3.9573974609375, -3.658203125, -3.3590087890625, -3.059814453125, -2.7606201171875, -2.46142578125, -2.1622314453125, -1.863037109375, -1.5638427734375, -1.2646484375, -0.9654541015625, -0.666259765625, -0.3670654296875, -0.06787109375, 0.2313232421875, 0.530517578125, 0.8297119140625, 1.12890625, 1.4281005859375, 1.727294921875, 2.0264892578125, 2.32568359375, 2.6248779296875, 2.924072265625, 3.2232666015625, 3.5224609375, 3.8216552734375, 4.120849609375, 4.4200439453125, 4.71923828125, 5.0184326171875, 5.317626953125, 5.6168212890625, 5.916015625, 6.2152099609375, 6.514404296875, 6.8135986328125, 7.11279296875, 7.4119873046875, 7.711181640625, 8.0103759765625, 8.3095703125, 8.6087646484375, 8.907958984375, 9.2071533203125, 9.50634765625, 9.8055419921875, 10.104736328125, 10.4039306640625, 10.703125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 8.0, 6.0, 10.0, 12.0, 24.0, 28.0, 42.0, 66.0, 86.0, 93.0, 149.0, 260.0, 465.0, 1660.0, 18269.0, 721789.0, 3330652.0, 113799.0, 5001.0, 849.0, 309.0, 206.0, 142.0, 83.0, 73.0, 62.0, 28.0, 32.0, 19.0, 18.0, 14.0, 11.0, 6.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-33.28125, -32.31005859375, -31.3388671875, -30.36767578125, -29.396484375, -28.42529296875, -27.4541015625, -26.48291015625, -25.51171875, -24.54052734375, -23.5693359375, -22.59814453125, -21.626953125, -20.65576171875, -19.6845703125, -18.71337890625, -17.7421875, -16.77099609375, -15.7998046875, -14.82861328125, -13.857421875, -12.88623046875, -11.9150390625, -10.94384765625, -9.97265625, -9.00146484375, -8.0302734375, -7.05908203125, -6.087890625, -5.11669921875, -4.1455078125, -3.17431640625, -2.203125, -1.23193359375, -0.2607421875, 0.71044921875, 1.681640625, 2.65283203125, 3.6240234375, 4.59521484375, 5.56640625, 6.53759765625, 7.5087890625, 8.47998046875, 9.451171875, 10.42236328125, 11.3935546875, 12.36474609375, 13.3359375, 14.30712890625, 15.2783203125, 16.24951171875, 17.220703125, 18.19189453125, 19.1630859375, 20.13427734375, 21.10546875, 22.07666015625, 23.0478515625, 24.01904296875, 24.990234375, 25.96142578125, 26.9326171875, 27.90380859375, 28.875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 19.0, 15.0, 36.0, 38.0, 60.0, 69.0, 103.0, 98.0, 88.0, 94.0, 82.0, 89.0, 66.0, 63.0, 27.0, 27.0, 9.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.548952102661133, -21.101688385009766, -19.654422760009766, -18.207157135009766, -16.7598934173584, -15.312628746032715, -13.865364074707031, -12.418099403381348, -10.970834732055664, -9.52357006072998, -8.076305389404297, -6.629040718078613, -5.18177604675293, -3.734511375427246, -2.2872467041015625, -0.8399820327758789, 0.6072826385498047, 2.0545473098754883, 3.501811981201172, 4.9490766525268555, 6.396341323852539, 7.843605995178223, 9.290870666503906, 10.73813533782959, 12.185400009155273, 13.632664680480957, 15.07992935180664, 16.52719497680664, 17.974458694458008, 19.421722412109375, 20.868988037109375, 22.316253662109375, 23.763519287109375, 25.210784912109375, 26.658048629760742, 28.10531234741211, 29.55257797241211, 30.99984359741211, 32.447105407714844, 33.894371032714844, 35.341636657714844, 36.788902282714844, 38.236167907714844, 39.68342971801758, 41.13069534301758, 42.57796096801758, 44.02522277832031, 45.47248840332031, 46.91975402832031, 48.36701965332031, 49.81428527832031, 51.26154708862305, 52.70881271362305, 54.15607833862305, 55.60334014892578, 57.05060577392578, 58.49787139892578, 59.94513702392578, 61.39240264892578, 62.839664459228516, 64.28692626953125, 65.73419189453125, 67.18145751953125, 68.62872314453125, 70.07598876953125]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 10.0, 5.0, 11.0, 6.0, 13.0, 13.0, 20.0, 19.0, 19.0, 19.0, 25.0, 23.0, 20.0, 33.0, 24.0, 28.0, 26.0, 34.0, 30.0, 50.0, 48.0, 43.0, 32.0, 34.0, 29.0, 34.0, 39.0, 28.0, 33.0, 29.0, 26.0, 15.0, 22.0, 20.0, 20.0, 20.0, 12.0, 15.0, 12.0, 10.0, 7.0, 8.0, 5.0, 6.0, 3.0, 5.0, 4.0, 2.0, 3.0, 5.0, 0.0, 0.0, 3.0, 2.0], "bins": [-33.534393310546875, -32.471500396728516, -31.40860939025879, -30.345718383789062, -29.282825469970703, -28.219934463500977, -27.15704345703125, -26.09415054321289, -25.031259536743164, -23.968368530273438, -22.905475616455078, -21.84258460998535, -20.779693603515625, -19.716800689697266, -18.65390968322754, -17.591018676757812, -16.528125762939453, -15.46523380279541, -14.402341842651367, -13.33945083618164, -12.276558876037598, -11.213666915893555, -10.150775909423828, -9.087883949279785, -8.024991989135742, -6.962100028991699, -5.8992085456848145, -4.83631706237793, -3.7734251022338867, -2.7105331420898438, -1.647641658782959, -0.5847501754760742, 0.47814178466796875, 1.5410335063934326, 2.6039252281188965, 3.6668169498443604, 4.729708671569824, 5.792600631713867, 6.855492115020752, 7.918383598327637, 8.98127555847168, 10.044167518615723, 11.107059478759766, 12.169950485229492, 13.232842445373535, 14.295734405517578, 15.358625411987305, 16.42151641845703, 17.48440933227539, 18.547300338745117, 19.610193252563477, 20.673084259033203, 21.735977172851562, 22.79886817932129, 23.861759185791016, 24.924652099609375, 25.9875431060791, 27.050434112548828, 28.113327026367188, 29.176218032836914, 30.23910903930664, 31.302001953125, 32.36489486694336, 33.42778396606445, 34.49067687988281]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 7.0, 6.0, 15.0, 15.0, 22.0, 22.0, 19.0, 13.0, 32.0, 38.0, 40.0, 36.0, 38.0, 38.0, 42.0, 44.0, 53.0, 45.0, 35.0, 53.0, 48.0, 36.0, 31.0, 28.0, 30.0, 28.0, 32.0, 26.0, 14.0, 17.0, 17.0, 14.0, 13.0, 7.0, 3.0, 11.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.9296875, -4.78497314453125, -4.6402587890625, -4.49554443359375, -4.350830078125, -4.20611572265625, -4.0614013671875, -3.91668701171875, -3.77197265625, -3.62725830078125, -3.4825439453125, -3.33782958984375, -3.193115234375, -3.04840087890625, -2.9036865234375, -2.75897216796875, -2.6142578125, -2.46954345703125, -2.3248291015625, -2.18011474609375, -2.035400390625, -1.89068603515625, -1.7459716796875, -1.60125732421875, -1.45654296875, -1.31182861328125, -1.1671142578125, -1.02239990234375, -0.877685546875, -0.73297119140625, -0.5882568359375, -0.44354248046875, -0.298828125, -0.15411376953125, -0.0093994140625, 0.13531494140625, 0.280029296875, 0.42474365234375, 0.5694580078125, 0.71417236328125, 0.85888671875, 1.00360107421875, 1.1483154296875, 1.29302978515625, 1.437744140625, 1.58245849609375, 1.7271728515625, 1.87188720703125, 2.0166015625, 2.16131591796875, 2.3060302734375, 2.45074462890625, 2.595458984375, 2.74017333984375, 2.8848876953125, 3.02960205078125, 3.17431640625, 3.31903076171875, 3.4637451171875, 3.60845947265625, 3.753173828125, 3.89788818359375, 4.0426025390625, 4.18731689453125, 4.33203125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 8.0, 8.0, 22.0, 27.0, 37.0, 55.0, 86.0, 115.0, 151.0, 228.0, 310.0, 479.0, 641.0, 990.0, 1339.0, 1928.0, 2713.0, 3904.0, 5567.0, 8227.0, 12167.0, 18231.0, 28353.0, 44716.0, 75589.0, 136510.0, 270359.0, 183578.0, 95379.0, 55463.0, 33776.0, 21840.0, 14287.0, 9587.0, 6527.0, 4614.0, 3235.0, 2231.0, 1600.0, 1111.0, 747.0, 533.0, 365.0, 295.0, 189.0, 141.0, 94.0, 59.0, 47.0, 33.0, 24.0, 14.0, 12.0, 10.0, 7.0, 3.0, 1.0, 2.0], "bins": [-0.75439453125, -0.7313308715820312, -0.7082672119140625, -0.6852035522460938, -0.662139892578125, -0.6390762329101562, -0.6160125732421875, -0.5929489135742188, -0.56988525390625, -0.5468215942382812, -0.5237579345703125, -0.5006942749023438, -0.477630615234375, -0.45456695556640625, -0.4315032958984375, -0.40843963623046875, -0.3853759765625, -0.36231231689453125, -0.3392486572265625, -0.31618499755859375, -0.293121337890625, -0.27005767822265625, -0.2469940185546875, -0.22393035888671875, -0.20086669921875, -0.17780303955078125, -0.1547393798828125, -0.13167572021484375, -0.108612060546875, -0.08554840087890625, -0.0624847412109375, -0.03942108154296875, -0.016357421875, 0.00670623779296875, 0.0297698974609375, 0.05283355712890625, 0.075897216796875, 0.09896087646484375, 0.1220245361328125, 0.14508819580078125, 0.16815185546875, 0.19121551513671875, 0.2142791748046875, 0.23734283447265625, 0.260406494140625, 0.28347015380859375, 0.3065338134765625, 0.32959747314453125, 0.3526611328125, 0.37572479248046875, 0.3987884521484375, 0.42185211181640625, 0.444915771484375, 0.46797943115234375, 0.4910430908203125, 0.5141067504882812, 0.53717041015625, 0.5602340698242188, 0.5832977294921875, 0.6063613891601562, 0.629425048828125, 0.6524887084960938, 0.6755523681640625, 0.6986160278320312, 0.7216796875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 2.0, 8.0, 5.0, 8.0, 11.0, 12.0, 10.0, 17.0, 14.0, 28.0, 20.0, 32.0, 43.0, 37.0, 45.0, 37.0, 52.0, 24.0, 35.0, 1068.0, 38.0, 37.0, 36.0, 57.0, 48.0, 39.0, 33.0, 34.0, 32.0, 34.0, 29.0, 18.0, 11.0, 19.0, 14.0, 2.0, 2.0, 11.0, 4.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.9140625, -2.819610595703125, -2.72515869140625, -2.630706787109375, -2.5362548828125, -2.441802978515625, -2.34735107421875, -2.252899169921875, -2.158447265625, -2.063995361328125, -1.96954345703125, -1.875091552734375, -1.7806396484375, -1.686187744140625, -1.59173583984375, -1.497283935546875, -1.40283203125, -1.308380126953125, -1.21392822265625, -1.119476318359375, -1.0250244140625, -0.930572509765625, -0.83612060546875, -0.741668701171875, -0.647216796875, -0.552764892578125, -0.45831298828125, -0.363861083984375, -0.2694091796875, -0.174957275390625, -0.08050537109375, 0.013946533203125, 0.1083984375, 0.202850341796875, 0.29730224609375, 0.391754150390625, 0.4862060546875, 0.580657958984375, 0.67510986328125, 0.769561767578125, 0.864013671875, 0.958465576171875, 1.05291748046875, 1.147369384765625, 1.2418212890625, 1.336273193359375, 1.43072509765625, 1.525177001953125, 1.61962890625, 1.714080810546875, 1.80853271484375, 1.902984619140625, 1.9974365234375, 2.091888427734375, 2.18634033203125, 2.280792236328125, 2.375244140625, 2.469696044921875, 2.56414794921875, 2.658599853515625, 2.7530517578125, 2.847503662109375, 2.94195556640625, 3.036407470703125, 3.130859375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 5.0, 7.0, 16.0, 21.0, 21.0, 40.0, 64.0, 75.0, 133.0, 196.0, 266.0, 411.0, 584.0, 839.0, 1442.0, 2208.0, 3352.0, 5316.0, 8984.0, 15284.0, 26018.0, 46289.0, 85251.0, 172469.0, 1364812.0, 168828.0, 83977.0, 45552.0, 25534.0, 14984.0, 8950.0, 5515.0, 3392.0, 2250.0, 1299.0, 938.0, 552.0, 389.0, 269.0, 183.0, 124.0, 100.0, 53.0, 43.0, 32.0, 16.0, 19.0, 14.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.86865234375, -0.8419113159179688, -0.8151702880859375, -0.7884292602539062, -0.761688232421875, -0.7349472045898438, -0.7082061767578125, -0.6814651489257812, -0.65472412109375, -0.6279830932617188, -0.6012420654296875, -0.5745010375976562, -0.547760009765625, -0.5210189819335938, -0.4942779541015625, -0.46753692626953125, -0.4407958984375, -0.41405487060546875, -0.3873138427734375, -0.36057281494140625, -0.333831787109375, -0.30709075927734375, -0.2803497314453125, -0.25360870361328125, -0.22686767578125, -0.20012664794921875, -0.1733856201171875, -0.14664459228515625, -0.119903564453125, -0.09316253662109375, -0.0664215087890625, -0.03968048095703125, -0.012939453125, 0.01380157470703125, 0.0405426025390625, 0.06728363037109375, 0.094024658203125, 0.12076568603515625, 0.1475067138671875, 0.17424774169921875, 0.20098876953125, 0.22772979736328125, 0.2544708251953125, 0.28121185302734375, 0.307952880859375, 0.33469390869140625, 0.3614349365234375, 0.38817596435546875, 0.4149169921875, 0.44165802001953125, 0.4683990478515625, 0.49514007568359375, 0.521881103515625, 0.5486221313476562, 0.5753631591796875, 0.6021041870117188, 0.62884521484375, 0.6555862426757812, 0.6823272705078125, 0.7090682983398438, 0.735809326171875, 0.7625503540039062, 0.7892913818359375, 0.8160324096679688, 0.8427734375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 4.0, 11.0, 6.0, 5.0, 12.0, 15.0, 17.0, 17.0, 18.0, 15.0, 34.0, 34.0, 44.0, 57.0, 67.0, 77.0, 77.0, 69.0, 74.0, 73.0, 70.0, 57.0, 23.0, 36.0, 29.0, 15.0, 11.0, 8.0, 5.0, 5.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008678436279296875, -0.0008385926485061646, -0.0008093416690826416, -0.0007800906896591187, -0.0007508397102355957, -0.0007215887308120728, -0.0006923377513885498, -0.0006630867719650269, -0.0006338357925415039, -0.000604584813117981, -0.000575333833694458, -0.0005460828542709351, -0.0005168318748474121, -0.00048758089542388916, -0.0004583299160003662, -0.00042907893657684326, -0.0003998279571533203, -0.00037057697772979736, -0.0003413259983062744, -0.00031207501888275146, -0.0002828240394592285, -0.00025357306003570557, -0.00022432208061218262, -0.00019507110118865967, -0.00016582012176513672, -0.00013656914234161377, -0.00010731816291809082, -7.806718349456787e-05, -4.881620407104492e-05, -1.9565224647521973e-05, 9.685754776000977e-06, 3.8936734199523926e-05, 6.818771362304688e-05, 9.743869304656982e-05, 0.00012668967247009277, 0.00015594065189361572, 0.00018519163131713867, 0.00021444261074066162, 0.00024369359016418457, 0.0002729445695877075, 0.00030219554901123047, 0.0003314465284347534, 0.00036069750785827637, 0.0003899484872817993, 0.00041919946670532227, 0.0004484504461288452, 0.00047770142555236816, 0.0005069524049758911, 0.0005362033843994141, 0.000565454363822937, 0.00059470534324646, 0.0006239563226699829, 0.0006532073020935059, 0.0006824582815170288, 0.0007117092609405518, 0.0007409602403640747, 0.0007702112197875977, 0.0007994621992111206, 0.0008287131786346436, 0.0008579641580581665, 0.0008872151374816895, 0.0009164661169052124, 0.0009457170963287354, 0.0009749680757522583, 0.0010042190551757812]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 11.0, 8.0, 12.0, 18.0, 20.0, 41.0, 50.0, 80.0, 109.0, 190.0, 351.0, 698.0, 8879.0, 1028275.0, 8203.0, 729.0, 341.0, 191.0, 89.0, 65.0, 39.0, 33.0, 25.0, 20.0, 15.0, 13.0, 11.0, 8.0, 8.0, 8.0, 4.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.018524169921875, -0.017935991287231445, -0.01734781265258789, -0.016759634017944336, -0.01617145538330078, -0.015583276748657227, -0.014995098114013672, -0.014406919479370117, -0.013818740844726562, -0.013230562210083008, -0.012642383575439453, -0.012054204940795898, -0.011466026306152344, -0.010877847671508789, -0.010289669036865234, -0.00970149040222168, -0.009113311767578125, -0.00852513313293457, -0.007936954498291016, -0.007348775863647461, -0.006760597229003906, -0.0061724185943603516, -0.005584239959716797, -0.004996061325073242, -0.0044078826904296875, -0.003819704055786133, -0.003231525421142578, -0.0026433467864990234, -0.0020551681518554688, -0.001466989517211914, -0.0008788108825683594, -0.0002906322479248047, 0.00029754638671875, 0.0008857250213623047, 0.0014739036560058594, 0.002062082290649414, 0.0026502609252929688, 0.0032384395599365234, 0.003826618194580078, 0.004414796829223633, 0.0050029754638671875, 0.005591154098510742, 0.006179332733154297, 0.0067675113677978516, 0.007355690002441406, 0.007943868637084961, 0.008532047271728516, 0.00912022590637207, 0.009708404541015625, 0.01029658317565918, 0.010884761810302734, 0.011472940444946289, 0.012061119079589844, 0.012649297714233398, 0.013237476348876953, 0.013825654983520508, 0.014413833618164062, 0.015002012252807617, 0.015590190887451172, 0.016178369522094727, 0.01676654815673828, 0.017354726791381836, 0.01794290542602539, 0.018531084060668945, 0.0191192626953125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 33.0, 146.0, 376.0, 333.0, 104.0, 18.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007817293517291546, -0.0007210138137452304, -0.0006602983339689672, -0.000599582795985043, -0.0005388672580011189, -0.0004781517491210252, -0.0004174362402409315, -0.00035672070225700736, -0.00029600519337691367, -0.00023528966994490474, -0.00017457414651289582, -0.00011385863763280213, -5.314311420079321e-05, 7.572409231215715e-06, 6.828791811130941e-05, 0.00012900345609523356, 0.00018971896497532725, 0.00025043447385542095, 0.0003111500118393451, 0.0003718655207194388, 0.00043258105870336294, 0.0004932965384796262, 0.0005540120764635503, 0.0006147276144474745, 0.0006754430942237377, 0.0007361586322076619, 0.0007968741119839251, 0.0008575896499678493, 0.0009183051879517734, 0.0009790207259356976, 0.0010397362057119608, 0.001100451685488224, 0.001161167281679809, 0.0012218827614560723, 0.0012825983576476574, 0.0013433138374239206, 0.0014040293172001839, 0.001464744913391769, 0.0015254603931680322, 0.0015861759893596172, 0.0016468914691358805, 0.0017076069489121437, 0.0017683225451037288, 0.001829038024879992, 0.0018897535046562552, 0.0019504691008478403, 0.0020111845806241035, 0.0020719000604003668, 0.00213261554017663, 0.0021933310199528933, 0.0022540464997291565, 0.0023147622123360634, 0.0023754776921123266, 0.00243619317188859, 0.002496908651664853, 0.0025576241314411163, 0.0026183398440480232, 0.0026790553238242865, 0.0027397708036005497, 0.0028004865162074566, 0.00286120199598372, 0.002921917475759983, 0.0029826329555362463, 0.0030433484353125095, 0.0031040639150887728]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 8.0, 9.0, 8.0, 7.0, 9.0, 13.0, 15.0, 12.0, 23.0, 24.0, 28.0, 19.0, 28.0, 23.0, 27.0, 29.0, 47.0, 27.0, 38.0, 34.0, 43.0, 40.0, 33.0, 36.0, 27.0, 24.0, 41.0, 27.0, 33.0, 30.0, 24.0, 30.0, 29.0, 27.0, 13.0, 15.0, 11.0, 10.0, 15.0, 11.0, 10.0, 15.0, 7.0, 4.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-0.00034350156784057617, -0.0003326665610074997, -0.0003218315541744232, -0.00031099654734134674, -0.00030016154050827026, -0.0002893265336751938, -0.0002784915268421173, -0.00026765652000904083, -0.00025682151317596436, -0.0002459865063428879, -0.0002351514995098114, -0.00022431649267673492, -0.00021348148584365845, -0.00020264647901058197, -0.0001918114721775055, -0.00018097646534442902, -0.00017014145851135254, -0.00015930645167827606, -0.00014847144484519958, -0.0001376364380121231, -0.00012680143117904663, -0.00011596642434597015, -0.00010513141751289368, -9.42964106798172e-05, -8.346140384674072e-05, -7.262639701366425e-05, -6.179139018058777e-05, -5.095638334751129e-05, -4.0121376514434814e-05, -2.9286369681358337e-05, -1.845136284828186e-05, -7.616356015205383e-06, 3.2186508178710938e-06, 1.405365765094757e-05, 2.4888664484024048e-05, 3.5723671317100525e-05, 4.6558678150177e-05, 5.739368498325348e-05, 6.822869181632996e-05, 7.906369864940643e-05, 8.989870548248291e-05, 0.00010073371231555939, 0.00011156871914863586, 0.00012240372598171234, 0.00013323873281478882, 0.0001440737396478653, 0.00015490874648094177, 0.00016574375331401825, 0.00017657876014709473, 0.0001874137669801712, 0.00019824877381324768, 0.00020908378064632416, 0.00021991878747940063, 0.0002307537943124771, 0.0002415888011455536, 0.00025242380797863007, 0.00026325881481170654, 0.000274093821644783, 0.0002849288284778595, 0.000295763835310936, 0.00030659884214401245, 0.00031743384897708893, 0.0003282688558101654, 0.0003391038626432419, 0.00034993886947631836]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 4.0, 6.0, 7.0, 7.0, 6.0, 15.0, 15.0, 22.0, 22.0, 19.0, 13.0, 32.0, 38.0, 40.0, 36.0, 38.0, 38.0, 42.0, 44.0, 53.0, 45.0, 35.0, 53.0, 48.0, 36.0, 31.0, 28.0, 30.0, 28.0, 32.0, 26.0, 14.0, 17.0, 17.0, 14.0, 13.0, 7.0, 3.0, 11.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.9296875, -4.78497314453125, -4.6402587890625, -4.49554443359375, -4.350830078125, -4.20611572265625, -4.0614013671875, -3.91668701171875, -3.77197265625, -3.62725830078125, -3.4825439453125, -3.33782958984375, -3.193115234375, -3.04840087890625, -2.9036865234375, -2.75897216796875, -2.6142578125, -2.46954345703125, -2.3248291015625, -2.18011474609375, -2.035400390625, -1.89068603515625, -1.7459716796875, -1.60125732421875, -1.45654296875, -1.31182861328125, -1.1671142578125, -1.02239990234375, -0.877685546875, -0.73297119140625, -0.5882568359375, -0.44354248046875, -0.298828125, -0.15411376953125, -0.0093994140625, 0.13531494140625, 0.280029296875, 0.42474365234375, 0.5694580078125, 0.71417236328125, 0.85888671875, 1.00360107421875, 1.1483154296875, 1.29302978515625, 1.437744140625, 1.58245849609375, 1.7271728515625, 1.87188720703125, 2.0166015625, 2.16131591796875, 2.3060302734375, 2.45074462890625, 2.595458984375, 2.74017333984375, 2.8848876953125, 3.02960205078125, 3.17431640625, 3.31903076171875, 3.4637451171875, 3.60845947265625, 3.753173828125, 3.89788818359375, 4.0426025390625, 4.18731689453125, 4.33203125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 6.0, 9.0, 16.0, 16.0, 20.0, 36.0, 51.0, 64.0, 92.0, 114.0, 174.0, 275.0, 336.0, 559.0, 811.0, 1281.0, 1992.0, 3140.0, 4857.0, 8258.0, 15233.0, 33343.0, 90536.0, 289245.0, 385545.0, 125069.0, 43319.0, 18596.0, 9708.0, 5695.0, 3536.0, 2219.0, 1395.0, 977.0, 658.0, 401.0, 273.0, 193.0, 146.0, 108.0, 72.0, 45.0, 34.0, 24.0, 26.0, 20.0, 11.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.67578125, -4.525634765625, -4.37548828125, -4.225341796875, -4.0751953125, -3.925048828125, -3.77490234375, -3.624755859375, -3.474609375, -3.324462890625, -3.17431640625, -3.024169921875, -2.8740234375, -2.723876953125, -2.57373046875, -2.423583984375, -2.2734375, -2.123291015625, -1.97314453125, -1.822998046875, -1.6728515625, -1.522705078125, -1.37255859375, -1.222412109375, -1.072265625, -0.922119140625, -0.77197265625, -0.621826171875, -0.4716796875, -0.321533203125, -0.17138671875, -0.021240234375, 0.12890625, 0.279052734375, 0.42919921875, 0.579345703125, 0.7294921875, 0.879638671875, 1.02978515625, 1.179931640625, 1.330078125, 1.480224609375, 1.63037109375, 1.780517578125, 1.9306640625, 2.080810546875, 2.23095703125, 2.381103515625, 2.53125, 2.681396484375, 2.83154296875, 2.981689453125, 3.1318359375, 3.281982421875, 3.43212890625, 3.582275390625, 3.732421875, 3.882568359375, 4.03271484375, 4.182861328125, 4.3330078125, 4.483154296875, 4.63330078125, 4.783447265625, 4.93359375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 7.0, 10.0, 9.0, 9.0, 16.0, 17.0, 24.0, 26.0, 25.0, 40.0, 36.0, 38.0, 34.0, 32.0, 42.0, 60.0, 138.0, 281.0, 1509.0, 189.0, 88.0, 52.0, 44.0, 37.0, 40.0, 38.0, 25.0, 16.0, 22.0, 16.0, 17.0, 18.0, 9.0, 11.0, 15.0, 4.0, 14.0, 4.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4765625, -15.01171875, -14.546875, -14.08203125, -13.6171875, -13.15234375, -12.6875, -12.22265625, -11.7578125, -11.29296875, -10.828125, -10.36328125, -9.8984375, -9.43359375, -8.96875, -8.50390625, -8.0390625, -7.57421875, -7.109375, -6.64453125, -6.1796875, -5.71484375, -5.25, -4.78515625, -4.3203125, -3.85546875, -3.390625, -2.92578125, -2.4609375, -1.99609375, -1.53125, -1.06640625, -0.6015625, -0.13671875, 0.328125, 0.79296875, 1.2578125, 1.72265625, 2.1875, 2.65234375, 3.1171875, 3.58203125, 4.046875, 4.51171875, 4.9765625, 5.44140625, 5.90625, 6.37109375, 6.8359375, 7.30078125, 7.765625, 8.23046875, 8.6953125, 9.16015625, 9.625, 10.08984375, 10.5546875, 11.01953125, 11.484375, 11.94921875, 12.4140625, 12.87890625, 13.34375, 13.80859375, 14.2734375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 6.0, 6.0, 7.0, 17.0, 6.0, 26.0, 33.0, 41.0, 48.0, 78.0, 148.0, 314.0, 653.0, 4713.0, 2502689.0, 632328.0, 3297.0, 548.0, 270.0, 164.0, 95.0, 62.0, 46.0, 28.0, 20.0, 19.0, 15.0, 9.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.1875, -48.70849609375, -47.2294921875, -45.75048828125, -44.271484375, -42.79248046875, -41.3134765625, -39.83447265625, -38.35546875, -36.87646484375, -35.3974609375, -33.91845703125, -32.439453125, -30.96044921875, -29.4814453125, -28.00244140625, -26.5234375, -25.04443359375, -23.5654296875, -22.08642578125, -20.607421875, -19.12841796875, -17.6494140625, -16.17041015625, -14.69140625, -13.21240234375, -11.7333984375, -10.25439453125, -8.775390625, -7.29638671875, -5.8173828125, -4.33837890625, -2.859375, -1.38037109375, 0.0986328125, 1.57763671875, 3.056640625, 4.53564453125, 6.0146484375, 7.49365234375, 8.97265625, 10.45166015625, 11.9306640625, 13.40966796875, 14.888671875, 16.36767578125, 17.8466796875, 19.32568359375, 20.8046875, 22.28369140625, 23.7626953125, 25.24169921875, 26.720703125, 28.19970703125, 29.6787109375, 31.15771484375, 32.63671875, 34.11572265625, 35.5947265625, 37.07373046875, 38.552734375, 40.03173828125, 41.5107421875, 42.98974609375, 44.46875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 6.0, 138.0, 670.0, 191.0, 10.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.539440155029297, -24.20182228088379, -19.86420440673828, -15.526588439941406, -11.188970565795898, -6.851352691650391, -2.5137367248535156, 1.8238811492919922, 6.1614990234375, 10.499116897583008, 14.8367338180542, 19.17435073852539, 23.5119686126709, 27.849586486816406, 32.18720245361328, 36.524818420410156, 40.8624382019043, 45.20005416870117, 49.53767395019531, 53.87528991699219, 58.21290588378906, 62.5505256652832, 66.88813781738281, 71.22576141357422, 75.5633773803711, 79.90099334716797, 84.23860931396484, 88.57623291015625, 92.91384887695312, 97.25146484375, 101.58908081054688, 105.92669677734375, 110.26431274414062, 114.6019287109375, 118.93954467773438, 123.27716064453125, 127.61478424072266, 131.952392578125, 136.29000854492188, 140.6276397705078, 144.9652557373047, 149.30287170410156, 153.64048767089844, 157.9781036376953, 162.3157196044922, 166.65335083007812, 170.990966796875, 175.32858276367188, 179.66619873046875, 184.00381469726562, 188.3414306640625, 192.67904663085938, 197.01666259765625, 201.35427856445312, 205.69189453125, 210.02952575683594, 214.36712646484375, 218.70474243164062, 223.0423583984375, 227.37997436523438, 231.71759033203125, 236.05520629882812, 240.392822265625, 244.73045349121094, 249.0680694580078]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 7.0, 2.0, 10.0, 11.0, 9.0, 17.0, 16.0, 19.0, 23.0, 33.0, 28.0, 21.0, 40.0, 42.0, 40.0, 32.0, 40.0, 32.0, 52.0, 45.0, 42.0, 44.0, 47.0, 25.0, 34.0, 38.0, 37.0, 24.0, 25.0, 23.0, 27.0, 20.0, 19.0, 10.0, 19.0, 5.0, 10.0, 6.0, 7.0, 8.0, 6.0, 6.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.48308563232422, -49.94945526123047, -48.41582489013672, -46.88219451904297, -45.34856033325195, -43.8149299621582, -42.28129959106445, -40.7476692199707, -39.21403884887695, -37.6804084777832, -36.14677810668945, -34.61314392089844, -33.07951354980469, -31.545883178710938, -30.012252807617188, -28.478622436523438, -26.944990158081055, -25.411359786987305, -23.877727508544922, -22.344097137451172, -20.810466766357422, -19.276836395263672, -17.74320411682129, -16.20957374572754, -14.675942420959473, -13.142311096191406, -11.608680725097656, -10.07504940032959, -8.541418075561523, -7.007787704467773, -5.474156379699707, -3.940526008605957, -2.4068946838378906, -0.8732637166976929, 0.6603672504425049, 2.193998336791992, 3.7276291847229004, 5.261260032653809, 6.794891357421875, 8.328521728515625, 9.862153053283691, 11.395784378051758, 12.929414749145508, 14.463046073913574, 15.99667739868164, 17.53030776977539, 19.06393814086914, 20.59756851196289, 22.131200790405273, 23.664831161499023, 25.198463439941406, 26.732093811035156, 28.265724182128906, 29.799354553222656, 31.33298683166504, 32.866615295410156, 34.40024948120117, 35.93387985229492, 37.46751022338867, 39.00114440917969, 40.53477478027344, 42.06840515136719, 43.60203552246094, 45.13566589355469, 46.66929626464844]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 5.0, 4.0, 9.0, 9.0, 9.0, 7.0, 11.0, 10.0, 16.0, 20.0, 26.0, 16.0, 33.0, 34.0, 39.0, 30.0, 47.0, 35.0, 49.0, 43.0, 49.0, 44.0, 49.0, 44.0, 44.0, 38.0, 26.0, 41.0, 32.0, 30.0, 21.0, 19.0, 18.0, 19.0, 10.0, 14.0, 18.0, 8.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-5.12890625, -4.9786376953125, -4.828369140625, -4.6781005859375, -4.52783203125, -4.3775634765625, -4.227294921875, -4.0770263671875, -3.9267578125, -3.7764892578125, -3.626220703125, -3.4759521484375, -3.32568359375, -3.1754150390625, -3.025146484375, -2.8748779296875, -2.724609375, -2.5743408203125, -2.424072265625, -2.2738037109375, -2.12353515625, -1.9732666015625, -1.822998046875, -1.6727294921875, -1.5224609375, -1.3721923828125, -1.221923828125, -1.0716552734375, -0.92138671875, -0.7711181640625, -0.620849609375, -0.4705810546875, -0.3203125, -0.1700439453125, -0.019775390625, 0.1304931640625, 0.28076171875, 0.4310302734375, 0.581298828125, 0.7315673828125, 0.8818359375, 1.0321044921875, 1.182373046875, 1.3326416015625, 1.48291015625, 1.6331787109375, 1.783447265625, 1.9337158203125, 2.083984375, 2.2342529296875, 2.384521484375, 2.5347900390625, 2.68505859375, 2.8353271484375, 2.985595703125, 3.1358642578125, 3.2861328125, 3.4364013671875, 3.586669921875, 3.7369384765625, 3.88720703125, 4.0374755859375, 4.187744140625, 4.3380126953125, 4.48828125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 4.0, 2.0, 8.0, 6.0, 9.0, 10.0, 12.0, 15.0, 24.0, 37.0, 34.0, 65.0, 90.0, 183.0, 266.0, 430.0, 778.0, 1514.0, 3280.0, 7310.0, 18340.0, 51541.0, 161187.0, 496545.0, 1150374.0, 1316106.0, 653527.0, 221105.0, 70133.0, 24081.0, 9340.0, 3889.0, 1819.0, 897.0, 473.0, 288.0, 175.0, 129.0, 69.0, 49.0, 43.0, 32.0, 17.0, 19.0, 10.0, 8.0, 3.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.4097900390625, -5.241455078125, -5.0731201171875, -4.90478515625, -4.7364501953125, -4.568115234375, -4.3997802734375, -4.2314453125, -4.0631103515625, -3.894775390625, -3.7264404296875, -3.55810546875, -3.3897705078125, -3.221435546875, -3.0531005859375, -2.884765625, -2.7164306640625, -2.548095703125, -2.3797607421875, -2.21142578125, -2.0430908203125, -1.874755859375, -1.7064208984375, -1.5380859375, -1.3697509765625, -1.201416015625, -1.0330810546875, -0.86474609375, -0.6964111328125, -0.528076171875, -0.3597412109375, -0.19140625, -0.0230712890625, 0.145263671875, 0.3135986328125, 0.48193359375, 0.6502685546875, 0.818603515625, 0.9869384765625, 1.1552734375, 1.3236083984375, 1.491943359375, 1.6602783203125, 1.82861328125, 1.9969482421875, 2.165283203125, 2.3336181640625, 2.501953125, 2.6702880859375, 2.838623046875, 3.0069580078125, 3.17529296875, 3.3436279296875, 3.511962890625, 3.6802978515625, 3.8486328125, 4.0169677734375, 4.185302734375, 4.3536376953125, 4.52197265625, 4.6903076171875, 4.858642578125, 5.0269775390625, 5.1953125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 5.0, 9.0, 17.0, 13.0, 18.0, 27.0, 50.0, 66.0, 92.0, 118.0, 225.0, 247.0, 340.0, 429.0, 453.0, 459.0, 381.0, 308.0, 253.0, 162.0, 119.0, 79.0, 62.0, 49.0, 39.0, 19.0, 13.0, 9.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.609375, -14.2015380859375, -13.793701171875, -13.3858642578125, -12.97802734375, -12.5701904296875, -12.162353515625, -11.7545166015625, -11.3466796875, -10.9388427734375, -10.531005859375, -10.1231689453125, -9.71533203125, -9.3074951171875, -8.899658203125, -8.4918212890625, -8.083984375, -7.6761474609375, -7.268310546875, -6.8604736328125, -6.45263671875, -6.0447998046875, -5.636962890625, -5.2291259765625, -4.8212890625, -4.4134521484375, -4.005615234375, -3.5977783203125, -3.18994140625, -2.7821044921875, -2.374267578125, -1.9664306640625, -1.55859375, -1.1507568359375, -0.742919921875, -0.3350830078125, 0.07275390625, 0.4805908203125, 0.888427734375, 1.2962646484375, 1.7041015625, 2.1119384765625, 2.519775390625, 2.9276123046875, 3.33544921875, 3.7432861328125, 4.151123046875, 4.5589599609375, 4.966796875, 5.3746337890625, 5.782470703125, 6.1903076171875, 6.59814453125, 7.0059814453125, 7.413818359375, 7.8216552734375, 8.2294921875, 8.6373291015625, 9.045166015625, 9.4530029296875, 9.86083984375, 10.2686767578125, 10.676513671875, 11.0843505859375, 11.4921875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 4.0, 12.0, 10.0, 20.0, 12.0, 29.0, 35.0, 56.0, 80.0, 92.0, 168.0, 314.0, 967.0, 5776.0, 161545.0, 3587198.0, 425164.0, 10489.0, 1227.0, 406.0, 226.0, 133.0, 71.0, 57.0, 55.0, 39.0, 30.0, 16.0, 18.0, 5.0, 6.0, 8.0, 6.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.25, -23.22314453125, -22.1962890625, -21.16943359375, -20.142578125, -19.11572265625, -18.0888671875, -17.06201171875, -16.03515625, -15.00830078125, -13.9814453125, -12.95458984375, -11.927734375, -10.90087890625, -9.8740234375, -8.84716796875, -7.8203125, -6.79345703125, -5.7666015625, -4.73974609375, -3.712890625, -2.68603515625, -1.6591796875, -0.63232421875, 0.39453125, 1.42138671875, 2.4482421875, 3.47509765625, 4.501953125, 5.52880859375, 6.5556640625, 7.58251953125, 8.609375, 9.63623046875, 10.6630859375, 11.68994140625, 12.716796875, 13.74365234375, 14.7705078125, 15.79736328125, 16.82421875, 17.85107421875, 18.8779296875, 19.90478515625, 20.931640625, 21.95849609375, 22.9853515625, 24.01220703125, 25.0390625, 26.06591796875, 27.0927734375, 28.11962890625, 29.146484375, 30.17333984375, 31.2001953125, 32.22705078125, 33.25390625, 34.28076171875, 35.3076171875, 36.33447265625, 37.361328125, 38.38818359375, 39.4150390625, 40.44189453125, 41.46875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 22.0, 35.0, 97.0, 157.0, 214.0, 210.0, 129.0, 78.0, 51.0, 12.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.29010009765625, -139.1205596923828, -135.95101928710938, -132.78147888183594, -129.6119384765625, -126.4424057006836, -123.27286529541016, -120.10332489013672, -116.93378448486328, -113.76424407958984, -110.5947036743164, -107.42516326904297, -104.25563049316406, -101.08609008789062, -97.91654968261719, -94.74700927734375, -91.57746887207031, -88.40792846679688, -85.23838806152344, -82.06884765625, -78.89930725097656, -75.72977447509766, -72.56023406982422, -69.39069366455078, -66.22115325927734, -63.051612854003906, -59.88207244873047, -56.7125358581543, -53.54299545288086, -50.37345504760742, -47.20391845703125, -44.03437805175781, -40.864837646484375, -37.69529724121094, -34.5257568359375, -31.356220245361328, -28.18667984008789, -25.017139434814453, -21.84760093688965, -18.678062438964844, -15.508522033691406, -12.338982582092285, -9.169443130493164, -5.999903678894043, -2.830364227294922, 0.3391752243041992, 3.5087146759033203, 6.678253173828125, 9.847793579101562, 13.017333030700684, 16.186872482299805, 19.35641098022461, 22.525951385498047, 25.695491790771484, 28.86503028869629, 32.034568786621094, 35.20410919189453, 38.37364959716797, 41.543190002441406, 44.71272659301758, 47.882266998291016, 51.05180740356445, 54.221343994140625, 57.39088439941406, 60.5604248046875]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 11.0, 6.0, 8.0, 11.0, 14.0, 14.0, 15.0, 24.0, 26.0, 20.0, 24.0, 26.0, 34.0, 34.0, 35.0, 50.0, 23.0, 55.0, 44.0, 32.0, 28.0, 45.0, 37.0, 41.0, 33.0, 32.0, 21.0, 28.0, 29.0, 23.0, 19.0, 27.0, 17.0, 17.0, 16.0, 12.0, 13.0, 9.0, 12.0, 6.0, 3.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-38.20566177368164, -37.06896209716797, -35.93226623535156, -34.79556655883789, -33.65886688232422, -32.52217102050781, -31.38547134399414, -30.2487735748291, -29.112075805664062, -27.975378036499023, -26.83867835998535, -25.701980590820312, -24.565282821655273, -23.428585052490234, -22.291885375976562, -21.155187606811523, -20.01848793029785, -18.881790161132812, -17.74509048461914, -16.6083927154541, -15.471694946289062, -14.334996223449707, -13.198297500610352, -12.061599731445312, -10.924901008605957, -9.788202285766602, -8.651504516601562, -7.514805793762207, -6.37810754776001, -5.2414093017578125, -4.104710578918457, -2.9680123329162598, -1.8313140869140625, -0.6946157217025757, 0.44208264350891113, 1.5787811279296875, 2.7154793739318848, 3.852177619934082, 4.9888763427734375, 6.125574588775635, 7.262272834777832, 8.398971557617188, 9.535669326782227, 10.672368049621582, 11.809066772460938, 12.945764541625977, 14.082463264465332, 15.219161987304688, 16.355859756469727, 17.492557525634766, 18.629257202148438, 19.765954971313477, 20.902652740478516, 22.039352416992188, 23.176050186157227, 24.312747955322266, 25.449447631835938, 26.586145401000977, 27.72284507751465, 28.859542846679688, 29.996240615844727, 31.132938385009766, 32.26963806152344, 33.40633773803711, 34.543033599853516]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 3.0, 9.0, 7.0, 11.0, 19.0, 15.0, 18.0, 23.0, 18.0, 26.0, 20.0, 42.0, 39.0, 44.0, 54.0, 47.0, 45.0, 41.0, 47.0, 40.0, 41.0, 48.0, 36.0, 33.0, 33.0, 31.0, 30.0, 26.0, 21.0, 18.0, 24.0, 16.0, 14.0, 15.0, 8.0, 8.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.03515625, -4.87908935546875, -4.7230224609375, -4.56695556640625, -4.410888671875, -4.25482177734375, -4.0987548828125, -3.94268798828125, -3.78662109375, -3.63055419921875, -3.4744873046875, -3.31842041015625, -3.162353515625, -3.00628662109375, -2.8502197265625, -2.69415283203125, -2.5380859375, -2.38201904296875, -2.2259521484375, -2.06988525390625, -1.913818359375, -1.75775146484375, -1.6016845703125, -1.44561767578125, -1.28955078125, -1.13348388671875, -0.9774169921875, -0.82135009765625, -0.665283203125, -0.50921630859375, -0.3531494140625, -0.19708251953125, -0.041015625, 0.11505126953125, 0.2711181640625, 0.42718505859375, 0.583251953125, 0.73931884765625, 0.8953857421875, 1.05145263671875, 1.20751953125, 1.36358642578125, 1.5196533203125, 1.67572021484375, 1.831787109375, 1.98785400390625, 2.1439208984375, 2.29998779296875, 2.4560546875, 2.61212158203125, 2.7681884765625, 2.92425537109375, 3.080322265625, 3.23638916015625, 3.3924560546875, 3.54852294921875, 3.70458984375, 3.86065673828125, 4.0167236328125, 4.17279052734375, 4.328857421875, 4.48492431640625, 4.6409912109375, 4.79705810546875, 4.953125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 8.0, 17.0, 24.0, 30.0, 41.0, 74.0, 79.0, 152.0, 188.0, 321.0, 513.0, 720.0, 1133.0, 1685.0, 2546.0, 4023.0, 5982.0, 9394.0, 14316.0, 23056.0, 37659.0, 64805.0, 120692.0, 242815.0, 236673.0, 117758.0, 63420.0, 37107.0, 22471.0, 14272.0, 9229.0, 6102.0, 3851.0, 2573.0, 1623.0, 1056.0, 728.0, 489.0, 315.0, 202.0, 142.0, 95.0, 59.0, 45.0, 23.0, 16.0, 14.0, 13.0, 7.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.83984375, -0.8127365112304688, -0.7856292724609375, -0.7585220336914062, -0.731414794921875, -0.7043075561523438, -0.6772003173828125, -0.6500930786132812, -0.62298583984375, -0.5958786010742188, -0.5687713623046875, -0.5416641235351562, -0.514556884765625, -0.48744964599609375, -0.4603424072265625, -0.43323516845703125, -0.4061279296875, -0.37902069091796875, -0.3519134521484375, -0.32480621337890625, -0.297698974609375, -0.27059173583984375, -0.2434844970703125, -0.21637725830078125, -0.18927001953125, -0.16216278076171875, -0.1350555419921875, -0.10794830322265625, -0.080841064453125, -0.05373382568359375, -0.0266265869140625, 0.00048065185546875, 0.027587890625, 0.05469512939453125, 0.0818023681640625, 0.10890960693359375, 0.136016845703125, 0.16312408447265625, 0.1902313232421875, 0.21733856201171875, 0.24444580078125, 0.27155303955078125, 0.2986602783203125, 0.32576751708984375, 0.352874755859375, 0.37998199462890625, 0.4070892333984375, 0.43419647216796875, 0.4613037109375, 0.48841094970703125, 0.5155181884765625, 0.5426254272460938, 0.569732666015625, 0.5968399047851562, 0.6239471435546875, 0.6510543823242188, 0.67816162109375, 0.7052688598632812, 0.7323760986328125, 0.7594833374023438, 0.786590576171875, 0.8136978149414062, 0.8408050537109375, 0.8679122924804688, 0.89501953125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 0.0, 4.0, 6.0, 6.0, 8.0, 14.0, 12.0, 10.0, 15.0, 17.0, 28.0, 28.0, 28.0, 30.0, 28.0, 29.0, 46.0, 29.0, 30.0, 46.0, 53.0, 1062.0, 42.0, 46.0, 31.0, 29.0, 41.0, 39.0, 34.0, 35.0, 31.0, 38.0, 20.0, 19.0, 18.0, 17.0, 11.0, 14.0, 10.0, 3.0, 3.0, 6.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-3.59765625, -3.50146484375, -3.4052734375, -3.30908203125, -3.212890625, -3.11669921875, -3.0205078125, -2.92431640625, -2.828125, -2.73193359375, -2.6357421875, -2.53955078125, -2.443359375, -2.34716796875, -2.2509765625, -2.15478515625, -2.05859375, -1.96240234375, -1.8662109375, -1.77001953125, -1.673828125, -1.57763671875, -1.4814453125, -1.38525390625, -1.2890625, -1.19287109375, -1.0966796875, -1.00048828125, -0.904296875, -0.80810546875, -0.7119140625, -0.61572265625, -0.51953125, -0.42333984375, -0.3271484375, -0.23095703125, -0.134765625, -0.03857421875, 0.0576171875, 0.15380859375, 0.25, 0.34619140625, 0.4423828125, 0.53857421875, 0.634765625, 0.73095703125, 0.8271484375, 0.92333984375, 1.01953125, 1.11572265625, 1.2119140625, 1.30810546875, 1.404296875, 1.50048828125, 1.5966796875, 1.69287109375, 1.7890625, 1.88525390625, 1.9814453125, 2.07763671875, 2.173828125, 2.27001953125, 2.3662109375, 2.46240234375, 2.55859375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 12.0, 10.0, 23.0, 40.0, 40.0, 52.0, 97.0, 143.0, 201.0, 312.0, 464.0, 672.0, 1104.0, 1578.0, 2585.0, 4238.0, 6969.0, 11672.0, 19719.0, 34247.0, 60261.0, 114912.0, 249843.0, 1313982.0, 121514.0, 64341.0, 36027.0, 20753.0, 12049.0, 7383.0, 4429.0, 2678.0, 1733.0, 1045.0, 692.0, 428.0, 300.0, 172.0, 148.0, 85.0, 48.0, 48.0, 21.0, 16.0, 15.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.87158203125, -0.8425674438476562, -0.8135528564453125, -0.7845382690429688, -0.755523681640625, -0.7265090942382812, -0.6974945068359375, -0.6684799194335938, -0.63946533203125, -0.6104507446289062, -0.5814361572265625, -0.5524215698242188, -0.523406982421875, -0.49439239501953125, -0.4653778076171875, -0.43636322021484375, -0.4073486328125, -0.37833404541015625, -0.3493194580078125, -0.32030487060546875, -0.291290283203125, -0.26227569580078125, -0.2332611083984375, -0.20424652099609375, -0.17523193359375, -0.14621734619140625, -0.1172027587890625, -0.08818817138671875, -0.059173583984375, -0.03015899658203125, -0.0011444091796875, 0.02787017822265625, 0.056884765625, 0.08589935302734375, 0.1149139404296875, 0.14392852783203125, 0.172943115234375, 0.20195770263671875, 0.2309722900390625, 0.25998687744140625, 0.28900146484375, 0.31801605224609375, 0.3470306396484375, 0.37604522705078125, 0.405059814453125, 0.43407440185546875, 0.4630889892578125, 0.49210357666015625, 0.5211181640625, 0.5501327514648438, 0.5791473388671875, 0.6081619262695312, 0.637176513671875, 0.6661911010742188, 0.6952056884765625, 0.7242202758789062, 0.75323486328125, 0.7822494506835938, 0.8112640380859375, 0.8402786254882812, 0.869293212890625, 0.8983078002929688, 0.9273223876953125, 0.9563369750976562, 0.9853515625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 2.0, 3.0, 5.0, 4.0, 6.0, 13.0, 7.0, 8.0, 9.0, 18.0, 13.0, 21.0, 27.0, 33.0, 23.0, 43.0, 35.0, 45.0, 39.0, 51.0, 36.0, 48.0, 53.0, 41.0, 50.0, 38.0, 32.0, 33.0, 34.0, 33.0, 30.0, 23.0, 27.0, 20.0, 21.0, 10.0, 12.0, 13.0, 7.0, 9.0, 4.0, 5.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0005354881286621094, -0.0005178079009056091, -0.0005001276731491089, -0.00048244744539260864, -0.0004647672176361084, -0.00044708698987960815, -0.0004294067621231079, -0.00041172653436660767, -0.0003940463066101074, -0.0003763660788536072, -0.00035868585109710693, -0.0003410056233406067, -0.00032332539558410645, -0.0003056451678276062, -0.00028796494007110596, -0.0002702847123146057, -0.00025260448455810547, -0.00023492425680160522, -0.00021724402904510498, -0.00019956380128860474, -0.0001818835735321045, -0.00016420334577560425, -0.000146523118019104, -0.00012884289026260376, -0.00011116266250610352, -9.348243474960327e-05, -7.580220699310303e-05, -5.812197923660278e-05, -4.044175148010254e-05, -2.2761523723602295e-05, -5.081295967102051e-06, 1.2598931789398193e-05, 3.0279159545898438e-05, 4.795938730239868e-05, 6.563961505889893e-05, 8.331984281539917e-05, 0.00010100007057189941, 0.00011868029832839966, 0.0001363605260848999, 0.00015404075384140015, 0.0001717209815979004, 0.00018940120935440063, 0.00020708143711090088, 0.00022476166486740112, 0.00024244189262390137, 0.0002601221203804016, 0.00027780234813690186, 0.0002954825758934021, 0.00031316280364990234, 0.0003308430314064026, 0.00034852325916290283, 0.0003662034869194031, 0.0003838837146759033, 0.00040156394243240356, 0.0004192441701889038, 0.00043692439794540405, 0.0004546046257019043, 0.00047228485345840454, 0.0004899650812149048, 0.000507645308971405, 0.0005253255367279053, 0.0005430057644844055, 0.0005606859922409058, 0.000578366219997406, 0.0005960464477539062]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 3.0, 5.0, 10.0, 14.0, 11.0, 19.0, 18.0, 29.0, 26.0, 39.0, 65.0, 88.0, 102.0, 159.0, 214.0, 328.0, 623.0, 2474.0, 176678.0, 854008.0, 11435.0, 839.0, 435.0, 240.0, 156.0, 150.0, 108.0, 65.0, 57.0, 39.0, 26.0, 17.0, 15.0, 9.0, 10.0, 9.0, 7.0, 5.0, 3.0, 6.0, 0.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01177978515625, -0.011389970779418945, -0.01100015640258789, -0.010610342025756836, -0.010220527648925781, -0.009830713272094727, -0.009440898895263672, -0.009051084518432617, -0.008661270141601562, -0.008271455764770508, -0.007881641387939453, -0.0074918270111083984, -0.007102012634277344, -0.006712198257446289, -0.006322383880615234, -0.00593256950378418, -0.005542755126953125, -0.00515294075012207, -0.004763126373291016, -0.004373311996459961, -0.003983497619628906, -0.0035936832427978516, -0.003203868865966797, -0.002814054489135742, -0.0024242401123046875, -0.002034425735473633, -0.0016446113586425781, -0.0012547969818115234, -0.0008649826049804688, -0.00047516822814941406, -8.535385131835938e-05, 0.0003044605255126953, 0.00069427490234375, 0.0010840892791748047, 0.0014739036560058594, 0.001863718032836914, 0.0022535324096679688, 0.0026433467864990234, 0.003033161163330078, 0.003422975540161133, 0.0038127899169921875, 0.004202604293823242, 0.004592418670654297, 0.0049822330474853516, 0.005372047424316406, 0.005761861801147461, 0.006151676177978516, 0.00654149055480957, 0.006931304931640625, 0.00732111930847168, 0.007710933685302734, 0.008100748062133789, 0.008490562438964844, 0.008880376815795898, 0.009270191192626953, 0.009660005569458008, 0.010049819946289062, 0.010439634323120117, 0.010829448699951172, 0.011219263076782227, 0.011609077453613281, 0.011998891830444336, 0.01238870620727539, 0.012778520584106445, 0.0131683349609375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 7.0, 44.0, 158.0, 303.0, 340.0, 134.0, 28.0, 5.0], "bins": [-0.0038258617278188467, -0.003762006526812911, -0.003698151558637619, -0.0036342963576316833, -0.0035704411566257477, -0.003506585955619812, -0.00344273098744452, -0.0033788757864385843, -0.0033150205854326487, -0.003251165384426713, -0.003187310416251421, -0.0031234552152454853, -0.0030596000142395496, -0.002995744813233614, -0.002931889845058322, -0.0028680346440523863, -0.0028041796758770943, -0.0027403244748711586, -0.0026764695066958666, -0.002612614305689931, -0.0025487591046839952, -0.0024849039036780596, -0.0024210489355027676, -0.002357193734496832, -0.0022933385334908962, -0.0022294833324849606, -0.0021656283643096685, -0.002101773163303733, -0.002037917962297797, -0.0019740627612918615, -0.0019102077931165695, -0.0018463525921106339, -0.0017824972746893764, -0.0017186421900987625, -0.0016547869890928268, -0.001590931904502213, -0.0015270767034962773, -0.0014632216189056635, -0.0013993664178997278, -0.001335511333309114, -0.0012716562487185001, -0.0012078011641278863, -0.0011439459631219506, -0.0010800908785313368, -0.0010162356775254011, -0.0009523805929347873, -0.0008885254501365125, -0.0008246703073382378, -0.0007608151063323021, -0.0006969599635340273, -0.0006331048207357526, -0.0005692497361451387, -0.0005053945351392031, -0.00044153942144475877, -0.0003776843077503145, -0.0003138291649520397, -0.00024997402215376496, -0.0001861188793554902, -0.00012226375110913068, -5.8408622862771153e-05, 5.446519935503602e-06, 6.930166273377836e-05, 0.00013315677642822266, 0.0001970119192264974, 0.00026086706202477217]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 4.0, 5.0, 10.0, 8.0, 16.0, 18.0, 14.0, 22.0, 20.0, 20.0, 23.0, 30.0, 40.0, 33.0, 25.0, 37.0, 44.0, 34.0, 47.0, 33.0, 39.0, 44.0, 40.0, 19.0, 34.0, 33.0, 31.0, 27.0, 20.0, 34.0, 19.0, 18.0, 23.0, 16.0, 29.0, 16.0, 17.0, 5.0, 13.0, 3.0, 10.0, 6.0, 8.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00032132863998413086, -0.0003111995756626129, -0.00030107051134109497, -0.000290941447019577, -0.0002808123826980591, -0.00027068331837654114, -0.0002605542540550232, -0.00025042518973350525, -0.0002402961254119873, -0.00023016706109046936, -0.00022003799676895142, -0.00020990893244743347, -0.00019977986812591553, -0.00018965080380439758, -0.00017952173948287964, -0.0001693926751613617, -0.00015926361083984375, -0.0001491345465183258, -0.00013900548219680786, -0.00012887641787528992, -0.00011874735355377197, -0.00010861828923225403, -9.848922491073608e-05, -8.836016058921814e-05, -7.82310962677002e-05, -6.810203194618225e-05, -5.797296762466431e-05, -4.784390330314636e-05, -3.771483898162842e-05, -2.7585774660110474e-05, -1.745671033859253e-05, -7.327646017074585e-06, 2.8014183044433594e-06, 1.2930482625961304e-05, 2.3059546947479248e-05, 3.318861126899719e-05, 4.331767559051514e-05, 5.344673991203308e-05, 6.357580423355103e-05, 7.370486855506897e-05, 8.383393287658691e-05, 9.396299719810486e-05, 0.0001040920615196228, 0.00011422112584114075, 0.0001243501901626587, 0.00013447925448417664, 0.00014460831880569458, 0.00015473738312721252, 0.00016486644744873047, 0.0001749955117702484, 0.00018512457609176636, 0.0001952536404132843, 0.00020538270473480225, 0.0002155117690563202, 0.00022564083337783813, 0.00023576989769935608, 0.000245898962020874, 0.00025602802634239197, 0.0002661570906639099, 0.00027628615498542786, 0.0002864152193069458, 0.00029654428362846375, 0.0003066733479499817, 0.00031680241227149963, 0.0003269314765930176]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 3.0, 9.0, 7.0, 11.0, 19.0, 15.0, 18.0, 23.0, 18.0, 26.0, 20.0, 42.0, 39.0, 44.0, 54.0, 47.0, 45.0, 41.0, 47.0, 40.0, 41.0, 48.0, 36.0, 33.0, 33.0, 31.0, 30.0, 26.0, 21.0, 18.0, 24.0, 16.0, 14.0, 15.0, 8.0, 8.0, 10.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.03515625, -4.87908935546875, -4.7230224609375, -4.56695556640625, -4.410888671875, -4.25482177734375, -4.0987548828125, -3.94268798828125, -3.78662109375, -3.63055419921875, -3.4744873046875, -3.31842041015625, -3.162353515625, -3.00628662109375, -2.8502197265625, -2.69415283203125, -2.5380859375, -2.38201904296875, -2.2259521484375, -2.06988525390625, -1.913818359375, -1.75775146484375, -1.6016845703125, -1.44561767578125, -1.28955078125, -1.13348388671875, -0.9774169921875, -0.82135009765625, -0.665283203125, -0.50921630859375, -0.3531494140625, -0.19708251953125, -0.041015625, 0.11505126953125, 0.2711181640625, 0.42718505859375, 0.583251953125, 0.73931884765625, 0.8953857421875, 1.05145263671875, 1.20751953125, 1.36358642578125, 1.5196533203125, 1.67572021484375, 1.831787109375, 1.98785400390625, 2.1439208984375, 2.29998779296875, 2.4560546875, 2.61212158203125, 2.7681884765625, 2.92425537109375, 3.080322265625, 3.23638916015625, 3.3924560546875, 3.54852294921875, 3.70458984375, 3.86065673828125, 4.0167236328125, 4.17279052734375, 4.328857421875, 4.48492431640625, 4.6409912109375, 4.79705810546875, 4.953125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 7.0, 12.0, 14.0, 11.0, 23.0, 32.0, 37.0, 44.0, 84.0, 122.0, 178.0, 371.0, 682.0, 1398.0, 2739.0, 5711.0, 11811.0, 27437.0, 72034.0, 239917.0, 418224.0, 172983.0, 53999.0, 21579.0, 9778.0, 4613.0, 2151.0, 1074.0, 636.0, 325.0, 187.0, 97.0, 66.0, 45.0, 34.0, 24.0, 19.0, 15.0, 10.0, 8.0, 10.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.58203125, -5.404052734375, -5.22607421875, -5.048095703125, -4.8701171875, -4.692138671875, -4.51416015625, -4.336181640625, -4.158203125, -3.980224609375, -3.80224609375, -3.624267578125, -3.4462890625, -3.268310546875, -3.09033203125, -2.912353515625, -2.734375, -2.556396484375, -2.37841796875, -2.200439453125, -2.0224609375, -1.844482421875, -1.66650390625, -1.488525390625, -1.310546875, -1.132568359375, -0.95458984375, -0.776611328125, -0.5986328125, -0.420654296875, -0.24267578125, -0.064697265625, 0.11328125, 0.291259765625, 0.46923828125, 0.647216796875, 0.8251953125, 1.003173828125, 1.18115234375, 1.359130859375, 1.537109375, 1.715087890625, 1.89306640625, 2.071044921875, 2.2490234375, 2.427001953125, 2.60498046875, 2.782958984375, 2.9609375, 3.138916015625, 3.31689453125, 3.494873046875, 3.6728515625, 3.850830078125, 4.02880859375, 4.206787109375, 4.384765625, 4.562744140625, 4.74072265625, 4.918701171875, 5.0966796875, 5.274658203125, 5.45263671875, 5.630615234375, 5.80859375]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 2.0, 9.0, 7.0, 11.0, 9.0, 10.0, 16.0, 13.0, 30.0, 22.0, 24.0, 27.0, 30.0, 44.0, 53.0, 52.0, 103.0, 165.0, 1413.0, 364.0, 164.0, 76.0, 59.0, 45.0, 42.0, 34.0, 27.0, 26.0, 31.0, 27.0, 12.0, 12.0, 16.0, 11.0, 12.0, 10.0, 5.0, 8.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-19.109375, -18.57763671875, -18.0458984375, -17.51416015625, -16.982421875, -16.45068359375, -15.9189453125, -15.38720703125, -14.85546875, -14.32373046875, -13.7919921875, -13.26025390625, -12.728515625, -12.19677734375, -11.6650390625, -11.13330078125, -10.6015625, -10.06982421875, -9.5380859375, -9.00634765625, -8.474609375, -7.94287109375, -7.4111328125, -6.87939453125, -6.34765625, -5.81591796875, -5.2841796875, -4.75244140625, -4.220703125, -3.68896484375, -3.1572265625, -2.62548828125, -2.09375, -1.56201171875, -1.0302734375, -0.49853515625, 0.033203125, 0.56494140625, 1.0966796875, 1.62841796875, 2.16015625, 2.69189453125, 3.2236328125, 3.75537109375, 4.287109375, 4.81884765625, 5.3505859375, 5.88232421875, 6.4140625, 6.94580078125, 7.4775390625, 8.00927734375, 8.541015625, 9.07275390625, 9.6044921875, 10.13623046875, 10.66796875, 11.19970703125, 11.7314453125, 12.26318359375, 12.794921875, 13.32666015625, 13.8583984375, 14.39013671875, 14.921875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 8.0, 13.0, 14.0, 8.0, 26.0, 41.0, 41.0, 61.0, 75.0, 123.0, 188.0, 405.0, 836.0, 9669.0, 3045399.0, 85995.0, 1619.0, 453.0, 239.0, 152.0, 90.0, 66.0, 41.0, 28.0, 32.0, 23.0, 9.0, 11.0, 6.0, 5.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.09375, -46.52734375, -44.9609375, -43.39453125, -41.828125, -40.26171875, -38.6953125, -37.12890625, -35.5625, -33.99609375, -32.4296875, -30.86328125, -29.296875, -27.73046875, -26.1640625, -24.59765625, -23.03125, -21.46484375, -19.8984375, -18.33203125, -16.765625, -15.19921875, -13.6328125, -12.06640625, -10.5, -8.93359375, -7.3671875, -5.80078125, -4.234375, -2.66796875, -1.1015625, 0.46484375, 2.03125, 3.59765625, 5.1640625, 6.73046875, 8.296875, 9.86328125, 11.4296875, 12.99609375, 14.5625, 16.12890625, 17.6953125, 19.26171875, 20.828125, 22.39453125, 23.9609375, 25.52734375, 27.09375, 28.66015625, 30.2265625, 31.79296875, 33.359375, 34.92578125, 36.4921875, 38.05859375, 39.625, 41.19140625, 42.7578125, 44.32421875, 45.890625, 47.45703125, 49.0234375, 50.58984375, 52.15625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 13.0, 38.0, 110.0, 216.0, 274.0, 216.0, 96.0, 37.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.981849670410156, -31.286474227905273, -29.59109878540039, -27.895723342895508, -26.200347900390625, -24.50497055053711, -22.80959701538086, -21.114219665527344, -19.418846130371094, -17.72347068786621, -16.028095245361328, -14.332719802856445, -12.637344360351562, -10.941967964172363, -9.24659252166748, -7.551217079162598, -5.855840682983398, -4.160465240478516, -2.4650895595550537, -0.7697138786315918, 0.925661563873291, 2.621037483215332, 4.316412925720215, 6.011788368225098, 7.7071638107299805, 9.402539253234863, 11.097914695739746, 12.793291091918945, 14.488666534423828, 16.18404197692871, 17.879417419433594, 19.574792861938477, 21.27016830444336, 22.965543746948242, 24.660919189453125, 26.356294631958008, 28.05167007446289, 29.747047424316406, 31.442420959472656, 33.13779830932617, 34.83317184448242, 36.52854919433594, 38.22392272949219, 39.9193000793457, 41.61467361450195, 43.31005096435547, 45.00542449951172, 46.700801849365234, 48.39617919921875, 50.091556549072266, 51.786930084228516, 53.48230743408203, 55.17768096923828, 56.8730583190918, 58.56843185424805, 60.26380920410156, 61.95918273925781, 63.65456008911133, 65.34993743896484, 67.0453109741211, 68.74068450927734, 70.4360580444336, 72.13143920898438, 73.82681274414062, 75.52218627929688]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 10.0, 6.0, 8.0, 9.0, 8.0, 19.0, 12.0, 15.0, 21.0, 30.0, 29.0, 37.0, 32.0, 28.0, 33.0, 36.0, 49.0, 37.0, 49.0, 53.0, 36.0, 45.0, 34.0, 30.0, 41.0, 30.0, 47.0, 37.0, 22.0, 18.0, 17.0, 20.0, 19.0, 22.0, 15.0, 12.0, 6.0, 9.0, 3.0, 9.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-47.60844421386719, -46.23941421508789, -44.870384216308594, -43.5013542175293, -42.13232421875, -40.7632942199707, -39.394264221191406, -38.025230407714844, -36.65620422363281, -35.287174224853516, -33.91814422607422, -32.54911422729492, -31.180084228515625, -29.811054229736328, -28.4420223236084, -27.0729923248291, -25.703960418701172, -24.334930419921875, -22.965900421142578, -21.59687042236328, -20.227840423583984, -18.858810424804688, -17.489778518676758, -16.12074851989746, -14.751718521118164, -13.382688522338867, -12.01365852355957, -10.644627571105957, -9.27559757232666, -7.906567573547363, -6.53753662109375, -5.168506622314453, -3.7994728088378906, -2.4304425716400146, -1.0614123344421387, 0.3076181411743164, 1.6766481399536133, 3.04567813873291, 4.414709091186523, 5.78373908996582, 7.152769088745117, 8.521799087524414, 9.890829086303711, 11.259860038757324, 12.628890037536621, 13.997920036315918, 15.366950988769531, 16.735980987548828, 18.105010986328125, 19.474040985107422, 20.84307098388672, 22.212100982666016, 23.581130981445312, 24.95016098022461, 26.31919288635254, 27.688222885131836, 29.057252883911133, 30.42628288269043, 31.795312881469727, 33.164344787597656, 34.53337478637695, 35.90240478515625, 37.27143478393555, 38.640464782714844, 40.00949478149414]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 6.0, 4.0, 5.0, 13.0, 12.0, 11.0, 18.0, 20.0, 17.0, 20.0, 27.0, 32.0, 38.0, 40.0, 44.0, 41.0, 46.0, 46.0, 34.0, 52.0, 49.0, 46.0, 42.0, 36.0, 29.0, 35.0, 33.0, 29.0, 24.0, 23.0, 16.0, 28.0, 15.0, 15.0, 10.0, 14.0, 7.0, 10.0, 0.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.1875, -5.0220947265625, -4.856689453125, -4.6912841796875, -4.52587890625, -4.3604736328125, -4.195068359375, -4.0296630859375, -3.8642578125, -3.6988525390625, -3.533447265625, -3.3680419921875, -3.20263671875, -3.0372314453125, -2.871826171875, -2.7064208984375, -2.541015625, -2.3756103515625, -2.210205078125, -2.0447998046875, -1.87939453125, -1.7139892578125, -1.548583984375, -1.3831787109375, -1.2177734375, -1.0523681640625, -0.886962890625, -0.7215576171875, -0.55615234375, -0.3907470703125, -0.225341796875, -0.0599365234375, 0.10546875, 0.2708740234375, 0.436279296875, 0.6016845703125, 0.76708984375, 0.9324951171875, 1.097900390625, 1.2633056640625, 1.4287109375, 1.5941162109375, 1.759521484375, 1.9249267578125, 2.09033203125, 2.2557373046875, 2.421142578125, 2.5865478515625, 2.751953125, 2.9173583984375, 3.082763671875, 3.2481689453125, 3.41357421875, 3.5789794921875, 3.744384765625, 3.9097900390625, 4.0751953125, 4.2406005859375, 4.406005859375, 4.5714111328125, 4.73681640625, 4.9022216796875, 5.067626953125, 5.2330322265625, 5.3984375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 10.0, 6.0, 9.0, 6.0, 11.0, 7.0, 13.0, 21.0, 20.0, 23.0, 32.0, 40.0, 37.0, 63.0, 63.0, 109.0, 168.0, 351.0, 1070.0, 14172.0, 1299243.0, 2834428.0, 41576.0, 1712.0, 408.0, 180.0, 119.0, 78.0, 66.0, 45.0, 41.0, 31.0, 31.0, 17.0, 15.0, 13.0, 13.0, 14.0, 6.0, 10.0, 1.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.890625, -23.123291015625, -22.35595703125, -21.588623046875, -20.8212890625, -20.053955078125, -19.28662109375, -18.519287109375, -17.751953125, -16.984619140625, -16.21728515625, -15.449951171875, -14.6826171875, -13.915283203125, -13.14794921875, -12.380615234375, -11.61328125, -10.845947265625, -10.07861328125, -9.311279296875, -8.5439453125, -7.776611328125, -7.00927734375, -6.241943359375, -5.474609375, -4.707275390625, -3.93994140625, -3.172607421875, -2.4052734375, -1.637939453125, -0.87060546875, -0.103271484375, 0.6640625, 1.431396484375, 2.19873046875, 2.966064453125, 3.7333984375, 4.500732421875, 5.26806640625, 6.035400390625, 6.802734375, 7.570068359375, 8.33740234375, 9.104736328125, 9.8720703125, 10.639404296875, 11.40673828125, 12.174072265625, 12.94140625, 13.708740234375, 14.47607421875, 15.243408203125, 16.0107421875, 16.778076171875, 17.54541015625, 18.312744140625, 19.080078125, 19.847412109375, 20.61474609375, 21.382080078125, 22.1494140625, 22.916748046875, 23.68408203125, 24.451416015625, 25.21875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 6.0, 6.0, 15.0, 27.0, 27.0, 43.0, 91.0, 98.0, 177.0, 277.0, 406.0, 516.0, 611.0, 605.0, 408.0, 249.0, 200.0, 105.0, 89.0, 44.0, 31.0, 12.0, 13.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.625, -13.091552734375, -12.55810546875, -12.024658203125, -11.4912109375, -10.957763671875, -10.42431640625, -9.890869140625, -9.357421875, -8.823974609375, -8.29052734375, -7.757080078125, -7.2236328125, -6.690185546875, -6.15673828125, -5.623291015625, -5.08984375, -4.556396484375, -4.02294921875, -3.489501953125, -2.9560546875, -2.422607421875, -1.88916015625, -1.355712890625, -0.822265625, -0.288818359375, 0.24462890625, 0.778076171875, 1.3115234375, 1.844970703125, 2.37841796875, 2.911865234375, 3.4453125, 3.978759765625, 4.51220703125, 5.045654296875, 5.5791015625, 6.112548828125, 6.64599609375, 7.179443359375, 7.712890625, 8.246337890625, 8.77978515625, 9.313232421875, 9.8466796875, 10.380126953125, 10.91357421875, 11.447021484375, 11.98046875, 12.513916015625, 13.04736328125, 13.580810546875, 14.1142578125, 14.647705078125, 15.18115234375, 15.714599609375, 16.248046875, 16.781494140625, 17.31494140625, 17.848388671875, 18.3818359375, 18.915283203125, 19.44873046875, 19.982177734375, 20.515625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 5.0, 15.0, 18.0, 23.0, 45.0, 70.0, 119.0, 178.0, 250.0, 450.0, 970.0, 8430.0, 1497427.0, 2670153.0, 13627.0, 1191.0, 507.0, 247.0, 185.0, 118.0, 77.0, 39.0, 56.0, 21.0, 20.0, 15.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.28125, -55.81494140625, -54.3486328125, -52.88232421875, -51.416015625, -49.94970703125, -48.4833984375, -47.01708984375, -45.55078125, -44.08447265625, -42.6181640625, -41.15185546875, -39.685546875, -38.21923828125, -36.7529296875, -35.28662109375, -33.8203125, -32.35400390625, -30.8876953125, -29.42138671875, -27.955078125, -26.48876953125, -25.0224609375, -23.55615234375, -22.08984375, -20.62353515625, -19.1572265625, -17.69091796875, -16.224609375, -14.75830078125, -13.2919921875, -11.82568359375, -10.359375, -8.89306640625, -7.4267578125, -5.96044921875, -4.494140625, -3.02783203125, -1.5615234375, -0.09521484375, 1.37109375, 2.83740234375, 4.3037109375, 5.77001953125, 7.236328125, 8.70263671875, 10.1689453125, 11.63525390625, 13.1015625, 14.56787109375, 16.0341796875, 17.50048828125, 18.966796875, 20.43310546875, 21.8994140625, 23.36572265625, 24.83203125, 26.29833984375, 27.7646484375, 29.23095703125, 30.697265625, 32.16357421875, 33.6298828125, 35.09619140625, 36.5625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 15.0, 26.0, 46.0, 51.0, 87.0, 112.0, 109.0, 88.0, 97.0, 106.0, 78.0, 59.0, 47.0, 30.0, 13.0, 15.0, 10.0, 8.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.70492172241211, -33.90251922607422, -32.100120544433594, -30.297718048095703, -28.495315551757812, -26.692914962768555, -24.890514373779297, -23.088111877441406, -21.28571128845215, -19.48331069946289, -17.680908203125, -15.878507614135742, -14.076106071472168, -12.273704528808594, -10.471303939819336, -8.668902397155762, -6.8665008544921875, -5.064099311828613, -3.2616982460021973, -1.4592971801757812, 0.34310436248779297, 2.145505905151367, 3.947906494140625, 5.750308036804199, 7.552709579467773, 9.355111122131348, 11.157512664794922, 12.95991325378418, 14.762314796447754, 16.564716339111328, 18.367116928100586, 20.169517517089844, 21.971923828125, 23.774324417114258, 25.57672691345215, 27.379127502441406, 29.181529998779297, 30.983930587768555, 32.78633117675781, 34.5887336730957, 36.391136169433594, 38.193538665771484, 39.99593734741211, 41.79833984375, 43.60074234008789, 45.40314483642578, 47.205543518066406, 49.0079460144043, 50.81034469604492, 52.61274719238281, 54.41514587402344, 56.21754837036133, 58.01995086669922, 59.822349548339844, 61.624752044677734, 63.427154541015625, 65.22955322265625, 67.03195190429688, 68.83435821533203, 70.63675689697266, 72.43915557861328, 74.24156188964844, 76.04396057128906, 77.84635925292969, 79.64876556396484]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 8.0, 8.0, 9.0, 7.0, 9.0, 18.0, 15.0, 12.0, 13.0, 21.0, 28.0, 26.0, 21.0, 28.0, 34.0, 30.0, 38.0, 40.0, 36.0, 41.0, 43.0, 46.0, 42.0, 47.0, 47.0, 33.0, 31.0, 33.0, 31.0, 25.0, 35.0, 25.0, 18.0, 24.0, 13.0, 15.0, 9.0, 16.0, 9.0, 9.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.850093841552734, -41.62049102783203, -40.39088821411133, -39.16128921508789, -37.93168640136719, -36.702083587646484, -35.47248077392578, -34.24287796020508, -33.013275146484375, -31.783672332763672, -30.5540714263916, -29.3244686126709, -28.094867706298828, -26.865264892578125, -25.635662078857422, -24.40605926513672, -23.17646026611328, -21.946857452392578, -20.717256546020508, -19.487653732299805, -18.258052825927734, -17.02845001220703, -15.798847198486328, -14.569245338439941, -13.339643478393555, -12.110041618347168, -10.880439758300781, -9.650836944580078, -8.421235084533691, -7.191633224487305, -5.96203088760376, -4.732428550720215, -3.5028228759765625, -2.2732207775115967, -1.0436186790466309, 0.18598341941833496, 1.4155855178833008, 2.6451873779296875, 3.8747897148132324, 5.104392051696777, 6.333993911743164, 7.563595771789551, 8.793197631835938, 10.02280044555664, 11.252402305603027, 12.482004165649414, 13.711606979370117, 14.941208839416504, 16.17081069946289, 17.400413513183594, 18.630014419555664, 19.859617233276367, 21.089218139648438, 22.31882095336914, 23.548423767089844, 24.778026580810547, 26.007627487182617, 27.23723030090332, 28.46683120727539, 29.696434020996094, 30.926036834716797, 32.1556396484375, 33.38523864746094, 34.61484146118164, 35.844444274902344]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 1.0, 9.0, 6.0, 9.0, 10.0, 10.0, 7.0, 22.0, 23.0, 21.0, 18.0, 37.0, 30.0, 33.0, 53.0, 41.0, 43.0, 40.0, 47.0, 47.0, 39.0, 37.0, 34.0, 41.0, 35.0, 44.0, 26.0, 31.0, 30.0, 40.0, 21.0, 21.0, 16.0, 17.0, 10.0, 11.0, 8.0, 11.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3359375, -5.16973876953125, -5.0035400390625, -4.83734130859375, -4.671142578125, -4.50494384765625, -4.3387451171875, -4.17254638671875, -4.00634765625, -3.84014892578125, -3.6739501953125, -3.50775146484375, -3.341552734375, -3.17535400390625, -3.0091552734375, -2.84295654296875, -2.6767578125, -2.51055908203125, -2.3443603515625, -2.17816162109375, -2.011962890625, -1.84576416015625, -1.6795654296875, -1.51336669921875, -1.34716796875, -1.18096923828125, -1.0147705078125, -0.84857177734375, -0.682373046875, -0.51617431640625, -0.3499755859375, -0.18377685546875, -0.017578125, 0.14862060546875, 0.3148193359375, 0.48101806640625, 0.647216796875, 0.81341552734375, 0.9796142578125, 1.14581298828125, 1.31201171875, 1.47821044921875, 1.6444091796875, 1.81060791015625, 1.976806640625, 2.14300537109375, 2.3092041015625, 2.47540283203125, 2.6416015625, 2.80780029296875, 2.9739990234375, 3.14019775390625, 3.306396484375, 3.47259521484375, 3.6387939453125, 3.80499267578125, 3.97119140625, 4.13739013671875, 4.3035888671875, 4.46978759765625, 4.635986328125, 4.80218505859375, 4.9683837890625, 5.13458251953125, 5.30078125]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 2.0, 6.0, 13.0, 20.0, 10.0, 28.0, 40.0, 57.0, 94.0, 142.0, 194.0, 283.0, 395.0, 609.0, 937.0, 1342.0, 1940.0, 3015.0, 4515.0, 7028.0, 10595.0, 16288.0, 26074.0, 41232.0, 69284.0, 118106.0, 219285.0, 221203.0, 120018.0, 69486.0, 42070.0, 26058.0, 16616.0, 10645.0, 6982.0, 4630.0, 3063.0, 2040.0, 1331.0, 903.0, 631.0, 447.0, 279.0, 177.0, 148.0, 94.0, 64.0, 39.0, 38.0, 25.0, 14.0, 7.0, 8.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80419921875, -0.7782669067382812, -0.7523345947265625, -0.7264022827148438, -0.700469970703125, -0.6745376586914062, -0.6486053466796875, -0.6226730346679688, -0.59674072265625, -0.5708084106445312, -0.5448760986328125, -0.5189437866210938, -0.493011474609375, -0.46707916259765625, -0.4411468505859375, -0.41521453857421875, -0.3892822265625, -0.36334991455078125, -0.3374176025390625, -0.31148529052734375, -0.285552978515625, -0.25962066650390625, -0.2336883544921875, -0.20775604248046875, -0.18182373046875, -0.15589141845703125, -0.1299591064453125, -0.10402679443359375, -0.078094482421875, -0.05216217041015625, -0.0262298583984375, -0.00029754638671875, 0.025634765625, 0.05156707763671875, 0.0774993896484375, 0.10343170166015625, 0.129364013671875, 0.15529632568359375, 0.1812286376953125, 0.20716094970703125, 0.23309326171875, 0.25902557373046875, 0.2849578857421875, 0.31089019775390625, 0.336822509765625, 0.36275482177734375, 0.3886871337890625, 0.41461944580078125, 0.4405517578125, 0.46648406982421875, 0.4924163818359375, 0.5183486938476562, 0.544281005859375, 0.5702133178710938, 0.5961456298828125, 0.6220779418945312, 0.64801025390625, 0.6739425659179688, 0.6998748779296875, 0.7258071899414062, 0.751739501953125, 0.7776718139648438, 0.8036041259765625, 0.8295364379882812, 0.85546875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 12.0, 2.0, 16.0, 14.0, 18.0, 22.0, 19.0, 16.0, 22.0, 34.0, 26.0, 42.0, 31.0, 33.0, 29.0, 37.0, 49.0, 34.0, 39.0, 1072.0, 44.0, 41.0, 41.0, 34.0, 41.0, 27.0, 28.0, 25.0, 25.0, 18.0, 25.0, 16.0, 11.0, 16.0, 18.0, 11.0, 13.0, 2.0, 12.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.009765625, -2.909881591796875, -2.80999755859375, -2.710113525390625, -2.6102294921875, -2.510345458984375, -2.41046142578125, -2.310577392578125, -2.210693359375, -2.110809326171875, -2.01092529296875, -1.911041259765625, -1.8111572265625, -1.711273193359375, -1.61138916015625, -1.511505126953125, -1.41162109375, -1.311737060546875, -1.21185302734375, -1.111968994140625, -1.0120849609375, -0.912200927734375, -0.81231689453125, -0.712432861328125, -0.612548828125, -0.512664794921875, -0.41278076171875, -0.312896728515625, -0.2130126953125, -0.113128662109375, -0.01324462890625, 0.086639404296875, 0.1865234375, 0.286407470703125, 0.38629150390625, 0.486175537109375, 0.5860595703125, 0.685943603515625, 0.78582763671875, 0.885711669921875, 0.985595703125, 1.085479736328125, 1.18536376953125, 1.285247802734375, 1.3851318359375, 1.485015869140625, 1.58489990234375, 1.684783935546875, 1.78466796875, 1.884552001953125, 1.98443603515625, 2.084320068359375, 2.1842041015625, 2.284088134765625, 2.38397216796875, 2.483856201171875, 2.583740234375, 2.683624267578125, 2.78350830078125, 2.883392333984375, 2.9832763671875, 3.083160400390625, 3.18304443359375, 3.282928466796875, 3.3828125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 11.0, 12.0, 14.0, 30.0, 37.0, 48.0, 72.0, 79.0, 126.0, 177.0, 270.0, 392.0, 553.0, 902.0, 1310.0, 2096.0, 3181.0, 5030.0, 8108.0, 12770.0, 20854.0, 33885.0, 57388.0, 104002.0, 213222.0, 1322719.0, 133329.0, 69633.0, 41021.0, 24454.0, 15056.0, 9353.0, 5923.0, 3796.0, 2432.0, 1559.0, 1053.0, 704.0, 483.0, 347.0, 232.0, 170.0, 99.0, 69.0, 38.0, 29.0, 24.0, 8.0, 14.0, 8.0, 4.0, 1.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.875, -0.8469390869140625, -0.818878173828125, -0.7908172607421875, -0.76275634765625, -0.7346954345703125, -0.706634521484375, -0.6785736083984375, -0.6505126953125, -0.6224517822265625, -0.594390869140625, -0.5663299560546875, -0.53826904296875, -0.5102081298828125, -0.482147216796875, -0.4540863037109375, -0.426025390625, -0.3979644775390625, -0.369903564453125, -0.3418426513671875, -0.31378173828125, -0.2857208251953125, -0.257659912109375, -0.2295989990234375, -0.2015380859375, -0.1734771728515625, -0.145416259765625, -0.1173553466796875, -0.08929443359375, -0.0612335205078125, -0.033172607421875, -0.0051116943359375, 0.02294921875, 0.0510101318359375, 0.079071044921875, 0.1071319580078125, 0.13519287109375, 0.1632537841796875, 0.191314697265625, 0.2193756103515625, 0.2474365234375, 0.2754974365234375, 0.303558349609375, 0.3316192626953125, 0.35968017578125, 0.3877410888671875, 0.415802001953125, 0.4438629150390625, 0.471923828125, 0.4999847412109375, 0.528045654296875, 0.5561065673828125, 0.58416748046875, 0.6122283935546875, 0.640289306640625, 0.6683502197265625, 0.6964111328125, 0.7244720458984375, 0.752532958984375, 0.7805938720703125, 0.80865478515625, 0.8367156982421875, 0.864776611328125, 0.8928375244140625, 0.9208984375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 12.0, 10.0, 14.0, 7.0, 10.0, 10.0, 17.0, 17.0, 42.0, 48.0, 55.0, 64.0, 63.0, 85.0, 82.0, 74.0, 71.0, 61.0, 37.0, 31.0, 26.0, 28.0, 19.0, 10.0, 15.0, 7.0, 6.0, 12.0, 9.0, 8.0, 4.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0008192062377929688, -0.0007879436016082764, -0.000756680965423584, -0.0007254183292388916, -0.0006941556930541992, -0.0006628930568695068, -0.0006316304206848145, -0.0006003677845001221, -0.0005691051483154297, -0.0005378425121307373, -0.0005065798759460449, -0.00047531723976135254, -0.00044405460357666016, -0.0004127919673919678, -0.0003815293312072754, -0.000350266695022583, -0.0003190040588378906, -0.00028774142265319824, -0.00025647878646850586, -0.00022521615028381348, -0.0001939535140991211, -0.0001626908779144287, -0.00013142824172973633, -0.00010016560554504395, -6.890296936035156e-05, -3.764033317565918e-05, -6.377696990966797e-06, 2.4884939193725586e-05, 5.614757537841797e-05, 8.741021156311035e-05, 0.00011867284774780273, 0.00014993548393249512, 0.0001811981201171875, 0.00021246075630187988, 0.00024372339248657227, 0.00027498602867126465, 0.00030624866485595703, 0.0003375113010406494, 0.0003687739372253418, 0.0004000365734100342, 0.00043129920959472656, 0.00046256184577941895, 0.0004938244819641113, 0.0005250871181488037, 0.0005563497543334961, 0.0005876123905181885, 0.0006188750267028809, 0.0006501376628875732, 0.0006814002990722656, 0.000712662935256958, 0.0007439255714416504, 0.0007751882076263428, 0.0008064508438110352, 0.0008377134799957275, 0.0008689761161804199, 0.0009002387523651123, 0.0009315013885498047, 0.0009627640247344971, 0.0009940266609191895, 0.0010252892971038818, 0.0010565519332885742, 0.0010878145694732666, 0.001119077205657959, 0.0011503398418426514, 0.0011816024780273438]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 14.0, 10.0, 21.0, 12.0, 22.0, 29.0, 55.0, 72.0, 143.0, 144.0, 245.0, 439.0, 1073.0, 63207.0, 975877.0, 5471.0, 672.0, 333.0, 202.0, 135.0, 95.0, 65.0, 58.0, 27.0, 23.0, 21.0, 15.0, 15.0, 10.0, 9.0, 1.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.023406982421875, -0.022795677185058594, -0.022184371948242188, -0.02157306671142578, -0.020961761474609375, -0.02035045623779297, -0.019739151000976562, -0.019127845764160156, -0.01851654052734375, -0.017905235290527344, -0.017293930053710938, -0.01668262481689453, -0.016071319580078125, -0.015460014343261719, -0.014848709106445312, -0.014237403869628906, -0.0136260986328125, -0.013014793395996094, -0.012403488159179688, -0.011792182922363281, -0.011180877685546875, -0.010569572448730469, -0.009958267211914062, -0.009346961975097656, -0.00873565673828125, -0.008124351501464844, -0.0075130462646484375, -0.006901741027832031, -0.006290435791015625, -0.005679130554199219, -0.0050678253173828125, -0.004456520080566406, -0.00384521484375, -0.0032339096069335938, -0.0026226043701171875, -0.0020112991333007812, -0.001399993896484375, -0.0007886886596679688, -0.0001773834228515625, 0.00043392181396484375, 0.00104522705078125, 0.0016565322875976562, 0.0022678375244140625, 0.0028791427612304688, 0.003490447998046875, 0.004101753234863281, 0.0047130584716796875, 0.005324363708496094, 0.0059356689453125, 0.006546974182128906, 0.0071582794189453125, 0.007769584655761719, 0.008380889892578125, 0.008992195129394531, 0.009603500366210938, 0.010214805603027344, 0.01082611083984375, 0.011437416076660156, 0.012048721313476562, 0.012660026550292969, 0.013271331787109375, 0.013882637023925781, 0.014493942260742188, 0.015105247497558594, 0.015716552734375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 5.0, 14.0, 86.0, 302.0, 398.0, 172.0, 34.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022419746965169907, -0.002165189478546381, -0.0020884042605757713, -0.0020116190426051617, -0.001934833824634552, -0.0018580486066639423, -0.0017812633886933327, -0.001704478170722723, -0.0016276929527521133, -0.0015509077347815037, -0.001474122516810894, -0.0013973372988402843, -0.0013205520808696747, -0.001243766862899065, -0.0011669816449284554, -0.0010901964269578457, -0.001013411208987236, -0.0009366259910166264, -0.0008598407730460167, -0.000783055555075407, -0.0007062703371047974, -0.0006294851191341877, -0.000552699901163578, -0.00047591468319296837, -0.0003991294652223587, -0.00032234424725174904, -0.0002455590292811394, -0.0001687738113105297, -9.198859333992004e-05, -1.5203375369310379e-05, 6.158184260129929e-05, 0.00013836706057190895, 0.00021515251137316227, 0.00029193772934377193, 0.0003687229473143816, 0.00044550816528499126, 0.0005222933832556009, 0.0005990786012262106, 0.0006758638191968203, 0.0007526490371674299, 0.0008294342551380396, 0.0009062194731086493, 0.000983004691079259, 0.0010597899090498686, 0.0011365751270204782, 0.001213360344991088, 0.0012901455629616976, 0.0013669307809323072, 0.001443715998902917, 0.0015205012168735266, 0.0015972864348441362, 0.001674071652814746, 0.0017508568707853556, 0.0018276420887559652, 0.001904427306726575, 0.0019812125246971846, 0.0020579977426677942, 0.002134782960638404, 0.0022115681786090136, 0.0022883533965796232, 0.002365138614550233, 0.0024419238325208426, 0.0025187090504914522, 0.002595494268462062, 0.0026722794864326715]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 11.0, 11.0, 11.0, 10.0, 17.0, 6.0, 25.0, 26.0, 30.0, 31.0, 22.0, 37.0, 44.0, 40.0, 37.0, 42.0, 44.0, 39.0, 53.0, 47.0, 41.0, 38.0, 38.0, 52.0, 32.0, 38.0, 23.0, 22.0, 22.0, 18.0, 21.0, 11.0, 9.0, 7.0, 12.0, 6.0, 8.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.000596165657043457, -0.0005794772878289223, -0.0005627889186143875, -0.0005461005493998528, -0.000529412180185318, -0.0005127238109707832, -0.0004960354417562485, -0.0004793470725417137, -0.00046265870332717896, -0.0004459703341126442, -0.00042928196489810944, -0.0004125935956835747, -0.0003959052264690399, -0.00037921685725450516, -0.0003625284880399704, -0.00034584011882543564, -0.0003291517496109009, -0.0003124633803963661, -0.00029577501118183136, -0.0002790866419672966, -0.00026239827275276184, -0.0002457099035382271, -0.00022902153432369232, -0.00021233316510915756, -0.0001956447958946228, -0.00017895642668008804, -0.00016226805746555328, -0.00014557968825101852, -0.00012889131903648376, -0.000112202949821949, -9.551458060741425e-05, -7.882621139287949e-05, -6.213784217834473e-05, -4.544947296380997e-05, -2.8761103749275208e-05, -1.2072734534740448e-05, 4.6156346797943115e-06, 2.130400389432907e-05, 3.799237310886383e-05, 5.468074232339859e-05, 7.136911153793335e-05, 8.805748075246811e-05, 0.00010474584996700287, 0.00012143421918153763, 0.0001381225883960724, 0.00015481095761060715, 0.0001714993268251419, 0.00018818769603967667, 0.00020487606525421143, 0.00022156443446874619, 0.00023825280368328094, 0.0002549411728978157, 0.00027162954211235046, 0.0002883179113268852, 0.00030500628054142, 0.00032169464975595474, 0.0003383830189704895, 0.00035507138818502426, 0.000371759757399559, 0.0003884481266140938, 0.00040513649582862854, 0.0004218248650431633, 0.00043851323425769806, 0.0004552016034722328, 0.0004718899726867676]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 6.0, 1.0, 9.0, 6.0, 9.0, 10.0, 10.0, 7.0, 22.0, 23.0, 21.0, 19.0, 36.0, 30.0, 33.0, 53.0, 41.0, 43.0, 40.0, 47.0, 47.0, 39.0, 37.0, 34.0, 41.0, 35.0, 44.0, 26.0, 31.0, 30.0, 40.0, 21.0, 21.0, 16.0, 17.0, 10.0, 11.0, 8.0, 11.0, 5.0, 8.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.3359375, -5.16973876953125, -5.0035400390625, -4.83734130859375, -4.671142578125, -4.50494384765625, -4.3387451171875, -4.17254638671875, -4.00634765625, -3.84014892578125, -3.6739501953125, -3.50775146484375, -3.341552734375, -3.17535400390625, -3.0091552734375, -2.84295654296875, -2.6767578125, -2.51055908203125, -2.3443603515625, -2.17816162109375, -2.011962890625, -1.84576416015625, -1.6795654296875, -1.51336669921875, -1.34716796875, -1.18096923828125, -1.0147705078125, -0.84857177734375, -0.682373046875, -0.51617431640625, -0.3499755859375, -0.18377685546875, -0.017578125, 0.14862060546875, 0.3148193359375, 0.48101806640625, 0.647216796875, 0.81341552734375, 0.9796142578125, 1.14581298828125, 1.31201171875, 1.47821044921875, 1.6444091796875, 1.81060791015625, 1.976806640625, 2.14300537109375, 2.3092041015625, 2.47540283203125, 2.6416015625, 2.80780029296875, 2.9739990234375, 3.14019775390625, 3.306396484375, 3.47259521484375, 3.6387939453125, 3.80499267578125, 3.97119140625, 4.13739013671875, 4.3035888671875, 4.46978759765625, 4.635986328125, 4.80218505859375, 4.9683837890625, 5.13458251953125, 5.30078125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 1.0, 10.0, 8.0, 15.0, 17.0, 31.0, 42.0, 71.0, 89.0, 173.0, 245.0, 403.0, 681.0, 1279.0, 2385.0, 4403.0, 8478.0, 16121.0, 30568.0, 60865.0, 140042.0, 317547.0, 256397.0, 106921.0, 48537.0, 24905.0, 13124.0, 7008.0, 3720.0, 1921.0, 1038.0, 585.0, 351.0, 210.0, 132.0, 65.0, 50.0, 25.0, 17.0, 24.0, 9.0, 8.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.375, -4.23760986328125, -4.1002197265625, -3.96282958984375, -3.825439453125, -3.68804931640625, -3.5506591796875, -3.41326904296875, -3.27587890625, -3.13848876953125, -3.0010986328125, -2.86370849609375, -2.726318359375, -2.58892822265625, -2.4515380859375, -2.31414794921875, -2.1767578125, -2.03936767578125, -1.9019775390625, -1.76458740234375, -1.627197265625, -1.48980712890625, -1.3524169921875, -1.21502685546875, -1.07763671875, -0.94024658203125, -0.8028564453125, -0.66546630859375, -0.528076171875, -0.39068603515625, -0.2532958984375, -0.11590576171875, 0.021484375, 0.15887451171875, 0.2962646484375, 0.43365478515625, 0.571044921875, 0.70843505859375, 0.8458251953125, 0.98321533203125, 1.12060546875, 1.25799560546875, 1.3953857421875, 1.53277587890625, 1.670166015625, 1.80755615234375, 1.9449462890625, 2.08233642578125, 2.2197265625, 2.35711669921875, 2.4945068359375, 2.63189697265625, 2.769287109375, 2.90667724609375, 3.0440673828125, 3.18145751953125, 3.31884765625, 3.45623779296875, 3.5936279296875, 3.73101806640625, 3.868408203125, 4.00579833984375, 4.1431884765625, 4.28057861328125, 4.41796875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 3.0, 10.0, 7.0, 5.0, 4.0, 9.0, 13.0, 14.0, 19.0, 16.0, 23.0, 25.0, 40.0, 33.0, 36.0, 41.0, 45.0, 54.0, 58.0, 86.0, 179.0, 1500.0, 248.0, 123.0, 58.0, 48.0, 44.0, 40.0, 46.0, 19.0, 28.0, 41.0, 26.0, 21.0, 15.0, 17.0, 16.0, 8.0, 7.0, 13.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.75, -18.158203125, -17.56640625, -16.974609375, -16.3828125, -15.791015625, -15.19921875, -14.607421875, -14.015625, -13.423828125, -12.83203125, -12.240234375, -11.6484375, -11.056640625, -10.46484375, -9.873046875, -9.28125, -8.689453125, -8.09765625, -7.505859375, -6.9140625, -6.322265625, -5.73046875, -5.138671875, -4.546875, -3.955078125, -3.36328125, -2.771484375, -2.1796875, -1.587890625, -0.99609375, -0.404296875, 0.1875, 0.779296875, 1.37109375, 1.962890625, 2.5546875, 3.146484375, 3.73828125, 4.330078125, 4.921875, 5.513671875, 6.10546875, 6.697265625, 7.2890625, 7.880859375, 8.47265625, 9.064453125, 9.65625, 10.248046875, 10.83984375, 11.431640625, 12.0234375, 12.615234375, 13.20703125, 13.798828125, 14.390625, 14.982421875, 15.57421875, 16.166015625, 16.7578125, 17.349609375, 17.94140625, 18.533203125, 19.125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 4.0, 7.0, 11.0, 19.0, 29.0, 53.0, 110.0, 198.0, 519.0, 4214.0, 3134557.0, 4937.0, 542.0, 198.0, 107.0, 70.0, 40.0, 30.0, 14.0, 9.0, 12.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-137.125, -132.908203125, -128.69140625, -124.474609375, -120.2578125, -116.041015625, -111.82421875, -107.607421875, -103.390625, -99.173828125, -94.95703125, -90.740234375, -86.5234375, -82.306640625, -78.08984375, -73.873046875, -69.65625, -65.439453125, -61.22265625, -57.005859375, -52.7890625, -48.572265625, -44.35546875, -40.138671875, -35.921875, -31.705078125, -27.48828125, -23.271484375, -19.0546875, -14.837890625, -10.62109375, -6.404296875, -2.1875, 2.029296875, 6.24609375, 10.462890625, 14.6796875, 18.896484375, 23.11328125, 27.330078125, 31.546875, 35.763671875, 39.98046875, 44.197265625, 48.4140625, 52.630859375, 56.84765625, 61.064453125, 65.28125, 69.498046875, 73.71484375, 77.931640625, 82.1484375, 86.365234375, 90.58203125, 94.798828125, 99.015625, 103.232421875, 107.44921875, 111.666015625, 115.8828125, 120.099609375, 124.31640625, 128.533203125, 132.75]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 273.0, 746.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.31407165527344, -66.75882720947266, -45.20357894897461, -23.648330688476562, -2.0930862426757812, 19.462158203125, 41.01741027832031, 62.57264709472656, 84.12789916992188, 105.68314361572266, 127.23838806152344, 148.79364013671875, 170.348876953125, 191.9041290283203, 213.45938110351562, 235.01461791992188, 256.56988525390625, 278.1251220703125, 299.6803894042969, 321.2356262207031, 342.7908630371094, 364.34613037109375, 385.9013671875, 407.45660400390625, 429.0118408203125, 450.56707763671875, 472.1223449707031, 493.6775817871094, 515.2328491210938, 536.7880859375, 558.3433227539062, 579.8985595703125, 601.4537963867188, 623.009033203125, 644.5642700195312, 666.1195068359375, 687.6748046875, 709.2300415039062, 730.7852783203125, 752.3405151367188, 773.895751953125, 795.4509887695312, 817.0062255859375, 838.5615234375, 860.1167602539062, 881.6719970703125, 903.2272338867188, 924.782470703125, 946.3377685546875, 967.8930053710938, 989.4482421875, 1011.0035400390625, 1032.5587158203125, 1054.114013671875, 1075.669189453125, 1097.2244873046875, 1118.7796630859375, 1140.3349609375, 1161.89013671875, 1183.4454345703125, 1205.0006103515625, 1226.555908203125, 1248.111083984375, 1269.6663818359375, 1291.2216796875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 4.0, 9.0, 7.0, 14.0, 18.0, 18.0, 16.0, 20.0, 14.0, 26.0, 22.0, 20.0, 44.0, 29.0, 34.0, 33.0, 34.0, 32.0, 49.0, 46.0, 37.0, 53.0, 39.0, 33.0, 49.0, 29.0, 46.0, 20.0, 23.0, 24.0, 26.0, 16.0, 13.0, 20.0, 11.0, 10.0, 11.0, 14.0, 6.0, 7.0, 4.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-47.685279846191406, -46.086273193359375, -44.48727035522461, -42.88826370239258, -41.28925704956055, -39.69025421142578, -38.09124755859375, -36.49224090576172, -34.89323425292969, -33.294227600097656, -31.695222854614258, -30.09621810913086, -28.497211456298828, -26.89820671081543, -25.29920196533203, -23.7001953125, -22.101192474365234, -20.502187728881836, -18.903181076049805, -17.304176330566406, -15.705170631408691, -14.106164932250977, -12.507160186767578, -10.908154487609863, -9.309148788452148, -7.710143089294434, -6.111137866973877, -4.51213264465332, -2.9131269454956055, -1.3141212463378906, 0.2848834991455078, 1.8838891983032227, 3.482898712158203, 5.081904411315918, 6.680909633636475, 8.279914855957031, 9.878920555114746, 11.477926254272461, 13.07693099975586, 14.675936698913574, 16.27494239807129, 17.873947143554688, 19.47295379638672, 21.071958541870117, 22.670963287353516, 24.269969940185547, 25.868974685668945, 27.467979431152344, 29.066986083984375, 30.665990829467773, 32.26499557495117, 33.8640022277832, 35.463008880615234, 37.06201171875, 38.66101837158203, 40.26002502441406, 41.859031677246094, 43.458038330078125, 45.05704116821289, 46.65604782104492, 48.25505447387695, 49.85405731201172, 51.45306396484375, 53.05207061767578, 54.65107345581055]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 3.0, 3.0, 4.0, 6.0, 9.0, 11.0, 17.0, 8.0, 16.0, 16.0, 18.0, 26.0, 34.0, 30.0, 35.0, 37.0, 41.0, 45.0, 41.0, 24.0, 47.0, 48.0, 42.0, 43.0, 33.0, 37.0, 37.0, 38.0, 35.0, 32.0, 27.0, 21.0, 20.0, 22.0, 16.0, 20.0, 13.0, 8.0, 11.0, 3.0, 12.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.29296875, -5.11492919921875, -4.9368896484375, -4.75885009765625, -4.580810546875, -4.40277099609375, -4.2247314453125, -4.04669189453125, -3.86865234375, -3.69061279296875, -3.5125732421875, -3.33453369140625, -3.156494140625, -2.97845458984375, -2.8004150390625, -2.62237548828125, -2.4443359375, -2.26629638671875, -2.0882568359375, -1.91021728515625, -1.732177734375, -1.55413818359375, -1.3760986328125, -1.19805908203125, -1.02001953125, -0.84197998046875, -0.6639404296875, -0.48590087890625, -0.307861328125, -0.12982177734375, 0.0482177734375, 0.22625732421875, 0.404296875, 0.58233642578125, 0.7603759765625, 0.93841552734375, 1.116455078125, 1.29449462890625, 1.4725341796875, 1.65057373046875, 1.82861328125, 2.00665283203125, 2.1846923828125, 2.36273193359375, 2.540771484375, 2.71881103515625, 2.8968505859375, 3.07489013671875, 3.2529296875, 3.43096923828125, 3.6090087890625, 3.78704833984375, 3.965087890625, 4.14312744140625, 4.3211669921875, 4.49920654296875, 4.67724609375, 4.85528564453125, 5.0333251953125, 5.21136474609375, 5.389404296875, 5.56744384765625, 5.7454833984375, 5.92352294921875, 6.1015625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 9.0, 7.0, 6.0, 23.0, 19.0, 11.0, 14.0, 35.0, 47.0, 65.0, 84.0, 147.0, 206.0, 392.0, 768.0, 1822.0, 5647.0, 22025.0, 109285.0, 540000.0, 1554336.0, 1418783.0, 431417.0, 83873.0, 17379.0, 4635.0, 1576.0, 627.0, 379.0, 208.0, 129.0, 80.0, 67.0, 47.0, 37.0, 22.0, 19.0, 7.0, 12.0, 8.0, 9.0, 6.0, 7.0, 3.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.80078125, -7.54010009765625, -7.2794189453125, -7.01873779296875, -6.758056640625, -6.49737548828125, -6.2366943359375, -5.97601318359375, -5.71533203125, -5.45465087890625, -5.1939697265625, -4.93328857421875, -4.672607421875, -4.41192626953125, -4.1512451171875, -3.89056396484375, -3.6298828125, -3.36920166015625, -3.1085205078125, -2.84783935546875, -2.587158203125, -2.32647705078125, -2.0657958984375, -1.80511474609375, -1.54443359375, -1.28375244140625, -1.0230712890625, -0.76239013671875, -0.501708984375, -0.24102783203125, 0.0196533203125, 0.28033447265625, 0.541015625, 0.80169677734375, 1.0623779296875, 1.32305908203125, 1.583740234375, 1.84442138671875, 2.1051025390625, 2.36578369140625, 2.62646484375, 2.88714599609375, 3.1478271484375, 3.40850830078125, 3.669189453125, 3.92987060546875, 4.1905517578125, 4.45123291015625, 4.7119140625, 4.97259521484375, 5.2332763671875, 5.49395751953125, 5.754638671875, 6.01531982421875, 6.2760009765625, 6.53668212890625, 6.79736328125, 7.05804443359375, 7.3187255859375, 7.57940673828125, 7.840087890625, 8.10076904296875, 8.3614501953125, 8.62213134765625, 8.8828125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 8.0, 10.0, 13.0, 16.0, 20.0, 36.0, 50.0, 70.0, 89.0, 123.0, 174.0, 252.0, 334.0, 426.0, 458.0, 427.0, 391.0, 309.0, 253.0, 166.0, 123.0, 96.0, 65.0, 51.0, 42.0, 14.0, 23.0, 13.0, 3.0, 4.0, 3.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-16.875, -16.4417724609375, -16.008544921875, -15.5753173828125, -15.14208984375, -14.7088623046875, -14.275634765625, -13.8424072265625, -13.4091796875, -12.9759521484375, -12.542724609375, -12.1094970703125, -11.67626953125, -11.2430419921875, -10.809814453125, -10.3765869140625, -9.943359375, -9.5101318359375, -9.076904296875, -8.6436767578125, -8.21044921875, -7.7772216796875, -7.343994140625, -6.9107666015625, -6.4775390625, -6.0443115234375, -5.611083984375, -5.1778564453125, -4.74462890625, -4.3114013671875, -3.878173828125, -3.4449462890625, -3.01171875, -2.5784912109375, -2.145263671875, -1.7120361328125, -1.27880859375, -0.8455810546875, -0.412353515625, 0.0208740234375, 0.4541015625, 0.8873291015625, 1.320556640625, 1.7537841796875, 2.18701171875, 2.6202392578125, 3.053466796875, 3.4866943359375, 3.919921875, 4.3531494140625, 4.786376953125, 5.2196044921875, 5.65283203125, 6.0860595703125, 6.519287109375, 6.9525146484375, 7.3857421875, 7.8189697265625, 8.252197265625, 8.6854248046875, 9.11865234375, 9.5518798828125, 9.985107421875, 10.4183349609375, 10.8515625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 7.0, 4.0, 9.0, 15.0, 8.0, 16.0, 23.0, 25.0, 24.0, 52.0, 69.0, 85.0, 145.0, 176.0, 346.0, 668.0, 2440.0, 33516.0, 1800487.0, 2306200.0, 45408.0, 2791.0, 706.0, 324.0, 199.0, 131.0, 97.0, 82.0, 58.0, 50.0, 30.0, 27.0, 24.0, 8.0, 10.0, 9.0, 5.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.609375, -27.589111328125, -26.56884765625, -25.548583984375, -24.5283203125, -23.508056640625, -22.48779296875, -21.467529296875, -20.447265625, -19.427001953125, -18.40673828125, -17.386474609375, -16.3662109375, -15.345947265625, -14.32568359375, -13.305419921875, -12.28515625, -11.264892578125, -10.24462890625, -9.224365234375, -8.2041015625, -7.183837890625, -6.16357421875, -5.143310546875, -4.123046875, -3.102783203125, -2.08251953125, -1.062255859375, -0.0419921875, 0.978271484375, 1.99853515625, 3.018798828125, 4.0390625, 5.059326171875, 6.07958984375, 7.099853515625, 8.1201171875, 9.140380859375, 10.16064453125, 11.180908203125, 12.201171875, 13.221435546875, 14.24169921875, 15.261962890625, 16.2822265625, 17.302490234375, 18.32275390625, 19.343017578125, 20.36328125, 21.383544921875, 22.40380859375, 23.424072265625, 24.4443359375, 25.464599609375, 26.48486328125, 27.505126953125, 28.525390625, 29.545654296875, 30.56591796875, 31.586181640625, 32.6064453125, 33.626708984375, 34.64697265625, 35.667236328125, 36.6875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 8.0, 36.0, 54.0, 147.0, 191.0, 214.0, 183.0, 101.0, 39.0, 19.0, 9.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.20657348632812, -117.86116027832031, -114.51573944091797, -111.17032623291016, -107.82490539550781, -104.4794921875, -101.13407897949219, -97.78866577148438, -94.44324493408203, -91.09783172607422, -87.75241088867188, -84.40699768066406, -81.06158447265625, -77.7161636352539, -74.3707504272461, -71.02532958984375, -67.67991638183594, -64.33450317382812, -60.98908233642578, -57.64366912841797, -54.29825210571289, -50.95283508300781, -47.607421875, -44.26200485229492, -40.916587829589844, -37.571170806884766, -34.22575378417969, -30.880340576171875, -27.534923553466797, -24.18950653076172, -20.844091415405273, -17.498676300048828, -14.153251647949219, -10.807835578918457, -7.462419509887695, -4.117003440856934, -0.7715873718261719, 2.5738296508789062, 5.919244766235352, 9.264659881591797, 12.610076904296875, 15.955492973327637, 19.3009090423584, 22.646324157714844, 25.991741180419922, 29.337158203125, 32.68257141113281, 36.02798843383789, 39.37340545654297, 42.71882247924805, 46.064239501953125, 49.40965270996094, 52.755069732666016, 56.100486755371094, 59.445899963378906, 62.791316986083984, 66.13673400878906, 69.48214721679688, 72.82756805419922, 76.17298126220703, 79.51840209960938, 82.86381530761719, 86.209228515625, 89.55464172363281, 92.90006256103516]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 2.0, 5.0, 4.0, 7.0, 3.0, 7.0, 20.0, 9.0, 26.0, 14.0, 18.0, 24.0, 30.0, 31.0, 44.0, 34.0, 44.0, 34.0, 26.0, 45.0, 48.0, 49.0, 41.0, 34.0, 51.0, 31.0, 41.0, 54.0, 29.0, 30.0, 19.0, 27.0, 13.0, 25.0, 21.0, 10.0, 12.0, 9.0, 4.0, 11.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.99734878540039, -37.622154235839844, -36.24695587158203, -34.871761322021484, -33.49656295776367, -32.121368408203125, -30.746171951293945, -29.370975494384766, -27.995779037475586, -26.620582580566406, -25.245386123657227, -23.870189666748047, -22.4949951171875, -21.119796752929688, -19.74460220336914, -18.36940574645996, -16.99420928955078, -15.619012832641602, -14.243816375732422, -12.868620872497559, -11.493424415588379, -10.1182279586792, -8.743032455444336, -7.367835998535156, -5.992639541625977, -4.617443084716797, -3.2422471046447754, -1.867051124572754, -0.4918546676635742, 0.8833417892456055, 2.2585372924804688, 3.6337337493896484, 5.008934020996094, 6.384130477905273, 7.759326457977295, 9.134522438049316, 10.509718894958496, 11.884915351867676, 13.260110855102539, 14.635307312011719, 16.0105037689209, 17.385700225830078, 18.760896682739258, 20.136093139648438, 21.511287689208984, 22.886486053466797, 24.261680603027344, 25.636877059936523, 27.012073516845703, 28.387269973754883, 29.762466430664062, 31.13766098022461, 32.51285934448242, 33.88805389404297, 35.26325225830078, 36.63844680786133, 38.013641357421875, 39.38883590698242, 40.764034271240234, 42.13922882080078, 43.514427185058594, 44.88962173461914, 46.26481628417969, 47.6400146484375, 49.01521301269531]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 12.0, 10.0, 7.0, 9.0, 21.0, 13.0, 15.0, 26.0, 43.0, 25.0, 40.0, 47.0, 37.0, 48.0, 49.0, 44.0, 52.0, 47.0, 42.0, 40.0, 47.0, 42.0, 40.0, 36.0, 39.0, 33.0, 29.0, 20.0, 16.0, 16.0, 8.0, 11.0, 7.0, 8.0, 3.0, 8.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.20965576171875, -5.0091552734375, -4.80865478515625, -4.608154296875, -4.40765380859375, -4.2071533203125, -4.00665283203125, -3.80615234375, -3.60565185546875, -3.4051513671875, -3.20465087890625, -3.004150390625, -2.80364990234375, -2.6031494140625, -2.40264892578125, -2.2021484375, -2.00164794921875, -1.8011474609375, -1.60064697265625, -1.400146484375, -1.19964599609375, -0.9991455078125, -0.79864501953125, -0.59814453125, -0.39764404296875, -0.1971435546875, 0.00335693359375, 0.203857421875, 0.40435791015625, 0.6048583984375, 0.80535888671875, 1.005859375, 1.20635986328125, 1.4068603515625, 1.60736083984375, 1.807861328125, 2.00836181640625, 2.2088623046875, 2.40936279296875, 2.60986328125, 2.81036376953125, 3.0108642578125, 3.21136474609375, 3.411865234375, 3.61236572265625, 3.8128662109375, 4.01336669921875, 4.2138671875, 4.41436767578125, 4.6148681640625, 4.81536865234375, 5.015869140625, 5.21636962890625, 5.4168701171875, 5.61737060546875, 5.81787109375, 6.01837158203125, 6.2188720703125, 6.41937255859375, 6.619873046875, 6.82037353515625, 7.0208740234375, 7.22137451171875, 7.421875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 3.0, 9.0, 14.0, 8.0, 21.0, 29.0, 34.0, 76.0, 86.0, 138.0, 246.0, 314.0, 497.0, 705.0, 1025.0, 1494.0, 2247.0, 3484.0, 5002.0, 8028.0, 12289.0, 19034.0, 31170.0, 51385.0, 91868.0, 176921.0, 278862.0, 155974.0, 81813.0, 46431.0, 28669.0, 17856.0, 11140.0, 7216.0, 4818.0, 3081.0, 2117.0, 1432.0, 942.0, 708.0, 419.0, 307.0, 199.0, 144.0, 95.0, 78.0, 46.0, 28.0, 17.0, 6.0, 6.0, 9.0, 9.0, 5.0, 5.0, 3.0], "bins": [-1.04296875, -1.0126571655273438, -0.9823455810546875, -0.9520339965820312, -0.921722412109375, -0.8914108276367188, -0.8610992431640625, -0.8307876586914062, -0.80047607421875, -0.7701644897460938, -0.7398529052734375, -0.7095413208007812, -0.679229736328125, -0.6489181518554688, -0.6186065673828125, -0.5882949829101562, -0.5579833984375, -0.5276718139648438, -0.4973602294921875, -0.46704864501953125, -0.436737060546875, -0.40642547607421875, -0.3761138916015625, -0.34580230712890625, -0.31549072265625, -0.28517913818359375, -0.2548675537109375, -0.22455596923828125, -0.194244384765625, -0.16393280029296875, -0.1336212158203125, -0.10330963134765625, -0.072998046875, -0.04268646240234375, -0.0123748779296875, 0.01793670654296875, 0.048248291015625, 0.07855987548828125, 0.1088714599609375, 0.13918304443359375, 0.16949462890625, 0.19980621337890625, 0.2301177978515625, 0.26042938232421875, 0.290740966796875, 0.32105255126953125, 0.3513641357421875, 0.38167572021484375, 0.4119873046875, 0.44229888916015625, 0.4726104736328125, 0.5029220581054688, 0.533233642578125, 0.5635452270507812, 0.5938568115234375, 0.6241683959960938, 0.65447998046875, 0.6847915649414062, 0.7151031494140625, 0.7454147338867188, 0.775726318359375, 0.8060379028320312, 0.8363494873046875, 0.8666610717773438, 0.89697265625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 2.0, 4.0, 12.0, 8.0, 16.0, 13.0, 16.0, 13.0, 20.0, 26.0, 29.0, 27.0, 22.0, 30.0, 20.0, 23.0, 26.0, 52.0, 42.0, 40.0, 1072.0, 43.0, 35.0, 40.0, 39.0, 45.0, 37.0, 28.0, 35.0, 26.0, 27.0, 15.0, 24.0, 17.0, 17.0, 12.0, 11.0, 10.0, 8.0, 6.0, 3.0, 5.0, 5.0, 3.0, 4.0, 5.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-3.197265625, -3.09295654296875, -2.9886474609375, -2.88433837890625, -2.780029296875, -2.67572021484375, -2.5714111328125, -2.46710205078125, -2.36279296875, -2.25848388671875, -2.1541748046875, -2.04986572265625, -1.945556640625, -1.84124755859375, -1.7369384765625, -1.63262939453125, -1.5283203125, -1.42401123046875, -1.3197021484375, -1.21539306640625, -1.111083984375, -1.00677490234375, -0.9024658203125, -0.79815673828125, -0.69384765625, -0.58953857421875, -0.4852294921875, -0.38092041015625, -0.276611328125, -0.17230224609375, -0.0679931640625, 0.03631591796875, 0.140625, 0.24493408203125, 0.3492431640625, 0.45355224609375, 0.557861328125, 0.66217041015625, 0.7664794921875, 0.87078857421875, 0.97509765625, 1.07940673828125, 1.1837158203125, 1.28802490234375, 1.392333984375, 1.49664306640625, 1.6009521484375, 1.70526123046875, 1.8095703125, 1.91387939453125, 2.0181884765625, 2.12249755859375, 2.226806640625, 2.33111572265625, 2.4354248046875, 2.53973388671875, 2.64404296875, 2.74835205078125, 2.8526611328125, 2.95697021484375, 3.061279296875, 3.16558837890625, 3.2698974609375, 3.37420654296875, 3.478515625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 5.0, 8.0, 9.0, 8.0, 16.0, 19.0, 38.0, 36.0, 46.0, 66.0, 84.0, 126.0, 171.0, 234.0, 367.0, 486.0, 760.0, 1077.0, 1520.0, 2290.0, 3374.0, 5177.0, 7599.0, 11506.0, 17856.0, 28056.0, 45471.0, 76140.0, 141571.0, 1316961.0, 186516.0, 96963.0, 55408.0, 34030.0, 21621.0, 13913.0, 8917.0, 5887.0, 3967.0, 2684.0, 1777.0, 1267.0, 886.0, 636.0, 459.0, 291.0, 243.0, 173.0, 126.0, 96.0, 64.0, 48.0, 34.0, 14.0, 20.0, 14.0, 4.0, 1.0, 2.0, 6.0], "bins": [-0.9443359375, -0.9163131713867188, -0.8882904052734375, -0.8602676391601562, -0.832244873046875, -0.8042221069335938, -0.7761993408203125, -0.7481765747070312, -0.72015380859375, -0.6921310424804688, -0.6641082763671875, -0.6360855102539062, -0.608062744140625, -0.5800399780273438, -0.5520172119140625, -0.5239944458007812, -0.4959716796875, -0.46794891357421875, -0.4399261474609375, -0.41190338134765625, -0.383880615234375, -0.35585784912109375, -0.3278350830078125, -0.29981231689453125, -0.27178955078125, -0.24376678466796875, -0.2157440185546875, -0.18772125244140625, -0.159698486328125, -0.13167572021484375, -0.1036529541015625, -0.07563018798828125, -0.047607421875, -0.01958465576171875, 0.0084381103515625, 0.03646087646484375, 0.064483642578125, 0.09250640869140625, 0.1205291748046875, 0.14855194091796875, 0.17657470703125, 0.20459747314453125, 0.2326202392578125, 0.26064300537109375, 0.288665771484375, 0.31668853759765625, 0.3447113037109375, 0.37273406982421875, 0.4007568359375, 0.42877960205078125, 0.4568023681640625, 0.48482513427734375, 0.512847900390625, 0.5408706665039062, 0.5688934326171875, 0.5969161987304688, 0.62493896484375, 0.6529617309570312, 0.6809844970703125, 0.7090072631835938, 0.737030029296875, 0.7650527954101562, 0.7930755615234375, 0.8210983276367188, 0.84912109375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 9.0, 6.0, 10.0, 18.0, 23.0, 25.0, 37.0, 58.0, 85.0, 93.0, 99.0, 108.0, 90.0, 92.0, 69.0, 42.0, 39.0, 27.0, 19.0, 12.0, 9.0, 11.0, 3.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0019073486328125, -0.001859813928604126, -0.001812279224395752, -0.001764744520187378, -0.001717209815979004, -0.0016696751117706299, -0.0016221404075622559, -0.0015746057033538818, -0.0015270709991455078, -0.0014795362949371338, -0.0014320015907287598, -0.0013844668865203857, -0.0013369321823120117, -0.0012893974781036377, -0.0012418627738952637, -0.0011943280696868896, -0.0011467933654785156, -0.0010992586612701416, -0.0010517239570617676, -0.0010041892528533936, -0.0009566545486450195, -0.0009091198444366455, -0.0008615851402282715, -0.0008140504360198975, -0.0007665157318115234, -0.0007189810276031494, -0.0006714463233947754, -0.0006239116191864014, -0.0005763769149780273, -0.0005288422107696533, -0.0004813075065612793, -0.0004337728023529053, -0.00038623809814453125, -0.0003387033939361572, -0.0002911686897277832, -0.00024363398551940918, -0.00019609928131103516, -0.00014856457710266113, -0.00010102987289428711, -5.3495168685913086e-05, -5.9604644775390625e-06, 4.157423973083496e-05, 8.910894393920898e-05, 0.000136643648147583, 0.00018417835235595703, 0.00023171305656433105, 0.0002792477607727051, 0.0003267824649810791, 0.0003743171691894531, 0.00042185187339782715, 0.00046938657760620117, 0.0005169212818145752, 0.0005644559860229492, 0.0006119906902313232, 0.0006595253944396973, 0.0007070600986480713, 0.0007545948028564453, 0.0008021295070648193, 0.0008496642112731934, 0.0008971989154815674, 0.0009447336196899414, 0.0009922683238983154, 0.0010398030281066895, 0.0010873377323150635, 0.0011348724365234375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 6.0, 12.0, 16.0, 14.0, 27.0, 30.0, 59.0, 66.0, 131.0, 248.0, 517.0, 2259.0, 1016097.0, 27506.0, 796.0, 310.0, 167.0, 101.0, 60.0, 41.0, 15.0, 18.0, 16.0, 11.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0206298828125, -0.019759654998779297, -0.018889427185058594, -0.01801919937133789, -0.017148971557617188, -0.016278743743896484, -0.015408515930175781, -0.014538288116455078, -0.013668060302734375, -0.012797832489013672, -0.011927604675292969, -0.011057376861572266, -0.010187149047851562, -0.00931692123413086, -0.008446693420410156, -0.007576465606689453, -0.00670623779296875, -0.005836009979248047, -0.004965782165527344, -0.004095554351806641, -0.0032253265380859375, -0.0023550987243652344, -0.0014848709106445312, -0.0006146430969238281, 0.000255584716796875, 0.0011258125305175781, 0.0019960403442382812, 0.0028662681579589844, 0.0037364959716796875, 0.004606723785400391, 0.005476951599121094, 0.006347179412841797, 0.0072174072265625, 0.008087635040283203, 0.008957862854003906, 0.00982809066772461, 0.010698318481445312, 0.011568546295166016, 0.012438774108886719, 0.013309001922607422, 0.014179229736328125, 0.015049457550048828, 0.01591968536376953, 0.016789913177490234, 0.017660140991210938, 0.01853036880493164, 0.019400596618652344, 0.020270824432373047, 0.02114105224609375, 0.022011280059814453, 0.022881507873535156, 0.02375173568725586, 0.024621963500976562, 0.025492191314697266, 0.02636241912841797, 0.027232646942138672, 0.028102874755859375, 0.028973102569580078, 0.02984333038330078, 0.030713558197021484, 0.03158378601074219, 0.03245401382446289, 0.033324241638183594, 0.0341944694519043, 0.035064697265625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 12.0, 42.0, 99.0, 204.0, 246.0, 170.0, 133.0, 64.0, 27.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012557676527649164, -0.0012119583552703261, -0.0011681490577757359, -0.0011243398766964674, -0.0010805305792018771, -0.0010367212817072868, -0.0009929121006280184, -0.0009491028031334281, -0.0009052935056388378, -0.0008614842081442475, -0.0008176749688573182, -0.0007738657295703888, -0.0007300564320757985, -0.0006862471345812082, -0.0006424378952942789, -0.0005986286560073495, -0.0005548193585127592, -0.0005110100610181689, -0.00046720082173123956, -0.00042339155334047973, -0.0003795822849497199, -0.0003357730165589601, -0.00029196374816820025, -0.00024815447977744043, -0.0002043452113866806, -0.00016053594299592078, -0.00011672667460516095, -7.291740621440113e-05, -2.91081378236413e-05, 1.4701130567118526e-05, 5.851039895787835e-05, 0.00010231966734863818, 0.00014612905215471983, 0.00018993832054547966, 0.00023374758893623948, 0.0002775568573269993, 0.00032136612571775913, 0.00036517539410851896, 0.0004089846624992788, 0.0004527939308900386, 0.0004966031992807984, 0.0005404124967753887, 0.0005842217360623181, 0.0006280309753492475, 0.0006718402728438377, 0.000715649570338428, 0.0007594588096253574, 0.0008032680489122868, 0.000847077346406877, 0.0008908866439014673, 0.0009346958831883967, 0.000978505122475326, 0.0010223144199699163, 0.0010661237174645066, 0.001109933014959097, 0.0011537421960383654, 0.0011975514935329556, 0.001241360791027546, 0.0012851699721068144, 0.0013289792696014047, 0.001372788567095995, 0.0014165978645905852, 0.0014604071620851755, 0.001504216343164444, 0.0015480256406590343]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 4.0, 11.0, 8.0, 18.0, 14.0, 17.0, 14.0, 27.0, 26.0, 31.0, 28.0, 30.0, 33.0, 33.0, 39.0, 35.0, 39.0, 34.0, 41.0, 37.0, 36.0, 41.0, 35.0, 38.0, 31.0, 41.0, 43.0, 35.0, 25.0, 26.0, 22.0, 16.0, 18.0, 11.0, 12.0, 8.0, 9.0, 6.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005280375480651855, -0.0005120057612657547, -0.0004959739744663239, -0.000479942187666893, -0.00046391040086746216, -0.0004478786140680313, -0.00043184682726860046, -0.0004158150404691696, -0.00039978325366973877, -0.0003837514668703079, -0.0003677196800708771, -0.00035168789327144623, -0.0003356561064720154, -0.00031962431967258453, -0.0003035925328731537, -0.00028756074607372284, -0.000271528959274292, -0.00025549717247486115, -0.0002394653856754303, -0.00022343359887599945, -0.0002074018120765686, -0.00019137002527713776, -0.0001753382384777069, -0.00015930645167827606, -0.00014327466487884521, -0.00012724287807941437, -0.00011121109127998352, -9.517930448055267e-05, -7.914751768112183e-05, -6.311573088169098e-05, -4.708394408226013e-05, -3.1052157282829285e-05, -1.5020370483398438e-05, 1.0114163160324097e-06, 1.7043203115463257e-05, 3.3074989914894104e-05, 4.910677671432495e-05, 6.51385635137558e-05, 8.117035031318665e-05, 9.720213711261749e-05, 0.00011323392391204834, 0.0001292657107114792, 0.00014529749751091003, 0.00016132928431034088, 0.00017736107110977173, 0.00019339285790920258, 0.00020942464470863342, 0.00022545643150806427, 0.00024148821830749512, 0.00025752000510692596, 0.0002735517919063568, 0.00028958357870578766, 0.0003056153655052185, 0.00032164715230464935, 0.0003376789391040802, 0.00035371072590351105, 0.0003697425127029419, 0.00038577429950237274, 0.0004018060863018036, 0.00041783787310123444, 0.0004338696599006653, 0.00044990144670009613, 0.000465933233499527, 0.0004819650202989578, 0.0004979968070983887]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 12.0, 10.0, 7.0, 9.0, 21.0, 13.0, 15.0, 26.0, 43.0, 25.0, 40.0, 47.0, 37.0, 48.0, 49.0, 44.0, 52.0, 47.0, 42.0, 40.0, 47.0, 42.0, 40.0, 36.0, 39.0, 33.0, 29.0, 20.0, 16.0, 16.0, 8.0, 11.0, 7.0, 8.0, 3.0, 8.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.41015625, -5.20965576171875, -5.0091552734375, -4.80865478515625, -4.608154296875, -4.40765380859375, -4.2071533203125, -4.00665283203125, -3.80615234375, -3.60565185546875, -3.4051513671875, -3.20465087890625, -3.004150390625, -2.80364990234375, -2.6031494140625, -2.40264892578125, -2.2021484375, -2.00164794921875, -1.8011474609375, -1.60064697265625, -1.400146484375, -1.19964599609375, -0.9991455078125, -0.79864501953125, -0.59814453125, -0.39764404296875, -0.1971435546875, 0.00335693359375, 0.203857421875, 0.40435791015625, 0.6048583984375, 0.80535888671875, 1.005859375, 1.20635986328125, 1.4068603515625, 1.60736083984375, 1.807861328125, 2.00836181640625, 2.2088623046875, 2.40936279296875, 2.60986328125, 2.81036376953125, 3.0108642578125, 3.21136474609375, 3.411865234375, 3.61236572265625, 3.8128662109375, 4.01336669921875, 4.2138671875, 4.41436767578125, 4.6148681640625, 4.81536865234375, 5.015869140625, 5.21636962890625, 5.4168701171875, 5.61737060546875, 5.81787109375, 6.01837158203125, 6.2188720703125, 6.41937255859375, 6.619873046875, 6.82037353515625, 7.0208740234375, 7.22137451171875, 7.421875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 7.0, 3.0, 8.0, 15.0, 21.0, 33.0, 37.0, 50.0, 78.0, 127.0, 191.0, 350.0, 597.0, 1014.0, 1880.0, 3701.0, 7450.0, 14931.0, 29453.0, 57472.0, 113019.0, 215760.0, 270129.0, 161521.0, 83256.0, 43127.0, 21944.0, 10928.0, 5381.0, 2749.0, 1370.0, 764.0, 449.0, 277.0, 145.0, 117.0, 76.0, 37.0, 31.0, 22.0, 19.0, 9.0, 4.0, 6.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.00390625, -4.85791015625, -4.7119140625, -4.56591796875, -4.419921875, -4.27392578125, -4.1279296875, -3.98193359375, -3.8359375, -3.68994140625, -3.5439453125, -3.39794921875, -3.251953125, -3.10595703125, -2.9599609375, -2.81396484375, -2.66796875, -2.52197265625, -2.3759765625, -2.22998046875, -2.083984375, -1.93798828125, -1.7919921875, -1.64599609375, -1.5, -1.35400390625, -1.2080078125, -1.06201171875, -0.916015625, -0.77001953125, -0.6240234375, -0.47802734375, -0.33203125, -0.18603515625, -0.0400390625, 0.10595703125, 0.251953125, 0.39794921875, 0.5439453125, 0.68994140625, 0.8359375, 0.98193359375, 1.1279296875, 1.27392578125, 1.419921875, 1.56591796875, 1.7119140625, 1.85791015625, 2.00390625, 2.14990234375, 2.2958984375, 2.44189453125, 2.587890625, 2.73388671875, 2.8798828125, 3.02587890625, 3.171875, 3.31787109375, 3.4638671875, 3.60986328125, 3.755859375, 3.90185546875, 4.0478515625, 4.19384765625, 4.33984375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 5.0, 7.0, 14.0, 12.0, 16.0, 15.0, 20.0, 26.0, 28.0, 40.0, 42.0, 43.0, 55.0, 65.0, 55.0, 101.0, 246.0, 1471.0, 244.0, 110.0, 76.0, 55.0, 28.0, 41.0, 30.0, 31.0, 25.0, 25.0, 18.0, 19.0, 15.0, 12.0, 4.0, 6.0, 12.0, 4.0, 4.0, 5.0, 8.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-23.953125, -23.259033203125, -22.56494140625, -21.870849609375, -21.1767578125, -20.482666015625, -19.78857421875, -19.094482421875, -18.400390625, -17.706298828125, -17.01220703125, -16.318115234375, -15.6240234375, -14.929931640625, -14.23583984375, -13.541748046875, -12.84765625, -12.153564453125, -11.45947265625, -10.765380859375, -10.0712890625, -9.377197265625, -8.68310546875, -7.989013671875, -7.294921875, -6.600830078125, -5.90673828125, -5.212646484375, -4.5185546875, -3.824462890625, -3.13037109375, -2.436279296875, -1.7421875, -1.048095703125, -0.35400390625, 0.340087890625, 1.0341796875, 1.728271484375, 2.42236328125, 3.116455078125, 3.810546875, 4.504638671875, 5.19873046875, 5.892822265625, 6.5869140625, 7.281005859375, 7.97509765625, 8.669189453125, 9.36328125, 10.057373046875, 10.75146484375, 11.445556640625, 12.1396484375, 12.833740234375, 13.52783203125, 14.221923828125, 14.916015625, 15.610107421875, 16.30419921875, 16.998291015625, 17.6923828125, 18.386474609375, 19.08056640625, 19.774658203125, 20.46875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 9.0, 16.0, 21.0, 21.0, 31.0, 52.0, 72.0, 122.0, 169.0, 270.0, 580.0, 3066.0, 3036084.0, 102895.0, 1202.0, 432.0, 199.0, 141.0, 100.0, 65.0, 44.0, 43.0, 20.0, 14.0, 5.0, 11.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.0, -73.265625, -70.53125, -67.796875, -65.0625, -62.328125, -59.59375, -56.859375, -54.125, -51.390625, -48.65625, -45.921875, -43.1875, -40.453125, -37.71875, -34.984375, -32.25, -29.515625, -26.78125, -24.046875, -21.3125, -18.578125, -15.84375, -13.109375, -10.375, -7.640625, -4.90625, -2.171875, 0.5625, 3.296875, 6.03125, 8.765625, 11.5, 14.234375, 16.96875, 19.703125, 22.4375, 25.171875, 27.90625, 30.640625, 33.375, 36.109375, 38.84375, 41.578125, 44.3125, 47.046875, 49.78125, 52.515625, 55.25, 57.984375, 60.71875, 63.453125, 66.1875, 68.921875, 71.65625, 74.390625, 77.125, 79.859375, 82.59375, 85.328125, 88.0625, 90.796875, 93.53125, 96.265625, 99.0]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 28.0, 303.0, 548.0, 127.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-265.9557189941406, -261.1466979980469, -256.3376770019531, -251.52865600585938, -246.71963500976562, -241.91061401367188, -237.10159301757812, -232.29258728027344, -227.4835662841797, -222.67454528808594, -217.8655242919922, -213.05650329589844, -208.2474822998047, -203.4384765625, -198.62945556640625, -193.8204345703125, -189.01141357421875, -184.202392578125, -179.39337158203125, -174.5843505859375, -169.77532958984375, -164.96630859375, -160.15728759765625, -155.34828186035156, -150.53924560546875, -145.730224609375, -140.92120361328125, -136.1121826171875, -131.30316162109375, -126.49414825439453, -121.68512725830078, -116.87611389160156, -112.06709289550781, -107.25807189941406, -102.44905090332031, -97.64002990722656, -92.83101654052734, -88.0219955444336, -83.21297454833984, -78.40396118164062, -73.59494018554688, -68.78591918945312, -63.97690200805664, -59.16788101196289, -54.358863830566406, -49.549842834472656, -44.740821838378906, -39.93180465698242, -35.12278366088867, -30.313764572143555, -25.504745483398438, -20.695724487304688, -15.88670539855957, -11.077686309814453, -6.268665313720703, -1.4596481323242188, 3.3493728637695312, 8.158391952514648, 12.967411994934082, 17.776432037353516, 22.585451126098633, 27.39447021484375, 32.2034912109375, 37.012508392333984, 41.821529388427734]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 2.0, 6.0, 4.0, 7.0, 11.0, 20.0, 10.0, 20.0, 18.0, 15.0, 22.0, 23.0, 29.0, 24.0, 36.0, 39.0, 35.0, 28.0, 36.0, 35.0, 46.0, 40.0, 45.0, 35.0, 39.0, 39.0, 30.0, 47.0, 38.0, 23.0, 25.0, 27.0, 22.0, 18.0, 8.0, 13.0, 13.0, 7.0, 13.0, 10.0, 9.0, 6.0, 6.0, 4.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0], "bins": [-44.75486373901367, -43.29269027709961, -41.83052062988281, -40.36834716796875, -38.90617370605469, -37.44400405883789, -35.98183059692383, -34.51966094970703, -33.05748748779297, -31.59531593322754, -30.13314437866211, -28.670970916748047, -27.208799362182617, -25.746627807617188, -24.284454345703125, -22.822282791137695, -21.360111236572266, -19.897939682006836, -18.435768127441406, -16.973594665527344, -15.511423110961914, -14.049251556396484, -12.587079048156738, -11.124906539916992, -9.662734985351562, -8.200563430786133, -6.738390922546387, -5.276218891143799, -3.814046859741211, -2.351874828338623, -0.8897027969360352, 0.5724697113037109, 2.0346450805664062, 3.496817111968994, 4.958989143371582, 6.42116117477417, 7.883333206176758, 9.345504760742188, 10.807677268981934, 12.26984977722168, 13.73202133178711, 15.194192886352539, 16.65636444091797, 18.11853790283203, 19.58070945739746, 21.04288101196289, 22.505054473876953, 23.967226028442383, 25.429397583007812, 26.891569137573242, 28.353740692138672, 29.815914154052734, 31.278085708618164, 32.740257263183594, 34.202430725097656, 35.66460418701172, 37.126773834228516, 38.58894729614258, 40.051116943359375, 41.51329040527344, 42.9754638671875, 44.4376335144043, 45.89980697631836, 47.361976623535156, 48.82415008544922]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 5.0, 4.0, 3.0, 10.0, 7.0, 12.0, 12.0, 14.0, 9.0, 17.0, 25.0, 35.0, 30.0, 30.0, 29.0, 37.0, 41.0, 58.0, 48.0, 47.0, 32.0, 55.0, 30.0, 52.0, 48.0, 35.0, 35.0, 34.0, 32.0, 35.0, 30.0, 20.0, 22.0, 14.0, 11.0, 9.0, 15.0, 7.0, 4.0, 1.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265625, -5.0556640625, -4.845703125, -4.6357421875, -4.42578125, -4.2158203125, -4.005859375, -3.7958984375, -3.5859375, -3.3759765625, -3.166015625, -2.9560546875, -2.74609375, -2.5361328125, -2.326171875, -2.1162109375, -1.90625, -1.6962890625, -1.486328125, -1.2763671875, -1.06640625, -0.8564453125, -0.646484375, -0.4365234375, -0.2265625, -0.0166015625, 0.193359375, 0.4033203125, 0.61328125, 0.8232421875, 1.033203125, 1.2431640625, 1.453125, 1.6630859375, 1.873046875, 2.0830078125, 2.29296875, 2.5029296875, 2.712890625, 2.9228515625, 3.1328125, 3.3427734375, 3.552734375, 3.7626953125, 3.97265625, 4.1826171875, 4.392578125, 4.6025390625, 4.8125, 5.0224609375, 5.232421875, 5.4423828125, 5.65234375, 5.8623046875, 6.072265625, 6.2822265625, 6.4921875, 6.7021484375, 6.912109375, 7.1220703125, 7.33203125, 7.5419921875, 7.751953125, 7.9619140625, 8.171875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 4.0, 8.0, 3.0, 4.0, 8.0, 8.0, 9.0, 12.0, 13.0, 17.0, 14.0, 25.0, 28.0, 33.0, 42.0, 67.0, 96.0, 165.0, 452.0, 2073.0, 44905.0, 2109549.0, 1996325.0, 37669.0, 1834.0, 382.0, 163.0, 81.0, 60.0, 52.0, 38.0, 32.0, 18.0, 19.0, 14.0, 13.0, 14.0, 12.0, 5.0, 8.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.203125, -17.474609375, -16.74609375, -16.017578125, -15.2890625, -14.560546875, -13.83203125, -13.103515625, -12.375, -11.646484375, -10.91796875, -10.189453125, -9.4609375, -8.732421875, -8.00390625, -7.275390625, -6.546875, -5.818359375, -5.08984375, -4.361328125, -3.6328125, -2.904296875, -2.17578125, -1.447265625, -0.71875, 0.009765625, 0.73828125, 1.466796875, 2.1953125, 2.923828125, 3.65234375, 4.380859375, 5.109375, 5.837890625, 6.56640625, 7.294921875, 8.0234375, 8.751953125, 9.48046875, 10.208984375, 10.9375, 11.666015625, 12.39453125, 13.123046875, 13.8515625, 14.580078125, 15.30859375, 16.037109375, 16.765625, 17.494140625, 18.22265625, 18.951171875, 19.6796875, 20.408203125, 21.13671875, 21.865234375, 22.59375, 23.322265625, 24.05078125, 24.779296875, 25.5078125, 26.236328125, 26.96484375, 27.693359375, 28.421875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 13.0, 12.0, 11.0, 18.0, 25.0, 38.0, 52.0, 86.0, 85.0, 120.0, 150.0, 213.0, 261.0, 363.0, 378.0, 456.0, 371.0, 336.0, 267.0, 216.0, 167.0, 97.0, 86.0, 44.0, 54.0, 30.0, 30.0, 21.0, 16.0, 15.0, 6.0, 4.0, 3.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1328125, -11.74658203125, -11.3603515625, -10.97412109375, -10.587890625, -10.20166015625, -9.8154296875, -9.42919921875, -9.04296875, -8.65673828125, -8.2705078125, -7.88427734375, -7.498046875, -7.11181640625, -6.7255859375, -6.33935546875, -5.953125, -5.56689453125, -5.1806640625, -4.79443359375, -4.408203125, -4.02197265625, -3.6357421875, -3.24951171875, -2.86328125, -2.47705078125, -2.0908203125, -1.70458984375, -1.318359375, -0.93212890625, -0.5458984375, -0.15966796875, 0.2265625, 0.61279296875, 0.9990234375, 1.38525390625, 1.771484375, 2.15771484375, 2.5439453125, 2.93017578125, 3.31640625, 3.70263671875, 4.0888671875, 4.47509765625, 4.861328125, 5.24755859375, 5.6337890625, 6.02001953125, 6.40625, 6.79248046875, 7.1787109375, 7.56494140625, 7.951171875, 8.33740234375, 8.7236328125, 9.10986328125, 9.49609375, 9.88232421875, 10.2685546875, 10.65478515625, 11.041015625, 11.42724609375, 11.8134765625, 12.19970703125, 12.5859375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 10.0, 14.0, 15.0, 18.0, 30.0, 28.0, 45.0, 65.0, 87.0, 103.0, 182.0, 224.0, 482.0, 1565.0, 28068.0, 3178620.0, 974560.0, 8115.0, 911.0, 346.0, 228.0, 165.0, 120.0, 79.0, 56.0, 50.0, 28.0, 15.0, 16.0, 13.0, 8.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.65625, -27.34423828125, -26.0322265625, -24.72021484375, -23.408203125, -22.09619140625, -20.7841796875, -19.47216796875, -18.16015625, -16.84814453125, -15.5361328125, -14.22412109375, -12.912109375, -11.60009765625, -10.2880859375, -8.97607421875, -7.6640625, -6.35205078125, -5.0400390625, -3.72802734375, -2.416015625, -1.10400390625, 0.2080078125, 1.52001953125, 2.83203125, 4.14404296875, 5.4560546875, 6.76806640625, 8.080078125, 9.39208984375, 10.7041015625, 12.01611328125, 13.328125, 14.64013671875, 15.9521484375, 17.26416015625, 18.576171875, 19.88818359375, 21.2001953125, 22.51220703125, 23.82421875, 25.13623046875, 26.4482421875, 27.76025390625, 29.072265625, 30.38427734375, 31.6962890625, 33.00830078125, 34.3203125, 35.63232421875, 36.9443359375, 38.25634765625, 39.568359375, 40.88037109375, 42.1923828125, 43.50439453125, 44.81640625, 46.12841796875, 47.4404296875, 48.75244140625, 50.064453125, 51.37646484375, 52.6884765625, 54.00048828125, 55.3125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 9.0, 14.0, 37.0, 59.0, 117.0, 134.0, 154.0, 142.0, 139.0, 91.0, 55.0, 30.0, 12.0, 7.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.99246978759766, -82.63236999511719, -80.27227783203125, -77.91217803955078, -75.55208587646484, -73.19198608398438, -70.83189392089844, -68.47179412841797, -66.1116943359375, -63.7515983581543, -61.391502380371094, -59.03140640258789, -56.67131042480469, -54.31121063232422, -51.951114654541016, -49.59101867675781, -47.230926513671875, -44.87083053588867, -42.51073455810547, -40.150638580322266, -37.79054260253906, -35.430442810058594, -33.07034683227539, -30.710250854492188, -28.350154876708984, -25.99005889892578, -23.629962921142578, -21.269865036010742, -18.90976905822754, -16.549673080444336, -14.189576148986816, -11.829479217529297, -9.469375610351562, -7.109279155731201, -4.74918270111084, -2.3890862464904785, -0.028989791870117188, 2.331106185913086, 4.6912031173706055, 7.051300048828125, 9.411396026611328, 11.771492004394531, 14.13158893585205, 16.49168586730957, 18.851781845092773, 21.211877822875977, 23.571975708007812, 25.932071685791016, 28.29216766357422, 30.652263641357422, 33.012359619140625, 35.37245559692383, 37.73255157470703, 40.0926513671875, 42.4527473449707, 44.812843322753906, 47.17293930053711, 49.53303527832031, 51.893131256103516, 54.25322723388672, 56.61332702636719, 58.973419189453125, 61.333518981933594, 63.6936149597168, 66.0537109375]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 1.0, 4.0, 4.0, 10.0, 8.0, 5.0, 12.0, 13.0, 20.0, 11.0, 20.0, 23.0, 24.0, 25.0, 25.0, 26.0, 22.0, 25.0, 42.0, 40.0, 46.0, 31.0, 45.0, 35.0, 39.0, 40.0, 49.0, 39.0, 33.0, 21.0, 27.0, 26.0, 30.0, 25.0, 32.0, 15.0, 12.0, 19.0, 14.0, 16.0, 12.0, 8.0, 6.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-33.96825408935547, -32.69132614135742, -31.414400100708008, -30.13747215270996, -28.860546112060547, -27.5836181640625, -26.306690216064453, -25.02976417541504, -23.752838134765625, -22.475910186767578, -21.198984146118164, -19.922056198120117, -18.645130157470703, -17.368202209472656, -16.09127426147461, -14.814348220825195, -13.537420272827148, -12.260493278503418, -10.983566284179688, -9.70663833618164, -8.429712295532227, -7.152784824371338, -5.875857353210449, -4.598930358886719, -3.3220033645629883, -2.045076370239258, -0.7681491374969482, 0.5087780952453613, 1.7857050895690918, 3.0626320838928223, 4.339559555053711, 5.616486549377441, 6.893413543701172, 8.170340538024902, 9.447267532348633, 10.72419548034668, 12.001121520996094, 13.27804946899414, 14.554976463317871, 15.831903457641602, 17.108829498291016, 18.385757446289062, 19.662683486938477, 20.939611434936523, 22.216537475585938, 23.493465423583984, 24.77039337158203, 26.047319412231445, 27.324247360229492, 28.60117530822754, 29.878101348876953, 31.155029296875, 32.43195724487305, 33.70888137817383, 34.985809326171875, 36.26273727416992, 37.53966522216797, 38.816593170166016, 40.09352111816406, 41.370445251464844, 42.64737319946289, 43.92430114746094, 45.201229095458984, 46.47815704345703, 47.75508117675781]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 14.0, 12.0, 13.0, 19.0, 20.0, 24.0, 30.0, 39.0, 22.0, 42.0, 39.0, 47.0, 49.0, 40.0, 51.0, 53.0, 38.0, 51.0, 40.0, 43.0, 41.0, 38.0, 39.0, 39.0, 34.0, 15.0, 19.0, 13.0, 18.0, 11.0, 11.0, 3.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2401123046875, -5.027099609375, -4.8140869140625, -4.60107421875, -4.3880615234375, -4.175048828125, -3.9620361328125, -3.7490234375, -3.5360107421875, -3.322998046875, -3.1099853515625, -2.89697265625, -2.6839599609375, -2.470947265625, -2.2579345703125, -2.044921875, -1.8319091796875, -1.618896484375, -1.4058837890625, -1.19287109375, -0.9798583984375, -0.766845703125, -0.5538330078125, -0.3408203125, -0.1278076171875, 0.085205078125, 0.2982177734375, 0.51123046875, 0.7242431640625, 0.937255859375, 1.1502685546875, 1.36328125, 1.5762939453125, 1.789306640625, 2.0023193359375, 2.21533203125, 2.4283447265625, 2.641357421875, 2.8543701171875, 3.0673828125, 3.2803955078125, 3.493408203125, 3.7064208984375, 3.91943359375, 4.1324462890625, 4.345458984375, 4.5584716796875, 4.771484375, 4.9844970703125, 5.197509765625, 5.4105224609375, 5.62353515625, 5.8365478515625, 6.049560546875, 6.2625732421875, 6.4755859375, 6.6885986328125, 6.901611328125, 7.1146240234375, 7.32763671875, 7.5406494140625, 7.753662109375, 7.9666748046875, 8.1796875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 11.0, 11.0, 16.0, 25.0, 22.0, 53.0, 67.0, 96.0, 158.0, 257.0, 385.0, 694.0, 1148.0, 1896.0, 3134.0, 5266.0, 8681.0, 15126.0, 26502.0, 47954.0, 90157.0, 192009.0, 315622.0, 162130.0, 78544.0, 41774.0, 23442.0, 13702.0, 7969.0, 4663.0, 2816.0, 1725.0, 990.0, 595.0, 347.0, 213.0, 132.0, 77.0, 55.0, 39.0, 21.0, 12.0, 8.0, 9.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.275390625, -1.2371978759765625, -1.199005126953125, -1.1608123779296875, -1.12261962890625, -1.0844268798828125, -1.046234130859375, -1.0080413818359375, -0.9698486328125, -0.9316558837890625, -0.893463134765625, -0.8552703857421875, -0.81707763671875, -0.7788848876953125, -0.740692138671875, -0.7024993896484375, -0.664306640625, -0.6261138916015625, -0.587921142578125, -0.5497283935546875, -0.51153564453125, -0.4733428955078125, -0.435150146484375, -0.3969573974609375, -0.3587646484375, -0.3205718994140625, -0.282379150390625, -0.2441864013671875, -0.20599365234375, -0.1678009033203125, -0.129608154296875, -0.0914154052734375, -0.05322265625, -0.0150299072265625, 0.023162841796875, 0.0613555908203125, 0.09954833984375, 0.1377410888671875, 0.175933837890625, 0.2141265869140625, 0.2523193359375, 0.2905120849609375, 0.328704833984375, 0.3668975830078125, 0.40509033203125, 0.4432830810546875, 0.481475830078125, 0.5196685791015625, 0.557861328125, 0.5960540771484375, 0.634246826171875, 0.6724395751953125, 0.71063232421875, 0.7488250732421875, 0.787017822265625, 0.8252105712890625, 0.8634033203125, 0.9015960693359375, 0.939788818359375, 0.9779815673828125, 1.01617431640625, 1.0543670654296875, 1.092559814453125, 1.1307525634765625, 1.1689453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 2.0, 4.0, 11.0, 9.0, 14.0, 9.0, 11.0, 19.0, 21.0, 24.0, 21.0, 28.0, 40.0, 37.0, 36.0, 34.0, 39.0, 34.0, 50.0, 41.0, 1069.0, 45.0, 46.0, 34.0, 29.0, 41.0, 32.0, 31.0, 27.0, 25.0, 31.0, 24.0, 20.0, 17.0, 11.0, 8.0, 13.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.483673095703125, -3.36383056640625, -3.243988037109375, -3.1241455078125, -3.004302978515625, -2.88446044921875, -2.764617919921875, -2.644775390625, -2.524932861328125, -2.40509033203125, -2.285247802734375, -2.1654052734375, -2.045562744140625, -1.92572021484375, -1.805877685546875, -1.68603515625, -1.566192626953125, -1.44635009765625, -1.326507568359375, -1.2066650390625, -1.086822509765625, -0.96697998046875, -0.847137451171875, -0.727294921875, -0.607452392578125, -0.48760986328125, -0.367767333984375, -0.2479248046875, -0.128082275390625, -0.00823974609375, 0.111602783203125, 0.2314453125, 0.351287841796875, 0.47113037109375, 0.590972900390625, 0.7108154296875, 0.830657958984375, 0.95050048828125, 1.070343017578125, 1.190185546875, 1.310028076171875, 1.42987060546875, 1.549713134765625, 1.6695556640625, 1.789398193359375, 1.90924072265625, 2.029083251953125, 2.14892578125, 2.268768310546875, 2.38861083984375, 2.508453369140625, 2.6282958984375, 2.748138427734375, 2.86798095703125, 2.987823486328125, 3.107666015625, 3.227508544921875, 3.34735107421875, 3.467193603515625, 3.5870361328125, 3.706878662109375, 3.82672119140625, 3.946563720703125, 4.06640625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 9.0, 2.0, 6.0, 6.0, 14.0, 17.0, 7.0, 34.0, 41.0, 54.0, 86.0, 114.0, 143.0, 221.0, 331.0, 468.0, 701.0, 994.0, 1505.0, 2268.0, 3511.0, 5349.0, 8327.0, 13098.0, 20691.0, 33983.0, 56970.0, 102216.0, 206577.0, 1319439.0, 134982.0, 71573.0, 41760.0, 25711.0, 16149.0, 10275.0, 6636.0, 4275.0, 2733.0, 1849.0, 1241.0, 847.0, 583.0, 407.0, 272.0, 189.0, 147.0, 98.0, 71.0, 53.0, 30.0, 29.0, 18.0, 9.0, 11.0, 11.0, 2.0, 1.0, 3.0], "bins": [-1.0654296875, -1.0342864990234375, -1.003143310546875, -0.9720001220703125, -0.94085693359375, -0.9097137451171875, -0.878570556640625, -0.8474273681640625, -0.8162841796875, -0.7851409912109375, -0.753997802734375, -0.7228546142578125, -0.69171142578125, -0.6605682373046875, -0.629425048828125, -0.5982818603515625, -0.567138671875, -0.5359954833984375, -0.504852294921875, -0.4737091064453125, -0.44256591796875, -0.4114227294921875, -0.380279541015625, -0.3491363525390625, -0.3179931640625, -0.2868499755859375, -0.255706787109375, -0.2245635986328125, -0.19342041015625, -0.1622772216796875, -0.131134033203125, -0.0999908447265625, -0.06884765625, -0.0377044677734375, -0.006561279296875, 0.0245819091796875, 0.05572509765625, 0.0868682861328125, 0.118011474609375, 0.1491546630859375, 0.1802978515625, 0.2114410400390625, 0.242584228515625, 0.2737274169921875, 0.30487060546875, 0.3360137939453125, 0.367156982421875, 0.3983001708984375, 0.429443359375, 0.4605865478515625, 0.491729736328125, 0.5228729248046875, 0.55401611328125, 0.5851593017578125, 0.616302490234375, 0.6474456787109375, 0.6785888671875, 0.7097320556640625, 0.740875244140625, 0.7720184326171875, 0.80316162109375, 0.8343048095703125, 0.865447998046875, 0.8965911865234375, 0.927734375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 10.0, 12.0, 17.0, 14.0, 30.0, 23.0, 46.0, 54.0, 52.0, 63.0, 80.0, 82.0, 96.0, 79.0, 68.0, 57.0, 41.0, 36.0, 28.0, 24.0, 14.0, 9.0, 8.0, 10.0, 4.0, 7.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.0012731552124023438, -0.0012330114841461182, -0.0011928677558898926, -0.001152724027633667, -0.0011125802993774414, -0.0010724365711212158, -0.0010322928428649902, -0.0009921491146087646, -0.0009520053863525391, -0.0009118616580963135, -0.0008717179298400879, -0.0008315742015838623, -0.0007914304733276367, -0.0007512867450714111, -0.0007111430168151855, -0.00067099928855896, -0.0006308555603027344, -0.0005907118320465088, -0.0005505681037902832, -0.0005104243755340576, -0.00047028064727783203, -0.00043013691902160645, -0.00038999319076538086, -0.0003498494625091553, -0.0003097057342529297, -0.0002695620059967041, -0.00022941827774047852, -0.00018927454948425293, -0.00014913082122802734, -0.00010898709297180176, -6.884336471557617e-05, -2.8699636459350586e-05, 1.1444091796875e-05, 5.1587820053100586e-05, 9.173154830932617e-05, 0.00013187527656555176, 0.00017201900482177734, 0.00021216273307800293, 0.0002523064613342285, 0.0002924501895904541, 0.0003325939178466797, 0.0003727376461029053, 0.00041288137435913086, 0.00045302510261535645, 0.000493168830871582, 0.0005333125591278076, 0.0005734562873840332, 0.0006136000156402588, 0.0006537437438964844, 0.00069388747215271, 0.0007340312004089355, 0.0007741749286651611, 0.0008143186569213867, 0.0008544623851776123, 0.0008946061134338379, 0.0009347498416900635, 0.0009748935699462891, 0.0010150372982025146, 0.0010551810264587402, 0.0010953247547149658, 0.0011354684829711914, 0.001175612211227417, 0.0012157559394836426, 0.0012558996677398682, 0.0012960433959960938]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 8.0, 6.0, 6.0, 15.0, 11.0, 13.0, 21.0, 42.0, 50.0, 64.0, 146.0, 235.0, 523.0, 2943.0, 1020774.0, 22204.0, 752.0, 262.0, 156.0, 92.0, 73.0, 45.0, 30.0, 21.0, 10.0, 12.0, 9.0, 8.0, 4.0, 5.0, 3.0, 0.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02911376953125, -0.02822256088256836, -0.02733135223388672, -0.026440143585205078, -0.025548934936523438, -0.024657726287841797, -0.023766517639160156, -0.022875308990478516, -0.021984100341796875, -0.021092891693115234, -0.020201683044433594, -0.019310474395751953, -0.018419265747070312, -0.017528057098388672, -0.01663684844970703, -0.01574563980102539, -0.01485443115234375, -0.01396322250366211, -0.013072013854980469, -0.012180805206298828, -0.011289596557617188, -0.010398387908935547, -0.009507179260253906, -0.008615970611572266, -0.007724761962890625, -0.006833553314208984, -0.005942344665527344, -0.005051136016845703, -0.0041599273681640625, -0.003268718719482422, -0.0023775100708007812, -0.0014863014221191406, -0.0005950927734375, 0.0002961158752441406, 0.0011873245239257812, 0.002078533172607422, 0.0029697418212890625, 0.003860950469970703, 0.004752159118652344, 0.005643367767333984, 0.006534576416015625, 0.007425785064697266, 0.008316993713378906, 0.009208202362060547, 0.010099411010742188, 0.010990619659423828, 0.011881828308105469, 0.01277303695678711, 0.01366424560546875, 0.01455545425415039, 0.015446662902832031, 0.016337871551513672, 0.017229080200195312, 0.018120288848876953, 0.019011497497558594, 0.019902706146240234, 0.020793914794921875, 0.021685123443603516, 0.022576332092285156, 0.023467540740966797, 0.024358749389648438, 0.025249958038330078, 0.02614116668701172, 0.02703237533569336, 0.027923583984375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 10.0, 43.0, 55.0, 123.0, 203.0, 205.0, 169.0, 114.0, 56.0, 15.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012491774978116155, -0.001207944587804377, -0.0011667115613818169, -0.0011254786513745785, -0.00108424574136734, -0.0010430127149447799, -0.0010017798049375415, -0.0009605468367226422, -0.0009193138685077429, -0.0008780809002928436, -0.0008368479320779443, -0.0007956150220707059, -0.0007543820538558066, -0.0007131490856409073, -0.0006719161756336689, -0.0006306832074187696, -0.0005894502392038703, -0.000548217270988971, -0.0005069843027740717, -0.0004657513927668333, -0.000424518424551934, -0.0003832854563370347, -0.00034205251722596586, -0.000300819578114897, -0.0002595866098999977, -0.00021835365623701364, -0.00017712070257402956, -0.0001358877489110455, -9.465479524806142e-05, -5.3421841585077345e-05, -1.2188887922093272e-05, 2.9044051188975573e-05, 7.02771358191967e-05, 0.00011151008948218077, 0.00015274304314516485, 0.00019397599680814892, 0.000235208950471133, 0.0002764419186860323, 0.00031767485779710114, 0.00035890779690817, 0.0004001407651230693, 0.0004413737333379686, 0.00048260667244903743, 0.0005238396115601063, 0.0005650725797750056, 0.0006063055479899049, 0.0006475384579971433, 0.0006887714262120426, 0.0007300043944269419, 0.0007712373626418412, 0.0008124703308567405, 0.0008537032408639789, 0.0008949362090788782, 0.0009361691772937775, 0.0009774020873010159, 0.0010186349973082542, 0.0010598680237308145, 0.0011011009337380528, 0.001142333960160613, 0.0011835668701678514, 0.0012247997801750898, 0.00126603280659765, 0.0013072657166048884, 0.0013484987430274487, 0.001389731653034687]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 3.0, 2.0, 9.0, 9.0, 9.0, 9.0, 12.0, 14.0, 13.0, 20.0, 27.0, 19.0, 23.0, 27.0, 25.0, 27.0, 45.0, 38.0, 48.0, 49.0, 40.0, 50.0, 40.0, 34.0, 32.0, 45.0, 31.0, 32.0, 26.0, 42.0, 27.0, 22.0, 24.0, 19.0, 19.0, 21.0, 13.0, 9.0, 14.0, 11.0, 13.0, 5.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0005900859832763672, -0.0005727093666791916, -0.000555332750082016, -0.0005379561334848404, -0.0005205795168876648, -0.0005032029002904892, -0.0004858262836933136, -0.000468449667096138, -0.0004510730504989624, -0.0004336964339017868, -0.0004163198173046112, -0.0003989432007074356, -0.00038156658411026, -0.0003641899675130844, -0.0003468133509159088, -0.0003294367343187332, -0.0003120601177215576, -0.000294683501124382, -0.0002773068845272064, -0.0002599302679300308, -0.00024255365133285522, -0.00022517703473567963, -0.00020780041813850403, -0.00019042380154132843, -0.00017304718494415283, -0.00015567056834697723, -0.00013829395174980164, -0.00012091733515262604, -0.00010354071855545044, -8.616410195827484e-05, -6.878748536109924e-05, -5.1410868763923645e-05, -3.403425216674805e-05, -1.665763556957245e-05, 7.189810276031494e-07, 1.8095597624778748e-05, 3.5472214221954346e-05, 5.2848830819129944e-05, 7.022544741630554e-05, 8.760206401348114e-05, 0.00010497868061065674, 0.00012235529720783234, 0.00013973191380500793, 0.00015710853040218353, 0.00017448514699935913, 0.00019186176359653473, 0.00020923838019371033, 0.00022661499679088593, 0.00024399161338806152, 0.0002613682299852371, 0.0002787448465824127, 0.0002961214631795883, 0.0003134980797767639, 0.0003308746963739395, 0.0003482513129711151, 0.0003656279295682907, 0.0003830045461654663, 0.0004003811627626419, 0.0004177577793598175, 0.0004351343959569931, 0.0004525110125541687, 0.0004698876291513443, 0.0004872642457485199, 0.0005046408623456955, 0.0005220174789428711]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 11.0, 14.0, 12.0, 13.0, 19.0, 20.0, 24.0, 30.0, 39.0, 22.0, 42.0, 39.0, 47.0, 49.0, 40.0, 51.0, 53.0, 38.0, 51.0, 40.0, 43.0, 41.0, 38.0, 39.0, 39.0, 34.0, 15.0, 19.0, 13.0, 18.0, 11.0, 11.0, 3.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.453125, -5.2401123046875, -5.027099609375, -4.8140869140625, -4.60107421875, -4.3880615234375, -4.175048828125, -3.9620361328125, -3.7490234375, -3.5360107421875, -3.322998046875, -3.1099853515625, -2.89697265625, -2.6839599609375, -2.470947265625, -2.2579345703125, -2.044921875, -1.8319091796875, -1.618896484375, -1.4058837890625, -1.19287109375, -0.9798583984375, -0.766845703125, -0.5538330078125, -0.3408203125, -0.1278076171875, 0.085205078125, 0.2982177734375, 0.51123046875, 0.7242431640625, 0.937255859375, 1.1502685546875, 1.36328125, 1.5762939453125, 1.789306640625, 2.0023193359375, 2.21533203125, 2.4283447265625, 2.641357421875, 2.8543701171875, 3.0673828125, 3.2803955078125, 3.493408203125, 3.7064208984375, 3.91943359375, 4.1324462890625, 4.345458984375, 4.5584716796875, 4.771484375, 4.9844970703125, 5.197509765625, 5.4105224609375, 5.62353515625, 5.8365478515625, 6.049560546875, 6.2625732421875, 6.4755859375, 6.6885986328125, 6.901611328125, 7.1146240234375, 7.32763671875, 7.5406494140625, 7.753662109375, 7.9666748046875, 8.1796875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 10.0, 17.0, 15.0, 18.0, 34.0, 43.0, 57.0, 70.0, 89.0, 124.0, 188.0, 266.0, 453.0, 728.0, 1463.0, 2925.0, 6385.0, 15090.0, 33148.0, 71629.0, 156882.0, 344330.0, 229445.0, 99638.0, 46248.0, 21179.0, 9302.0, 4209.0, 1923.0, 986.0, 558.0, 326.0, 202.0, 153.0, 108.0, 74.0, 58.0, 45.0, 29.0, 31.0, 11.0, 11.0, 19.0, 6.0, 3.0, 6.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.75, -5.56280517578125, -5.3756103515625, -5.18841552734375, -5.001220703125, -4.81402587890625, -4.6268310546875, -4.43963623046875, -4.25244140625, -4.06524658203125, -3.8780517578125, -3.69085693359375, -3.503662109375, -3.31646728515625, -3.1292724609375, -2.94207763671875, -2.7548828125, -2.56768798828125, -2.3804931640625, -2.19329833984375, -2.006103515625, -1.81890869140625, -1.6317138671875, -1.44451904296875, -1.25732421875, -1.07012939453125, -0.8829345703125, -0.69573974609375, -0.508544921875, -0.32135009765625, -0.1341552734375, 0.05303955078125, 0.240234375, 0.42742919921875, 0.6146240234375, 0.80181884765625, 0.989013671875, 1.17620849609375, 1.3634033203125, 1.55059814453125, 1.73779296875, 1.92498779296875, 2.1121826171875, 2.29937744140625, 2.486572265625, 2.67376708984375, 2.8609619140625, 3.04815673828125, 3.2353515625, 3.42254638671875, 3.6097412109375, 3.79693603515625, 3.984130859375, 4.17132568359375, 4.3585205078125, 4.54571533203125, 4.73291015625, 4.92010498046875, 5.1072998046875, 5.29449462890625, 5.481689453125, 5.66888427734375, 5.8560791015625, 6.04327392578125, 6.23046875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [5.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 10.0, 6.0, 17.0, 10.0, 11.0, 10.0, 15.0, 31.0, 29.0, 33.0, 28.0, 33.0, 38.0, 39.0, 63.0, 92.0, 143.0, 1406.0, 358.0, 152.0, 90.0, 51.0, 49.0, 30.0, 33.0, 29.0, 37.0, 29.0, 23.0, 25.0, 23.0, 17.0, 18.0, 11.0, 14.0, 11.0, 5.0, 4.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.9375, -16.309814453125, -15.68212890625, -15.054443359375, -14.4267578125, -13.799072265625, -13.17138671875, -12.543701171875, -11.916015625, -11.288330078125, -10.66064453125, -10.032958984375, -9.4052734375, -8.777587890625, -8.14990234375, -7.522216796875, -6.89453125, -6.266845703125, -5.63916015625, -5.011474609375, -4.3837890625, -3.756103515625, -3.12841796875, -2.500732421875, -1.873046875, -1.245361328125, -0.61767578125, 0.010009765625, 0.6376953125, 1.265380859375, 1.89306640625, 2.520751953125, 3.1484375, 3.776123046875, 4.40380859375, 5.031494140625, 5.6591796875, 6.286865234375, 6.91455078125, 7.542236328125, 8.169921875, 8.797607421875, 9.42529296875, 10.052978515625, 10.6806640625, 11.308349609375, 11.93603515625, 12.563720703125, 13.19140625, 13.819091796875, 14.44677734375, 15.074462890625, 15.7021484375, 16.329833984375, 16.95751953125, 17.585205078125, 18.212890625, 18.840576171875, 19.46826171875, 20.095947265625, 20.7236328125, 21.351318359375, 21.97900390625, 22.606689453125, 23.234375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 8.0, 5.0, 6.0, 10.0, 9.0, 9.0, 14.0, 12.0, 11.0, 17.0, 25.0, 27.0, 37.0, 42.0, 50.0, 61.0, 82.0, 93.0, 138.0, 175.0, 292.0, 484.0, 1161.0, 18106.0, 3044328.0, 77088.0, 1712.0, 596.0, 287.0, 202.0, 123.0, 99.0, 86.0, 59.0, 46.0, 30.0, 33.0, 32.0, 17.0, 16.0, 21.0, 11.0, 8.0, 5.0, 8.0, 5.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0], "bins": [-52.625, -50.9609375, -49.296875, -47.6328125, -45.96875, -44.3046875, -42.640625, -40.9765625, -39.3125, -37.6484375, -35.984375, -34.3203125, -32.65625, -30.9921875, -29.328125, -27.6640625, -26.0, -24.3359375, -22.671875, -21.0078125, -19.34375, -17.6796875, -16.015625, -14.3515625, -12.6875, -11.0234375, -9.359375, -7.6953125, -6.03125, -4.3671875, -2.703125, -1.0390625, 0.625, 2.2890625, 3.953125, 5.6171875, 7.28125, 8.9453125, 10.609375, 12.2734375, 13.9375, 15.6015625, 17.265625, 18.9296875, 20.59375, 22.2578125, 23.921875, 25.5859375, 27.25, 28.9140625, 30.578125, 32.2421875, 33.90625, 35.5703125, 37.234375, 38.8984375, 40.5625, 42.2265625, 43.890625, 45.5546875, 47.21875, 48.8828125, 50.546875, 52.2109375, 53.875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 26.0, 115.0, 296.0, 375.0, 149.0, 37.0, 10.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.363853454589844, -35.44792938232422, -32.53200149536133, -29.61607551574707, -26.700149536132812, -23.784223556518555, -20.868297576904297, -17.95237159729004, -15.036445617675781, -12.120519638061523, -9.204593658447266, -6.288667678833008, -3.37274169921875, -0.4568157196044922, 2.4591102600097656, 5.375036239624023, 8.290962219238281, 11.206888198852539, 14.122814178466797, 17.038740158081055, 19.954666137695312, 22.87059211730957, 25.786518096923828, 28.702444076538086, 31.618370056152344, 34.53429412841797, 37.45022201538086, 40.36614990234375, 43.282073974609375, 46.197998046875, 49.11392593383789, 52.02985382080078, 54.94578552246094, 57.86170959472656, 60.77763748168945, 63.693565368652344, 66.60948944091797, 69.5254135131836, 72.44134521484375, 75.35726928710938, 78.273193359375, 81.18911743164062, 84.10504150390625, 87.0209732055664, 89.93689727783203, 92.85282135009766, 95.76875305175781, 98.68467712402344, 101.60060119628906, 104.51652526855469, 107.43244934082031, 110.34838104248047, 113.2643051147461, 116.18022918701172, 119.09616088867188, 122.0120849609375, 124.92800903320312, 127.84393310546875, 130.75985717773438, 133.67578125, 136.59170532226562, 139.5076446533203, 142.42356872558594, 145.33949279785156, 148.2554168701172]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 7.0, 2.0, 3.0, 7.0, 10.0, 1.0, 10.0, 10.0, 7.0, 10.0, 13.0, 18.0, 18.0, 25.0, 25.0, 23.0, 19.0, 37.0, 37.0, 38.0, 38.0, 46.0, 41.0, 44.0, 44.0, 45.0, 44.0, 42.0, 58.0, 30.0, 30.0, 37.0, 26.0, 18.0, 29.0, 20.0, 16.0, 12.0, 10.0, 5.0, 13.0, 7.0, 9.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-59.63190841674805, -57.779335021972656, -55.9267578125, -54.07418441772461, -52.22161102294922, -50.36903762817383, -48.51646423339844, -46.66388702392578, -44.81131362915039, -42.958740234375, -41.106163024902344, -39.25358963012695, -37.40101623535156, -35.54844284057617, -33.69586944580078, -31.843292236328125, -29.990718841552734, -28.138145446777344, -26.28557014465332, -24.432994842529297, -22.580421447753906, -20.727848052978516, -18.875272750854492, -17.02269744873047, -15.170124053955078, -13.317549705505371, -11.464975357055664, -9.612401008605957, -7.75982666015625, -5.907252311706543, -4.054677963256836, -2.202103614807129, -0.3495292663574219, 1.5030450820922852, 3.355619430541992, 5.208193778991699, 7.060768127441406, 8.913342475891113, 10.76591682434082, 12.618491172790527, 14.471065521240234, 16.323638916015625, 18.17621421813965, 20.028789520263672, 21.881362915039062, 23.733936309814453, 25.586511611938477, 27.4390869140625, 29.29166030883789, 31.14423370361328, 32.99681091308594, 34.84938430786133, 36.70195770263672, 38.55453109741211, 40.4071044921875, 42.259681701660156, 44.11225509643555, 45.96482849121094, 47.817405700683594, 49.669979095458984, 51.522552490234375, 53.375125885009766, 55.227699279785156, 57.08027648925781, 58.9328498840332]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 12.0, 17.0, 11.0, 24.0, 21.0, 21.0, 25.0, 21.0, 22.0, 40.0, 33.0, 35.0, 40.0, 41.0, 48.0, 32.0, 47.0, 42.0, 37.0, 49.0, 54.0, 47.0, 37.0, 37.0, 40.0, 23.0, 23.0, 19.0, 20.0, 16.0, 14.0, 15.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.89453125, -5.66607666015625, -5.4376220703125, -5.20916748046875, -4.980712890625, -4.75225830078125, -4.5238037109375, -4.29534912109375, -4.06689453125, -3.83843994140625, -3.6099853515625, -3.38153076171875, -3.153076171875, -2.92462158203125, -2.6961669921875, -2.46771240234375, -2.2392578125, -2.01080322265625, -1.7823486328125, -1.55389404296875, -1.325439453125, -1.09698486328125, -0.8685302734375, -0.64007568359375, -0.41162109375, -0.18316650390625, 0.0452880859375, 0.27374267578125, 0.502197265625, 0.73065185546875, 0.9591064453125, 1.18756103515625, 1.416015625, 1.64447021484375, 1.8729248046875, 2.10137939453125, 2.329833984375, 2.55828857421875, 2.7867431640625, 3.01519775390625, 3.24365234375, 3.47210693359375, 3.7005615234375, 3.92901611328125, 4.157470703125, 4.38592529296875, 4.6143798828125, 4.84283447265625, 5.0712890625, 5.29974365234375, 5.5281982421875, 5.75665283203125, 5.985107421875, 6.21356201171875, 6.4420166015625, 6.67047119140625, 6.89892578125, 7.12738037109375, 7.3558349609375, 7.58428955078125, 7.812744140625, 8.04119873046875, 8.2696533203125, 8.49810791015625, 8.7265625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 7.0, 4.0, 6.0, 20.0, 13.0, 16.0, 18.0, 21.0, 22.0, 30.0, 34.0, 37.0, 54.0, 82.0, 200.0, 558.0, 2782.0, 73737.0, 2579087.0, 1509469.0, 25504.0, 1707.0, 407.0, 135.0, 81.0, 44.0, 37.0, 36.0, 23.0, 22.0, 11.0, 14.0, 13.0, 14.0, 13.0, 6.0, 9.0, 3.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.75, -18.98681640625, -18.2236328125, -17.46044921875, -16.697265625, -15.93408203125, -15.1708984375, -14.40771484375, -13.64453125, -12.88134765625, -12.1181640625, -11.35498046875, -10.591796875, -9.82861328125, -9.0654296875, -8.30224609375, -7.5390625, -6.77587890625, -6.0126953125, -5.24951171875, -4.486328125, -3.72314453125, -2.9599609375, -2.19677734375, -1.43359375, -0.67041015625, 0.0927734375, 0.85595703125, 1.619140625, 2.38232421875, 3.1455078125, 3.90869140625, 4.671875, 5.43505859375, 6.1982421875, 6.96142578125, 7.724609375, 8.48779296875, 9.2509765625, 10.01416015625, 10.77734375, 11.54052734375, 12.3037109375, 13.06689453125, 13.830078125, 14.59326171875, 15.3564453125, 16.11962890625, 16.8828125, 17.64599609375, 18.4091796875, 19.17236328125, 19.935546875, 20.69873046875, 21.4619140625, 22.22509765625, 22.98828125, 23.75146484375, 24.5146484375, 25.27783203125, 26.041015625, 26.80419921875, 27.5673828125, 28.33056640625, 29.09375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 9.0, 9.0, 21.0, 25.0, 48.0, 68.0, 107.0, 152.0, 249.0, 375.0, 493.0, 567.0, 568.0, 441.0, 330.0, 206.0, 157.0, 90.0, 57.0, 41.0, 27.0, 13.0, 9.0, 9.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3203125, -13.7178955078125, -13.115478515625, -12.5130615234375, -11.91064453125, -11.3082275390625, -10.705810546875, -10.1033935546875, -9.5009765625, -8.8985595703125, -8.296142578125, -7.6937255859375, -7.09130859375, -6.4888916015625, -5.886474609375, -5.2840576171875, -4.681640625, -4.0792236328125, -3.476806640625, -2.8743896484375, -2.27197265625, -1.6695556640625, -1.067138671875, -0.4647216796875, 0.1376953125, 0.7401123046875, 1.342529296875, 1.9449462890625, 2.54736328125, 3.1497802734375, 3.752197265625, 4.3546142578125, 4.95703125, 5.5594482421875, 6.161865234375, 6.7642822265625, 7.36669921875, 7.9691162109375, 8.571533203125, 9.1739501953125, 9.7763671875, 10.3787841796875, 10.981201171875, 11.5836181640625, 12.18603515625, 12.7884521484375, 13.390869140625, 13.9932861328125, 14.595703125, 15.1981201171875, 15.800537109375, 16.4029541015625, 17.00537109375, 17.6077880859375, 18.210205078125, 18.8126220703125, 19.4150390625, 20.0174560546875, 20.619873046875, 21.2222900390625, 21.82470703125, 22.4271240234375, 23.029541015625, 23.6319580078125, 24.234375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 14.0, 11.0, 18.0, 28.0, 48.0, 79.0, 102.0, 159.0, 226.0, 342.0, 595.0, 2935.0, 1787787.0, 2396693.0, 3585.0, 646.0, 375.0, 197.0, 166.0, 117.0, 55.0, 40.0, 33.0, 16.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.4375, -79.40283203125, -77.3681640625, -75.33349609375, -73.298828125, -71.26416015625, -69.2294921875, -67.19482421875, -65.16015625, -63.12548828125, -61.0908203125, -59.05615234375, -57.021484375, -54.98681640625, -52.9521484375, -50.91748046875, -48.8828125, -46.84814453125, -44.8134765625, -42.77880859375, -40.744140625, -38.70947265625, -36.6748046875, -34.64013671875, -32.60546875, -30.57080078125, -28.5361328125, -26.50146484375, -24.466796875, -22.43212890625, -20.3974609375, -18.36279296875, -16.328125, -14.29345703125, -12.2587890625, -10.22412109375, -8.189453125, -6.15478515625, -4.1201171875, -2.08544921875, -0.05078125, 1.98388671875, 4.0185546875, 6.05322265625, 8.087890625, 10.12255859375, 12.1572265625, 14.19189453125, 16.2265625, 18.26123046875, 20.2958984375, 22.33056640625, 24.365234375, 26.39990234375, 28.4345703125, 30.46923828125, 32.50390625, 34.53857421875, 36.5732421875, 38.60791015625, 40.642578125, 42.67724609375, 44.7119140625, 46.74658203125, 48.78125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 20.0, 49.0, 135.0, 203.0, 237.0, 183.0, 113.0, 36.0, 21.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.71265411376953, -58.11537170410156, -54.518089294433594, -50.920806884765625, -47.323524475097656, -43.72624206542969, -40.12895965576172, -36.53167724609375, -32.93439483642578, -29.337112426757812, -25.739830017089844, -22.142547607421875, -18.545265197753906, -14.947982788085938, -11.350700378417969, -7.75341796875, -4.156135559082031, -0.5588531494140625, 3.0384292602539062, 6.635711669921875, 10.232994079589844, 13.830276489257812, 17.42755889892578, 21.02484130859375, 24.62212371826172, 28.219406127929688, 31.816688537597656, 35.413970947265625, 39.011253356933594, 42.60853576660156, 46.20581817626953, 49.8031005859375, 53.400390625, 56.99767303466797, 60.59495544433594, 64.1922378540039, 67.78952026367188, 71.38680267333984, 74.98408508300781, 78.58136749267578, 82.17864990234375, 85.77593231201172, 89.37321472167969, 92.97049713134766, 96.56777954101562, 100.1650619506836, 103.76234436035156, 107.35962677001953, 110.9569091796875, 114.55419158935547, 118.15147399902344, 121.7487564086914, 125.34603881835938, 128.94332885742188, 132.5406036376953, 136.13787841796875, 139.73516845703125, 143.33245849609375, 146.9297332763672, 150.52700805664062, 154.12429809570312, 157.72158813476562, 161.31886291503906, 164.9161376953125, 168.513427734375]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 5.0, 5.0, 11.0, 13.0, 14.0, 23.0, 23.0, 20.0, 25.0, 40.0, 38.0, 46.0, 38.0, 43.0, 35.0, 42.0, 41.0, 36.0, 37.0, 45.0, 37.0, 29.0, 47.0, 39.0, 41.0, 23.0, 37.0, 31.0, 16.0, 18.0, 19.0, 13.0, 15.0, 5.0, 6.0, 6.0, 1.0, 8.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.798030853271484, -40.31563949584961, -38.83324432373047, -37.350852966308594, -35.86846160888672, -34.38606643676758, -32.9036750793457, -31.421281814575195, -29.938888549804688, -28.45649528503418, -26.974102020263672, -25.491710662841797, -24.00931739807129, -22.52692413330078, -21.044532775878906, -19.5621395111084, -18.07974624633789, -16.597352981567383, -15.114960670471191, -13.632568359375, -12.150175094604492, -10.667781829833984, -9.185389518737793, -7.702997207641602, -6.220603942871094, -4.738211154937744, -3.2558183670043945, -1.773425579071045, -0.2910327911376953, 1.1913599967956543, 2.673752784729004, 4.156145095825195, 5.6385345458984375, 7.120927333831787, 8.603320121765137, 10.085712432861328, 11.568105697631836, 13.050498962402344, 14.532891273498535, 16.015283584594727, 17.497676849365234, 18.980070114135742, 20.46246337890625, 21.944854736328125, 23.427248001098633, 24.90964126586914, 26.392032623291016, 27.874425888061523, 29.35681915283203, 30.83921241760254, 32.32160568237305, 33.80399703979492, 35.28639221191406, 36.76878356933594, 38.25117492675781, 39.73356628417969, 41.21596145629883, 42.6983528137207, 44.180747985839844, 45.66313934326172, 47.145530700683594, 48.627925872802734, 50.11031723022461, 51.59271240234375, 53.075103759765625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 9.0, 16.0, 16.0, 21.0, 29.0, 19.0, 32.0, 26.0, 30.0, 43.0, 40.0, 43.0, 55.0, 45.0, 51.0, 47.0, 40.0, 47.0, 48.0, 49.0, 49.0, 44.0, 41.0, 26.0, 21.0, 20.0, 18.0, 17.0, 9.0, 7.0, 6.0, 8.0, 7.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23828125, -6.00091552734375, -5.7635498046875, -5.52618408203125, -5.288818359375, -5.05145263671875, -4.8140869140625, -4.57672119140625, -4.33935546875, -4.10198974609375, -3.8646240234375, -3.62725830078125, -3.389892578125, -3.15252685546875, -2.9151611328125, -2.67779541015625, -2.4404296875, -2.20306396484375, -1.9656982421875, -1.72833251953125, -1.490966796875, -1.25360107421875, -1.0162353515625, -0.77886962890625, -0.54150390625, -0.30413818359375, -0.0667724609375, 0.17059326171875, 0.407958984375, 0.64532470703125, 0.8826904296875, 1.12005615234375, 1.357421875, 1.59478759765625, 1.8321533203125, 2.06951904296875, 2.306884765625, 2.54425048828125, 2.7816162109375, 3.01898193359375, 3.25634765625, 3.49371337890625, 3.7310791015625, 3.96844482421875, 4.205810546875, 4.44317626953125, 4.6805419921875, 4.91790771484375, 5.1552734375, 5.39263916015625, 5.6300048828125, 5.86737060546875, 6.104736328125, 6.34210205078125, 6.5794677734375, 6.81683349609375, 7.05419921875, 7.29156494140625, 7.5289306640625, 7.76629638671875, 8.003662109375, 8.24102783203125, 8.4783935546875, 8.71575927734375, 8.953125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 11.0, 12.0, 14.0, 23.0, 27.0, 38.0, 69.0, 115.0, 151.0, 275.0, 405.0, 575.0, 915.0, 1386.0, 2194.0, 3567.0, 5657.0, 9291.0, 15690.0, 27599.0, 50153.0, 97708.0, 199116.0, 303194.0, 154760.0, 77853.0, 40840.0, 22822.0, 13064.0, 7895.0, 4761.0, 2991.0, 1853.0, 1250.0, 811.0, 506.0, 341.0, 198.0, 140.0, 97.0, 61.0, 44.0, 24.0, 15.0, 10.0, 8.0, 8.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-1.3564453125, -1.3157501220703125, -1.275054931640625, -1.2343597412109375, -1.19366455078125, -1.1529693603515625, -1.112274169921875, -1.0715789794921875, -1.0308837890625, -0.9901885986328125, -0.949493408203125, -0.9087982177734375, -0.86810302734375, -0.8274078369140625, -0.786712646484375, -0.7460174560546875, -0.705322265625, -0.6646270751953125, -0.623931884765625, -0.5832366943359375, -0.54254150390625, -0.5018463134765625, -0.461151123046875, -0.4204559326171875, -0.3797607421875, -0.3390655517578125, -0.298370361328125, -0.2576751708984375, -0.21697998046875, -0.1762847900390625, -0.135589599609375, -0.0948944091796875, -0.05419921875, -0.0135040283203125, 0.027191162109375, 0.0678863525390625, 0.10858154296875, 0.1492767333984375, 0.189971923828125, 0.2306671142578125, 0.2713623046875, 0.3120574951171875, 0.352752685546875, 0.3934478759765625, 0.43414306640625, 0.4748382568359375, 0.515533447265625, 0.5562286376953125, 0.596923828125, 0.6376190185546875, 0.678314208984375, 0.7190093994140625, 0.75970458984375, 0.8003997802734375, 0.841094970703125, 0.8817901611328125, 0.9224853515625, 0.9631805419921875, 1.003875732421875, 1.0445709228515625, 1.08526611328125, 1.1259613037109375, 1.166656494140625, 1.2073516845703125, 1.248046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 5.0, 3.0, 7.0, 7.0, 9.0, 8.0, 6.0, 6.0, 8.0, 13.0, 11.0, 17.0, 24.0, 21.0, 26.0, 37.0, 32.0, 30.0, 41.0, 39.0, 24.0, 42.0, 44.0, 1070.0, 47.0, 39.0, 44.0, 33.0, 23.0, 34.0, 24.0, 31.0, 32.0, 22.0, 21.0, 23.0, 19.0, 19.0, 18.0, 19.0, 7.0, 8.0, 3.0, 7.0, 5.0, 7.0, 4.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-4.1484375, -4.02978515625, -3.9111328125, -3.79248046875, -3.673828125, -3.55517578125, -3.4365234375, -3.31787109375, -3.19921875, -3.08056640625, -2.9619140625, -2.84326171875, -2.724609375, -2.60595703125, -2.4873046875, -2.36865234375, -2.25, -2.13134765625, -2.0126953125, -1.89404296875, -1.775390625, -1.65673828125, -1.5380859375, -1.41943359375, -1.30078125, -1.18212890625, -1.0634765625, -0.94482421875, -0.826171875, -0.70751953125, -0.5888671875, -0.47021484375, -0.3515625, -0.23291015625, -0.1142578125, 0.00439453125, 0.123046875, 0.24169921875, 0.3603515625, 0.47900390625, 0.59765625, 0.71630859375, 0.8349609375, 0.95361328125, 1.072265625, 1.19091796875, 1.3095703125, 1.42822265625, 1.546875, 1.66552734375, 1.7841796875, 1.90283203125, 2.021484375, 2.14013671875, 2.2587890625, 2.37744140625, 2.49609375, 2.61474609375, 2.7333984375, 2.85205078125, 2.970703125, 3.08935546875, 3.2080078125, 3.32666015625, 3.4453125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 10.0, 13.0, 22.0, 36.0, 55.0, 72.0, 94.0, 130.0, 254.0, 321.0, 441.0, 669.0, 996.0, 1595.0, 2389.0, 3790.0, 5969.0, 9544.0, 15855.0, 26487.0, 45610.0, 81842.0, 164397.0, 1359123.0, 173150.0, 85336.0, 47460.0, 27647.0, 16389.0, 10112.0, 6175.0, 3981.0, 2612.0, 1520.0, 946.0, 701.0, 420.0, 322.0, 201.0, 149.0, 97.0, 65.0, 45.0, 28.0, 17.0, 17.0, 8.0, 8.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0947265625, -1.0576629638671875, -1.020599365234375, -0.9835357666015625, -0.94647216796875, -0.9094085693359375, -0.872344970703125, -0.8352813720703125, -0.7982177734375, -0.7611541748046875, -0.724090576171875, -0.6870269775390625, -0.64996337890625, -0.6128997802734375, -0.575836181640625, -0.5387725830078125, -0.501708984375, -0.4646453857421875, -0.427581787109375, -0.3905181884765625, -0.35345458984375, -0.3163909912109375, -0.279327392578125, -0.2422637939453125, -0.2052001953125, -0.1681365966796875, -0.131072998046875, -0.0940093994140625, -0.05694580078125, -0.0198822021484375, 0.017181396484375, 0.0542449951171875, 0.09130859375, 0.1283721923828125, 0.165435791015625, 0.2024993896484375, 0.23956298828125, 0.2766265869140625, 0.313690185546875, 0.3507537841796875, 0.3878173828125, 0.4248809814453125, 0.461944580078125, 0.4990081787109375, 0.53607177734375, 0.5731353759765625, 0.610198974609375, 0.6472625732421875, 0.684326171875, 0.7213897705078125, 0.758453369140625, 0.7955169677734375, 0.83258056640625, 0.8696441650390625, 0.906707763671875, 0.9437713623046875, 0.9808349609375, 1.0178985595703125, 1.054962158203125, 1.0920257568359375, 1.12908935546875, 1.1661529541015625, 1.203216552734375, 1.2402801513671875, 1.27734375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 8.0, 5.0, 12.0, 4.0, 10.0, 4.0, 9.0, 21.0, 16.0, 23.0, 27.0, 40.0, 50.0, 58.0, 56.0, 78.0, 64.0, 71.0, 67.0, 64.0, 48.0, 48.0, 45.0, 32.0, 32.0, 29.0, 14.0, 14.0, 11.0, 13.0, 6.0, 6.0, 7.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0011653900146484375, -0.0011281222105026245, -0.0010908544063568115, -0.0010535866022109985, -0.0010163187980651855, -0.0009790509939193726, -0.0009417831897735596, -0.0009045153856277466, -0.0008672475814819336, -0.0008299797773361206, -0.0007927119731903076, -0.0007554441690444946, -0.0007181763648986816, -0.0006809085607528687, -0.0006436407566070557, -0.0006063729524612427, -0.0005691051483154297, -0.0005318373441696167, -0.0004945695400238037, -0.0004573017358779907, -0.00042003393173217773, -0.00038276612758636475, -0.00034549832344055176, -0.00030823051929473877, -0.0002709627151489258, -0.0002336949110031128, -0.0001964271068572998, -0.00015915930271148682, -0.00012189149856567383, -8.462369441986084e-05, -4.735589027404785e-05, -1.0088086128234863e-05, 2.7179718017578125e-05, 6.444752216339111e-05, 0.0001017153263092041, 0.0001389831304550171, 0.00017625093460083008, 0.00021351873874664307, 0.00025078654289245605, 0.00028805434703826904, 0.00032532215118408203, 0.000362589955329895, 0.000399857759475708, 0.000437125563621521, 0.000474393367767334, 0.000511661171913147, 0.00054892897605896, 0.000586196780204773, 0.0006234645843505859, 0.0006607323884963989, 0.0006980001926422119, 0.0007352679967880249, 0.0007725358009338379, 0.0008098036050796509, 0.0008470714092254639, 0.0008843392133712769, 0.0009216070175170898, 0.0009588748216629028, 0.0009961426258087158, 0.0010334104299545288, 0.0010706782341003418, 0.0011079460382461548, 0.0011452138423919678, 0.0011824816465377808, 0.0012197494506835938]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 8.0, 6.0, 12.0, 9.0, 16.0, 19.0, 25.0, 23.0, 42.0, 49.0, 81.0, 121.0, 189.0, 315.0, 1012.0, 87977.0, 955133.0, 2323.0, 474.0, 251.0, 149.0, 98.0, 51.0, 30.0, 31.0, 28.0, 18.0, 10.0, 22.0, 5.0, 6.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0280303955078125, -0.02721095085144043, -0.02639150619506836, -0.02557206153869629, -0.02475261688232422, -0.02393317222595215, -0.023113727569580078, -0.022294282913208008, -0.021474838256835938, -0.020655393600463867, -0.019835948944091797, -0.019016504287719727, -0.018197059631347656, -0.017377614974975586, -0.016558170318603516, -0.015738725662231445, -0.014919281005859375, -0.014099836349487305, -0.013280391693115234, -0.012460947036743164, -0.011641502380371094, -0.010822057723999023, -0.010002613067626953, -0.009183168411254883, -0.008363723754882812, -0.007544279098510742, -0.006724834442138672, -0.0059053897857666016, -0.005085945129394531, -0.004266500473022461, -0.0034470558166503906, -0.0026276111602783203, -0.00180816650390625, -0.0009887218475341797, -0.00016927719116210938, 0.0006501674652099609, 0.0014696121215820312, 0.0022890567779541016, 0.003108501434326172, 0.003927946090698242, 0.0047473907470703125, 0.005566835403442383, 0.006386280059814453, 0.0072057247161865234, 0.008025169372558594, 0.008844614028930664, 0.009664058685302734, 0.010483503341674805, 0.011302947998046875, 0.012122392654418945, 0.012941837310791016, 0.013761281967163086, 0.014580726623535156, 0.015400171279907227, 0.016219615936279297, 0.017039060592651367, 0.017858505249023438, 0.018677949905395508, 0.019497394561767578, 0.02031683921813965, 0.02113628387451172, 0.02195572853088379, 0.02277517318725586, 0.02359461784362793, 0.0244140625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 23.0, 44.0, 106.0, 175.0, 204.0, 192.0, 121.0, 83.0, 33.0, 12.0, 9.0, 1.0, 1.0, 2.0], "bins": [-0.002360305516049266, -0.0023171992506831884, -0.002274092985317111, -0.0022309869527816772, -0.0021878806874156, -0.0021447744220495224, -0.002101668156683445, -0.0020585618913173676, -0.00201545562595129, -0.0019723493605852127, -0.0019292432116344571, -0.0018861369462683797, -0.0018430306809023023, -0.0017999245319515467, -0.0017568182665854692, -0.0017137120012193918, -0.0016706058522686362, -0.0016274995869025588, -0.0015843934379518032, -0.0015412871725857258, -0.0014981809072196484, -0.001455074641853571, -0.0014119684929028153, -0.001368862227536738, -0.0013257560785859823, -0.001282649813219905, -0.0012395436642691493, -0.0011964373989030719, -0.0011533311335369945, -0.0011102249845862389, -0.0010671187192201614, -0.001024012453854084, -0.0009809061884880066, -0.0009377999813295901, -0.0008946937159635127, -0.0008515875088050961, -0.0008084812434390187, -0.0007653750362806022, -0.0007222688291221857, -0.0006791625637561083, -0.0006360564148053527, -0.0005929502076469362, -0.0005498439422808588, -0.0005067377351224422, -0.0004636314988601953, -0.0004205252625979483, -0.0003774190554395318, -0.00033431281917728484, -0.0002912065538112074, -0.00024810031754896045, -0.0002049940958386287, -0.00016188787412829697, -0.00011878163786605, -7.567540160380304e-05, -3.256919444538653e-05, 1.0537041816860437e-05, 5.3643278079107404e-05, 9.674950706539676e-05, 0.0001398557360516861, 0.00018296195776201785, 0.0002260681940242648, 0.0002691744302865118, 0.0003122806374449283, 0.00035538687370717525, 0.0003984931099694222]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 4.0, 8.0, 8.0, 8.0, 18.0, 7.0, 16.0, 19.0, 29.0, 20.0, 26.0, 33.0, 21.0, 27.0, 31.0, 38.0, 44.0, 32.0, 49.0, 53.0, 44.0, 50.0, 49.0, 44.0, 39.0, 31.0, 41.0, 26.0, 38.0, 25.0, 29.0, 16.0, 15.0, 9.0, 7.0, 16.0, 13.0, 3.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0006132721900939941, -0.0005948934704065323, -0.0005765147507190704, -0.0005581360310316086, -0.0005397573113441467, -0.0005213785916566849, -0.000502999871969223, -0.00048462115228176117, -0.0004662424325942993, -0.00044786371290683746, -0.0004294849932193756, -0.00041110627353191376, -0.0003927275538444519, -0.00037434883415699005, -0.0003559701144695282, -0.00033759139478206635, -0.0003192126750946045, -0.00030083395540714264, -0.0002824552357196808, -0.00026407651603221893, -0.0002456977963447571, -0.00022731907665729523, -0.00020894035696983337, -0.00019056163728237152, -0.00017218291759490967, -0.00015380419790744781, -0.00013542547821998596, -0.00011704675853252411, -9.866803884506226e-05, -8.02893191576004e-05, -6.191059947013855e-05, -4.35318797826767e-05, -2.5153160095214844e-05, -6.774440407752991e-06, 1.1604279279708862e-05, 2.9982998967170715e-05, 4.836171865463257e-05, 6.674043834209442e-05, 8.511915802955627e-05, 0.00010349787771701813, 0.00012187659740447998, 0.00014025531709194183, 0.0001586340367794037, 0.00017701275646686554, 0.0001953914761543274, 0.00021377019584178925, 0.0002321489155292511, 0.00025052763521671295, 0.0002689063549041748, 0.00028728507459163666, 0.0003056637942790985, 0.00032404251396656036, 0.0003424212336540222, 0.00036079995334148407, 0.0003791786730289459, 0.0003975573927164078, 0.00041593611240386963, 0.0004343148320913315, 0.00045269355177879333, 0.0004710722714662552, 0.000489450991153717, 0.0005078297108411789, 0.0005262084305286407, 0.0005445871502161026, 0.0005629658699035645]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 7.0, 9.0, 16.0, 16.0, 21.0, 29.0, 19.0, 32.0, 26.0, 30.0, 43.0, 40.0, 43.0, 55.0, 45.0, 51.0, 47.0, 40.0, 47.0, 48.0, 49.0, 49.0, 44.0, 41.0, 26.0, 21.0, 20.0, 18.0, 17.0, 9.0, 7.0, 6.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.23828125, -6.00091552734375, -5.7635498046875, -5.52618408203125, -5.288818359375, -5.05145263671875, -4.8140869140625, -4.57672119140625, -4.33935546875, -4.10198974609375, -3.8646240234375, -3.62725830078125, -3.389892578125, -3.15252685546875, -2.9151611328125, -2.67779541015625, -2.4404296875, -2.20306396484375, -1.9656982421875, -1.72833251953125, -1.490966796875, -1.25360107421875, -1.0162353515625, -0.77886962890625, -0.54150390625, -0.30413818359375, -0.0667724609375, 0.17059326171875, 0.407958984375, 0.64532470703125, 0.8826904296875, 1.12005615234375, 1.357421875, 1.59478759765625, 1.8321533203125, 2.06951904296875, 2.306884765625, 2.54425048828125, 2.7816162109375, 3.01898193359375, 3.25634765625, 3.49371337890625, 3.7310791015625, 3.96844482421875, 4.205810546875, 4.44317626953125, 4.6805419921875, 4.91790771484375, 5.1552734375, 5.39263916015625, 5.6300048828125, 5.86737060546875, 6.104736328125, 6.34210205078125, 6.5794677734375, 6.81683349609375, 7.05419921875, 7.29156494140625, 7.5289306640625, 7.76629638671875, 8.003662109375, 8.24102783203125, 8.4783935546875, 8.71575927734375, 8.953125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 10.0, 11.0, 23.0, 26.0, 29.0, 62.0, 95.0, 109.0, 203.0, 256.0, 408.0, 737.0, 1333.0, 2629.0, 5308.0, 11750.0, 28325.0, 71822.0, 178706.0, 358488.0, 230408.0, 92751.0, 36583.0, 14950.0, 6573.0, 3196.0, 1599.0, 819.0, 489.0, 261.0, 203.0, 127.0, 87.0, 48.0, 39.0, 11.0, 27.0, 15.0, 13.0, 13.0, 5.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.84375, -5.63970947265625, -5.4356689453125, -5.23162841796875, -5.027587890625, -4.82354736328125, -4.6195068359375, -4.41546630859375, -4.21142578125, -4.00738525390625, -3.8033447265625, -3.59930419921875, -3.395263671875, -3.19122314453125, -2.9871826171875, -2.78314208984375, -2.5791015625, -2.37506103515625, -2.1710205078125, -1.96697998046875, -1.762939453125, -1.55889892578125, -1.3548583984375, -1.15081787109375, -0.94677734375, -0.74273681640625, -0.5386962890625, -0.33465576171875, -0.130615234375, 0.07342529296875, 0.2774658203125, 0.48150634765625, 0.685546875, 0.88958740234375, 1.0936279296875, 1.29766845703125, 1.501708984375, 1.70574951171875, 1.9097900390625, 2.11383056640625, 2.31787109375, 2.52191162109375, 2.7259521484375, 2.92999267578125, 3.134033203125, 3.33807373046875, 3.5421142578125, 3.74615478515625, 3.9501953125, 4.15423583984375, 4.3582763671875, 4.56231689453125, 4.766357421875, 4.97039794921875, 5.1744384765625, 5.37847900390625, 5.58251953125, 5.78656005859375, 5.9906005859375, 6.19464111328125, 6.398681640625, 6.60272216796875, 6.8067626953125, 7.01080322265625, 7.21484375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 6.0, 7.0, 6.0, 4.0, 15.0, 12.0, 18.0, 18.0, 30.0, 26.0, 27.0, 19.0, 33.0, 34.0, 30.0, 54.0, 49.0, 86.0, 162.0, 867.0, 912.0, 153.0, 82.0, 54.0, 51.0, 34.0, 53.0, 23.0, 28.0, 24.0, 22.0, 12.0, 16.0, 14.0, 17.0, 7.0, 9.0, 9.0, 11.0, 2.0, 5.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.703125, -21.02490234375, -20.3466796875, -19.66845703125, -18.990234375, -18.31201171875, -17.6337890625, -16.95556640625, -16.27734375, -15.59912109375, -14.9208984375, -14.24267578125, -13.564453125, -12.88623046875, -12.2080078125, -11.52978515625, -10.8515625, -10.17333984375, -9.4951171875, -8.81689453125, -8.138671875, -7.46044921875, -6.7822265625, -6.10400390625, -5.42578125, -4.74755859375, -4.0693359375, -3.39111328125, -2.712890625, -2.03466796875, -1.3564453125, -0.67822265625, 0.0, 0.67822265625, 1.3564453125, 2.03466796875, 2.712890625, 3.39111328125, 4.0693359375, 4.74755859375, 5.42578125, 6.10400390625, 6.7822265625, 7.46044921875, 8.138671875, 8.81689453125, 9.4951171875, 10.17333984375, 10.8515625, 11.52978515625, 12.2080078125, 12.88623046875, 13.564453125, 14.24267578125, 14.9208984375, 15.59912109375, 16.27734375, 16.95556640625, 17.6337890625, 18.31201171875, 18.990234375, 19.66845703125, 20.3466796875, 21.02490234375, 21.703125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 6.0, 6.0, 12.0, 15.0, 5.0, 23.0, 43.0, 52.0, 74.0, 99.0, 184.0, 374.0, 809.0, 28834.0, 3111535.0, 2343.0, 519.0, 280.0, 169.0, 98.0, 71.0, 41.0, 28.0, 20.0, 11.0, 10.0, 6.0, 10.0, 7.0, 2.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-119.9375, -116.33203125, -112.7265625, -109.12109375, -105.515625, -101.91015625, -98.3046875, -94.69921875, -91.09375, -87.48828125, -83.8828125, -80.27734375, -76.671875, -73.06640625, -69.4609375, -65.85546875, -62.25, -58.64453125, -55.0390625, -51.43359375, -47.828125, -44.22265625, -40.6171875, -37.01171875, -33.40625, -29.80078125, -26.1953125, -22.58984375, -18.984375, -15.37890625, -11.7734375, -8.16796875, -4.5625, -0.95703125, 2.6484375, 6.25390625, 9.859375, 13.46484375, 17.0703125, 20.67578125, 24.28125, 27.88671875, 31.4921875, 35.09765625, 38.703125, 42.30859375, 45.9140625, 49.51953125, 53.125, 56.73046875, 60.3359375, 63.94140625, 67.546875, 71.15234375, 74.7578125, 78.36328125, 81.96875, 85.57421875, 89.1796875, 92.78515625, 96.390625, 99.99609375, 103.6015625, 107.20703125, 110.8125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 9.0, 21.0, 32.0, 47.0, 77.0, 121.0, 136.0, 154.0, 125.0, 102.0, 83.0, 49.0, 24.0, 13.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.249046325683594, -46.18189239501953, -45.114742279052734, -44.04758834838867, -42.98043441772461, -41.91328048706055, -40.84613037109375, -39.77897644042969, -38.711822509765625, -37.64466857910156, -36.577518463134766, -35.5103645324707, -34.44321060180664, -33.37605667114258, -32.30890655517578, -31.24175262451172, -30.17460060119629, -29.10744857788086, -28.040294647216797, -26.973142623901367, -25.905988693237305, -24.838836669921875, -23.771682739257812, -22.704530715942383, -21.637378692626953, -20.570226669311523, -19.50307273864746, -18.43592071533203, -17.36876678466797, -16.30161476135254, -15.234461784362793, -14.167308807373047, -13.100154876708984, -12.033001899719238, -10.965848922729492, -9.898696899414062, -8.83154296875, -7.764390468597412, -6.697237968444824, -5.630084991455078, -4.562932014465332, -3.495779037475586, -2.428626298904419, -1.361473560333252, -0.29432058334350586, 0.7728323936462402, 1.8399848937988281, 2.907137870788574, 3.9742908477783203, 5.041443824768066, 6.1085968017578125, 7.1757493019104, 8.242902755737305, 9.310054779052734, 10.37720775604248, 11.444360733032227, 12.511513710021973, 13.578666687011719, 14.645819664001465, 15.712972640991211, 16.78012466430664, 17.847278594970703, 18.914430618286133, 19.981582641601562, 21.048736572265625]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 10.0, 8.0, 9.0, 14.0, 14.0, 17.0, 24.0, 13.0, 24.0, 15.0, 23.0, 34.0, 32.0, 29.0, 31.0, 35.0, 35.0, 30.0, 32.0, 30.0, 55.0, 50.0, 34.0, 37.0, 28.0, 30.0, 36.0, 28.0, 31.0, 27.0, 29.0, 17.0, 22.0, 9.0, 14.0, 13.0, 14.0, 7.0, 13.0, 5.0, 4.0, 8.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 4.0], "bins": [-52.8168830871582, -51.34181213378906, -49.86674118041992, -48.39167022705078, -46.916595458984375, -45.441524505615234, -43.966453552246094, -42.49138259887695, -41.01631164550781, -39.54124069213867, -38.06616973876953, -36.591094970703125, -35.116024017333984, -33.640953063964844, -32.1658821105957, -30.690811157226562, -29.215736389160156, -27.740665435791016, -26.265592575073242, -24.7905216217041, -23.315448760986328, -21.840377807617188, -20.365306854248047, -18.890235900878906, -17.415163040161133, -15.940091133117676, -14.465019226074219, -12.989948272705078, -11.514876365661621, -10.039804458618164, -8.564733505249023, -7.089661598205566, -5.614585876464844, -4.139513969421387, -2.664442539215088, -1.189371109008789, 0.28570079803466797, 1.760772705078125, 3.2358436584472656, 4.710915565490723, 6.18598747253418, 7.661059379577637, 9.136131286621094, 10.611202239990234, 12.086274147033691, 13.561346054077148, 15.036417007446289, 16.511489868164062, 17.986560821533203, 19.461631774902344, 20.936704635620117, 22.411775588989258, 23.88684844970703, 25.361919403076172, 26.836990356445312, 28.312061309814453, 29.787134170532227, 31.262205123901367, 32.73727798461914, 34.21234893798828, 35.68741989135742, 37.16249084472656, 38.63756561279297, 40.11263656616211, 41.58770751953125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 5.0, 6.0, 12.0, 9.0, 17.0, 16.0, 21.0, 27.0, 27.0, 24.0, 28.0, 27.0, 36.0, 47.0, 45.0, 52.0, 43.0, 58.0, 40.0, 53.0, 47.0, 49.0, 39.0, 45.0, 40.0, 33.0, 26.0, 25.0, 16.0, 20.0, 23.0, 9.0, 6.0, 4.0, 8.0, 7.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.30859375, -6.05572509765625, -5.8028564453125, -5.54998779296875, -5.297119140625, -5.04425048828125, -4.7913818359375, -4.53851318359375, -4.28564453125, -4.03277587890625, -3.7799072265625, -3.52703857421875, -3.274169921875, -3.02130126953125, -2.7684326171875, -2.51556396484375, -2.2626953125, -2.00982666015625, -1.7569580078125, -1.50408935546875, -1.251220703125, -0.99835205078125, -0.7454833984375, -0.49261474609375, -0.23974609375, 0.01312255859375, 0.2659912109375, 0.51885986328125, 0.771728515625, 1.02459716796875, 1.2774658203125, 1.53033447265625, 1.783203125, 2.03607177734375, 2.2889404296875, 2.54180908203125, 2.794677734375, 3.04754638671875, 3.3004150390625, 3.55328369140625, 3.80615234375, 4.05902099609375, 4.3118896484375, 4.56475830078125, 4.817626953125, 5.07049560546875, 5.3233642578125, 5.57623291015625, 5.8291015625, 6.08197021484375, 6.3348388671875, 6.58770751953125, 6.840576171875, 7.09344482421875, 7.3463134765625, 7.59918212890625, 7.85205078125, 8.10491943359375, 8.3577880859375, 8.61065673828125, 8.863525390625, 9.11639404296875, 9.3692626953125, 9.62213134765625, 9.875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 6.0, 2.0, 4.0, 5.0, 5.0, 9.0, 13.0, 12.0, 25.0, 32.0, 25.0, 36.0, 60.0, 84.0, 114.0, 205.0, 387.0, 1270.0, 9710.0, 210004.0, 2385536.0, 1500495.0, 79909.0, 4586.0, 871.0, 321.0, 202.0, 99.0, 63.0, 44.0, 37.0, 16.0, 17.0, 19.0, 19.0, 12.0, 9.0, 8.0, 5.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.53125, -14.952880859375, -14.37451171875, -13.796142578125, -13.2177734375, -12.639404296875, -12.06103515625, -11.482666015625, -10.904296875, -10.325927734375, -9.74755859375, -9.169189453125, -8.5908203125, -8.012451171875, -7.43408203125, -6.855712890625, -6.27734375, -5.698974609375, -5.12060546875, -4.542236328125, -3.9638671875, -3.385498046875, -2.80712890625, -2.228759765625, -1.650390625, -1.072021484375, -0.49365234375, 0.084716796875, 0.6630859375, 1.241455078125, 1.81982421875, 2.398193359375, 2.9765625, 3.554931640625, 4.13330078125, 4.711669921875, 5.2900390625, 5.868408203125, 6.44677734375, 7.025146484375, 7.603515625, 8.181884765625, 8.76025390625, 9.338623046875, 9.9169921875, 10.495361328125, 11.07373046875, 11.652099609375, 12.23046875, 12.808837890625, 13.38720703125, 13.965576171875, 14.5439453125, 15.122314453125, 15.70068359375, 16.279052734375, 16.857421875, 17.435791015625, 18.01416015625, 18.592529296875, 19.1708984375, 19.749267578125, 20.32763671875, 20.906005859375, 21.484375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 3.0, 5.0, 7.0, 10.0, 9.0, 15.0, 20.0, 28.0, 43.0, 52.0, 95.0, 115.0, 157.0, 219.0, 240.0, 355.0, 392.0, 426.0, 447.0, 354.0, 288.0, 215.0, 154.0, 126.0, 81.0, 57.0, 41.0, 43.0, 26.0, 14.0, 10.0, 6.0, 2.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.6796875, -14.2420654296875, -13.804443359375, -13.3668212890625, -12.92919921875, -12.4915771484375, -12.053955078125, -11.6163330078125, -11.1787109375, -10.7410888671875, -10.303466796875, -9.8658447265625, -9.42822265625, -8.9906005859375, -8.552978515625, -8.1153564453125, -7.677734375, -7.2401123046875, -6.802490234375, -6.3648681640625, -5.92724609375, -5.4896240234375, -5.052001953125, -4.6143798828125, -4.1767578125, -3.7391357421875, -3.301513671875, -2.8638916015625, -2.42626953125, -1.9886474609375, -1.551025390625, -1.1134033203125, -0.67578125, -0.2381591796875, 0.199462890625, 0.6370849609375, 1.07470703125, 1.5123291015625, 1.949951171875, 2.3875732421875, 2.8251953125, 3.2628173828125, 3.700439453125, 4.1380615234375, 4.57568359375, 5.0133056640625, 5.450927734375, 5.8885498046875, 6.326171875, 6.7637939453125, 7.201416015625, 7.6390380859375, 8.07666015625, 8.5142822265625, 8.951904296875, 9.3895263671875, 9.8271484375, 10.2647705078125, 10.702392578125, 11.1400146484375, 11.57763671875, 12.0152587890625, 12.452880859375, 12.8905029296875, 13.328125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 4.0, 11.0, 5.0, 15.0, 29.0, 46.0, 40.0, 74.0, 84.0, 125.0, 156.0, 201.0, 314.0, 482.0, 933.0, 21212.0, 3381175.0, 783170.0, 4114.0, 666.0, 371.0, 274.0, 201.0, 150.0, 115.0, 85.0, 66.0, 36.0, 30.0, 24.0, 13.0, 14.0, 13.0, 5.0, 9.0, 1.0, 5.0, 3.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.03125, -44.53759765625, -43.0439453125, -41.55029296875, -40.056640625, -38.56298828125, -37.0693359375, -35.57568359375, -34.08203125, -32.58837890625, -31.0947265625, -29.60107421875, -28.107421875, -26.61376953125, -25.1201171875, -23.62646484375, -22.1328125, -20.63916015625, -19.1455078125, -17.65185546875, -16.158203125, -14.66455078125, -13.1708984375, -11.67724609375, -10.18359375, -8.68994140625, -7.1962890625, -5.70263671875, -4.208984375, -2.71533203125, -1.2216796875, 0.27197265625, 1.765625, 3.25927734375, 4.7529296875, 6.24658203125, 7.740234375, 9.23388671875, 10.7275390625, 12.22119140625, 13.71484375, 15.20849609375, 16.7021484375, 18.19580078125, 19.689453125, 21.18310546875, 22.6767578125, 24.17041015625, 25.6640625, 27.15771484375, 28.6513671875, 30.14501953125, 31.638671875, 33.13232421875, 34.6259765625, 36.11962890625, 37.61328125, 39.10693359375, 40.6005859375, 42.09423828125, 43.587890625, 45.08154296875, 46.5751953125, 48.06884765625, 49.5625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 6.0, 12.0, 16.0, 38.0, 32.0, 42.0, 51.0, 62.0, 78.0, 99.0, 82.0, 101.0, 92.0, 80.0, 63.0, 55.0, 32.0, 23.0, 14.0, 12.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.646728515625, -47.197303771972656, -45.74788284301758, -44.298458099365234, -42.84903335571289, -41.39961242675781, -39.95018768310547, -38.500762939453125, -37.05133819580078, -35.60191345214844, -34.15249252319336, -32.703067779541016, -31.253643035888672, -29.80422019958496, -28.35479736328125, -26.905372619628906, -25.455951690673828, -24.006528854370117, -22.557104110717773, -21.107681274414062, -19.65825653076172, -18.208833694458008, -16.759410858154297, -15.30998706817627, -13.860563278198242, -12.411139488220215, -10.961715698242188, -9.512292861938477, -8.06286907196045, -6.613445281982422, -5.164022445678711, -3.7145986557006836, -2.265178680419922, -0.8157551288604736, 0.6336684226989746, 2.0830917358398438, 3.532515525817871, 4.981939315795898, 6.431362152099609, 7.880785942077637, 9.330209732055664, 10.779633522033691, 12.229057312011719, 13.67848014831543, 15.127903938293457, 16.577327728271484, 18.026750564575195, 19.476173400878906, 20.92559814453125, 22.37502098083496, 23.824445724487305, 25.273868560791016, 26.72329330444336, 28.17271614074707, 29.62213897705078, 31.071563720703125, 32.52098846435547, 33.97041320800781, 35.41983413696289, 36.869258880615234, 38.31868362426758, 39.768104553222656, 41.217529296875, 42.666954040527344, 44.11637496948242]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 8.0, 10.0, 12.0, 11.0, 15.0, 11.0, 14.0, 13.0, 22.0, 16.0, 26.0, 12.0, 24.0, 30.0, 29.0, 21.0, 30.0, 26.0, 39.0, 39.0, 40.0, 39.0, 42.0, 26.0, 37.0, 36.0, 26.0, 33.0, 29.0, 29.0, 26.0, 24.0, 35.0, 23.0, 27.0, 19.0, 14.0, 17.0, 14.0, 9.0, 11.0, 11.0, 7.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.9444465637207, -36.71249008178711, -35.480533599853516, -34.24857711791992, -33.01662063598633, -31.784664154052734, -30.55270767211914, -29.320751190185547, -28.088794708251953, -26.85683822631836, -25.624881744384766, -24.392925262451172, -23.160968780517578, -21.929012298583984, -20.69705581665039, -19.465099334716797, -18.233142852783203, -17.00118637084961, -15.769229888916016, -14.537273406982422, -13.305316925048828, -12.073360443115234, -10.84140396118164, -9.609447479248047, -8.377490997314453, -7.145534515380859, -5.913578033447266, -4.681621551513672, -3.449665069580078, -2.2177085876464844, -0.9857521057128906, 0.24620437622070312, 1.4781570434570312, 2.710113525390625, 3.9420700073242188, 5.1740264892578125, 6.405982971191406, 7.637939453125, 8.869895935058594, 10.101852416992188, 11.333808898925781, 12.565765380859375, 13.797721862792969, 15.029678344726562, 16.261634826660156, 17.49359130859375, 18.725547790527344, 19.957504272460938, 21.18946075439453, 22.421417236328125, 23.65337371826172, 24.885330200195312, 26.117286682128906, 27.3492431640625, 28.581199645996094, 29.813156127929688, 31.04511260986328, 32.277069091796875, 33.50902557373047, 34.74098205566406, 35.972938537597656, 37.20489501953125, 38.436851501464844, 39.66880798339844, 40.90076446533203]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 10.0, 10.0, 11.0, 14.0, 26.0, 15.0, 25.0, 22.0, 24.0, 40.0, 38.0, 30.0, 49.0, 50.0, 42.0, 51.0, 47.0, 52.0, 52.0, 53.0, 37.0, 45.0, 41.0, 42.0, 33.0, 21.0, 19.0, 18.0, 14.0, 14.0, 12.0, 11.0, 11.0, 2.0, 3.0, 3.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.2928466796875, -6.046630859375, -5.8004150390625, -5.55419921875, -5.3079833984375, -5.061767578125, -4.8155517578125, -4.5693359375, -4.3231201171875, -4.076904296875, -3.8306884765625, -3.58447265625, -3.3382568359375, -3.092041015625, -2.8458251953125, -2.599609375, -2.3533935546875, -2.107177734375, -1.8609619140625, -1.61474609375, -1.3685302734375, -1.122314453125, -0.8760986328125, -0.6298828125, -0.3836669921875, -0.137451171875, 0.1087646484375, 0.35498046875, 0.6011962890625, 0.847412109375, 1.0936279296875, 1.33984375, 1.5860595703125, 1.832275390625, 2.0784912109375, 2.32470703125, 2.5709228515625, 2.817138671875, 3.0633544921875, 3.3095703125, 3.5557861328125, 3.802001953125, 4.0482177734375, 4.29443359375, 4.5406494140625, 4.786865234375, 5.0330810546875, 5.279296875, 5.5255126953125, 5.771728515625, 6.0179443359375, 6.26416015625, 6.5103759765625, 6.756591796875, 7.0028076171875, 7.2490234375, 7.4952392578125, 7.741455078125, 7.9876708984375, 8.23388671875, 8.4801025390625, 8.726318359375, 8.9725341796875, 9.21875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 2.0, 8.0, 8.0, 18.0, 19.0, 28.0, 43.0, 84.0, 124.0, 156.0, 299.0, 424.0, 729.0, 1225.0, 1961.0, 3308.0, 5432.0, 9359.0, 16096.0, 28996.0, 54620.0, 113206.0, 270705.0, 291088.0, 120895.0, 58043.0, 30713.0, 16877.0, 9617.0, 5716.0, 3362.0, 2048.0, 1273.0, 750.0, 494.0, 292.0, 194.0, 118.0, 75.0, 49.0, 29.0, 22.0, 16.0, 8.0, 9.0, 7.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.603515625, -1.5564117431640625, -1.509307861328125, -1.4622039794921875, -1.41510009765625, -1.3679962158203125, -1.320892333984375, -1.2737884521484375, -1.2266845703125, -1.1795806884765625, -1.132476806640625, -1.0853729248046875, -1.03826904296875, -0.9911651611328125, -0.944061279296875, -0.8969573974609375, -0.849853515625, -0.8027496337890625, -0.755645751953125, -0.7085418701171875, -0.66143798828125, -0.6143341064453125, -0.567230224609375, -0.5201263427734375, -0.4730224609375, -0.4259185791015625, -0.378814697265625, -0.3317108154296875, -0.28460693359375, -0.2375030517578125, -0.190399169921875, -0.1432952880859375, -0.09619140625, -0.0490875244140625, -0.001983642578125, 0.0451202392578125, 0.09222412109375, 0.1393280029296875, 0.186431884765625, 0.2335357666015625, 0.2806396484375, 0.3277435302734375, 0.374847412109375, 0.4219512939453125, 0.46905517578125, 0.5161590576171875, 0.563262939453125, 0.6103668212890625, 0.657470703125, 0.7045745849609375, 0.751678466796875, 0.7987823486328125, 0.84588623046875, 0.8929901123046875, 0.940093994140625, 0.9871978759765625, 1.0343017578125, 1.0814056396484375, 1.128509521484375, 1.1756134033203125, 1.22271728515625, 1.2698211669921875, 1.316925048828125, 1.3640289306640625, 1.4111328125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 2.0, 3.0, 7.0, 12.0, 8.0, 13.0, 14.0, 22.0, 15.0, 23.0, 23.0, 28.0, 29.0, 31.0, 38.0, 37.0, 36.0, 42.0, 43.0, 34.0, 35.0, 1052.0, 40.0, 43.0, 38.0, 33.0, 30.0, 42.0, 39.0, 26.0, 28.0, 28.0, 25.0, 19.0, 18.0, 12.0, 8.0, 10.0, 11.0, 8.0, 6.0, 8.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-4.140625, -4.00750732421875, -3.8743896484375, -3.74127197265625, -3.608154296875, -3.47503662109375, -3.3419189453125, -3.20880126953125, -3.07568359375, -2.94256591796875, -2.8094482421875, -2.67633056640625, -2.543212890625, -2.41009521484375, -2.2769775390625, -2.14385986328125, -2.0107421875, -1.87762451171875, -1.7445068359375, -1.61138916015625, -1.478271484375, -1.34515380859375, -1.2120361328125, -1.07891845703125, -0.94580078125, -0.81268310546875, -0.6795654296875, -0.54644775390625, -0.413330078125, -0.28021240234375, -0.1470947265625, -0.01397705078125, 0.119140625, 0.25225830078125, 0.3853759765625, 0.51849365234375, 0.651611328125, 0.78472900390625, 0.9178466796875, 1.05096435546875, 1.18408203125, 1.31719970703125, 1.4503173828125, 1.58343505859375, 1.716552734375, 1.84967041015625, 1.9827880859375, 2.11590576171875, 2.2490234375, 2.38214111328125, 2.5152587890625, 2.64837646484375, 2.781494140625, 2.91461181640625, 3.0477294921875, 3.18084716796875, 3.31396484375, 3.44708251953125, 3.5802001953125, 3.71331787109375, 3.846435546875, 3.97955322265625, 4.1126708984375, 4.24578857421875, 4.37890625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 7.0, 18.0, 16.0, 21.0, 34.0, 43.0, 60.0, 84.0, 128.0, 172.0, 264.0, 427.0, 609.0, 917.0, 1333.0, 2071.0, 3245.0, 5004.0, 7985.0, 12966.0, 20624.0, 33999.0, 57442.0, 102603.0, 200640.0, 1312789.0, 141778.0, 76024.0, 44303.0, 26684.0, 16497.0, 10143.0, 6448.0, 3945.0, 2572.0, 1673.0, 1138.0, 762.0, 527.0, 343.0, 266.0, 155.0, 113.0, 79.0, 51.0, 37.0, 32.0, 22.0, 13.0, 9.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-1.1943359375, -1.1573028564453125, -1.120269775390625, -1.0832366943359375, -1.04620361328125, -1.0091705322265625, -0.972137451171875, -0.9351043701171875, -0.8980712890625, -0.8610382080078125, -0.824005126953125, -0.7869720458984375, -0.74993896484375, -0.7129058837890625, -0.675872802734375, -0.6388397216796875, -0.601806640625, -0.5647735595703125, -0.527740478515625, -0.4907073974609375, -0.45367431640625, -0.4166412353515625, -0.379608154296875, -0.3425750732421875, -0.3055419921875, -0.2685089111328125, -0.231475830078125, -0.1944427490234375, -0.15740966796875, -0.1203765869140625, -0.083343505859375, -0.0463104248046875, -0.00927734375, 0.0277557373046875, 0.064788818359375, 0.1018218994140625, 0.13885498046875, 0.1758880615234375, 0.212921142578125, 0.2499542236328125, 0.2869873046875, 0.3240203857421875, 0.361053466796875, 0.3980865478515625, 0.43511962890625, 0.4721527099609375, 0.509185791015625, 0.5462188720703125, 0.583251953125, 0.6202850341796875, 0.657318115234375, 0.6943511962890625, 0.73138427734375, 0.7684173583984375, 0.805450439453125, 0.8424835205078125, 0.8795166015625, 0.9165496826171875, 0.953582763671875, 0.9906158447265625, 1.02764892578125, 1.0646820068359375, 1.101715087890625, 1.1387481689453125, 1.17578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 13.0, 20.0, 19.0, 26.0, 19.0, 33.0, 38.0, 41.0, 61.0, 75.0, 67.0, 67.0, 67.0, 63.0, 79.0, 61.0, 35.0, 53.0, 32.0, 38.0, 27.0, 22.0, 7.0, 8.0, 3.0, 9.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00130462646484375, -0.0012714564800262451, -0.0012382864952087402, -0.0012051165103912354, -0.0011719465255737305, -0.0011387765407562256, -0.0011056065559387207, -0.0010724365711212158, -0.001039266586303711, -0.001006096601486206, -0.0009729266166687012, -0.0009397566318511963, -0.0009065866470336914, -0.0008734166622161865, -0.0008402466773986816, -0.0008070766925811768, -0.0007739067077636719, -0.000740736722946167, -0.0007075667381286621, -0.0006743967533111572, -0.0006412267684936523, -0.0006080567836761475, -0.0005748867988586426, -0.0005417168140411377, -0.0005085468292236328, -0.00047537684440612793, -0.00044220685958862305, -0.00040903687477111816, -0.0003758668899536133, -0.0003426969051361084, -0.0003095269203186035, -0.00027635693550109863, -0.00024318695068359375, -0.00021001696586608887, -0.00017684698104858398, -0.0001436769962310791, -0.00011050701141357422, -7.733702659606934e-05, -4.416704177856445e-05, -1.099705696105957e-05, 2.2172927856445312e-05, 5.5342912673950195e-05, 8.851289749145508e-05, 0.00012168288230895996, 0.00015485286712646484, 0.00018802285194396973, 0.0002211928367614746, 0.0002543628215789795, 0.0002875328063964844, 0.00032070279121398926, 0.00035387277603149414, 0.000387042760848999, 0.0004202127456665039, 0.0004533827304840088, 0.00048655271530151367, 0.0005197227001190186, 0.0005528926849365234, 0.0005860626697540283, 0.0006192326545715332, 0.0006524026393890381, 0.000685572624206543, 0.0007187426090240479, 0.0007519125938415527, 0.0007850825786590576, 0.0008182525634765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 12.0, 6.0, 10.0, 23.0, 32.0, 33.0, 58.0, 57.0, 76.0, 127.0, 204.0, 389.0, 1346.0, 159966.0, 881610.0, 3248.0, 551.0, 249.0, 140.0, 98.0, 77.0, 55.0, 39.0, 28.0, 32.0, 20.0, 14.0, 17.0, 7.0, 5.0, 8.0, 5.0, 5.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01529693603515625, -0.014664053916931152, -0.014031171798706055, -0.013398289680480957, -0.01276540756225586, -0.012132525444030762, -0.011499643325805664, -0.010866761207580566, -0.010233879089355469, -0.009600996971130371, -0.008968114852905273, -0.008335232734680176, -0.007702350616455078, -0.0070694684982299805, -0.006436586380004883, -0.005803704261779785, -0.0051708221435546875, -0.00453794002532959, -0.003905057907104492, -0.0032721757888793945, -0.002639293670654297, -0.0020064115524291992, -0.0013735294342041016, -0.0007406473159790039, -0.00010776519775390625, 0.0005251169204711914, 0.001157999038696289, 0.0017908811569213867, 0.0024237632751464844, 0.003056645393371582, 0.0036895275115966797, 0.004322409629821777, 0.004955291748046875, 0.005588173866271973, 0.00622105598449707, 0.006853938102722168, 0.007486820220947266, 0.008119702339172363, 0.008752584457397461, 0.009385466575622559, 0.010018348693847656, 0.010651230812072754, 0.011284112930297852, 0.01191699504852295, 0.012549877166748047, 0.013182759284973145, 0.013815641403198242, 0.01444852352142334, 0.015081405639648438, 0.015714287757873535, 0.016347169876098633, 0.01698005199432373, 0.017612934112548828, 0.018245816230773926, 0.018878698348999023, 0.01951158046722412, 0.02014446258544922, 0.020777344703674316, 0.021410226821899414, 0.02204310894012451, 0.02267599105834961, 0.023308873176574707, 0.023941755294799805, 0.024574637413024902, 0.02520751953125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 25.0, 78.0, 149.0, 204.0, 229.0, 163.0, 97.0, 35.0, 17.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00063685531495139, -0.0005918823298998177, -0.0005469093448482454, -0.0005019363597966731, -0.00045696337474510074, -0.0004119903896935284, -0.00036701743374578655, -0.0003220444486942142, -0.0002770714636426419, -0.00023209847859106958, -0.00018712549353949726, -0.00014215252303984016, -9.717953798826784e-05, -5.2206552936695516e-05, -7.233582437038422e-06, 3.77394026145339e-05, 8.271238766610622e-05, 0.00012768537271767855, 0.00017265835776925087, 0.00021763132826890796, 0.0002626043278723955, 0.00030757731292396784, 0.0003525502688717097, 0.00039752325392328203, 0.00044249623897485435, 0.0004874692240264267, 0.0005324421799741685, 0.0005774151650257409, 0.0006223881500773132, 0.0006673611351288855, 0.0007123341201804578, 0.0007573071052320302, 0.0008022800320759416, 0.0008472530171275139, 0.0008922260021790862, 0.0009371989872306585, 0.0009821719722822309, 0.0010271449573338032, 0.0010721179423853755, 0.0011170909274369478, 0.0011620639124885201, 0.0012070368975400925, 0.0012520098825916648, 0.0012969828676432371, 0.0013419558526948094, 0.0013869288377463818, 0.001431901822797954, 0.0014768748078495264, 0.001521847676485777, 0.0015668206615373492, 0.0016117936465889215, 0.0016567666316404939, 0.0017017396166920662, 0.0017467126017436385, 0.0017916855867952108, 0.0018366585718467832, 0.0018816315568983555, 0.0019266045419499278, 0.0019715775270015, 0.0020165503956377506, 0.0020615234971046448, 0.0021064963657408953, 0.0021514694672077894, 0.00219644233584404, 0.002241415437310934]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 2.0, 2.0, 5.0, 10.0, 8.0, 10.0, 13.0, 11.0, 11.0, 16.0, 18.0, 19.0, 21.0, 22.0, 32.0, 34.0, 30.0, 39.0, 27.0, 34.0, 37.0, 44.0, 27.0, 41.0, 40.0, 38.0, 41.0, 35.0, 29.0, 36.0, 32.0, 33.0, 32.0, 23.0, 22.0, 23.0, 19.0, 17.0, 14.0, 12.0, 6.0, 10.0, 4.0, 6.0, 5.0, 4.0, 1.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00040668249130249023, -0.0003937156870961189, -0.0003807488828897476, -0.0003677820786833763, -0.000354815274477005, -0.0003418484702706337, -0.0003288816660642624, -0.0003159148618578911, -0.0003029480576515198, -0.00028998125344514847, -0.00027701444923877716, -0.00026404764503240585, -0.00025108084082603455, -0.00023811403661966324, -0.00022514723241329193, -0.00021218042820692062, -0.00019921362400054932, -0.000186246819794178, -0.0001732800155878067, -0.0001603132113814354, -0.0001473464071750641, -0.00013437960296869278, -0.00012141279876232147, -0.00010844599455595016, -9.547919034957886e-05, -8.251238614320755e-05, -6.954558193683624e-05, -5.6578777730464935e-05, -4.361197352409363e-05, -3.064516931772232e-05, -1.7678365111351013e-05, -4.711560904979706e-06, 8.255243301391602e-06, 2.122204750776291e-05, 3.4188851714134216e-05, 4.7155655920505524e-05, 6.012246012687683e-05, 7.308926433324814e-05, 8.605606853961945e-05, 9.902287274599075e-05, 0.00011198967695236206, 0.00012495648115873337, 0.00013792328536510468, 0.00015089008957147598, 0.0001638568937778473, 0.0001768236979842186, 0.0001897905021905899, 0.0002027573063969612, 0.00021572411060333252, 0.00022869091480970383, 0.00024165771901607513, 0.00025462452322244644, 0.00026759132742881775, 0.00028055813163518906, 0.00029352493584156036, 0.00030649174004793167, 0.000319458544254303, 0.0003324253484606743, 0.0003453921526670456, 0.0003583589568734169, 0.0003713257610797882, 0.0003842925652861595, 0.0003972593694925308, 0.00041022617369890213, 0.00042319297790527344]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 10.0, 10.0, 11.0, 14.0, 26.0, 15.0, 25.0, 22.0, 24.0, 40.0, 38.0, 30.0, 48.0, 51.0, 42.0, 51.0, 47.0, 52.0, 52.0, 53.0, 37.0, 45.0, 41.0, 42.0, 33.0, 21.0, 19.0, 18.0, 14.0, 14.0, 12.0, 11.0, 11.0, 2.0, 3.0, 3.0, 8.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.2928466796875, -6.046630859375, -5.8004150390625, -5.55419921875, -5.3079833984375, -5.061767578125, -4.8155517578125, -4.5693359375, -4.3231201171875, -4.076904296875, -3.8306884765625, -3.58447265625, -3.3382568359375, -3.092041015625, -2.8458251953125, -2.599609375, -2.3533935546875, -2.107177734375, -1.8609619140625, -1.61474609375, -1.3685302734375, -1.122314453125, -0.8760986328125, -0.6298828125, -0.3836669921875, -0.137451171875, 0.1087646484375, 0.35498046875, 0.6011962890625, 0.847412109375, 1.0936279296875, 1.33984375, 1.5860595703125, 1.832275390625, 2.0784912109375, 2.32470703125, 2.5709228515625, 2.817138671875, 3.0633544921875, 3.3095703125, 3.5557861328125, 3.802001953125, 4.0482177734375, 4.29443359375, 4.5406494140625, 4.786865234375, 5.0330810546875, 5.279296875, 5.5255126953125, 5.771728515625, 6.0179443359375, 6.26416015625, 6.5103759765625, 6.756591796875, 7.0028076171875, 7.2490234375, 7.4952392578125, 7.741455078125, 7.9876708984375, 8.23388671875, 8.4801025390625, 8.726318359375, 8.9725341796875, 9.21875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 12.0, 19.0, 26.0, 32.0, 49.0, 69.0, 109.0, 182.0, 304.0, 569.0, 1316.0, 3337.0, 9672.0, 29578.0, 98449.0, 330629.0, 397086.0, 121984.0, 36446.0, 11612.0, 3974.0, 1480.0, 681.0, 354.0, 201.0, 127.0, 85.0, 47.0, 35.0, 36.0, 15.0, 11.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.65625, -8.3778076171875, -8.099365234375, -7.8209228515625, -7.54248046875, -7.2640380859375, -6.985595703125, -6.7071533203125, -6.4287109375, -6.1502685546875, -5.871826171875, -5.5933837890625, -5.31494140625, -5.0364990234375, -4.758056640625, -4.4796142578125, -4.201171875, -3.9227294921875, -3.644287109375, -3.3658447265625, -3.08740234375, -2.8089599609375, -2.530517578125, -2.2520751953125, -1.9736328125, -1.6951904296875, -1.416748046875, -1.1383056640625, -0.85986328125, -0.5814208984375, -0.302978515625, -0.0245361328125, 0.25390625, 0.5323486328125, 0.810791015625, 1.0892333984375, 1.36767578125, 1.6461181640625, 1.924560546875, 2.2030029296875, 2.4814453125, 2.7598876953125, 3.038330078125, 3.3167724609375, 3.59521484375, 3.8736572265625, 4.152099609375, 4.4305419921875, 4.708984375, 4.9874267578125, 5.265869140625, 5.5443115234375, 5.82275390625, 6.1011962890625, 6.379638671875, 6.6580810546875, 6.9365234375, 7.2149658203125, 7.493408203125, 7.7718505859375, 8.05029296875, 8.3287353515625, 8.607177734375, 8.8856201171875, 9.1640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 7.0, 10.0, 4.0, 16.0, 16.0, 15.0, 15.0, 21.0, 34.0, 28.0, 41.0, 44.0, 42.0, 50.0, 56.0, 82.0, 175.0, 1475.0, 324.0, 115.0, 64.0, 51.0, 37.0, 45.0, 40.0, 31.0, 32.0, 29.0, 25.0, 26.0, 17.0, 16.0, 16.0, 12.0, 6.0, 8.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.203125, -19.47705078125, -18.7509765625, -18.02490234375, -17.298828125, -16.57275390625, -15.8466796875, -15.12060546875, -14.39453125, -13.66845703125, -12.9423828125, -12.21630859375, -11.490234375, -10.76416015625, -10.0380859375, -9.31201171875, -8.5859375, -7.85986328125, -7.1337890625, -6.40771484375, -5.681640625, -4.95556640625, -4.2294921875, -3.50341796875, -2.77734375, -2.05126953125, -1.3251953125, -0.59912109375, 0.126953125, 0.85302734375, 1.5791015625, 2.30517578125, 3.03125, 3.75732421875, 4.4833984375, 5.20947265625, 5.935546875, 6.66162109375, 7.3876953125, 8.11376953125, 8.83984375, 9.56591796875, 10.2919921875, 11.01806640625, 11.744140625, 12.47021484375, 13.1962890625, 13.92236328125, 14.6484375, 15.37451171875, 16.1005859375, 16.82666015625, 17.552734375, 18.27880859375, 19.0048828125, 19.73095703125, 20.45703125, 21.18310546875, 21.9091796875, 22.63525390625, 23.361328125, 24.08740234375, 24.8134765625, 25.53955078125, 26.265625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 6.0, 4.0, 2.0, 9.0, 8.0, 6.0, 8.0, 12.0, 26.0, 31.0, 48.0, 52.0, 96.0, 113.0, 199.0, 344.0, 878.0, 9000.0, 3126969.0, 6224.0, 784.0, 313.0, 187.0, 127.0, 77.0, 50.0, 42.0, 25.0, 19.0, 20.0, 9.0, 4.0, 4.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-111.75, -108.306640625, -104.86328125, -101.419921875, -97.9765625, -94.533203125, -91.08984375, -87.646484375, -84.203125, -80.759765625, -77.31640625, -73.873046875, -70.4296875, -66.986328125, -63.54296875, -60.099609375, -56.65625, -53.212890625, -49.76953125, -46.326171875, -42.8828125, -39.439453125, -35.99609375, -32.552734375, -29.109375, -25.666015625, -22.22265625, -18.779296875, -15.3359375, -11.892578125, -8.44921875, -5.005859375, -1.5625, 1.880859375, 5.32421875, 8.767578125, 12.2109375, 15.654296875, 19.09765625, 22.541015625, 25.984375, 29.427734375, 32.87109375, 36.314453125, 39.7578125, 43.201171875, 46.64453125, 50.087890625, 53.53125, 56.974609375, 60.41796875, 63.861328125, 67.3046875, 70.748046875, 74.19140625, 77.634765625, 81.078125, 84.521484375, 87.96484375, 91.408203125, 94.8515625, 98.294921875, 101.73828125, 105.181640625, 108.625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 12.0, 23.0, 58.0, 89.0, 123.0, 164.0, 192.0, 129.0, 93.0, 62.0, 28.0, 20.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.250093460083008, -30.055500030517578, -28.86090660095215, -27.66631317138672, -26.471721649169922, -25.277128219604492, -24.082534790039062, -22.887943267822266, -21.693347930908203, -20.498754501342773, -19.304161071777344, -18.109569549560547, -16.914976119995117, -15.720382690429688, -14.525789260864258, -13.331196784973145, -12.136604309082031, -10.942010879516602, -9.747418403625488, -8.552824974060059, -7.358232021331787, -6.163639068603516, -4.969045639038086, -3.7744531631469727, -2.579859733581543, -1.385266661643982, -0.1906735897064209, 1.0039196014404297, 2.198512554168701, 3.3931055068969727, 4.587698936462402, 5.782291412353516, 6.9768829345703125, 8.171476364135742, 9.366068840026855, 10.560662269592285, 11.755254745483398, 12.949848175048828, 14.144441604614258, 15.339034080505371, 16.533626556396484, 17.728219985961914, 18.922813415527344, 20.11740493774414, 21.31199836730957, 22.506591796875, 23.70118522644043, 24.89577865600586, 26.09037208557129, 27.28496551513672, 28.47955894470215, 29.674152374267578, 30.868743896484375, 32.06333923339844, 33.257930755615234, 34.45252227783203, 35.647117614746094, 36.84170913696289, 38.03630447387695, 39.23089599609375, 40.42549133300781, 41.62008285522461, 42.814674377441406, 44.00926971435547, 45.203861236572266]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 6.0, 7.0, 14.0, 22.0, 14.0, 17.0, 19.0, 30.0, 21.0, 33.0, 45.0, 25.0, 43.0, 35.0, 44.0, 54.0, 57.0, 49.0, 37.0, 42.0, 31.0, 38.0, 35.0, 45.0, 50.0, 27.0, 21.0, 23.0, 24.0, 16.0, 17.0, 9.0, 10.0, 10.0, 6.0, 10.0, 5.0, 2.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.87211227416992, -48.00289535522461, -46.1336784362793, -44.26445770263672, -42.395240783691406, -40.526023864746094, -38.65680694580078, -36.78759002685547, -34.918373107910156, -33.049156188964844, -31.1799373626709, -29.310720443725586, -27.44150161743164, -25.572284698486328, -23.703067779541016, -21.833850860595703, -19.964630126953125, -18.095413208007812, -16.226194381713867, -14.356977462768555, -12.487759590148926, -10.618541717529297, -8.749324798583984, -6.8801069259643555, -5.010889053344727, -3.1416714191436768, -1.272453784942627, 0.5967636108398438, 2.4659814834594727, 4.335199356079102, 6.204416275024414, 8.073634147644043, 9.942855834960938, 11.812073707580566, 13.681291580200195, 15.550508499145508, 17.419727325439453, 19.288944244384766, 21.158161163330078, 23.02737808227539, 24.896596908569336, 26.76581382751465, 28.635032653808594, 30.504249572753906, 32.37346649169922, 34.24268341064453, 36.111900329589844, 37.98112106323242, 39.850337982177734, 41.71955490112305, 43.58877182006836, 45.45799255371094, 47.32720947265625, 49.19642639160156, 51.065643310546875, 52.93486022949219, 54.8040771484375, 56.67329406738281, 58.542510986328125, 60.41172790527344, 62.280948638916016, 64.15016174316406, 66.01937866210938, 67.88860321044922, 69.75782012939453]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 11.0, 8.0, 19.0, 9.0, 11.0, 17.0, 21.0, 35.0, 29.0, 36.0, 34.0, 41.0, 42.0, 53.0, 47.0, 52.0, 48.0, 50.0, 61.0, 49.0, 44.0, 31.0, 50.0, 35.0, 33.0, 25.0, 19.0, 18.0, 15.0, 8.0, 17.0, 6.0, 8.0, 7.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.2890625, -7.0142822265625, -6.739501953125, -6.4647216796875, -6.18994140625, -5.9151611328125, -5.640380859375, -5.3656005859375, -5.0908203125, -4.8160400390625, -4.541259765625, -4.2664794921875, -3.99169921875, -3.7169189453125, -3.442138671875, -3.1673583984375, -2.892578125, -2.6177978515625, -2.343017578125, -2.0682373046875, -1.79345703125, -1.5186767578125, -1.243896484375, -0.9691162109375, -0.6943359375, -0.4195556640625, -0.144775390625, 0.1300048828125, 0.40478515625, 0.6795654296875, 0.954345703125, 1.2291259765625, 1.50390625, 1.7786865234375, 2.053466796875, 2.3282470703125, 2.60302734375, 2.8778076171875, 3.152587890625, 3.4273681640625, 3.7021484375, 3.9769287109375, 4.251708984375, 4.5264892578125, 4.80126953125, 5.0760498046875, 5.350830078125, 5.6256103515625, 5.900390625, 6.1751708984375, 6.449951171875, 6.7247314453125, 6.99951171875, 7.2742919921875, 7.549072265625, 7.8238525390625, 8.0986328125, 8.3734130859375, 8.648193359375, 8.9229736328125, 9.19775390625, 9.4725341796875, 9.747314453125, 10.0220947265625, 10.296875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 11.0, 9.0, 7.0, 11.0, 20.0, 25.0, 29.0, 35.0, 47.0, 50.0, 62.0, 75.0, 112.0, 124.0, 265.0, 605.0, 2371.0, 25040.0, 573062.0, 2845302.0, 712421.0, 30512.0, 2532.0, 591.0, 284.0, 162.0, 121.0, 93.0, 59.0, 47.0, 35.0, 28.0, 31.0, 17.0, 17.0, 16.0, 21.0, 8.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.79541015625, -15.2001953125, -14.60498046875, -14.009765625, -13.41455078125, -12.8193359375, -12.22412109375, -11.62890625, -11.03369140625, -10.4384765625, -9.84326171875, -9.248046875, -8.65283203125, -8.0576171875, -7.46240234375, -6.8671875, -6.27197265625, -5.6767578125, -5.08154296875, -4.486328125, -3.89111328125, -3.2958984375, -2.70068359375, -2.10546875, -1.51025390625, -0.9150390625, -0.31982421875, 0.275390625, 0.87060546875, 1.4658203125, 2.06103515625, 2.65625, 3.25146484375, 3.8466796875, 4.44189453125, 5.037109375, 5.63232421875, 6.2275390625, 6.82275390625, 7.41796875, 8.01318359375, 8.6083984375, 9.20361328125, 9.798828125, 10.39404296875, 10.9892578125, 11.58447265625, 12.1796875, 12.77490234375, 13.3701171875, 13.96533203125, 14.560546875, 15.15576171875, 15.7509765625, 16.34619140625, 16.94140625, 17.53662109375, 18.1318359375, 18.72705078125, 19.322265625, 19.91748046875, 20.5126953125, 21.10791015625, 21.703125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 11.0, 9.0, 17.0, 20.0, 23.0, 38.0, 69.0, 69.0, 115.0, 155.0, 222.0, 296.0, 419.0, 477.0, 488.0, 487.0, 331.0, 254.0, 177.0, 111.0, 76.0, 52.0, 40.0, 34.0, 22.0, 17.0, 14.0, 11.0, 10.0, 4.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8359375, -12.3463134765625, -11.856689453125, -11.3670654296875, -10.87744140625, -10.3878173828125, -9.898193359375, -9.4085693359375, -8.9189453125, -8.4293212890625, -7.939697265625, -7.4500732421875, -6.96044921875, -6.4708251953125, -5.981201171875, -5.4915771484375, -5.001953125, -4.5123291015625, -4.022705078125, -3.5330810546875, -3.04345703125, -2.5538330078125, -2.064208984375, -1.5745849609375, -1.0849609375, -0.5953369140625, -0.105712890625, 0.3839111328125, 0.87353515625, 1.3631591796875, 1.852783203125, 2.3424072265625, 2.83203125, 3.3216552734375, 3.811279296875, 4.3009033203125, 4.79052734375, 5.2801513671875, 5.769775390625, 6.2593994140625, 6.7490234375, 7.2386474609375, 7.728271484375, 8.2178955078125, 8.70751953125, 9.1971435546875, 9.686767578125, 10.1763916015625, 10.666015625, 11.1556396484375, 11.645263671875, 12.1348876953125, 12.62451171875, 13.1141357421875, 13.603759765625, 14.0933837890625, 14.5830078125, 15.0726318359375, 15.562255859375, 16.0518798828125, 16.54150390625, 17.0311279296875, 17.520751953125, 18.0103759765625, 18.5]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 7.0, 11.0, 18.0, 18.0, 23.0, 44.0, 56.0, 76.0, 102.0, 156.0, 242.0, 355.0, 661.0, 7829.0, 4031848.0, 150448.0, 1000.0, 431.0, 311.0, 191.0, 138.0, 109.0, 73.0, 42.0, 25.0, 20.0, 18.0, 10.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-88.5, -86.212890625, -83.92578125, -81.638671875, -79.3515625, -77.064453125, -74.77734375, -72.490234375, -70.203125, -67.916015625, -65.62890625, -63.341796875, -61.0546875, -58.767578125, -56.48046875, -54.193359375, -51.90625, -49.619140625, -47.33203125, -45.044921875, -42.7578125, -40.470703125, -38.18359375, -35.896484375, -33.609375, -31.322265625, -29.03515625, -26.748046875, -24.4609375, -22.173828125, -19.88671875, -17.599609375, -15.3125, -13.025390625, -10.73828125, -8.451171875, -6.1640625, -3.876953125, -1.58984375, 0.697265625, 2.984375, 5.271484375, 7.55859375, 9.845703125, 12.1328125, 14.419921875, 16.70703125, 18.994140625, 21.28125, 23.568359375, 25.85546875, 28.142578125, 30.4296875, 32.716796875, 35.00390625, 37.291015625, 39.578125, 41.865234375, 44.15234375, 46.439453125, 48.7265625, 51.013671875, 53.30078125, 55.587890625, 57.875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 10.0, 110.0, 382.0, 403.0, 97.0, 14.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.3288688659668, -51.93135452270508, -44.53384017944336, -37.136322021484375, -29.73880958557129, -22.341293334960938, -14.943778991699219, -7.5462646484375, -0.14875030517578125, 7.248764514923096, 14.646279335021973, 22.043794631958008, 29.441308975219727, 36.83882522583008, 44.2363395690918, 51.633853912353516, 59.031368255615234, 66.42888641357422, 73.82640075683594, 81.22391510009766, 88.62142944335938, 96.0189437866211, 103.41645812988281, 110.81397247314453, 118.21148681640625, 125.60900115966797, 133.0065155029297, 140.40403747558594, 147.80154418945312, 155.19906616210938, 162.59657287597656, 169.9940948486328, 177.39161682128906, 184.7891387939453, 192.1866455078125, 199.58416748046875, 206.98167419433594, 214.3791961669922, 221.77670288085938, 229.17422485351562, 236.5717315673828, 243.96925354003906, 251.36676025390625, 258.7642822265625, 266.16180419921875, 273.5592956542969, 280.9568176269531, 288.3543395996094, 295.7518615722656, 303.1493835449219, 310.5469055175781, 317.94439697265625, 325.3419189453125, 332.73944091796875, 340.136962890625, 347.5344543457031, 354.9319763183594, 362.3294982910156, 369.7270202636719, 377.12451171875, 384.52203369140625, 391.9195556640625, 399.31707763671875, 406.7145690917969, 414.1120910644531]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 9.0, 8.0, 9.0, 6.0, 8.0, 14.0, 19.0, 16.0, 21.0, 25.0, 19.0, 28.0, 43.0, 36.0, 40.0, 34.0, 26.0, 42.0, 39.0, 44.0, 45.0, 37.0, 42.0, 38.0, 47.0, 34.0, 28.0, 28.0, 32.0, 29.0, 26.0, 25.0, 25.0, 15.0, 8.0, 11.0, 10.0, 11.0, 8.0, 5.0, 2.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.607723236083984, -38.214412689208984, -36.82110595703125, -35.42779541015625, -34.034488677978516, -32.641178131103516, -31.24786949157715, -29.85456085205078, -28.46125030517578, -27.067941665649414, -25.674633026123047, -24.281322479248047, -22.88801383972168, -21.494705200195312, -20.101396560668945, -18.708087921142578, -17.31477928161621, -15.921470642089844, -14.52816104888916, -13.134852409362793, -11.74154281616211, -10.348234176635742, -8.954925537109375, -7.561615943908691, -6.168307304382324, -4.774998188018799, -3.3816893100738525, -1.9883804321289062, -0.5950713157653809, 0.7982378005981445, 2.1915464401245117, 3.5848560333251953, 4.9781646728515625, 6.371473789215088, 7.764782905578613, 9.15809154510498, 10.551401138305664, 11.944709777832031, 13.338018417358398, 14.731328010559082, 16.124637603759766, 17.517946243286133, 18.9112548828125, 20.3045654296875, 21.697874069213867, 23.091182708740234, 24.4844913482666, 25.87779998779297, 27.271108627319336, 28.664417266845703, 30.05772590637207, 31.451034545898438, 32.84434509277344, 34.23765563964844, 35.63096237182617, 37.02427291870117, 38.417579650878906, 39.810890197753906, 41.20419692993164, 42.59750747680664, 43.990814208984375, 45.384124755859375, 46.777435302734375, 48.17074203491211, 49.56405258178711]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 6.0, 13.0, 9.0, 11.0, 15.0, 20.0, 24.0, 32.0, 37.0, 23.0, 35.0, 39.0, 51.0, 42.0, 46.0, 53.0, 53.0, 45.0, 45.0, 45.0, 46.0, 34.0, 30.0, 34.0, 36.0, 30.0, 17.0, 27.0, 15.0, 18.0, 11.0, 12.0, 16.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.6131591796875, -6.366943359375, -6.1207275390625, -5.87451171875, -5.6282958984375, -5.382080078125, -5.1358642578125, -4.8896484375, -4.6434326171875, -4.397216796875, -4.1510009765625, -3.90478515625, -3.6585693359375, -3.412353515625, -3.1661376953125, -2.919921875, -2.6737060546875, -2.427490234375, -2.1812744140625, -1.93505859375, -1.6888427734375, -1.442626953125, -1.1964111328125, -0.9501953125, -0.7039794921875, -0.457763671875, -0.2115478515625, 0.03466796875, 0.2808837890625, 0.527099609375, 0.7733154296875, 1.01953125, 1.2657470703125, 1.511962890625, 1.7581787109375, 2.00439453125, 2.2506103515625, 2.496826171875, 2.7430419921875, 2.9892578125, 3.2354736328125, 3.481689453125, 3.7279052734375, 3.97412109375, 4.2203369140625, 4.466552734375, 4.7127685546875, 4.958984375, 5.2052001953125, 5.451416015625, 5.6976318359375, 5.94384765625, 6.1900634765625, 6.436279296875, 6.6824951171875, 6.9287109375, 7.1749267578125, 7.421142578125, 7.6673583984375, 7.91357421875, 8.1597900390625, 8.406005859375, 8.6522216796875, 8.8984375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 10.0, 11.0, 9.0, 13.0, 19.0, 23.0, 33.0, 55.0, 77.0, 126.0, 201.0, 292.0, 453.0, 669.0, 1036.0, 1593.0, 2445.0, 3543.0, 5652.0, 8472.0, 13096.0, 20628.0, 33195.0, 55801.0, 100739.0, 209475.0, 277649.0, 132524.0, 70196.0, 40545.0, 24851.0, 15811.0, 10017.0, 6607.0, 4341.0, 2801.0, 1869.0, 1208.0, 872.0, 544.0, 356.0, 255.0, 146.0, 102.0, 67.0, 36.0, 38.0, 22.0, 12.0, 10.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.1826171875, -1.14471435546875, -1.1068115234375, -1.06890869140625, -1.031005859375, -0.99310302734375, -0.9552001953125, -0.91729736328125, -0.87939453125, -0.84149169921875, -0.8035888671875, -0.76568603515625, -0.727783203125, -0.68988037109375, -0.6519775390625, -0.61407470703125, -0.576171875, -0.53826904296875, -0.5003662109375, -0.46246337890625, -0.424560546875, -0.38665771484375, -0.3487548828125, -0.31085205078125, -0.27294921875, -0.23504638671875, -0.1971435546875, -0.15924072265625, -0.121337890625, -0.08343505859375, -0.0455322265625, -0.00762939453125, 0.0302734375, 0.06817626953125, 0.1060791015625, 0.14398193359375, 0.181884765625, 0.21978759765625, 0.2576904296875, 0.29559326171875, 0.33349609375, 0.37139892578125, 0.4093017578125, 0.44720458984375, 0.485107421875, 0.52301025390625, 0.5609130859375, 0.59881591796875, 0.63671875, 0.67462158203125, 0.7125244140625, 0.75042724609375, 0.788330078125, 0.82623291015625, 0.8641357421875, 0.90203857421875, 0.93994140625, 0.97784423828125, 1.0157470703125, 1.05364990234375, 1.091552734375, 1.12945556640625, 1.1673583984375, 1.20526123046875, 1.2431640625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 7.0, 2.0, 7.0, 6.0, 17.0, 12.0, 10.0, 19.0, 20.0, 26.0, 23.0, 22.0, 27.0, 34.0, 35.0, 31.0, 40.0, 36.0, 43.0, 36.0, 1063.0, 34.0, 42.0, 36.0, 49.0, 41.0, 27.0, 36.0, 29.0, 33.0, 34.0, 18.0, 22.0, 17.0, 13.0, 14.0, 14.0, 13.0, 8.0, 6.0, 7.0, 8.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.49609375, -4.35980224609375, -4.2235107421875, -4.08721923828125, -3.950927734375, -3.81463623046875, -3.6783447265625, -3.54205322265625, -3.40576171875, -3.26947021484375, -3.1331787109375, -2.99688720703125, -2.860595703125, -2.72430419921875, -2.5880126953125, -2.45172119140625, -2.3154296875, -2.17913818359375, -2.0428466796875, -1.90655517578125, -1.770263671875, -1.63397216796875, -1.4976806640625, -1.36138916015625, -1.22509765625, -1.08880615234375, -0.9525146484375, -0.81622314453125, -0.679931640625, -0.54364013671875, -0.4073486328125, -0.27105712890625, -0.134765625, 0.00152587890625, 0.1378173828125, 0.27410888671875, 0.410400390625, 0.54669189453125, 0.6829833984375, 0.81927490234375, 0.95556640625, 1.09185791015625, 1.2281494140625, 1.36444091796875, 1.500732421875, 1.63702392578125, 1.7733154296875, 1.90960693359375, 2.0458984375, 2.18218994140625, 2.3184814453125, 2.45477294921875, 2.591064453125, 2.72735595703125, 2.8636474609375, 2.99993896484375, 3.13623046875, 3.27252197265625, 3.4088134765625, 3.54510498046875, 3.681396484375, 3.81768798828125, 3.9539794921875, 4.09027099609375, 4.2265625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 5.0, 11.0, 16.0, 24.0, 33.0, 36.0, 56.0, 93.0, 123.0, 151.0, 220.0, 313.0, 474.0, 689.0, 942.0, 1458.0, 2091.0, 3313.0, 4860.0, 7699.0, 11720.0, 18337.0, 29486.0, 48973.0, 84412.0, 156890.0, 1320401.0, 172041.0, 91869.0, 52141.0, 31410.0, 19760.0, 12505.0, 8272.0, 5422.0, 3528.0, 2320.0, 1602.0, 1062.0, 714.0, 510.0, 394.0, 200.0, 180.0, 118.0, 90.0, 50.0, 31.0, 31.0, 27.0, 9.0, 9.0, 7.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.0966796875, -1.0608062744140625, -1.024932861328125, -0.9890594482421875, -0.95318603515625, -0.9173126220703125, -0.881439208984375, -0.8455657958984375, -0.8096923828125, -0.7738189697265625, -0.737945556640625, -0.7020721435546875, -0.66619873046875, -0.6303253173828125, -0.594451904296875, -0.5585784912109375, -0.522705078125, -0.4868316650390625, -0.450958251953125, -0.4150848388671875, -0.37921142578125, -0.3433380126953125, -0.307464599609375, -0.2715911865234375, -0.2357177734375, -0.1998443603515625, -0.163970947265625, -0.1280975341796875, -0.09222412109375, -0.0563507080078125, -0.020477294921875, 0.0153961181640625, 0.05126953125, 0.0871429443359375, 0.123016357421875, 0.1588897705078125, 0.19476318359375, 0.2306365966796875, 0.266510009765625, 0.3023834228515625, 0.3382568359375, 0.3741302490234375, 0.410003662109375, 0.4458770751953125, 0.48175048828125, 0.5176239013671875, 0.553497314453125, 0.5893707275390625, 0.625244140625, 0.6611175537109375, 0.696990966796875, 0.7328643798828125, 0.76873779296875, 0.8046112060546875, 0.840484619140625, 0.8763580322265625, 0.9122314453125, 0.9481048583984375, 0.983978271484375, 1.0198516845703125, 1.05572509765625, 1.0915985107421875, 1.127471923828125, 1.1633453369140625, 1.19921875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 4.0, 9.0, 9.0, 8.0, 9.0, 11.0, 18.0, 15.0, 31.0, 39.0, 43.0, 35.0, 48.0, 52.0, 48.0, 47.0, 50.0, 56.0, 67.0, 51.0, 53.0, 42.0, 32.0, 30.0, 28.0, 20.0, 26.0, 16.0, 17.0, 12.0, 8.0, 6.0, 8.0, 5.0, 9.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008759498596191406, -0.0008440092206001282, -0.0008120685815811157, -0.0007801279425621033, -0.0007481873035430908, -0.0007162466645240784, -0.0006843060255050659, -0.0006523653864860535, -0.000620424747467041, -0.0005884841084480286, -0.0005565434694290161, -0.0005246028304100037, -0.0004926621913909912, -0.00046072155237197876, -0.0004287809133529663, -0.00039684027433395386, -0.0003648996353149414, -0.00033295899629592896, -0.0003010183572769165, -0.00026907771825790405, -0.0002371370792388916, -0.00020519644021987915, -0.0001732558012008667, -0.00014131516218185425, -0.0001093745231628418, -7.743388414382935e-05, -4.5493245124816895e-05, -1.3552606105804443e-05, 1.8388032913208008e-05, 5.032867193222046e-05, 8.226931095123291e-05, 0.00011420994997024536, 0.0001461505889892578, 0.00017809122800827026, 0.00021003186702728271, 0.00024197250604629517, 0.0002739131450653076, 0.00030585378408432007, 0.0003377944231033325, 0.00036973506212234497, 0.0004016757011413574, 0.0004336163401603699, 0.0004655569791793823, 0.0004974976181983948, 0.0005294382572174072, 0.0005613788962364197, 0.0005933195352554321, 0.0006252601742744446, 0.000657200813293457, 0.0006891414523124695, 0.0007210820913314819, 0.0007530227303504944, 0.0007849633693695068, 0.0008169040083885193, 0.0008488446474075317, 0.0008807852864265442, 0.0009127259254455566, 0.0009446665644645691, 0.0009766072034835815, 0.001008547842502594, 0.0010404884815216064, 0.001072429120540619, 0.0011043697595596313, 0.0011363103985786438, 0.0011682510375976562]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 2.0, 5.0, 2.0, 4.0, 5.0, 9.0, 13.0, 10.0, 10.0, 11.0, 20.0, 24.0, 25.0, 35.0, 38.0, 43.0, 73.0, 91.0, 146.0, 283.0, 546.0, 2741.0, 907796.0, 134160.0, 1220.0, 424.0, 218.0, 156.0, 95.0, 87.0, 51.0, 51.0, 30.0, 30.0, 11.0, 21.0, 12.0, 12.0, 14.0, 4.0, 7.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.0248260498046875, -0.024132966995239258, -0.023439884185791016, -0.022746801376342773, -0.02205371856689453, -0.02136063575744629, -0.020667552947998047, -0.019974470138549805, -0.019281387329101562, -0.01858830451965332, -0.017895221710205078, -0.017202138900756836, -0.016509056091308594, -0.01581597328186035, -0.01512289047241211, -0.014429807662963867, -0.013736724853515625, -0.013043642044067383, -0.01235055923461914, -0.011657476425170898, -0.010964393615722656, -0.010271310806274414, -0.009578227996826172, -0.00888514518737793, -0.008192062377929688, -0.007498979568481445, -0.006805896759033203, -0.006112813949584961, -0.005419731140136719, -0.0047266483306884766, -0.004033565521240234, -0.003340482711791992, -0.00264739990234375, -0.001954317092895508, -0.0012612342834472656, -0.0005681514739990234, 0.00012493133544921875, 0.0008180141448974609, 0.0015110969543457031, 0.0022041797637939453, 0.0028972625732421875, 0.0035903453826904297, 0.004283428192138672, 0.004976511001586914, 0.005669593811035156, 0.0063626766204833984, 0.007055759429931641, 0.007748842239379883, 0.008441925048828125, 0.009135007858276367, 0.00982809066772461, 0.010521173477172852, 0.011214256286621094, 0.011907339096069336, 0.012600421905517578, 0.01329350471496582, 0.013986587524414062, 0.014679670333862305, 0.015372753143310547, 0.01606583595275879, 0.01675891876220703, 0.017452001571655273, 0.018145084381103516, 0.018838167190551758, 0.01953125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 26.0, 77.0, 192.0, 305.0, 251.0, 121.0, 32.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021674383897334337, -0.0021050528157502413, -0.002042667241767049, -0.0019802816677838564, -0.0019178962102159858, -0.0018555106362327933, -0.0017931251786649227, -0.0017307396046817303, -0.0016683540306985378, -0.0016059684567153454, -0.001543582882732153, -0.0014811974251642823, -0.0014188118511810899, -0.0013564262771978974, -0.0012940408196300268, -0.0012316552456468344, -0.001169269671663642, -0.0011068840976804495, -0.001044498523697257, -0.0009821130661293864, -0.000919727492146194, -0.0008573419181630015, -0.00079495640238747, -0.0007325708866119385, -0.000670185312628746, -0.0006077997386455536, -0.0005454142228700221, -0.00048302867799066007, -0.0004206431331112981, -0.0003582575882319361, -0.0002958720433525741, -0.00023348649847321212, -0.00017110072076320648, -0.0001087151758838445, -4.632963100448251e-05, 1.605591387487948e-05, 7.844145875424147e-05, 0.00014082700363360345, 0.00020321254851296544, 0.00026559809339232743, 0.0003279836382716894, 0.0003903691831510514, 0.0004527547280304134, 0.0005151402438059449, 0.0005775258177891374, 0.0006399113917723298, 0.0007022969075478613, 0.0007646824233233929, 0.0008270679973065853, 0.0008894535712897778, 0.0009518390870653093, 0.0010142246028408408, 0.0010766101768240333, 0.0011389957508072257, 0.0012013812083750963, 0.0012637667823582888, 0.0013261523563414812, 0.0013885379303246737, 0.001450923504307866, 0.0015133089618757367, 0.0015756945358589292, 0.0016380801098421216, 0.0017004655674099922, 0.0017628511413931847, 0.001825236715376377]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 2.0, 7.0, 9.0, 7.0, 11.0, 13.0, 18.0, 13.0, 14.0, 12.0, 32.0, 28.0, 24.0, 31.0, 39.0, 35.0, 23.0, 37.0, 30.0, 33.0, 42.0, 45.0, 48.0, 40.0, 49.0, 43.0, 31.0, 47.0, 29.0, 38.0, 15.0, 25.0, 22.0, 20.0, 21.0, 13.0, 11.0, 11.0, 7.0, 6.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005617737770080566, -0.000544319860637188, -0.0005268659442663193, -0.0005094120278954506, -0.0004919581115245819, -0.0004745041951537132, -0.00045705027878284454, -0.00043959636241197586, -0.0004221424460411072, -0.0004046885296702385, -0.0003872346132993698, -0.00036978069692850113, -0.00035232678055763245, -0.00033487286418676376, -0.0003174189478158951, -0.0002999650314450264, -0.0002825111150741577, -0.00026505719870328903, -0.00024760328233242035, -0.00023014936596155167, -0.00021269544959068298, -0.0001952415332198143, -0.00017778761684894562, -0.00016033370047807693, -0.00014287978410720825, -0.00012542586773633957, -0.00010797195136547089, -9.05180349946022e-05, -7.306411862373352e-05, -5.561020225286484e-05, -3.8156285881996155e-05, -2.0702369511127472e-05, -3.248453140258789e-06, 1.4205463230609894e-05, 3.165937960147858e-05, 4.911329597234726e-05, 6.656721234321594e-05, 8.402112871408463e-05, 0.00010147504508495331, 0.00011892896145582199, 0.00013638287782669067, 0.00015383679419755936, 0.00017129071056842804, 0.00018874462693929672, 0.0002061985433101654, 0.0002236524596810341, 0.00024110637605190277, 0.00025856029242277145, 0.00027601420879364014, 0.0002934681251645088, 0.0003109220415353775, 0.0003283759579062462, 0.00034582987427711487, 0.00036328379064798355, 0.00038073770701885223, 0.0003981916233897209, 0.0004156455397605896, 0.0004330994561314583, 0.00045055337250232697, 0.00046800728887319565, 0.00048546120524406433, 0.000502915121614933, 0.0005203690379858017, 0.0005378229543566704, 0.0005552768707275391]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 7.0, 6.0, 13.0, 9.0, 11.0, 15.0, 20.0, 24.0, 32.0, 37.0, 23.0, 35.0, 39.0, 51.0, 42.0, 46.0, 53.0, 53.0, 45.0, 45.0, 45.0, 46.0, 34.0, 30.0, 34.0, 36.0, 30.0, 17.0, 27.0, 15.0, 18.0, 11.0, 12.0, 16.0, 5.0, 5.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.859375, -6.6131591796875, -6.366943359375, -6.1207275390625, -5.87451171875, -5.6282958984375, -5.382080078125, -5.1358642578125, -4.8896484375, -4.6434326171875, -4.397216796875, -4.1510009765625, -3.90478515625, -3.6585693359375, -3.412353515625, -3.1661376953125, -2.919921875, -2.6737060546875, -2.427490234375, -2.1812744140625, -1.93505859375, -1.6888427734375, -1.442626953125, -1.1964111328125, -0.9501953125, -0.7039794921875, -0.457763671875, -0.2115478515625, 0.03466796875, 0.2808837890625, 0.527099609375, 0.7733154296875, 1.01953125, 1.2657470703125, 1.511962890625, 1.7581787109375, 2.00439453125, 2.2506103515625, 2.496826171875, 2.7430419921875, 2.9892578125, 3.2354736328125, 3.481689453125, 3.7279052734375, 3.97412109375, 4.2203369140625, 4.466552734375, 4.7127685546875, 4.958984375, 5.2052001953125, 5.451416015625, 5.6976318359375, 5.94384765625, 6.1900634765625, 6.436279296875, 6.6824951171875, 6.9287109375, 7.1749267578125, 7.421142578125, 7.6673583984375, 7.91357421875, 8.1597900390625, 8.406005859375, 8.6522216796875, 8.8984375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 5.0, 13.0, 8.0, 15.0, 21.0, 30.0, 65.0, 64.0, 84.0, 152.0, 304.0, 627.0, 1248.0, 2702.0, 5712.0, 12253.0, 27290.0, 64533.0, 172098.0, 365619.0, 240026.0, 89427.0, 35821.0, 16158.0, 7377.0, 3515.0, 1630.0, 808.0, 376.0, 197.0, 119.0, 83.0, 50.0, 29.0, 25.0, 20.0, 13.0, 14.0, 5.0, 8.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8515625, -6.628173828125, -6.40478515625, -6.181396484375, -5.9580078125, -5.734619140625, -5.51123046875, -5.287841796875, -5.064453125, -4.841064453125, -4.61767578125, -4.394287109375, -4.1708984375, -3.947509765625, -3.72412109375, -3.500732421875, -3.27734375, -3.053955078125, -2.83056640625, -2.607177734375, -2.3837890625, -2.160400390625, -1.93701171875, -1.713623046875, -1.490234375, -1.266845703125, -1.04345703125, -0.820068359375, -0.5966796875, -0.373291015625, -0.14990234375, 0.073486328125, 0.296875, 0.520263671875, 0.74365234375, 0.967041015625, 1.1904296875, 1.413818359375, 1.63720703125, 1.860595703125, 2.083984375, 2.307373046875, 2.53076171875, 2.754150390625, 2.9775390625, 3.200927734375, 3.42431640625, 3.647705078125, 3.87109375, 4.094482421875, 4.31787109375, 4.541259765625, 4.7646484375, 4.988037109375, 5.21142578125, 5.434814453125, 5.658203125, 5.881591796875, 6.10498046875, 6.328369140625, 6.5517578125, 6.775146484375, 6.99853515625, 7.221923828125, 7.4453125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 4.0, 4.0, 9.0, 11.0, 9.0, 14.0, 13.0, 16.0, 11.0, 11.0, 30.0, 28.0, 24.0, 20.0, 49.0, 44.0, 67.0, 80.0, 149.0, 390.0, 1438.0, 179.0, 80.0, 56.0, 39.0, 51.0, 32.0, 27.0, 24.0, 27.0, 18.0, 15.0, 13.0, 12.0, 16.0, 12.0, 7.0, 5.0, 10.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.46875, -28.6044921875, -27.740234375, -26.8759765625, -26.01171875, -25.1474609375, -24.283203125, -23.4189453125, -22.5546875, -21.6904296875, -20.826171875, -19.9619140625, -19.09765625, -18.2333984375, -17.369140625, -16.5048828125, -15.640625, -14.7763671875, -13.912109375, -13.0478515625, -12.18359375, -11.3193359375, -10.455078125, -9.5908203125, -8.7265625, -7.8623046875, -6.998046875, -6.1337890625, -5.26953125, -4.4052734375, -3.541015625, -2.6767578125, -1.8125, -0.9482421875, -0.083984375, 0.7802734375, 1.64453125, 2.5087890625, 3.373046875, 4.2373046875, 5.1015625, 5.9658203125, 6.830078125, 7.6943359375, 8.55859375, 9.4228515625, 10.287109375, 11.1513671875, 12.015625, 12.8798828125, 13.744140625, 14.6083984375, 15.47265625, 16.3369140625, 17.201171875, 18.0654296875, 18.9296875, 19.7939453125, 20.658203125, 21.5224609375, 22.38671875, 23.2509765625, 24.115234375, 24.9794921875, 25.84375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 9.0, 8.0, 13.0, 21.0, 17.0, 29.0, 46.0, 53.0, 55.0, 109.0, 145.0, 284.0, 511.0, 1803.0, 2963986.0, 176455.0, 1026.0, 431.0, 228.0, 147.0, 95.0, 57.0, 41.0, 35.0, 31.0, 29.0, 11.0, 8.0, 6.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-100.0, -96.861328125, -93.72265625, -90.583984375, -87.4453125, -84.306640625, -81.16796875, -78.029296875, -74.890625, -71.751953125, -68.61328125, -65.474609375, -62.3359375, -59.197265625, -56.05859375, -52.919921875, -49.78125, -46.642578125, -43.50390625, -40.365234375, -37.2265625, -34.087890625, -30.94921875, -27.810546875, -24.671875, -21.533203125, -18.39453125, -15.255859375, -12.1171875, -8.978515625, -5.83984375, -2.701171875, 0.4375, 3.576171875, 6.71484375, 9.853515625, 12.9921875, 16.130859375, 19.26953125, 22.408203125, 25.546875, 28.685546875, 31.82421875, 34.962890625, 38.1015625, 41.240234375, 44.37890625, 47.517578125, 50.65625, 53.794921875, 56.93359375, 60.072265625, 63.2109375, 66.349609375, 69.48828125, 72.626953125, 75.765625, 78.904296875, 82.04296875, 85.181640625, 88.3203125, 91.458984375, 94.59765625, 97.736328125, 100.875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [11.0, 501.0, 499.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.462803840637207, -7.869811534881592, -0.27681922912597656, 7.3161725997924805, 14.909165382385254, 22.502159118652344, 30.095149993896484, 37.68814468383789, 45.28113555908203, 52.87412643432617, 60.46712112426758, 68.06011199951172, 75.65310668945312, 83.24609375, 90.8390884399414, 98.43208312988281, 106.02507019042969, 113.6180648803711, 121.21105194091797, 128.80404663085938, 136.39703369140625, 143.9900360107422, 151.58302307128906, 159.176025390625, 166.76901245117188, 174.36199951171875, 181.9550018310547, 189.54798889160156, 197.14097595214844, 204.73397827148438, 212.32696533203125, 219.91995239257812, 227.51295471191406, 235.10594177246094, 242.69894409179688, 250.29193115234375, 257.8849182128906, 265.4779052734375, 273.0709228515625, 280.6639099121094, 288.25689697265625, 295.8498840332031, 303.44287109375, 311.035888671875, 318.6288757324219, 326.22186279296875, 333.8148498535156, 341.4078369140625, 349.0008239746094, 356.59381103515625, 364.1867980957031, 371.77978515625, 379.372802734375, 386.9657897949219, 394.55877685546875, 402.1517639160156, 409.7447814941406, 417.3377685546875, 424.9307556152344, 432.52374267578125, 440.11676025390625, 447.7097473144531, 455.302734375, 462.8957214355469, 470.48870849609375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 3.0, 10.0, 8.0, 10.0, 20.0, 14.0, 15.0, 15.0, 17.0, 12.0, 21.0, 19.0, 23.0, 30.0, 24.0, 29.0, 30.0, 45.0, 41.0, 32.0, 40.0, 33.0, 27.0, 29.0, 35.0, 34.0, 26.0, 36.0, 28.0, 32.0, 23.0, 36.0, 24.0, 20.0, 22.0, 30.0, 15.0, 19.0, 13.0, 12.0, 6.0, 8.0, 7.0, 3.0, 6.0, 5.0, 3.0, 3.0, 1.0, 4.0, 4.0, 0.0, 2.0, 2.0], "bins": [-53.91154098510742, -52.26323318481445, -50.614925384521484, -48.966617584228516, -47.31830978393555, -45.67000198364258, -44.021690368652344, -42.373382568359375, -40.725074768066406, -39.07676696777344, -37.42845916748047, -35.7801513671875, -34.13184356689453, -32.48353576660156, -30.83522605895996, -29.186918258666992, -27.538612365722656, -25.890304565429688, -24.24199676513672, -22.59368896484375, -20.94538116455078, -19.297073364257812, -17.64876365661621, -16.000455856323242, -14.352148056030273, -12.703840255737305, -11.055532455444336, -9.40722370147705, -7.758915901184082, -6.110608100891113, -4.462299346923828, -2.8139915466308594, -1.1656837463378906, 0.4826242923736572, 2.130932331085205, 3.779240608215332, 5.427548408508301, 7.0758562088012695, 8.724164962768555, 10.372472763061523, 12.020780563354492, 13.669088363647461, 15.31739616394043, 16.96570587158203, 18.614013671875, 20.26232147216797, 21.910629272460938, 23.558937072753906, 25.207244873046875, 26.855552673339844, 28.503860473632812, 30.15216827392578, 31.80047607421875, 33.44878387451172, 35.09709167480469, 36.745399475097656, 38.393707275390625, 40.042015075683594, 41.69032287597656, 43.33863067626953, 44.9869384765625, 46.63524627685547, 48.28355407714844, 49.931861877441406, 51.58017349243164]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 6.0, 2.0, 15.0, 15.0, 11.0, 14.0, 14.0, 30.0, 28.0, 18.0, 36.0, 27.0, 45.0, 51.0, 52.0, 43.0, 52.0, 47.0, 53.0, 50.0, 35.0, 40.0, 38.0, 23.0, 31.0, 32.0, 31.0, 25.0, 22.0, 15.0, 21.0, 18.0, 11.0, 11.0, 10.0, 3.0, 8.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.26953125, -7.00006103515625, -6.7305908203125, -6.46112060546875, -6.191650390625, -5.92218017578125, -5.6527099609375, -5.38323974609375, -5.11376953125, -4.84429931640625, -4.5748291015625, -4.30535888671875, -4.035888671875, -3.76641845703125, -3.4969482421875, -3.22747802734375, -2.9580078125, -2.68853759765625, -2.4190673828125, -2.14959716796875, -1.880126953125, -1.61065673828125, -1.3411865234375, -1.07171630859375, -0.80224609375, -0.53277587890625, -0.2633056640625, 0.00616455078125, 0.275634765625, 0.54510498046875, 0.8145751953125, 1.08404541015625, 1.353515625, 1.62298583984375, 1.8924560546875, 2.16192626953125, 2.431396484375, 2.70086669921875, 2.9703369140625, 3.23980712890625, 3.50927734375, 3.77874755859375, 4.0482177734375, 4.31768798828125, 4.587158203125, 4.85662841796875, 5.1260986328125, 5.39556884765625, 5.6650390625, 5.93450927734375, 6.2039794921875, 6.47344970703125, 6.742919921875, 7.01239013671875, 7.2818603515625, 7.55133056640625, 7.82080078125, 8.09027099609375, 8.3597412109375, 8.62921142578125, 8.898681640625, 9.16815185546875, 9.4376220703125, 9.70709228515625, 9.9765625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 9.0, 16.0, 13.0, 19.0, 19.0, 18.0, 35.0, 47.0, 60.0, 75.0, 116.0, 181.0, 375.0, 872.0, 4493.0, 184921.0, 3232023.0, 756109.0, 12380.0, 1348.0, 424.0, 207.0, 132.0, 83.0, 67.0, 48.0, 42.0, 37.0, 23.0, 15.0, 15.0, 8.0, 13.0, 9.0, 7.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.15625, -23.313720703125, -22.47119140625, -21.628662109375, -20.7861328125, -19.943603515625, -19.10107421875, -18.258544921875, -17.416015625, -16.573486328125, -15.73095703125, -14.888427734375, -14.0458984375, -13.203369140625, -12.36083984375, -11.518310546875, -10.67578125, -9.833251953125, -8.99072265625, -8.148193359375, -7.3056640625, -6.463134765625, -5.62060546875, -4.778076171875, -3.935546875, -3.093017578125, -2.25048828125, -1.407958984375, -0.5654296875, 0.277099609375, 1.11962890625, 1.962158203125, 2.8046875, 3.647216796875, 4.48974609375, 5.332275390625, 6.1748046875, 7.017333984375, 7.85986328125, 8.702392578125, 9.544921875, 10.387451171875, 11.22998046875, 12.072509765625, 12.9150390625, 13.757568359375, 14.60009765625, 15.442626953125, 16.28515625, 17.127685546875, 17.97021484375, 18.812744140625, 19.6552734375, 20.497802734375, 21.34033203125, 22.182861328125, 23.025390625, 23.867919921875, 24.71044921875, 25.552978515625, 26.3955078125, 27.238037109375, 28.08056640625, 28.923095703125, 29.765625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 9.0, 6.0, 9.0, 16.0, 23.0, 34.0, 54.0, 60.0, 80.0, 98.0, 183.0, 212.0, 345.0, 408.0, 446.0, 455.0, 403.0, 337.0, 246.0, 184.0, 118.0, 94.0, 73.0, 55.0, 42.0, 23.0, 21.0, 14.0, 7.0, 4.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.203125, -14.69775390625, -14.1923828125, -13.68701171875, -13.181640625, -12.67626953125, -12.1708984375, -11.66552734375, -11.16015625, -10.65478515625, -10.1494140625, -9.64404296875, -9.138671875, -8.63330078125, -8.1279296875, -7.62255859375, -7.1171875, -6.61181640625, -6.1064453125, -5.60107421875, -5.095703125, -4.59033203125, -4.0849609375, -3.57958984375, -3.07421875, -2.56884765625, -2.0634765625, -1.55810546875, -1.052734375, -0.54736328125, -0.0419921875, 0.46337890625, 0.96875, 1.47412109375, 1.9794921875, 2.48486328125, 2.990234375, 3.49560546875, 4.0009765625, 4.50634765625, 5.01171875, 5.51708984375, 6.0224609375, 6.52783203125, 7.033203125, 7.53857421875, 8.0439453125, 8.54931640625, 9.0546875, 9.56005859375, 10.0654296875, 10.57080078125, 11.076171875, 11.58154296875, 12.0869140625, 12.59228515625, 13.09765625, 13.60302734375, 14.1083984375, 14.61376953125, 15.119140625, 15.62451171875, 16.1298828125, 16.63525390625, 17.140625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 8.0, 7.0, 19.0, 23.0, 29.0, 58.0, 67.0, 95.0, 127.0, 175.0, 259.0, 383.0, 625.0, 5457.0, 3675610.0, 508120.0, 1579.0, 539.0, 319.0, 247.0, 152.0, 104.0, 86.0, 57.0, 45.0, 25.0, 17.0, 12.0, 9.0, 9.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.5, -74.23828125, -71.9765625, -69.71484375, -67.453125, -65.19140625, -62.9296875, -60.66796875, -58.40625, -56.14453125, -53.8828125, -51.62109375, -49.359375, -47.09765625, -44.8359375, -42.57421875, -40.3125, -38.05078125, -35.7890625, -33.52734375, -31.265625, -29.00390625, -26.7421875, -24.48046875, -22.21875, -19.95703125, -17.6953125, -15.43359375, -13.171875, -10.91015625, -8.6484375, -6.38671875, -4.125, -1.86328125, 0.3984375, 2.66015625, 4.921875, 7.18359375, 9.4453125, 11.70703125, 13.96875, 16.23046875, 18.4921875, 20.75390625, 23.015625, 25.27734375, 27.5390625, 29.80078125, 32.0625, 34.32421875, 36.5859375, 38.84765625, 41.109375, 43.37109375, 45.6328125, 47.89453125, 50.15625, 52.41796875, 54.6796875, 56.94140625, 59.203125, 61.46484375, 63.7265625, 65.98828125, 68.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 16.0, 228.0, 582.0, 180.0, 10.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.25180053710938, -59.91868209838867, -50.58556365966797, -41.252445220947266, -31.919326782226562, -22.58620834350586, -13.253089904785156, -3.9199676513671875, 5.41314697265625, 14.746265411376953, 24.079383850097656, 33.41250228881836, 42.74562072753906, 52.078739166259766, 61.41185760498047, 70.74497985839844, 80.07809448242188, 89.41120910644531, 98.74433135986328, 108.07745361328125, 117.41056823730469, 126.74368286132812, 136.07681274414062, 145.40992736816406, 154.7430419921875, 164.07615661621094, 173.40927124023438, 182.74240112304688, 192.0755157470703, 201.40863037109375, 210.74176025390625, 220.0748748779297, 229.40802001953125, 238.7411346435547, 248.07424926757812, 257.4073791503906, 266.740478515625, 276.0736083984375, 285.40673828125, 294.7398681640625, 304.0729675292969, 313.4060974121094, 322.73919677734375, 332.07232666015625, 341.40545654296875, 350.7385559082031, 360.0716857910156, 369.40478515625, 378.7379150390625, 388.071044921875, 397.4041442871094, 406.7372741699219, 416.07037353515625, 425.40350341796875, 434.73663330078125, 444.06976318359375, 453.4028625488281, 462.7359924316406, 472.069091796875, 481.4022216796875, 490.7353515625, 500.0684509277344, 509.4015808105469, 518.7346801757812, 528.0678100585938]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 4.0, 2.0, 3.0, 8.0, 4.0, 5.0, 11.0, 9.0, 19.0, 15.0, 24.0, 25.0, 27.0, 31.0, 27.0, 42.0, 31.0, 43.0, 33.0, 36.0, 43.0, 35.0, 52.0, 48.0, 37.0, 34.0, 35.0, 44.0, 40.0, 40.0, 33.0, 22.0, 21.0, 22.0, 14.0, 14.0, 10.0, 12.0, 14.0, 6.0, 7.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.38121795654297, -51.78391647338867, -50.18661117553711, -48.58930969238281, -46.99200439453125, -45.39470291137695, -43.797401428222656, -42.200096130371094, -40.6027946472168, -39.0054931640625, -37.40818786621094, -35.81088638305664, -34.213584899902344, -32.61627960205078, -31.018978118896484, -29.421674728393555, -27.824371337890625, -26.227067947387695, -24.629764556884766, -23.03246307373047, -21.43515968322754, -19.83785629272461, -18.240554809570312, -16.643251419067383, -15.045948028564453, -13.448644638061523, -11.85134220123291, -10.254039764404297, -8.656736373901367, -7.059433460235596, -5.462130546569824, -3.864828109741211, -2.2675209045410156, -0.6702179908752441, 0.9270849227905273, 2.524387836456299, 4.12169075012207, 5.718993663787842, 7.316296577453613, 8.913599014282227, 10.510902404785156, 12.108205795288086, 13.7055082321167, 15.302810668945312, 16.900114059448242, 18.497417449951172, 20.09471893310547, 21.6920223236084, 23.289325714111328, 24.886629104614258, 26.483932495117188, 28.081233978271484, 29.678537368774414, 31.275840759277344, 32.87314224243164, 34.47044372558594, 36.0677490234375, 37.6650505065918, 39.26235580444336, 40.859657287597656, 42.45696258544922, 44.054264068603516, 45.65156555175781, 47.248870849609375, 48.84617233276367]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 8.0, 11.0, 28.0, 19.0, 20.0, 20.0, 26.0, 25.0, 24.0, 27.0, 47.0, 45.0, 38.0, 41.0, 53.0, 51.0, 45.0, 50.0, 50.0, 40.0, 38.0, 32.0, 39.0, 26.0, 24.0, 22.0, 24.0, 19.0, 19.0, 15.0, 12.0, 12.0, 11.0, 9.0, 9.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.91668701171875, -7.6693115234375, -7.42193603515625, -7.174560546875, -6.92718505859375, -6.6798095703125, -6.43243408203125, -6.18505859375, -5.93768310546875, -5.6903076171875, -5.44293212890625, -5.195556640625, -4.94818115234375, -4.7008056640625, -4.45343017578125, -4.2060546875, -3.95867919921875, -3.7113037109375, -3.46392822265625, -3.216552734375, -2.96917724609375, -2.7218017578125, -2.47442626953125, -2.22705078125, -1.97967529296875, -1.7322998046875, -1.48492431640625, -1.237548828125, -0.99017333984375, -0.7427978515625, -0.49542236328125, -0.248046875, -0.00067138671875, 0.2467041015625, 0.49407958984375, 0.741455078125, 0.98883056640625, 1.2362060546875, 1.48358154296875, 1.73095703125, 1.97833251953125, 2.2257080078125, 2.47308349609375, 2.720458984375, 2.96783447265625, 3.2152099609375, 3.46258544921875, 3.7099609375, 3.95733642578125, 4.2047119140625, 4.45208740234375, 4.699462890625, 4.94683837890625, 5.1942138671875, 5.44158935546875, 5.68896484375, 5.93634033203125, 6.1837158203125, 6.43109130859375, 6.678466796875, 6.92584228515625, 7.1732177734375, 7.42059326171875, 7.66796875]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 14.0, 19.0, 36.0, 45.0, 80.0, 117.0, 155.0, 228.0, 394.0, 574.0, 894.0, 1485.0, 2153.0, 3373.0, 5291.0, 8311.0, 13126.0, 21404.0, 35959.0, 63905.0, 129168.0, 284219.0, 234248.0, 105649.0, 55294.0, 31489.0, 18654.0, 11749.0, 7357.0, 4755.0, 3036.0, 1850.0, 1158.0, 793.0, 510.0, 339.0, 234.0, 137.0, 108.0, 73.0, 47.0, 39.0, 25.0, 14.0, 9.0, 11.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.3828125, -1.3407440185546875, -1.298675537109375, -1.2566070556640625, -1.21453857421875, -1.1724700927734375, -1.130401611328125, -1.0883331298828125, -1.0462646484375, -1.0041961669921875, -0.962127685546875, -0.9200592041015625, -0.87799072265625, -0.8359222412109375, -0.793853759765625, -0.7517852783203125, -0.709716796875, -0.6676483154296875, -0.625579833984375, -0.5835113525390625, -0.54144287109375, -0.4993743896484375, -0.457305908203125, -0.4152374267578125, -0.3731689453125, -0.3311004638671875, -0.289031982421875, -0.2469635009765625, -0.20489501953125, -0.1628265380859375, -0.120758056640625, -0.0786895751953125, -0.03662109375, 0.0054473876953125, 0.047515869140625, 0.0895843505859375, 0.13165283203125, 0.1737213134765625, 0.215789794921875, 0.2578582763671875, 0.2999267578125, 0.3419952392578125, 0.384063720703125, 0.4261322021484375, 0.46820068359375, 0.5102691650390625, 0.552337646484375, 0.5944061279296875, 0.636474609375, 0.6785430908203125, 0.720611572265625, 0.7626800537109375, 0.80474853515625, 0.8468170166015625, 0.888885498046875, 0.9309539794921875, 0.9730224609375, 1.0150909423828125, 1.057159423828125, 1.0992279052734375, 1.14129638671875, 1.1833648681640625, 1.225433349609375, 1.2675018310546875, 1.3095703125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 8.0, 12.0, 12.0, 17.0, 20.0, 17.0, 26.0, 26.0, 28.0, 42.0, 39.0, 52.0, 41.0, 49.0, 57.0, 1079.0, 47.0, 56.0, 55.0, 52.0, 42.0, 33.0, 42.0, 33.0, 31.0, 20.0, 18.0, 20.0, 13.0, 10.0, 7.0, 5.0, 8.0, 4.0, 0.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55859375, -5.37628173828125, -5.1939697265625, -5.01165771484375, -4.829345703125, -4.64703369140625, -4.4647216796875, -4.28240966796875, -4.10009765625, -3.91778564453125, -3.7354736328125, -3.55316162109375, -3.370849609375, -3.18853759765625, -3.0062255859375, -2.82391357421875, -2.6416015625, -2.45928955078125, -2.2769775390625, -2.09466552734375, -1.912353515625, -1.73004150390625, -1.5477294921875, -1.36541748046875, -1.18310546875, -1.00079345703125, -0.8184814453125, -0.63616943359375, -0.453857421875, -0.27154541015625, -0.0892333984375, 0.09307861328125, 0.275390625, 0.45770263671875, 0.6400146484375, 0.82232666015625, 1.004638671875, 1.18695068359375, 1.3692626953125, 1.55157470703125, 1.73388671875, 1.91619873046875, 2.0985107421875, 2.28082275390625, 2.463134765625, 2.64544677734375, 2.8277587890625, 3.01007080078125, 3.1923828125, 3.37469482421875, 3.5570068359375, 3.73931884765625, 3.921630859375, 4.10394287109375, 4.2862548828125, 4.46856689453125, 4.65087890625, 4.83319091796875, 5.0155029296875, 5.19781494140625, 5.380126953125, 5.56243896484375, 5.7447509765625, 5.92706298828125, 6.109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 12.0, 4.0, 16.0, 22.0, 28.0, 35.0, 49.0, 64.0, 110.0, 173.0, 250.0, 376.0, 593.0, 969.0, 1508.0, 2379.0, 4037.0, 6835.0, 11490.0, 20514.0, 36601.0, 69756.0, 148392.0, 1373697.0, 212732.0, 94673.0, 48279.0, 26180.0, 15050.0, 8637.0, 5152.0, 3080.0, 2078.0, 1121.0, 736.0, 492.0, 330.0, 241.0, 139.0, 117.0, 58.0, 55.0, 34.0, 10.0, 9.0, 7.0, 5.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.548828125, -1.5014801025390625, -1.454132080078125, -1.4067840576171875, -1.35943603515625, -1.3120880126953125, -1.264739990234375, -1.2173919677734375, -1.1700439453125, -1.1226959228515625, -1.075347900390625, -1.0279998779296875, -0.98065185546875, -0.9333038330078125, -0.885955810546875, -0.8386077880859375, -0.791259765625, -0.7439117431640625, -0.696563720703125, -0.6492156982421875, -0.60186767578125, -0.5545196533203125, -0.507171630859375, -0.4598236083984375, -0.4124755859375, -0.3651275634765625, -0.317779541015625, -0.2704315185546875, -0.22308349609375, -0.1757354736328125, -0.128387451171875, -0.0810394287109375, -0.03369140625, 0.0136566162109375, 0.061004638671875, 0.1083526611328125, 0.15570068359375, 0.2030487060546875, 0.250396728515625, 0.2977447509765625, 0.3450927734375, 0.3924407958984375, 0.439788818359375, 0.4871368408203125, 0.53448486328125, 0.5818328857421875, 0.629180908203125, 0.6765289306640625, 0.723876953125, 0.7712249755859375, 0.818572998046875, 0.8659210205078125, 0.91326904296875, 0.9606170654296875, 1.007965087890625, 1.0553131103515625, 1.1026611328125, 1.1500091552734375, 1.197357177734375, 1.2447052001953125, 1.29205322265625, 1.3394012451171875, 1.386749267578125, 1.4340972900390625, 1.4814453125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 9.0, 7.0, 5.0, 7.0, 9.0, 19.0, 25.0, 24.0, 29.0, 26.0, 45.0, 52.0, 61.0, 69.0, 88.0, 63.0, 69.0, 56.0, 56.0, 54.0, 37.0, 33.0, 28.0, 22.0, 19.0, 19.0, 11.0, 7.0, 5.0, 10.0, 6.0, 8.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009107589721679688, -0.0008774846792221069, -0.0008442103862762451, -0.0008109360933303833, -0.0007776618003845215, -0.0007443875074386597, -0.0007111132144927979, -0.000677838921546936, -0.0006445646286010742, -0.0006112903356552124, -0.0005780160427093506, -0.0005447417497634888, -0.000511467456817627, -0.00047819316387176514, -0.0004449188709259033, -0.0004116445779800415, -0.0003783702850341797, -0.00034509599208831787, -0.00031182169914245605, -0.00027854740619659424, -0.0002452731132507324, -0.0002119988203048706, -0.0001787245273590088, -0.00014545023441314697, -0.00011217594146728516, -7.890164852142334e-05, -4.5627355575561523e-05, -1.2353062629699707e-05, 2.092123031616211e-05, 5.4195523262023926e-05, 8.746981620788574e-05, 0.00012074410915374756, 0.00015401840209960938, 0.0001872926950454712, 0.000220566987991333, 0.0002538412809371948, 0.00028711557388305664, 0.00032038986682891846, 0.0003536641597747803, 0.0003869384527206421, 0.0004202127456665039, 0.0004534870386123657, 0.00048676133155822754, 0.0005200356245040894, 0.0005533099174499512, 0.000586584210395813, 0.0006198585033416748, 0.0006531327962875366, 0.0006864070892333984, 0.0007196813821792603, 0.0007529556751251221, 0.0007862299680709839, 0.0008195042610168457, 0.0008527785539627075, 0.0008860528469085693, 0.0009193271398544312, 0.000952601432800293, 0.0009858757257461548, 0.0010191500186920166, 0.0010524243116378784, 0.0010856986045837402, 0.001118972897529602, 0.0011522471904754639, 0.0011855214834213257, 0.0012187957763671875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 10.0, 13.0, 8.0, 9.0, 13.0, 16.0, 23.0, 28.0, 24.0, 55.0, 61.0, 94.0, 150.0, 217.0, 499.0, 4221.0, 1005664.0, 35885.0, 761.0, 259.0, 152.0, 120.0, 59.0, 50.0, 35.0, 30.0, 28.0, 7.0, 15.0, 11.0, 6.0, 6.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.02899169921875, -0.028241872787475586, -0.027492046356201172, -0.026742219924926758, -0.025992393493652344, -0.02524256706237793, -0.024492740631103516, -0.0237429141998291, -0.022993087768554688, -0.022243261337280273, -0.02149343490600586, -0.020743608474731445, -0.01999378204345703, -0.019243955612182617, -0.018494129180908203, -0.01774430274963379, -0.016994476318359375, -0.01624464988708496, -0.015494823455810547, -0.014744997024536133, -0.013995170593261719, -0.013245344161987305, -0.01249551773071289, -0.011745691299438477, -0.010995864868164062, -0.010246038436889648, -0.009496212005615234, -0.00874638557434082, -0.007996559143066406, -0.007246732711791992, -0.006496906280517578, -0.005747079849243164, -0.00499725341796875, -0.004247426986694336, -0.003497600555419922, -0.002747774124145508, -0.0019979476928710938, -0.0012481212615966797, -0.0004982948303222656, 0.00025153160095214844, 0.0010013580322265625, 0.0017511844635009766, 0.0025010108947753906, 0.0032508373260498047, 0.004000663757324219, 0.004750490188598633, 0.005500316619873047, 0.006250143051147461, 0.006999969482421875, 0.007749795913696289, 0.008499622344970703, 0.009249448776245117, 0.009999275207519531, 0.010749101638793945, 0.01149892807006836, 0.012248754501342773, 0.012998580932617188, 0.013748407363891602, 0.014498233795166016, 0.01524806022644043, 0.015997886657714844, 0.016747713088989258, 0.017497539520263672, 0.018247365951538086, 0.0189971923828125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 75.0, 382.0, 413.0, 124.0, 15.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.005713447462767363, -0.005609740503132343, -0.005506033543497324, -0.005402327049523592, -0.005298620089888573, -0.005194913130253553, -0.005091206170618534, -0.004987499210983515, -0.004883792717009783, -0.0047800857573747635, -0.004676378797739744, -0.004572672303766012, -0.004468965344130993, -0.004365258384495974, -0.004261551424860954, -0.004157844465225935, -0.004054137505590916, -0.003950430545955896, -0.0038467238191515207, -0.0037430168595165014, -0.0036393101327121258, -0.0035356031730771065, -0.003431896213442087, -0.0033281894866377115, -0.003224482759833336, -0.0031207758001983166, -0.003017069073393941, -0.0029133621137589216, -0.002809655386954546, -0.0027059484273195267, -0.0026022414676845074, -0.0024985347408801317, -0.002394828014075756, -0.0022911210544407368, -0.002187414327636361, -0.002083707368001342, -0.001980000641196966, -0.0018762936815619469, -0.0017725868383422494, -0.001668879995122552, -0.0015651730354875326, -0.0014614661922678351, -0.0013577593490481377, -0.0012540523894131184, -0.0011503455461934209, -0.0010466387029737234, -0.0009429318597540259, -0.0008392249583266675, -0.0007355181151069701, -0.0006318112718872726, -0.0005281043704599142, -0.00042439752724021673, -0.0003206906549166888, -0.00021698378259316087, -0.00011327693937346339, -9.570037946105003e-06, 9.413680527359247e-05, 0.0001978436775971204, 0.00030155054992064834, 0.0004052573931403458, 0.0005089642945677042, 0.0006126711377874017, 0.0007163779810070992, 0.0008200848824344575, 0.000923791725654155]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 2.0, 8.0, 9.0, 20.0, 14.0, 20.0, 19.0, 26.0, 20.0, 36.0, 34.0, 38.0, 29.0, 50.0, 34.0, 49.0, 42.0, 54.0, 38.0, 53.0, 48.0, 54.0, 52.0, 46.0, 31.0, 36.0, 19.0, 26.0, 20.0, 22.0, 12.0, 14.0, 7.0, 5.0, 4.0, 2.0, 2.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005475878715515137, -0.0005288589745759964, -0.0005101300776004791, -0.0004914011806249619, -0.0004726722836494446, -0.0004539433866739273, -0.00043521448969841003, -0.00041648559272289276, -0.0003977566957473755, -0.0003790277987718582, -0.00036029890179634094, -0.00034157000482082367, -0.0003228411078453064, -0.0003041122108697891, -0.00028538331389427185, -0.0002666544169187546, -0.0002479255199432373, -0.00022919662296772003, -0.00021046772599220276, -0.00019173882901668549, -0.0001730099320411682, -0.00015428103506565094, -0.00013555213809013367, -0.0001168232411146164, -9.809434413909912e-05, -7.936544716358185e-05, -6.0636550188064575e-05, -4.19076532125473e-05, -2.317875623703003e-05, -4.449859261512756e-06, 1.4279037714004517e-05, 3.300793468952179e-05, 5.173683166503906e-05, 7.046572864055634e-05, 8.919462561607361e-05, 0.00010792352259159088, 0.00012665241956710815, 0.00014538131654262543, 0.0001641102135181427, 0.00018283911049365997, 0.00020156800746917725, 0.00022029690444469452, 0.0002390258014202118, 0.00025775469839572906, 0.00027648359537124634, 0.0002952124923467636, 0.0003139413893222809, 0.00033267028629779816, 0.00035139918327331543, 0.0003701280802488327, 0.00038885697722435, 0.00040758587419986725, 0.0004263147711753845, 0.0004450436681509018, 0.00046377256512641907, 0.00048250146210193634, 0.0005012303590774536, 0.0005199592560529709, 0.0005386881530284882, 0.0005574170500040054, 0.0005761459469795227, 0.00059487484395504, 0.0006136037409305573, 0.0006323326379060745, 0.0006510615348815918]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 8.0, 11.0, 28.0, 19.0, 20.0, 20.0, 26.0, 25.0, 24.0, 27.0, 47.0, 45.0, 38.0, 41.0, 53.0, 51.0, 45.0, 50.0, 50.0, 40.0, 38.0, 32.0, 39.0, 26.0, 24.0, 22.0, 24.0, 19.0, 19.0, 15.0, 12.0, 12.0, 11.0, 9.0, 9.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.1640625, -7.91668701171875, -7.6693115234375, -7.42193603515625, -7.174560546875, -6.92718505859375, -6.6798095703125, -6.43243408203125, -6.18505859375, -5.93768310546875, -5.6903076171875, -5.44293212890625, -5.195556640625, -4.94818115234375, -4.7008056640625, -4.45343017578125, -4.2060546875, -3.95867919921875, -3.7113037109375, -3.46392822265625, -3.216552734375, -2.96917724609375, -2.7218017578125, -2.47442626953125, -2.22705078125, -1.97967529296875, -1.7322998046875, -1.48492431640625, -1.237548828125, -0.99017333984375, -0.7427978515625, -0.49542236328125, -0.248046875, -0.00067138671875, 0.2467041015625, 0.49407958984375, 0.741455078125, 0.98883056640625, 1.2362060546875, 1.48358154296875, 1.73095703125, 1.97833251953125, 2.2257080078125, 2.47308349609375, 2.720458984375, 2.96783447265625, 3.2152099609375, 3.46258544921875, 3.7099609375, 3.95733642578125, 4.2047119140625, 4.45208740234375, 4.699462890625, 4.94683837890625, 5.1942138671875, 5.44158935546875, 5.68896484375, 5.93634033203125, 6.1837158203125, 6.43109130859375, 6.678466796875, 6.92584228515625, 7.1732177734375, 7.42059326171875, 7.66796875]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 6.0, 9.0, 16.0, 21.0, 29.0, 29.0, 50.0, 60.0, 81.0, 124.0, 182.0, 252.0, 514.0, 1166.0, 2692.0, 7204.0, 18658.0, 49658.0, 127337.0, 307680.0, 317178.0, 131817.0, 51451.0, 19365.0, 7593.0, 2815.0, 1136.0, 512.0, 285.0, 163.0, 87.0, 95.0, 68.0, 48.0, 40.0, 29.0, 24.0, 17.0, 17.0, 12.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1640625, -7.91680908203125, -7.6695556640625, -7.42230224609375, -7.175048828125, -6.92779541015625, -6.6805419921875, -6.43328857421875, -6.18603515625, -5.93878173828125, -5.6915283203125, -5.44427490234375, -5.197021484375, -4.94976806640625, -4.7025146484375, -4.45526123046875, -4.2080078125, -3.96075439453125, -3.7135009765625, -3.46624755859375, -3.218994140625, -2.97174072265625, -2.7244873046875, -2.47723388671875, -2.22998046875, -1.98272705078125, -1.7354736328125, -1.48822021484375, -1.240966796875, -0.99371337890625, -0.7464599609375, -0.49920654296875, -0.251953125, -0.00469970703125, 0.2425537109375, 0.48980712890625, 0.737060546875, 0.98431396484375, 1.2315673828125, 1.47882080078125, 1.72607421875, 1.97332763671875, 2.2205810546875, 2.46783447265625, 2.715087890625, 2.96234130859375, 3.2095947265625, 3.45684814453125, 3.7041015625, 3.95135498046875, 4.1986083984375, 4.44586181640625, 4.693115234375, 4.94036865234375, 5.1876220703125, 5.43487548828125, 5.68212890625, 5.92938232421875, 6.1766357421875, 6.42388916015625, 6.671142578125, 6.91839599609375, 7.1656494140625, 7.41290283203125, 7.66015625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 8.0, 9.0, 11.0, 11.0, 8.0, 16.0, 19.0, 15.0, 19.0, 26.0, 25.0, 27.0, 32.0, 33.0, 43.0, 41.0, 51.0, 89.0, 190.0, 1519.0, 306.0, 118.0, 55.0, 48.0, 37.0, 37.0, 32.0, 35.0, 33.0, 26.0, 20.0, 23.0, 15.0, 11.0, 19.0, 9.0, 4.0, 10.0, 2.0, 4.0, 0.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-26.5, -25.73583984375, -24.9716796875, -24.20751953125, -23.443359375, -22.67919921875, -21.9150390625, -21.15087890625, -20.38671875, -19.62255859375, -18.8583984375, -18.09423828125, -17.330078125, -16.56591796875, -15.8017578125, -15.03759765625, -14.2734375, -13.50927734375, -12.7451171875, -11.98095703125, -11.216796875, -10.45263671875, -9.6884765625, -8.92431640625, -8.16015625, -7.39599609375, -6.6318359375, -5.86767578125, -5.103515625, -4.33935546875, -3.5751953125, -2.81103515625, -2.046875, -1.28271484375, -0.5185546875, 0.24560546875, 1.009765625, 1.77392578125, 2.5380859375, 3.30224609375, 4.06640625, 4.83056640625, 5.5947265625, 6.35888671875, 7.123046875, 7.88720703125, 8.6513671875, 9.41552734375, 10.1796875, 10.94384765625, 11.7080078125, 12.47216796875, 13.236328125, 14.00048828125, 14.7646484375, 15.52880859375, 16.29296875, 17.05712890625, 17.8212890625, 18.58544921875, 19.349609375, 20.11376953125, 20.8779296875, 21.64208984375, 22.40625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 7.0, 1.0, 5.0, 4.0, 7.0, 6.0, 10.0, 11.0, 15.0, 18.0, 24.0, 33.0, 50.0, 75.0, 105.0, 170.0, 344.0, 819.0, 4888.0, 3126805.0, 10299.0, 1036.0, 374.0, 198.0, 125.0, 74.0, 55.0, 33.0, 31.0, 24.0, 14.0, 13.0, 7.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-136.75, -133.01171875, -129.2734375, -125.53515625, -121.796875, -118.05859375, -114.3203125, -110.58203125, -106.84375, -103.10546875, -99.3671875, -95.62890625, -91.890625, -88.15234375, -84.4140625, -80.67578125, -76.9375, -73.19921875, -69.4609375, -65.72265625, -61.984375, -58.24609375, -54.5078125, -50.76953125, -47.03125, -43.29296875, -39.5546875, -35.81640625, -32.078125, -28.33984375, -24.6015625, -20.86328125, -17.125, -13.38671875, -9.6484375, -5.91015625, -2.171875, 1.56640625, 5.3046875, 9.04296875, 12.78125, 16.51953125, 20.2578125, 23.99609375, 27.734375, 31.47265625, 35.2109375, 38.94921875, 42.6875, 46.42578125, 50.1640625, 53.90234375, 57.640625, 61.37890625, 65.1171875, 68.85546875, 72.59375, 76.33203125, 80.0703125, 83.80859375, 87.546875, 91.28515625, 95.0234375, 98.76171875, 102.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 64.0, 373.0, 462.0, 102.0, 8.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-237.55494689941406, -233.31671142578125, -229.0784912109375, -224.8402557373047, -220.60203552246094, -216.36380004882812, -212.12557983398438, -207.88734436035156, -203.6491241455078, -199.410888671875, -195.17266845703125, -190.93443298339844, -186.6962127685547, -182.45797729492188, -178.21975708007812, -173.9815216064453, -169.7432861328125, -165.5050506591797, -161.26683044433594, -157.02859497070312, -152.79037475585938, -148.55213928222656, -144.3139190673828, -140.07568359375, -135.83746337890625, -131.59922790527344, -127.36100769042969, -123.1227798461914, -118.88455200195312, -114.64632415771484, -110.40809631347656, -106.16986083984375, -101.93163299560547, -97.69340515136719, -93.4551773071289, -89.21694946289062, -84.97872161865234, -80.74049377441406, -76.50225830078125, -72.2640380859375, -68.02580261230469, -63.787574768066406, -59.549346923828125, -55.311119079589844, -51.07289123535156, -46.83466339111328, -42.596431732177734, -38.35820388793945, -34.11997985839844, -29.881752014160156, -25.643524169921875, -21.40529441833496, -17.16706657409668, -12.928838729858398, -8.690608978271484, -4.452381134033203, -0.21415328979492188, 4.024075031280518, 8.262303352355957, 12.500532150268555, 16.738759994506836, 20.976987838745117, 25.21521759033203, 29.453445434570312, 33.691673278808594]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 10.0, 13.0, 10.0, 23.0, 13.0, 13.0, 16.0, 24.0, 31.0, 20.0, 37.0, 33.0, 21.0, 27.0, 32.0, 37.0, 39.0, 46.0, 53.0, 41.0, 54.0, 41.0, 35.0, 26.0, 42.0, 34.0, 29.0, 28.0, 21.0, 22.0, 17.0, 13.0, 14.0, 17.0, 14.0, 10.0, 12.0, 8.0, 5.0, 7.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.984249114990234, -49.09490203857422, -47.2055549621582, -45.31620788574219, -43.426856994628906, -41.537513732910156, -39.648162841796875, -37.75881576538086, -35.869468688964844, -33.98012161254883, -32.09077453613281, -30.201425552368164, -28.31207847595215, -26.422731399536133, -24.533382415771484, -22.64403533935547, -20.754688262939453, -18.865341186523438, -16.975994110107422, -15.086645126342773, -13.197298049926758, -11.307950973510742, -9.41860294342041, -7.529254913330078, -5.6399078369140625, -3.7505602836608887, -1.8612127304077148, 0.028134822845458984, 1.9174823760986328, 3.8068294525146484, 5.6961774826049805, 7.5855255126953125, 9.474868774414062, 11.364215850830078, 13.25356388092041, 15.142911911010742, 17.032258987426758, 18.921606063842773, 20.810955047607422, 22.700302124023438, 24.589649200439453, 26.47899627685547, 28.368343353271484, 30.257692337036133, 32.14704132080078, 34.03638458251953, 35.92573547363281, 37.81508255004883, 39.704429626464844, 41.59377670288086, 43.483123779296875, 45.37247085571289, 47.261817932128906, 49.15116882324219, 51.0405158996582, 52.92986297607422, 54.819210052490234, 56.70855712890625, 58.597904205322266, 60.48725128173828, 62.37660217285156, 64.26594543457031, 66.1552963256836, 68.04464721679688, 69.93399047851562]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 6.0, 9.0, 9.0, 10.0, 23.0, 14.0, 18.0, 22.0, 24.0, 31.0, 46.0, 34.0, 31.0, 33.0, 31.0, 35.0, 60.0, 58.0, 40.0, 53.0, 52.0, 43.0, 29.0, 36.0, 26.0, 31.0, 33.0, 23.0, 25.0, 19.0, 15.0, 11.0, 18.0, 12.0, 11.0, 9.0, 8.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.08837890625, -7.8095703125, -7.53076171875, -7.251953125, -6.97314453125, -6.6943359375, -6.41552734375, -6.13671875, -5.85791015625, -5.5791015625, -5.30029296875, -5.021484375, -4.74267578125, -4.4638671875, -4.18505859375, -3.90625, -3.62744140625, -3.3486328125, -3.06982421875, -2.791015625, -2.51220703125, -2.2333984375, -1.95458984375, -1.67578125, -1.39697265625, -1.1181640625, -0.83935546875, -0.560546875, -0.28173828125, -0.0029296875, 0.27587890625, 0.5546875, 0.83349609375, 1.1123046875, 1.39111328125, 1.669921875, 1.94873046875, 2.2275390625, 2.50634765625, 2.78515625, 3.06396484375, 3.3427734375, 3.62158203125, 3.900390625, 4.17919921875, 4.4580078125, 4.73681640625, 5.015625, 5.29443359375, 5.5732421875, 5.85205078125, 6.130859375, 6.40966796875, 6.6884765625, 6.96728515625, 7.24609375, 7.52490234375, 7.8037109375, 8.08251953125, 8.361328125, 8.64013671875, 8.9189453125, 9.19775390625, 9.4765625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 5.0, 4.0, 7.0, 9.0, 8.0, 19.0, 14.0, 27.0, 28.0, 39.0, 49.0, 59.0, 76.0, 99.0, 120.0, 178.0, 347.0, 1167.0, 17175.0, 1321643.0, 2781943.0, 67871.0, 2170.0, 415.0, 207.0, 135.0, 100.0, 78.0, 52.0, 44.0, 44.0, 37.0, 28.0, 21.0, 15.0, 20.0, 11.0, 9.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.28125, -28.37060546875, -27.4599609375, -26.54931640625, -25.638671875, -24.72802734375, -23.8173828125, -22.90673828125, -21.99609375, -21.08544921875, -20.1748046875, -19.26416015625, -18.353515625, -17.44287109375, -16.5322265625, -15.62158203125, -14.7109375, -13.80029296875, -12.8896484375, -11.97900390625, -11.068359375, -10.15771484375, -9.2470703125, -8.33642578125, -7.42578125, -6.51513671875, -5.6044921875, -4.69384765625, -3.783203125, -2.87255859375, -1.9619140625, -1.05126953125, -0.140625, 0.77001953125, 1.6806640625, 2.59130859375, 3.501953125, 4.41259765625, 5.3232421875, 6.23388671875, 7.14453125, 8.05517578125, 8.9658203125, 9.87646484375, 10.787109375, 11.69775390625, 12.6083984375, 13.51904296875, 14.4296875, 15.34033203125, 16.2509765625, 17.16162109375, 18.072265625, 18.98291015625, 19.8935546875, 20.80419921875, 21.71484375, 22.62548828125, 23.5361328125, 24.44677734375, 25.357421875, 26.26806640625, 27.1787109375, 28.08935546875, 29.0]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 6.0, 9.0, 12.0, 17.0, 31.0, 23.0, 40.0, 64.0, 95.0, 151.0, 182.0, 272.0, 396.0, 515.0, 477.0, 466.0, 355.0, 294.0, 201.0, 122.0, 89.0, 73.0, 50.0, 30.0, 29.0, 19.0, 18.0, 11.0, 8.0, 6.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.0625, -16.537109375, -16.01171875, -15.486328125, -14.9609375, -14.435546875, -13.91015625, -13.384765625, -12.859375, -12.333984375, -11.80859375, -11.283203125, -10.7578125, -10.232421875, -9.70703125, -9.181640625, -8.65625, -8.130859375, -7.60546875, -7.080078125, -6.5546875, -6.029296875, -5.50390625, -4.978515625, -4.453125, -3.927734375, -3.40234375, -2.876953125, -2.3515625, -1.826171875, -1.30078125, -0.775390625, -0.25, 0.275390625, 0.80078125, 1.326171875, 1.8515625, 2.376953125, 2.90234375, 3.427734375, 3.953125, 4.478515625, 5.00390625, 5.529296875, 6.0546875, 6.580078125, 7.10546875, 7.630859375, 8.15625, 8.681640625, 9.20703125, 9.732421875, 10.2578125, 10.783203125, 11.30859375, 11.833984375, 12.359375, 12.884765625, 13.41015625, 13.935546875, 14.4609375, 14.986328125, 15.51171875, 16.037109375, 16.5625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 16.0, 14.0, 16.0, 30.0, 32.0, 44.0, 91.0, 113.0, 155.0, 257.0, 378.0, 644.0, 5624.0, 4026237.0, 158207.0, 1081.0, 450.0, 279.0, 193.0, 150.0, 76.0, 54.0, 26.0, 34.0, 23.0, 16.0, 6.0, 5.0, 7.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-87.1875, -84.439453125, -81.69140625, -78.943359375, -76.1953125, -73.447265625, -70.69921875, -67.951171875, -65.203125, -62.455078125, -59.70703125, -56.958984375, -54.2109375, -51.462890625, -48.71484375, -45.966796875, -43.21875, -40.470703125, -37.72265625, -34.974609375, -32.2265625, -29.478515625, -26.73046875, -23.982421875, -21.234375, -18.486328125, -15.73828125, -12.990234375, -10.2421875, -7.494140625, -4.74609375, -1.998046875, 0.75, 3.498046875, 6.24609375, 8.994140625, 11.7421875, 14.490234375, 17.23828125, 19.986328125, 22.734375, 25.482421875, 28.23046875, 30.978515625, 33.7265625, 36.474609375, 39.22265625, 41.970703125, 44.71875, 47.466796875, 50.21484375, 52.962890625, 55.7109375, 58.458984375, 61.20703125, 63.955078125, 66.703125, 69.451171875, 72.19921875, 74.947265625, 77.6953125, 80.443359375, 83.19140625, 85.939453125, 88.6875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 26.0, 157.0, 334.0, 320.0, 139.0, 32.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.1746368408203, -127.83661651611328, -122.49859619140625, -117.16058349609375, -111.82255554199219, -106.48454284667969, -101.14652252197266, -95.80850219726562, -90.4704818725586, -85.13246154785156, -79.79444122314453, -74.4564208984375, -69.118408203125, -63.7803840637207, -58.44236755371094, -53.104347229003906, -47.766326904296875, -42.428306579589844, -37.09028625488281, -31.752269744873047, -26.414249420166016, -21.076229095458984, -15.738212585449219, -10.400192260742188, -5.062171936035156, 0.2758474349975586, 5.613866806030273, 10.951885223388672, 16.289905548095703, 21.627925872802734, 26.9659423828125, 32.30396270751953, 37.641998291015625, 42.980018615722656, 48.31803894042969, 53.65605545043945, 58.994075775146484, 64.33209228515625, 69.67011260986328, 75.00813293457031, 80.34615325927734, 85.68417358398438, 91.0221939086914, 96.36021423339844, 101.69822692871094, 107.0362548828125, 112.374267578125, 117.71228790283203, 123.05030822753906, 128.38832092285156, 133.72634887695312, 139.06436157226562, 144.4023895263672, 149.7404022216797, 155.07843017578125, 160.41644287109375, 165.75445556640625, 171.09246826171875, 176.4304962158203, 181.7685089111328, 187.10653686523438, 192.44454956054688, 197.78256225585938, 203.12059020996094, 208.4586181640625]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 10.0, 5.0, 8.0, 10.0, 12.0, 8.0, 19.0, 16.0, 14.0, 19.0, 25.0, 31.0, 26.0, 34.0, 29.0, 36.0, 37.0, 41.0, 35.0, 35.0, 48.0, 35.0, 31.0, 49.0, 31.0, 26.0, 29.0, 38.0, 25.0, 31.0, 17.0, 23.0, 29.0, 16.0, 20.0, 11.0, 12.0, 15.0, 13.0, 5.0, 10.0, 8.0, 9.0, 4.0, 5.0, 5.0, 2.0, 0.0, 4.0, 0.0, 3.0], "bins": [-45.06654739379883, -43.75147247314453, -42.436397552490234, -41.12132263183594, -39.806251525878906, -38.49117660522461, -37.17610168457031, -35.861026763916016, -34.54595184326172, -33.23087692260742, -31.915802001953125, -30.60072898864746, -29.285654067993164, -27.970579147338867, -26.655506134033203, -25.340431213378906, -24.02535629272461, -22.710281372070312, -21.395206451416016, -20.08013343811035, -18.765058517456055, -17.449983596801758, -16.134910583496094, -14.819835662841797, -13.5047607421875, -12.189685821533203, -10.874611854553223, -9.559537887573242, -8.244462966918945, -6.929388523101807, -5.614314079284668, -4.2992401123046875, -2.9841690063476562, -1.6690945625305176, -0.3540201187133789, 0.9610543251037598, 2.2761287689208984, 3.591203212738037, 4.906277656555176, 6.221351623535156, 7.536426544189453, 8.85150146484375, 10.16657543182373, 11.481649398803711, 12.796724319458008, 14.111799240112305, 15.426873207092285, 16.741947174072266, 18.057022094726562, 19.37209701538086, 20.687171936035156, 22.00224494934082, 23.317319869995117, 24.632394790649414, 25.947467803955078, 27.262542724609375, 28.577617645263672, 29.89269256591797, 31.207767486572266, 32.52284240722656, 33.837913513183594, 35.15298843383789, 36.46806335449219, 37.783138275146484, 39.09821319580078]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 5.0, 5.0, 11.0, 12.0, 6.0, 15.0, 10.0, 16.0, 19.0, 24.0, 19.0, 34.0, 28.0, 35.0, 28.0, 39.0, 38.0, 54.0, 38.0, 31.0, 65.0, 51.0, 37.0, 33.0, 53.0, 33.0, 35.0, 38.0, 31.0, 25.0, 24.0, 16.0, 20.0, 18.0, 13.0, 9.0, 12.0, 13.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.6456298828125, -7.385009765625, -7.1243896484375, -6.86376953125, -6.6031494140625, -6.342529296875, -6.0819091796875, -5.8212890625, -5.5606689453125, -5.300048828125, -5.0394287109375, -4.77880859375, -4.5181884765625, -4.257568359375, -3.9969482421875, -3.736328125, -3.4757080078125, -3.215087890625, -2.9544677734375, -2.69384765625, -2.4332275390625, -2.172607421875, -1.9119873046875, -1.6513671875, -1.3907470703125, -1.130126953125, -0.8695068359375, -0.60888671875, -0.3482666015625, -0.087646484375, 0.1729736328125, 0.43359375, 0.6942138671875, 0.954833984375, 1.2154541015625, 1.47607421875, 1.7366943359375, 1.997314453125, 2.2579345703125, 2.5185546875, 2.7791748046875, 3.039794921875, 3.3004150390625, 3.56103515625, 3.8216552734375, 4.082275390625, 4.3428955078125, 4.603515625, 4.8641357421875, 5.124755859375, 5.3853759765625, 5.64599609375, 5.9066162109375, 6.167236328125, 6.4278564453125, 6.6884765625, 6.9490966796875, 7.209716796875, 7.4703369140625, 7.73095703125, 7.9915771484375, 8.252197265625, 8.5128173828125, 8.7734375]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 4.0, 6.0, 11.0, 15.0, 16.0, 28.0, 43.0, 52.0, 86.0, 148.0, 173.0, 304.0, 401.0, 597.0, 876.0, 1318.0, 1835.0, 2772.0, 4167.0, 6413.0, 10055.0, 15560.0, 24849.0, 41402.0, 72425.0, 140203.0, 294761.0, 197092.0, 95392.0, 52125.0, 31290.0, 19268.0, 11696.0, 7728.0, 5062.0, 3428.0, 2265.0, 1518.0, 984.0, 707.0, 422.0, 318.0, 215.0, 150.0, 118.0, 77.0, 70.0, 39.0, 25.0, 18.0, 12.0, 9.0, 5.0, 3.0, 3.0, 1.0, 2.0], "bins": [-1.427734375, -1.3853912353515625, -1.343048095703125, -1.3007049560546875, -1.25836181640625, -1.2160186767578125, -1.173675537109375, -1.1313323974609375, -1.0889892578125, -1.0466461181640625, -1.004302978515625, -0.9619598388671875, -0.91961669921875, -0.8772735595703125, -0.834930419921875, -0.7925872802734375, -0.750244140625, -0.7079010009765625, -0.665557861328125, -0.6232147216796875, -0.58087158203125, -0.5385284423828125, -0.496185302734375, -0.4538421630859375, -0.4114990234375, -0.3691558837890625, -0.326812744140625, -0.2844696044921875, -0.24212646484375, -0.1997833251953125, -0.157440185546875, -0.1150970458984375, -0.07275390625, -0.0304107666015625, 0.011932373046875, 0.0542755126953125, 0.09661865234375, 0.1389617919921875, 0.181304931640625, 0.2236480712890625, 0.2659912109375, 0.3083343505859375, 0.350677490234375, 0.3930206298828125, 0.43536376953125, 0.4777069091796875, 0.520050048828125, 0.5623931884765625, 0.604736328125, 0.6470794677734375, 0.689422607421875, 0.7317657470703125, 0.77410888671875, 0.8164520263671875, 0.858795166015625, 0.9011383056640625, 0.9434814453125, 0.9858245849609375, 1.028167724609375, 1.0705108642578125, 1.11285400390625, 1.1551971435546875, 1.197540283203125, 1.2398834228515625, 1.2822265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 12.0, 10.0, 13.0, 16.0, 12.0, 13.0, 24.0, 23.0, 31.0, 38.0, 34.0, 43.0, 58.0, 45.0, 51.0, 64.0, 1070.0, 47.0, 48.0, 39.0, 42.0, 43.0, 40.0, 32.0, 24.0, 21.0, 28.0, 23.0, 12.0, 15.0, 12.0, 10.0, 8.0, 7.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.2578125, -6.068115234375, -5.87841796875, -5.688720703125, -5.4990234375, -5.309326171875, -5.11962890625, -4.929931640625, -4.740234375, -4.550537109375, -4.36083984375, -4.171142578125, -3.9814453125, -3.791748046875, -3.60205078125, -3.412353515625, -3.22265625, -3.032958984375, -2.84326171875, -2.653564453125, -2.4638671875, -2.274169921875, -2.08447265625, -1.894775390625, -1.705078125, -1.515380859375, -1.32568359375, -1.135986328125, -0.9462890625, -0.756591796875, -0.56689453125, -0.377197265625, -0.1875, 0.002197265625, 0.19189453125, 0.381591796875, 0.5712890625, 0.760986328125, 0.95068359375, 1.140380859375, 1.330078125, 1.519775390625, 1.70947265625, 1.899169921875, 2.0888671875, 2.278564453125, 2.46826171875, 2.657958984375, 2.84765625, 3.037353515625, 3.22705078125, 3.416748046875, 3.6064453125, 3.796142578125, 3.98583984375, 4.175537109375, 4.365234375, 4.554931640625, 4.74462890625, 4.934326171875, 5.1240234375, 5.313720703125, 5.50341796875, 5.693115234375, 5.8828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 9.0, 14.0, 13.0, 28.0, 48.0, 51.0, 87.0, 143.0, 199.0, 323.0, 443.0, 631.0, 993.0, 1545.0, 2428.0, 3757.0, 6184.0, 9775.0, 16034.0, 27539.0, 47943.0, 92159.0, 202189.0, 1364343.0, 151787.0, 72142.0, 38473.0, 22278.0, 13460.0, 8182.0, 4976.0, 3195.0, 1984.0, 1280.0, 828.0, 533.0, 348.0, 223.0, 177.0, 110.0, 93.0, 61.0, 31.0, 25.0, 23.0, 11.0, 16.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.5244140625, -1.4757537841796875, -1.427093505859375, -1.3784332275390625, -1.32977294921875, -1.2811126708984375, -1.232452392578125, -1.1837921142578125, -1.1351318359375, -1.0864715576171875, -1.037811279296875, -0.9891510009765625, -0.94049072265625, -0.8918304443359375, -0.843170166015625, -0.7945098876953125, -0.745849609375, -0.6971893310546875, -0.648529052734375, -0.5998687744140625, -0.55120849609375, -0.5025482177734375, -0.453887939453125, -0.4052276611328125, -0.3565673828125, -0.3079071044921875, -0.259246826171875, -0.2105865478515625, -0.16192626953125, -0.1132659912109375, -0.064605712890625, -0.0159454345703125, 0.03271484375, 0.0813751220703125, 0.130035400390625, 0.1786956787109375, 0.22735595703125, 0.2760162353515625, 0.324676513671875, 0.3733367919921875, 0.4219970703125, 0.4706573486328125, 0.519317626953125, 0.5679779052734375, 0.61663818359375, 0.6652984619140625, 0.713958740234375, 0.7626190185546875, 0.811279296875, 0.8599395751953125, 0.908599853515625, 0.9572601318359375, 1.00592041015625, 1.0545806884765625, 1.103240966796875, 1.1519012451171875, 1.2005615234375, 1.2492218017578125, 1.297882080078125, 1.3465423583984375, 1.39520263671875, 1.4438629150390625, 1.492523193359375, 1.5411834716796875, 1.58984375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 7.0, 11.0, 14.0, 14.0, 26.0, 18.0, 23.0, 28.0, 53.0, 56.0, 63.0, 86.0, 72.0, 73.0, 79.0, 81.0, 68.0, 42.0, 32.0, 33.0, 20.0, 14.0, 25.0, 9.0, 13.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 4.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00217437744140625, -0.0021089017391204834, -0.002043426036834717, -0.00197795033454895, -0.0019124746322631836, -0.001846998929977417, -0.0017815232276916504, -0.0017160475254058838, -0.0016505718231201172, -0.0015850961208343506, -0.001519620418548584, -0.0014541447162628174, -0.0013886690139770508, -0.0013231933116912842, -0.0012577176094055176, -0.001192241907119751, -0.0011267662048339844, -0.0010612905025482178, -0.0009958148002624512, -0.0009303390979766846, -0.000864863395690918, -0.0007993876934051514, -0.0007339119911193848, -0.0006684362888336182, -0.0006029605865478516, -0.000537484884262085, -0.00047200918197631836, -0.00040653347969055176, -0.00034105777740478516, -0.00027558207511901855, -0.00021010637283325195, -0.00014463067054748535, -7.915496826171875e-05, -1.3679265975952148e-05, 5.179643630981445e-05, 0.00011727213859558105, 0.00018274784088134766, 0.00024822354316711426, 0.00031369924545288086, 0.00037917494773864746, 0.00044465065002441406, 0.0005101263523101807, 0.0005756020545959473, 0.0006410777568817139, 0.0007065534591674805, 0.0007720291614532471, 0.0008375048637390137, 0.0009029805660247803, 0.0009684562683105469, 0.0010339319705963135, 0.00109940767288208, 0.0011648833751678467, 0.0012303590774536133, 0.0012958347797393799, 0.0013613104820251465, 0.001426786184310913, 0.0014922618865966797, 0.0015577375888824463, 0.0016232132911682129, 0.0016886889934539795, 0.001754164695739746, 0.0018196403980255127, 0.0018851161003112793, 0.001950591802597046, 0.0020160675048828125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 4.0, 12.0, 9.0, 9.0, 12.0, 26.0, 29.0, 36.0, 51.0, 64.0, 77.0, 160.0, 299.0, 598.0, 4036.0, 1038127.0, 3578.0, 633.0, 262.0, 154.0, 99.0, 70.0, 39.0, 40.0, 31.0, 27.0, 13.0, 15.0, 10.0, 8.0, 2.0, 8.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.045654296875, -0.044291019439697266, -0.04292774200439453, -0.0415644645690918, -0.04020118713378906, -0.03883790969848633, -0.037474632263183594, -0.03611135482788086, -0.034748077392578125, -0.03338479995727539, -0.032021522521972656, -0.030658245086669922, -0.029294967651367188, -0.027931690216064453, -0.02656841278076172, -0.025205135345458984, -0.02384185791015625, -0.022478580474853516, -0.02111530303955078, -0.019752025604248047, -0.018388748168945312, -0.017025470733642578, -0.015662193298339844, -0.01429891586303711, -0.012935638427734375, -0.01157236099243164, -0.010209083557128906, -0.008845806121826172, -0.0074825286865234375, -0.006119251251220703, -0.004755973815917969, -0.0033926963806152344, -0.0020294189453125, -0.0006661415100097656, 0.0006971359252929688, 0.002060413360595703, 0.0034236907958984375, 0.004786968231201172, 0.006150245666503906, 0.007513523101806641, 0.008876800537109375, 0.01024007797241211, 0.011603355407714844, 0.012966632843017578, 0.014329910278320312, 0.015693187713623047, 0.01705646514892578, 0.018419742584228516, 0.01978302001953125, 0.021146297454833984, 0.02250957489013672, 0.023872852325439453, 0.025236129760742188, 0.026599407196044922, 0.027962684631347656, 0.02932596206665039, 0.030689239501953125, 0.03205251693725586, 0.033415794372558594, 0.03477907180786133, 0.03614234924316406, 0.0375056266784668, 0.03886890411376953, 0.040232181549072266, 0.041595458984375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 7.0, 469.0, 531.0, 11.0], "bins": [-0.015552587807178497, -0.015301905572414398, -0.015051223337650299, -0.0148005411028862, -0.0145498588681221, -0.014299176633358002, -0.014048494398593903, -0.013797812163829803, -0.013547129929065704, -0.013296447694301605, -0.013045765459537506, -0.012795083224773407, -0.012544400990009308, -0.012293718755245209, -0.01204303652048111, -0.01179235428571701, -0.011541672050952911, -0.011290989816188812, -0.011040307581424713, -0.010789625346660614, -0.010538943111896515, -0.010288260877132416, -0.010037578642368317, -0.009786896407604218, -0.009536214172840118, -0.00928553193807602, -0.00903484970331192, -0.008784167468547821, -0.008533485233783722, -0.008282802999019623, -0.008032120764255524, -0.0077814385294914246, -0.0075307562947273254, -0.007280074059963226, -0.007029391825199127, -0.006778709590435028, -0.006528027355670929, -0.00627734512090683, -0.006026662886142731, -0.005775980651378632, -0.0055252984166145325, -0.005274616181850433, -0.005023933947086334, -0.004773251712322235, -0.004522569477558136, -0.004271887242794037, -0.004021205008029938, -0.0037705227732658386, -0.0035198405385017395, -0.0032691583037376404, -0.0030184760689735413, -0.002767793834209442, -0.002517111599445343, -0.002266429364681244, -0.0020157471299171448, -0.0017650648951530457, -0.0015143826603889465, -0.0012637004256248474, -0.0010130181908607483, -0.0007623359560966492, -0.00051165372133255, -0.00026097148656845093, -1.0289251804351807e-05, 0.00024039298295974731, 0.0004910752759315073]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 7.0, 9.0, 6.0, 7.0, 5.0, 14.0, 11.0, 14.0, 24.0, 19.0, 22.0, 26.0, 18.0, 23.0, 34.0, 39.0, 46.0, 37.0, 30.0, 41.0, 45.0, 50.0, 43.0, 46.0, 33.0, 44.0, 35.0, 34.0, 25.0, 35.0, 32.0, 23.0, 21.0, 21.0, 14.0, 17.0, 8.0, 8.0, 6.0, 8.0, 7.0, 2.0, 3.0, 6.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0009357929229736328, -0.00090755894780159, -0.0008793249726295471, -0.0008510909974575043, -0.0008228570222854614, -0.0007946230471134186, -0.0007663890719413757, -0.0007381550967693329, -0.00070992112159729, -0.0006816871464252472, -0.0006534531712532043, -0.0006252191960811615, -0.0005969852209091187, -0.0005687512457370758, -0.000540517270565033, -0.0005122832953929901, -0.00048404932022094727, -0.0004558153450489044, -0.00042758136987686157, -0.0003993473947048187, -0.0003711134195327759, -0.00034287944436073303, -0.0003146454691886902, -0.00028641149401664734, -0.0002581775188446045, -0.00022994354367256165, -0.0002017095685005188, -0.00017347559332847595, -0.0001452416181564331, -0.00011700764298439026, -8.877366781234741e-05, -6.0539692640304565e-05, -3.230571746826172e-05, -4.071742296218872e-06, 2.4162232875823975e-05, 5.239620804786682e-05, 8.063018321990967e-05, 0.00010886415839195251, 0.00013709813356399536, 0.0001653321087360382, 0.00019356608390808105, 0.0002218000590801239, 0.00025003403425216675, 0.0002782680094242096, 0.00030650198459625244, 0.0003347359597682953, 0.00036296993494033813, 0.000391203910112381, 0.00041943788528442383, 0.0004476718604564667, 0.0004759058356285095, 0.0005041398108005524, 0.0005323737859725952, 0.0005606077611446381, 0.0005888417363166809, 0.0006170757114887238, 0.0006453096866607666, 0.0006735436618328094, 0.0007017776370048523, 0.0007300116121768951, 0.000758245587348938, 0.0007864795625209808, 0.0008147135376930237, 0.0008429475128650665, 0.0008711814880371094]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 2.0, 1.0, 5.0, 5.0, 11.0, 12.0, 6.0, 15.0, 10.0, 16.0, 19.0, 24.0, 19.0, 34.0, 28.0, 35.0, 28.0, 39.0, 38.0, 54.0, 38.0, 31.0, 65.0, 51.0, 37.0, 33.0, 53.0, 33.0, 35.0, 38.0, 31.0, 25.0, 24.0, 16.0, 20.0, 18.0, 13.0, 9.0, 12.0, 13.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.6456298828125, -7.385009765625, -7.1243896484375, -6.86376953125, -6.6031494140625, -6.342529296875, -6.0819091796875, -5.8212890625, -5.5606689453125, -5.300048828125, -5.0394287109375, -4.77880859375, -4.5181884765625, -4.257568359375, -3.9969482421875, -3.736328125, -3.4757080078125, -3.215087890625, -2.9544677734375, -2.69384765625, -2.4332275390625, -2.172607421875, -1.9119873046875, -1.6513671875, -1.3907470703125, -1.130126953125, -0.8695068359375, -0.60888671875, -0.3482666015625, -0.087646484375, 0.1729736328125, 0.43359375, 0.6942138671875, 0.954833984375, 1.2154541015625, 1.47607421875, 1.7366943359375, 1.997314453125, 2.2579345703125, 2.5185546875, 2.7791748046875, 3.039794921875, 3.3004150390625, 3.56103515625, 3.8216552734375, 4.082275390625, 4.3428955078125, 4.603515625, 4.8641357421875, 5.124755859375, 5.3853759765625, 5.64599609375, 5.9066162109375, 6.167236328125, 6.4278564453125, 6.6884765625, 6.9490966796875, 7.209716796875, 7.4703369140625, 7.73095703125, 7.9915771484375, 8.252197265625, 8.5128173828125, 8.7734375]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 6.0, 10.0, 15.0, 10.0, 21.0, 16.0, 29.0, 42.0, 60.0, 79.0, 88.0, 120.0, 201.0, 327.0, 622.0, 1578.0, 8888.0, 68964.0, 562632.0, 353724.0, 42604.0, 5711.0, 1297.0, 517.0, 290.0, 196.0, 121.0, 97.0, 57.0, 61.0, 40.0, 23.0, 19.0, 15.0, 16.0, 11.0, 13.0, 9.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-15.6171875, -15.0946044921875, -14.572021484375, -14.0494384765625, -13.52685546875, -13.0042724609375, -12.481689453125, -11.9591064453125, -11.4365234375, -10.9139404296875, -10.391357421875, -9.8687744140625, -9.34619140625, -8.8236083984375, -8.301025390625, -7.7784423828125, -7.255859375, -6.7332763671875, -6.210693359375, -5.6881103515625, -5.16552734375, -4.6429443359375, -4.120361328125, -3.5977783203125, -3.0751953125, -2.5526123046875, -2.030029296875, -1.5074462890625, -0.98486328125, -0.4622802734375, 0.060302734375, 0.5828857421875, 1.10546875, 1.6280517578125, 2.150634765625, 2.6732177734375, 3.19580078125, 3.7183837890625, 4.240966796875, 4.7635498046875, 5.2861328125, 5.8087158203125, 6.331298828125, 6.8538818359375, 7.37646484375, 7.8990478515625, 8.421630859375, 8.9442138671875, 9.466796875, 9.9893798828125, 10.511962890625, 11.0345458984375, 11.55712890625, 12.0797119140625, 12.602294921875, 13.1248779296875, 13.6474609375, 14.1700439453125, 14.692626953125, 15.2152099609375, 15.73779296875, 16.2603759765625, 16.782958984375, 17.3055419921875, 17.828125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 5.0, 6.0, 10.0, 9.0, 8.0, 13.0, 14.0, 20.0, 21.0, 22.0, 30.0, 33.0, 35.0, 41.0, 44.0, 47.0, 76.0, 145.0, 343.0, 1470.0, 150.0, 85.0, 48.0, 50.0, 38.0, 46.0, 47.0, 39.0, 27.0, 19.0, 23.0, 23.0, 10.0, 12.0, 15.0, 7.0, 7.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-30.171875, -29.261474609375, -28.35107421875, -27.440673828125, -26.5302734375, -25.619873046875, -24.70947265625, -23.799072265625, -22.888671875, -21.978271484375, -21.06787109375, -20.157470703125, -19.2470703125, -18.336669921875, -17.42626953125, -16.515869140625, -15.60546875, -14.695068359375, -13.78466796875, -12.874267578125, -11.9638671875, -11.053466796875, -10.14306640625, -9.232666015625, -8.322265625, -7.411865234375, -6.50146484375, -5.591064453125, -4.6806640625, -3.770263671875, -2.85986328125, -1.949462890625, -1.0390625, -0.128662109375, 0.78173828125, 1.692138671875, 2.6025390625, 3.512939453125, 4.42333984375, 5.333740234375, 6.244140625, 7.154541015625, 8.06494140625, 8.975341796875, 9.8857421875, 10.796142578125, 11.70654296875, 12.616943359375, 13.52734375, 14.437744140625, 15.34814453125, 16.258544921875, 17.1689453125, 18.079345703125, 18.98974609375, 19.900146484375, 20.810546875, 21.720947265625, 22.63134765625, 23.541748046875, 24.4521484375, 25.362548828125, 26.27294921875, 27.183349609375, 28.09375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 1.0, 2.0, 8.0, 4.0, 5.0, 14.0, 27.0, 22.0, 41.0, 52.0, 67.0, 60.0, 121.0, 145.0, 273.0, 514.0, 1740.0, 998777.0, 2140545.0, 1937.0, 545.0, 239.0, 153.0, 114.0, 76.0, 53.0, 54.0, 26.0, 24.0, 19.0, 14.0, 15.0, 10.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-123.125, -119.609375, -116.09375, -112.578125, -109.0625, -105.546875, -102.03125, -98.515625, -95.0, -91.484375, -87.96875, -84.453125, -80.9375, -77.421875, -73.90625, -70.390625, -66.875, -63.359375, -59.84375, -56.328125, -52.8125, -49.296875, -45.78125, -42.265625, -38.75, -35.234375, -31.71875, -28.203125, -24.6875, -21.171875, -17.65625, -14.140625, -10.625, -7.109375, -3.59375, -0.078125, 3.4375, 6.953125, 10.46875, 13.984375, 17.5, 21.015625, 24.53125, 28.046875, 31.5625, 35.078125, 38.59375, 42.109375, 45.625, 49.140625, 52.65625, 56.171875, 59.6875, 63.203125, 66.71875, 70.234375, 73.75, 77.265625, 80.78125, 84.296875, 87.8125, 91.328125, 94.84375, 98.359375, 101.875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 11.0, 38.0, 87.0, 99.0, 133.0, 186.0, 158.0, 125.0, 89.0, 35.0, 26.0, 10.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.83781433105469, -48.67265319824219, -47.50749588012695, -46.34233474731445, -45.17717742919922, -44.01201629638672, -42.846858978271484, -41.681697845458984, -40.51654052734375, -39.35137939453125, -38.186222076416016, -37.021060943603516, -35.85590362548828, -34.69074249267578, -33.52558517456055, -32.36042404174805, -31.195262908935547, -30.03010368347168, -28.864944458007812, -27.699785232543945, -26.534626007080078, -25.369464874267578, -24.20430564880371, -23.039146423339844, -21.873987197875977, -20.70882797241211, -19.543668746948242, -18.378509521484375, -17.213348388671875, -16.04819107055664, -14.88302993774414, -13.717870712280273, -12.55270767211914, -11.387548446655273, -10.222389221191406, -9.057229042053223, -7.8920698165893555, -6.726910591125488, -5.561750888824463, -4.3965911865234375, -3.2314319610595703, -2.066272497177124, -0.9011130332946777, 0.26404643058776855, 1.4292058944702148, 2.594365119934082, 3.7595248222351074, 4.924684524536133, 6.08984375, 7.255002975463867, 8.420162200927734, 9.585322380065918, 10.750481605529785, 11.915640830993652, 13.080801010131836, 14.245960235595703, 15.41111946105957, 16.576278686523438, 17.741437911987305, 18.906597137451172, 20.071758270263672, 21.236915588378906, 22.402076721191406, 23.567235946655273, 24.73239517211914]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 4.0, 2.0, 5.0, 14.0, 15.0, 12.0, 12.0, 18.0, 20.0, 15.0, 23.0, 25.0, 30.0, 42.0, 38.0, 40.0, 41.0, 34.0, 49.0, 46.0, 36.0, 51.0, 47.0, 32.0, 34.0, 30.0, 25.0, 40.0, 31.0, 27.0, 16.0, 18.0, 18.0, 13.0, 8.0, 13.0, 10.0, 8.0, 11.0, 10.0, 7.0, 8.0, 2.0, 6.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.28593826293945, -60.176822662353516, -58.06770706176758, -55.95859146118164, -53.84947967529297, -51.74036407470703, -49.631248474121094, -47.522132873535156, -45.41301727294922, -43.30390167236328, -41.194786071777344, -39.085670471191406, -36.97655487060547, -34.86743927001953, -32.75832748413086, -30.649211883544922, -28.540096282958984, -26.430980682373047, -24.32186508178711, -22.212751388549805, -20.103635787963867, -17.99452018737793, -15.885405540466309, -13.776290893554688, -11.66717529296875, -9.558059692382812, -7.448945045471191, -5.339829921722412, -3.230714797973633, -1.1215991973876953, 0.9875154495239258, 3.096630096435547, 5.205741882324219, 7.314857006072998, 9.423972129821777, 11.533086776733398, 13.642202377319336, 15.751317977905273, 17.860431671142578, 19.969547271728516, 22.078662872314453, 24.18777847290039, 26.296894073486328, 28.406007766723633, 30.51512336730957, 32.624237060546875, 34.73335266113281, 36.84246826171875, 38.95158386230469, 41.060699462890625, 43.16981506347656, 45.2789306640625, 47.38804626464844, 49.497161865234375, 51.60627365112305, 53.715389251708984, 55.82450485229492, 57.93362045288086, 60.0427360534668, 62.151851654052734, 64.2609634399414, 66.37007904052734, 68.47919464111328, 70.58831024169922, 72.69742584228516]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 3.0, 6.0, 11.0, 9.0, 7.0, 14.0, 11.0, 20.0, 15.0, 31.0, 39.0, 29.0, 33.0, 32.0, 41.0, 51.0, 44.0, 55.0, 41.0, 46.0, 45.0, 39.0, 49.0, 45.0, 30.0, 36.0, 31.0, 32.0, 32.0, 20.0, 15.0, 16.0, 13.0, 13.0, 11.0, 16.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.1875, -8.883056640625, -8.57861328125, -8.274169921875, -7.9697265625, -7.665283203125, -7.36083984375, -7.056396484375, -6.751953125, -6.447509765625, -6.14306640625, -5.838623046875, -5.5341796875, -5.229736328125, -4.92529296875, -4.620849609375, -4.31640625, -4.011962890625, -3.70751953125, -3.403076171875, -3.0986328125, -2.794189453125, -2.48974609375, -2.185302734375, -1.880859375, -1.576416015625, -1.27197265625, -0.967529296875, -0.6630859375, -0.358642578125, -0.05419921875, 0.250244140625, 0.5546875, 0.859130859375, 1.16357421875, 1.468017578125, 1.7724609375, 2.076904296875, 2.38134765625, 2.685791015625, 2.990234375, 3.294677734375, 3.59912109375, 3.903564453125, 4.2080078125, 4.512451171875, 4.81689453125, 5.121337890625, 5.42578125, 5.730224609375, 6.03466796875, 6.339111328125, 6.6435546875, 6.947998046875, 7.25244140625, 7.556884765625, 7.861328125, 8.165771484375, 8.47021484375, 8.774658203125, 9.0791015625, 9.383544921875, 9.68798828125, 9.992431640625, 10.296875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 11.0, 11.0, 12.0, 26.0, 31.0, 37.0, 36.0, 66.0, 95.0, 192.0, 278.0, 555.0, 1290.0, 4653.0, 22428.0, 143420.0, 753887.0, 1770962.0, 1160574.0, 280041.0, 44218.0, 7836.0, 1992.0, 681.0, 360.0, 181.0, 118.0, 70.0, 57.0, 36.0, 28.0, 19.0, 22.0, 13.0, 10.0, 6.0, 10.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4140625, -11.01611328125, -10.6181640625, -10.22021484375, -9.822265625, -9.42431640625, -9.0263671875, -8.62841796875, -8.23046875, -7.83251953125, -7.4345703125, -7.03662109375, -6.638671875, -6.24072265625, -5.8427734375, -5.44482421875, -5.046875, -4.64892578125, -4.2509765625, -3.85302734375, -3.455078125, -3.05712890625, -2.6591796875, -2.26123046875, -1.86328125, -1.46533203125, -1.0673828125, -0.66943359375, -0.271484375, 0.12646484375, 0.5244140625, 0.92236328125, 1.3203125, 1.71826171875, 2.1162109375, 2.51416015625, 2.912109375, 3.31005859375, 3.7080078125, 4.10595703125, 4.50390625, 4.90185546875, 5.2998046875, 5.69775390625, 6.095703125, 6.49365234375, 6.8916015625, 7.28955078125, 7.6875, 8.08544921875, 8.4833984375, 8.88134765625, 9.279296875, 9.67724609375, 10.0751953125, 10.47314453125, 10.87109375, 11.26904296875, 11.6669921875, 12.06494140625, 12.462890625, 12.86083984375, 13.2587890625, 13.65673828125, 14.0546875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 4.0, 13.0, 14.0, 31.0, 39.0, 65.0, 67.0, 96.0, 166.0, 216.0, 304.0, 411.0, 498.0, 509.0, 457.0, 331.0, 243.0, 193.0, 115.0, 90.0, 66.0, 37.0, 32.0, 23.0, 21.0, 13.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.296875, -20.7080078125, -20.119140625, -19.5302734375, -18.94140625, -18.3525390625, -17.763671875, -17.1748046875, -16.5859375, -15.9970703125, -15.408203125, -14.8193359375, -14.23046875, -13.6416015625, -13.052734375, -12.4638671875, -11.875, -11.2861328125, -10.697265625, -10.1083984375, -9.51953125, -8.9306640625, -8.341796875, -7.7529296875, -7.1640625, -6.5751953125, -5.986328125, -5.3974609375, -4.80859375, -4.2197265625, -3.630859375, -3.0419921875, -2.453125, -1.8642578125, -1.275390625, -0.6865234375, -0.09765625, 0.4912109375, 1.080078125, 1.6689453125, 2.2578125, 2.8466796875, 3.435546875, 4.0244140625, 4.61328125, 5.2021484375, 5.791015625, 6.3798828125, 6.96875, 7.5576171875, 8.146484375, 8.7353515625, 9.32421875, 9.9130859375, 10.501953125, 11.0908203125, 11.6796875, 12.2685546875, 12.857421875, 13.4462890625, 14.03515625, 14.6240234375, 15.212890625, 15.8017578125, 16.390625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 16.0, 16.0, 31.0, 37.0, 57.0, 100.0, 169.0, 225.0, 382.0, 703.0, 1456.0, 8915.0, 3078949.0, 1095535.0, 4949.0, 1168.0, 618.0, 358.0, 204.0, 119.0, 104.0, 59.0, 38.0, 18.0, 20.0, 12.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.96875, -55.89111328125, -53.8134765625, -51.73583984375, -49.658203125, -47.58056640625, -45.5029296875, -43.42529296875, -41.34765625, -39.27001953125, -37.1923828125, -35.11474609375, -33.037109375, -30.95947265625, -28.8818359375, -26.80419921875, -24.7265625, -22.64892578125, -20.5712890625, -18.49365234375, -16.416015625, -14.33837890625, -12.2607421875, -10.18310546875, -8.10546875, -6.02783203125, -3.9501953125, -1.87255859375, 0.205078125, 2.28271484375, 4.3603515625, 6.43798828125, 8.515625, 10.59326171875, 12.6708984375, 14.74853515625, 16.826171875, 18.90380859375, 20.9814453125, 23.05908203125, 25.13671875, 27.21435546875, 29.2919921875, 31.36962890625, 33.447265625, 35.52490234375, 37.6025390625, 39.68017578125, 41.7578125, 43.83544921875, 45.9130859375, 47.99072265625, 50.068359375, 52.14599609375, 54.2236328125, 56.30126953125, 58.37890625, 60.45654296875, 62.5341796875, 64.61181640625, 66.689453125, 68.76708984375, 70.8447265625, 72.92236328125, 75.0]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 74.0, 455.0, 423.0, 56.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-369.5962219238281, -359.85150146484375, -350.1067810058594, -340.362060546875, -330.6173400878906, -320.87261962890625, -311.1278991699219, -301.3831787109375, -291.638427734375, -281.8937072753906, -272.14898681640625, -262.4042663574219, -252.6595458984375, -242.91482543945312, -233.1700897216797, -223.4253692626953, -213.6806640625, -203.93594360351562, -194.19122314453125, -184.44650268554688, -174.7017822265625, -164.95706176757812, -155.2123260498047, -145.4676055908203, -135.72288513183594, -125.97816467285156, -116.23344421386719, -106.48871612548828, -96.7439956665039, -86.99927520751953, -77.25454711914062, -67.50982666015625, -57.76509094238281, -48.02037048339844, -38.2756462097168, -28.53092384338379, -18.78620147705078, -9.041481018066406, 0.7032432556152344, 10.447967529296875, 20.19268798828125, 29.937410354614258, 39.682132720947266, 49.426856994628906, 59.17157745361328, 68.91629791259766, 78.66102600097656, 88.40574645996094, 98.15046691894531, 107.89518737792969, 117.63990783691406, 127.38463592529297, 137.12936401367188, 146.87408447265625, 156.61880493164062, 166.363525390625, 176.10824584960938, 185.85296630859375, 195.59768676757812, 205.3424072265625, 215.08712768554688, 224.83184814453125, 234.5765838623047, 244.32130432128906, 254.06602478027344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 3.0, 10.0, 4.0, 12.0, 9.0, 17.0, 14.0, 28.0, 21.0, 27.0, 22.0, 28.0, 33.0, 37.0, 41.0, 42.0, 42.0, 55.0, 44.0, 52.0, 45.0, 37.0, 38.0, 49.0, 46.0, 39.0, 39.0, 28.0, 26.0, 15.0, 22.0, 20.0, 13.0, 14.0, 8.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.217674255371094, -54.34430694580078, -52.47093963623047, -50.59757614135742, -48.72420883178711, -46.8508415222168, -44.977474212646484, -43.10411071777344, -41.230743408203125, -39.35737609863281, -37.4840087890625, -35.61064529418945, -33.73727798461914, -31.863910675048828, -29.990543365478516, -28.117177963256836, -26.243810653686523, -24.37044334411621, -22.49707794189453, -20.62371063232422, -18.75034523010254, -16.876977920532227, -15.00361156463623, -13.130245208740234, -11.256878852844238, -9.383512496948242, -7.510146141052246, -5.636779308319092, -3.7634129524230957, -1.8900461196899414, -0.016679763793945312, 1.8566865921020508, 3.730052947998047, 5.603419303894043, 7.476785659790039, 9.350152969360352, 11.223518371582031, 13.096885681152344, 14.97025203704834, 16.843618392944336, 18.716983795166016, 20.590351104736328, 22.463716506958008, 24.33708381652832, 26.21044921875, 28.083816528320312, 29.957183837890625, 31.830549240112305, 33.70391845703125, 35.57728576660156, 37.450653076171875, 39.32401657104492, 41.197383880615234, 43.07075119018555, 44.94411849975586, 46.817481994628906, 48.69084930419922, 50.56421661376953, 52.437583923339844, 54.31094741821289, 56.1843147277832, 58.057682037353516, 59.93104934692383, 61.804412841796875, 63.67778015136719]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 10.0, 7.0, 7.0, 4.0, 7.0, 4.0, 12.0, 16.0, 10.0, 20.0, 12.0, 26.0, 19.0, 31.0, 25.0, 20.0, 30.0, 35.0, 26.0, 37.0, 39.0, 45.0, 38.0, 37.0, 39.0, 37.0, 32.0, 34.0, 34.0, 28.0, 25.0, 24.0, 25.0, 25.0, 23.0, 22.0, 25.0, 14.0, 15.0, 8.0, 10.0, 8.0, 13.0, 12.0, 5.0, 9.0, 3.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.13671875, -6.9102783203125, -6.683837890625, -6.4573974609375, -6.23095703125, -6.0045166015625, -5.778076171875, -5.5516357421875, -5.3251953125, -5.0987548828125, -4.872314453125, -4.6458740234375, -4.41943359375, -4.1929931640625, -3.966552734375, -3.7401123046875, -3.513671875, -3.2872314453125, -3.060791015625, -2.8343505859375, -2.60791015625, -2.3814697265625, -2.155029296875, -1.9285888671875, -1.7021484375, -1.4757080078125, -1.249267578125, -1.0228271484375, -0.79638671875, -0.5699462890625, -0.343505859375, -0.1170654296875, 0.109375, 0.3358154296875, 0.562255859375, 0.7886962890625, 1.01513671875, 1.2415771484375, 1.468017578125, 1.6944580078125, 1.9208984375, 2.1473388671875, 2.373779296875, 2.6002197265625, 2.82666015625, 3.0531005859375, 3.279541015625, 3.5059814453125, 3.732421875, 3.9588623046875, 4.185302734375, 4.4117431640625, 4.63818359375, 4.8646240234375, 5.091064453125, 5.3175048828125, 5.5439453125, 5.7703857421875, 5.996826171875, 6.2232666015625, 6.44970703125, 6.6761474609375, 6.902587890625, 7.1290283203125, 7.35546875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 8.0, 4.0, 6.0, 15.0, 16.0, 23.0, 34.0, 54.0, 93.0, 107.0, 151.0, 194.0, 317.0, 428.0, 652.0, 822.0, 1169.0, 1755.0, 2350.0, 3525.0, 5006.0, 7512.0, 10763.0, 16012.0, 24039.0, 37561.0, 60232.0, 102212.0, 189615.0, 244853.0, 130119.0, 74575.0, 45331.0, 29346.0, 18939.0, 12611.0, 8657.0, 5933.0, 3986.0, 2804.0, 2028.0, 1378.0, 954.0, 703.0, 526.0, 332.0, 223.0, 171.0, 124.0, 83.0, 76.0, 44.0, 33.0, 23.0, 12.0, 12.0, 8.0, 7.0, 3.0, 2.0, 1.0], "bins": [-1.2822265625, -1.2424163818359375, -1.202606201171875, -1.1627960205078125, -1.12298583984375, -1.0831756591796875, -1.043365478515625, -1.0035552978515625, -0.9637451171875, -0.9239349365234375, -0.884124755859375, -0.8443145751953125, -0.80450439453125, -0.7646942138671875, -0.724884033203125, -0.6850738525390625, -0.645263671875, -0.6054534912109375, -0.565643310546875, -0.5258331298828125, -0.48602294921875, -0.4462127685546875, -0.406402587890625, -0.3665924072265625, -0.3267822265625, -0.2869720458984375, -0.247161865234375, -0.2073516845703125, -0.16754150390625, -0.1277313232421875, -0.087921142578125, -0.0481109619140625, -0.00830078125, 0.0315093994140625, 0.071319580078125, 0.1111297607421875, 0.15093994140625, 0.1907501220703125, 0.230560302734375, 0.2703704833984375, 0.3101806640625, 0.3499908447265625, 0.389801025390625, 0.4296112060546875, 0.46942138671875, 0.5092315673828125, 0.549041748046875, 0.5888519287109375, 0.628662109375, 0.6684722900390625, 0.708282470703125, 0.7480926513671875, 0.78790283203125, 0.8277130126953125, 0.867523193359375, 0.9073333740234375, 0.9471435546875, 0.9869537353515625, 1.026763916015625, 1.0665740966796875, 1.10638427734375, 1.1461944580078125, 1.186004638671875, 1.2258148193359375, 1.265625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 3.0, 6.0, 5.0, 9.0, 8.0, 15.0, 12.0, 19.0, 15.0, 16.0, 31.0, 27.0, 35.0, 27.0, 45.0, 41.0, 39.0, 42.0, 32.0, 44.0, 1070.0, 29.0, 41.0, 26.0, 39.0, 56.0, 46.0, 31.0, 30.0, 19.0, 18.0, 24.0, 17.0, 23.0, 6.0, 18.0, 14.0, 11.0, 13.0, 5.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-5.67578125, -5.51507568359375, -5.3543701171875, -5.19366455078125, -5.032958984375, -4.87225341796875, -4.7115478515625, -4.55084228515625, -4.39013671875, -4.22943115234375, -4.0687255859375, -3.90802001953125, -3.747314453125, -3.58660888671875, -3.4259033203125, -3.26519775390625, -3.1044921875, -2.94378662109375, -2.7830810546875, -2.62237548828125, -2.461669921875, -2.30096435546875, -2.1402587890625, -1.97955322265625, -1.81884765625, -1.65814208984375, -1.4974365234375, -1.33673095703125, -1.176025390625, -1.01531982421875, -0.8546142578125, -0.69390869140625, -0.533203125, -0.37249755859375, -0.2117919921875, -0.05108642578125, 0.109619140625, 0.27032470703125, 0.4310302734375, 0.59173583984375, 0.75244140625, 0.91314697265625, 1.0738525390625, 1.23455810546875, 1.395263671875, 1.55596923828125, 1.7166748046875, 1.87738037109375, 2.0380859375, 2.19879150390625, 2.3594970703125, 2.52020263671875, 2.680908203125, 2.84161376953125, 3.0023193359375, 3.16302490234375, 3.32373046875, 3.48443603515625, 3.6451416015625, 3.80584716796875, 3.966552734375, 4.12725830078125, 4.2879638671875, 4.44866943359375, 4.609375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 5.0, 4.0, 7.0, 15.0, 8.0, 18.0, 38.0, 52.0, 64.0, 95.0, 158.0, 248.0, 326.0, 519.0, 807.0, 1174.0, 1875.0, 2954.0, 5013.0, 7907.0, 13062.0, 22663.0, 38811.0, 73257.0, 150688.0, 1361665.0, 203402.0, 93561.0, 48634.0, 27950.0, 16112.0, 10028.0, 6060.0, 3607.0, 2248.0, 1460.0, 895.0, 616.0, 385.0, 243.0, 160.0, 106.0, 83.0, 58.0, 37.0, 25.0, 10.0, 8.0, 8.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.458984375, -1.4098358154296875, -1.360687255859375, -1.3115386962890625, -1.26239013671875, -1.2132415771484375, -1.164093017578125, -1.1149444580078125, -1.0657958984375, -1.0166473388671875, -0.967498779296875, -0.9183502197265625, -0.86920166015625, -0.8200531005859375, -0.770904541015625, -0.7217559814453125, -0.672607421875, -0.6234588623046875, -0.574310302734375, -0.5251617431640625, -0.47601318359375, -0.4268646240234375, -0.377716064453125, -0.3285675048828125, -0.2794189453125, -0.2302703857421875, -0.181121826171875, -0.1319732666015625, -0.08282470703125, -0.0336761474609375, 0.015472412109375, 0.0646209716796875, 0.11376953125, 0.1629180908203125, 0.212066650390625, 0.2612152099609375, 0.31036376953125, 0.3595123291015625, 0.408660888671875, 0.4578094482421875, 0.5069580078125, 0.5561065673828125, 0.605255126953125, 0.6544036865234375, 0.70355224609375, 0.7527008056640625, 0.801849365234375, 0.8509979248046875, 0.900146484375, 0.9492950439453125, 0.998443603515625, 1.0475921630859375, 1.09674072265625, 1.1458892822265625, 1.195037841796875, 1.2441864013671875, 1.2933349609375, 1.3424835205078125, 1.391632080078125, 1.4407806396484375, 1.48992919921875, 1.5390777587890625, 1.588226318359375, 1.6373748779296875, 1.6865234375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 3.0, 2.0, 5.0, 4.0, 12.0, 10.0, 17.0, 19.0, 20.0, 15.0, 29.0, 36.0, 30.0, 38.0, 47.0, 44.0, 51.0, 60.0, 58.0, 61.0, 53.0, 65.0, 40.0, 49.0, 33.0, 27.0, 35.0, 21.0, 32.0, 20.0, 13.0, 12.0, 16.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0018796920776367188, -0.0018223077058792114, -0.001764923334121704, -0.0017075389623641968, -0.0016501545906066895, -0.0015927702188491821, -0.0015353858470916748, -0.0014780014753341675, -0.0014206171035766602, -0.0013632327318191528, -0.0013058483600616455, -0.0012484639883041382, -0.0011910796165466309, -0.0011336952447891235, -0.0010763108730316162, -0.0010189265012741089, -0.0009615421295166016, -0.0009041577577590942, -0.0008467733860015869, -0.0007893890142440796, -0.0007320046424865723, -0.0006746202707290649, -0.0006172358989715576, -0.0005598515272140503, -0.000502467155456543, -0.00044508278369903564, -0.0003876984119415283, -0.000330314040184021, -0.00027292966842651367, -0.00021554529666900635, -0.00015816092491149902, -0.0001007765531539917, -4.3392181396484375e-05, 1.399219036102295e-05, 7.137656211853027e-05, 0.0001287609338760376, 0.00018614530563354492, 0.00024352967739105225, 0.00030091404914855957, 0.0003582984209060669, 0.0004156827926635742, 0.00047306716442108154, 0.0005304515361785889, 0.0005878359079360962, 0.0006452202796936035, 0.0007026046514511108, 0.0007599890232086182, 0.0008173733949661255, 0.0008747577667236328, 0.0009321421384811401, 0.0009895265102386475, 0.0010469108819961548, 0.0011042952537536621, 0.0011616796255111694, 0.0012190639972686768, 0.001276448369026184, 0.0013338327407836914, 0.0013912171125411987, 0.001448601484298706, 0.0015059858560562134, 0.0015633702278137207, 0.001620754599571228, 0.0016781389713287354, 0.0017355233430862427, 0.00179290771484375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 6.0, 2.0, 1.0, 3.0, 5.0, 4.0, 20.0, 9.0, 18.0, 17.0, 19.0, 37.0, 58.0, 55.0, 51.0, 77.0, 99.0, 143.0, 236.0, 488.0, 1087.0, 66765.0, 975921.0, 1832.0, 602.0, 317.0, 159.0, 101.0, 96.0, 56.0, 61.0, 49.0, 32.0, 25.0, 30.0, 18.0, 14.0, 7.0, 8.0, 7.0, 8.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.03546142578125, -0.03432464599609375, -0.0331878662109375, -0.03205108642578125, -0.030914306640625, -0.02977752685546875, -0.0286407470703125, -0.02750396728515625, -0.0263671875, -0.02523040771484375, -0.0240936279296875, -0.02295684814453125, -0.021820068359375, -0.02068328857421875, -0.0195465087890625, -0.01840972900390625, -0.01727294921875, -0.01613616943359375, -0.0149993896484375, -0.01386260986328125, -0.012725830078125, -0.01158905029296875, -0.0104522705078125, -0.00931549072265625, -0.0081787109375, -0.00704193115234375, -0.0059051513671875, -0.00476837158203125, -0.003631591796875, -0.00249481201171875, -0.0013580322265625, -0.00022125244140625, 0.00091552734375, 0.00205230712890625, 0.0031890869140625, 0.00432586669921875, 0.005462646484375, 0.00659942626953125, 0.0077362060546875, 0.00887298583984375, 0.010009765625, 0.01114654541015625, 0.0122833251953125, 0.01342010498046875, 0.014556884765625, 0.01569366455078125, 0.0168304443359375, 0.01796722412109375, 0.01910400390625, 0.02024078369140625, 0.0213775634765625, 0.02251434326171875, 0.023651123046875, 0.02478790283203125, 0.0259246826171875, 0.02706146240234375, 0.0281982421875, 0.02933502197265625, 0.0304718017578125, 0.03160858154296875, 0.032745361328125, 0.03388214111328125, 0.0350189208984375, 0.03615570068359375, 0.03729248046875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 54.0, 887.0, 70.0, 5.0], "bins": [-0.017986489459872246, -0.0176940206438303, -0.017401551827788353, -0.017109083011746407, -0.01681661419570446, -0.016524145379662514, -0.016231676563620567, -0.01593920774757862, -0.015646738931536674, -0.015354270115494728, -0.015061801299452782, -0.014769332483410835, -0.014476863667368889, -0.014184394851326942, -0.013891926035284996, -0.01359945721924305, -0.013306989334523678, -0.013014520518481731, -0.012722051702439785, -0.012429582886397839, -0.012137114070355892, -0.011844645254313946, -0.011552176438272, -0.011259708553552628, -0.010967239737510681, -0.010674770921468735, -0.010382302105426788, -0.010089833289384842, -0.009797364473342896, -0.009504895657300949, -0.009212426841259003, -0.008919958025217056, -0.008627488277852535, -0.008335019461810589, -0.008042550645768642, -0.007750081829726696, -0.00745761301368475, -0.007165144197642803, -0.006872675847262144, -0.006580207031220198, -0.006287738680839539, -0.005995269864797592, -0.005702801048755646, -0.005410332232713699, -0.005117863416671753, -0.0048253946006298065, -0.004532926250249147, -0.004240457434207201, -0.003947988618165255, -0.003655519802123308, -0.0033630509860813618, -0.003070582402870059, -0.0027781135868281126, -0.002485644770786166, -0.0021931761875748634, -0.001900707371532917, -0.0016082384390756488, -0.0013157697394490242, -0.0010233009234070778, -0.0007308321655727923, -0.0004383634077385068, -0.00014589459169656038, 0.0001465741079300642, 0.0004390428075566888, 0.0007315116235986352]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 7.0, 6.0, 12.0, 9.0, 11.0, 8.0, 19.0, 31.0, 18.0, 24.0, 27.0, 29.0, 22.0, 40.0, 36.0, 40.0, 45.0, 45.0, 49.0, 36.0, 48.0, 36.0, 33.0, 41.0, 35.0, 30.0, 41.0, 32.0, 29.0, 28.0, 23.0, 14.0, 20.0, 17.0, 13.0, 6.0, 8.0, 7.0, 9.0, 6.0, 5.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000926971435546875, -0.0008967993780970573, -0.0008666273206472397, -0.000836455263197422, -0.0008062832057476044, -0.0007761111482977867, -0.0007459390908479691, -0.0007157670333981514, -0.0006855949759483337, -0.0006554229184985161, -0.0006252508610486984, -0.0005950788035988808, -0.0005649067461490631, -0.0005347346886992455, -0.0005045626312494278, -0.00047439057379961014, -0.0004442185163497925, -0.0004140464588999748, -0.00038387440145015717, -0.0003537023440003395, -0.00032353028655052185, -0.0002933582291007042, -0.00026318617165088654, -0.00023301411420106888, -0.00020284205675125122, -0.00017266999930143356, -0.0001424979418516159, -0.00011232588440179825, -8.215382695198059e-05, -5.198176950216293e-05, -2.1809712052345276e-05, 8.362345397472382e-06, 3.853440284729004e-05, 6.87064602971077e-05, 9.887851774692535e-05, 0.000129050575196743, 0.00015922263264656067, 0.00018939469009637833, 0.00021956674754619598, 0.00024973880499601364, 0.0002799108624458313, 0.00031008291989564896, 0.0003402549773454666, 0.00037042703479528427, 0.00040059909224510193, 0.0004307711496949196, 0.00046094320714473724, 0.0004911152645945549, 0.0005212873220443726, 0.0005514593794941902, 0.0005816314369440079, 0.0006118034943938255, 0.0006419755518436432, 0.0006721476092934608, 0.0007023196667432785, 0.0007324917241930962, 0.0007626637816429138, 0.0007928358390927315, 0.0008230078965425491, 0.0008531799539923668, 0.0008833520114421844, 0.0009135240688920021, 0.0009436961263418198, 0.0009738681837916374, 0.001004040241241455]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 2.0, 3.0, 3.0, 2.0, 10.0, 7.0, 7.0, 4.0, 7.0, 4.0, 12.0, 16.0, 10.0, 20.0, 12.0, 26.0, 19.0, 31.0, 25.0, 20.0, 30.0, 35.0, 26.0, 37.0, 39.0, 45.0, 38.0, 37.0, 39.0, 37.0, 32.0, 34.0, 34.0, 28.0, 25.0, 24.0, 25.0, 24.0, 24.0, 22.0, 25.0, 14.0, 15.0, 8.0, 10.0, 8.0, 13.0, 12.0, 5.0, 9.0, 3.0, 2.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.13671875, -6.9102783203125, -6.683837890625, -6.4573974609375, -6.23095703125, -6.0045166015625, -5.778076171875, -5.5516357421875, -5.3251953125, -5.0987548828125, -4.872314453125, -4.6458740234375, -4.41943359375, -4.1929931640625, -3.966552734375, -3.7401123046875, -3.513671875, -3.2872314453125, -3.060791015625, -2.8343505859375, -2.60791015625, -2.3814697265625, -2.155029296875, -1.9285888671875, -1.7021484375, -1.4757080078125, -1.249267578125, -1.0228271484375, -0.79638671875, -0.5699462890625, -0.343505859375, -0.1170654296875, 0.109375, 0.3358154296875, 0.562255859375, 0.7886962890625, 1.01513671875, 1.2415771484375, 1.468017578125, 1.6944580078125, 1.9208984375, 2.1473388671875, 2.373779296875, 2.6002197265625, 2.82666015625, 3.0531005859375, 3.279541015625, 3.5059814453125, 3.732421875, 3.9588623046875, 4.185302734375, 4.4117431640625, 4.63818359375, 4.8646240234375, 5.091064453125, 5.3175048828125, 5.5439453125, 5.7703857421875, 5.996826171875, 6.2232666015625, 6.44970703125, 6.6761474609375, 6.902587890625, 7.1290283203125, 7.35546875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 13.0, 4.0, 17.0, 17.0, 19.0, 16.0, 23.0, 39.0, 66.0, 110.0, 206.0, 345.0, 658.0, 1420.0, 3083.0, 6724.0, 14680.0, 32918.0, 79324.0, 197523.0, 334297.0, 220455.0, 89283.0, 36809.0, 16214.0, 7574.0, 3422.0, 1520.0, 781.0, 367.0, 220.0, 118.0, 73.0, 47.0, 27.0, 28.0, 21.0, 16.0, 8.0, 12.0, 9.0, 4.0, 5.0, 8.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0], "bins": [-8.3125, -8.0572509765625, -7.802001953125, -7.5467529296875, -7.29150390625, -7.0362548828125, -6.781005859375, -6.5257568359375, -6.2705078125, -6.0152587890625, -5.760009765625, -5.5047607421875, -5.24951171875, -4.9942626953125, -4.739013671875, -4.4837646484375, -4.228515625, -3.9732666015625, -3.718017578125, -3.4627685546875, -3.20751953125, -2.9522705078125, -2.697021484375, -2.4417724609375, -2.1865234375, -1.9312744140625, -1.676025390625, -1.4207763671875, -1.16552734375, -0.9102783203125, -0.655029296875, -0.3997802734375, -0.14453125, 0.1107177734375, 0.365966796875, 0.6212158203125, 0.87646484375, 1.1317138671875, 1.386962890625, 1.6422119140625, 1.8974609375, 2.1527099609375, 2.407958984375, 2.6632080078125, 2.91845703125, 3.1737060546875, 3.428955078125, 3.6842041015625, 3.939453125, 4.1947021484375, 4.449951171875, 4.7052001953125, 4.96044921875, 5.2156982421875, 5.470947265625, 5.7261962890625, 5.9814453125, 6.2366943359375, 6.491943359375, 6.7471923828125, 7.00244140625, 7.2576904296875, 7.512939453125, 7.7681884765625, 8.0234375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 7.0, 9.0, 8.0, 14.0, 16.0, 20.0, 20.0, 37.0, 29.0, 36.0, 40.0, 43.0, 57.0, 60.0, 85.0, 167.0, 1445.0, 373.0, 136.0, 79.0, 54.0, 50.0, 42.0, 38.0, 33.0, 27.0, 24.0, 19.0, 11.0, 16.0, 13.0, 8.0, 9.0, 8.0, 6.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.421875, -25.404541015625, -24.38720703125, -23.369873046875, -22.3525390625, -21.335205078125, -20.31787109375, -19.300537109375, -18.283203125, -17.265869140625, -16.24853515625, -15.231201171875, -14.2138671875, -13.196533203125, -12.17919921875, -11.161865234375, -10.14453125, -9.127197265625, -8.10986328125, -7.092529296875, -6.0751953125, -5.057861328125, -4.04052734375, -3.023193359375, -2.005859375, -0.988525390625, 0.02880859375, 1.046142578125, 2.0634765625, 3.080810546875, 4.09814453125, 5.115478515625, 6.1328125, 7.150146484375, 8.16748046875, 9.184814453125, 10.2021484375, 11.219482421875, 12.23681640625, 13.254150390625, 14.271484375, 15.288818359375, 16.30615234375, 17.323486328125, 18.3408203125, 19.358154296875, 20.37548828125, 21.392822265625, 22.41015625, 23.427490234375, 24.44482421875, 25.462158203125, 26.4794921875, 27.496826171875, 28.51416015625, 29.531494140625, 30.548828125, 31.566162109375, 32.58349609375, 33.600830078125, 34.6181640625, 35.635498046875, 36.65283203125, 37.670166015625, 38.6875]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 5.0, 3.0, 4.0, 11.0, 18.0, 19.0, 33.0, 31.0, 63.0, 69.0, 97.0, 154.0, 291.0, 525.0, 1303.0, 24360.0, 3089093.0, 26905.0, 1278.0, 567.0, 298.0, 181.0, 124.0, 68.0, 52.0, 37.0, 32.0, 16.0, 18.0, 10.0, 6.0, 10.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-73.5625, -71.1513671875, -68.740234375, -66.3291015625, -63.91796875, -61.5068359375, -59.095703125, -56.6845703125, -54.2734375, -51.8623046875, -49.451171875, -47.0400390625, -44.62890625, -42.2177734375, -39.806640625, -37.3955078125, -34.984375, -32.5732421875, -30.162109375, -27.7509765625, -25.33984375, -22.9287109375, -20.517578125, -18.1064453125, -15.6953125, -13.2841796875, -10.873046875, -8.4619140625, -6.05078125, -3.6396484375, -1.228515625, 1.1826171875, 3.59375, 6.0048828125, 8.416015625, 10.8271484375, 13.23828125, 15.6494140625, 18.060546875, 20.4716796875, 22.8828125, 25.2939453125, 27.705078125, 30.1162109375, 32.52734375, 34.9384765625, 37.349609375, 39.7607421875, 42.171875, 44.5830078125, 46.994140625, 49.4052734375, 51.81640625, 54.2275390625, 56.638671875, 59.0498046875, 61.4609375, 63.8720703125, 66.283203125, 68.6943359375, 71.10546875, 73.5166015625, 75.927734375, 78.3388671875, 80.75]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 110.0, 344.0, 391.0, 138.0, 21.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-194.06666564941406, -190.47366333007812, -186.8806610107422, -183.28765869140625, -179.6946563720703, -176.10165405273438, -172.50865173339844, -168.9156494140625, -165.3226318359375, -161.72962951660156, -158.13662719726562, -154.5436248779297, -150.95062255859375, -147.3576202392578, -143.76461791992188, -140.17160034179688, -136.57861328125, -132.98561096191406, -129.39260864257812, -125.79960632324219, -122.20660400390625, -118.61360168457031, -115.02059173583984, -111.4275894165039, -107.83458709716797, -104.24158477783203, -100.6485824584961, -97.05558013916016, -93.46257019042969, -89.86956787109375, -86.27656555175781, -82.68356323242188, -79.09056091308594, -75.49755859375, -71.90455627441406, -68.31155395507812, -64.71855163574219, -61.125545501708984, -57.53253936767578, -53.939537048339844, -50.34653091430664, -46.7535285949707, -43.1605224609375, -39.56752014160156, -35.974517822265625, -32.38151550292969, -28.788511276245117, -25.195507049560547, -21.60250473022461, -18.009502410888672, -14.416498184204102, -10.823494911193848, -7.230491638183594, -3.6374893188476562, -0.04448509216308594, 3.5485191345214844, 7.141521453857422, 10.734524726867676, 14.32752799987793, 17.9205322265625, 21.513534545898438, 25.106536865234375, 28.699541091918945, 32.292545318603516, 35.88554763793945]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 8.0, 7.0, 10.0, 14.0, 9.0, 11.0, 14.0, 25.0, 23.0, 35.0, 36.0, 29.0, 38.0, 19.0, 44.0, 62.0, 42.0, 35.0, 41.0, 49.0, 43.0, 46.0, 41.0, 44.0, 37.0, 20.0, 22.0, 32.0, 27.0, 25.0, 15.0, 20.0, 16.0, 12.0, 11.0, 11.0, 5.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.61741638183594, -64.4090576171875, -62.2006950378418, -59.992332458496094, -57.783973693847656, -55.57561492919922, -53.367252349853516, -51.15888977050781, -48.950531005859375, -46.74217224121094, -44.533809661865234, -42.32544708251953, -40.117088317871094, -37.908729553222656, -35.70036697387695, -33.49200439453125, -31.283645629882812, -29.075284957885742, -26.866924285888672, -24.6585636138916, -22.45020294189453, -20.24184226989746, -18.03348159790039, -15.82512092590332, -13.61676025390625, -11.40839958190918, -9.20003890991211, -6.991678237915039, -4.783317565917969, -2.5749568939208984, -0.3665962219238281, 1.8417644500732422, 4.0501251220703125, 6.258485794067383, 8.466846466064453, 10.675207138061523, 12.883567810058594, 15.091928482055664, 17.300289154052734, 19.508649826049805, 21.717010498046875, 23.925371170043945, 26.133731842041016, 28.342092514038086, 30.550453186035156, 32.758811950683594, 34.9671745300293, 37.175537109375, 39.38389587402344, 41.592254638671875, 43.80061721801758, 46.00897979736328, 48.21733856201172, 50.425697326660156, 52.63405990600586, 54.84242248535156, 57.05078125, 59.25914001464844, 61.46750259399414, 63.675865173339844, 65.88422393798828, 68.09258270263672, 70.30094909667969, 72.50930786132812, 74.71766662597656]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 4.0, 4.0, 2.0, 10.0, 5.0, 5.0, 12.0, 9.0, 16.0, 16.0, 19.0, 15.0, 26.0, 20.0, 19.0, 24.0, 29.0, 31.0, 35.0, 35.0, 48.0, 48.0, 40.0, 37.0, 36.0, 45.0, 39.0, 37.0, 36.0, 30.0, 30.0, 16.0, 31.0, 25.0, 24.0, 23.0, 21.0, 15.0, 16.0, 10.0, 10.0, 9.0, 9.0, 7.0, 9.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-9.2265625, -8.96807861328125, -8.7095947265625, -8.45111083984375, -8.192626953125, -7.93414306640625, -7.6756591796875, -7.41717529296875, -7.15869140625, -6.90020751953125, -6.6417236328125, -6.38323974609375, -6.124755859375, -5.86627197265625, -5.6077880859375, -5.34930419921875, -5.0908203125, -4.83233642578125, -4.5738525390625, -4.31536865234375, -4.056884765625, -3.79840087890625, -3.5399169921875, -3.28143310546875, -3.02294921875, -2.76446533203125, -2.5059814453125, -2.24749755859375, -1.989013671875, -1.73052978515625, -1.4720458984375, -1.21356201171875, -0.955078125, -0.69659423828125, -0.4381103515625, -0.17962646484375, 0.078857421875, 0.33734130859375, 0.5958251953125, 0.85430908203125, 1.11279296875, 1.37127685546875, 1.6297607421875, 1.88824462890625, 2.146728515625, 2.40521240234375, 2.6636962890625, 2.92218017578125, 3.1806640625, 3.43914794921875, 3.6976318359375, 3.95611572265625, 4.214599609375, 4.47308349609375, 4.7315673828125, 4.99005126953125, 5.24853515625, 5.50701904296875, 5.7655029296875, 6.02398681640625, 6.282470703125, 6.54095458984375, 6.7994384765625, 7.05792236328125, 7.31640625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 2.0, 2.0, 1.0, 2.0, 4.0, 7.0, 11.0, 9.0, 15.0, 16.0, 12.0, 17.0, 20.0, 21.0, 31.0, 29.0, 51.0, 47.0, 73.0, 86.0, 163.0, 286.0, 1053.0, 10018.0, 358288.0, 3151191.0, 652445.0, 17970.0, 1399.0, 349.0, 156.0, 111.0, 77.0, 47.0, 51.0, 44.0, 24.0, 23.0, 30.0, 17.0, 12.0, 21.0, 9.0, 8.0, 11.0, 6.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-28.53125, -27.7294921875, -26.927734375, -26.1259765625, -25.32421875, -24.5224609375, -23.720703125, -22.9189453125, -22.1171875, -21.3154296875, -20.513671875, -19.7119140625, -18.91015625, -18.1083984375, -17.306640625, -16.5048828125, -15.703125, -14.9013671875, -14.099609375, -13.2978515625, -12.49609375, -11.6943359375, -10.892578125, -10.0908203125, -9.2890625, -8.4873046875, -7.685546875, -6.8837890625, -6.08203125, -5.2802734375, -4.478515625, -3.6767578125, -2.875, -2.0732421875, -1.271484375, -0.4697265625, 0.33203125, 1.1337890625, 1.935546875, 2.7373046875, 3.5390625, 4.3408203125, 5.142578125, 5.9443359375, 6.74609375, 7.5478515625, 8.349609375, 9.1513671875, 9.953125, 10.7548828125, 11.556640625, 12.3583984375, 13.16015625, 13.9619140625, 14.763671875, 15.5654296875, 16.3671875, 17.1689453125, 17.970703125, 18.7724609375, 19.57421875, 20.3759765625, 21.177734375, 21.9794921875, 22.78125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 9.0, 4.0, 5.0, 14.0, 19.0, 18.0, 35.0, 38.0, 53.0, 55.0, 79.0, 131.0, 186.0, 236.0, 304.0, 345.0, 421.0, 435.0, 405.0, 323.0, 256.0, 169.0, 129.0, 103.0, 77.0, 52.0, 41.0, 36.0, 30.0, 21.0, 13.0, 9.0, 8.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.2421875, -14.7841796875, -14.326171875, -13.8681640625, -13.41015625, -12.9521484375, -12.494140625, -12.0361328125, -11.578125, -11.1201171875, -10.662109375, -10.2041015625, -9.74609375, -9.2880859375, -8.830078125, -8.3720703125, -7.9140625, -7.4560546875, -6.998046875, -6.5400390625, -6.08203125, -5.6240234375, -5.166015625, -4.7080078125, -4.25, -3.7919921875, -3.333984375, -2.8759765625, -2.41796875, -1.9599609375, -1.501953125, -1.0439453125, -0.5859375, -0.1279296875, 0.330078125, 0.7880859375, 1.24609375, 1.7041015625, 2.162109375, 2.6201171875, 3.078125, 3.5361328125, 3.994140625, 4.4521484375, 4.91015625, 5.3681640625, 5.826171875, 6.2841796875, 6.7421875, 7.2001953125, 7.658203125, 8.1162109375, 8.57421875, 9.0322265625, 9.490234375, 9.9482421875, 10.40625, 10.8642578125, 11.322265625, 11.7802734375, 12.23828125, 12.6962890625, 13.154296875, 13.6123046875, 14.0703125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 14.0, 5.0, 19.0, 27.0, 41.0, 48.0, 65.0, 82.0, 102.0, 139.0, 199.0, 277.0, 452.0, 1018.0, 8189.0, 606152.0, 3518667.0, 54515.0, 2206.0, 726.0, 406.0, 252.0, 202.0, 124.0, 86.0, 71.0, 52.0, 38.0, 32.0, 29.0, 11.0, 12.0, 12.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.28125, -51.6787109375, -50.076171875, -48.4736328125, -46.87109375, -45.2685546875, -43.666015625, -42.0634765625, -40.4609375, -38.8583984375, -37.255859375, -35.6533203125, -34.05078125, -32.4482421875, -30.845703125, -29.2431640625, -27.640625, -26.0380859375, -24.435546875, -22.8330078125, -21.23046875, -19.6279296875, -18.025390625, -16.4228515625, -14.8203125, -13.2177734375, -11.615234375, -10.0126953125, -8.41015625, -6.8076171875, -5.205078125, -3.6025390625, -2.0, -0.3974609375, 1.205078125, 2.8076171875, 4.41015625, 6.0126953125, 7.615234375, 9.2177734375, 10.8203125, 12.4228515625, 14.025390625, 15.6279296875, 17.23046875, 18.8330078125, 20.435546875, 22.0380859375, 23.640625, 25.2431640625, 26.845703125, 28.4482421875, 30.05078125, 31.6533203125, 33.255859375, 34.8583984375, 36.4609375, 38.0634765625, 39.666015625, 41.2685546875, 42.87109375, 44.4736328125, 46.076171875, 47.6787109375, 49.28125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 78.0, 684.0, 247.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-142.2712860107422, -128.9454345703125, -115.61957550048828, -102.2937240600586, -88.96786499023438, -75.64201354980469, -62.316162109375, -48.99030303955078, -35.664451599121094, -22.33859634399414, -9.01274299621582, 4.3131103515625, 17.638965606689453, 30.964820861816406, 44.290672302246094, 57.61653137207031, 70.9423828125, 84.26823425292969, 97.5940933227539, 110.9199447631836, 124.24580383300781, 137.5716552734375, 150.8975067138672, 164.22335815429688, 177.54922485351562, 190.8750762939453, 204.200927734375, 217.52679443359375, 230.85264587402344, 244.17849731445312, 257.50433349609375, 270.8302001953125, 284.1560363769531, 297.4819030761719, 310.8077392578125, 324.13360595703125, 337.4594421386719, 350.7853088378906, 364.11114501953125, 377.43701171875, 390.76287841796875, 404.0887451171875, 417.4145812988281, 430.7404479980469, 444.0662841796875, 457.39215087890625, 470.718017578125, 484.0438537597656, 497.36968994140625, 510.695556640625, 524.0214233398438, 537.3472290039062, 550.673095703125, 563.9989624023438, 577.3248291015625, 590.6506958007812, 603.9765625, 617.3024291992188, 630.6282958984375, 643.9541015625, 657.2799682617188, 670.6058349609375, 683.9317016601562, 697.257568359375, 710.5833740234375]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 9.0, 9.0, 11.0, 18.0, 8.0, 13.0, 23.0, 19.0, 15.0, 39.0, 34.0, 31.0, 40.0, 33.0, 28.0, 42.0, 36.0, 42.0, 43.0, 47.0, 38.0, 39.0, 35.0, 39.0, 28.0, 31.0, 43.0, 22.0, 34.0, 17.0, 20.0, 21.0, 10.0, 19.0, 9.0, 15.0, 8.0, 5.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 5.0, 1.0], "bins": [-59.062870025634766, -57.444156646728516, -55.82544708251953, -54.20673370361328, -52.5880241394043, -50.96931076049805, -49.35060119628906, -47.73188781738281, -46.11317443847656, -44.49446105957031, -42.87575149536133, -41.25703811645508, -39.638328552246094, -38.019615173339844, -36.400901794433594, -34.78219223022461, -33.163482666015625, -31.544771194458008, -29.92605972290039, -28.30734634399414, -26.688636779785156, -25.069923400878906, -23.45121192932129, -21.832500457763672, -20.213788986206055, -18.595077514648438, -16.97636604309082, -15.357653617858887, -13.73894214630127, -12.120230674743652, -10.501518249511719, -8.882806777954102, -7.264091491699219, -5.645380020141602, -4.026668071746826, -2.407956123352051, -0.7892446517944336, 0.8294668197631836, 2.448179244995117, 4.066890716552734, 5.685602188110352, 7.304313659667969, 8.923025131225586, 10.54173755645752, 12.160449028015137, 13.779160499572754, 15.397872924804688, 17.016584396362305, 18.635295867919922, 20.25400733947754, 21.872718811035156, 23.491432189941406, 25.11014175415039, 26.72885513305664, 28.347566604614258, 29.966278076171875, 31.584989547729492, 33.20370101928711, 34.82241439819336, 36.441123962402344, 38.059837341308594, 39.67854690551758, 41.29726028442383, 42.91596984863281, 44.53468322753906]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 6.0, 8.0, 8.0, 4.0, 6.0, 10.0, 11.0, 11.0, 18.0, 12.0, 30.0, 21.0, 23.0, 33.0, 22.0, 25.0, 30.0, 32.0, 28.0, 49.0, 40.0, 31.0, 32.0, 44.0, 50.0, 35.0, 48.0, 25.0, 35.0, 24.0, 32.0, 34.0, 17.0, 20.0, 16.0, 21.0, 14.0, 20.0, 13.0, 14.0, 15.0, 7.0, 9.0, 4.0, 2.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.77734375, -7.52630615234375, -7.2752685546875, -7.02423095703125, -6.773193359375, -6.52215576171875, -6.2711181640625, -6.02008056640625, -5.76904296875, -5.51800537109375, -5.2669677734375, -5.01593017578125, -4.764892578125, -4.51385498046875, -4.2628173828125, -4.01177978515625, -3.7607421875, -3.50970458984375, -3.2586669921875, -3.00762939453125, -2.756591796875, -2.50555419921875, -2.2545166015625, -2.00347900390625, -1.75244140625, -1.50140380859375, -1.2503662109375, -0.99932861328125, -0.748291015625, -0.49725341796875, -0.2462158203125, 0.00482177734375, 0.255859375, 0.50689697265625, 0.7579345703125, 1.00897216796875, 1.260009765625, 1.51104736328125, 1.7620849609375, 2.01312255859375, 2.26416015625, 2.51519775390625, 2.7662353515625, 3.01727294921875, 3.268310546875, 3.51934814453125, 3.7703857421875, 4.02142333984375, 4.2724609375, 4.52349853515625, 4.7745361328125, 5.02557373046875, 5.276611328125, 5.52764892578125, 5.7786865234375, 6.02972412109375, 6.28076171875, 6.53179931640625, 6.7828369140625, 7.03387451171875, 7.284912109375, 7.53594970703125, 7.7869873046875, 8.03802490234375, 8.2890625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 10.0, 19.0, 25.0, 45.0, 39.0, 91.0, 123.0, 186.0, 251.0, 363.0, 600.0, 940.0, 1298.0, 1957.0, 2762.0, 4192.0, 6038.0, 8907.0, 12507.0, 18892.0, 27768.0, 42301.0, 66879.0, 115665.0, 212271.0, 212599.0, 115895.0, 66322.0, 42488.0, 27713.0, 18802.0, 12877.0, 8685.0, 6058.0, 4222.0, 2825.0, 1939.0, 1322.0, 872.0, 598.0, 389.0, 285.0, 183.0, 114.0, 75.0, 55.0, 32.0, 30.0, 14.0, 13.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.314453125, -1.27337646484375, -1.2322998046875, -1.19122314453125, -1.150146484375, -1.10906982421875, -1.0679931640625, -1.02691650390625, -0.98583984375, -0.94476318359375, -0.9036865234375, -0.86260986328125, -0.821533203125, -0.78045654296875, -0.7393798828125, -0.69830322265625, -0.6572265625, -0.61614990234375, -0.5750732421875, -0.53399658203125, -0.492919921875, -0.45184326171875, -0.4107666015625, -0.36968994140625, -0.32861328125, -0.28753662109375, -0.2464599609375, -0.20538330078125, -0.164306640625, -0.12322998046875, -0.0821533203125, -0.04107666015625, 0.0, 0.04107666015625, 0.0821533203125, 0.12322998046875, 0.164306640625, 0.20538330078125, 0.2464599609375, 0.28753662109375, 0.32861328125, 0.36968994140625, 0.4107666015625, 0.45184326171875, 0.492919921875, 0.53399658203125, 0.5750732421875, 0.61614990234375, 0.6572265625, 0.69830322265625, 0.7393798828125, 0.78045654296875, 0.821533203125, 0.86260986328125, 0.9036865234375, 0.94476318359375, 0.98583984375, 1.02691650390625, 1.0679931640625, 1.10906982421875, 1.150146484375, 1.19122314453125, 1.2322998046875, 1.27337646484375, 1.314453125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 1.0, 10.0, 4.0, 16.0, 11.0, 13.0, 24.0, 16.0, 31.0, 25.0, 34.0, 32.0, 48.0, 34.0, 38.0, 45.0, 41.0, 39.0, 1066.0, 57.0, 42.0, 38.0, 42.0, 38.0, 37.0, 32.0, 23.0, 29.0, 20.0, 20.0, 22.0, 10.0, 12.0, 18.0, 6.0, 10.0, 4.0, 7.0, 7.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.1640625, -5.98046875, -5.796875, -5.61328125, -5.4296875, -5.24609375, -5.0625, -4.87890625, -4.6953125, -4.51171875, -4.328125, -4.14453125, -3.9609375, -3.77734375, -3.59375, -3.41015625, -3.2265625, -3.04296875, -2.859375, -2.67578125, -2.4921875, -2.30859375, -2.125, -1.94140625, -1.7578125, -1.57421875, -1.390625, -1.20703125, -1.0234375, -0.83984375, -0.65625, -0.47265625, -0.2890625, -0.10546875, 0.078125, 0.26171875, 0.4453125, 0.62890625, 0.8125, 0.99609375, 1.1796875, 1.36328125, 1.546875, 1.73046875, 1.9140625, 2.09765625, 2.28125, 2.46484375, 2.6484375, 2.83203125, 3.015625, 3.19921875, 3.3828125, 3.56640625, 3.75, 3.93359375, 4.1171875, 4.30078125, 4.484375, 4.66796875, 4.8515625, 5.03515625, 5.21875, 5.40234375, 5.5859375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 10.0, 8.0, 4.0, 16.0, 16.0, 21.0, 35.0, 54.0, 71.0, 87.0, 159.0, 249.0, 325.0, 459.0, 667.0, 1023.0, 1590.0, 2462.0, 3865.0, 5917.0, 9648.0, 15743.0, 25928.0, 43709.0, 79084.0, 157370.0, 1351409.0, 183192.0, 90333.0, 48770.0, 28285.0, 17099.0, 10538.0, 6674.0, 4234.0, 2705.0, 1762.0, 1158.0, 785.0, 532.0, 345.0, 251.0, 168.0, 112.0, 79.0, 51.0, 40.0, 35.0, 21.0, 19.0, 7.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.546875, -1.4963226318359375, -1.445770263671875, -1.3952178955078125, -1.34466552734375, -1.2941131591796875, -1.243560791015625, -1.1930084228515625, -1.1424560546875, -1.0919036865234375, -1.041351318359375, -0.9907989501953125, -0.94024658203125, -0.8896942138671875, -0.839141845703125, -0.7885894775390625, -0.738037109375, -0.6874847412109375, -0.636932373046875, -0.5863800048828125, -0.53582763671875, -0.4852752685546875, -0.434722900390625, -0.3841705322265625, -0.3336181640625, -0.2830657958984375, -0.232513427734375, -0.1819610595703125, -0.13140869140625, -0.0808563232421875, -0.030303955078125, 0.0202484130859375, 0.07080078125, 0.1213531494140625, 0.171905517578125, 0.2224578857421875, 0.27301025390625, 0.3235626220703125, 0.374114990234375, 0.4246673583984375, 0.4752197265625, 0.5257720947265625, 0.576324462890625, 0.6268768310546875, 0.67742919921875, 0.7279815673828125, 0.778533935546875, 0.8290863037109375, 0.879638671875, 0.9301910400390625, 0.980743408203125, 1.0312957763671875, 1.08184814453125, 1.1324005126953125, 1.182952880859375, 1.2335052490234375, 1.2840576171875, 1.3346099853515625, 1.385162353515625, 1.4357147216796875, 1.48626708984375, 1.5368194580078125, 1.587371826171875, 1.6379241943359375, 1.6884765625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 9.0, 12.0, 8.0, 8.0, 15.0, 25.0, 24.0, 44.0, 51.0, 57.0, 63.0, 88.0, 99.0, 102.0, 89.0, 61.0, 52.0, 44.0, 41.0, 28.0, 19.0, 12.0, 11.0, 13.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0025196075439453125, -0.0024425387382507324, -0.0023654699325561523, -0.0022884011268615723, -0.002211332321166992, -0.002134263515472412, -0.002057194709777832, -0.001980125904083252, -0.0019030570983886719, -0.0018259882926940918, -0.0017489194869995117, -0.0016718506813049316, -0.0015947818756103516, -0.0015177130699157715, -0.0014406442642211914, -0.0013635754585266113, -0.0012865066528320312, -0.0012094378471374512, -0.001132369041442871, -0.001055300235748291, -0.000978231430053711, -0.0009011626243591309, -0.0008240938186645508, -0.0007470250129699707, -0.0006699562072753906, -0.0005928874015808105, -0.0005158185958862305, -0.0004387497901916504, -0.0003616809844970703, -0.00028461217880249023, -0.00020754337310791016, -0.00013047456741333008, -5.340576171875e-05, 2.3663043975830078e-05, 0.00010073184967041016, 0.00017780065536499023, 0.0002548694610595703, 0.0003319382667541504, 0.00040900707244873047, 0.00048607587814331055, 0.0005631446838378906, 0.0006402134895324707, 0.0007172822952270508, 0.0007943511009216309, 0.0008714199066162109, 0.000948488712310791, 0.001025557518005371, 0.0011026263236999512, 0.0011796951293945312, 0.0012567639350891113, 0.0013338327407836914, 0.0014109015464782715, 0.0014879703521728516, 0.0015650391578674316, 0.0016421079635620117, 0.0017191767692565918, 0.0017962455749511719, 0.001873314380645752, 0.001950383186340332, 0.002027451992034912, 0.002104520797729492, 0.0021815896034240723, 0.0022586584091186523, 0.0023357272148132324, 0.0024127960205078125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 11.0, 13.0, 18.0, 20.0, 18.0, 44.0, 54.0, 82.0, 101.0, 189.0, 307.0, 757.0, 15221.0, 1029119.0, 1491.0, 444.0, 236.0, 122.0, 89.0, 63.0, 36.0, 28.0, 27.0, 17.0, 16.0, 5.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049407958984375, -0.047827720642089844, -0.04624748229980469, -0.04466724395751953, -0.043087005615234375, -0.04150676727294922, -0.03992652893066406, -0.038346290588378906, -0.03676605224609375, -0.035185813903808594, -0.03360557556152344, -0.03202533721923828, -0.030445098876953125, -0.02886486053466797, -0.027284622192382812, -0.025704383850097656, -0.0241241455078125, -0.022543907165527344, -0.020963668823242188, -0.01938343048095703, -0.017803192138671875, -0.01622295379638672, -0.014642715454101562, -0.013062477111816406, -0.01148223876953125, -0.009902000427246094, -0.008321762084960938, -0.006741523742675781, -0.005161285400390625, -0.0035810470581054688, -0.0020008087158203125, -0.00042057037353515625, 0.00115966796875, 0.0027399063110351562, 0.0043201446533203125, 0.005900382995605469, 0.007480621337890625, 0.009060859680175781, 0.010641098022460938, 0.012221336364746094, 0.01380157470703125, 0.015381813049316406, 0.016962051391601562, 0.01854228973388672, 0.020122528076171875, 0.02170276641845703, 0.023283004760742188, 0.024863243103027344, 0.0264434814453125, 0.028023719787597656, 0.029603958129882812, 0.03118419647216797, 0.032764434814453125, 0.03434467315673828, 0.03592491149902344, 0.037505149841308594, 0.03908538818359375, 0.040665626525878906, 0.04224586486816406, 0.04382610321044922, 0.045406341552734375, 0.04698657989501953, 0.04856681823730469, 0.050147056579589844, 0.051727294921875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 12.0, 33.0, 111.0, 200.0, 259.0, 222.0, 115.0, 47.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002450825646519661, -0.002383795566856861, -0.002316765720024705, -0.002249735640361905, -0.0021827055606991053, -0.002115675713866949, -0.0020486456342041492, -0.0019816155545413494, -0.0019145855912938714, -0.0018475556280463934, -0.0017805255483835936, -0.0017134955851361156, -0.0016464656218886375, -0.0015794355422258377, -0.0015124055789783597, -0.0014453756157308817, -0.0013783455360680819, -0.0013113155728206038, -0.001244285493157804, -0.001177255529910326, -0.0011102254502475262, -0.0010431954870000482, -0.0009761655237525702, -0.0009091355022974312, -0.0008421054808422923, -0.0007750754593871534, -0.0007080454379320145, -0.0006410154746845365, -0.0005739854532293975, -0.0005069554317742586, -0.00043992543942295015, -0.0003728954470716417, -0.0003058655420318246, -0.0002388355351286009, -0.0001718055282253772, -0.00010477552132215351, -3.7745514418929815e-05, 2.9284507036209106e-05, 9.631449938751757e-05, 0.00016334449173882604, 0.00023037451319396496, 0.0002974045346491039, 0.00036443452700041234, 0.0004314645193517208, 0.0004984945408068597, 0.0005655245622619987, 0.0006325545255094767, 0.0006995845469646156, 0.0007666145684197545, 0.0008336445898748934, 0.0009006746113300323, 0.0009677045745775104, 0.0010347345378249884, 0.0011017646174877882, 0.0011687945807352662, 0.0012358245439827442, 0.001302854623645544, 0.001369884586893022, 0.001436914666555822, 0.0015039446298033, 0.0015709747094660997, 0.0016380046727135777, 0.0017050346359610558, 0.0017720647156238556, 0.0018390946788713336]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 15.0, 18.0, 12.0, 22.0, 17.0, 16.0, 28.0, 36.0, 20.0, 34.0, 22.0, 31.0, 41.0, 40.0, 51.0, 32.0, 45.0, 41.0, 41.0, 32.0, 48.0, 39.0, 37.0, 40.0, 33.0, 33.0, 27.0, 31.0, 17.0, 15.0, 12.0, 14.0, 10.0, 7.0, 10.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0009078383445739746, -0.0008779633790254593, -0.000848088413476944, -0.0008182134479284286, -0.0007883384823799133, -0.000758463516831398, -0.0007285885512828827, -0.0006987135857343674, -0.000668838620185852, -0.0006389636546373367, -0.0006090886890888214, -0.0005792137235403061, -0.0005493387579917908, -0.0005194637924432755, -0.0004895888268947601, -0.0004597138613462448, -0.0004298388957977295, -0.00039996393024921417, -0.00037008896470069885, -0.00034021399915218353, -0.0003103390336036682, -0.0002804640680551529, -0.0002505891025066376, -0.00022071413695812225, -0.00019083917140960693, -0.00016096420586109161, -0.0001310892403125763, -0.00010121427476406097, -7.133930921554565e-05, -4.1464343667030334e-05, -1.1589378118515015e-05, 1.8285587430000305e-05, 4.8160552978515625e-05, 7.803551852703094e-05, 0.00010791048407554626, 0.00013778544962406158, 0.0001676604151725769, 0.00019753538072109222, 0.00022741034626960754, 0.00025728531181812286, 0.0002871602773666382, 0.0003170352429151535, 0.0003469102084636688, 0.00037678517401218414, 0.00040666013956069946, 0.0004365351051092148, 0.0004664100706577301, 0.0004962850362062454, 0.0005261600017547607, 0.0005560349673032761, 0.0005859099328517914, 0.0006157848984003067, 0.000645659863948822, 0.0006755348294973373, 0.0007054097950458527, 0.000735284760594368, 0.0007651597261428833, 0.0007950346916913986, 0.0008249096572399139, 0.0008547846227884293, 0.0008846595883369446, 0.0009145345538854599, 0.0009444095194339752, 0.0009742844849824905, 0.0010041594505310059]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 0.0, 6.0, 8.0, 8.0, 4.0, 6.0, 10.0, 11.0, 11.0, 18.0, 12.0, 30.0, 21.0, 23.0, 33.0, 22.0, 25.0, 30.0, 32.0, 28.0, 49.0, 40.0, 31.0, 32.0, 43.0, 51.0, 35.0, 48.0, 25.0, 35.0, 24.0, 32.0, 34.0, 17.0, 20.0, 16.0, 21.0, 14.0, 20.0, 13.0, 14.0, 15.0, 7.0, 9.0, 4.0, 2.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.77734375, -7.52630615234375, -7.2752685546875, -7.02423095703125, -6.773193359375, -6.52215576171875, -6.2711181640625, -6.02008056640625, -5.76904296875, -5.51800537109375, -5.2669677734375, -5.01593017578125, -4.764892578125, -4.51385498046875, -4.2628173828125, -4.01177978515625, -3.7607421875, -3.50970458984375, -3.2586669921875, -3.00762939453125, -2.756591796875, -2.50555419921875, -2.2545166015625, -2.00347900390625, -1.75244140625, -1.50140380859375, -1.2503662109375, -0.99932861328125, -0.748291015625, -0.49725341796875, -0.2462158203125, 0.00482177734375, 0.255859375, 0.50689697265625, 0.7579345703125, 1.00897216796875, 1.260009765625, 1.51104736328125, 1.7620849609375, 2.01312255859375, 2.26416015625, 2.51519775390625, 2.7662353515625, 3.01727294921875, 3.268310546875, 3.51934814453125, 3.7703857421875, 4.02142333984375, 4.2724609375, 4.52349853515625, 4.7745361328125, 5.02557373046875, 5.276611328125, 5.52764892578125, 5.7786865234375, 6.02972412109375, 6.28076171875, 6.53179931640625, 6.7828369140625, 7.03387451171875, 7.284912109375, 7.53594970703125, 7.7869873046875, 8.03802490234375, 8.2890625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 9.0, 5.0, 10.0, 11.0, 19.0, 20.0, 19.0, 36.0, 42.0, 54.0, 76.0, 109.0, 146.0, 176.0, 266.0, 440.0, 917.0, 2997.0, 11332.0, 45516.0, 233363.0, 566704.0, 144126.0, 30442.0, 7561.0, 2073.0, 766.0, 386.0, 246.0, 158.0, 130.0, 94.0, 67.0, 56.0, 37.0, 34.0, 32.0, 21.0, 18.0, 11.0, 3.0, 6.0, 7.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.7730712890625, -13.303955078125, -12.8348388671875, -12.36572265625, -11.8966064453125, -11.427490234375, -10.9583740234375, -10.4892578125, -10.0201416015625, -9.551025390625, -9.0819091796875, -8.61279296875, -8.1436767578125, -7.674560546875, -7.2054443359375, -6.736328125, -6.2672119140625, -5.798095703125, -5.3289794921875, -4.85986328125, -4.3907470703125, -3.921630859375, -3.4525146484375, -2.9833984375, -2.5142822265625, -2.045166015625, -1.5760498046875, -1.10693359375, -0.6378173828125, -0.168701171875, 0.3004150390625, 0.76953125, 1.2386474609375, 1.707763671875, 2.1768798828125, 2.64599609375, 3.1151123046875, 3.584228515625, 4.0533447265625, 4.5224609375, 4.9915771484375, 5.460693359375, 5.9298095703125, 6.39892578125, 6.8680419921875, 7.337158203125, 7.8062744140625, 8.275390625, 8.7445068359375, 9.213623046875, 9.6827392578125, 10.15185546875, 10.6209716796875, 11.090087890625, 11.5592041015625, 12.0283203125, 12.4974365234375, 12.966552734375, 13.4356689453125, 13.90478515625, 14.3739013671875, 14.843017578125, 15.3121337890625, 15.78125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 2.0, 8.0, 7.0, 7.0, 9.0, 12.0, 11.0, 11.0, 14.0, 15.0, 15.0, 15.0, 21.0, 25.0, 21.0, 36.0, 46.0, 48.0, 43.0, 61.0, 69.0, 173.0, 1469.0, 307.0, 121.0, 75.0, 60.0, 43.0, 36.0, 33.0, 29.0, 30.0, 24.0, 25.0, 20.0, 22.0, 19.0, 11.0, 14.0, 8.0, 11.0, 8.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.0, -25.15576171875, -24.3115234375, -23.46728515625, -22.623046875, -21.77880859375, -20.9345703125, -20.09033203125, -19.24609375, -18.40185546875, -17.5576171875, -16.71337890625, -15.869140625, -15.02490234375, -14.1806640625, -13.33642578125, -12.4921875, -11.64794921875, -10.8037109375, -9.95947265625, -9.115234375, -8.27099609375, -7.4267578125, -6.58251953125, -5.73828125, -4.89404296875, -4.0498046875, -3.20556640625, -2.361328125, -1.51708984375, -0.6728515625, 0.17138671875, 1.015625, 1.85986328125, 2.7041015625, 3.54833984375, 4.392578125, 5.23681640625, 6.0810546875, 6.92529296875, 7.76953125, 8.61376953125, 9.4580078125, 10.30224609375, 11.146484375, 11.99072265625, 12.8349609375, 13.67919921875, 14.5234375, 15.36767578125, 16.2119140625, 17.05615234375, 17.900390625, 18.74462890625, 19.5888671875, 20.43310546875, 21.27734375, 22.12158203125, 22.9658203125, 23.81005859375, 24.654296875, 25.49853515625, 26.3427734375, 27.18701171875, 28.03125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 4.0, 4.0, 3.0, 8.0, 13.0, 19.0, 22.0, 22.0, 32.0, 31.0, 41.0, 46.0, 72.0, 75.0, 134.0, 178.0, 291.0, 536.0, 1515.0, 17326.0, 3011992.0, 108846.0, 2570.0, 747.0, 368.0, 235.0, 121.0, 94.0, 72.0, 49.0, 42.0, 30.0, 19.0, 28.0, 27.0, 20.0, 6.0, 9.0, 16.0, 10.0, 8.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.125, -61.0673828125, -59.009765625, -56.9521484375, -54.89453125, -52.8369140625, -50.779296875, -48.7216796875, -46.6640625, -44.6064453125, -42.548828125, -40.4912109375, -38.43359375, -36.3759765625, -34.318359375, -32.2607421875, -30.203125, -28.1455078125, -26.087890625, -24.0302734375, -21.97265625, -19.9150390625, -17.857421875, -15.7998046875, -13.7421875, -11.6845703125, -9.626953125, -7.5693359375, -5.51171875, -3.4541015625, -1.396484375, 0.6611328125, 2.71875, 4.7763671875, 6.833984375, 8.8916015625, 10.94921875, 13.0068359375, 15.064453125, 17.1220703125, 19.1796875, 21.2373046875, 23.294921875, 25.3525390625, 27.41015625, 29.4677734375, 31.525390625, 33.5830078125, 35.640625, 37.6982421875, 39.755859375, 41.8134765625, 43.87109375, 45.9287109375, 47.986328125, 50.0439453125, 52.1015625, 54.1591796875, 56.216796875, 58.2744140625, 60.33203125, 62.3896484375, 64.447265625, 66.5048828125, 68.5625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 24.0, 393.0, 549.0, 50.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.83131408691406, -229.30050659179688, -222.7696990966797, -216.2388916015625, -209.70806884765625, -203.17726135253906, -196.64645385742188, -190.1156463623047, -183.5848388671875, -177.0540313720703, -170.52322387695312, -163.99240112304688, -157.4615936279297, -150.9307861328125, -144.3999786376953, -137.86917114257812, -131.33834838867188, -124.80754089355469, -118.27672576904297, -111.74591827392578, -105.21510314941406, -98.68429565429688, -92.15348815917969, -85.6226806640625, -79.09186553955078, -72.5610580444336, -66.03024291992188, -59.49943542480469, -52.968624114990234, -46.43781280517578, -39.907005310058594, -33.37619400024414, -26.845382690429688, -20.314571380615234, -13.783761978149414, -7.252952575683594, -0.7221412658691406, 5.8086700439453125, 12.3394775390625, 18.870288848876953, 25.401100158691406, 31.93191146850586, 38.46272277832031, 44.9935302734375, 51.52434158325195, 58.055152893066406, 64.5859603881836, 71.11677551269531, 77.6475830078125, 84.17839050292969, 90.7092056274414, 97.2400131225586, 103.77082824707031, 110.3016357421875, 116.83244323730469, 123.36325073242188, 129.89407348632812, 136.4248809814453, 142.9556884765625, 149.48651123046875, 156.01731872558594, 162.54812622070312, 169.0789337158203, 175.6097412109375, 182.1405487060547]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 6.0, 7.0, 7.0, 8.0, 9.0, 4.0, 12.0, 14.0, 12.0, 16.0, 16.0, 24.0, 20.0, 30.0, 37.0, 22.0, 43.0, 24.0, 38.0, 37.0, 33.0, 38.0, 30.0, 45.0, 42.0, 39.0, 40.0, 34.0, 34.0, 32.0, 31.0, 23.0, 26.0, 30.0, 18.0, 13.0, 18.0, 14.0, 13.0, 9.0, 17.0, 11.0, 5.0, 6.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-70.77459716796875, -68.72064971923828, -66.66670989990234, -64.61276245117188, -62.55881881713867, -60.50487518310547, -58.450927734375, -56.3969841003418, -54.343040466308594, -52.28909683227539, -50.23515319824219, -48.18120574951172, -46.127262115478516, -44.07331848144531, -42.019371032714844, -39.96542739868164, -37.91148376464844, -35.857540130615234, -33.80359649658203, -31.749649047851562, -29.69570541381836, -27.641761779785156, -25.58781623840332, -23.533870697021484, -21.47992706298828, -19.425983428955078, -17.372037887573242, -15.318093299865723, -13.264148712158203, -11.210204124450684, -9.156259536743164, -7.1023149490356445, -5.048374176025391, -2.994429588317871, -0.9404850006103516, 1.113459587097168, 3.1674041748046875, 5.221348762512207, 7.275293350219727, 9.329237937927246, 11.383182525634766, 13.437127113342285, 15.491071701049805, 17.54501724243164, 19.598960876464844, 21.652904510498047, 23.706850051879883, 25.76079559326172, 27.814739227294922, 29.868682861328125, 31.92262840270996, 33.9765739440918, 36.030517578125, 38.0844612121582, 40.138404846191406, 42.192352294921875, 44.24629592895508, 46.30023956298828, 48.35418701171875, 50.40813064575195, 52.462074279785156, 54.51601791381836, 56.56996154785156, 58.62390899658203, 60.677852630615234]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 5.0, 8.0, 7.0, 8.0, 20.0, 12.0, 16.0, 20.0, 17.0, 26.0, 21.0, 28.0, 26.0, 28.0, 33.0, 38.0, 31.0, 41.0, 42.0, 28.0, 39.0, 47.0, 34.0, 36.0, 45.0, 27.0, 31.0, 32.0, 27.0, 24.0, 29.0, 25.0, 25.0, 24.0, 10.0, 14.0, 15.0, 12.0, 9.0, 9.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-8.2421875, -7.9732666015625, -7.704345703125, -7.4354248046875, -7.16650390625, -6.8975830078125, -6.628662109375, -6.3597412109375, -6.0908203125, -5.8218994140625, -5.552978515625, -5.2840576171875, -5.01513671875, -4.7462158203125, -4.477294921875, -4.2083740234375, -3.939453125, -3.6705322265625, -3.401611328125, -3.1326904296875, -2.86376953125, -2.5948486328125, -2.325927734375, -2.0570068359375, -1.7880859375, -1.5191650390625, -1.250244140625, -0.9813232421875, -0.71240234375, -0.4434814453125, -0.174560546875, 0.0943603515625, 0.36328125, 0.6322021484375, 0.901123046875, 1.1700439453125, 1.43896484375, 1.7078857421875, 1.976806640625, 2.2457275390625, 2.5146484375, 2.7835693359375, 3.052490234375, 3.3214111328125, 3.59033203125, 3.8592529296875, 4.128173828125, 4.3970947265625, 4.666015625, 4.9349365234375, 5.203857421875, 5.4727783203125, 5.74169921875, 6.0106201171875, 6.279541015625, 6.5484619140625, 6.8173828125, 7.0863037109375, 7.355224609375, 7.6241455078125, 7.89306640625, 8.1619873046875, 8.430908203125, 8.6998291015625, 8.96875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 6.0, 11.0, 8.0, 9.0, 13.0, 13.0, 17.0, 22.0, 28.0, 35.0, 48.0, 52.0, 54.0, 88.0, 179.0, 342.0, 1307.0, 9763.0, 160593.0, 1953989.0, 1905764.0, 150367.0, 9421.0, 1211.0, 346.0, 169.0, 94.0, 59.0, 46.0, 41.0, 28.0, 27.0, 19.0, 20.0, 20.0, 12.0, 15.0, 10.0, 5.0, 5.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.875, -20.178955078125, -19.48291015625, -18.786865234375, -18.0908203125, -17.394775390625, -16.69873046875, -16.002685546875, -15.306640625, -14.610595703125, -13.91455078125, -13.218505859375, -12.5224609375, -11.826416015625, -11.13037109375, -10.434326171875, -9.73828125, -9.042236328125, -8.34619140625, -7.650146484375, -6.9541015625, -6.258056640625, -5.56201171875, -4.865966796875, -4.169921875, -3.473876953125, -2.77783203125, -2.081787109375, -1.3857421875, -0.689697265625, 0.00634765625, 0.702392578125, 1.3984375, 2.094482421875, 2.79052734375, 3.486572265625, 4.1826171875, 4.878662109375, 5.57470703125, 6.270751953125, 6.966796875, 7.662841796875, 8.35888671875, 9.054931640625, 9.7509765625, 10.447021484375, 11.14306640625, 11.839111328125, 12.53515625, 13.231201171875, 13.92724609375, 14.623291015625, 15.3193359375, 16.015380859375, 16.71142578125, 17.407470703125, 18.103515625, 18.799560546875, 19.49560546875, 20.191650390625, 20.8876953125, 21.583740234375, 22.27978515625, 22.975830078125, 23.671875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 7.0, 7.0, 13.0, 15.0, 28.0, 28.0, 40.0, 51.0, 99.0, 128.0, 173.0, 250.0, 326.0, 447.0, 474.0, 486.0, 417.0, 321.0, 220.0, 172.0, 119.0, 78.0, 46.0, 45.0, 16.0, 16.0, 15.0, 12.0, 9.0, 2.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.296875, -18.7735595703125, -18.250244140625, -17.7269287109375, -17.20361328125, -16.6802978515625, -16.156982421875, -15.6336669921875, -15.1103515625, -14.5870361328125, -14.063720703125, -13.5404052734375, -13.01708984375, -12.4937744140625, -11.970458984375, -11.4471435546875, -10.923828125, -10.4005126953125, -9.877197265625, -9.3538818359375, -8.83056640625, -8.3072509765625, -7.783935546875, -7.2606201171875, -6.7373046875, -6.2139892578125, -5.690673828125, -5.1673583984375, -4.64404296875, -4.1207275390625, -3.597412109375, -3.0740966796875, -2.55078125, -2.0274658203125, -1.504150390625, -0.9808349609375, -0.45751953125, 0.0657958984375, 0.589111328125, 1.1124267578125, 1.6357421875, 2.1590576171875, 2.682373046875, 3.2056884765625, 3.72900390625, 4.2523193359375, 4.775634765625, 5.2989501953125, 5.822265625, 6.3455810546875, 6.868896484375, 7.3922119140625, 7.91552734375, 8.4388427734375, 8.962158203125, 9.4854736328125, 10.0087890625, 10.5321044921875, 11.055419921875, 11.5787353515625, 12.10205078125, 12.6253662109375, 13.148681640625, 13.6719970703125, 14.1953125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 9.0, 19.0, 21.0, 29.0, 42.0, 57.0, 74.0, 100.0, 120.0, 183.0, 285.0, 424.0, 845.0, 2887.0, 24758.0, 741825.0, 3269921.0, 141372.0, 8072.0, 1454.0, 607.0, 333.0, 226.0, 160.0, 122.0, 78.0, 75.0, 46.0, 40.0, 25.0, 15.0, 15.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.78125, -33.59326171875, -32.4052734375, -31.21728515625, -30.029296875, -28.84130859375, -27.6533203125, -26.46533203125, -25.27734375, -24.08935546875, -22.9013671875, -21.71337890625, -20.525390625, -19.33740234375, -18.1494140625, -16.96142578125, -15.7734375, -14.58544921875, -13.3974609375, -12.20947265625, -11.021484375, -9.83349609375, -8.6455078125, -7.45751953125, -6.26953125, -5.08154296875, -3.8935546875, -2.70556640625, -1.517578125, -0.32958984375, 0.8583984375, 2.04638671875, 3.234375, 4.42236328125, 5.6103515625, 6.79833984375, 7.986328125, 9.17431640625, 10.3623046875, 11.55029296875, 12.73828125, 13.92626953125, 15.1142578125, 16.30224609375, 17.490234375, 18.67822265625, 19.8662109375, 21.05419921875, 22.2421875, 23.43017578125, 24.6181640625, 25.80615234375, 26.994140625, 28.18212890625, 29.3701171875, 30.55810546875, 31.74609375, 32.93408203125, 34.1220703125, 35.31005859375, 36.498046875, 37.68603515625, 38.8740234375, 40.06201171875, 41.25]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 3.0, 12.0, 370.0, 594.0, 38.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.25001525878906, -43.489776611328125, -29.729541778564453, -15.969306945800781, -2.2090682983398438, 11.551170349121094, 25.3114013671875, 39.07164001464844, 52.831878662109375, 66.59211730957031, 80.35235595703125, 94.11258697509766, 107.8728256225586, 121.63306427001953, 135.39329528808594, 149.15353393554688, 162.9137725830078, 176.67401123046875, 190.4342498779297, 204.19448852539062, 217.9547119140625, 231.7149658203125, 245.47518920898438, 259.23541259765625, 272.99566650390625, 286.7558898925781, 300.5161437988281, 314.2763671875, 328.03662109375, 341.7968444824219, 355.55706787109375, 369.31732177734375, 383.07757568359375, 396.8377990722656, 410.5980529785156, 424.3582763671875, 438.1185302734375, 451.8787536621094, 465.63897705078125, 479.39923095703125, 493.15948486328125, 506.9197082519531, 520.679931640625, 534.440185546875, 548.200439453125, 561.960693359375, 575.7208862304688, 589.4811401367188, 603.2413330078125, 617.0015869140625, 630.7617797851562, 644.5220336914062, 658.2822875976562, 672.0425415039062, 685.802734375, 699.56298828125, 713.3232421875, 727.08349609375, 740.8436889648438, 754.6039428710938, 768.3641967773438, 782.1244506835938, 795.8846435546875, 809.6448974609375, 823.4051513671875]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 5.0, 1.0, 2.0, 8.0, 14.0, 11.0, 12.0, 12.0, 22.0, 26.0, 17.0, 16.0, 25.0, 29.0, 34.0, 41.0, 32.0, 33.0, 31.0, 41.0, 36.0, 38.0, 45.0, 39.0, 34.0, 39.0, 33.0, 44.0, 34.0, 24.0, 31.0, 30.0, 29.0, 14.0, 21.0, 16.0, 16.0, 10.0, 11.0, 8.0, 6.0, 8.0, 6.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-53.6789665222168, -52.08578872680664, -50.492610931396484, -48.89943313598633, -47.30625915527344, -45.71308135986328, -44.119903564453125, -42.52672576904297, -40.93354797363281, -39.340370178222656, -37.7471923828125, -36.154014587402344, -34.56083679199219, -32.9676628112793, -31.37448501586914, -29.781307220458984, -28.188129425048828, -26.594951629638672, -25.001773834228516, -23.408597946166992, -21.815420150756836, -20.22224235534668, -18.629066467285156, -17.035888671875, -15.442710876464844, -13.849533081054688, -12.256356239318848, -10.663179397583008, -9.070001602172852, -7.4768242835998535, -5.8836469650268555, -4.290470123291016, -2.6972923278808594, -1.1041150093078613, 0.4890623092651367, 2.0822396278381348, 3.675416946411133, 5.268594264984131, 6.861771583557129, 8.454948425292969, 10.048126220703125, 11.641304016113281, 13.234480857849121, 14.827657699584961, 16.420835494995117, 18.014013290405273, 19.607189178466797, 21.200366973876953, 22.79354476928711, 24.386722564697266, 25.979900360107422, 27.573076248168945, 29.1662540435791, 30.759431838989258, 32.35260772705078, 33.94578552246094, 35.538963317871094, 37.13214111328125, 38.725318908691406, 40.31849670410156, 41.91167449951172, 43.50484848022461, 45.098026275634766, 46.69120407104492, 48.28438186645508]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 11.0, 11.0, 9.0, 16.0, 11.0, 14.0, 20.0, 26.0, 27.0, 29.0, 17.0, 30.0, 35.0, 31.0, 32.0, 25.0, 36.0, 33.0, 39.0, 52.0, 38.0, 42.0, 49.0, 28.0, 42.0, 31.0, 42.0, 18.0, 26.0, 28.0, 23.0, 16.0, 19.0, 8.0, 15.0, 12.0, 7.0, 6.0, 6.0, 10.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.954345703125, -7.67431640625, -7.394287109375, -7.1142578125, -6.834228515625, -6.55419921875, -6.274169921875, -5.994140625, -5.714111328125, -5.43408203125, -5.154052734375, -4.8740234375, -4.593994140625, -4.31396484375, -4.033935546875, -3.75390625, -3.473876953125, -3.19384765625, -2.913818359375, -2.6337890625, -2.353759765625, -2.07373046875, -1.793701171875, -1.513671875, -1.233642578125, -0.95361328125, -0.673583984375, -0.3935546875, -0.113525390625, 0.16650390625, 0.446533203125, 0.7265625, 1.006591796875, 1.28662109375, 1.566650390625, 1.8466796875, 2.126708984375, 2.40673828125, 2.686767578125, 2.966796875, 3.246826171875, 3.52685546875, 3.806884765625, 4.0869140625, 4.366943359375, 4.64697265625, 4.927001953125, 5.20703125, 5.487060546875, 5.76708984375, 6.047119140625, 6.3271484375, 6.607177734375, 6.88720703125, 7.167236328125, 7.447265625, 7.727294921875, 8.00732421875, 8.287353515625, 8.5673828125, 8.847412109375, 9.12744140625, 9.407470703125, 9.6875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 5.0, 9.0, 4.0, 22.0, 20.0, 38.0, 47.0, 64.0, 112.0, 165.0, 232.0, 362.0, 516.0, 858.0, 1235.0, 1801.0, 2998.0, 4770.0, 7420.0, 12060.0, 20361.0, 34497.0, 60416.0, 112154.0, 240919.0, 266268.0, 122022.0, 65438.0, 36883.0, 21851.0, 13030.0, 7993.0, 5019.0, 3126.0, 2020.0, 1203.0, 878.0, 558.0, 369.0, 252.0, 188.0, 104.0, 87.0, 66.0, 28.0, 27.0, 25.0, 11.0, 5.0, 6.0, 4.0, 4.0, 3.0, 2.0], "bins": [-1.9775390625, -1.921142578125, -1.86474609375, -1.808349609375, -1.751953125, -1.695556640625, -1.63916015625, -1.582763671875, -1.5263671875, -1.469970703125, -1.41357421875, -1.357177734375, -1.30078125, -1.244384765625, -1.18798828125, -1.131591796875, -1.0751953125, -1.018798828125, -0.96240234375, -0.906005859375, -0.849609375, -0.793212890625, -0.73681640625, -0.680419921875, -0.6240234375, -0.567626953125, -0.51123046875, -0.454833984375, -0.3984375, -0.342041015625, -0.28564453125, -0.229248046875, -0.1728515625, -0.116455078125, -0.06005859375, -0.003662109375, 0.052734375, 0.109130859375, 0.16552734375, 0.221923828125, 0.2783203125, 0.334716796875, 0.39111328125, 0.447509765625, 0.50390625, 0.560302734375, 0.61669921875, 0.673095703125, 0.7294921875, 0.785888671875, 0.84228515625, 0.898681640625, 0.955078125, 1.011474609375, 1.06787109375, 1.124267578125, 1.1806640625, 1.237060546875, 1.29345703125, 1.349853515625, 1.40625, 1.462646484375, 1.51904296875, 1.575439453125, 1.6318359375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 5.0, 1.0, 8.0, 9.0, 9.0, 9.0, 8.0, 12.0, 16.0, 18.0, 13.0, 13.0, 21.0, 18.0, 19.0, 29.0, 28.0, 19.0, 29.0, 32.0, 38.0, 26.0, 40.0, 28.0, 1058.0, 43.0, 41.0, 47.0, 47.0, 37.0, 37.0, 22.0, 27.0, 19.0, 19.0, 20.0, 16.0, 18.0, 20.0, 18.0, 16.0, 13.0, 10.0, 13.0, 10.0, 9.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 4.0, 3.0], "bins": [-5.75, -5.5845947265625, -5.419189453125, -5.2537841796875, -5.08837890625, -4.9229736328125, -4.757568359375, -4.5921630859375, -4.4267578125, -4.2613525390625, -4.095947265625, -3.9305419921875, -3.76513671875, -3.5997314453125, -3.434326171875, -3.2689208984375, -3.103515625, -2.9381103515625, -2.772705078125, -2.6072998046875, -2.44189453125, -2.2764892578125, -2.111083984375, -1.9456787109375, -1.7802734375, -1.6148681640625, -1.449462890625, -1.2840576171875, -1.11865234375, -0.9532470703125, -0.787841796875, -0.6224365234375, -0.45703125, -0.2916259765625, -0.126220703125, 0.0391845703125, 0.20458984375, 0.3699951171875, 0.535400390625, 0.7008056640625, 0.8662109375, 1.0316162109375, 1.197021484375, 1.3624267578125, 1.52783203125, 1.6932373046875, 1.858642578125, 2.0240478515625, 2.189453125, 2.3548583984375, 2.520263671875, 2.6856689453125, 2.85107421875, 3.0164794921875, 3.181884765625, 3.3472900390625, 3.5126953125, 3.6781005859375, 3.843505859375, 4.0089111328125, 4.17431640625, 4.3397216796875, 4.505126953125, 4.6705322265625, 4.8359375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [7.0, 5.0, 15.0, 17.0, 22.0, 21.0, 42.0, 66.0, 62.0, 131.0, 155.0, 189.0, 291.0, 358.0, 581.0, 720.0, 1191.0, 1616.0, 2368.0, 3283.0, 5092.0, 7357.0, 10910.0, 16013.0, 23970.0, 36042.0, 58376.0, 102286.0, 201978.0, 1298563.0, 127855.0, 69891.0, 42479.0, 27613.0, 18248.0, 12554.0, 8297.0, 5626.0, 3944.0, 2699.0, 1909.0, 1253.0, 904.0, 628.0, 451.0, 288.0, 216.0, 155.0, 146.0, 75.0, 61.0, 39.0, 24.0, 19.0, 16.0, 13.0, 5.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3134765625, -1.2684478759765625, -1.223419189453125, -1.1783905029296875, -1.13336181640625, -1.0883331298828125, -1.043304443359375, -0.9982757568359375, -0.9532470703125, -0.9082183837890625, -0.863189697265625, -0.8181610107421875, -0.77313232421875, -0.7281036376953125, -0.683074951171875, -0.6380462646484375, -0.593017578125, -0.5479888916015625, -0.502960205078125, -0.4579315185546875, -0.41290283203125, -0.3678741455078125, -0.322845458984375, -0.2778167724609375, -0.2327880859375, -0.1877593994140625, -0.142730712890625, -0.0977020263671875, -0.05267333984375, -0.0076446533203125, 0.037384033203125, 0.0824127197265625, 0.12744140625, 0.1724700927734375, 0.217498779296875, 0.2625274658203125, 0.30755615234375, 0.3525848388671875, 0.397613525390625, 0.4426422119140625, 0.4876708984375, 0.5326995849609375, 0.577728271484375, 0.6227569580078125, 0.66778564453125, 0.7128143310546875, 0.757843017578125, 0.8028717041015625, 0.847900390625, 0.8929290771484375, 0.937957763671875, 0.9829864501953125, 1.02801513671875, 1.0730438232421875, 1.118072509765625, 1.1631011962890625, 1.2081298828125, 1.2531585693359375, 1.298187255859375, 1.3432159423828125, 1.38824462890625, 1.4332733154296875, 1.478302001953125, 1.5233306884765625, 1.568359375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 4.0, 0.0, 5.0, 4.0, 7.0, 14.0, 13.0, 11.0, 17.0, 17.0, 25.0, 19.0, 33.0, 41.0, 50.0, 76.0, 74.0, 85.0, 73.0, 63.0, 67.0, 54.0, 52.0, 48.0, 31.0, 22.0, 14.0, 21.0, 15.0, 15.0, 4.0, 5.0, 2.0, 4.0, 6.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.002567291259765625, -0.002500012516975403, -0.0024327337741851807, -0.0023654550313949585, -0.0022981762886047363, -0.002230897545814514, -0.002163618803024292, -0.00209634006023407, -0.0020290613174438477, -0.0019617825746536255, -0.0018945038318634033, -0.0018272250890731812, -0.001759946346282959, -0.0016926676034927368, -0.0016253888607025146, -0.0015581101179122925, -0.0014908313751220703, -0.0014235526323318481, -0.001356273889541626, -0.0012889951467514038, -0.0012217164039611816, -0.0011544376611709595, -0.0010871589183807373, -0.0010198801755905151, -0.000952601432800293, -0.0008853226900100708, -0.0008180439472198486, -0.0007507652044296265, -0.0006834864616394043, -0.0006162077188491821, -0.00054892897605896, -0.0004816502332687378, -0.0004143714904785156, -0.00034709274768829346, -0.0002798140048980713, -0.00021253526210784912, -0.00014525651931762695, -7.797777652740479e-05, -1.0699033737182617e-05, 5.657970905303955e-05, 0.00012385845184326172, 0.0001911371946334839, 0.00025841593742370605, 0.0003256946802139282, 0.0003929734230041504, 0.00046025216579437256, 0.0005275309085845947, 0.0005948096513748169, 0.0006620883941650391, 0.0007293671369552612, 0.0007966458797454834, 0.0008639246225357056, 0.0009312033653259277, 0.00099848210811615, 0.001065760850906372, 0.0011330395936965942, 0.0012003183364868164, 0.0012675970792770386, 0.0013348758220672607, 0.001402154564857483, 0.001469433307647705, 0.0015367120504379272, 0.0016039907932281494, 0.0016712695360183716, 0.0017385482788085938]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 8.0, 4.0, 11.0, 20.0, 10.0, 24.0, 37.0, 42.0, 49.0, 83.0, 109.0, 178.0, 314.0, 593.0, 2357.0, 1015118.0, 27607.0, 848.0, 394.0, 229.0, 123.0, 90.0, 73.0, 44.0, 32.0, 30.0, 19.0, 22.0, 27.0, 8.0, 8.0, 3.0, 7.0, 6.0, 4.0, 4.0, 4.0, 1.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033935546875, -0.03261566162109375, -0.0312957763671875, -0.02997589111328125, -0.028656005859375, -0.02733612060546875, -0.0260162353515625, -0.02469635009765625, -0.02337646484375, -0.02205657958984375, -0.0207366943359375, -0.01941680908203125, -0.018096923828125, -0.01677703857421875, -0.0154571533203125, -0.01413726806640625, -0.0128173828125, -0.01149749755859375, -0.0101776123046875, -0.00885772705078125, -0.007537841796875, -0.00621795654296875, -0.0048980712890625, -0.00357818603515625, -0.00225830078125, -0.00093841552734375, 0.0003814697265625, 0.00170135498046875, 0.003021240234375, 0.00434112548828125, 0.0056610107421875, 0.00698089599609375, 0.00830078125, 0.00962066650390625, 0.0109405517578125, 0.01226043701171875, 0.013580322265625, 0.01490020751953125, 0.0162200927734375, 0.01753997802734375, 0.01885986328125, 0.02017974853515625, 0.0214996337890625, 0.02281951904296875, 0.024139404296875, 0.02545928955078125, 0.0267791748046875, 0.02809906005859375, 0.0294189453125, 0.03073883056640625, 0.0320587158203125, 0.03337860107421875, 0.034698486328125, 0.03601837158203125, 0.0373382568359375, 0.03865814208984375, 0.03997802734375, 0.04129791259765625, 0.0426177978515625, 0.04393768310546875, 0.045257568359375, 0.04657745361328125, 0.0478973388671875, 0.04921722412109375, 0.050537109375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 20.0, 307.0, 571.0, 114.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008393684402108192, -0.008208485320210457, -0.008023286238312721, -0.007838087156414986, -0.007652888540178537, -0.007467689458280802, -0.007282490376383066, -0.007097291294485331, -0.006912092678248882, -0.006726893596351147, -0.006541694514453411, -0.0063564954325556755, -0.006171296816319227, -0.005986097734421492, -0.005800898652523756, -0.00561569957062602, -0.005430500488728285, -0.005245301406830549, -0.005060102324932814, -0.004874903708696365, -0.00468970462679863, -0.004504505544900894, -0.004319306463003159, -0.004134107381105423, -0.003948908299207687, -0.0037637092173099518, -0.00357851036824286, -0.0033933112863451242, -0.0032081124372780323, -0.0030229133553802967, -0.002837714273482561, -0.0026525151915848255, -0.00246731610968709, -0.0022821170277893543, -0.0020969181787222624, -0.0019117190968245268, -0.001726520131342113, -0.0015413211658596992, -0.0013561220839619637, -0.0011709231184795499, -0.0009857241529971361, -0.0008005251875147223, -0.0006153261638246477, -0.000430127140134573, -0.0002449281746521592, -5.9729209169745445e-05, 0.00012546987272799015, 0.0003106688382104039, 0.0004958678036928177, 0.0006810667691752315, 0.0008662657928653061, 0.0010514648165553808, 0.0012366637820377946, 0.0014218627475202084, 0.001607061829417944, 0.0017922607949003577, 0.0019774597603827715, 0.002162658842280507, 0.002347857691347599, 0.0025330567732453346, 0.0027182558551430702, 0.002903454704210162, 0.0030886537861078978, 0.0032738526351749897, 0.0034590517170727253]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 5.0, 7.0, 12.0, 9.0, 12.0, 14.0, 23.0, 26.0, 28.0, 30.0, 20.0, 38.0, 26.0, 31.0, 40.0, 41.0, 44.0, 37.0, 37.0, 50.0, 34.0, 41.0, 36.0, 33.0, 32.0, 33.0, 28.0, 30.0, 27.0, 34.0, 13.0, 28.0, 20.0, 13.0, 12.0, 11.0, 9.0, 3.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0011210441589355469, -0.0010897833853960037, -0.0010585226118564606, -0.0010272618383169174, -0.0009960010647773743, -0.0009647402912378311, -0.000933479517698288, -0.0009022187441587448, -0.0008709579706192017, -0.0008396971970796585, -0.0008084364235401154, -0.0007771756500005722, -0.000745914876461029, -0.0007146541029214859, -0.0006833933293819427, -0.0006521325558423996, -0.0006208717823028564, -0.0005896110087633133, -0.0005583502352237701, -0.000527089461684227, -0.0004958286881446838, -0.0004645679146051407, -0.00043330714106559753, -0.0004020463675260544, -0.00037078559398651123, -0.0003395248204469681, -0.0003082640469074249, -0.0002770032733678818, -0.0002457424998283386, -0.00021448172628879547, -0.00018322095274925232, -0.00015196017920970917, -0.00012069940567016602, -8.943863213062286e-05, -5.817785859107971e-05, -2.691708505153656e-05, 4.343688488006592e-06, 3.5604462027549744e-05, 6.68652355670929e-05, 9.812600910663605e-05, 0.0001293867826461792, 0.00016064755618572235, 0.0001919083297252655, 0.00022316910326480865, 0.0002544298768043518, 0.00028569065034389496, 0.0003169514238834381, 0.00034821219742298126, 0.0003794729709625244, 0.00041073374450206757, 0.0004419945180416107, 0.00047325529158115387, 0.000504516065120697, 0.0005357768386602402, 0.0005670376121997833, 0.0005982983857393265, 0.0006295591592788696, 0.0006608199328184128, 0.0006920807063579559, 0.0007233414798974991, 0.0007546022534370422, 0.0007858630269765854, 0.0008171238005161285, 0.0008483845740556717, 0.0008796453475952148]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 1.0, 4.0, 6.0, 4.0, 11.0, 11.0, 9.0, 16.0, 11.0, 14.0, 20.0, 26.0, 27.0, 29.0, 17.0, 30.0, 35.0, 31.0, 32.0, 25.0, 36.0, 33.0, 39.0, 52.0, 38.0, 42.0, 49.0, 28.0, 42.0, 31.0, 42.0, 18.0, 26.0, 28.0, 23.0, 16.0, 19.0, 8.0, 15.0, 12.0, 7.0, 6.0, 6.0, 10.0, 3.0, 4.0, 5.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.954345703125, -7.67431640625, -7.394287109375, -7.1142578125, -6.834228515625, -6.55419921875, -6.274169921875, -5.994140625, -5.714111328125, -5.43408203125, -5.154052734375, -4.8740234375, -4.593994140625, -4.31396484375, -4.033935546875, -3.75390625, -3.473876953125, -3.19384765625, -2.913818359375, -2.6337890625, -2.353759765625, -2.07373046875, -1.793701171875, -1.513671875, -1.233642578125, -0.95361328125, -0.673583984375, -0.3935546875, -0.113525390625, 0.16650390625, 0.446533203125, 0.7265625, 1.006591796875, 1.28662109375, 1.566650390625, 1.8466796875, 2.126708984375, 2.40673828125, 2.686767578125, 2.966796875, 3.246826171875, 3.52685546875, 3.806884765625, 4.0869140625, 4.366943359375, 4.64697265625, 4.927001953125, 5.20703125, 5.487060546875, 5.76708984375, 6.047119140625, 6.3271484375, 6.607177734375, 6.88720703125, 7.167236328125, 7.447265625, 7.727294921875, 8.00732421875, 8.287353515625, 8.5673828125, 8.847412109375, 9.12744140625, 9.407470703125, 9.6875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 4.0, 13.0, 4.0, 9.0, 18.0, 31.0, 32.0, 30.0, 52.0, 76.0, 72.0, 116.0, 124.0, 190.0, 246.0, 300.0, 435.0, 575.0, 1037.0, 2732.0, 10554.0, 53210.0, 600550.0, 330300.0, 35067.0, 7592.0, 2156.0, 858.0, 564.0, 388.0, 299.0, 221.0, 168.0, 131.0, 86.0, 71.0, 63.0, 36.0, 31.0, 23.0, 17.0, 14.0, 14.0, 9.0, 7.0, 11.0, 5.0, 4.0, 6.0, 0.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-20.71875, -20.025390625, -19.33203125, -18.638671875, -17.9453125, -17.251953125, -16.55859375, -15.865234375, -15.171875, -14.478515625, -13.78515625, -13.091796875, -12.3984375, -11.705078125, -11.01171875, -10.318359375, -9.625, -8.931640625, -8.23828125, -7.544921875, -6.8515625, -6.158203125, -5.46484375, -4.771484375, -4.078125, -3.384765625, -2.69140625, -1.998046875, -1.3046875, -0.611328125, 0.08203125, 0.775390625, 1.46875, 2.162109375, 2.85546875, 3.548828125, 4.2421875, 4.935546875, 5.62890625, 6.322265625, 7.015625, 7.708984375, 8.40234375, 9.095703125, 9.7890625, 10.482421875, 11.17578125, 11.869140625, 12.5625, 13.255859375, 13.94921875, 14.642578125, 15.3359375, 16.029296875, 16.72265625, 17.416015625, 18.109375, 18.802734375, 19.49609375, 20.189453125, 20.8828125, 21.576171875, 22.26953125, 22.962890625, 23.65625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 9.0, 11.0, 9.0, 18.0, 6.0, 17.0, 19.0, 22.0, 29.0, 23.0, 47.0, 44.0, 40.0, 43.0, 60.0, 70.0, 173.0, 1546.0, 336.0, 114.0, 47.0, 46.0, 53.0, 44.0, 37.0, 21.0, 22.0, 25.0, 26.0, 28.0, 7.0, 12.0, 10.0, 13.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-33.78125, -32.77978515625, -31.7783203125, -30.77685546875, -29.775390625, -28.77392578125, -27.7724609375, -26.77099609375, -25.76953125, -24.76806640625, -23.7666015625, -22.76513671875, -21.763671875, -20.76220703125, -19.7607421875, -18.75927734375, -17.7578125, -16.75634765625, -15.7548828125, -14.75341796875, -13.751953125, -12.75048828125, -11.7490234375, -10.74755859375, -9.74609375, -8.74462890625, -7.7431640625, -6.74169921875, -5.740234375, -4.73876953125, -3.7373046875, -2.73583984375, -1.734375, -0.73291015625, 0.2685546875, 1.27001953125, 2.271484375, 3.27294921875, 4.2744140625, 5.27587890625, 6.27734375, 7.27880859375, 8.2802734375, 9.28173828125, 10.283203125, 11.28466796875, 12.2861328125, 13.28759765625, 14.2890625, 15.29052734375, 16.2919921875, 17.29345703125, 18.294921875, 19.29638671875, 20.2978515625, 21.29931640625, 22.30078125, 23.30224609375, 24.3037109375, 25.30517578125, 26.306640625, 27.30810546875, 28.3095703125, 29.31103515625, 30.3125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 12.0, 9.0, 20.0, 12.0, 16.0, 29.0, 27.0, 36.0, 29.0, 44.0, 72.0, 89.0, 156.0, 313.0, 636.0, 2486.0, 130690.0, 3000939.0, 7922.0, 1087.0, 366.0, 186.0, 131.0, 81.0, 73.0, 46.0, 44.0, 31.0, 27.0, 12.0, 16.0, 13.0, 14.0, 11.0, 7.0, 7.0, 2.0, 2.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.25, -81.4619140625, -78.673828125, -75.8857421875, -73.09765625, -70.3095703125, -67.521484375, -64.7333984375, -61.9453125, -59.1572265625, -56.369140625, -53.5810546875, -50.79296875, -48.0048828125, -45.216796875, -42.4287109375, -39.640625, -36.8525390625, -34.064453125, -31.2763671875, -28.48828125, -25.7001953125, -22.912109375, -20.1240234375, -17.3359375, -14.5478515625, -11.759765625, -8.9716796875, -6.18359375, -3.3955078125, -0.607421875, 2.1806640625, 4.96875, 7.7568359375, 10.544921875, 13.3330078125, 16.12109375, 18.9091796875, 21.697265625, 24.4853515625, 27.2734375, 30.0615234375, 32.849609375, 35.6376953125, 38.42578125, 41.2138671875, 44.001953125, 46.7900390625, 49.578125, 52.3662109375, 55.154296875, 57.9423828125, 60.73046875, 63.5185546875, 66.306640625, 69.0947265625, 71.8828125, 74.6708984375, 77.458984375, 80.2470703125, 83.03515625, 85.8232421875, 88.611328125, 91.3994140625, 94.1875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [3.0, 3.0, 42.0, 325.0, 484.0, 142.0, 17.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.861318588256836, -15.196775436401367, -10.532233238220215, -5.8676910400390625, -1.2031478881835938, 3.461395263671875, 8.125936508178711, 12.79047966003418, 17.45502281188965, 22.119565963745117, 26.784107208251953, 31.448650360107422, 36.11319351196289, 40.77773666381836, 45.44227600097656, 50.10681915283203, 54.7713623046875, 59.43590545654297, 64.10044860839844, 68.7649917602539, 73.42953491210938, 78.09407806396484, 82.75862121582031, 87.42315673828125, 92.08770751953125, 96.75225067138672, 101.41679382324219, 106.08133697509766, 110.74588012695312, 115.4104232788086, 120.07496643066406, 124.739501953125, 129.40403747558594, 134.06857299804688, 138.73312377929688, 143.3976593017578, 148.0622100830078, 152.72674560546875, 157.39129638671875, 162.0558319091797, 166.7203826904297, 171.38491821289062, 176.04946899414062, 180.71400451660156, 185.37855529785156, 190.0430908203125, 194.7076416015625, 199.37217712402344, 204.03671264648438, 208.7012481689453, 213.3657989501953, 218.03033447265625, 222.69488525390625, 227.3594207763672, 232.0239715576172, 236.68850708007812, 241.35305786132812, 246.01759338378906, 250.68214416503906, 255.3466796875, 260.01123046875, 264.67578125, 269.3403015136719, 274.0048522949219, 278.6694030761719]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 4.0, 8.0, 3.0, 13.0, 5.0, 17.0, 10.0, 17.0, 22.0, 34.0, 25.0, 29.0, 24.0, 24.0, 21.0, 32.0, 31.0, 38.0, 36.0, 34.0, 41.0, 30.0, 42.0, 54.0, 43.0, 30.0, 29.0, 37.0, 34.0, 29.0, 24.0, 24.0, 20.0, 18.0, 24.0, 14.0, 20.0, 16.0, 15.0, 10.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.53705596923828, -72.21614837646484, -69.8952407836914, -67.57432556152344, -65.25341796875, -62.93251037597656, -60.611602783203125, -58.29069519042969, -55.969783782958984, -53.64887619018555, -51.327964782714844, -49.007057189941406, -46.68614959716797, -44.365238189697266, -42.04433059692383, -39.723419189453125, -37.40251159667969, -35.08160400390625, -32.76069259643555, -30.43978500366211, -28.11887550354004, -25.79796600341797, -23.47705841064453, -21.15614891052246, -18.83523941040039, -16.51432991027832, -14.193421363830566, -11.872512817382812, -9.551603317260742, -7.230693817138672, -4.909785270690918, -2.588876724243164, -0.267974853515625, 2.052934169769287, 4.373843193054199, 6.694752216339111, 9.015661239624023, 11.336570739746094, 13.657479286193848, 15.978387832641602, 18.299297332763672, 20.620206832885742, 22.941116333007812, 25.26202392578125, 27.58293342590332, 29.90384292602539, 32.22475051879883, 34.54566192626953, 36.86656951904297, 39.187477111816406, 41.50838851928711, 43.82929611206055, 46.15020751953125, 48.47111511230469, 50.792022705078125, 53.11293029785156, 55.433841705322266, 57.7547492980957, 60.075660705566406, 62.396568298339844, 64.71747589111328, 67.03839111328125, 69.35929870605469, 71.68020629882812, 74.00111389160156]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 8.0, 1.0, 8.0, 8.0, 13.0, 9.0, 30.0, 20.0, 27.0, 18.0, 35.0, 37.0, 26.0, 23.0, 45.0, 29.0, 43.0, 36.0, 51.0, 41.0, 51.0, 41.0, 38.0, 54.0, 44.0, 22.0, 35.0, 29.0, 30.0, 24.0, 21.0, 13.0, 12.0, 17.0, 7.0, 10.0, 5.0, 8.0, 3.0, 8.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.7578125, -10.435546875, -10.11328125, -9.791015625, -9.46875, -9.146484375, -8.82421875, -8.501953125, -8.1796875, -7.857421875, -7.53515625, -7.212890625, -6.890625, -6.568359375, -6.24609375, -5.923828125, -5.6015625, -5.279296875, -4.95703125, -4.634765625, -4.3125, -3.990234375, -3.66796875, -3.345703125, -3.0234375, -2.701171875, -2.37890625, -2.056640625, -1.734375, -1.412109375, -1.08984375, -0.767578125, -0.4453125, -0.123046875, 0.19921875, 0.521484375, 0.84375, 1.166015625, 1.48828125, 1.810546875, 2.1328125, 2.455078125, 2.77734375, 3.099609375, 3.421875, 3.744140625, 4.06640625, 4.388671875, 4.7109375, 5.033203125, 5.35546875, 5.677734375, 6.0, 6.322265625, 6.64453125, 6.966796875, 7.2890625, 7.611328125, 7.93359375, 8.255859375, 8.578125, 8.900390625, 9.22265625, 9.544921875, 9.8671875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 14.0, 9.0, 11.0, 14.0, 18.0, 22.0, 29.0, 32.0, 57.0, 64.0, 82.0, 115.0, 139.0, 207.0, 271.0, 505.0, 1322.0, 5791.0, 46304.0, 530541.0, 2381272.0, 1103246.0, 109054.0, 11118.0, 2085.0, 731.0, 331.0, 222.0, 157.0, 128.0, 87.0, 63.0, 56.0, 36.0, 18.0, 31.0, 21.0, 16.0, 17.0, 15.0, 8.0, 2.0, 6.0, 5.0, 3.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.0, -18.380615234375, -17.76123046875, -17.141845703125, -16.5224609375, -15.903076171875, -15.28369140625, -14.664306640625, -14.044921875, -13.425537109375, -12.80615234375, -12.186767578125, -11.5673828125, -10.947998046875, -10.32861328125, -9.709228515625, -9.08984375, -8.470458984375, -7.85107421875, -7.231689453125, -6.6123046875, -5.992919921875, -5.37353515625, -4.754150390625, -4.134765625, -3.515380859375, -2.89599609375, -2.276611328125, -1.6572265625, -1.037841796875, -0.41845703125, 0.200927734375, 0.8203125, 1.439697265625, 2.05908203125, 2.678466796875, 3.2978515625, 3.917236328125, 4.53662109375, 5.156005859375, 5.775390625, 6.394775390625, 7.01416015625, 7.633544921875, 8.2529296875, 8.872314453125, 9.49169921875, 10.111083984375, 10.73046875, 11.349853515625, 11.96923828125, 12.588623046875, 13.2080078125, 13.827392578125, 14.44677734375, 15.066162109375, 15.685546875, 16.304931640625, 16.92431640625, 17.543701171875, 18.1630859375, 18.782470703125, 19.40185546875, 20.021240234375, 20.640625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 7.0, 5.0, 5.0, 8.0, 8.0, 16.0, 22.0, 32.0, 34.0, 70.0, 63.0, 107.0, 163.0, 181.0, 263.0, 344.0, 352.0, 454.0, 439.0, 320.0, 303.0, 234.0, 165.0, 113.0, 104.0, 65.0, 39.0, 36.0, 23.0, 26.0, 16.0, 13.0, 11.0, 6.0, 3.0, 10.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-17.296875, -16.8123779296875, -16.327880859375, -15.8433837890625, -15.35888671875, -14.8743896484375, -14.389892578125, -13.9053955078125, -13.4208984375, -12.9364013671875, -12.451904296875, -11.9674072265625, -11.48291015625, -10.9984130859375, -10.513916015625, -10.0294189453125, -9.544921875, -9.0604248046875, -8.575927734375, -8.0914306640625, -7.60693359375, -7.1224365234375, -6.637939453125, -6.1534423828125, -5.6689453125, -5.1844482421875, -4.699951171875, -4.2154541015625, -3.73095703125, -3.2464599609375, -2.761962890625, -2.2774658203125, -1.79296875, -1.3084716796875, -0.823974609375, -0.3394775390625, 0.14501953125, 0.6295166015625, 1.114013671875, 1.5985107421875, 2.0830078125, 2.5675048828125, 3.052001953125, 3.5364990234375, 4.02099609375, 4.5054931640625, 4.989990234375, 5.4744873046875, 5.958984375, 6.4434814453125, 6.927978515625, 7.4124755859375, 7.89697265625, 8.3814697265625, 8.865966796875, 9.3504638671875, 9.8349609375, 10.3194580078125, 10.803955078125, 11.2884521484375, 11.77294921875, 12.2574462890625, 12.741943359375, 13.2264404296875, 13.7109375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 5.0, 5.0, 12.0, 8.0, 10.0, 30.0, 29.0, 39.0, 73.0, 90.0, 112.0, 198.0, 309.0, 531.0, 968.0, 2866.0, 19056.0, 470511.0, 3513883.0, 170716.0, 10761.0, 2063.0, 799.0, 415.0, 275.0, 164.0, 104.0, 88.0, 42.0, 37.0, 20.0, 19.0, 12.0, 8.0, 17.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-42.75, -41.42919921875, -40.1083984375, -38.78759765625, -37.466796875, -36.14599609375, -34.8251953125, -33.50439453125, -32.18359375, -30.86279296875, -29.5419921875, -28.22119140625, -26.900390625, -25.57958984375, -24.2587890625, -22.93798828125, -21.6171875, -20.29638671875, -18.9755859375, -17.65478515625, -16.333984375, -15.01318359375, -13.6923828125, -12.37158203125, -11.05078125, -9.72998046875, -8.4091796875, -7.08837890625, -5.767578125, -4.44677734375, -3.1259765625, -1.80517578125, -0.484375, 0.83642578125, 2.1572265625, 3.47802734375, 4.798828125, 6.11962890625, 7.4404296875, 8.76123046875, 10.08203125, 11.40283203125, 12.7236328125, 14.04443359375, 15.365234375, 16.68603515625, 18.0068359375, 19.32763671875, 20.6484375, 21.96923828125, 23.2900390625, 24.61083984375, 25.931640625, 27.25244140625, 28.5732421875, 29.89404296875, 31.21484375, 32.53564453125, 33.8564453125, 35.17724609375, 36.498046875, 37.81884765625, 39.1396484375, 40.46044921875, 41.78125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 404.0, 584.0, 19.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-167.4840850830078, -152.35263061523438, -137.22117614746094, -122.08971405029297, -106.958251953125, -91.82679748535156, -76.69534301757812, -61.563880920410156, -46.43242645263672, -31.300968170166016, -16.169511795043945, -1.038055419921875, 14.093402862548828, 29.22486114501953, 44.35631561279297, 59.48777770996094, 74.61923217773438, 89.75068664550781, 104.88214874267578, 120.01360321044922, 135.1450653076172, 150.27651977539062, 165.40797424316406, 180.5394287109375, 195.6708984375, 210.80235290527344, 225.93380737304688, 241.06527709960938, 256.19671630859375, 271.32818603515625, 286.45965576171875, 301.5910949707031, 316.7225646972656, 331.8540344238281, 346.9854736328125, 362.116943359375, 377.2483825683594, 392.3798522949219, 407.51129150390625, 422.64276123046875, 437.77423095703125, 452.90570068359375, 468.0371398925781, 483.1686096191406, 498.300048828125, 513.4315185546875, 528.56298828125, 543.6944580078125, 558.8258666992188, 573.9573364257812, 589.0888061523438, 604.22021484375, 619.3516845703125, 634.483154296875, 649.6146240234375, 664.74609375, 679.8775634765625, 695.009033203125, 710.1405029296875, 725.2719116210938, 740.4033813476562, 755.5348510742188, 770.6663208007812, 785.7977905273438, 800.92919921875]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 13.0, 15.0, 9.0, 17.0, 9.0, 25.0, 27.0, 26.0, 30.0, 33.0, 39.0, 33.0, 46.0, 32.0, 49.0, 54.0, 52.0, 47.0, 37.0, 45.0, 38.0, 31.0, 32.0, 44.0, 24.0, 22.0, 23.0, 17.0, 22.0, 16.0, 17.0, 7.0, 13.0, 14.0, 11.0, 9.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-65.03279876708984, -63.19601058959961, -61.359222412109375, -59.52243423461914, -57.685646057128906, -55.84886169433594, -54.01206970214844, -52.17528533935547, -50.338497161865234, -48.501708984375, -46.664920806884766, -44.82813262939453, -42.9913444519043, -41.15455627441406, -39.317771911621094, -37.48098373413086, -35.644195556640625, -33.80740737915039, -31.970619201660156, -30.133831024169922, -28.29704475402832, -26.460256576538086, -24.62346839904785, -22.78668212890625, -20.94989013671875, -19.113101959228516, -17.27631378173828, -15.439526557922363, -13.602739334106445, -11.765951156616211, -9.929162979125977, -8.092375755310059, -6.255588531494141, -4.4188008308410645, -2.582012891769409, -0.7452249526977539, 1.0915627479553223, 2.9283504486083984, 4.765138626098633, 6.601925849914551, 8.438714027404785, 10.27550220489502, 12.112289428710938, 13.949077606201172, 15.785865783691406, 17.62265396118164, 19.459442138671875, 21.296228408813477, 23.13301658630371, 24.969804763793945, 26.80659294128418, 28.64337921142578, 30.480167388916016, 32.31695556640625, 34.153743743896484, 35.99053192138672, 37.82732009887695, 39.66410827636719, 41.50089645385742, 43.337684631347656, 45.17447280883789, 47.011260986328125, 48.848045349121094, 50.68483352661133, 52.52162170410156]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 9.0, 8.0, 17.0, 20.0, 14.0, 26.0, 27.0, 23.0, 33.0, 29.0, 32.0, 35.0, 48.0, 38.0, 44.0, 42.0, 56.0, 36.0, 38.0, 51.0, 44.0, 42.0, 46.0, 33.0, 25.0, 25.0, 18.0, 25.0, 25.0, 14.0, 15.0, 12.0, 7.0, 9.0, 6.0, 6.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.96875, -11.61279296875, -11.2568359375, -10.90087890625, -10.544921875, -10.18896484375, -9.8330078125, -9.47705078125, -9.12109375, -8.76513671875, -8.4091796875, -8.05322265625, -7.697265625, -7.34130859375, -6.9853515625, -6.62939453125, -6.2734375, -5.91748046875, -5.5615234375, -5.20556640625, -4.849609375, -4.49365234375, -4.1376953125, -3.78173828125, -3.42578125, -3.06982421875, -2.7138671875, -2.35791015625, -2.001953125, -1.64599609375, -1.2900390625, -0.93408203125, -0.578125, -0.22216796875, 0.1337890625, 0.48974609375, 0.845703125, 1.20166015625, 1.5576171875, 1.91357421875, 2.26953125, 2.62548828125, 2.9814453125, 3.33740234375, 3.693359375, 4.04931640625, 4.4052734375, 4.76123046875, 5.1171875, 5.47314453125, 5.8291015625, 6.18505859375, 6.541015625, 6.89697265625, 7.2529296875, 7.60888671875, 7.96484375, 8.32080078125, 8.6767578125, 9.03271484375, 9.388671875, 9.74462890625, 10.1005859375, 10.45654296875, 10.8125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 16.0, 11.0, 26.0, 39.0, 51.0, 81.0, 107.0, 167.0, 229.0, 366.0, 558.0, 846.0, 1243.0, 1935.0, 3156.0, 4742.0, 7559.0, 12493.0, 20764.0, 34768.0, 61530.0, 116430.0, 249036.0, 256323.0, 121483.0, 63216.0, 35702.0, 21195.0, 12765.0, 7851.0, 4950.0, 3174.0, 1983.0, 1254.0, 834.0, 565.0, 399.0, 224.0, 143.0, 110.0, 65.0, 49.0, 41.0, 22.0, 18.0, 11.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.0, -1.9394378662109375, -1.878875732421875, -1.8183135986328125, -1.75775146484375, -1.6971893310546875, -1.636627197265625, -1.5760650634765625, -1.5155029296875, -1.4549407958984375, -1.394378662109375, -1.3338165283203125, -1.27325439453125, -1.2126922607421875, -1.152130126953125, -1.0915679931640625, -1.031005859375, -0.9704437255859375, -0.909881591796875, -0.8493194580078125, -0.78875732421875, -0.7281951904296875, -0.667633056640625, -0.6070709228515625, -0.5465087890625, -0.4859466552734375, -0.425384521484375, -0.3648223876953125, -0.30426025390625, -0.2436981201171875, -0.183135986328125, -0.1225738525390625, -0.06201171875, -0.0014495849609375, 0.059112548828125, 0.1196746826171875, 0.18023681640625, 0.2407989501953125, 0.301361083984375, 0.3619232177734375, 0.4224853515625, 0.4830474853515625, 0.543609619140625, 0.6041717529296875, 0.66473388671875, 0.7252960205078125, 0.785858154296875, 0.8464202880859375, 0.906982421875, 0.9675445556640625, 1.028106689453125, 1.0886688232421875, 1.14923095703125, 1.2097930908203125, 1.270355224609375, 1.3309173583984375, 1.3914794921875, 1.4520416259765625, 1.512603759765625, 1.5731658935546875, 1.63372802734375, 1.6942901611328125, 1.754852294921875, 1.8154144287109375, 1.8759765625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 7.0, 8.0, 14.0, 15.0, 16.0, 14.0, 28.0, 18.0, 26.0, 29.0, 33.0, 27.0, 33.0, 33.0, 37.0, 36.0, 38.0, 43.0, 1064.0, 37.0, 34.0, 36.0, 44.0, 31.0, 37.0, 32.0, 38.0, 27.0, 24.0, 20.0, 18.0, 17.0, 21.0, 14.0, 17.0, 11.0, 6.0, 8.0, 5.0, 9.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.4140625, -6.20660400390625, -5.9991455078125, -5.79168701171875, -5.584228515625, -5.37677001953125, -5.1693115234375, -4.96185302734375, -4.75439453125, -4.54693603515625, -4.3394775390625, -4.13201904296875, -3.924560546875, -3.71710205078125, -3.5096435546875, -3.30218505859375, -3.0947265625, -2.88726806640625, -2.6798095703125, -2.47235107421875, -2.264892578125, -2.05743408203125, -1.8499755859375, -1.64251708984375, -1.43505859375, -1.22760009765625, -1.0201416015625, -0.81268310546875, -0.605224609375, -0.39776611328125, -0.1903076171875, 0.01715087890625, 0.224609375, 0.43206787109375, 0.6395263671875, 0.84698486328125, 1.054443359375, 1.26190185546875, 1.4693603515625, 1.67681884765625, 1.88427734375, 2.09173583984375, 2.2991943359375, 2.50665283203125, 2.714111328125, 2.92156982421875, 3.1290283203125, 3.33648681640625, 3.5439453125, 3.75140380859375, 3.9588623046875, 4.16632080078125, 4.373779296875, 4.58123779296875, 4.7886962890625, 4.99615478515625, 5.20361328125, 5.41107177734375, 5.6185302734375, 5.82598876953125, 6.033447265625, 6.24090576171875, 6.4483642578125, 6.65582275390625, 6.86328125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 5.0, 10.0, 16.0, 21.0, 26.0, 43.0, 74.0, 94.0, 133.0, 172.0, 285.0, 396.0, 626.0, 862.0, 1211.0, 1928.0, 3010.0, 4512.0, 6923.0, 11118.0, 16942.0, 26911.0, 42586.0, 71517.0, 131329.0, 1309561.0, 205896.0, 103081.0, 58035.0, 35642.0, 22775.0, 14269.0, 9338.0, 6108.0, 3857.0, 2593.0, 1602.0, 1187.0, 732.0, 518.0, 386.0, 261.0, 157.0, 120.0, 75.0, 55.0, 39.0, 32.0, 20.0, 18.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.75, -1.6949920654296875, -1.639984130859375, -1.5849761962890625, -1.52996826171875, -1.4749603271484375, -1.419952392578125, -1.3649444580078125, -1.3099365234375, -1.2549285888671875, -1.199920654296875, -1.1449127197265625, -1.08990478515625, -1.0348968505859375, -0.979888916015625, -0.9248809814453125, -0.869873046875, -0.8148651123046875, -0.759857177734375, -0.7048492431640625, -0.64984130859375, -0.5948333740234375, -0.539825439453125, -0.4848175048828125, -0.4298095703125, -0.3748016357421875, -0.319793701171875, -0.2647857666015625, -0.20977783203125, -0.1547698974609375, -0.099761962890625, -0.0447540283203125, 0.01025390625, 0.0652618408203125, 0.120269775390625, 0.1752777099609375, 0.23028564453125, 0.2852935791015625, 0.340301513671875, 0.3953094482421875, 0.4503173828125, 0.5053253173828125, 0.560333251953125, 0.6153411865234375, 0.67034912109375, 0.7253570556640625, 0.780364990234375, 0.8353729248046875, 0.890380859375, 0.9453887939453125, 1.000396728515625, 1.0554046630859375, 1.11041259765625, 1.1654205322265625, 1.220428466796875, 1.2754364013671875, 1.3304443359375, 1.3854522705078125, 1.440460205078125, 1.4954681396484375, 1.55047607421875, 1.6054840087890625, 1.660491943359375, 1.7154998779296875, 1.7705078125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 3.0, 5.0, 4.0, 5.0, 5.0, 2.0, 4.0, 7.0, 10.0, 4.0, 10.0, 14.0, 17.0, 23.0, 23.0, 29.0, 28.0, 29.0, 42.0, 40.0, 36.0, 53.0, 56.0, 51.0, 40.0, 53.0, 52.0, 50.0, 48.0, 41.0, 31.0, 26.0, 26.0, 16.0, 22.0, 16.0, 9.0, 14.0, 15.0, 6.0, 12.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0018529891967773438, -0.0017946064472198486, -0.0017362236976623535, -0.0016778409481048584, -0.0016194581985473633, -0.0015610754489898682, -0.001502692699432373, -0.001444309949874878, -0.0013859272003173828, -0.0013275444507598877, -0.0012691617012023926, -0.0012107789516448975, -0.0011523962020874023, -0.0010940134525299072, -0.0010356307029724121, -0.000977247953414917, -0.0009188652038574219, -0.0008604824542999268, -0.0008020997047424316, -0.0007437169551849365, -0.0006853342056274414, -0.0006269514560699463, -0.0005685687065124512, -0.0005101859569549561, -0.00045180320739746094, -0.0003934204578399658, -0.0003350377082824707, -0.0002766549587249756, -0.00021827220916748047, -0.00015988945960998535, -0.00010150671005249023, -4.312396049499512e-05, 1.52587890625e-05, 7.364153861999512e-05, 0.00013202428817749023, 0.00019040703773498535, 0.00024878978729248047, 0.0003071725368499756, 0.0003655552864074707, 0.0004239380359649658, 0.00048232078552246094, 0.0005407035350799561, 0.0005990862846374512, 0.0006574690341949463, 0.0007158517837524414, 0.0007742345333099365, 0.0008326172828674316, 0.0008910000324249268, 0.0009493827819824219, 0.001007765531539917, 0.0010661482810974121, 0.0011245310306549072, 0.0011829137802124023, 0.0012412965297698975, 0.0012996792793273926, 0.0013580620288848877, 0.0014164447784423828, 0.001474827527999878, 0.001533210277557373, 0.0015915930271148682, 0.0016499757766723633, 0.0017083585262298584, 0.0017667412757873535, 0.0018251240253448486, 0.0018835067749023438]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 4.0, 8.0, 3.0, 7.0, 4.0, 4.0, 9.0, 14.0, 10.0, 23.0, 21.0, 25.0, 27.0, 31.0, 36.0, 67.0, 64.0, 93.0, 118.0, 175.0, 243.0, 339.0, 663.0, 2151.0, 643545.0, 397279.0, 1757.0, 600.0, 325.0, 196.0, 169.0, 111.0, 89.0, 68.0, 61.0, 36.0, 31.0, 20.0, 24.0, 19.0, 9.0, 12.0, 8.0, 10.0, 9.0, 9.0, 8.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0], "bins": [-0.03521728515625, -0.03411531448364258, -0.033013343811035156, -0.031911373138427734, -0.030809402465820312, -0.02970743179321289, -0.02860546112060547, -0.027503490447998047, -0.026401519775390625, -0.025299549102783203, -0.02419757843017578, -0.02309560775756836, -0.021993637084960938, -0.020891666412353516, -0.019789695739746094, -0.018687725067138672, -0.01758575439453125, -0.016483783721923828, -0.015381813049316406, -0.014279842376708984, -0.013177871704101562, -0.01207590103149414, -0.010973930358886719, -0.009871959686279297, -0.008769989013671875, -0.007668018341064453, -0.006566047668457031, -0.005464076995849609, -0.0043621063232421875, -0.0032601356506347656, -0.0021581649780273438, -0.0010561943054199219, 4.57763671875e-05, 0.0011477470397949219, 0.0022497177124023438, 0.0033516883850097656, 0.0044536590576171875, 0.005555629730224609, 0.006657600402832031, 0.007759571075439453, 0.008861541748046875, 0.009963512420654297, 0.011065483093261719, 0.01216745376586914, 0.013269424438476562, 0.014371395111083984, 0.015473365783691406, 0.016575336456298828, 0.01767730712890625, 0.018779277801513672, 0.019881248474121094, 0.020983219146728516, 0.022085189819335938, 0.02318716049194336, 0.02428913116455078, 0.025391101837158203, 0.026493072509765625, 0.027595043182373047, 0.02869701385498047, 0.02979898452758789, 0.030900955200195312, 0.032002925872802734, 0.033104896545410156, 0.03420686721801758, 0.035308837890625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 13.0, 20.0, 48.0, 120.0, 204.0, 236.0, 187.0, 101.0, 52.0, 19.0, 10.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012192301219329238, -0.0011452160542830825, -0.001071202103048563, -0.0009971880353987217, -0.0009231739677488804, -0.0008491599583067, -0.0007751459488645196, -0.0007011318812146783, -0.0006271178717724979, -0.0005531038623303175, -0.0004790897946804762, -0.0004050757852382958, -0.00033106174669228494, -0.0002570477081462741, -0.0001830336987040937, -0.00010901963105425239, -3.500562161207199e-05, 3.900840965798125e-05, 0.00011302244092803448, 0.0001870364649221301, 0.00026105050346814096, 0.0003350645420141518, 0.0004090785514563322, 0.0004830926191061735, 0.0005571066285483539, 0.0006311206379905343, 0.0007051347056403756, 0.000779148715082556, 0.0008531627245247364, 0.0009271767921745777, 0.001001190859824419, 0.0010752049274742603, 0.001149218762293458, 0.0012232328299432993, 0.0012972467811778188, 0.00137126084882766, 0.0014452749164775014, 0.0015192888677120209, 0.0015933029353618622, 0.0016673170030117035, 0.0017413310706615448, 0.001815345138311386, 0.0018893590895459056, 0.0019633732736110687, 0.0020373871084302664, 0.0021114011760801077, 0.002185415243729949, 0.0022594293113797903, 0.002333443146198988, 0.0024074572138488293, 0.0024814712814986706, 0.002555485349148512, 0.0026294991839677095, 0.002703513251617551, 0.002777527319267392, 0.0028515413869172335, 0.0029255554545670748, 0.002999569522216916, 0.0030735835898667574, 0.003147597424685955, 0.0032216114923357964, 0.0032956255599856377, 0.003369639627635479, 0.0034436536952853203, 0.0035176677629351616]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 5.0, 4.0, 7.0, 6.0, 12.0, 11.0, 18.0, 15.0, 20.0, 29.0, 29.0, 32.0, 30.0, 39.0, 41.0, 48.0, 41.0, 50.0, 48.0, 54.0, 48.0, 41.0, 44.0, 49.0, 44.0, 39.0, 25.0, 29.0, 28.0, 19.0, 19.0, 20.0, 15.0, 13.0, 7.0, 3.0, 9.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0013067126274108887, -0.0012669125571846962, -0.0012271124869585037, -0.0011873124167323112, -0.0011475123465061188, -0.0011077122762799263, -0.0010679122060537338, -0.0010281121358275414, -0.0009883120656013489, -0.0009485119953751564, -0.0009087119251489639, -0.0008689118549227715, -0.000829111784696579, -0.0007893117144703865, -0.000749511644244194, -0.0007097115740180016, -0.0006699115037918091, -0.0006301114335656166, -0.0005903113633394241, -0.0005505112931132317, -0.0005107112228870392, -0.0004709111526608467, -0.00043111108243465424, -0.00039131101220846176, -0.0003515109419822693, -0.0003117108717560768, -0.00027191080152988434, -0.00023211073130369186, -0.0001923106610774994, -0.00015251059085130692, -0.00011271052062511444, -7.291045039892197e-05, -3.311038017272949e-05, 6.689690053462982e-06, 4.6489760279655457e-05, 8.628983050584793e-05, 0.0001260899007320404, 0.00016588997095823288, 0.00020569004118442535, 0.00024549011141061783, 0.0002852901816368103, 0.0003250902518630028, 0.00036489032208919525, 0.0004046903923153877, 0.0004444904625415802, 0.0004842905327677727, 0.0005240906029939651, 0.0005638906732201576, 0.0006036907434463501, 0.0006434908136725426, 0.000683290883898735, 0.0007230909541249275, 0.00076289102435112, 0.0008026910945773125, 0.0008424911648035049, 0.0008822912350296974, 0.0009220913052558899, 0.0009618913754820824, 0.0010016914457082748, 0.0010414915159344673, 0.0010812915861606598, 0.0011210916563868523, 0.0011608917266130447, 0.0012006917968392372, 0.0012404918670654297]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 4.0, 9.0, 8.0, 17.0, 20.0, 14.0, 26.0, 27.0, 23.0, 33.0, 29.0, 32.0, 35.0, 48.0, 38.0, 44.0, 42.0, 56.0, 37.0, 37.0, 51.0, 44.0, 42.0, 46.0, 33.0, 25.0, 25.0, 18.0, 25.0, 25.0, 14.0, 15.0, 12.0, 7.0, 9.0, 6.0, 6.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.96875, -11.61279296875, -11.2568359375, -10.90087890625, -10.544921875, -10.18896484375, -9.8330078125, -9.47705078125, -9.12109375, -8.76513671875, -8.4091796875, -8.05322265625, -7.697265625, -7.34130859375, -6.9853515625, -6.62939453125, -6.2734375, -5.91748046875, -5.5615234375, -5.20556640625, -4.849609375, -4.49365234375, -4.1376953125, -3.78173828125, -3.42578125, -3.06982421875, -2.7138671875, -2.35791015625, -2.001953125, -1.64599609375, -1.2900390625, -0.93408203125, -0.578125, -0.22216796875, 0.1337890625, 0.48974609375, 0.845703125, 1.20166015625, 1.5576171875, 1.91357421875, 2.26953125, 2.62548828125, 2.9814453125, 3.33740234375, 3.693359375, 4.04931640625, 4.4052734375, 4.76123046875, 5.1171875, 5.47314453125, 5.8291015625, 6.18505859375, 6.541015625, 6.89697265625, 7.2529296875, 7.60888671875, 7.96484375, 8.32080078125, 8.6767578125, 9.03271484375, 9.388671875, 9.74462890625, 10.1005859375, 10.45654296875, 10.8125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 7.0, 10.0, 16.0, 19.0, 26.0, 36.0, 47.0, 66.0, 79.0, 119.0, 152.0, 271.0, 417.0, 701.0, 1338.0, 2724.0, 6240.0, 15410.0, 42784.0, 122643.0, 354440.0, 325930.0, 110797.0, 38725.0, 14312.0, 5594.0, 2540.0, 1231.0, 656.0, 373.0, 237.0, 181.0, 113.0, 92.0, 50.0, 45.0, 32.0, 37.0, 16.0, 13.0, 13.0, 3.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.453125, -14.0145263671875, -13.575927734375, -13.1373291015625, -12.69873046875, -12.2601318359375, -11.821533203125, -11.3829345703125, -10.9443359375, -10.5057373046875, -10.067138671875, -9.6285400390625, -9.18994140625, -8.7513427734375, -8.312744140625, -7.8741455078125, -7.435546875, -6.9969482421875, -6.558349609375, -6.1197509765625, -5.68115234375, -5.2425537109375, -4.803955078125, -4.3653564453125, -3.9267578125, -3.4881591796875, -3.049560546875, -2.6109619140625, -2.17236328125, -1.7337646484375, -1.295166015625, -0.8565673828125, -0.41796875, 0.0206298828125, 0.459228515625, 0.8978271484375, 1.33642578125, 1.7750244140625, 2.213623046875, 2.6522216796875, 3.0908203125, 3.5294189453125, 3.968017578125, 4.4066162109375, 4.84521484375, 5.2838134765625, 5.722412109375, 6.1610107421875, 6.599609375, 7.0382080078125, 7.476806640625, 7.9154052734375, 8.35400390625, 8.7926025390625, 9.231201171875, 9.6697998046875, 10.1083984375, 10.5469970703125, 10.985595703125, 11.4241943359375, 11.86279296875, 12.3013916015625, 12.739990234375, 13.1785888671875, 13.6171875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 3.0, 3.0, 4.0, 8.0, 8.0, 11.0, 6.0, 6.0, 5.0, 14.0, 21.0, 24.0, 23.0, 21.0, 20.0, 30.0, 32.0, 26.0, 56.0, 52.0, 82.0, 119.0, 219.0, 1517.0, 198.0, 102.0, 46.0, 54.0, 48.0, 33.0, 27.0, 31.0, 19.0, 24.0, 22.0, 16.0, 18.0, 14.0, 21.0, 8.0, 11.0, 9.0, 9.0, 8.0, 7.0, 4.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-28.671875, -27.75927734375, -26.8466796875, -25.93408203125, -25.021484375, -24.10888671875, -23.1962890625, -22.28369140625, -21.37109375, -20.45849609375, -19.5458984375, -18.63330078125, -17.720703125, -16.80810546875, -15.8955078125, -14.98291015625, -14.0703125, -13.15771484375, -12.2451171875, -11.33251953125, -10.419921875, -9.50732421875, -8.5947265625, -7.68212890625, -6.76953125, -5.85693359375, -4.9443359375, -4.03173828125, -3.119140625, -2.20654296875, -1.2939453125, -0.38134765625, 0.53125, 1.44384765625, 2.3564453125, 3.26904296875, 4.181640625, 5.09423828125, 6.0068359375, 6.91943359375, 7.83203125, 8.74462890625, 9.6572265625, 10.56982421875, 11.482421875, 12.39501953125, 13.3076171875, 14.22021484375, 15.1328125, 16.04541015625, 16.9580078125, 17.87060546875, 18.783203125, 19.69580078125, 20.6083984375, 21.52099609375, 22.43359375, 23.34619140625, 24.2587890625, 25.17138671875, 26.083984375, 26.99658203125, 27.9091796875, 28.82177734375, 29.734375]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 8.0, 8.0, 17.0, 12.0, 12.0, 17.0, 17.0, 29.0, 39.0, 44.0, 68.0, 137.0, 180.0, 317.0, 465.0, 860.0, 4877.0, 265748.0, 2840737.0, 28887.0, 1559.0, 612.0, 337.0, 232.0, 131.0, 99.0, 67.0, 47.0, 31.0, 31.0, 20.0, 15.0, 12.0, 7.0, 4.0, 2.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.53125, -56.38330078125, -54.2353515625, -52.08740234375, -49.939453125, -47.79150390625, -45.6435546875, -43.49560546875, -41.34765625, -39.19970703125, -37.0517578125, -34.90380859375, -32.755859375, -30.60791015625, -28.4599609375, -26.31201171875, -24.1640625, -22.01611328125, -19.8681640625, -17.72021484375, -15.572265625, -13.42431640625, -11.2763671875, -9.12841796875, -6.98046875, -4.83251953125, -2.6845703125, -0.53662109375, 1.611328125, 3.75927734375, 5.9072265625, 8.05517578125, 10.203125, 12.35107421875, 14.4990234375, 16.64697265625, 18.794921875, 20.94287109375, 23.0908203125, 25.23876953125, 27.38671875, 29.53466796875, 31.6826171875, 33.83056640625, 35.978515625, 38.12646484375, 40.2744140625, 42.42236328125, 44.5703125, 46.71826171875, 48.8662109375, 51.01416015625, 53.162109375, 55.31005859375, 57.4580078125, 59.60595703125, 61.75390625, 63.90185546875, 66.0498046875, 68.19775390625, 70.345703125, 72.49365234375, 74.6416015625, 76.78955078125, 78.9375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 8.0, 37.0, 52.0, 134.0, 209.0, 229.0, 164.0, 99.0, 53.0, 17.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.11601257324219, -66.57567596435547, -64.03533935546875, -61.49501037597656, -58.954673767089844, -56.414337158203125, -53.87400436401367, -51.33367156982422, -48.7933349609375, -46.25299835205078, -43.71266555786133, -41.172332763671875, -38.631996154785156, -36.09165954589844, -33.551326751708984, -31.0109920501709, -28.470657348632812, -25.930322647094727, -23.38998794555664, -20.849653244018555, -18.30931854248047, -15.768983840942383, -13.228649139404297, -10.688314437866211, -8.147979736328125, -5.607645034790039, -3.067310333251953, -0.5269756317138672, 2.0133590698242188, 4.553693771362305, 7.094028472900391, 9.634363174438477, 12.174697875976562, 14.715032577514648, 17.255367279052734, 19.79570198059082, 22.336036682128906, 24.876371383666992, 27.416706085205078, 29.957040786743164, 32.49737548828125, 35.03771209716797, 37.57804489135742, 40.118377685546875, 42.658714294433594, 45.19905090332031, 47.739383697509766, 50.27971649169922, 52.82005310058594, 55.360389709472656, 57.90072250366211, 60.44105529785156, 62.98139190673828, 65.521728515625, 68.06205749511719, 70.6023941040039, 73.14273071289062, 75.68306732177734, 78.22340393066406, 80.76373291015625, 83.30406951904297, 85.84440612792969, 88.38473510742188, 90.9250717163086, 93.46540832519531]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 7.0, 3.0, 5.0, 10.0, 6.0, 14.0, 7.0, 16.0, 15.0, 13.0, 20.0, 20.0, 27.0, 21.0, 22.0, 18.0, 29.0, 37.0, 33.0, 32.0, 37.0, 38.0, 37.0, 36.0, 41.0, 42.0, 49.0, 38.0, 37.0, 33.0, 35.0, 23.0, 30.0, 23.0, 20.0, 22.0, 18.0, 11.0, 7.0, 16.0, 8.0, 8.0, 9.0, 5.0, 8.0, 2.0, 4.0, 2.0, 7.0, 3.0, 2.0, 2.0, 0.0, 4.0], "bins": [-70.0136947631836, -67.9543685913086, -65.8950424194336, -63.83572006225586, -61.77639389038086, -59.71706771850586, -57.657745361328125, -55.598419189453125, -53.539093017578125, -51.479766845703125, -49.420440673828125, -47.36111831665039, -45.30179214477539, -43.24246597290039, -41.183143615722656, -39.123817443847656, -37.064491271972656, -35.005165100097656, -32.945838928222656, -30.886516571044922, -28.827190399169922, -26.767864227294922, -24.708539962768555, -22.649215698242188, -20.589889526367188, -18.530563354492188, -16.47123908996582, -14.411913871765137, -12.352588653564453, -10.29326343536377, -8.233938217163086, -6.174612998962402, -4.115287780761719, -2.055962562561035, 0.0033626556396484375, 2.062687873840332, 4.122013092041016, 6.181338310241699, 8.240663528442383, 10.299988746643066, 12.35931396484375, 14.418639183044434, 16.477964401245117, 18.537288665771484, 20.596614837646484, 22.655941009521484, 24.71526527404785, 26.77458953857422, 28.83391571044922, 30.89324188232422, 32.95256805419922, 35.01189041137695, 37.07121658325195, 39.13054275512695, 41.18986511230469, 43.24919128417969, 45.30851745605469, 47.36784362792969, 49.42716979980469, 51.48649215698242, 53.54581832885742, 55.60514450073242, 57.664466857910156, 59.723793029785156, 61.783119201660156]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 11.0, 6.0, 13.0, 10.0, 18.0, 23.0, 19.0, 20.0, 28.0, 35.0, 39.0, 36.0, 40.0, 35.0, 36.0, 48.0, 41.0, 60.0, 34.0, 58.0, 52.0, 39.0, 48.0, 39.0, 28.0, 28.0, 32.0, 28.0, 16.0, 12.0, 13.0, 12.0, 5.0, 11.0, 6.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.34375, -12.954345703125, -12.56494140625, -12.175537109375, -11.7861328125, -11.396728515625, -11.00732421875, -10.617919921875, -10.228515625, -9.839111328125, -9.44970703125, -9.060302734375, -8.6708984375, -8.281494140625, -7.89208984375, -7.502685546875, -7.11328125, -6.723876953125, -6.33447265625, -5.945068359375, -5.5556640625, -5.166259765625, -4.77685546875, -4.387451171875, -3.998046875, -3.608642578125, -3.21923828125, -2.829833984375, -2.4404296875, -2.051025390625, -1.66162109375, -1.272216796875, -0.8828125, -0.493408203125, -0.10400390625, 0.285400390625, 0.6748046875, 1.064208984375, 1.45361328125, 1.843017578125, 2.232421875, 2.621826171875, 3.01123046875, 3.400634765625, 3.7900390625, 4.179443359375, 4.56884765625, 4.958251953125, 5.34765625, 5.737060546875, 6.12646484375, 6.515869140625, 6.9052734375, 7.294677734375, 7.68408203125, 8.073486328125, 8.462890625, 8.852294921875, 9.24169921875, 9.631103515625, 10.0205078125, 10.409912109375, 10.79931640625, 11.188720703125, 11.578125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 5.0, 6.0, 7.0, 9.0, 8.0, 18.0, 15.0, 22.0, 24.0, 45.0, 46.0, 74.0, 100.0, 154.0, 255.0, 507.0, 986.0, 2425.0, 7829.0, 34535.0, 186863.0, 877943.0, 1825428.0, 980177.0, 222180.0, 40431.0, 9071.0, 2647.0, 1073.0, 541.0, 267.0, 143.0, 135.0, 90.0, 52.0, 34.0, 28.0, 23.0, 21.0, 12.0, 13.0, 11.0, 9.0, 9.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-14.640625, -14.1907958984375, -13.740966796875, -13.2911376953125, -12.84130859375, -12.3914794921875, -11.941650390625, -11.4918212890625, -11.0419921875, -10.5921630859375, -10.142333984375, -9.6925048828125, -9.24267578125, -8.7928466796875, -8.343017578125, -7.8931884765625, -7.443359375, -6.9935302734375, -6.543701171875, -6.0938720703125, -5.64404296875, -5.1942138671875, -4.744384765625, -4.2945556640625, -3.8447265625, -3.3948974609375, -2.945068359375, -2.4952392578125, -2.04541015625, -1.5955810546875, -1.145751953125, -0.6959228515625, -0.24609375, 0.2037353515625, 0.653564453125, 1.1033935546875, 1.55322265625, 2.0030517578125, 2.452880859375, 2.9027099609375, 3.3525390625, 3.8023681640625, 4.252197265625, 4.7020263671875, 5.15185546875, 5.6016845703125, 6.051513671875, 6.5013427734375, 6.951171875, 7.4010009765625, 7.850830078125, 8.3006591796875, 8.75048828125, 9.2003173828125, 9.650146484375, 10.0999755859375, 10.5498046875, 10.9996337890625, 11.449462890625, 11.8992919921875, 12.34912109375, 12.7989501953125, 13.248779296875, 13.6986083984375, 14.1484375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 6.0, 9.0, 11.0, 6.0, 21.0, 36.0, 43.0, 47.0, 75.0, 81.0, 109.0, 200.0, 229.0, 388.0, 442.0, 498.0, 444.0, 403.0, 303.0, 213.0, 140.0, 127.0, 66.0, 43.0, 39.0, 25.0, 23.0, 14.0, 9.0, 7.0, 8.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-18.953125, -18.435546875, -17.91796875, -17.400390625, -16.8828125, -16.365234375, -15.84765625, -15.330078125, -14.8125, -14.294921875, -13.77734375, -13.259765625, -12.7421875, -12.224609375, -11.70703125, -11.189453125, -10.671875, -10.154296875, -9.63671875, -9.119140625, -8.6015625, -8.083984375, -7.56640625, -7.048828125, -6.53125, -6.013671875, -5.49609375, -4.978515625, -4.4609375, -3.943359375, -3.42578125, -2.908203125, -2.390625, -1.873046875, -1.35546875, -0.837890625, -0.3203125, 0.197265625, 0.71484375, 1.232421875, 1.75, 2.267578125, 2.78515625, 3.302734375, 3.8203125, 4.337890625, 4.85546875, 5.373046875, 5.890625, 6.408203125, 6.92578125, 7.443359375, 7.9609375, 8.478515625, 8.99609375, 9.513671875, 10.03125, 10.548828125, 11.06640625, 11.583984375, 12.1015625, 12.619140625, 13.13671875, 13.654296875, 14.171875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 8.0, 8.0, 11.0, 17.0, 14.0, 48.0, 36.0, 80.0, 105.0, 207.0, 348.0, 680.0, 1737.0, 5279.0, 20509.0, 116384.0, 1144636.0, 2542105.0, 305497.0, 42473.0, 9195.0, 2658.0, 1080.0, 457.0, 260.0, 158.0, 92.0, 60.0, 30.0, 34.0, 15.0, 19.0, 11.0, 4.0, 10.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.203125, -24.444580078125, -23.68603515625, -22.927490234375, -22.1689453125, -21.410400390625, -20.65185546875, -19.893310546875, -19.134765625, -18.376220703125, -17.61767578125, -16.859130859375, -16.1005859375, -15.342041015625, -14.58349609375, -13.824951171875, -13.06640625, -12.307861328125, -11.54931640625, -10.790771484375, -10.0322265625, -9.273681640625, -8.51513671875, -7.756591796875, -6.998046875, -6.239501953125, -5.48095703125, -4.722412109375, -3.9638671875, -3.205322265625, -2.44677734375, -1.688232421875, -0.9296875, -0.171142578125, 0.58740234375, 1.345947265625, 2.1044921875, 2.863037109375, 3.62158203125, 4.380126953125, 5.138671875, 5.897216796875, 6.65576171875, 7.414306640625, 8.1728515625, 8.931396484375, 9.68994140625, 10.448486328125, 11.20703125, 11.965576171875, 12.72412109375, 13.482666015625, 14.2412109375, 14.999755859375, 15.75830078125, 16.516845703125, 17.275390625, 18.033935546875, 18.79248046875, 19.551025390625, 20.3095703125, 21.068115234375, 21.82666015625, 22.585205078125, 23.34375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 17.0, 200.0, 557.0, 223.0, 16.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-248.54029846191406, -238.80068969726562, -229.06106567382812, -219.3214569091797, -209.58184814453125, -199.8422393798828, -190.10263061523438, -180.36300659179688, -170.62339782714844, -160.8837890625, -151.1441650390625, -141.40455627441406, -131.66494750976562, -121.92533874511719, -112.18572235107422, -102.44610595703125, -92.70649719238281, -82.96688842773438, -73.2272720336914, -63.4876594543457, -53.748046875, -44.0084342956543, -34.268821716308594, -24.529205322265625, -14.789596557617188, -5.049983978271484, 4.689628601074219, 14.429241180419922, 24.168853759765625, 33.90846633911133, 43.64807891845703, 53.3876953125, 63.1273193359375, 72.86692810058594, 82.6065444946289, 92.34616088867188, 102.08576965332031, 111.82537841796875, 121.56499481201172, 131.3046112060547, 141.04421997070312, 150.78382873535156, 160.5234375, 170.2630615234375, 180.00267028808594, 189.74227905273438, 199.48190307617188, 209.2215118408203, 218.96112060546875, 228.7007293701172, 238.44033813476562, 248.17996215820312, 257.9195556640625, 267.6591796875, 277.3988037109375, 287.138427734375, 296.8780212402344, 306.6176452636719, 316.35723876953125, 326.09686279296875, 335.83648681640625, 345.5760803222656, 355.3157043457031, 365.0552978515625, 374.794921875]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 15.0, 8.0, 12.0, 13.0, 15.0, 19.0, 18.0, 30.0, 27.0, 28.0, 31.0, 29.0, 32.0, 47.0, 47.0, 51.0, 34.0, 47.0, 47.0, 49.0, 30.0, 43.0, 40.0, 30.0, 30.0, 34.0, 29.0, 34.0, 21.0, 19.0, 12.0, 15.0, 14.0, 9.0, 12.0, 5.0, 5.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-57.726356506347656, -55.976531982421875, -54.226707458496094, -52.47688293457031, -50.72705841064453, -48.97723388671875, -47.2274055480957, -45.47758102416992, -43.72775650024414, -41.97793197631836, -40.22810745239258, -38.4782829284668, -36.72845458984375, -34.97863006591797, -33.22880554199219, -31.478981018066406, -29.729156494140625, -27.979331970214844, -26.229507446289062, -24.47968101501465, -22.729856491088867, -20.980031967163086, -19.230205535888672, -17.48038101196289, -15.73055648803711, -13.980731964111328, -12.23090648651123, -10.481081008911133, -8.731256484985352, -6.98143196105957, -5.231606483459473, -3.481781005859375, -1.7319564819335938, 0.017868518829345703, 1.7676935195922852, 3.5175185203552246, 5.267343521118164, 7.017168045043945, 8.766993522644043, 10.51681900024414, 12.266643524169922, 14.016468048095703, 15.7662935256958, 17.5161190032959, 19.26594352722168, 21.01576805114746, 22.765594482421875, 24.515419006347656, 26.265243530273438, 28.01506805419922, 29.764892578125, 31.514719009399414, 33.26454162597656, 35.014366149902344, 36.76419448852539, 38.51401901245117, 40.26384353637695, 42.013668060302734, 43.763492584228516, 45.5133171081543, 47.263145446777344, 49.012969970703125, 50.762794494628906, 52.51261901855469, 54.26244354248047]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 5.0, 8.0, 5.0, 10.0, 10.0, 11.0, 16.0, 12.0, 19.0, 18.0, 21.0, 22.0, 27.0, 27.0, 36.0, 31.0, 42.0, 39.0, 39.0, 44.0, 46.0, 33.0, 41.0, 37.0, 37.0, 39.0, 39.0, 32.0, 28.0, 35.0, 24.0, 20.0, 26.0, 12.0, 16.0, 13.0, 13.0, 8.0, 7.0, 13.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-10.828125, -10.5028076171875, -10.177490234375, -9.8521728515625, -9.52685546875, -9.2015380859375, -8.876220703125, -8.5509033203125, -8.2255859375, -7.9002685546875, -7.574951171875, -7.2496337890625, -6.92431640625, -6.5989990234375, -6.273681640625, -5.9483642578125, -5.623046875, -5.2977294921875, -4.972412109375, -4.6470947265625, -4.32177734375, -3.9964599609375, -3.671142578125, -3.3458251953125, -3.0205078125, -2.6951904296875, -2.369873046875, -2.0445556640625, -1.71923828125, -1.3939208984375, -1.068603515625, -0.7432861328125, -0.41796875, -0.0926513671875, 0.232666015625, 0.5579833984375, 0.88330078125, 1.2086181640625, 1.533935546875, 1.8592529296875, 2.1845703125, 2.5098876953125, 2.835205078125, 3.1605224609375, 3.48583984375, 3.8111572265625, 4.136474609375, 4.4617919921875, 4.787109375, 5.1124267578125, 5.437744140625, 5.7630615234375, 6.08837890625, 6.4136962890625, 6.739013671875, 7.0643310546875, 7.3896484375, 7.7149658203125, 8.040283203125, 8.3656005859375, 8.69091796875, 9.0162353515625, 9.341552734375, 9.6668701171875, 9.9921875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 12.0, 9.0, 6.0, 19.0, 29.0, 41.0, 63.0, 82.0, 134.0, 221.0, 356.0, 594.0, 973.0, 1546.0, 2514.0, 4197.0, 6961.0, 11895.0, 19836.0, 35679.0, 66715.0, 140154.0, 333745.0, 218123.0, 92833.0, 47597.0, 26441.0, 15214.0, 8883.0, 5437.0, 3222.0, 1855.0, 1207.0, 747.0, 454.0, 298.0, 169.0, 119.0, 73.0, 38.0, 23.0, 14.0, 15.0, 4.0, 6.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1171875, -2.04351806640625, -1.9698486328125, -1.89617919921875, -1.822509765625, -1.74884033203125, -1.6751708984375, -1.60150146484375, -1.52783203125, -1.45416259765625, -1.3804931640625, -1.30682373046875, -1.233154296875, -1.15948486328125, -1.0858154296875, -1.01214599609375, -0.9384765625, -0.86480712890625, -0.7911376953125, -0.71746826171875, -0.643798828125, -0.57012939453125, -0.4964599609375, -0.42279052734375, -0.34912109375, -0.27545166015625, -0.2017822265625, -0.12811279296875, -0.054443359375, 0.01922607421875, 0.0928955078125, 0.16656494140625, 0.240234375, 0.31390380859375, 0.3875732421875, 0.46124267578125, 0.534912109375, 0.60858154296875, 0.6822509765625, 0.75592041015625, 0.82958984375, 0.90325927734375, 0.9769287109375, 1.05059814453125, 1.124267578125, 1.19793701171875, 1.2716064453125, 1.34527587890625, 1.4189453125, 1.49261474609375, 1.5662841796875, 1.63995361328125, 1.713623046875, 1.78729248046875, 1.8609619140625, 1.93463134765625, 2.00830078125, 2.08197021484375, 2.1556396484375, 2.22930908203125, 2.302978515625, 2.37664794921875, 2.4503173828125, 2.52398681640625, 2.59765625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 4.0, 2.0, 4.0, 6.0, 8.0, 12.0, 11.0, 14.0, 27.0, 18.0, 32.0, 27.0, 29.0, 32.0, 23.0, 40.0, 42.0, 34.0, 34.0, 35.0, 48.0, 1063.0, 45.0, 43.0, 41.0, 38.0, 36.0, 31.0, 29.0, 36.0, 28.0, 18.0, 15.0, 22.0, 23.0, 13.0, 10.0, 14.0, 7.0, 10.0, 4.0, 2.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.94921875, -6.73419189453125, -6.5191650390625, -6.30413818359375, -6.089111328125, -5.87408447265625, -5.6590576171875, -5.44403076171875, -5.22900390625, -5.01397705078125, -4.7989501953125, -4.58392333984375, -4.368896484375, -4.15386962890625, -3.9388427734375, -3.72381591796875, -3.5087890625, -3.29376220703125, -3.0787353515625, -2.86370849609375, -2.648681640625, -2.43365478515625, -2.2186279296875, -2.00360107421875, -1.78857421875, -1.57354736328125, -1.3585205078125, -1.14349365234375, -0.928466796875, -0.71343994140625, -0.4984130859375, -0.28338623046875, -0.068359375, 0.14666748046875, 0.3616943359375, 0.57672119140625, 0.791748046875, 1.00677490234375, 1.2218017578125, 1.43682861328125, 1.65185546875, 1.86688232421875, 2.0819091796875, 2.29693603515625, 2.511962890625, 2.72698974609375, 2.9420166015625, 3.15704345703125, 3.3720703125, 3.58709716796875, 3.8021240234375, 4.01715087890625, 4.232177734375, 4.44720458984375, 4.6622314453125, 4.87725830078125, 5.09228515625, 5.30731201171875, 5.5223388671875, 5.73736572265625, 5.952392578125, 6.16741943359375, 6.3824462890625, 6.59747314453125, 6.8125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 5.0, 5.0, 8.0, 12.0, 15.0, 34.0, 45.0, 61.0, 113.0, 122.0, 155.0, 248.0, 353.0, 529.0, 739.0, 1014.0, 1506.0, 2406.0, 3570.0, 5246.0, 7964.0, 12338.0, 19112.0, 30163.0, 48486.0, 82960.0, 158891.0, 1327189.0, 168320.0, 86730.0, 50209.0, 31383.0, 19769.0, 12837.0, 8158.0, 5545.0, 3494.0, 2307.0, 1575.0, 1129.0, 757.0, 459.0, 364.0, 227.0, 166.0, 121.0, 85.0, 67.0, 39.0, 36.0, 23.0, 21.0, 11.0, 8.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.6533203125, -1.59918212890625, -1.5450439453125, -1.49090576171875, -1.436767578125, -1.38262939453125, -1.3284912109375, -1.27435302734375, -1.22021484375, -1.16607666015625, -1.1119384765625, -1.05780029296875, -1.003662109375, -0.94952392578125, -0.8953857421875, -0.84124755859375, -0.787109375, -0.73297119140625, -0.6788330078125, -0.62469482421875, -0.570556640625, -0.51641845703125, -0.4622802734375, -0.40814208984375, -0.35400390625, -0.29986572265625, -0.2457275390625, -0.19158935546875, -0.137451171875, -0.08331298828125, -0.0291748046875, 0.02496337890625, 0.0791015625, 0.13323974609375, 0.1873779296875, 0.24151611328125, 0.295654296875, 0.34979248046875, 0.4039306640625, 0.45806884765625, 0.51220703125, 0.56634521484375, 0.6204833984375, 0.67462158203125, 0.728759765625, 0.78289794921875, 0.8370361328125, 0.89117431640625, 0.9453125, 0.99945068359375, 1.0535888671875, 1.10772705078125, 1.161865234375, 1.21600341796875, 1.2701416015625, 1.32427978515625, 1.37841796875, 1.43255615234375, 1.4866943359375, 1.54083251953125, 1.594970703125, 1.64910888671875, 1.7032470703125, 1.75738525390625, 1.8115234375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 7.0, 3.0, 9.0, 5.0, 5.0, 10.0, 9.0, 19.0, 15.0, 18.0, 26.0, 30.0, 35.0, 38.0, 54.0, 56.0, 65.0, 68.0, 61.0, 90.0, 77.0, 57.0, 39.0, 45.0, 22.0, 24.0, 24.0, 16.0, 7.0, 11.0, 13.0, 11.0, 7.0, 6.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023708343505859375, -0.002284109592437744, -0.0021973848342895508, -0.0021106600761413574, -0.002023935317993164, -0.0019372105598449707, -0.0018504858016967773, -0.001763761043548584, -0.0016770362854003906, -0.0015903115272521973, -0.001503586769104004, -0.0014168620109558105, -0.0013301372528076172, -0.0012434124946594238, -0.0011566877365112305, -0.0010699629783630371, -0.0009832382202148438, -0.0008965134620666504, -0.000809788703918457, -0.0007230639457702637, -0.0006363391876220703, -0.000549614429473877, -0.0004628896713256836, -0.00037616491317749023, -0.0002894401550292969, -0.00020271539688110352, -0.00011599063873291016, -2.9265880584716797e-05, 5.745887756347656e-05, 0.00014418363571166992, 0.00023090839385986328, 0.00031763315200805664, 0.00040435791015625, 0.0004910826683044434, 0.0005778074264526367, 0.0006645321846008301, 0.0007512569427490234, 0.0008379817008972168, 0.0009247064590454102, 0.0010114312171936035, 0.0010981559753417969, 0.0011848807334899902, 0.0012716054916381836, 0.001358330249786377, 0.0014450550079345703, 0.0015317797660827637, 0.001618504524230957, 0.0017052292823791504, 0.0017919540405273438, 0.0018786787986755371, 0.0019654035568237305, 0.002052128314971924, 0.002138853073120117, 0.0022255778312683105, 0.002312302589416504, 0.0023990273475646973, 0.0024857521057128906, 0.002572476863861084, 0.0026592016220092773, 0.0027459263801574707, 0.002832651138305664, 0.0029193758964538574, 0.0030061006546020508, 0.003092825412750244, 0.0031795501708984375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 3.0, 3.0, 9.0, 7.0, 9.0, 13.0, 18.0, 18.0, 28.0, 22.0, 37.0, 49.0, 71.0, 77.0, 132.0, 202.0, 337.0, 593.0, 1797.0, 958040.0, 84551.0, 1077.0, 490.0, 269.0, 185.0, 121.0, 97.0, 64.0, 40.0, 36.0, 33.0, 26.0, 14.0, 16.0, 10.0, 13.0, 12.0, 10.0, 7.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-0.0601806640625, -0.05854654312133789, -0.05691242218017578, -0.05527830123901367, -0.05364418029785156, -0.05201005935668945, -0.050375938415527344, -0.048741817474365234, -0.047107696533203125, -0.045473575592041016, -0.043839454650878906, -0.0422053337097168, -0.04057121276855469, -0.03893709182739258, -0.03730297088623047, -0.03566884994506836, -0.03403472900390625, -0.03240060806274414, -0.03076648712158203, -0.029132366180419922, -0.027498245239257812, -0.025864124298095703, -0.024230003356933594, -0.022595882415771484, -0.020961761474609375, -0.019327640533447266, -0.017693519592285156, -0.016059398651123047, -0.014425277709960938, -0.012791156768798828, -0.011157035827636719, -0.00952291488647461, -0.0078887939453125, -0.006254673004150391, -0.004620552062988281, -0.002986431121826172, -0.0013523101806640625, 0.0002818107604980469, 0.0019159317016601562, 0.0035500526428222656, 0.005184173583984375, 0.006818294525146484, 0.008452415466308594, 0.010086536407470703, 0.011720657348632812, 0.013354778289794922, 0.014988899230957031, 0.01662302017211914, 0.01825714111328125, 0.01989126205444336, 0.02152538299560547, 0.023159503936767578, 0.024793624877929688, 0.026427745819091797, 0.028061866760253906, 0.029695987701416016, 0.031330108642578125, 0.032964229583740234, 0.034598350524902344, 0.03623247146606445, 0.03786659240722656, 0.03950071334838867, 0.04113483428955078, 0.04276895523071289, 0.044403076171875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 6.0, 13.0, 35.0, 78.0, 157.0, 212.0, 187.0, 178.0, 83.0, 44.0, 13.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.003763421904295683, -0.0036912220530211926, -0.003619022434577346, -0.0035468225833028555, -0.003474622732028365, -0.0034024231135845184, -0.003330223262310028, -0.0032580234110355377, -0.0031858235597610474, -0.003113623708486557, -0.0030414240900427103, -0.00296922423876822, -0.0028970243874937296, -0.002824824769049883, -0.0027526249177753925, -0.002680425066500902, -0.0026082254480570555, -0.002536025596782565, -0.0024638259783387184, -0.002391626127064228, -0.0023194262757897377, -0.0022472264245152473, -0.0021750268060714006, -0.0021028269547969103, -0.0020306273363530636, -0.0019584274850785732, -0.0018862277502194047, -0.0018140280153602362, -0.0017418281640857458, -0.0016696284292265773, -0.0015974286943674088, -0.0015252288430929184, -0.0014530288754031062, -0.0013808291405439377, -0.0013086292892694473, -0.0012364295544102788, -0.0011642298195511103, -0.00109202996827662, -0.0010198302334174514, -0.0009476304403506219, -0.0008754306472837925, -0.000803230854216963, -0.0007310310611501336, -0.0006588313262909651, -0.0005866315332241356, -0.0005144317401573062, -0.0004422319761943072, -0.0003700322122313082, -0.0002978324191644788, -0.00022563264064956456, -0.00015343286213465035, -8.123308361973614e-05, -9.03330510482192e-06, 6.316648796200752e-05, 0.0001353662519250065, 0.0002075660158880055, 0.00027976580895483494, 0.0003519656020216644, 0.00042416536598466337, 0.0004963651299476624, 0.0005685649230144918, 0.0006407647160813212, 0.0007129644509404898, 0.0007851642440073192, 0.0008573640370741487]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 8.0, 6.0, 7.0, 10.0, 11.0, 13.0, 10.0, 17.0, 15.0, 25.0, 25.0, 28.0, 27.0, 31.0, 38.0, 27.0, 33.0, 29.0, 42.0, 44.0, 34.0, 40.0, 42.0, 38.0, 40.0, 39.0, 32.0, 38.0, 29.0, 30.0, 32.0, 22.0, 27.0, 20.0, 15.0, 17.0, 5.0, 12.0, 10.0, 11.0, 5.0, 4.0, 4.0, 1.0, 0.0, 4.0, 6.0, 2.0, 2.0], "bins": [-0.0014423131942749023, -0.0014021145179867744, -0.0013619158416986465, -0.0013217171654105186, -0.0012815184891223907, -0.0012413198128342628, -0.001201121136546135, -0.001160922460258007, -0.0011207237839698792, -0.0010805251076817513, -0.0010403264313936234, -0.0010001277551054955, -0.0009599290788173676, -0.0009197304025292397, -0.0008795317262411118, -0.0008393330499529839, -0.000799134373664856, -0.0007589356973767281, -0.0007187370210886002, -0.0006785383448004723, -0.0006383396685123444, -0.0005981409922242165, -0.0005579423159360886, -0.0005177436396479607, -0.00047754496335983276, -0.00043734628707170486, -0.00039714761078357697, -0.00035694893449544907, -0.00031675025820732117, -0.00027655158191919327, -0.00023635290563106537, -0.00019615422934293747, -0.00015595555305480957, -0.00011575687676668167, -7.555820047855377e-05, -3.535952419042587e-05, 4.839152097702026e-06, 4.5037828385829926e-05, 8.523650467395782e-05, 0.00012543518096208572, 0.00016563385725021362, 0.00020583253353834152, 0.0002460312098264694, 0.0002862298861145973, 0.0003264285624027252, 0.0003666272386908531, 0.000406825914978981, 0.0004470245912671089, 0.0004872232675552368, 0.0005274219438433647, 0.0005676206201314926, 0.0006078192964196205, 0.0006480179727077484, 0.0006882166489958763, 0.0007284153252840042, 0.0007686140015721321, 0.00080881267786026, 0.0008490113541483879, 0.0008892100304365158, 0.0009294087067246437, 0.0009696073830127716, 0.0010098060593008995, 0.0010500047355890274, 0.0010902034118771553, 0.0011304020881652832]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 5.0, 8.0, 5.0, 10.0, 10.0, 11.0, 16.0, 12.0, 19.0, 18.0, 21.0, 22.0, 27.0, 27.0, 36.0, 31.0, 42.0, 39.0, 39.0, 44.0, 46.0, 33.0, 41.0, 37.0, 37.0, 39.0, 39.0, 32.0, 28.0, 35.0, 24.0, 20.0, 26.0, 12.0, 16.0, 13.0, 13.0, 8.0, 7.0, 13.0, 7.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-10.828125, -10.5028076171875, -10.177490234375, -9.8521728515625, -9.52685546875, -9.2015380859375, -8.876220703125, -8.5509033203125, -8.2255859375, -7.9002685546875, -7.574951171875, -7.2496337890625, -6.92431640625, -6.5989990234375, -6.273681640625, -5.9483642578125, -5.623046875, -5.2977294921875, -4.972412109375, -4.6470947265625, -4.32177734375, -3.9964599609375, -3.671142578125, -3.3458251953125, -3.0205078125, -2.6951904296875, -2.369873046875, -2.0445556640625, -1.71923828125, -1.3939208984375, -1.068603515625, -0.7432861328125, -0.41796875, -0.0926513671875, 0.232666015625, 0.5579833984375, 0.88330078125, 1.2086181640625, 1.533935546875, 1.8592529296875, 2.1845703125, 2.5098876953125, 2.835205078125, 3.1605224609375, 3.48583984375, 3.8111572265625, 4.136474609375, 4.4617919921875, 4.787109375, 5.1124267578125, 5.437744140625, 5.7630615234375, 6.08837890625, 6.4136962890625, 6.739013671875, 7.0643310546875, 7.3896484375, 7.7149658203125, 8.040283203125, 8.3656005859375, 8.69091796875, 9.0162353515625, 9.341552734375, 9.6668701171875, 9.9921875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 5.0, 10.0, 10.0, 18.0, 9.0, 15.0, 28.0, 34.0, 51.0, 59.0, 78.0, 100.0, 104.0, 172.0, 182.0, 287.0, 398.0, 652.0, 1074.0, 1949.0, 3914.0, 9524.0, 26620.0, 75934.0, 210137.0, 370306.0, 220045.0, 79751.0, 27622.0, 10000.0, 4016.0, 2066.0, 1099.0, 696.0, 418.0, 273.0, 217.0, 158.0, 122.0, 73.0, 85.0, 49.0, 41.0, 37.0, 31.0, 33.0, 20.0, 12.0, 7.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-13.4296875, -13.003662109375, -12.57763671875, -12.151611328125, -11.7255859375, -11.299560546875, -10.87353515625, -10.447509765625, -10.021484375, -9.595458984375, -9.16943359375, -8.743408203125, -8.3173828125, -7.891357421875, -7.46533203125, -7.039306640625, -6.61328125, -6.187255859375, -5.76123046875, -5.335205078125, -4.9091796875, -4.483154296875, -4.05712890625, -3.631103515625, -3.205078125, -2.779052734375, -2.35302734375, -1.927001953125, -1.5009765625, -1.074951171875, -0.64892578125, -0.222900390625, 0.203125, 0.629150390625, 1.05517578125, 1.481201171875, 1.9072265625, 2.333251953125, 2.75927734375, 3.185302734375, 3.611328125, 4.037353515625, 4.46337890625, 4.889404296875, 5.3154296875, 5.741455078125, 6.16748046875, 6.593505859375, 7.01953125, 7.445556640625, 7.87158203125, 8.297607421875, 8.7236328125, 9.149658203125, 9.57568359375, 10.001708984375, 10.427734375, 10.853759765625, 11.27978515625, 11.705810546875, 12.1318359375, 12.557861328125, 12.98388671875, 13.409912109375, 13.8359375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 1.0, 6.0, 0.0, 5.0, 5.0, 7.0, 5.0, 8.0, 12.0, 16.0, 20.0, 22.0, 30.0, 40.0, 41.0, 45.0, 41.0, 77.0, 71.0, 197.0, 329.0, 1397.0, 190.0, 102.0, 72.0, 55.0, 42.0, 38.0, 25.0, 36.0, 22.0, 20.0, 11.0, 18.0, 14.0, 9.0, 9.0, 3.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.359375, -30.318603515625, -29.27783203125, -28.237060546875, -27.1962890625, -26.155517578125, -25.11474609375, -24.073974609375, -23.033203125, -21.992431640625, -20.95166015625, -19.910888671875, -18.8701171875, -17.829345703125, -16.78857421875, -15.747802734375, -14.70703125, -13.666259765625, -12.62548828125, -11.584716796875, -10.5439453125, -9.503173828125, -8.46240234375, -7.421630859375, -6.380859375, -5.340087890625, -4.29931640625, -3.258544921875, -2.2177734375, -1.177001953125, -0.13623046875, 0.904541015625, 1.9453125, 2.986083984375, 4.02685546875, 5.067626953125, 6.1083984375, 7.149169921875, 8.18994140625, 9.230712890625, 10.271484375, 11.312255859375, 12.35302734375, 13.393798828125, 14.4345703125, 15.475341796875, 16.51611328125, 17.556884765625, 18.59765625, 19.638427734375, 20.67919921875, 21.719970703125, 22.7607421875, 23.801513671875, 24.84228515625, 25.883056640625, 26.923828125, 27.964599609375, 29.00537109375, 30.046142578125, 31.0869140625, 32.127685546875, 33.16845703125, 34.209228515625, 35.25]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 3.0, 3.0, 4.0, 9.0, 9.0, 18.0, 24.0, 27.0, 25.0, 35.0, 49.0, 69.0, 113.0, 180.0, 238.0, 403.0, 739.0, 1780.0, 32790.0, 2975149.0, 128757.0, 3011.0, 842.0, 512.0, 290.0, 183.0, 121.0, 88.0, 54.0, 36.0, 35.0, 26.0, 22.0, 21.0, 6.0, 6.0, 3.0, 3.0, 3.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-63.03125, -60.83056640625, -58.6298828125, -56.42919921875, -54.228515625, -52.02783203125, -49.8271484375, -47.62646484375, -45.42578125, -43.22509765625, -41.0244140625, -38.82373046875, -36.623046875, -34.42236328125, -32.2216796875, -30.02099609375, -27.8203125, -25.61962890625, -23.4189453125, -21.21826171875, -19.017578125, -16.81689453125, -14.6162109375, -12.41552734375, -10.21484375, -8.01416015625, -5.8134765625, -3.61279296875, -1.412109375, 0.78857421875, 2.9892578125, 5.18994140625, 7.390625, 9.59130859375, 11.7919921875, 13.99267578125, 16.193359375, 18.39404296875, 20.5947265625, 22.79541015625, 24.99609375, 27.19677734375, 29.3974609375, 31.59814453125, 33.798828125, 35.99951171875, 38.2001953125, 40.40087890625, 42.6015625, 44.80224609375, 47.0029296875, 49.20361328125, 51.404296875, 53.60498046875, 55.8056640625, 58.00634765625, 60.20703125, 62.40771484375, 64.6083984375, 66.80908203125, 69.009765625, 71.21044921875, 73.4111328125, 75.61181640625, 77.8125]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [2.0, 5.0, 40.0, 229.0, 464.0, 236.0, 38.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.76854133605957, -19.154367446899414, -13.540193557739258, -7.926019668579102, -2.3118457794189453, 3.302328109741211, 8.916501998901367, 14.530675888061523, 20.14484977722168, 25.759023666381836, 31.373197555541992, 36.98737335205078, 42.60154724121094, 48.215721130371094, 53.82989501953125, 59.444068908691406, 65.05824279785156, 70.67241668701172, 76.28659057617188, 81.90076446533203, 87.51493835449219, 93.12911224365234, 98.7432861328125, 104.35746002197266, 109.97163391113281, 115.58580780029297, 121.19998168945312, 126.81415557861328, 132.42832946777344, 138.04251098632812, 143.65667724609375, 149.27084350585938, 154.885009765625, 160.49917602539062, 166.1133575439453, 171.7275390625, 177.34170532226562, 182.95587158203125, 188.57005310058594, 194.18423461914062, 199.79840087890625, 205.41256713867188, 211.02674865722656, 216.64093017578125, 222.25509643554688, 227.8692626953125, 233.4834442138672, 239.09762573242188, 244.7117919921875, 250.32595825195312, 255.9401397705078, 261.5543212890625, 267.1684875488281, 272.78265380859375, 278.3968505859375, 284.0110168457031, 289.62518310546875, 295.2393493652344, 300.853515625, 306.46771240234375, 312.0818786621094, 317.696044921875, 323.31024169921875, 328.9244079589844, 334.53857421875]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 7.0, 2.0, 11.0, 11.0, 8.0, 16.0, 14.0, 19.0, 19.0, 26.0, 37.0, 36.0, 34.0, 34.0, 52.0, 44.0, 31.0, 38.0, 44.0, 48.0, 36.0, 37.0, 42.0, 43.0, 35.0, 38.0, 26.0, 38.0, 34.0, 26.0, 34.0, 19.0, 17.0, 16.0, 8.0, 13.0, 5.0, 6.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.93299102783203, -56.68267059326172, -54.432350158691406, -52.182029724121094, -49.93170928955078, -47.68138885498047, -45.431068420410156, -43.180747985839844, -40.93042755126953, -38.68010711669922, -36.429786682128906, -34.179466247558594, -31.92914581298828, -29.67882537841797, -27.428504943847656, -25.178184509277344, -22.92786407470703, -20.67754364013672, -18.427223205566406, -16.176902770996094, -13.926582336425781, -11.676261901855469, -9.425941467285156, -7.175621032714844, -4.925300598144531, -2.6749801635742188, -0.42465972900390625, 1.8256607055664062, 4.075981140136719, 6.326301574707031, 8.576622009277344, 10.826942443847656, 13.077255249023438, 15.32757568359375, 17.577896118164062, 19.828216552734375, 22.078536987304688, 24.328857421875, 26.579177856445312, 28.829498291015625, 31.079818725585938, 33.33013916015625, 35.58045959472656, 37.830780029296875, 40.08110046386719, 42.3314208984375, 44.58174133300781, 46.832061767578125, 49.08238220214844, 51.33270263671875, 53.58302307128906, 55.833343505859375, 58.08366394042969, 60.333984375, 62.58430480957031, 64.83462524414062, 67.08494567871094, 69.33526611328125, 71.58558654785156, 73.83590698242188, 76.08622741699219, 78.3365478515625, 80.58686828613281, 82.83718872070312, 85.08750915527344]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 10.0, 4.0, 6.0, 5.0, 9.0, 18.0, 14.0, 16.0, 15.0, 13.0, 22.0, 16.0, 33.0, 34.0, 47.0, 32.0, 29.0, 38.0, 46.0, 51.0, 40.0, 46.0, 43.0, 42.0, 40.0, 33.0, 53.0, 39.0, 36.0, 28.0, 26.0, 23.0, 16.0, 11.0, 13.0, 16.0, 6.0, 7.0, 5.0, 11.0, 7.0, 4.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0234375, -12.651611328125, -12.27978515625, -11.907958984375, -11.5361328125, -11.164306640625, -10.79248046875, -10.420654296875, -10.048828125, -9.677001953125, -9.30517578125, -8.933349609375, -8.5615234375, -8.189697265625, -7.81787109375, -7.446044921875, -7.07421875, -6.702392578125, -6.33056640625, -5.958740234375, -5.5869140625, -5.215087890625, -4.84326171875, -4.471435546875, -4.099609375, -3.727783203125, -3.35595703125, -2.984130859375, -2.6123046875, -2.240478515625, -1.86865234375, -1.496826171875, -1.125, -0.753173828125, -0.38134765625, -0.009521484375, 0.3623046875, 0.734130859375, 1.10595703125, 1.477783203125, 1.849609375, 2.221435546875, 2.59326171875, 2.965087890625, 3.3369140625, 3.708740234375, 4.08056640625, 4.452392578125, 4.82421875, 5.196044921875, 5.56787109375, 5.939697265625, 6.3115234375, 6.683349609375, 7.05517578125, 7.427001953125, 7.798828125, 8.170654296875, 8.54248046875, 8.914306640625, 9.2861328125, 9.657958984375, 10.02978515625, 10.401611328125, 10.7734375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 5.0, 4.0, 6.0, 9.0, 7.0, 8.0, 14.0, 17.0, 25.0, 24.0, 35.0, 29.0, 48.0, 63.0, 78.0, 116.0, 136.0, 202.0, 268.0, 337.0, 438.0, 1460.0, 3281591.0, 906614.0, 990.0, 391.0, 305.0, 251.0, 172.0, 157.0, 103.0, 70.0, 59.0, 53.0, 40.0, 34.0, 19.0, 24.0, 12.0, 12.0, 14.0, 13.0, 7.0, 8.0, 8.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-124.5, -120.7177734375, -116.935546875, -113.1533203125, -109.37109375, -105.5888671875, -101.806640625, -98.0244140625, -94.2421875, -90.4599609375, -86.677734375, -82.8955078125, -79.11328125, -75.3310546875, -71.548828125, -67.7666015625, -63.984375, -60.2021484375, -56.419921875, -52.6376953125, -48.85546875, -45.0732421875, -41.291015625, -37.5087890625, -33.7265625, -29.9443359375, -26.162109375, -22.3798828125, -18.59765625, -14.8154296875, -11.033203125, -7.2509765625, -3.46875, 0.3134765625, 4.095703125, 7.8779296875, 11.66015625, 15.4423828125, 19.224609375, 23.0068359375, 26.7890625, 30.5712890625, 34.353515625, 38.1357421875, 41.91796875, 45.7001953125, 49.482421875, 53.2646484375, 57.046875, 60.8291015625, 64.611328125, 68.3935546875, 72.17578125, 75.9580078125, 79.740234375, 83.5224609375, 87.3046875, 91.0869140625, 94.869140625, 98.6513671875, 102.43359375, 106.2158203125, 109.998046875, 113.7802734375, 117.5625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 1.0, 6.0, 5.0, 4.0, 7.0, 9.0, 11.0, 19.0, 16.0, 20.0, 38.0, 51.0, 66.0, 93.0, 124.0, 159.0, 224.0, 312.0, 424.0, 512.0, 519.0, 377.0, 278.0, 234.0, 170.0, 96.0, 79.0, 52.0, 51.0, 18.0, 27.0, 13.0, 13.0, 11.0, 12.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 6.0, 1.0, 0.0, 1.0], "bins": [-21.171875, -20.627197265625, -20.08251953125, -19.537841796875, -18.9931640625, -18.448486328125, -17.90380859375, -17.359130859375, -16.814453125, -16.269775390625, -15.72509765625, -15.180419921875, -14.6357421875, -14.091064453125, -13.54638671875, -13.001708984375, -12.45703125, -11.912353515625, -11.36767578125, -10.822998046875, -10.2783203125, -9.733642578125, -9.18896484375, -8.644287109375, -8.099609375, -7.554931640625, -7.01025390625, -6.465576171875, -5.9208984375, -5.376220703125, -4.83154296875, -4.286865234375, -3.7421875, -3.197509765625, -2.65283203125, -2.108154296875, -1.5634765625, -1.018798828125, -0.47412109375, 0.070556640625, 0.615234375, 1.159912109375, 1.70458984375, 2.249267578125, 2.7939453125, 3.338623046875, 3.88330078125, 4.427978515625, 4.97265625, 5.517333984375, 6.06201171875, 6.606689453125, 7.1513671875, 7.696044921875, 8.24072265625, 8.785400390625, 9.330078125, 9.874755859375, 10.41943359375, 10.964111328125, 11.5087890625, 12.053466796875, 12.59814453125, 13.142822265625, 13.6875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 10.0, 8.0, 14.0, 18.0, 19.0, 24.0, 27.0, 37.0, 54.0, 61.0, 147.0, 342.0, 1528.0, 138800.0, 4032529.0, 19301.0, 759.0, 239.0, 102.0, 58.0, 49.0, 36.0, 30.0, 19.0, 22.0, 15.0, 6.0, 10.0, 7.0, 8.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.375, -61.4921875, -58.609375, -55.7265625, -52.84375, -49.9609375, -47.078125, -44.1953125, -41.3125, -38.4296875, -35.546875, -32.6640625, -29.78125, -26.8984375, -24.015625, -21.1328125, -18.25, -15.3671875, -12.484375, -9.6015625, -6.71875, -3.8359375, -0.953125, 1.9296875, 4.8125, 7.6953125, 10.578125, 13.4609375, 16.34375, 19.2265625, 22.109375, 24.9921875, 27.875, 30.7578125, 33.640625, 36.5234375, 39.40625, 42.2890625, 45.171875, 48.0546875, 50.9375, 53.8203125, 56.703125, 59.5859375, 62.46875, 65.3515625, 68.234375, 71.1171875, 74.0, 76.8828125, 79.765625, 82.6484375, 85.53125, 88.4140625, 91.296875, 94.1796875, 97.0625, 99.9453125, 102.828125, 105.7109375, 108.59375, 111.4765625, 114.359375, 117.2421875, 120.125]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 102.0, 679.0, 220.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-422.70098876953125, -410.1365966796875, -397.5722351074219, -385.00787353515625, -372.4434814453125, -359.87908935546875, -347.3147277832031, -334.7503662109375, -322.18597412109375, -309.62158203125, -297.0572204589844, -284.49285888671875, -271.928466796875, -259.36407470703125, -246.79971313476562, -234.23533630371094, -221.67095947265625, -209.10658264160156, -196.54220581054688, -183.9778289794922, -171.4134521484375, -158.8490753173828, -146.28469848632812, -133.72032165527344, -121.15594482421875, -108.59156799316406, -96.02719116210938, -83.46281433105469, -70.8984375, -58.33406066894531, -45.769683837890625, -33.20530700683594, -20.64093017578125, -8.076553344726562, 4.487823486328125, 17.052200317382812, 29.6165771484375, 42.18095397949219, 54.745330810546875, 67.30970764160156, 79.87408447265625, 92.43846130371094, 105.00283813476562, 117.56721496582031, 130.131591796875, 142.6959686279297, 155.26034545898438, 167.82472229003906, 180.38909912109375, 192.95347595214844, 205.51785278320312, 218.0822296142578, 230.6466064453125, 243.2109832763672, 255.77536010742188, 268.3397216796875, 280.90411376953125, 293.468505859375, 306.0328674316406, 318.59722900390625, 331.16162109375, 343.72601318359375, 356.2903747558594, 368.854736328125, 381.41912841796875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 11.0, 6.0, 6.0, 8.0, 12.0, 7.0, 8.0, 9.0, 15.0, 18.0, 17.0, 22.0, 32.0, 25.0, 18.0, 34.0, 24.0, 30.0, 42.0, 28.0, 37.0, 39.0, 36.0, 47.0, 35.0, 26.0, 40.0, 39.0, 40.0, 36.0, 25.0, 33.0, 21.0, 22.0, 21.0, 16.0, 16.0, 12.0, 17.0, 13.0, 10.0, 11.0, 6.0, 8.0, 5.0, 5.0, 4.0, 8.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0], "bins": [-55.753265380859375, -54.11888885498047, -52.48451232910156, -50.850135803222656, -49.21575927734375, -47.581382751464844, -45.94700622558594, -44.31262969970703, -42.678253173828125, -41.04387664794922, -39.40950012207031, -37.775123596191406, -36.1407470703125, -34.506370544433594, -32.87199401855469, -31.23761749267578, -29.603239059448242, -27.968862533569336, -26.33448600769043, -24.700109481811523, -23.065732955932617, -21.431354522705078, -19.796977996826172, -18.162601470947266, -16.52822494506836, -14.893848419189453, -13.259471893310547, -11.62509536743164, -9.990718841552734, -8.356341361999512, -6.7219648361206055, -5.087588310241699, -3.4532127380371094, -1.8188360929489136, -0.18445944786071777, 1.4499173164367676, 3.084293842315674, 4.718670845031738, 6.3530473709106445, 7.987423896789551, 9.621800422668457, 11.256176948547363, 12.89055347442627, 14.524930953979492, 16.1593074798584, 17.793684005737305, 19.42806053161621, 21.062437057495117, 22.696813583374023, 24.33119010925293, 25.965566635131836, 27.599943161010742, 29.23431968688965, 30.868698120117188, 32.503074645996094, 34.137451171875, 35.771827697753906, 37.40620422363281, 39.04058074951172, 40.674957275390625, 42.30933380126953, 43.94371032714844, 45.578086853027344, 47.21246337890625, 48.846839904785156]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 12.0, 10.0, 8.0, 13.0, 9.0, 14.0, 19.0, 26.0, 23.0, 31.0, 30.0, 17.0, 34.0, 35.0, 34.0, 31.0, 53.0, 39.0, 48.0, 40.0, 34.0, 32.0, 43.0, 37.0, 30.0, 35.0, 29.0, 36.0, 27.0, 20.0, 20.0, 24.0, 17.0, 10.0, 9.0, 11.0, 10.0, 9.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0], "bins": [-11.8984375, -11.5672607421875, -11.236083984375, -10.9049072265625, -10.57373046875, -10.2425537109375, -9.911376953125, -9.5802001953125, -9.2490234375, -8.9178466796875, -8.586669921875, -8.2554931640625, -7.92431640625, -7.5931396484375, -7.261962890625, -6.9307861328125, -6.599609375, -6.2684326171875, -5.937255859375, -5.6060791015625, -5.27490234375, -4.9437255859375, -4.612548828125, -4.2813720703125, -3.9501953125, -3.6190185546875, -3.287841796875, -2.9566650390625, -2.62548828125, -2.2943115234375, -1.963134765625, -1.6319580078125, -1.30078125, -0.9696044921875, -0.638427734375, -0.3072509765625, 0.02392578125, 0.3551025390625, 0.686279296875, 1.0174560546875, 1.3486328125, 1.6798095703125, 2.010986328125, 2.3421630859375, 2.67333984375, 3.0045166015625, 3.335693359375, 3.6668701171875, 3.998046875, 4.3292236328125, 4.660400390625, 4.9915771484375, 5.32275390625, 5.6539306640625, 5.985107421875, 6.3162841796875, 6.6474609375, 6.9786376953125, 7.309814453125, 7.6409912109375, 7.97216796875, 8.3033447265625, 8.634521484375, 8.9656982421875, 9.296875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 9.0, 14.0, 22.0, 31.0, 42.0, 59.0, 113.0, 132.0, 195.0, 284.0, 388.0, 638.0, 968.0, 1394.0, 2167.0, 3307.0, 5204.0, 8034.0, 13121.0, 21440.0, 36022.0, 64476.0, 124508.0, 270279.0, 240064.0, 110630.0, 58633.0, 33040.0, 19689.0, 12179.0, 7404.0, 4907.0, 3124.0, 2008.0, 1326.0, 840.0, 599.0, 404.0, 283.0, 166.0, 132.0, 83.0, 68.0, 43.0, 33.0, 19.0, 9.0, 10.0, 7.0, 0.0, 1.0, 2.0, 1.0, 4.0], "bins": [-2.244140625, -2.177978515625, -2.11181640625, -2.045654296875, -1.9794921875, -1.913330078125, -1.84716796875, -1.781005859375, -1.71484375, -1.648681640625, -1.58251953125, -1.516357421875, -1.4501953125, -1.384033203125, -1.31787109375, -1.251708984375, -1.185546875, -1.119384765625, -1.05322265625, -0.987060546875, -0.9208984375, -0.854736328125, -0.78857421875, -0.722412109375, -0.65625, -0.590087890625, -0.52392578125, -0.457763671875, -0.3916015625, -0.325439453125, -0.25927734375, -0.193115234375, -0.126953125, -0.060791015625, 0.00537109375, 0.071533203125, 0.1376953125, 0.203857421875, 0.27001953125, 0.336181640625, 0.40234375, 0.468505859375, 0.53466796875, 0.600830078125, 0.6669921875, 0.733154296875, 0.79931640625, 0.865478515625, 0.931640625, 0.997802734375, 1.06396484375, 1.130126953125, 1.1962890625, 1.262451171875, 1.32861328125, 1.394775390625, 1.4609375, 1.527099609375, 1.59326171875, 1.659423828125, 1.7255859375, 1.791748046875, 1.85791015625, 1.924072265625, 1.990234375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 2.0, 1.0, 6.0, 10.0, 15.0, 11.0, 13.0, 16.0, 15.0, 18.0, 24.0, 24.0, 30.0, 37.0, 28.0, 34.0, 31.0, 33.0, 33.0, 34.0, 48.0, 1064.0, 41.0, 30.0, 38.0, 36.0, 40.0, 26.0, 31.0, 30.0, 26.0, 31.0, 31.0, 16.0, 19.0, 8.0, 13.0, 15.0, 9.0, 10.0, 6.0, 11.0, 9.0, 4.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.9375, -5.7283935546875, -5.519287109375, -5.3101806640625, -5.10107421875, -4.8919677734375, -4.682861328125, -4.4737548828125, -4.2646484375, -4.0555419921875, -3.846435546875, -3.6373291015625, -3.42822265625, -3.2191162109375, -3.010009765625, -2.8009033203125, -2.591796875, -2.3826904296875, -2.173583984375, -1.9644775390625, -1.75537109375, -1.5462646484375, -1.337158203125, -1.1280517578125, -0.9189453125, -0.7098388671875, -0.500732421875, -0.2916259765625, -0.08251953125, 0.1265869140625, 0.335693359375, 0.5447998046875, 0.75390625, 0.9630126953125, 1.172119140625, 1.3812255859375, 1.59033203125, 1.7994384765625, 2.008544921875, 2.2176513671875, 2.4267578125, 2.6358642578125, 2.844970703125, 3.0540771484375, 3.26318359375, 3.4722900390625, 3.681396484375, 3.8905029296875, 4.099609375, 4.3087158203125, 4.517822265625, 4.7269287109375, 4.93603515625, 5.1451416015625, 5.354248046875, 5.5633544921875, 5.7724609375, 5.9815673828125, 6.190673828125, 6.3997802734375, 6.60888671875, 6.8179931640625, 7.027099609375, 7.2362060546875, 7.4453125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 4.0, 7.0, 12.0, 16.0, 15.0, 41.0, 63.0, 62.0, 114.0, 157.0, 195.0, 321.0, 436.0, 635.0, 903.0, 1370.0, 2087.0, 3162.0, 4601.0, 7144.0, 10632.0, 16431.0, 25730.0, 41887.0, 71456.0, 134231.0, 1312285.0, 205360.0, 102714.0, 57348.0, 34606.0, 21793.0, 13983.0, 8965.0, 6188.0, 3940.0, 2544.0, 1800.0, 1216.0, 830.0, 560.0, 365.0, 297.0, 189.0, 135.0, 98.0, 66.0, 45.0, 38.0, 20.0, 13.0, 11.0, 11.0, 3.0, 2.0, 1.0, 1.0], "bins": [-1.9609375, -1.902923583984375, -1.84490966796875, -1.786895751953125, -1.7288818359375, -1.670867919921875, -1.61285400390625, -1.554840087890625, -1.496826171875, -1.438812255859375, -1.38079833984375, -1.322784423828125, -1.2647705078125, -1.206756591796875, -1.14874267578125, -1.090728759765625, -1.03271484375, -0.974700927734375, -0.91668701171875, -0.858673095703125, -0.8006591796875, -0.742645263671875, -0.68463134765625, -0.626617431640625, -0.568603515625, -0.510589599609375, -0.45257568359375, -0.394561767578125, -0.3365478515625, -0.278533935546875, -0.22052001953125, -0.162506103515625, -0.1044921875, -0.046478271484375, 0.01153564453125, 0.069549560546875, 0.1275634765625, 0.185577392578125, 0.24359130859375, 0.301605224609375, 0.359619140625, 0.417633056640625, 0.47564697265625, 0.533660888671875, 0.5916748046875, 0.649688720703125, 0.70770263671875, 0.765716552734375, 0.82373046875, 0.881744384765625, 0.93975830078125, 0.997772216796875, 1.0557861328125, 1.113800048828125, 1.17181396484375, 1.229827880859375, 1.287841796875, 1.345855712890625, 1.40386962890625, 1.461883544921875, 1.5198974609375, 1.577911376953125, 1.63592529296875, 1.693939208984375, 1.751953125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 11.0, 9.0, 8.0, 16.0, 17.0, 16.0, 21.0, 44.0, 40.0, 45.0, 58.0, 72.0, 73.0, 82.0, 79.0, 54.0, 52.0, 52.0, 43.0, 43.0, 32.0, 29.0, 24.0, 19.0, 9.0, 12.0, 11.0, 6.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002109527587890625, -0.002039581537246704, -0.001969635486602783, -0.0018996894359588623, -0.0018297433853149414, -0.0017597973346710205, -0.0016898512840270996, -0.0016199052333831787, -0.0015499591827392578, -0.001480013132095337, -0.001410067081451416, -0.0013401210308074951, -0.0012701749801635742, -0.0012002289295196533, -0.0011302828788757324, -0.0010603368282318115, -0.0009903907775878906, -0.0009204447269439697, -0.0008504986763000488, -0.0007805526256561279, -0.000710606575012207, -0.0006406605243682861, -0.0005707144737243652, -0.0005007684230804443, -0.00043082237243652344, -0.00036087632179260254, -0.00029093027114868164, -0.00022098422050476074, -0.00015103816986083984, -8.109211921691895e-05, -1.1146068572998047e-05, 5.879998207092285e-05, 0.00012874603271484375, 0.00019869208335876465, 0.00026863813400268555, 0.00033858418464660645, 0.00040853023529052734, 0.00047847628593444824, 0.0005484223365783691, 0.00061836838722229, 0.0006883144378662109, 0.0007582604885101318, 0.0008282065391540527, 0.0008981525897979736, 0.0009680986404418945, 0.0010380446910858154, 0.0011079907417297363, 0.0011779367923736572, 0.0012478828430175781, 0.001317828893661499, 0.00138777494430542, 0.0014577209949493408, 0.0015276670455932617, 0.0015976130962371826, 0.0016675591468811035, 0.0017375051975250244, 0.0018074512481689453, 0.0018773972988128662, 0.0019473433494567871, 0.002017289400100708, 0.002087235450744629, 0.00215718150138855, 0.0022271275520324707, 0.0022970736026763916, 0.0023670196533203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 9.0, 11.0, 17.0, 13.0, 22.0, 23.0, 27.0, 49.0, 64.0, 59.0, 92.0, 164.0, 208.0, 406.0, 604.0, 1392.0, 395636.0, 646196.0, 1650.0, 676.0, 394.0, 245.0, 171.0, 100.0, 87.0, 60.0, 42.0, 27.0, 24.0, 22.0, 21.0, 15.0, 5.0, 4.0, 3.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.041015625, -0.0398106575012207, -0.038605690002441406, -0.03740072250366211, -0.03619575500488281, -0.034990787506103516, -0.03378582000732422, -0.03258085250854492, -0.031375885009765625, -0.030170917510986328, -0.02896595001220703, -0.027760982513427734, -0.026556015014648438, -0.02535104751586914, -0.024146080017089844, -0.022941112518310547, -0.02173614501953125, -0.020531177520751953, -0.019326210021972656, -0.01812124252319336, -0.016916275024414062, -0.015711307525634766, -0.014506340026855469, -0.013301372528076172, -0.012096405029296875, -0.010891437530517578, -0.009686470031738281, -0.008481502532958984, -0.0072765350341796875, -0.006071567535400391, -0.004866600036621094, -0.003661632537841797, -0.0024566650390625, -0.0012516975402832031, -4.673004150390625e-05, 0.0011582374572753906, 0.0023632049560546875, 0.0035681724548339844, 0.004773139953613281, 0.005978107452392578, 0.007183074951171875, 0.008388042449951172, 0.009593009948730469, 0.010797977447509766, 0.012002944946289062, 0.01320791244506836, 0.014412879943847656, 0.015617847442626953, 0.01682281494140625, 0.018027782440185547, 0.019232749938964844, 0.02043771743774414, 0.021642684936523438, 0.022847652435302734, 0.02405261993408203, 0.025257587432861328, 0.026462554931640625, 0.027667522430419922, 0.02887248992919922, 0.030077457427978516, 0.03128242492675781, 0.03248739242553711, 0.033692359924316406, 0.0348973274230957, 0.036102294921875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 29.0, 101.0, 236.0, 279.0, 233.0, 91.0, 24.0, 7.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0023880270309746265, -0.0022976913023740053, -0.002207355573773384, -0.0021170200780034065, -0.0020266843494027853, -0.001936348620802164, -0.0018460128922015429, -0.0017556771636009216, -0.0016653415514156222, -0.001575005822815001, -0.0014846702106297016, -0.0013943344820290804, -0.0013039987534284592, -0.0012136631412431598, -0.0011233274126425385, -0.0010329918004572392, -0.0009426560718566179, -0.0008523204014636576, -0.0007619847310706973, -0.0006716490024700761, -0.0005813133320771158, -0.0004909776616841555, -0.00040064193308353424, -0.00031030626269057393, -0.00021997059229761362, -0.00012963490735273808, -3.9299222407862544e-05, 5.103647708892822e-05, 0.00014137214748188853, 0.00023170781787484884, 0.00032204354647547007, 0.0004123792168684304, 0.000502714654430747, 0.0005930503248237073, 0.0006833859952166677, 0.0007737217238172889, 0.0008640573942102492, 0.0009543930646032095, 0.0010447287932038307, 0.001135064521804452, 0.0012254001339897513, 0.0013157358625903726, 0.001406071474775672, 0.0014964072033762932, 0.0015867429319769144, 0.0016770785441622138, 0.001767414272762835, 0.0018577498849481344, 0.0019480856135487556, 0.002038421342149377, 0.002128757070749998, 0.0022190925665199757, 0.002309428295120597, 0.002399764023721218, 0.0024900997523218393, 0.0025804354809224606, 0.002670770976692438, 0.0027611067052930593, 0.0028514424338936806, 0.002941777929663658, 0.0030321136582642794, 0.0031224493868649006, 0.003212785115465522, 0.003303120844066143, 0.0033934565726667643]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 7.0, 8.0, 6.0, 17.0, 18.0, 10.0, 23.0, 23.0, 11.0, 23.0, 22.0, 25.0, 30.0, 24.0, 30.0, 34.0, 28.0, 46.0, 39.0, 41.0, 37.0, 45.0, 42.0, 36.0, 38.0, 35.0, 38.0, 26.0, 28.0, 31.0, 32.0, 16.0, 21.0, 20.0, 19.0, 13.0, 7.0, 17.0, 8.0, 3.0, 8.0, 6.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008754134178161621, -0.0008452590554952621, -0.0008151046931743622, -0.0007849503308534622, -0.0007547959685325623, -0.0007246416062116623, -0.0006944872438907623, -0.0006643328815698624, -0.0006341785192489624, -0.0006040241569280624, -0.0005738697946071625, -0.0005437154322862625, -0.0005135610699653625, -0.0004834067076444626, -0.0004532523453235626, -0.00042309798300266266, -0.0003929436206817627, -0.00036278925836086273, -0.00033263489603996277, -0.0003024805337190628, -0.00027232617139816284, -0.00024217180907726288, -0.00021201744675636292, -0.00018186308443546295, -0.000151708722114563, -0.00012155435979366302, -9.139999747276306e-05, -6.12456351518631e-05, -3.1091272830963135e-05, -9.369105100631714e-07, 2.9217451810836792e-05, 5.9371814131736755e-05, 8.952617645263672e-05, 0.00011968053877353668, 0.00014983490109443665, 0.0001799892634153366, 0.00021014362573623657, 0.00024029798805713654, 0.0002704523503780365, 0.00030060671269893646, 0.0003307610750198364, 0.0003609154373407364, 0.00039106979966163635, 0.0004212241619825363, 0.0004513785243034363, 0.00048153288662433624, 0.0005116872489452362, 0.0005418416112661362, 0.0005719959735870361, 0.0006021503359079361, 0.0006323046982288361, 0.000662459060549736, 0.000692613422870636, 0.000722767785191536, 0.0007529221475124359, 0.0007830765098333359, 0.0008132308721542358, 0.0008433852344751358, 0.0008735395967960358, 0.0009036939591169357, 0.0009338483214378357, 0.0009640026837587357, 0.0009941570460796356, 0.0010243114084005356, 0.0010544657707214355]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 12.0, 10.0, 8.0, 13.0, 9.0, 14.0, 19.0, 26.0, 23.0, 30.0, 31.0, 17.0, 33.0, 36.0, 34.0, 31.0, 53.0, 39.0, 48.0, 40.0, 34.0, 32.0, 43.0, 37.0, 30.0, 35.0, 29.0, 36.0, 27.0, 20.0, 20.0, 24.0, 17.0, 10.0, 9.0, 11.0, 10.0, 9.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0], "bins": [-11.8984375, -11.5672607421875, -11.236083984375, -10.9049072265625, -10.57373046875, -10.2425537109375, -9.911376953125, -9.5802001953125, -9.2490234375, -8.9178466796875, -8.586669921875, -8.2554931640625, -7.92431640625, -7.5931396484375, -7.261962890625, -6.9307861328125, -6.599609375, -6.2684326171875, -5.937255859375, -5.6060791015625, -5.27490234375, -4.9437255859375, -4.612548828125, -4.2813720703125, -3.9501953125, -3.6190185546875, -3.287841796875, -2.9566650390625, -2.62548828125, -2.2943115234375, -1.963134765625, -1.6319580078125, -1.30078125, -0.9696044921875, -0.638427734375, -0.3072509765625, 0.02392578125, 0.3551025390625, 0.686279296875, 1.0174560546875, 1.3486328125, 1.6798095703125, 2.010986328125, 2.3421630859375, 2.67333984375, 3.0045166015625, 3.335693359375, 3.6668701171875, 3.998046875, 4.3292236328125, 4.660400390625, 4.9915771484375, 5.32275390625, 5.6539306640625, 5.985107421875, 6.3162841796875, 6.6474609375, 6.9786376953125, 7.309814453125, 7.6409912109375, 7.97216796875, 8.3033447265625, 8.634521484375, 8.9656982421875, 9.296875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 13.0, 8.0, 11.0, 17.0, 32.0, 33.0, 54.0, 58.0, 93.0, 107.0, 146.0, 196.0, 250.0, 331.0, 411.0, 519.0, 753.0, 1047.0, 1584.0, 3047.0, 9292.0, 49043.0, 275395.0, 531539.0, 138320.0, 23575.0, 5498.0, 2213.0, 1345.0, 837.0, 700.0, 498.0, 376.0, 301.0, 220.0, 135.0, 144.0, 92.0, 79.0, 58.0, 43.0, 30.0, 25.0, 24.0, 17.0, 10.0, 8.0, 12.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-22.53125, -21.8544921875, -21.177734375, -20.5009765625, -19.82421875, -19.1474609375, -18.470703125, -17.7939453125, -17.1171875, -16.4404296875, -15.763671875, -15.0869140625, -14.41015625, -13.7333984375, -13.056640625, -12.3798828125, -11.703125, -11.0263671875, -10.349609375, -9.6728515625, -8.99609375, -8.3193359375, -7.642578125, -6.9658203125, -6.2890625, -5.6123046875, -4.935546875, -4.2587890625, -3.58203125, -2.9052734375, -2.228515625, -1.5517578125, -0.875, -0.1982421875, 0.478515625, 1.1552734375, 1.83203125, 2.5087890625, 3.185546875, 3.8623046875, 4.5390625, 5.2158203125, 5.892578125, 6.5693359375, 7.24609375, 7.9228515625, 8.599609375, 9.2763671875, 9.953125, 10.6298828125, 11.306640625, 11.9833984375, 12.66015625, 13.3369140625, 14.013671875, 14.6904296875, 15.3671875, 16.0439453125, 16.720703125, 17.3974609375, 18.07421875, 18.7509765625, 19.427734375, 20.1044921875, 20.78125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 9.0, 7.0, 12.0, 12.0, 18.0, 18.0, 22.0, 27.0, 26.0, 28.0, 32.0, 44.0, 42.0, 49.0, 54.0, 100.0, 186.0, 1380.0, 329.0, 146.0, 83.0, 64.0, 49.0, 45.0, 33.0, 32.0, 30.0, 28.0, 25.0, 12.0, 19.0, 17.0, 15.0, 6.0, 11.0, 6.0, 8.0, 4.0, 9.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-31.015625, -30.125244140625, -29.23486328125, -28.344482421875, -27.4541015625, -26.563720703125, -25.67333984375, -24.782958984375, -23.892578125, -23.002197265625, -22.11181640625, -21.221435546875, -20.3310546875, -19.440673828125, -18.55029296875, -17.659912109375, -16.76953125, -15.879150390625, -14.98876953125, -14.098388671875, -13.2080078125, -12.317626953125, -11.42724609375, -10.536865234375, -9.646484375, -8.756103515625, -7.86572265625, -6.975341796875, -6.0849609375, -5.194580078125, -4.30419921875, -3.413818359375, -2.5234375, -1.633056640625, -0.74267578125, 0.147705078125, 1.0380859375, 1.928466796875, 2.81884765625, 3.709228515625, 4.599609375, 5.489990234375, 6.38037109375, 7.270751953125, 8.1611328125, 9.051513671875, 9.94189453125, 10.832275390625, 11.72265625, 12.613037109375, 13.50341796875, 14.393798828125, 15.2841796875, 16.174560546875, 17.06494140625, 17.955322265625, 18.845703125, 19.736083984375, 20.62646484375, 21.516845703125, 22.4072265625, 23.297607421875, 24.18798828125, 25.078369140625, 25.96875]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 8.0, 3.0, 4.0, 8.0, 13.0, 17.0, 17.0, 15.0, 19.0, 24.0, 55.0, 48.0, 71.0, 105.0, 180.0, 240.0, 420.0, 831.0, 2182.0, 2957047.0, 180868.0, 1673.0, 735.0, 346.0, 214.0, 144.0, 112.0, 73.0, 65.0, 44.0, 27.0, 13.0, 17.0, 19.0, 6.0, 6.0, 10.0, 6.0, 8.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-153.75, -148.9296875, -144.109375, -139.2890625, -134.46875, -129.6484375, -124.828125, -120.0078125, -115.1875, -110.3671875, -105.546875, -100.7265625, -95.90625, -91.0859375, -86.265625, -81.4453125, -76.625, -71.8046875, -66.984375, -62.1640625, -57.34375, -52.5234375, -47.703125, -42.8828125, -38.0625, -33.2421875, -28.421875, -23.6015625, -18.78125, -13.9609375, -9.140625, -4.3203125, 0.5, 5.3203125, 10.140625, 14.9609375, 19.78125, 24.6015625, 29.421875, 34.2421875, 39.0625, 43.8828125, 48.703125, 53.5234375, 58.34375, 63.1640625, 67.984375, 72.8046875, 77.625, 82.4453125, 87.265625, 92.0859375, 96.90625, 101.7265625, 106.546875, 111.3671875, 116.1875, 121.0078125, 125.828125, 130.6484375, 135.46875, 140.2890625, 145.109375, 149.9296875, 154.75]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 51.0, 125.0, 247.0, 294.0, 196.0, 57.0, 22.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.45406341552734, -76.62646484375, -72.79886627197266, -68.97126770019531, -65.14366149902344, -61.31606674194336, -57.48846435546875, -53.660865783691406, -49.83326721191406, -46.00566864013672, -42.178070068359375, -38.350467681884766, -34.52286911010742, -30.695270538330078, -26.8676700592041, -23.040069580078125, -19.21247100830078, -15.384871482849121, -11.557271957397461, -7.729672431945801, -3.9020729064941406, -0.07447433471679688, 3.7531261444091797, 7.580726623535156, 11.4083251953125, 15.23592472076416, 19.06352424621582, 22.891124725341797, 26.71872329711914, 30.546321868896484, 34.373924255371094, 38.20152282714844, 42.02911376953125, 45.856712341308594, 49.68431091308594, 53.51191329956055, 57.33951187133789, 61.167110443115234, 64.99471282958984, 68.82231140136719, 72.64990997314453, 76.47750854492188, 80.30510711669922, 84.13270568847656, 87.96031188964844, 91.78790283203125, 95.61550903320312, 99.44310760498047, 103.27070617675781, 107.09830474853516, 110.9259033203125, 114.75350189208984, 118.58110046386719, 122.40870666503906, 126.2363052368164, 130.06390380859375, 133.89151000976562, 137.7191162109375, 141.5467071533203, 145.3743133544922, 149.201904296875, 153.02951049804688, 156.8571014404297, 160.68470764160156, 164.51229858398438]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 8.0, 17.0, 14.0, 21.0, 23.0, 32.0, 34.0, 34.0, 37.0, 39.0, 32.0, 42.0, 40.0, 55.0, 38.0, 50.0, 41.0, 51.0, 36.0, 33.0, 38.0, 32.0, 33.0, 31.0, 37.0, 24.0, 14.0, 13.0, 12.0, 11.0, 4.0, 14.0, 7.0, 8.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-75.38371276855469, -72.91327667236328, -70.44284057617188, -67.972412109375, -65.5019760131836, -63.03153991699219, -60.56110382080078, -58.090667724609375, -55.620235443115234, -53.14979934692383, -50.67936706542969, -48.20893096923828, -45.738494873046875, -43.268062591552734, -40.79762649536133, -38.32719421386719, -35.85675811767578, -33.386322021484375, -30.915889739990234, -28.445453643798828, -25.975019454956055, -23.50458526611328, -21.034149169921875, -18.5637149810791, -16.093280792236328, -13.622846603393555, -11.152411460876465, -8.681976318359375, -6.211542129516602, -3.741107940673828, -1.2706727981567383, 1.1997623443603516, 3.6701889038085938, 6.140623569488525, 8.611058235168457, 11.081493377685547, 13.55192756652832, 16.022361755371094, 18.4927978515625, 20.963232040405273, 23.433666229248047, 25.90410041809082, 28.374534606933594, 30.844970703125, 33.315406799316406, 35.78583908081055, 38.25627517700195, 40.726707458496094, 43.1971435546875, 45.667579650878906, 48.13801193237305, 50.60844802856445, 53.078880310058594, 55.54931640625, 58.019752502441406, 60.49018859863281, 62.96062088012695, 65.4310531616211, 67.9014892578125, 70.3719253540039, 72.84236145019531, 75.31278991699219, 77.7832260131836, 80.253662109375, 82.7240982055664]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 4.0, 9.0, 5.0, 5.0, 6.0, 6.0, 8.0, 12.0, 19.0, 9.0, 13.0, 19.0, 21.0, 25.0, 20.0, 33.0, 28.0, 28.0, 35.0, 27.0, 39.0, 26.0, 43.0, 39.0, 48.0, 47.0, 35.0, 35.0, 32.0, 32.0, 27.0, 31.0, 26.0, 23.0, 21.0, 30.0, 18.0, 16.0, 18.0, 19.0, 13.0, 8.0, 7.0, 6.0, 8.0, 5.0, 6.0, 6.0, 1.0, 8.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.65625, -9.346923828125, -9.03759765625, -8.728271484375, -8.4189453125, -8.109619140625, -7.80029296875, -7.490966796875, -7.181640625, -6.872314453125, -6.56298828125, -6.253662109375, -5.9443359375, -5.635009765625, -5.32568359375, -5.016357421875, -4.70703125, -4.397705078125, -4.08837890625, -3.779052734375, -3.4697265625, -3.160400390625, -2.85107421875, -2.541748046875, -2.232421875, -1.923095703125, -1.61376953125, -1.304443359375, -0.9951171875, -0.685791015625, -0.37646484375, -0.067138671875, 0.2421875, 0.551513671875, 0.86083984375, 1.170166015625, 1.4794921875, 1.788818359375, 2.09814453125, 2.407470703125, 2.716796875, 3.026123046875, 3.33544921875, 3.644775390625, 3.9541015625, 4.263427734375, 4.57275390625, 4.882080078125, 5.19140625, 5.500732421875, 5.81005859375, 6.119384765625, 6.4287109375, 6.738037109375, 7.04736328125, 7.356689453125, 7.666015625, 7.975341796875, 8.28466796875, 8.593994140625, 8.9033203125, 9.212646484375, 9.52197265625, 9.831298828125, 10.140625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 7.0, 5.0, 6.0, 13.0, 20.0, 29.0, 40.0, 65.0, 101.0, 170.0, 301.0, 569.0, 1217.0, 3337.0, 14514.0, 139888.0, 1545580.0, 2195413.0, 263702.0, 22151.0, 4317.0, 1377.0, 638.0, 366.0, 184.0, 111.0, 62.0, 44.0, 27.0, 16.0, 9.0, 6.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.03125, -22.240234375, -21.44921875, -20.658203125, -19.8671875, -19.076171875, -18.28515625, -17.494140625, -16.703125, -15.912109375, -15.12109375, -14.330078125, -13.5390625, -12.748046875, -11.95703125, -11.166015625, -10.375, -9.583984375, -8.79296875, -8.001953125, -7.2109375, -6.419921875, -5.62890625, -4.837890625, -4.046875, -3.255859375, -2.46484375, -1.673828125, -0.8828125, -0.091796875, 0.69921875, 1.490234375, 2.28125, 3.072265625, 3.86328125, 4.654296875, 5.4453125, 6.236328125, 7.02734375, 7.818359375, 8.609375, 9.400390625, 10.19140625, 10.982421875, 11.7734375, 12.564453125, 13.35546875, 14.146484375, 14.9375, 15.728515625, 16.51953125, 17.310546875, 18.1015625, 18.892578125, 19.68359375, 20.474609375, 21.265625, 22.056640625, 22.84765625, 23.638671875, 24.4296875, 25.220703125, 26.01171875, 26.802734375, 27.59375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 9.0, 10.0, 12.0, 20.0, 25.0, 46.0, 67.0, 86.0, 120.0, 156.0, 203.0, 232.0, 365.0, 435.0, 504.0, 509.0, 338.0, 223.0, 166.0, 137.0, 127.0, 77.0, 50.0, 44.0, 21.0, 21.0, 20.0, 12.0, 11.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.296875, -14.645751953125, -13.99462890625, -13.343505859375, -12.6923828125, -12.041259765625, -11.39013671875, -10.739013671875, -10.087890625, -9.436767578125, -8.78564453125, -8.134521484375, -7.4833984375, -6.832275390625, -6.18115234375, -5.530029296875, -4.87890625, -4.227783203125, -3.57666015625, -2.925537109375, -2.2744140625, -1.623291015625, -0.97216796875, -0.321044921875, 0.330078125, 0.981201171875, 1.63232421875, 2.283447265625, 2.9345703125, 3.585693359375, 4.23681640625, 4.887939453125, 5.5390625, 6.190185546875, 6.84130859375, 7.492431640625, 8.1435546875, 8.794677734375, 9.44580078125, 10.096923828125, 10.748046875, 11.399169921875, 12.05029296875, 12.701416015625, 13.3525390625, 14.003662109375, 14.65478515625, 15.305908203125, 15.95703125, 16.608154296875, 17.25927734375, 17.910400390625, 18.5615234375, 19.212646484375, 19.86376953125, 20.514892578125, 21.166015625, 21.817138671875, 22.46826171875, 23.119384765625, 23.7705078125, 24.421630859375, 25.07275390625, 25.723876953125, 26.375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 11.0, 20.0, 37.0, 68.0, 96.0, 220.0, 429.0, 922.0, 2425.0, 12109.0, 583521.0, 3519782.0, 67115.0, 4717.0, 1556.0, 619.0, 295.0, 145.0, 84.0, 37.0, 32.0, 12.0, 10.0, 5.0, 5.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.71875, -57.09912109375, -55.4794921875, -53.85986328125, -52.240234375, -50.62060546875, -49.0009765625, -47.38134765625, -45.76171875, -44.14208984375, -42.5224609375, -40.90283203125, -39.283203125, -37.66357421875, -36.0439453125, -34.42431640625, -32.8046875, -31.18505859375, -29.5654296875, -27.94580078125, -26.326171875, -24.70654296875, -23.0869140625, -21.46728515625, -19.84765625, -18.22802734375, -16.6083984375, -14.98876953125, -13.369140625, -11.74951171875, -10.1298828125, -8.51025390625, -6.890625, -5.27099609375, -3.6513671875, -2.03173828125, -0.412109375, 1.20751953125, 2.8271484375, 4.44677734375, 6.06640625, 7.68603515625, 9.3056640625, 10.92529296875, 12.544921875, 14.16455078125, 15.7841796875, 17.40380859375, 19.0234375, 20.64306640625, 22.2626953125, 23.88232421875, 25.501953125, 27.12158203125, 28.7412109375, 30.36083984375, 31.98046875, 33.60009765625, 35.2197265625, 36.83935546875, 38.458984375, 40.07861328125, 41.6982421875, 43.31787109375, 44.9375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 31.0, 365.0, 541.0, 71.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-304.3949890136719, -290.6909484863281, -276.9869079589844, -263.2828369140625, -249.57879638671875, -235.874755859375, -222.17071533203125, -208.4666748046875, -194.7626190185547, -181.05857849121094, -167.35452270507812, -153.65048217773438, -139.94644165039062, -126.24238586425781, -112.53834533691406, -98.83429718017578, -85.1302490234375, -71.42620086669922, -57.7221565246582, -44.01811218261719, -30.314064025878906, -16.610015869140625, -2.905975341796875, 10.798072814941406, 24.502120971679688, 38.20616912841797, 51.910213470458984, 65.6142578125, 79.31830596923828, 93.02235412597656, 106.72639465332031, 120.4304428100586, 134.134521484375, 147.83856201171875, 161.54261779785156, 175.2466583251953, 188.95071411132812, 202.65475463867188, 216.35879516601562, 230.06283569335938, 243.7668914794922, 257.470947265625, 271.17498779296875, 284.8790283203125, 298.58306884765625, 312.287109375, 325.99114990234375, 339.6952209472656, 353.3992614746094, 367.1033020019531, 380.8073425292969, 394.51141357421875, 408.2154541015625, 421.91949462890625, 435.62353515625, 449.32757568359375, 463.0316162109375, 476.73565673828125, 490.439697265625, 504.14373779296875, 517.8477783203125, 531.5518798828125, 545.255859375, 558.9599609375, 572.6640014648438]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 1.0, 11.0, 8.0, 10.0, 14.0, 12.0, 19.0, 28.0, 20.0, 19.0, 34.0, 24.0, 32.0, 43.0, 48.0, 34.0, 36.0, 38.0, 37.0, 32.0, 49.0, 43.0, 40.0, 36.0, 38.0, 34.0, 23.0, 27.0, 34.0, 24.0, 28.0, 22.0, 16.0, 19.0, 14.0, 11.0, 8.0, 9.0, 6.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-86.5997543334961, -84.2680435180664, -81.93633270263672, -79.60462188720703, -77.27291107177734, -74.94120025634766, -72.60948944091797, -70.27777862548828, -67.9460678100586, -65.6143569946289, -63.28264617919922, -60.95093536376953, -58.619224548339844, -56.287513732910156, -53.95580291748047, -51.62409210205078, -49.29238510131836, -46.96067428588867, -44.628963470458984, -42.2972526550293, -39.96554183959961, -37.63383102416992, -35.3021240234375, -32.97041320800781, -30.638700485229492, -28.306989669799805, -25.975278854370117, -23.643569946289062, -21.311859130859375, -18.980148315429688, -16.6484375, -14.316726684570312, -11.985015869140625, -9.653305053710938, -7.321594715118408, -4.989884376525879, -2.6581735610961914, -0.3264627456665039, 2.005247116088867, 4.336957931518555, 6.668668746948242, 9.00037956237793, 11.332090377807617, 13.663800239562988, 15.995511054992676, 18.327220916748047, 20.658931732177734, 22.990642547607422, 25.32235336303711, 27.654064178466797, 29.985774993896484, 32.31748580932617, 34.64919662475586, 36.98090744018555, 39.31261444091797, 41.644325256347656, 43.976036071777344, 46.30774688720703, 48.63945770263672, 50.971168518066406, 53.302879333496094, 55.63459014892578, 57.96630096435547, 60.298011779785156, 62.629722595214844]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 12.0, 10.0, 12.0, 19.0, 14.0, 20.0, 17.0, 22.0, 35.0, 40.0, 41.0, 35.0, 47.0, 42.0, 44.0, 44.0, 46.0, 57.0, 56.0, 55.0, 37.0, 40.0, 28.0, 29.0, 34.0, 24.0, 23.0, 14.0, 22.0, 13.0, 8.0, 10.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.830078125, -7.55078125, -7.271484375, -6.9921875, -6.712890625, -6.43359375, -6.154296875, -5.875, -5.595703125, -5.31640625, -5.037109375, -4.7578125, -4.478515625, -4.19921875, -3.919921875, -3.640625, -3.361328125, -3.08203125, -2.802734375, -2.5234375, -2.244140625, -1.96484375, -1.685546875, -1.40625, -1.126953125, -0.84765625, -0.568359375, -0.2890625, -0.009765625, 0.26953125, 0.548828125, 0.828125, 1.107421875, 1.38671875, 1.666015625, 1.9453125, 2.224609375, 2.50390625, 2.783203125, 3.0625, 3.341796875, 3.62109375, 3.900390625, 4.1796875, 4.458984375, 4.73828125, 5.017578125, 5.296875, 5.576171875, 5.85546875, 6.134765625, 6.4140625, 6.693359375, 6.97265625, 7.251953125, 7.53125, 7.810546875, 8.08984375, 8.369140625, 8.6484375, 8.927734375, 9.20703125, 9.486328125, 9.765625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 10.0, 5.0, 13.0, 16.0, 21.0, 46.0, 53.0, 89.0, 139.0, 187.0, 252.0, 402.0, 556.0, 894.0, 1300.0, 1928.0, 3065.0, 4719.0, 7388.0, 11557.0, 18179.0, 29588.0, 49267.0, 86236.0, 168477.0, 302903.0, 156554.0, 80870.0, 47097.0, 28255.0, 17255.0, 10750.0, 7244.0, 4475.0, 2926.0, 1934.0, 1267.0, 903.0, 576.0, 358.0, 250.0, 172.0, 141.0, 76.0, 57.0, 40.0, 22.0, 14.0, 16.0, 11.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-1.59765625, -1.549896240234375, -1.50213623046875, -1.454376220703125, -1.4066162109375, -1.358856201171875, -1.31109619140625, -1.263336181640625, -1.215576171875, -1.167816162109375, -1.12005615234375, -1.072296142578125, -1.0245361328125, -0.976776123046875, -0.92901611328125, -0.881256103515625, -0.83349609375, -0.785736083984375, -0.73797607421875, -0.690216064453125, -0.6424560546875, -0.594696044921875, -0.54693603515625, -0.499176025390625, -0.451416015625, -0.403656005859375, -0.35589599609375, -0.308135986328125, -0.2603759765625, -0.212615966796875, -0.16485595703125, -0.117095947265625, -0.0693359375, -0.021575927734375, 0.02618408203125, 0.073944091796875, 0.1217041015625, 0.169464111328125, 0.21722412109375, 0.264984130859375, 0.312744140625, 0.360504150390625, 0.40826416015625, 0.456024169921875, 0.5037841796875, 0.551544189453125, 0.59930419921875, 0.647064208984375, 0.69482421875, 0.742584228515625, 0.79034423828125, 0.838104248046875, 0.8858642578125, 0.933624267578125, 0.98138427734375, 1.029144287109375, 1.076904296875, 1.124664306640625, 1.17242431640625, 1.220184326171875, 1.2679443359375, 1.315704345703125, 1.36346435546875, 1.411224365234375, 1.458984375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 5.0, 9.0, 7.0, 11.0, 12.0, 20.0, 12.0, 15.0, 19.0, 33.0, 24.0, 35.0, 42.0, 40.0, 28.0, 38.0, 30.0, 51.0, 45.0, 1067.0, 39.0, 36.0, 33.0, 45.0, 33.0, 34.0, 33.0, 28.0, 30.0, 16.0, 21.0, 20.0, 14.0, 16.0, 17.0, 17.0, 11.0, 9.0, 8.0, 3.0, 9.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.42578125, -5.26580810546875, -5.1058349609375, -4.94586181640625, -4.785888671875, -4.62591552734375, -4.4659423828125, -4.30596923828125, -4.14599609375, -3.98602294921875, -3.8260498046875, -3.66607666015625, -3.506103515625, -3.34613037109375, -3.1861572265625, -3.02618408203125, -2.8662109375, -2.70623779296875, -2.5462646484375, -2.38629150390625, -2.226318359375, -2.06634521484375, -1.9063720703125, -1.74639892578125, -1.58642578125, -1.42645263671875, -1.2664794921875, -1.10650634765625, -0.946533203125, -0.78656005859375, -0.6265869140625, -0.46661376953125, -0.306640625, -0.14666748046875, 0.0133056640625, 0.17327880859375, 0.333251953125, 0.49322509765625, 0.6531982421875, 0.81317138671875, 0.97314453125, 1.13311767578125, 1.2930908203125, 1.45306396484375, 1.613037109375, 1.77301025390625, 1.9329833984375, 2.09295654296875, 2.2529296875, 2.41290283203125, 2.5728759765625, 2.73284912109375, 2.892822265625, 3.05279541015625, 3.2127685546875, 3.37274169921875, 3.53271484375, 3.69268798828125, 3.8526611328125, 4.01263427734375, 4.172607421875, 4.33258056640625, 4.4925537109375, 4.65252685546875, 4.8125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 10.0, 9.0, 12.0, 14.0, 28.0, 45.0, 69.0, 85.0, 114.0, 153.0, 260.0, 328.0, 479.0, 752.0, 1074.0, 1645.0, 2569.0, 4079.0, 6310.0, 10009.0, 16062.0, 25806.0, 42205.0, 73307.0, 138424.0, 1325299.0, 204662.0, 100038.0, 55248.0, 32813.0, 20083.0, 12314.0, 8114.0, 5136.0, 3208.0, 2048.0, 1428.0, 966.0, 642.0, 412.0, 285.0, 194.0, 124.0, 68.0, 68.0, 46.0, 27.0, 20.0, 11.0, 11.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.3427734375, -1.2976531982421875, -1.252532958984375, -1.2074127197265625, -1.16229248046875, -1.1171722412109375, -1.072052001953125, -1.0269317626953125, -0.9818115234375, -0.9366912841796875, -0.891571044921875, -0.8464508056640625, -0.80133056640625, -0.7562103271484375, -0.711090087890625, -0.6659698486328125, -0.620849609375, -0.5757293701171875, -0.530609130859375, -0.4854888916015625, -0.44036865234375, -0.3952484130859375, -0.350128173828125, -0.3050079345703125, -0.2598876953125, -0.2147674560546875, -0.169647216796875, -0.1245269775390625, -0.07940673828125, -0.0342864990234375, 0.010833740234375, 0.0559539794921875, 0.10107421875, 0.1461944580078125, 0.191314697265625, 0.2364349365234375, 0.28155517578125, 0.3266754150390625, 0.371795654296875, 0.4169158935546875, 0.4620361328125, 0.5071563720703125, 0.552276611328125, 0.5973968505859375, 0.64251708984375, 0.6876373291015625, 0.732757568359375, 0.7778778076171875, 0.822998046875, 0.8681182861328125, 0.913238525390625, 0.9583587646484375, 1.00347900390625, 1.0485992431640625, 1.093719482421875, 1.1388397216796875, 1.1839599609375, 1.2290802001953125, 1.274200439453125, 1.3193206787109375, 1.36444091796875, 1.4095611572265625, 1.454681396484375, 1.4998016357421875, 1.544921875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 5.0, 5.0, 3.0, 8.0, 5.0, 9.0, 12.0, 20.0, 21.0, 24.0, 28.0, 47.0, 57.0, 82.0, 108.0, 86.0, 94.0, 78.0, 76.0, 51.0, 40.0, 26.0, 20.0, 16.0, 20.0, 9.0, 15.0, 12.0, 3.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021381378173828125, -0.0020641982555389404, -0.0019902586936950684, -0.0019163191318511963, -0.0018423795700073242, -0.0017684400081634521, -0.00169450044631958, -0.001620560884475708, -0.001546621322631836, -0.0014726817607879639, -0.0013987421989440918, -0.0013248026371002197, -0.0012508630752563477, -0.0011769235134124756, -0.0011029839515686035, -0.0010290443897247314, -0.0009551048278808594, -0.0008811652660369873, -0.0008072257041931152, -0.0007332861423492432, -0.0006593465805053711, -0.000585407018661499, -0.000511467456817627, -0.0004375278949737549, -0.0003635883331298828, -0.00028964877128601074, -0.00021570920944213867, -0.0001417696475982666, -6.783008575439453e-05, 6.109476089477539e-06, 8.004903793334961e-05, 0.00015398859977722168, 0.00022792816162109375, 0.0003018677234649658, 0.0003758072853088379, 0.00044974684715270996, 0.000523686408996582, 0.0005976259708404541, 0.0006715655326843262, 0.0007455050945281982, 0.0008194446563720703, 0.0008933842182159424, 0.0009673237800598145, 0.0010412633419036865, 0.0011152029037475586, 0.0011891424655914307, 0.0012630820274353027, 0.0013370215892791748, 0.0014109611511230469, 0.001484900712966919, 0.001558840274810791, 0.001632779836654663, 0.0017067193984985352, 0.0017806589603424072, 0.0018545985221862793, 0.0019285380840301514, 0.0020024776458740234, 0.0020764172077178955, 0.0021503567695617676, 0.0022242963314056396, 0.0022982358932495117, 0.002372175455093384, 0.002446115016937256, 0.002520054578781128, 0.002593994140625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 7.0, 4.0, 8.0, 12.0, 21.0, 31.0, 32.0, 44.0, 39.0, 74.0, 88.0, 173.0, 283.0, 577.0, 1784.0, 994972.0, 48168.0, 1082.0, 435.0, 218.0, 154.0, 75.0, 74.0, 44.0, 37.0, 15.0, 22.0, 14.0, 11.0, 10.0, 4.0, 3.0, 6.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0], "bins": [-0.049346923828125, -0.047928810119628906, -0.04651069641113281, -0.04509258270263672, -0.043674468994140625, -0.04225635528564453, -0.04083824157714844, -0.039420127868652344, -0.03800201416015625, -0.036583900451660156, -0.03516578674316406, -0.03374767303466797, -0.032329559326171875, -0.03091144561767578, -0.029493331909179688, -0.028075218200683594, -0.0266571044921875, -0.025238990783691406, -0.023820877075195312, -0.02240276336669922, -0.020984649658203125, -0.01956653594970703, -0.018148422241210938, -0.016730308532714844, -0.01531219482421875, -0.013894081115722656, -0.012475967407226562, -0.011057853698730469, -0.009639739990234375, -0.008221626281738281, -0.0068035125732421875, -0.005385398864746094, -0.00396728515625, -0.0025491714477539062, -0.0011310577392578125, 0.00028705596923828125, 0.001705169677734375, 0.0031232833862304688, 0.0045413970947265625, 0.005959510803222656, 0.00737762451171875, 0.008795738220214844, 0.010213851928710938, 0.011631965637207031, 0.013050079345703125, 0.014468193054199219, 0.015886306762695312, 0.017304420471191406, 0.0187225341796875, 0.020140647888183594, 0.021558761596679688, 0.02297687530517578, 0.024394989013671875, 0.02581310272216797, 0.027231216430664062, 0.028649330139160156, 0.03006744384765625, 0.031485557556152344, 0.03290367126464844, 0.03432178497314453, 0.035739898681640625, 0.03715801239013672, 0.03857612609863281, 0.039994239807128906, 0.041412353515625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 52.0, 439.0, 468.0, 50.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007968557998538017, -0.007787508890032768, -0.007606459315866232, -0.007425410207360983, -0.007244361098855734, -0.007063311990350485, -0.0068822624161839485, -0.0067012133076786995, -0.0065201641991734505, -0.0063391150906682014, -0.006158065516501665, -0.005977016407996416, -0.005795967299491167, -0.005614918190985918, -0.005433868616819382, -0.005252819508314133, -0.005071770399808884, -0.004890721291303635, -0.004709671717137098, -0.004528622608631849, -0.0043475735001266, -0.004166524391621351, -0.003985474817454815, -0.003804425708949566, -0.0036233761347830296, -0.003442326793447137, -0.003261277684941888, -0.003080228343605995, -0.002899179235100746, -0.0027181298937648535, -0.002537080552428961, -0.0023560314439237118, -0.002174982102587819, -0.0019939327612519264, -0.0018128836527466774, -0.0016318343114107847, -0.0014507852029055357, -0.001269735861569643, -0.0010886866366490722, -0.0009076374117285013, -0.0007265881868079305, -0.0005455389618873596, -0.0003644897078629583, -0.000183440453838557, -2.3912289179861546e-06, 0.0001786579960025847, 0.00035970727913081646, 0.0005407565040513873, 0.0007218057289719582, 0.000902854953892529, 0.0010839041788130999, 0.0012649535201489925, 0.0014460026286542416, 0.0016270519699901342, 0.001808101194910705, 0.001989150419831276, 0.002170199528336525, 0.0023512488696724176, 0.0025322979781776667, 0.0027133473195135593, 0.0028943964280188084, 0.003075445769354701, 0.0032564951106905937, 0.0034375442191958427, 0.0036185935605317354]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 6.0, 2.0, 6.0, 7.0, 12.0, 12.0, 13.0, 18.0, 21.0, 24.0, 25.0, 39.0, 37.0, 38.0, 40.0, 41.0, 57.0, 57.0, 41.0, 52.0, 36.0, 49.0, 34.0, 28.0, 38.0, 38.0, 24.0, 30.0, 43.0, 23.0, 26.0, 22.0, 14.0, 15.0, 13.0, 9.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013026595115661621, -0.0012666219845414162, -0.0012305844575166702, -0.0011945469304919243, -0.0011585094034671783, -0.0011224718764424324, -0.0010864343494176865, -0.0010503968223929405, -0.0010143592953681946, -0.0009783217683434486, -0.0009422842413187027, -0.0009062467142939568, -0.0008702091872692108, -0.0008341716602444649, -0.0007981341332197189, -0.000762096606194973, -0.000726059079170227, -0.0006900215521454811, -0.0006539840251207352, -0.0006179464980959892, -0.0005819089710712433, -0.0005458714440464973, -0.0005098339170217514, -0.00047379638999700546, -0.0004377588629722595, -0.0004017213359475136, -0.00036568380892276764, -0.0003296462818980217, -0.00029360875487327576, -0.0002575712278485298, -0.00022153370082378387, -0.00018549617379903793, -0.000149458646774292, -0.00011342111974954605, -7.738359272480011e-05, -4.134606570005417e-05, -5.3085386753082275e-06, 3.0728988349437714e-05, 6.676651537418365e-05, 0.0001028040423989296, 0.00013884156942367554, 0.00017487909644842148, 0.00021091662347316742, 0.00024695415049791336, 0.0002829916775226593, 0.00031902920454740524, 0.0003550667315721512, 0.0003911042585968971, 0.00042714178562164307, 0.000463179312646389, 0.000499216839671135, 0.0005352543666958809, 0.0005712918937206268, 0.0006073294207453728, 0.0006433669477701187, 0.0006794044747948647, 0.0007154420018196106, 0.0007514795288443565, 0.0007875170558691025, 0.0008235545828938484, 0.0008595921099185944, 0.0008956296369433403, 0.0009316671639680862, 0.0009677046909928322, 0.0010037422180175781]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 12.0, 10.0, 12.0, 19.0, 14.0, 20.0, 17.0, 22.0, 35.0, 40.0, 41.0, 35.0, 47.0, 42.0, 44.0, 44.0, 46.0, 57.0, 56.0, 55.0, 37.0, 40.0, 28.0, 29.0, 34.0, 24.0, 23.0, 14.0, 22.0, 13.0, 8.0, 10.0, 9.0, 8.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.830078125, -7.55078125, -7.271484375, -6.9921875, -6.712890625, -6.43359375, -6.154296875, -5.875, -5.595703125, -5.31640625, -5.037109375, -4.7578125, -4.478515625, -4.19921875, -3.919921875, -3.640625, -3.361328125, -3.08203125, -2.802734375, -2.5234375, -2.244140625, -1.96484375, -1.685546875, -1.40625, -1.126953125, -0.84765625, -0.568359375, -0.2890625, -0.009765625, 0.26953125, 0.548828125, 0.828125, 1.107421875, 1.38671875, 1.666015625, 1.9453125, 2.224609375, 2.50390625, 2.783203125, 3.0625, 3.341796875, 3.62109375, 3.900390625, 4.1796875, 4.458984375, 4.73828125, 5.017578125, 5.296875, 5.576171875, 5.85546875, 6.134765625, 6.4140625, 6.693359375, 6.97265625, 7.251953125, 7.53125, 7.810546875, 8.08984375, 8.369140625, 8.6484375, 8.927734375, 9.20703125, 9.486328125, 9.765625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 11.0, 15.0, 25.0, 14.0, 35.0, 48.0, 68.0, 79.0, 119.0, 159.0, 191.0, 272.0, 365.0, 464.0, 675.0, 886.0, 1322.0, 1904.0, 2932.0, 5942.0, 24672.0, 217108.0, 667859.0, 97281.0, 13309.0, 4476.0, 2455.0, 1670.0, 1086.0, 776.0, 628.0, 440.0, 326.0, 249.0, 182.0, 119.0, 102.0, 75.0, 61.0, 50.0, 38.0, 20.0, 24.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.765625, -22.061279296875, -21.35693359375, -20.652587890625, -19.9482421875, -19.243896484375, -18.53955078125, -17.835205078125, -17.130859375, -16.426513671875, -15.72216796875, -15.017822265625, -14.3134765625, -13.609130859375, -12.90478515625, -12.200439453125, -11.49609375, -10.791748046875, -10.08740234375, -9.383056640625, -8.6787109375, -7.974365234375, -7.27001953125, -6.565673828125, -5.861328125, -5.156982421875, -4.45263671875, -3.748291015625, -3.0439453125, -2.339599609375, -1.63525390625, -0.930908203125, -0.2265625, 0.477783203125, 1.18212890625, 1.886474609375, 2.5908203125, 3.295166015625, 3.99951171875, 4.703857421875, 5.408203125, 6.112548828125, 6.81689453125, 7.521240234375, 8.2255859375, 8.929931640625, 9.63427734375, 10.338623046875, 11.04296875, 11.747314453125, 12.45166015625, 13.156005859375, 13.8603515625, 14.564697265625, 15.26904296875, 15.973388671875, 16.677734375, 17.382080078125, 18.08642578125, 18.790771484375, 19.4951171875, 20.199462890625, 20.90380859375, 21.608154296875, 22.3125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 6.0, 4.0, 4.0, 6.0, 6.0, 12.0, 11.0, 12.0, 14.0, 17.0, 25.0, 30.0, 26.0, 38.0, 40.0, 45.0, 53.0, 82.0, 104.0, 174.0, 1381.0, 296.0, 171.0, 95.0, 66.0, 50.0, 44.0, 29.0, 33.0, 29.0, 24.0, 17.0, 13.0, 16.0, 16.0, 11.0, 11.0, 7.0, 4.0, 4.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.3125, -19.673828125, -19.03515625, -18.396484375, -17.7578125, -17.119140625, -16.48046875, -15.841796875, -15.203125, -14.564453125, -13.92578125, -13.287109375, -12.6484375, -12.009765625, -11.37109375, -10.732421875, -10.09375, -9.455078125, -8.81640625, -8.177734375, -7.5390625, -6.900390625, -6.26171875, -5.623046875, -4.984375, -4.345703125, -3.70703125, -3.068359375, -2.4296875, -1.791015625, -1.15234375, -0.513671875, 0.125, 0.763671875, 1.40234375, 2.041015625, 2.6796875, 3.318359375, 3.95703125, 4.595703125, 5.234375, 5.873046875, 6.51171875, 7.150390625, 7.7890625, 8.427734375, 9.06640625, 9.705078125, 10.34375, 10.982421875, 11.62109375, 12.259765625, 12.8984375, 13.537109375, 14.17578125, 14.814453125, 15.453125, 16.091796875, 16.73046875, 17.369140625, 18.0078125, 18.646484375, 19.28515625, 19.923828125, 20.5625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 1.0, 5.0, 7.0, 9.0, 5.0, 10.0, 11.0, 18.0, 20.0, 16.0, 24.0, 33.0, 35.0, 62.0, 80.0, 91.0, 187.0, 276.0, 475.0, 851.0, 1821.0, 9529.0, 3113808.0, 14021.0, 2040.0, 889.0, 480.0, 271.0, 165.0, 106.0, 83.0, 77.0, 36.0, 32.0, 28.0, 26.0, 17.0, 13.0, 15.0, 11.0, 6.0, 6.0, 1.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.1875, -74.4833984375, -71.779296875, -69.0751953125, -66.37109375, -63.6669921875, -60.962890625, -58.2587890625, -55.5546875, -52.8505859375, -50.146484375, -47.4423828125, -44.73828125, -42.0341796875, -39.330078125, -36.6259765625, -33.921875, -31.2177734375, -28.513671875, -25.8095703125, -23.10546875, -20.4013671875, -17.697265625, -14.9931640625, -12.2890625, -9.5849609375, -6.880859375, -4.1767578125, -1.47265625, 1.2314453125, 3.935546875, 6.6396484375, 9.34375, 12.0478515625, 14.751953125, 17.4560546875, 20.16015625, 22.8642578125, 25.568359375, 28.2724609375, 30.9765625, 33.6806640625, 36.384765625, 39.0888671875, 41.79296875, 44.4970703125, 47.201171875, 49.9052734375, 52.609375, 55.3134765625, 58.017578125, 60.7216796875, 63.42578125, 66.1298828125, 68.833984375, 71.5380859375, 74.2421875, 76.9462890625, 79.650390625, 82.3544921875, 85.05859375, 87.7626953125, 90.466796875, 93.1708984375, 95.875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 13.0, 40.0, 90.0, 131.0, 166.0, 197.0, 173.0, 103.0, 57.0, 15.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-143.60562133789062, -140.67494201660156, -137.7442626953125, -134.81358337402344, -131.88290405273438, -128.9522247314453, -126.02153778076172, -123.09085845947266, -120.1601791381836, -117.22949981689453, -114.29882049560547, -111.3681411743164, -108.43745422363281, -105.50677490234375, -102.57609558105469, -99.64541625976562, -96.71473693847656, -93.7840576171875, -90.85337829589844, -87.92269897460938, -84.99201965332031, -82.06133270263672, -79.13065338134766, -76.1999740600586, -73.26929473876953, -70.33861541748047, -67.4079360961914, -64.47725677490234, -61.546573638916016, -58.61589431762695, -55.685211181640625, -52.75453186035156, -49.82384490966797, -46.893165588378906, -43.962486267089844, -41.031803131103516, -38.10112380981445, -35.17044448852539, -32.23976135253906, -29.30908203125, -26.378402709960938, -23.447723388671875, -20.51704216003418, -17.586360931396484, -14.655681610107422, -11.725001335144043, -8.794321060180664, -5.863639831542969, -2.9329605102539062, -0.0022802352905273438, 2.9284000396728516, 5.8590803146362305, 8.78976058959961, 11.720440864562988, 14.651121139526367, 17.581802368164062, 20.512481689453125, 23.443161010742188, 26.373842239379883, 29.304523468017578, 32.23520278930664, 35.1658821105957, 38.09656524658203, 41.027244567871094, 43.957923889160156]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 9.0, 4.0, 5.0, 8.0, 13.0, 16.0, 8.0, 17.0, 12.0, 23.0, 16.0, 29.0, 26.0, 27.0, 20.0, 35.0, 38.0, 34.0, 47.0, 41.0, 34.0, 46.0, 36.0, 29.0, 30.0, 34.0, 41.0, 35.0, 43.0, 25.0, 28.0, 22.0, 19.0, 22.0, 15.0, 23.0, 16.0, 15.0, 6.0, 11.0, 6.0, 6.0, 9.0, 7.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-50.77208709716797, -49.114017486572266, -47.45595169067383, -45.797882080078125, -44.13981246948242, -42.48174285888672, -40.82367706298828, -39.16560745239258, -37.507537841796875, -35.84946823120117, -34.191402435302734, -32.53333282470703, -30.875263214111328, -29.217195510864258, -27.559127807617188, -25.901058197021484, -24.242990493774414, -22.584922790527344, -20.92685317993164, -19.26878547668457, -17.610715866088867, -15.952648162841797, -14.29457950592041, -12.636510848999023, -10.978442192077637, -9.32037353515625, -7.662304878234863, -6.004236698150635, -4.346168041229248, -2.6880998611450195, -1.0300312042236328, 0.6280374526977539, 2.2861061096191406, 3.9441747665405273, 5.602243423461914, 7.260311603546143, 8.918380737304688, 10.576448440551758, 12.234517097473145, 13.892585754394531, 15.550654411315918, 17.208723068237305, 18.866790771484375, 20.524860382080078, 22.18292808532715, 23.84099578857422, 25.499065399169922, 27.157135009765625, 28.815202713012695, 30.473270416259766, 32.13134002685547, 33.78940963745117, 35.44747543334961, 37.10554504394531, 38.763614654541016, 40.42168426513672, 42.079750061035156, 43.73781967163086, 45.3958854675293, 47.053955078125, 48.7120246887207, 50.370094299316406, 52.028160095214844, 53.68622970581055, 55.34429931640625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 8.0, 2.0, 8.0, 13.0, 9.0, 15.0, 16.0, 13.0, 15.0, 16.0, 23.0, 21.0, 26.0, 28.0, 27.0, 49.0, 41.0, 45.0, 52.0, 47.0, 48.0, 45.0, 43.0, 50.0, 47.0, 30.0, 44.0, 34.0, 28.0, 24.0, 20.0, 19.0, 17.0, 15.0, 12.0, 16.0, 8.0, 4.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.77734375, -7.50177001953125, -7.2261962890625, -6.95062255859375, -6.675048828125, -6.39947509765625, -6.1239013671875, -5.84832763671875, -5.57275390625, -5.29718017578125, -5.0216064453125, -4.74603271484375, -4.470458984375, -4.19488525390625, -3.9193115234375, -3.64373779296875, -3.3681640625, -3.09259033203125, -2.8170166015625, -2.54144287109375, -2.265869140625, -1.99029541015625, -1.7147216796875, -1.43914794921875, -1.16357421875, -0.88800048828125, -0.6124267578125, -0.33685302734375, -0.061279296875, 0.21429443359375, 0.4898681640625, 0.76544189453125, 1.041015625, 1.31658935546875, 1.5921630859375, 1.86773681640625, 2.143310546875, 2.41888427734375, 2.6944580078125, 2.97003173828125, 3.24560546875, 3.52117919921875, 3.7967529296875, 4.07232666015625, 4.347900390625, 4.62347412109375, 4.8990478515625, 5.17462158203125, 5.4501953125, 5.72576904296875, 6.0013427734375, 6.27691650390625, 6.552490234375, 6.82806396484375, 7.1036376953125, 7.37921142578125, 7.65478515625, 7.93035888671875, 8.2059326171875, 8.48150634765625, 8.757080078125, 9.03265380859375, 9.3082275390625, 9.58380126953125, 9.859375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 8.0, 5.0, 8.0, 5.0, 9.0, 15.0, 16.0, 20.0, 36.0, 30.0, 41.0, 50.0, 81.0, 115.0, 166.0, 266.0, 515.0, 994.0, 2269.0, 6251.0, 24271.0, 199049.0, 1773990.0, 1916626.0, 231688.0, 26442.0, 6589.0, 2369.0, 964.0, 496.0, 275.0, 164.0, 130.0, 88.0, 47.0, 51.0, 41.0, 29.0, 21.0, 9.0, 12.0, 12.0, 8.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.671875, -18.070068359375, -17.46826171875, -16.866455078125, -16.2646484375, -15.662841796875, -15.06103515625, -14.459228515625, -13.857421875, -13.255615234375, -12.65380859375, -12.052001953125, -11.4501953125, -10.848388671875, -10.24658203125, -9.644775390625, -9.04296875, -8.441162109375, -7.83935546875, -7.237548828125, -6.6357421875, -6.033935546875, -5.43212890625, -4.830322265625, -4.228515625, -3.626708984375, -3.02490234375, -2.423095703125, -1.8212890625, -1.219482421875, -0.61767578125, -0.015869140625, 0.5859375, 1.187744140625, 1.78955078125, 2.391357421875, 2.9931640625, 3.594970703125, 4.19677734375, 4.798583984375, 5.400390625, 6.002197265625, 6.60400390625, 7.205810546875, 7.8076171875, 8.409423828125, 9.01123046875, 9.613037109375, 10.21484375, 10.816650390625, 11.41845703125, 12.020263671875, 12.6220703125, 13.223876953125, 13.82568359375, 14.427490234375, 15.029296875, 15.631103515625, 16.23291015625, 16.834716796875, 17.4365234375, 18.038330078125, 18.64013671875, 19.241943359375, 19.84375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 5.0, 10.0, 18.0, 30.0, 53.0, 76.0, 149.0, 226.0, 372.0, 628.0, 807.0, 693.0, 426.0, 243.0, 140.0, 85.0, 45.0, 30.0, 16.0, 10.0, 9.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.125, -28.283935546875, -27.44287109375, -26.601806640625, -25.7607421875, -24.919677734375, -24.07861328125, -23.237548828125, -22.396484375, -21.555419921875, -20.71435546875, -19.873291015625, -19.0322265625, -18.191162109375, -17.35009765625, -16.509033203125, -15.66796875, -14.826904296875, -13.98583984375, -13.144775390625, -12.3037109375, -11.462646484375, -10.62158203125, -9.780517578125, -8.939453125, -8.098388671875, -7.25732421875, -6.416259765625, -5.5751953125, -4.734130859375, -3.89306640625, -3.052001953125, -2.2109375, -1.369873046875, -0.52880859375, 0.312255859375, 1.1533203125, 1.994384765625, 2.83544921875, 3.676513671875, 4.517578125, 5.358642578125, 6.19970703125, 7.040771484375, 7.8818359375, 8.722900390625, 9.56396484375, 10.405029296875, 11.24609375, 12.087158203125, 12.92822265625, 13.769287109375, 14.6103515625, 15.451416015625, 16.29248046875, 17.133544921875, 17.974609375, 18.815673828125, 19.65673828125, 20.497802734375, 21.3388671875, 22.179931640625, 23.02099609375, 23.862060546875, 24.703125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 1.0, 3.0, 4.0, 11.0, 11.0, 22.0, 41.0, 81.0, 178.0, 413.0, 1384.0, 7693.0, 3202234.0, 974878.0, 5364.0, 1163.0, 468.0, 174.0, 75.0, 45.0, 14.0, 12.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.8125, -65.619140625, -63.42578125, -61.232421875, -59.0390625, -56.845703125, -54.65234375, -52.458984375, -50.265625, -48.072265625, -45.87890625, -43.685546875, -41.4921875, -39.298828125, -37.10546875, -34.912109375, -32.71875, -30.525390625, -28.33203125, -26.138671875, -23.9453125, -21.751953125, -19.55859375, -17.365234375, -15.171875, -12.978515625, -10.78515625, -8.591796875, -6.3984375, -4.205078125, -2.01171875, 0.181640625, 2.375, 4.568359375, 6.76171875, 8.955078125, 11.1484375, 13.341796875, 15.53515625, 17.728515625, 19.921875, 22.115234375, 24.30859375, 26.501953125, 28.6953125, 30.888671875, 33.08203125, 35.275390625, 37.46875, 39.662109375, 41.85546875, 44.048828125, 46.2421875, 48.435546875, 50.62890625, 52.822265625, 55.015625, 57.208984375, 59.40234375, 61.595703125, 63.7890625, 65.982421875, 68.17578125, 70.369140625, 72.5625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 116.0, 683.0, 205.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-351.81243896484375, -338.5679016113281, -325.3233337402344, -312.07879638671875, -298.834228515625, -285.5896911621094, -272.34515380859375, -259.1005859375, -245.85604858398438, -232.6114959716797, -219.366943359375, -206.12240600585938, -192.8778533935547, -179.63330078125, -166.38876342773438, -153.1442108154297, -139.899658203125, -126.65510559082031, -113.41056060791016, -100.166015625, -86.92146301269531, -73.67691040039062, -60.43236541748047, -47.18782043457031, -33.943267822265625, -20.698719024658203, -7.454170227050781, 5.790378570556641, 19.034927368164062, 32.27947998046875, 45.524024963378906, 58.76856994628906, 72.01309204101562, 85.25764465332031, 98.50218963623047, 111.74673461914062, 124.99128723144531, 138.23583984375, 151.48037719726562, 164.7249298095703, 177.969482421875, 191.2140350341797, 204.45858764648438, 217.703125, 230.9476776123047, 244.19223022460938, 257.436767578125, 270.68133544921875, 283.9258728027344, 297.17041015625, 310.41497802734375, 323.6595153808594, 336.904052734375, 350.14862060546875, 363.3931579589844, 376.6376953125, 389.88226318359375, 403.1268005371094, 416.3713684082031, 429.61590576171875, 442.8604736328125, 456.1050109863281, 469.34954833984375, 482.5941162109375, 495.8386535644531]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 13.0, 12.0, 14.0, 16.0, 14.0, 18.0, 25.0, 33.0, 36.0, 34.0, 37.0, 39.0, 32.0, 36.0, 48.0, 38.0, 49.0, 47.0, 46.0, 43.0, 40.0, 39.0, 44.0, 29.0, 36.0, 26.0, 38.0, 22.0, 19.0, 16.0, 12.0, 8.0, 15.0, 5.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.49935913085938, -63.37350082397461, -61.247642517089844, -59.12178421020508, -56.99592590332031, -54.87006759643555, -52.74420928955078, -50.618350982666016, -48.49249267578125, -46.366634368896484, -44.24077606201172, -42.11491775512695, -39.98905944824219, -37.86320114135742, -35.737342834472656, -33.61148452758789, -31.485626220703125, -29.35976791381836, -27.233909606933594, -25.108051300048828, -22.982192993164062, -20.856334686279297, -18.73047637939453, -16.604618072509766, -14.478759765625, -12.352901458740234, -10.227043151855469, -8.101184844970703, -5.9753265380859375, -3.849468231201172, -1.7236099243164062, 0.4022483825683594, 2.5281143188476562, 4.653972625732422, 6.7798309326171875, 8.905689239501953, 11.031547546386719, 13.157405853271484, 15.28326416015625, 17.409122467041016, 19.53498077392578, 21.660839080810547, 23.786697387695312, 25.912555694580078, 28.038414001464844, 30.16427230834961, 32.290130615234375, 34.41598892211914, 36.541847229003906, 38.66770553588867, 40.79356384277344, 42.9194221496582, 45.04528045654297, 47.171138763427734, 49.2969970703125, 51.422855377197266, 53.54871368408203, 55.6745719909668, 57.80043029785156, 59.92628860473633, 62.052146911621094, 64.17800903320312, 66.30386352539062, 68.42971801757812, 70.55558013916016]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 4.0, 4.0, 8.0, 3.0, 6.0, 12.0, 9.0, 8.0, 15.0, 16.0, 16.0, 26.0, 21.0, 21.0, 44.0, 28.0, 27.0, 27.0, 43.0, 49.0, 47.0, 57.0, 37.0, 50.0, 40.0, 39.0, 39.0, 35.0, 29.0, 37.0, 22.0, 33.0, 20.0, 20.0, 26.0, 21.0, 6.0, 13.0, 7.0, 13.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.91015625, -6.70269775390625, -6.4952392578125, -6.28778076171875, -6.080322265625, -5.87286376953125, -5.6654052734375, -5.45794677734375, -5.25048828125, -5.04302978515625, -4.8355712890625, -4.62811279296875, -4.420654296875, -4.21319580078125, -4.0057373046875, -3.79827880859375, -3.5908203125, -3.38336181640625, -3.1759033203125, -2.96844482421875, -2.760986328125, -2.55352783203125, -2.3460693359375, -2.13861083984375, -1.93115234375, -1.72369384765625, -1.5162353515625, -1.30877685546875, -1.101318359375, -0.89385986328125, -0.6864013671875, -0.47894287109375, -0.271484375, -0.06402587890625, 0.1434326171875, 0.35089111328125, 0.558349609375, 0.76580810546875, 0.9732666015625, 1.18072509765625, 1.38818359375, 1.59564208984375, 1.8031005859375, 2.01055908203125, 2.218017578125, 2.42547607421875, 2.6329345703125, 2.84039306640625, 3.0478515625, 3.25531005859375, 3.4627685546875, 3.67022705078125, 3.877685546875, 4.08514404296875, 4.2926025390625, 4.50006103515625, 4.70751953125, 4.91497802734375, 5.1224365234375, 5.32989501953125, 5.537353515625, 5.74481201171875, 5.9522705078125, 6.15972900390625, 6.3671875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 10.0, 10.0, 30.0, 24.0, 42.0, 54.0, 80.0, 147.0, 176.0, 268.0, 368.0, 506.0, 733.0, 998.0, 1409.0, 2040.0, 2853.0, 4315.0, 5991.0, 8585.0, 12674.0, 18621.0, 27352.0, 41704.0, 67471.0, 119487.0, 229991.0, 209668.0, 108203.0, 63007.0, 39358.0, 25947.0, 17449.0, 11811.0, 8241.0, 5689.0, 3907.0, 2762.0, 1960.0, 1345.0, 956.0, 673.0, 482.0, 363.0, 228.0, 176.0, 151.0, 92.0, 62.0, 38.0, 22.0, 13.0, 10.0, 6.0, 7.0, 0.0, 2.0, 2.0], "bins": [-0.98095703125, -0.9511642456054688, -0.9213714599609375, -0.8915786743164062, -0.861785888671875, -0.8319931030273438, -0.8022003173828125, -0.7724075317382812, -0.74261474609375, -0.7128219604492188, -0.6830291748046875, -0.6532363891601562, -0.623443603515625, -0.5936508178710938, -0.5638580322265625, -0.5340652465820312, -0.5042724609375, -0.47447967529296875, -0.4446868896484375, -0.41489410400390625, -0.385101318359375, -0.35530853271484375, -0.3255157470703125, -0.29572296142578125, -0.26593017578125, -0.23613739013671875, -0.2063446044921875, -0.17655181884765625, -0.146759033203125, -0.11696624755859375, -0.0871734619140625, -0.05738067626953125, -0.027587890625, 0.00220489501953125, 0.0319976806640625, 0.06179046630859375, 0.091583251953125, 0.12137603759765625, 0.1511688232421875, 0.18096160888671875, 0.21075439453125, 0.24054718017578125, 0.2703399658203125, 0.30013275146484375, 0.329925537109375, 0.35971832275390625, 0.3895111083984375, 0.41930389404296875, 0.4490966796875, 0.47888946533203125, 0.5086822509765625, 0.5384750366210938, 0.568267822265625, 0.5980606079101562, 0.6278533935546875, 0.6576461791992188, 0.68743896484375, 0.7172317504882812, 0.7470245361328125, 0.7768173217773438, 0.806610107421875, 0.8364028930664062, 0.8661956787109375, 0.8959884643554688, 0.92578125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 1.0, 3.0, 6.0, 6.0, 6.0, 13.0, 10.0, 22.0, 16.0, 17.0, 19.0, 36.0, 40.0, 32.0, 23.0, 38.0, 35.0, 49.0, 46.0, 35.0, 48.0, 1053.0, 45.0, 49.0, 45.0, 50.0, 26.0, 33.0, 33.0, 28.0, 32.0, 28.0, 15.0, 23.0, 15.0, 8.0, 7.0, 12.0, 9.0, 5.0, 7.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.16015625, -4.0185546875, -3.876953125, -3.7353515625, -3.59375, -3.4521484375, -3.310546875, -3.1689453125, -3.02734375, -2.8857421875, -2.744140625, -2.6025390625, -2.4609375, -2.3193359375, -2.177734375, -2.0361328125, -1.89453125, -1.7529296875, -1.611328125, -1.4697265625, -1.328125, -1.1865234375, -1.044921875, -0.9033203125, -0.76171875, -0.6201171875, -0.478515625, -0.3369140625, -0.1953125, -0.0537109375, 0.087890625, 0.2294921875, 0.37109375, 0.5126953125, 0.654296875, 0.7958984375, 0.9375, 1.0791015625, 1.220703125, 1.3623046875, 1.50390625, 1.6455078125, 1.787109375, 1.9287109375, 2.0703125, 2.2119140625, 2.353515625, 2.4951171875, 2.63671875, 2.7783203125, 2.919921875, 3.0615234375, 3.203125, 3.3447265625, 3.486328125, 3.6279296875, 3.76953125, 3.9111328125, 4.052734375, 4.1943359375, 4.3359375, 4.4775390625, 4.619140625, 4.7607421875, 4.90234375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 11.0, 21.0, 25.0, 26.0, 52.0, 61.0, 101.0, 149.0, 215.0, 300.0, 497.0, 772.0, 1112.0, 1815.0, 2851.0, 4455.0, 7497.0, 12290.0, 19990.0, 33657.0, 57655.0, 106570.0, 237350.0, 1328073.0, 122602.0, 64310.0, 37225.0, 22223.0, 13430.0, 8100.0, 4827.0, 3089.0, 1995.0, 1256.0, 800.0, 556.0, 363.0, 273.0, 145.0, 125.0, 82.0, 49.0, 35.0, 29.0, 17.0, 13.0, 8.0, 6.0, 8.0, 4.0, 1.0, 3.0, 3.0], "bins": [-1.3154296875, -1.27685546875, -1.23828125, -1.19970703125, -1.1611328125, -1.12255859375, -1.083984375, -1.04541015625, -1.0068359375, -0.96826171875, -0.9296875, -0.89111328125, -0.8525390625, -0.81396484375, -0.775390625, -0.73681640625, -0.6982421875, -0.65966796875, -0.62109375, -0.58251953125, -0.5439453125, -0.50537109375, -0.466796875, -0.42822265625, -0.3896484375, -0.35107421875, -0.3125, -0.27392578125, -0.2353515625, -0.19677734375, -0.158203125, -0.11962890625, -0.0810546875, -0.04248046875, -0.00390625, 0.03466796875, 0.0732421875, 0.11181640625, 0.150390625, 0.18896484375, 0.2275390625, 0.26611328125, 0.3046875, 0.34326171875, 0.3818359375, 0.42041015625, 0.458984375, 0.49755859375, 0.5361328125, 0.57470703125, 0.61328125, 0.65185546875, 0.6904296875, 0.72900390625, 0.767578125, 0.80615234375, 0.8447265625, 0.88330078125, 0.921875, 0.96044921875, 0.9990234375, 1.03759765625, 1.076171875, 1.11474609375, 1.1533203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 7.0, 9.0, 11.0, 10.0, 15.0, 20.0, 23.0, 33.0, 44.0, 65.0, 68.0, 93.0, 102.0, 91.0, 81.0, 62.0, 64.0, 53.0, 27.0, 27.0, 27.0, 17.0, 16.0, 8.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00255584716796875, -0.0024900883436203003, -0.0024243295192718506, -0.002358570694923401, -0.002292811870574951, -0.0022270530462265015, -0.0021612942218780518, -0.002095535397529602, -0.0020297765731811523, -0.0019640177488327026, -0.001898258924484253, -0.0018325001001358032, -0.0017667412757873535, -0.0017009824514389038, -0.001635223627090454, -0.0015694648027420044, -0.0015037059783935547, -0.001437947154045105, -0.0013721883296966553, -0.0013064295053482056, -0.0012406706809997559, -0.0011749118566513062, -0.0011091530323028564, -0.0010433942079544067, -0.000977635383605957, -0.0009118765592575073, -0.0008461177349090576, -0.0007803589105606079, -0.0007146000862121582, -0.0006488412618637085, -0.0005830824375152588, -0.0005173236131668091, -0.0004515647888183594, -0.00038580596446990967, -0.00032004714012145996, -0.00025428831577301025, -0.00018852949142456055, -0.00012277066707611084, -5.701184272766113e-05, 8.746981620788574e-06, 7.450580596923828e-05, 0.000140264630317688, 0.0002060234546661377, 0.0002717822790145874, 0.0003375411033630371, 0.0004032999277114868, 0.0004690587520599365, 0.0005348175764083862, 0.0006005764007568359, 0.0006663352251052856, 0.0007320940494537354, 0.0007978528738021851, 0.0008636116981506348, 0.0009293705224990845, 0.0009951293468475342, 0.0010608881711959839, 0.0011266469955444336, 0.0011924058198928833, 0.001258164644241333, 0.0013239234685897827, 0.0013896822929382324, 0.0014554411172866821, 0.0015211999416351318, 0.0015869587659835815, 0.0016527175903320312]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 0.0, 7.0, 6.0, 4.0, 8.0, 7.0, 12.0, 13.0, 20.0, 36.0, 50.0, 58.0, 85.0, 103.0, 189.0, 312.0, 545.0, 1312.0, 661133.0, 382112.0, 1223.0, 531.0, 280.0, 156.0, 113.0, 59.0, 49.0, 34.0, 27.0, 23.0, 15.0, 11.0, 15.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0285491943359375, -0.027405977249145508, -0.026262760162353516, -0.025119543075561523, -0.02397632598876953, -0.02283310890197754, -0.021689891815185547, -0.020546674728393555, -0.019403457641601562, -0.01826024055480957, -0.017117023468017578, -0.015973806381225586, -0.014830589294433594, -0.013687372207641602, -0.01254415512084961, -0.011400938034057617, -0.010257720947265625, -0.009114503860473633, -0.00797128677368164, -0.0068280696868896484, -0.005684852600097656, -0.004541635513305664, -0.003398418426513672, -0.0022552013397216797, -0.0011119842529296875, 3.123283386230469e-05, 0.0011744499206542969, 0.002317667007446289, 0.0034608840942382812, 0.0046041011810302734, 0.005747318267822266, 0.006890535354614258, 0.00803375244140625, 0.009176969528198242, 0.010320186614990234, 0.011463403701782227, 0.012606620788574219, 0.013749837875366211, 0.014893054962158203, 0.016036272048950195, 0.017179489135742188, 0.01832270622253418, 0.019465923309326172, 0.020609140396118164, 0.021752357482910156, 0.02289557456970215, 0.02403879165649414, 0.025182008743286133, 0.026325225830078125, 0.027468442916870117, 0.02861166000366211, 0.0297548770904541, 0.030898094177246094, 0.032041311264038086, 0.03318452835083008, 0.03432774543762207, 0.03547096252441406, 0.036614179611206055, 0.03775739669799805, 0.03890061378479004, 0.04004383087158203, 0.04118704795837402, 0.042330265045166016, 0.04347348213195801, 0.04461669921875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 27.0, 139.0, 456.0, 330.0, 54.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030125004705041647, -0.0029232713859528303, -0.002834042301401496, -0.002744813449680805, -0.002655584365129471, -0.0025663552805781364, -0.002477126196026802, -0.0023878971114754677, -0.0022986680269241333, -0.002209438942372799, -0.0021202098578214645, -0.00203098077327013, -0.0019417519215494394, -0.001852522836998105, -0.0017632937524467707, -0.0016740646678954363, -0.0015848358161747456, -0.0014956067316234112, -0.0014063777634873986, -0.0013171486789360642, -0.0012279197108000517, -0.0011386906262487173, -0.001049461541697383, -0.0009602325153537095, -0.000871003489010036, -0.0007817744626663625, -0.0006925454363226891, -0.0006033163517713547, -0.0005140873254276812, -0.00042485829908400774, -0.00033562921453267336, -0.0002464001881889999, -0.00015717116184532642, -6.794212094973773e-05, 2.128691994585097e-05, 0.00011051597539335489, 0.00019974500173702836, 0.00028897402808070183, 0.0003782031126320362, 0.0004674321389757097, 0.0005566611653193831, 0.0006458901916630566, 0.0007351192180067301, 0.0008243483025580645, 0.0009135773289017379, 0.0010028063552454114, 0.0010920354397967458, 0.0011812644079327583, 0.0012704934924840927, 0.001359722577035427, 0.0014489515451714396, 0.001538180629722774, 0.0016274095978587866, 0.001716638682410121, 0.0018058677669614553, 0.0018950968515127897, 0.0019843257032334805, 0.002073554787784815, 0.002162783872336149, 0.0022520129568874836, 0.0023412418086081743, 0.0024304708931595087, 0.002519699977710843, 0.0026089290622621775, 0.002698158146813512]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 5.0, 12.0, 12.0, 13.0, 11.0, 16.0, 16.0, 21.0, 27.0, 22.0, 37.0, 23.0, 36.0, 28.0, 38.0, 38.0, 31.0, 41.0, 37.0, 37.0, 40.0, 36.0, 41.0, 48.0, 46.0, 31.0, 27.0, 42.0, 32.0, 31.0, 17.0, 15.0, 21.0, 14.0, 10.0, 6.0, 7.0, 5.0, 3.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0008577704429626465, -0.0008324626833200455, -0.0008071549236774445, -0.0007818471640348434, -0.0007565394043922424, -0.0007312316447496414, -0.0007059238851070404, -0.0006806161254644394, -0.0006553083658218384, -0.0006300006061792374, -0.0006046928465366364, -0.0005793850868940353, -0.0005540773272514343, -0.0005287695676088333, -0.0005034618079662323, -0.0004781540483236313, -0.0004528462886810303, -0.00042753852903842926, -0.00040223076939582825, -0.00037692300975322723, -0.0003516152501106262, -0.0003263074904680252, -0.0003009997308254242, -0.0002756919711828232, -0.00025038421154022217, -0.00022507645189762115, -0.00019976869225502014, -0.00017446093261241913, -0.00014915317296981812, -0.0001238454133272171, -9.853765368461609e-05, -7.322989404201508e-05, -4.792213439941406e-05, -2.261437475681305e-05, 2.693384885787964e-06, 2.8001144528388977e-05, 5.330890417098999e-05, 7.8616663813591e-05, 0.00010392442345619202, 0.00012923218309879303, 0.00015453994274139404, 0.00017984770238399506, 0.00020515546202659607, 0.00023046322166919708, 0.0002557709813117981, 0.0002810787409543991, 0.0003063865005970001, 0.00033169426023960114, 0.00035700201988220215, 0.00038230977952480316, 0.0004076175391674042, 0.0004329252988100052, 0.0004582330584526062, 0.0004835408180952072, 0.0005088485777378082, 0.0005341563373804092, 0.0005594640970230103, 0.0005847718566656113, 0.0006100796163082123, 0.0006353873759508133, 0.0006606951355934143, 0.0006860028952360153, 0.0007113106548786163, 0.0007366184145212173, 0.0007619261741638184]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 4.0, 4.0, 8.0, 3.0, 6.0, 12.0, 9.0, 8.0, 15.0, 16.0, 16.0, 26.0, 21.0, 21.0, 44.0, 28.0, 27.0, 27.0, 43.0, 49.0, 47.0, 57.0, 37.0, 50.0, 40.0, 39.0, 39.0, 36.0, 28.0, 37.0, 22.0, 33.0, 20.0, 20.0, 26.0, 21.0, 6.0, 13.0, 7.0, 13.0, 7.0, 3.0, 7.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-6.91015625, -6.70269775390625, -6.4952392578125, -6.28778076171875, -6.080322265625, -5.87286376953125, -5.6654052734375, -5.45794677734375, -5.25048828125, -5.04302978515625, -4.8355712890625, -4.62811279296875, -4.420654296875, -4.21319580078125, -4.0057373046875, -3.79827880859375, -3.5908203125, -3.38336181640625, -3.1759033203125, -2.96844482421875, -2.760986328125, -2.55352783203125, -2.3460693359375, -2.13861083984375, -1.93115234375, -1.72369384765625, -1.5162353515625, -1.30877685546875, -1.101318359375, -0.89385986328125, -0.6864013671875, -0.47894287109375, -0.271484375, -0.06402587890625, 0.1434326171875, 0.35089111328125, 0.558349609375, 0.76580810546875, 0.9732666015625, 1.18072509765625, 1.38818359375, 1.59564208984375, 1.8031005859375, 2.01055908203125, 2.218017578125, 2.42547607421875, 2.6329345703125, 2.84039306640625, 3.0478515625, 3.25531005859375, 3.4627685546875, 3.67022705078125, 3.877685546875, 4.08514404296875, 4.2926025390625, 4.50006103515625, 4.70751953125, 4.91497802734375, 5.1224365234375, 5.32989501953125, 5.537353515625, 5.74481201171875, 5.9522705078125, 6.15972900390625, 6.3671875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 12.0, 12.0, 15.0, 28.0, 20.0, 27.0, 50.0, 59.0, 87.0, 108.0, 164.0, 259.0, 327.0, 544.0, 885.0, 1487.0, 2928.0, 7583.0, 29451.0, 208736.0, 649496.0, 115386.0, 19187.0, 5778.0, 2412.0, 1246.0, 715.0, 455.0, 307.0, 223.0, 162.0, 106.0, 81.0, 60.0, 44.0, 39.0, 21.0, 11.0, 12.0, 8.0, 9.0, 2.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.8359375, -13.3802490234375, -12.924560546875, -12.4688720703125, -12.01318359375, -11.5574951171875, -11.101806640625, -10.6461181640625, -10.1904296875, -9.7347412109375, -9.279052734375, -8.8233642578125, -8.36767578125, -7.9119873046875, -7.456298828125, -7.0006103515625, -6.544921875, -6.0892333984375, -5.633544921875, -5.1778564453125, -4.72216796875, -4.2664794921875, -3.810791015625, -3.3551025390625, -2.8994140625, -2.4437255859375, -1.988037109375, -1.5323486328125, -1.07666015625, -0.6209716796875, -0.165283203125, 0.2904052734375, 0.74609375, 1.2017822265625, 1.657470703125, 2.1131591796875, 2.56884765625, 3.0245361328125, 3.480224609375, 3.9359130859375, 4.3916015625, 4.8472900390625, 5.302978515625, 5.7586669921875, 6.21435546875, 6.6700439453125, 7.125732421875, 7.5814208984375, 8.037109375, 8.4927978515625, 8.948486328125, 9.4041748046875, 9.85986328125, 10.3155517578125, 10.771240234375, 11.2269287109375, 11.6826171875, 12.1383056640625, 12.593994140625, 13.0496826171875, 13.50537109375, 13.9610595703125, 14.416748046875, 14.8724365234375, 15.328125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 4.0, 9.0, 6.0, 11.0, 9.0, 14.0, 21.0, 25.0, 24.0, 25.0, 32.0, 56.0, 61.0, 86.0, 144.0, 297.0, 1500.0, 225.0, 110.0, 60.0, 71.0, 49.0, 37.0, 29.0, 20.0, 17.0, 22.0, 15.0, 12.0, 10.0, 6.0, 15.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-23.875, -23.158203125, -22.44140625, -21.724609375, -21.0078125, -20.291015625, -19.57421875, -18.857421875, -18.140625, -17.423828125, -16.70703125, -15.990234375, -15.2734375, -14.556640625, -13.83984375, -13.123046875, -12.40625, -11.689453125, -10.97265625, -10.255859375, -9.5390625, -8.822265625, -8.10546875, -7.388671875, -6.671875, -5.955078125, -5.23828125, -4.521484375, -3.8046875, -3.087890625, -2.37109375, -1.654296875, -0.9375, -0.220703125, 0.49609375, 1.212890625, 1.9296875, 2.646484375, 3.36328125, 4.080078125, 4.796875, 5.513671875, 6.23046875, 6.947265625, 7.6640625, 8.380859375, 9.09765625, 9.814453125, 10.53125, 11.248046875, 11.96484375, 12.681640625, 13.3984375, 14.115234375, 14.83203125, 15.548828125, 16.265625, 16.982421875, 17.69921875, 18.416015625, 19.1328125, 19.849609375, 20.56640625, 21.283203125, 22.0]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 11.0, 25.0, 21.0, 23.0, 40.0, 46.0, 37.0, 79.0, 122.0, 129.0, 224.0, 369.0, 832.0, 2556.0, 65456.0, 3064877.0, 7854.0, 1533.0, 530.0, 300.0, 166.0, 132.0, 80.0, 47.0, 39.0, 40.0, 30.0, 12.0, 18.0, 12.0, 13.0, 15.0, 5.0, 6.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-50.03125, -48.61328125, -47.1953125, -45.77734375, -44.359375, -42.94140625, -41.5234375, -40.10546875, -38.6875, -37.26953125, -35.8515625, -34.43359375, -33.015625, -31.59765625, -30.1796875, -28.76171875, -27.34375, -25.92578125, -24.5078125, -23.08984375, -21.671875, -20.25390625, -18.8359375, -17.41796875, -16.0, -14.58203125, -13.1640625, -11.74609375, -10.328125, -8.91015625, -7.4921875, -6.07421875, -4.65625, -3.23828125, -1.8203125, -0.40234375, 1.015625, 2.43359375, 3.8515625, 5.26953125, 6.6875, 8.10546875, 9.5234375, 10.94140625, 12.359375, 13.77734375, 15.1953125, 16.61328125, 18.03125, 19.44921875, 20.8671875, 22.28515625, 23.703125, 25.12109375, 26.5390625, 27.95703125, 29.375, 30.79296875, 32.2109375, 33.62890625, 35.046875, 36.46484375, 37.8828125, 39.30078125, 40.71875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 741.0, 269.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.532894134521484, -44.8148193359375, -33.09674835205078, -21.378673553466797, -9.660598754882812, 2.057476043701172, 13.77554702758789, 25.49362564086914, 37.21169662475586, 48.929771423339844, 60.64784240722656, 72.36592102050781, 84.08399200439453, 95.80206298828125, 107.5201416015625, 119.23822021484375, 130.95628356933594, 142.6743621826172, 154.39242553710938, 166.11050415039062, 177.82858276367188, 189.54666137695312, 201.2647247314453, 212.98280334472656, 224.7008819580078, 236.41896057128906, 248.13702392578125, 259.8551025390625, 271.57318115234375, 283.291259765625, 295.00933837890625, 306.7274169921875, 318.4454650878906, 330.1635437011719, 341.8816223144531, 353.59967041015625, 365.3177490234375, 377.03582763671875, 388.75390625, 400.47198486328125, 412.1900634765625, 423.90814208984375, 435.626220703125, 447.34429931640625, 459.0623474121094, 470.7804260253906, 482.4985046386719, 494.2165832519531, 505.93463134765625, 517.6527099609375, 529.3707885742188, 541.0888671875, 552.8069458007812, 564.5250244140625, 576.2430419921875, 587.961181640625, 599.6792602539062, 611.3973388671875, 623.1154174804688, 634.83349609375, 646.5515747070312, 658.2696533203125, 669.9876708984375, 681.705810546875, 693.423828125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 12.0, 5.0, 7.0, 5.0, 14.0, 15.0, 21.0, 21.0, 19.0, 24.0, 25.0, 46.0, 16.0, 37.0, 39.0, 50.0, 69.0, 36.0, 37.0, 34.0, 47.0, 38.0, 51.0, 41.0, 38.0, 30.0, 27.0, 29.0, 27.0, 21.0, 18.0, 16.0, 12.0, 17.0, 16.0, 8.0, 12.0, 8.0, 4.0, 3.0, 2.0, 6.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.21110534667969, -43.72639465332031, -42.24168014526367, -40.7569694519043, -39.27225875854492, -37.78754425048828, -36.302833557128906, -34.81812286376953, -33.333412170410156, -31.84869956970215, -30.363988876342773, -28.879276275634766, -27.39456558227539, -25.909852981567383, -24.425140380859375, -22.9404296875, -21.45571517944336, -19.97100257873535, -18.486291885375977, -17.00157928466797, -15.516867637634277, -14.032155990600586, -12.547443389892578, -11.062731742858887, -9.578020095825195, -8.093308448791504, -6.608596324920654, -5.123884201049805, -3.6391725540161133, -2.154460906982422, -0.6697483062744141, 0.8149633407592773, 2.2996749877929688, 3.7843868732452393, 5.26909875869751, 6.753810882568359, 8.23852252960205, 9.723234176635742, 11.20794677734375, 12.692658424377441, 14.177370071411133, 15.662081718444824, 17.146793365478516, 18.631505966186523, 20.11621856689453, 21.600929260253906, 23.085641860961914, 24.570354461669922, 26.055065155029297, 27.539777755737305, 29.02448844909668, 30.509201049804688, 31.993911743164062, 33.47862243652344, 34.96333694458008, 36.44804763793945, 37.932762145996094, 39.41747283935547, 40.90218734741211, 42.386898040771484, 43.87160873413086, 45.3563232421875, 46.841033935546875, 48.32574462890625, 49.810455322265625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 6.0, 8.0, 6.0, 8.0, 10.0, 10.0, 26.0, 18.0, 15.0, 20.0, 29.0, 35.0, 38.0, 44.0, 46.0, 48.0, 44.0, 46.0, 60.0, 45.0, 49.0, 43.0, 44.0, 35.0, 45.0, 32.0, 27.0, 24.0, 29.0, 24.0, 13.0, 19.0, 17.0, 11.0, 9.0, 8.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.52215576171875, -9.2552490234375, -8.98834228515625, -8.721435546875, -8.45452880859375, -8.1876220703125, -7.92071533203125, -7.65380859375, -7.38690185546875, -7.1199951171875, -6.85308837890625, -6.586181640625, -6.31927490234375, -6.0523681640625, -5.78546142578125, -5.5185546875, -5.25164794921875, -4.9847412109375, -4.71783447265625, -4.450927734375, -4.18402099609375, -3.9171142578125, -3.65020751953125, -3.38330078125, -3.11639404296875, -2.8494873046875, -2.58258056640625, -2.315673828125, -2.04876708984375, -1.7818603515625, -1.51495361328125, -1.248046875, -0.98114013671875, -0.7142333984375, -0.44732666015625, -0.180419921875, 0.08648681640625, 0.3533935546875, 0.62030029296875, 0.88720703125, 1.15411376953125, 1.4210205078125, 1.68792724609375, 1.954833984375, 2.22174072265625, 2.4886474609375, 2.75555419921875, 3.0224609375, 3.28936767578125, 3.5562744140625, 3.82318115234375, 4.090087890625, 4.35699462890625, 4.6239013671875, 4.89080810546875, 5.15771484375, 5.42462158203125, 5.6915283203125, 5.95843505859375, 6.225341796875, 6.49224853515625, 6.7591552734375, 7.02606201171875, 7.29296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 7.0, 9.0, 17.0, 7.0, 28.0, 23.0, 24.0, 50.0, 56.0, 81.0, 113.0, 168.0, 231.0, 392.0, 580.0, 963.0, 2230.0, 12481.0, 1253060.0, 2888677.0, 29017.0, 2911.0, 1151.0, 660.0, 425.0, 237.0, 205.0, 144.0, 100.0, 63.0, 45.0, 32.0, 26.0, 23.0, 6.0, 13.0, 7.0, 13.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-53.5, -52.0966796875, -50.693359375, -49.2900390625, -47.88671875, -46.4833984375, -45.080078125, -43.6767578125, -42.2734375, -40.8701171875, -39.466796875, -38.0634765625, -36.66015625, -35.2568359375, -33.853515625, -32.4501953125, -31.046875, -29.6435546875, -28.240234375, -26.8369140625, -25.43359375, -24.0302734375, -22.626953125, -21.2236328125, -19.8203125, -18.4169921875, -17.013671875, -15.6103515625, -14.20703125, -12.8037109375, -11.400390625, -9.9970703125, -8.59375, -7.1904296875, -5.787109375, -4.3837890625, -2.98046875, -1.5771484375, -0.173828125, 1.2294921875, 2.6328125, 4.0361328125, 5.439453125, 6.8427734375, 8.24609375, 9.6494140625, 11.052734375, 12.4560546875, 13.859375, 15.2626953125, 16.666015625, 18.0693359375, 19.47265625, 20.8759765625, 22.279296875, 23.6826171875, 25.0859375, 26.4892578125, 27.892578125, 29.2958984375, 30.69921875, 32.1025390625, 33.505859375, 34.9091796875, 36.3125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 6.0, 10.0, 14.0, 32.0, 57.0, 112.0, 236.0, 552.0, 907.0, 979.0, 607.0, 314.0, 129.0, 57.0, 32.0, 12.0, 7.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.328125, -30.43603515625, -29.5439453125, -28.65185546875, -27.759765625, -26.86767578125, -25.9755859375, -25.08349609375, -24.19140625, -23.29931640625, -22.4072265625, -21.51513671875, -20.623046875, -19.73095703125, -18.8388671875, -17.94677734375, -17.0546875, -16.16259765625, -15.2705078125, -14.37841796875, -13.486328125, -12.59423828125, -11.7021484375, -10.81005859375, -9.91796875, -9.02587890625, -8.1337890625, -7.24169921875, -6.349609375, -5.45751953125, -4.5654296875, -3.67333984375, -2.78125, -1.88916015625, -0.9970703125, -0.10498046875, 0.787109375, 1.67919921875, 2.5712890625, 3.46337890625, 4.35546875, 5.24755859375, 6.1396484375, 7.03173828125, 7.923828125, 8.81591796875, 9.7080078125, 10.60009765625, 11.4921875, 12.38427734375, 13.2763671875, 14.16845703125, 15.060546875, 15.95263671875, 16.8447265625, 17.73681640625, 18.62890625, 19.52099609375, 20.4130859375, 21.30517578125, 22.197265625, 23.08935546875, 23.9814453125, 24.87353515625, 25.765625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 6.0, 6.0, 13.0, 20.0, 31.0, 56.0, 123.0, 229.0, 473.0, 1232.0, 3946.0, 30324.0, 1776335.0, 2336628.0, 38189.0, 4286.0, 1374.0, 536.0, 237.0, 99.0, 51.0, 37.0, 15.0, 10.0, 9.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.8125, -35.8447265625, -34.876953125, -33.9091796875, -32.94140625, -31.9736328125, -31.005859375, -30.0380859375, -29.0703125, -28.1025390625, -27.134765625, -26.1669921875, -25.19921875, -24.2314453125, -23.263671875, -22.2958984375, -21.328125, -20.3603515625, -19.392578125, -18.4248046875, -17.45703125, -16.4892578125, -15.521484375, -14.5537109375, -13.5859375, -12.6181640625, -11.650390625, -10.6826171875, -9.71484375, -8.7470703125, -7.779296875, -6.8115234375, -5.84375, -4.8759765625, -3.908203125, -2.9404296875, -1.97265625, -1.0048828125, -0.037109375, 0.9306640625, 1.8984375, 2.8662109375, 3.833984375, 4.8017578125, 5.76953125, 6.7373046875, 7.705078125, 8.6728515625, 9.640625, 10.6083984375, 11.576171875, 12.5439453125, 13.51171875, 14.4794921875, 15.447265625, 16.4150390625, 17.3828125, 18.3505859375, 19.318359375, 20.2861328125, 21.25390625, 22.2216796875, 23.189453125, 24.1572265625, 25.125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 5.0, 4.0, 9.0, 9.0, 15.0, 17.0, 21.0, 27.0, 39.0, 30.0, 42.0, 56.0, 42.0, 50.0, 50.0, 58.0, 66.0, 67.0, 53.0, 52.0, 50.0, 42.0, 30.0, 24.0, 25.0, 25.0, 22.0, 24.0, 11.0, 12.0, 6.0, 7.0, 2.0, 6.0, 2.0, 3.0], "bins": [-77.31253814697266, -75.52256774902344, -73.73259735107422, -71.942626953125, -70.15265655517578, -68.36268615722656, -66.57271575927734, -64.78274536132812, -62.992774963378906, -61.20280456542969, -59.41283416748047, -57.62286376953125, -55.83289337158203, -54.04292297363281, -52.252952575683594, -50.462982177734375, -48.67301559448242, -46.8830451965332, -45.093074798583984, -43.303104400634766, -41.51313400268555, -39.72316360473633, -37.933197021484375, -36.143226623535156, -34.35325622558594, -32.56328582763672, -30.7733154296875, -28.98334503173828, -27.193374633789062, -25.403404235839844, -23.613435745239258, -21.82346534729004, -20.033496856689453, -18.243526458740234, -16.453556060791016, -14.663586616516113, -12.873616218566895, -11.083645820617676, -9.293676376342773, -7.503705978393555, -5.713735580444336, -3.9237654209136963, -2.1337952613830566, -0.3438253402709961, 1.4461450576782227, 3.2361154556274414, 5.026084899902344, 6.8160552978515625, 8.606025695800781, 10.39599609375, 12.185966491699219, 13.975935935974121, 15.76590633392334, 17.555877685546875, 19.34584617614746, 21.13581657409668, 22.9257869720459, 24.715757369995117, 26.505727767944336, 28.295696258544922, 30.08566665649414, 31.87563705444336, 33.66560745239258, 35.4555778503418, 37.245548248291016]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 6.0, 12.0, 11.0, 15.0, 14.0, 14.0, 25.0, 32.0, 28.0, 25.0, 34.0, 40.0, 55.0, 39.0, 42.0, 53.0, 56.0, 45.0, 40.0, 46.0, 38.0, 41.0, 35.0, 27.0, 32.0, 28.0, 21.0, 23.0, 29.0, 12.0, 17.0, 13.0, 9.0, 12.0, 6.0, 4.0, 7.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.723941802978516, -39.10563659667969, -37.48733139038086, -35.86902618408203, -34.2507209777832, -32.632415771484375, -31.01411247253418, -29.39580726623535, -27.777502059936523, -26.159196853637695, -24.540891647338867, -22.922588348388672, -21.304283142089844, -19.685977935791016, -18.067672729492188, -16.44936752319336, -14.831062316894531, -13.212757110595703, -11.594451904296875, -9.976147651672363, -8.357842445373535, -6.739537239074707, -5.121232986450195, -3.502927780151367, -1.884622573852539, -0.26631760597229004, 1.351987361907959, 2.970292091369629, 4.588597297668457, 6.206902503967285, 7.825206756591797, 9.443511962890625, 11.061820983886719, 12.680126190185547, 14.298431396484375, 15.916735649108887, 17.53504180908203, 19.15334701538086, 20.771650314331055, 22.389955520629883, 24.00826072692871, 25.62656593322754, 27.244871139526367, 28.863174438476562, 30.48147964477539, 32.09978485107422, 33.71809005737305, 35.336395263671875, 36.9547004699707, 38.57300567626953, 40.19131088256836, 41.80961608886719, 43.427921295166016, 45.046226501464844, 46.664527893066406, 48.2828369140625, 49.90113830566406, 51.51944351196289, 53.13774871826172, 54.75605392456055, 56.374359130859375, 57.9926643371582, 59.61096954345703, 61.229270935058594, 62.84757995605469]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 7.0, 11.0, 22.0, 25.0, 17.0, 25.0, 26.0, 32.0, 24.0, 45.0, 39.0, 52.0, 44.0, 40.0, 64.0, 50.0, 53.0, 47.0, 40.0, 35.0, 37.0, 31.0, 29.0, 33.0, 23.0, 20.0, 18.0, 19.0, 14.0, 14.0, 15.0, 8.0, 9.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.4375, -78.5595703125, -75.681640625, -72.8037109375, -69.92578125, -67.0478515625, -64.169921875, -61.2919921875, -58.4140625, -55.5361328125, -52.658203125, -49.7802734375, -46.90234375, -44.0244140625, -41.146484375, -38.2685546875, -35.390625, -32.5126953125, -29.634765625, -26.7568359375, -23.87890625, -21.0009765625, -18.123046875, -15.2451171875, -12.3671875, -9.4892578125, -6.611328125, -3.7333984375, -0.85546875, 2.0224609375, 4.900390625, 7.7783203125, 10.65625, 13.5341796875, 16.412109375, 19.2900390625, 22.16796875, 25.0458984375, 27.923828125, 30.8017578125, 33.6796875, 36.5576171875, 39.435546875, 42.3134765625, 45.19140625, 48.0693359375, 50.947265625, 53.8251953125, 56.703125, 59.5810546875, 62.458984375, 65.3369140625, 68.21484375, 71.0927734375, 73.970703125, 76.8486328125, 79.7265625, 82.6044921875, 85.482421875, 88.3603515625, 91.23828125, 94.1162109375, 96.994140625, 99.8720703125, 102.75]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 8.0, 13.0, 44.0, 55.0, 75.0, 107.0, 175.0, 248.0, 386.0, 601.0, 979.0, 1576.0, 2518.0, 4034.0, 6635.0, 10675.0, 17394.0, 28494.0, 49090.0, 86957.0, 167322.0, 279392.0, 173430.0, 91271.0, 50826.0, 29746.0, 17885.0, 10775.0, 6709.0, 4095.0, 2638.0, 1609.0, 997.0, 644.0, 406.0, 231.0, 182.0, 96.0, 76.0, 46.0, 22.0, 27.0, 21.0, 12.0, 5.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1171875, -13.65478515625, -13.1923828125, -12.72998046875, -12.267578125, -11.80517578125, -11.3427734375, -10.88037109375, -10.41796875, -9.95556640625, -9.4931640625, -9.03076171875, -8.568359375, -8.10595703125, -7.6435546875, -7.18115234375, -6.71875, -6.25634765625, -5.7939453125, -5.33154296875, -4.869140625, -4.40673828125, -3.9443359375, -3.48193359375, -3.01953125, -2.55712890625, -2.0947265625, -1.63232421875, -1.169921875, -0.70751953125, -0.2451171875, 0.21728515625, 0.6796875, 1.14208984375, 1.6044921875, 2.06689453125, 2.529296875, 2.99169921875, 3.4541015625, 3.91650390625, 4.37890625, 4.84130859375, 5.3037109375, 5.76611328125, 6.228515625, 6.69091796875, 7.1533203125, 7.61572265625, 8.078125, 8.54052734375, 9.0029296875, 9.46533203125, 9.927734375, 10.39013671875, 10.8525390625, 11.31494140625, 11.77734375, 12.23974609375, 12.7021484375, 13.16455078125, 13.626953125, 14.08935546875, 14.5517578125, 15.01416015625, 15.4765625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 6.0, 4.0, 7.0, 2.0, 6.0, 7.0, 14.0, 15.0, 16.0, 27.0, 19.0, 22.0, 23.0, 29.0, 28.0, 35.0, 31.0, 41.0, 41.0, 41.0, 40.0, 1078.0, 45.0, 44.0, 36.0, 42.0, 46.0, 36.0, 32.0, 28.0, 26.0, 18.0, 22.0, 33.0, 29.0, 16.0, 10.0, 5.0, 10.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.25, -55.443359375, -53.63671875, -51.830078125, -50.0234375, -48.216796875, -46.41015625, -44.603515625, -42.796875, -40.990234375, -39.18359375, -37.376953125, -35.5703125, -33.763671875, -31.95703125, -30.150390625, -28.34375, -26.537109375, -24.73046875, -22.923828125, -21.1171875, -19.310546875, -17.50390625, -15.697265625, -13.890625, -12.083984375, -10.27734375, -8.470703125, -6.6640625, -4.857421875, -3.05078125, -1.244140625, 0.5625, 2.369140625, 4.17578125, 5.982421875, 7.7890625, 9.595703125, 11.40234375, 13.208984375, 15.015625, 16.822265625, 18.62890625, 20.435546875, 22.2421875, 24.048828125, 25.85546875, 27.662109375, 29.46875, 31.275390625, 33.08203125, 34.888671875, 36.6953125, 38.501953125, 40.30859375, 42.115234375, 43.921875, 45.728515625, 47.53515625, 49.341796875, 51.1484375, 52.955078125, 54.76171875, 56.568359375, 58.375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 8.0, 15.0, 20.0, 39.0, 36.0, 59.0, 80.0, 132.0, 166.0, 265.0, 382.0, 554.0, 818.0, 1219.0, 1750.0, 2831.0, 4443.0, 6825.0, 10979.0, 17290.0, 27829.0, 46087.0, 80279.0, 151637.0, 1322181.0, 184133.0, 95977.0, 54250.0, 32175.0, 19898.0, 12357.0, 7814.0, 5014.0, 3246.0, 2074.0, 1331.0, 947.0, 601.0, 460.0, 319.0, 192.0, 113.0, 83.0, 73.0, 49.0, 32.0, 21.0, 14.0, 11.0, 8.0, 4.0, 0.0, 5.0, 3.0, 2.0, 1.0], "bins": [-15.0546875, -14.593505859375, -14.13232421875, -13.671142578125, -13.2099609375, -12.748779296875, -12.28759765625, -11.826416015625, -11.365234375, -10.904052734375, -10.44287109375, -9.981689453125, -9.5205078125, -9.059326171875, -8.59814453125, -8.136962890625, -7.67578125, -7.214599609375, -6.75341796875, -6.292236328125, -5.8310546875, -5.369873046875, -4.90869140625, -4.447509765625, -3.986328125, -3.525146484375, -3.06396484375, -2.602783203125, -2.1416015625, -1.680419921875, -1.21923828125, -0.758056640625, -0.296875, 0.164306640625, 0.62548828125, 1.086669921875, 1.5478515625, 2.009033203125, 2.47021484375, 2.931396484375, 3.392578125, 3.853759765625, 4.31494140625, 4.776123046875, 5.2373046875, 5.698486328125, 6.15966796875, 6.620849609375, 7.08203125, 7.543212890625, 8.00439453125, 8.465576171875, 8.9267578125, 9.387939453125, 9.84912109375, 10.310302734375, 10.771484375, 11.232666015625, 11.69384765625, 12.155029296875, 12.6162109375, 13.077392578125, 13.53857421875, 13.999755859375, 14.4609375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 3.0, 4.0, 6.0, 7.0, 5.0, 7.0, 14.0, 14.0, 23.0, 18.0, 23.0, 27.0, 50.0, 50.0, 51.0, 83.0, 72.0, 103.0, 77.0, 80.0, 56.0, 46.0, 34.0, 32.0, 27.0, 18.0, 12.0, 9.0, 13.0, 4.0, 10.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03900146484375, -0.03766012191772461, -0.03631877899169922, -0.03497743606567383, -0.03363609313964844, -0.03229475021362305, -0.030953407287597656, -0.029612064361572266, -0.028270721435546875, -0.026929378509521484, -0.025588035583496094, -0.024246692657470703, -0.022905349731445312, -0.021564006805419922, -0.02022266387939453, -0.01888132095336914, -0.01753997802734375, -0.01619863510131836, -0.014857292175292969, -0.013515949249267578, -0.012174606323242188, -0.010833263397216797, -0.009491920471191406, -0.008150577545166016, -0.006809234619140625, -0.005467891693115234, -0.004126548767089844, -0.002785205841064453, -0.0014438629150390625, -0.00010251998901367188, 0.0012388229370117188, 0.0025801658630371094, 0.0039215087890625, 0.005262851715087891, 0.006604194641113281, 0.007945537567138672, 0.009286880493164062, 0.010628223419189453, 0.011969566345214844, 0.013310909271240234, 0.014652252197265625, 0.015993595123291016, 0.017334938049316406, 0.018676280975341797, 0.020017623901367188, 0.021358966827392578, 0.02270030975341797, 0.02404165267944336, 0.02538299560546875, 0.02672433853149414, 0.02806568145751953, 0.029407024383544922, 0.030748367309570312, 0.0320897102355957, 0.033431053161621094, 0.034772396087646484, 0.036113739013671875, 0.037455081939697266, 0.038796424865722656, 0.04013776779174805, 0.04147911071777344, 0.04282045364379883, 0.04416179656982422, 0.04550313949584961, 0.046844482421875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 10.0, 8.0, 13.0, 12.0, 10.0, 28.0, 36.0, 43.0, 65.0, 84.0, 114.0, 164.0, 310.0, 486.0, 854.0, 1817.0, 4473.0, 15813.0, 91870.0, 612723.0, 270868.0, 35097.0, 7928.0, 2607.0, 1298.0, 653.0, 368.0, 238.0, 165.0, 95.0, 68.0, 49.0, 36.0, 37.0, 21.0, 19.0, 13.0, 14.0, 15.0, 2.0, 4.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24072265625, -0.23337173461914062, -0.22602081298828125, -0.21866989135742188, -0.2113189697265625, -0.20396804809570312, -0.19661712646484375, -0.18926620483398438, -0.181915283203125, -0.17456436157226562, -0.16721343994140625, -0.15986251831054688, -0.1525115966796875, -0.14516067504882812, -0.13780975341796875, -0.13045883178710938, -0.12310791015625, -0.11575698852539062, -0.10840606689453125, -0.10105514526367188, -0.0937042236328125, -0.08635330200195312, -0.07900238037109375, -0.07165145874023438, -0.064300537109375, -0.056949615478515625, -0.04959869384765625, -0.042247772216796875, -0.0348968505859375, -0.027545928955078125, -0.02019500732421875, -0.012844085693359375, -0.0054931640625, 0.001857757568359375, 0.00920867919921875, 0.016559600830078125, 0.0239105224609375, 0.031261444091796875, 0.03861236572265625, 0.045963287353515625, 0.053314208984375, 0.060665130615234375, 0.06801605224609375, 0.07536697387695312, 0.0827178955078125, 0.09006881713867188, 0.09741973876953125, 0.10477066040039062, 0.11212158203125, 0.11947250366210938, 0.12682342529296875, 0.13417434692382812, 0.1415252685546875, 0.14887619018554688, 0.15622711181640625, 0.16357803344726562, 0.170928955078125, 0.17827987670898438, 0.18563079833984375, 0.19298171997070312, 0.2003326416015625, 0.20768356323242188, 0.21503448486328125, 0.22238540649414062, 0.229736328125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 7.0, 18.0, 36.0, 92.0, 179.0, 266.0, 207.0, 116.0, 44.0, 18.0, 11.0, 2.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08062899857759476, -0.07869229465723038, -0.0767555981874466, -0.07481889426708221, -0.07288219779729843, -0.07094549387693405, -0.06900879740715027, -0.06707209348678589, -0.06513538956642151, -0.06319868564605713, -0.061261989176273346, -0.059325288981199265, -0.05738858878612518, -0.0554518848657608, -0.05351518467068672, -0.05157848447561264, -0.04964178800582886, -0.047705087810754776, -0.045768387615680695, -0.04383168742060661, -0.04189498722553253, -0.03995828330516815, -0.03802158311009407, -0.03608488291501999, -0.03414818271994591, -0.032211482524871826, -0.030274782329797745, -0.028338080272078514, -0.026401380077004433, -0.02446467988193035, -0.02252797782421112, -0.02059127762913704, -0.01865457370877266, -0.016717873513698578, -0.014781172387301922, -0.012844471260905266, -0.010907771065831184, -0.008971070870757103, -0.007034369744360447, -0.005097668617963791, -0.0031609684228897095, -0.0012242677621543407, 0.000712432898581028, 0.0026491335593163967, 0.0045858342200517654, 0.006522534415125847, 0.008459235541522503, 0.010395936667919159, 0.01233263686299324, 0.014269337058067322, 0.016206037253141403, 0.018142739310860634, 0.020079439505934715, 0.022016139701008797, 0.023952841758728027, 0.02588954195380211, 0.02782624214887619, 0.02976294234395027, 0.03169964253902435, 0.033636342734098434, 0.035573042929172516, 0.037509746849536896, 0.03944644704461098, 0.04138314723968506, 0.04331984743475914]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 7.0, 4.0, 4.0, 7.0, 9.0, 7.0, 13.0, 10.0, 12.0, 21.0, 12.0, 20.0, 20.0, 23.0, 27.0, 27.0, 19.0, 29.0, 32.0, 31.0, 42.0, 45.0, 39.0, 44.0, 42.0, 39.0, 34.0, 43.0, 39.0, 40.0, 33.0, 27.0, 26.0, 30.0, 31.0, 19.0, 17.0, 15.0, 15.0, 8.0, 13.0, 7.0, 8.0, 11.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.019526362419128418, -0.01888122223317623, -0.018236082047224045, -0.017590941861271858, -0.01694580167531967, -0.016300661489367485, -0.0156555213034153, -0.015010381117463112, -0.014365240931510925, -0.013720100745558739, -0.013074960559606552, -0.012429820373654366, -0.011784680187702179, -0.011139540001749992, -0.010494399815797806, -0.00984925962984562, -0.009204119443893433, -0.008558979257941246, -0.00791383907198906, -0.007268698886036873, -0.006623558700084686, -0.0059784185141325, -0.005333278328180313, -0.0046881381422281265, -0.00404299795627594, -0.0033978577703237534, -0.0027527175843715668, -0.00210757739841938, -0.0014624372124671936, -0.000817297026515007, -0.00017215684056282043, 0.00047298334538936615, 0.0011181235313415527, 0.0017632637172937393, 0.002408403903245926, 0.0030535440891981125, 0.003698684275150299, 0.004343824461102486, 0.004988964647054672, 0.005634104833006859, 0.006279245018959045, 0.006924385204911232, 0.007569525390863419, 0.008214665576815605, 0.008859805762767792, 0.009504945948719978, 0.010150086134672165, 0.010795226320624352, 0.011440366506576538, 0.012085506692528725, 0.012730646878480911, 0.013375787064433098, 0.014020927250385284, 0.014666067436337471, 0.015311207622289658, 0.015956347808241844, 0.01660148799419403, 0.017246628180146217, 0.017891768366098404, 0.01853690855205059, 0.019182048738002777, 0.019827188923954964, 0.02047232910990715, 0.021117469295859337, 0.021762609481811523]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 4.0, 4.0, 5.0, 6.0, 8.0, 8.0, 10.0, 22.0, 27.0, 16.0, 24.0, 26.0, 35.0, 21.0, 45.0, 40.0, 53.0, 42.0, 42.0, 63.0, 52.0, 52.0, 46.0, 40.0, 35.0, 37.0, 30.0, 30.0, 32.0, 24.0, 19.0, 18.0, 21.0, 12.0, 14.0, 16.0, 7.0, 9.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-81.3125, -78.4365234375, -75.560546875, -72.6845703125, -69.80859375, -66.9326171875, -64.056640625, -61.1806640625, -58.3046875, -55.4287109375, -52.552734375, -49.6767578125, -46.80078125, -43.9248046875, -41.048828125, -38.1728515625, -35.296875, -32.4208984375, -29.544921875, -26.6689453125, -23.79296875, -20.9169921875, -18.041015625, -15.1650390625, -12.2890625, -9.4130859375, -6.537109375, -3.6611328125, -0.78515625, 2.0908203125, 4.966796875, 7.8427734375, 10.71875, 13.5947265625, 16.470703125, 19.3466796875, 22.22265625, 25.0986328125, 27.974609375, 30.8505859375, 33.7265625, 36.6025390625, 39.478515625, 42.3544921875, 45.23046875, 48.1064453125, 50.982421875, 53.8583984375, 56.734375, 59.6103515625, 62.486328125, 65.3623046875, 68.23828125, 71.1142578125, 73.990234375, 76.8662109375, 79.7421875, 82.6181640625, 85.494140625, 88.3701171875, 91.24609375, 94.1220703125, 96.998046875, 99.8740234375, 102.75]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 12.0, 6.0, 18.0, 21.0, 37.0, 43.0, 58.0, 102.0, 121.0, 219.0, 312.0, 602.0, 1115.0, 2131.0, 4909.0, 13976.0, 56643.0, 268684.0, 505870.0, 146256.0, 31405.0, 8783.0, 3478.0, 1589.0, 837.0, 479.0, 267.0, 194.0, 111.0, 66.0, 53.0, 42.0, 28.0, 26.0, 16.0, 11.0, 8.0, 11.0, 4.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.546875, -13.011474609375, -12.47607421875, -11.940673828125, -11.4052734375, -10.869873046875, -10.33447265625, -9.799072265625, -9.263671875, -8.728271484375, -8.19287109375, -7.657470703125, -7.1220703125, -6.586669921875, -6.05126953125, -5.515869140625, -4.98046875, -4.445068359375, -3.90966796875, -3.374267578125, -2.8388671875, -2.303466796875, -1.76806640625, -1.232666015625, -0.697265625, -0.161865234375, 0.37353515625, 0.908935546875, 1.4443359375, 1.979736328125, 2.51513671875, 3.050537109375, 3.5859375, 4.121337890625, 4.65673828125, 5.192138671875, 5.7275390625, 6.262939453125, 6.79833984375, 7.333740234375, 7.869140625, 8.404541015625, 8.93994140625, 9.475341796875, 10.0107421875, 10.546142578125, 11.08154296875, 11.616943359375, 12.15234375, 12.687744140625, 13.22314453125, 13.758544921875, 14.2939453125, 14.829345703125, 15.36474609375, 15.900146484375, 16.435546875, 16.970947265625, 17.50634765625, 18.041748046875, 18.5771484375, 19.112548828125, 19.64794921875, 20.183349609375, 20.71875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 7.0, 2.0, 3.0, 5.0, 9.0, 14.0, 12.0, 20.0, 38.0, 25.0, 22.0, 36.0, 27.0, 35.0, 52.0, 41.0, 51.0, 41.0, 42.0, 1913.0, 214.0, 56.0, 47.0, 35.0, 25.0, 26.0, 38.0, 33.0, 31.0, 18.0, 22.0, 13.0, 18.0, 11.0, 13.0, 7.0, 8.0, 10.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0], "bins": [-144.0, -140.0947265625, -136.189453125, -132.2841796875, -128.37890625, -124.4736328125, -120.568359375, -116.6630859375, -112.7578125, -108.8525390625, -104.947265625, -101.0419921875, -97.13671875, -93.2314453125, -89.326171875, -85.4208984375, -81.515625, -77.6103515625, -73.705078125, -69.7998046875, -65.89453125, -61.9892578125, -58.083984375, -54.1787109375, -50.2734375, -46.3681640625, -42.462890625, -38.5576171875, -34.65234375, -30.7470703125, -26.841796875, -22.9365234375, -19.03125, -15.1259765625, -11.220703125, -7.3154296875, -3.41015625, 0.4951171875, 4.400390625, 8.3056640625, 12.2109375, 16.1162109375, 20.021484375, 23.9267578125, 27.83203125, 31.7373046875, 35.642578125, 39.5478515625, 43.453125, 47.3583984375, 51.263671875, 55.1689453125, 59.07421875, 62.9794921875, 66.884765625, 70.7900390625, 74.6953125, 78.6005859375, 82.505859375, 86.4111328125, 90.31640625, 94.2216796875, 98.126953125, 102.0322265625, 105.9375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 2.0, 3.0, 6.0, 10.0, 13.0, 16.0, 28.0, 47.0, 59.0, 63.0, 99.0, 124.0, 179.0, 244.0, 374.0, 560.0, 900.0, 1813.0, 5106.0, 27607.0, 253294.0, 2732022.0, 103113.0, 12984.0, 3238.0, 1323.0, 776.0, 500.0, 336.0, 241.0, 164.0, 103.0, 90.0, 64.0, 52.0, 33.0, 27.0, 23.0, 20.0, 12.0, 11.0, 7.0, 4.0, 3.0, 2.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-24.734375, -23.96875, -23.203125, -22.4375, -21.671875, -20.90625, -20.140625, -19.375, -18.609375, -17.84375, -17.078125, -16.3125, -15.546875, -14.78125, -14.015625, -13.25, -12.484375, -11.71875, -10.953125, -10.1875, -9.421875, -8.65625, -7.890625, -7.125, -6.359375, -5.59375, -4.828125, -4.0625, -3.296875, -2.53125, -1.765625, -1.0, -0.234375, 0.53125, 1.296875, 2.0625, 2.828125, 3.59375, 4.359375, 5.125, 5.890625, 6.65625, 7.421875, 8.1875, 8.953125, 9.71875, 10.484375, 11.25, 12.015625, 12.78125, 13.546875, 14.3125, 15.078125, 15.84375, 16.609375, 17.375, 18.140625, 18.90625, 19.671875, 20.4375, 21.203125, 21.96875, 22.734375, 23.5, 24.265625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 10.0, 5.0, 29.0, 72.0, 164.0, 246.0, 237.0, 112.0, 56.0, 29.0, 11.0, 13.0, 3.0, 6.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-178.3229217529297, -167.10427856445312, -155.8856201171875, -144.66697692871094, -133.44833374023438, -122.22969055175781, -111.01103973388672, -99.79238891601562, -88.57374572753906, -77.3551025390625, -66.1364517211914, -54.91780471801758, -43.69915771484375, -32.48051071166992, -21.261863708496094, -10.043212890625, 1.1754302978515625, 12.39407730102539, 23.61272430419922, 34.83137130737305, 46.050018310546875, 57.2686653137207, 68.48731231689453, 79.70596313476562, 90.92460632324219, 102.14324951171875, 113.36190032958984, 124.58055114746094, 135.7991943359375, 147.01783752441406, 158.23648071289062, 169.45513916015625, 180.67376708984375, 191.8924102783203, 203.11105346679688, 214.3297119140625, 225.54835510253906, 236.76699829101562, 247.98565673828125, 259.20428466796875, 270.4229431152344, 281.6416015625, 292.8602294921875, 304.0788879394531, 315.29754638671875, 326.51617431640625, 337.7348327636719, 348.9534912109375, 360.172119140625, 371.3907775878906, 382.6094055175781, 393.82806396484375, 405.04669189453125, 416.2653503417969, 427.4840087890625, 438.70263671875, 449.9212951660156, 461.13995361328125, 472.35858154296875, 483.5772399902344, 494.7958984375, 506.0145263671875, 517.233154296875, 528.4518432617188, 539.6704711914062]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 8.0, 8.0, 5.0, 8.0, 10.0, 7.0, 12.0, 13.0, 16.0, 18.0, 23.0, 28.0, 21.0, 36.0, 27.0, 45.0, 47.0, 46.0, 45.0, 43.0, 56.0, 36.0, 43.0, 49.0, 41.0, 35.0, 45.0, 26.0, 38.0, 27.0, 24.0, 21.0, 20.0, 13.0, 9.0, 12.0, 3.0, 6.0, 8.0, 8.0, 9.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-181.45619201660156, -176.06277465820312, -170.66934204101562, -165.2759246826172, -159.88250732421875, -154.4890899658203, -149.0956573486328, -143.70223999023438, -138.30882263183594, -132.9154052734375, -127.52198028564453, -122.12855529785156, -116.73513793945312, -111.34171295166016, -105.94828796386719, -100.55487060546875, -95.16144561767578, -89.76802062988281, -84.37460327148438, -78.9811782836914, -73.58776092529297, -68.1943359375, -62.8009147644043, -57.407493591308594, -52.01407241821289, -46.62065124511719, -41.227230072021484, -35.83380889892578, -30.440385818481445, -25.046964645385742, -19.653541564941406, -14.260120391845703, -8.86669921875, -3.4732775688171387, 1.9201440811157227, 7.313566207885742, 12.706987380981445, 18.10040855407715, 23.493831634521484, 28.887252807617188, 34.28067398071289, 39.674095153808594, 45.0675163269043, 50.4609375, 55.85436248779297, 61.247779846191406, 66.64120483398438, 72.03462219238281, 77.42804718017578, 82.82147216796875, 88.21488952636719, 93.60831451416016, 99.0017318725586, 104.39515686035156, 109.78857421875, 115.18199920654297, 120.57542419433594, 125.9688491821289, 131.36227416992188, 136.7556915283203, 142.14910888671875, 147.5425262451172, 152.9359588623047, 158.32937622070312, 163.72279357910156]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 16.0, 13.0, 23.0, 47.0, 46.0, 83.0, 118.0, 179.0, 257.0, 370.0, 513.0, 797.0, 1041.0, 1541.0, 2198.0, 2950.0, 4153.0, 1015315.0, 6154.0, 3711.0, 2603.0, 1946.0, 1337.0, 921.0, 663.0, 455.0, 320.0, 257.0, 161.0, 108.0, 69.0, 63.0, 45.0, 21.0, 11.0, 13.0, 11.0, 3.0, 1.0, 5.0, 4.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.211097717285156, -32.134246826171875, -31.057397842407227, -29.980546951293945, -28.903697967529297, -27.826847076416016, -26.749996185302734, -25.673145294189453, -24.596296310424805, -23.519445419311523, -22.442596435546875, -21.365745544433594, -20.288894653320312, -19.212045669555664, -18.135194778442383, -17.058345794677734, -15.981494903564453, -14.904644966125488, -13.827795028686523, -12.750944137573242, -11.674094200134277, -10.597244262695312, -9.520393371582031, -8.443543434143066, -7.366693496704102, -6.289843559265137, -5.212993144989014, -4.136142730712891, -3.059292793273926, -1.982442855834961, -0.9055924415588379, 0.17125797271728516, 1.24810791015625, 2.324958086013794, 3.401808261871338, 4.478658676147461, 5.555508613586426, 6.632358551025391, 7.709208965301514, 8.786059379577637, 9.862909317016602, 10.939759254455566, 12.016609191894531, 13.093460083007812, 14.170310020446777, 15.247159957885742, 16.324010848999023, 17.400859832763672, 18.477710723876953, 19.554561614990234, 20.631410598754883, 21.708261489868164, 22.785110473632812, 23.861961364746094, 24.938812255859375, 26.015663146972656, 27.092512130737305, 28.169363021850586, 29.246212005615234, 30.323062896728516, 31.399913787841797, 32.47676086425781, 33.553611755371094, 34.630462646484375, 35.707313537597656]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 11.0, 18.0, 35.0, 86.0, 89.0, 221.0, 51461384.0, 926.0, 160.0, 41.0, 41.0, 34.0, 45.0, 29.0, 15.0, 7.0, 10.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7336.69287109375, -7052.1484375, -6767.6044921875, -6483.06005859375, -6198.51611328125, -5913.9716796875, -5629.427734375, -5344.88330078125, -5060.3388671875, -4775.79443359375, -4491.25048828125, -4206.7060546875, -3922.162109375, -3637.61767578125, -3353.073486328125, -3068.529296875, -2783.9853515625, -2499.441162109375, -2214.89697265625, -1930.3526611328125, -1645.8084716796875, -1361.2642822265625, -1076.719970703125, -792.17578125, -507.631591796875, -223.08737182617188, 61.45684814453125, 346.0010986328125, 630.5452880859375, 915.0894775390625, 1199.6337890625, 1484.177978515625, 1768.72265625, 2053.266845703125, 2337.81103515625, 2622.35546875, 2906.8994140625, 3191.44384765625, 3475.988037109375, 3760.5322265625, 4045.076416015625, 4329.62060546875, 4614.1650390625, 4898.708984375, 5183.25341796875, 5467.79736328125, 5752.341796875, 6036.8857421875, 6321.43017578125, 6605.974609375, 6890.5185546875, 7175.06298828125, 7459.60693359375, 7744.1513671875, 8028.6953125, 8313.240234375, 8597.7841796875, 8882.328125, 9166.873046875, 9451.4169921875, 9735.9609375, 10020.5048828125, 10305.0498046875, 10589.59375, 10874.1376953125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 18.0, 7.0, 13.0, 20.0, 31.0, 65.0, 103.0, 148.0, 212.0, 378.0, 560.0, 842.0, 1480.0, 2297.0, 3838.0, 5921.0, 10031.0, 16101.0, 26197.0, 44441.0, 74961.0, 132122.0, 251395.0, 598793.0, 4046342.0, 536850.0, 233926.0, 125649.0, 72097.0, 42158.0, 24790.0, 15549.0, 9171.0, 5607.0, 3494.0, 2201.0, 1316.0, 918.0, 509.0, 334.0, 182.0, 136.0, 68.0, 57.0, 43.0, 17.0, 18.0, 6.0, 7.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 0.0, 3.0], "bins": [-8.0546875, -7.798583984375, -7.54248046875, -7.286376953125, -7.0302734375, -6.774169921875, -6.51806640625, -6.261962890625, -6.005859375, -5.749755859375, -5.49365234375, -5.237548828125, -4.9814453125, -4.725341796875, -4.46923828125, -4.213134765625, -3.95703125, -3.700927734375, -3.44482421875, -3.188720703125, -2.9326171875, -2.676513671875, -2.42041015625, -2.164306640625, -1.908203125, -1.652099609375, -1.39599609375, -1.139892578125, -0.8837890625, -0.627685546875, -0.37158203125, -0.115478515625, 0.140625, 0.396728515625, 0.65283203125, 0.908935546875, 1.1650390625, 1.421142578125, 1.67724609375, 1.933349609375, 2.189453125, 2.445556640625, 2.70166015625, 2.957763671875, 3.2138671875, 3.469970703125, 3.72607421875, 3.982177734375, 4.23828125, 4.494384765625, 4.75048828125, 5.006591796875, 5.2626953125, 5.518798828125, 5.77490234375, 6.031005859375, 6.287109375, 6.543212890625, 6.79931640625, 7.055419921875, 7.3115234375, 7.567626953125, 7.82373046875, 8.079833984375, 8.3359375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 7.0, 9.0, 7.0, 8.0, 11.0, 15.0, 16.0, 33.0, 25.0, 30.0, 32.0, 30.0, 26.0, 32.0, 37.0, 36.0, 47.0, 90.0, 325.0, 650.0, 100.0, 46.0, 37.0, 46.0, 45.0, 32.0, 27.0, 36.0, 24.0, 21.0, 19.0, 19.0, 20.0, 8.0, 17.0, 11.0, 11.0, 6.0, 4.0, 5.0, 5.0, 5.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-18.390625, -17.802978515625, -17.21533203125, -16.627685546875, -16.0400390625, -15.452392578125, -14.86474609375, -14.277099609375, -13.689453125, -13.101806640625, -12.51416015625, -11.926513671875, -11.3388671875, -10.751220703125, -10.16357421875, -9.575927734375, -8.98828125, -8.400634765625, -7.81298828125, -7.225341796875, -6.6376953125, -6.050048828125, -5.46240234375, -4.874755859375, -4.287109375, -3.699462890625, -3.11181640625, -2.524169921875, -1.9365234375, -1.348876953125, -0.76123046875, -0.173583984375, 0.4140625, 1.001708984375, 1.58935546875, 2.177001953125, 2.7646484375, 3.352294921875, 3.93994140625, 4.527587890625, 5.115234375, 5.702880859375, 6.29052734375, 6.878173828125, 7.4658203125, 8.053466796875, 8.64111328125, 9.228759765625, 9.81640625, 10.404052734375, 10.99169921875, 11.579345703125, 12.1669921875, 12.754638671875, 13.34228515625, 13.929931640625, 14.517578125, 15.105224609375, 15.69287109375, 16.280517578125, 16.8681640625, 17.455810546875, 18.04345703125, 18.631103515625, 19.21875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 6.0, 4.0, 5.0, 6.0, 7.0, 9.0, 21.0, 39.0, 58.0, 54.0, 44.0, 93.0, 148.0, 241.0, 311.0, 388.0, 641.0, 940.0, 1421.0, 2219.0, 3145.0, 4870.0, 7784.0, 11623.0, 19570.0, 30931.0, 50964.0, 86846.0, 157672.0, 329772.0, 1769271.0, 3062173.0, 353259.0, 165532.0, 90093.0, 53456.0, 31872.0, 19778.0, 12788.0, 7734.0, 5159.0, 3501.0, 2254.0, 1449.0, 1103.0, 635.0, 397.0, 285.0, 283.0, 233.0, 99.0, 54.0, 47.0, 41.0, 42.0, 37.0, 13.0, 9.0, 6.0, 3.0, 3.0, 7.0, 5.0], "bins": [-9.28125, -8.9915771484375, -8.701904296875, -8.4122314453125, -8.12255859375, -7.8328857421875, -7.543212890625, -7.2535400390625, -6.9638671875, -6.6741943359375, -6.384521484375, -6.0948486328125, -5.80517578125, -5.5155029296875, -5.225830078125, -4.9361572265625, -4.646484375, -4.3568115234375, -4.067138671875, -3.7774658203125, -3.48779296875, -3.1981201171875, -2.908447265625, -2.6187744140625, -2.3291015625, -2.0394287109375, -1.749755859375, -1.4600830078125, -1.17041015625, -0.8807373046875, -0.591064453125, -0.3013916015625, -0.01171875, 0.2779541015625, 0.567626953125, 0.8572998046875, 1.14697265625, 1.4366455078125, 1.726318359375, 2.0159912109375, 2.3056640625, 2.5953369140625, 2.885009765625, 3.1746826171875, 3.46435546875, 3.7540283203125, 4.043701171875, 4.3333740234375, 4.623046875, 4.9127197265625, 5.202392578125, 5.4920654296875, 5.78173828125, 6.0714111328125, 6.361083984375, 6.6507568359375, 6.9404296875, 7.2301025390625, 7.519775390625, 7.8094482421875, 8.09912109375, 8.3887939453125, 8.678466796875, 8.9681396484375, 9.2578125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 10.0, 9.0, 19.0, 18.0, 29.0, 35.0, 32.0, 36.0, 39.0, 50.0, 38.0, 61.0, 128.0, 407.0, 591.0, 106.0, 62.0, 52.0, 50.0, 36.0, 29.0, 36.0, 31.0, 19.0, 16.0, 13.0, 18.0, 9.0, 7.0, 9.0, 5.0, 3.0, 4.0, 3.0, 1.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.029052734375, -16.46435546875, -15.899658203125, -15.3349609375, -14.770263671875, -14.20556640625, -13.640869140625, -13.076171875, -12.511474609375, -11.94677734375, -11.382080078125, -10.8173828125, -10.252685546875, -9.68798828125, -9.123291015625, -8.55859375, -7.993896484375, -7.42919921875, -6.864501953125, -6.2998046875, -5.735107421875, -5.17041015625, -4.605712890625, -4.041015625, -3.476318359375, -2.91162109375, -2.346923828125, -1.7822265625, -1.217529296875, -0.65283203125, -0.088134765625, 0.4765625, 1.041259765625, 1.60595703125, 2.170654296875, 2.7353515625, 3.300048828125, 3.86474609375, 4.429443359375, 4.994140625, 5.558837890625, 6.12353515625, 6.688232421875, 7.2529296875, 7.817626953125, 8.38232421875, 8.947021484375, 9.51171875, 10.076416015625, 10.64111328125, 11.205810546875, 11.7705078125, 12.335205078125, 12.89990234375, 13.464599609375, 14.029296875, 14.593994140625, 15.15869140625, 15.723388671875, 16.2880859375, 16.852783203125, 17.41748046875, 17.982177734375, 18.546875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 5.0, 11.0, 5.0, 3.0, 3.0, 7.0, 14.0, 20.0, 16.0, 22.0, 53.0, 110.0, 73.0, 69.0, 94.0, 140.0, 189.0, 380.0, 390.0, 476.0, 775.0, 1128.0, 1601.0, 2698.0, 4303.0, 8135.0, 17053.0, 46567.0, 308839.0, 5791029.0, 62661.0, 21233.0, 9246.0, 5075.0, 2814.0, 1993.0, 1193.0, 757.0, 600.0, 409.0, 317.0, 250.0, 166.0, 104.0, 112.0, 83.0, 37.0, 44.0, 50.0, 43.0, 9.0, 10.0, 8.0, 9.0, 4.0, 3.0, 0.0, 6.0, 1.0, 2.0, 6.0], "bins": [-28.59375, -27.703369140625, -26.81298828125, -25.922607421875, -25.0322265625, -24.141845703125, -23.25146484375, -22.361083984375, -21.470703125, -20.580322265625, -19.68994140625, -18.799560546875, -17.9091796875, -17.018798828125, -16.12841796875, -15.238037109375, -14.34765625, -13.457275390625, -12.56689453125, -11.676513671875, -10.7861328125, -9.895751953125, -9.00537109375, -8.114990234375, -7.224609375, -6.334228515625, -5.44384765625, -4.553466796875, -3.6630859375, -2.772705078125, -1.88232421875, -0.991943359375, -0.1015625, 0.788818359375, 1.67919921875, 2.569580078125, 3.4599609375, 4.350341796875, 5.24072265625, 6.131103515625, 7.021484375, 7.911865234375, 8.80224609375, 9.692626953125, 10.5830078125, 11.473388671875, 12.36376953125, 13.254150390625, 14.14453125, 15.034912109375, 15.92529296875, 16.815673828125, 17.7060546875, 18.596435546875, 19.48681640625, 20.377197265625, 21.267578125, 22.157958984375, 23.04833984375, 23.938720703125, 24.8291015625, 25.719482421875, 26.60986328125, 27.500244140625, 28.390625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 11.0, 9.0, 6.0, 9.0, 12.0, 13.0, 9.0, 15.0, 22.0, 21.0, 29.0, 37.0, 45.0, 38.0, 41.0, 58.0, 89.0, 172.0, 409.0, 400.0, 114.0, 74.0, 51.0, 42.0, 27.0, 35.0, 28.0, 32.0, 29.0, 29.0, 18.0, 20.0, 16.0, 10.0, 8.0, 9.0, 17.0, 5.0, 2.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.8515625, -9.511962890625, -9.17236328125, -8.832763671875, -8.4931640625, -8.153564453125, -7.81396484375, -7.474365234375, -7.134765625, -6.795166015625, -6.45556640625, -6.115966796875, -5.7763671875, -5.436767578125, -5.09716796875, -4.757568359375, -4.41796875, -4.078369140625, -3.73876953125, -3.399169921875, -3.0595703125, -2.719970703125, -2.38037109375, -2.040771484375, -1.701171875, -1.361572265625, -1.02197265625, -0.682373046875, -0.3427734375, -0.003173828125, 0.33642578125, 0.676025390625, 1.015625, 1.355224609375, 1.69482421875, 2.034423828125, 2.3740234375, 2.713623046875, 3.05322265625, 3.392822265625, 3.732421875, 4.072021484375, 4.41162109375, 4.751220703125, 5.0908203125, 5.430419921875, 5.77001953125, 6.109619140625, 6.44921875, 6.788818359375, 7.12841796875, 7.468017578125, 7.8076171875, 8.147216796875, 8.48681640625, 8.826416015625, 9.166015625, 9.505615234375, 9.84521484375, 10.184814453125, 10.5244140625, 10.864013671875, 11.20361328125, 11.543212890625, 11.8828125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 10.0, 26.0, 62.0, 205.0, 469.0, 139.0, 49.0, 24.0, 8.0, 4.0, 2.0, 1.0], "bins": [-125.38099670410156, -123.1585922241211, -120.93618774414062, -118.71378326416016, -116.49137878417969, -114.26897430419922, -112.04656982421875, -109.82416534423828, -107.60176086425781, -105.37935638427734, -103.15695190429688, -100.9345474243164, -98.71214294433594, -96.48973846435547, -94.267333984375, -92.04492950439453, -89.82252502441406, -87.6001205444336, -85.37771606445312, -83.15531158447266, -80.93290710449219, -78.71050262451172, -76.48809814453125, -74.26569366455078, -72.04329681396484, -69.82089233398438, -67.5984878540039, -65.37608337402344, -63.15367889404297, -60.9312744140625, -58.70886993408203, -56.48646545410156, -54.264060974121094, -52.041656494140625, -49.819252014160156, -47.59684753417969, -45.37444305419922, -43.15203857421875, -40.92963409423828, -38.70722961425781, -36.48482894897461, -34.26242446899414, -32.04001998901367, -29.817615509033203, -27.595211029052734, -25.372806549072266, -23.15040397644043, -20.92799949645996, -18.705595016479492, -16.483190536499023, -14.260786056518555, -12.038382530212402, -9.815978050231934, -7.593573570251465, -5.3711700439453125, -3.1487655639648438, -0.926361083984375, 1.2960431575775146, 3.5184473991394043, 5.740851402282715, 7.963255882263184, 10.185660362243652, 12.408063888549805, 14.630468368530273, 16.852872848510742]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 6.0, 13.0, 15.0, 16.0, 25.0, 19.0, 27.0, 29.0, 37.0, 33.0, 37.0, 32.0, 40.0, 50.0, 41.0, 51.0, 48.0, 46.0, 39.0, 49.0, 38.0, 44.0, 34.0, 40.0, 33.0, 26.0, 24.0, 16.0, 16.0, 12.0, 14.0, 10.0, 5.0, 11.0, 7.0, 5.0, 1.0, 2.0, 2.0, 4.0], "bins": [-22.12297821044922, -21.571548461914062, -21.020118713378906, -20.46868896484375, -19.917259216308594, -19.365829467773438, -18.81439971923828, -18.262969970703125, -17.71154022216797, -17.160110473632812, -16.608680725097656, -16.0572509765625, -15.505821228027344, -14.954391479492188, -14.402961730957031, -13.851531982421875, -13.300103187561035, -12.748673439025879, -12.197243690490723, -11.645813941955566, -11.09438419342041, -10.542954444885254, -9.991525650024414, -9.440095901489258, -8.888666152954102, -8.337236404418945, -7.785806655883789, -7.234376907348633, -6.682947158813477, -6.13151741027832, -5.580088138580322, -5.028658390045166, -4.477227210998535, -3.925797462463379, -3.3743677139282227, -2.8229382038116455, -2.2715084552764893, -1.720078706741333, -1.1686491966247559, -0.6172194480895996, -0.06578969955444336, 0.4856399893760681, 1.0370696783065796, 1.5884993076324463, 2.1399290561676025, 2.691358804702759, 3.242788314819336, 3.794218063354492, 4.345647811889648, 4.897077560424805, 5.448507308959961, 5.999937057495117, 6.551366806030273, 7.10279655456543, 7.654225826263428, 8.205656051635742, 8.757085800170898, 9.308515548706055, 9.859945297241211, 10.411375045776367, 10.962804794311523, 11.51423454284668, 12.065664291381836, 12.617094039916992, 13.168522834777832]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 3.0, 1.0, 2.0, 6.0, 6.0, 8.0, 6.0, 16.0, 19.0, 12.0, 28.0, 28.0, 40.0, 44.0, 66.0, 82.0, 128.0, 190.0, 243.0, 359.0, 566.0, 844.0, 1289.0, 2090.0, 3455.0, 6220.0, 12349.0, 29927.0, 104418.0, 3822134.0, 144269.0, 35747.0, 13986.0, 6588.0, 3525.0, 1982.0, 1225.0, 780.0, 448.0, 305.0, 220.0, 162.0, 130.0, 88.0, 51.0, 50.0, 40.0, 24.0, 24.0, 16.0, 9.0, 18.0, 4.0, 8.0, 2.0, 6.0, 4.0, 0.0, 6.0, 0.0, 1.0], "bins": [-0.1090087890625, -0.10566329956054688, -0.10231781005859375, -0.09897232055664062, -0.0956268310546875, -0.09228134155273438, -0.08893585205078125, -0.08559036254882812, -0.082244873046875, -0.07889938354492188, -0.07555389404296875, -0.07220840454101562, -0.0688629150390625, -0.06551742553710938, -0.06217193603515625, -0.058826446533203125, -0.05548095703125, -0.052135467529296875, -0.04878997802734375, -0.045444488525390625, -0.0420989990234375, -0.038753509521484375, -0.03540802001953125, -0.032062530517578125, -0.028717041015625, -0.025371551513671875, -0.02202606201171875, -0.018680572509765625, -0.0153350830078125, -0.011989593505859375, -0.00864410400390625, -0.005298614501953125, -0.001953125, 0.001392364501953125, 0.00473785400390625, 0.008083343505859375, 0.0114288330078125, 0.014774322509765625, 0.01811981201171875, 0.021465301513671875, 0.024810791015625, 0.028156280517578125, 0.03150177001953125, 0.034847259521484375, 0.0381927490234375, 0.041538238525390625, 0.04488372802734375, 0.048229217529296875, 0.05157470703125, 0.054920196533203125, 0.05826568603515625, 0.061611175537109375, 0.0649566650390625, 0.06830215454101562, 0.07164764404296875, 0.07499313354492188, 0.078338623046875, 0.08168411254882812, 0.08502960205078125, 0.08837509155273438, 0.0917205810546875, 0.09506607055664062, 0.09841156005859375, 0.10175704956054688, 0.1051025390625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 3.0, 2.0, 3.0, 8.0, 5.0, 8.0, 6.0, 4.0, 11.0, 15.0, 18.0, 83.0, 712.0, 13.0, 14.0, 12.0, 9.0, 5.0, 4.0, 8.0, 7.0, 3.0, 12.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.03173828125, -0.030810117721557617, -0.029881954193115234, -0.02895379066467285, -0.02802562713623047, -0.027097463607788086, -0.026169300079345703, -0.02524113655090332, -0.024312973022460938, -0.023384809494018555, -0.022456645965576172, -0.02152848243713379, -0.020600318908691406, -0.019672155380249023, -0.01874399185180664, -0.017815828323364258, -0.016887664794921875, -0.015959501266479492, -0.01503133773803711, -0.014103174209594727, -0.013175010681152344, -0.012246847152709961, -0.011318683624267578, -0.010390520095825195, -0.009462356567382812, -0.00853419303894043, -0.007606029510498047, -0.006677865982055664, -0.005749702453613281, -0.0048215389251708984, -0.0038933753967285156, -0.002965211868286133, -0.00203704833984375, -0.0011088848114013672, -0.00018072128295898438, 0.0007474422454833984, 0.0016756057739257812, 0.002603769302368164, 0.003531932830810547, 0.00446009635925293, 0.0053882598876953125, 0.006316423416137695, 0.007244586944580078, 0.008172750473022461, 0.009100914001464844, 0.010029077529907227, 0.01095724105834961, 0.011885404586791992, 0.012813568115234375, 0.013741731643676758, 0.01466989517211914, 0.015598058700561523, 0.016526222229003906, 0.01745438575744629, 0.018382549285888672, 0.019310712814331055, 0.020238876342773438, 0.02116703987121582, 0.022095203399658203, 0.023023366928100586, 0.02395153045654297, 0.02487969398498535, 0.025807857513427734, 0.026736021041870117, 0.0276641845703125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 6.0, 3.0, 5.0, 13.0, 16.0, 13.0, 31.0, 36.0, 108.0, 268.0, 641.0, 1746.0, 6129.0, 30586.0, 295329.0, 3509286.0, 308529.0, 31990.0, 6469.0, 1874.0, 649.0, 273.0, 138.0, 55.0, 33.0, 15.0, 12.0, 10.0, 8.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.1596813201904297, -0.15407943725585938, -0.14847755432128906, -0.14287567138671875, -0.13727378845214844, -0.13167190551757812, -0.1260700225830078, -0.1204681396484375, -0.11486625671386719, -0.10926437377929688, -0.10366249084472656, -0.09806060791015625, -0.09245872497558594, -0.08685684204101562, -0.08125495910644531, -0.075653076171875, -0.07005119323730469, -0.06444931030273438, -0.05884742736816406, -0.05324554443359375, -0.04764366149902344, -0.042041778564453125, -0.03643989562988281, -0.0308380126953125, -0.025236129760742188, -0.019634246826171875, -0.014032363891601562, -0.00843048095703125, -0.0028285980224609375, 0.002773284912109375, 0.008375167846679688, 0.01397705078125, 0.019578933715820312, 0.025180816650390625, 0.030782699584960938, 0.03638458251953125, 0.04198646545410156, 0.047588348388671875, 0.05319023132324219, 0.0587921142578125, 0.06439399719238281, 0.06999588012695312, 0.07559776306152344, 0.08119964599609375, 0.08680152893066406, 0.09240341186523438, 0.09800529479980469, 0.103607177734375, 0.10920906066894531, 0.11481094360351562, 0.12041282653808594, 0.12601470947265625, 0.13161659240722656, 0.13721847534179688, 0.1428203582763672, 0.1484222412109375, 0.1540241241455078, 0.15962600708007812, 0.16522789001464844, 0.17082977294921875, 0.17643165588378906, 0.18203353881835938, 0.1876354217529297, 0.1932373046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 9.0, 11.0, 8.0, 14.0, 28.0, 27.0, 43.0, 68.0, 103.0, 124.0, 219.0, 342.0, 628.0, 918.0, 533.0, 320.0, 188.0, 144.0, 82.0, 63.0, 54.0, 43.0, 25.0, 23.0, 13.0, 7.0, 4.0, 8.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.045501708984375, -0.04414081573486328, -0.04277992248535156, -0.041419029235839844, -0.040058135986328125, -0.038697242736816406, -0.03733634948730469, -0.03597545623779297, -0.03461456298828125, -0.03325366973876953, -0.03189277648925781, -0.030531883239746094, -0.029170989990234375, -0.027810096740722656, -0.026449203491210938, -0.02508831024169922, -0.0237274169921875, -0.02236652374267578, -0.021005630493164062, -0.019644737243652344, -0.018283843994140625, -0.016922950744628906, -0.015562057495117188, -0.014201164245605469, -0.01284027099609375, -0.011479377746582031, -0.010118484497070312, -0.008757591247558594, -0.007396697998046875, -0.006035804748535156, -0.0046749114990234375, -0.0033140182495117188, -0.001953125, -0.0005922317504882812, 0.0007686614990234375, 0.0021295547485351562, 0.003490447998046875, 0.004851341247558594, 0.0062122344970703125, 0.007573127746582031, 0.00893402099609375, 0.010294914245605469, 0.011655807495117188, 0.013016700744628906, 0.014377593994140625, 0.015738487243652344, 0.017099380493164062, 0.01846027374267578, 0.0198211669921875, 0.02118206024169922, 0.022542953491210938, 0.023903846740722656, 0.025264739990234375, 0.026625633239746094, 0.027986526489257812, 0.02934741973876953, 0.03070831298828125, 0.03206920623779297, 0.03343009948730469, 0.034790992736816406, 0.036151885986328125, 0.037512779235839844, 0.03887367248535156, 0.04023456573486328, 0.041595458984375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 39.0, 65.0, 145.0, 280.0, 253.0, 116.0, 50.0, 29.0, 15.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6133080720901489, -0.597533643245697, -0.5817592144012451, -0.5659847855567932, -0.5502103567123413, -0.5344359278678894, -0.5186614990234375, -0.5028870701789856, -0.4871126413345337, -0.4713382124900818, -0.4555637836456299, -0.439789354801178, -0.4240149259567261, -0.40824049711227417, -0.39246606826782227, -0.37669163942337036, -0.36091718077659607, -0.34514275193214417, -0.32936832308769226, -0.31359389424324036, -0.29781946539878845, -0.28204503655433655, -0.26627057790756226, -0.25049614906311035, -0.23472173511981964, -0.21894730627536774, -0.20317287743091583, -0.18739843368530273, -0.17162400484085083, -0.15584957599639893, -0.14007514715194702, -0.12430071830749512, -0.10852628946304321, -0.09275186061859131, -0.0769774317741394, -0.0612029954791069, -0.045428566634655, -0.029654137790203094, -0.013879701495170593, 0.001894727349281311, 0.017669156193733215, 0.03344358503818512, 0.04921801760792732, 0.06499245017766953, 0.08076687902212143, 0.09654130786657333, 0.11231574416160583, 0.12809017300605774, 0.14386460185050964, 0.15963903069496155, 0.17541345953941345, 0.19118788838386536, 0.20696231722831726, 0.22273674607276917, 0.23851118981838226, 0.25428563356399536, 0.27006006240844727, 0.28583449125289917, 0.3016089200973511, 0.317383348941803, 0.3331577777862549, 0.3489322066307068, 0.3647066354751587, 0.3804810643196106, 0.3962554931640625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 6.0, 1.0, 6.0, 8.0, 7.0, 11.0, 19.0, 24.0, 35.0, 44.0, 36.0, 49.0, 52.0, 60.0, 63.0, 65.0, 62.0, 58.0, 76.0, 60.0, 51.0, 44.0, 32.0, 29.0, 19.0, 19.0, 12.0, 16.0, 9.0, 8.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.23663735389709473, -0.23024378716945648, -0.22385022044181824, -0.21745665371418, -0.21106308698654175, -0.2046695202589035, -0.19827595353126526, -0.1918824017047882, -0.18548882007598877, -0.17909525334835052, -0.17270168662071228, -0.16630811989307404, -0.1599145531654358, -0.15352098643779755, -0.1471274197101593, -0.14073386788368225, -0.134340301156044, -0.12794673442840576, -0.12155316770076752, -0.11515960097312927, -0.10876603424549103, -0.10237246751785278, -0.09597890824079514, -0.08958534151315689, -0.08319177478551865, -0.0767982080578804, -0.07040464133024216, -0.06401108205318451, -0.057617511600255966, -0.05122394487261772, -0.044830381870269775, -0.03843681514263153, -0.032043248414993286, -0.02564968168735504, -0.019256116822361946, -0.01286255195736885, -0.006468985229730606, -7.541850209236145e-05, 0.006318144500255585, 0.01271171122789383, 0.019105277955532074, 0.02549884468317032, 0.03189241141080856, 0.03828597441315651, 0.044679541140794754, 0.051073107868433, 0.057466670870780945, 0.06386023759841919, 0.07025380432605743, 0.07664737105369568, 0.08304093778133392, 0.08943450450897217, 0.09582807123661041, 0.10222163796424866, 0.1086151972413063, 0.11500876396894455, 0.1214023306965828, 0.12779588997364044, 0.1341894567012787, 0.14058302342891693, 0.14697659015655518, 0.15337015688419342, 0.15976372361183167, 0.1661572903394699, 0.17255085706710815]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 5.0, 16.0, 10.0, 20.0, 32.0, 33.0, 36.0, 69.0, 88.0, 133.0, 176.0, 271.0, 383.0, 520.0, 786.0, 1102.0, 1771.0, 2560.0, 4083.0, 6916.0, 12463.0, 26626.0, 249228.0, 672147.0, 33355.0, 14429.0, 7841.0, 4578.0, 2962.0, 1865.0, 1238.0, 830.0, 582.0, 410.0, 285.0, 199.0, 148.0, 95.0, 72.0, 52.0, 33.0, 39.0, 11.0, 20.0, 10.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.157470703125, -0.15256690979003906, -0.14766311645507812, -0.1427593231201172, -0.13785552978515625, -0.1329517364501953, -0.12804794311523438, -0.12314414978027344, -0.1182403564453125, -0.11333656311035156, -0.10843276977539062, -0.10352897644042969, -0.09862518310546875, -0.09372138977050781, -0.08881759643554688, -0.08391380310058594, -0.079010009765625, -0.07410621643066406, -0.06920242309570312, -0.06429862976074219, -0.05939483642578125, -0.05449104309082031, -0.049587249755859375, -0.04468345642089844, -0.0397796630859375, -0.03487586975097656, -0.029972076416015625, -0.025068283081054688, -0.02016448974609375, -0.015260696411132812, -0.010356903076171875, -0.0054531097412109375, -0.00054931640625, 0.0043544769287109375, 0.009258270263671875, 0.014162063598632812, 0.01906585693359375, 0.023969650268554688, 0.028873443603515625, 0.03377723693847656, 0.0386810302734375, 0.04358482360839844, 0.048488616943359375, 0.05339241027832031, 0.05829620361328125, 0.06319999694824219, 0.06810379028320312, 0.07300758361816406, 0.077911376953125, 0.08281517028808594, 0.08771896362304688, 0.09262275695800781, 0.09752655029296875, 0.10243034362792969, 0.10733413696289062, 0.11223793029785156, 0.1171417236328125, 0.12204551696777344, 0.12694931030273438, 0.1318531036376953, 0.13675689697265625, 0.1416606903076172, 0.14656448364257812, 0.15146827697753906, 0.1563720703125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 6.0, 10.0, 9.0, 11.0, 13.0, 24.0, 92.0, 301.0, 298.0, 96.0, 22.0, 17.0, 13.0, 5.0, 6.0, 7.0, 7.0, 7.0, 4.0, 4.0, 7.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.030303955078125, -0.029439926147460938, -0.028575897216796875, -0.027711868286132812, -0.02684783935546875, -0.025983810424804688, -0.025119781494140625, -0.024255752563476562, -0.0233917236328125, -0.022527694702148438, -0.021663665771484375, -0.020799636840820312, -0.01993560791015625, -0.019071578979492188, -0.018207550048828125, -0.017343521118164062, -0.0164794921875, -0.015615463256835938, -0.014751434326171875, -0.013887405395507812, -0.01302337646484375, -0.012159347534179688, -0.011295318603515625, -0.010431289672851562, -0.0095672607421875, -0.008703231811523438, -0.007839202880859375, -0.0069751739501953125, -0.00611114501953125, -0.0052471160888671875, -0.004383087158203125, -0.0035190582275390625, -0.002655029296875, -0.0017910003662109375, -0.000926971435546875, -6.29425048828125e-05, 0.00080108642578125, 0.0016651153564453125, 0.002529144287109375, 0.0033931732177734375, 0.0042572021484375, 0.0051212310791015625, 0.005985260009765625, 0.0068492889404296875, 0.00771331787109375, 0.008577346801757812, 0.009441375732421875, 0.010305404663085938, 0.01116943359375, 0.012033462524414062, 0.012897491455078125, 0.013761520385742188, 0.01462554931640625, 0.015489578247070312, 0.016353607177734375, 0.017217636108398438, 0.0180816650390625, 0.018945693969726562, 0.019809722900390625, 0.020673751831054688, 0.02153778076171875, 0.022401809692382812, 0.023265838623046875, 0.024129867553710938, 0.024993896484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 8.0, 10.0, 11.0, 12.0, 15.0, 32.0, 55.0, 77.0, 127.0, 230.0, 511.0, 1373.0, 5592.0, 69179.0, 904948.0, 58975.0, 5081.0, 1269.0, 467.0, 221.0, 138.0, 82.0, 50.0, 23.0, 25.0, 15.0, 7.0, 6.0, 8.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42626953125, -0.4118080139160156, -0.39734649658203125, -0.3828849792480469, -0.3684234619140625, -0.3539619445800781, -0.33950042724609375, -0.3250389099121094, -0.310577392578125, -0.2961158752441406, -0.28165435791015625, -0.2671928405761719, -0.2527313232421875, -0.23826980590820312, -0.22380828857421875, -0.20934677124023438, -0.19488525390625, -0.18042373657226562, -0.16596221923828125, -0.15150070190429688, -0.1370391845703125, -0.12257766723632812, -0.10811614990234375, -0.09365463256835938, -0.079193115234375, -0.06473159790039062, -0.05027008056640625, -0.035808563232421875, -0.0213470458984375, -0.006885528564453125, 0.00757598876953125, 0.022037506103515625, 0.0364990234375, 0.050960540771484375, 0.06542205810546875, 0.07988357543945312, 0.0943450927734375, 0.10880661010742188, 0.12326812744140625, 0.13772964477539062, 0.152191162109375, 0.16665267944335938, 0.18111419677734375, 0.19557571411132812, 0.2100372314453125, 0.22449874877929688, 0.23896026611328125, 0.2534217834472656, 0.26788330078125, 0.2823448181152344, 0.29680633544921875, 0.3112678527832031, 0.3257293701171875, 0.3401908874511719, 0.35465240478515625, 0.3691139221191406, 0.383575439453125, 0.3980369567871094, 0.41249847412109375, 0.4269599914550781, 0.4414215087890625, 0.4558830261230469, 0.47034454345703125, 0.4848060607910156, 0.499267578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 11.0, 7.0, 9.0, 11.0, 21.0, 16.0, 13.0, 21.0, 19.0, 26.0, 26.0, 24.0, 33.0, 45.0, 35.0, 31.0, 43.0, 48.0, 37.0, 42.0, 38.0, 46.0, 48.0, 29.0, 34.0, 27.0, 35.0, 43.0, 25.0, 24.0, 17.0, 30.0, 9.0, 18.0, 11.0, 4.0, 9.0, 8.0, 6.0, 3.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.1298828125, -0.12615203857421875, -0.1224212646484375, -0.11869049072265625, -0.114959716796875, -0.11122894287109375, -0.1074981689453125, -0.10376739501953125, -0.10003662109375, -0.09630584716796875, -0.0925750732421875, -0.08884429931640625, -0.085113525390625, -0.08138275146484375, -0.0776519775390625, -0.07392120361328125, -0.0701904296875, -0.06645965576171875, -0.0627288818359375, -0.05899810791015625, -0.055267333984375, -0.05153656005859375, -0.0478057861328125, -0.04407501220703125, -0.04034423828125, -0.03661346435546875, -0.0328826904296875, -0.02915191650390625, -0.025421142578125, -0.02169036865234375, -0.0179595947265625, -0.01422882080078125, -0.010498046875, -0.00676727294921875, -0.0030364990234375, 0.00069427490234375, 0.004425048828125, 0.00815582275390625, 0.0118865966796875, 0.01561737060546875, 0.01934814453125, 0.02307891845703125, 0.0268096923828125, 0.03054046630859375, 0.034271240234375, 0.03800201416015625, 0.0417327880859375, 0.04546356201171875, 0.0491943359375, 0.05292510986328125, 0.0566558837890625, 0.06038665771484375, 0.064117431640625, 0.06784820556640625, 0.0715789794921875, 0.07530975341796875, 0.07904052734375, 0.08277130126953125, 0.0865020751953125, 0.09023284912109375, 0.093963623046875, 0.09769439697265625, 0.1014251708984375, 0.10515594482421875, 0.10888671875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 10.0, 18.0, 24.0, 50.0, 65.0, 88.0, 209.0, 369.0, 820.0, 2678.0, 15492.0, 968493.0, 53306.0, 4559.0, 1299.0, 442.0, 278.0, 128.0, 73.0, 37.0, 28.0, 20.0, 14.0, 8.0, 10.0, 3.0, 7.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.4326171875, -0.4180450439453125, -0.403472900390625, -0.3889007568359375, -0.37432861328125, -0.3597564697265625, -0.345184326171875, -0.3306121826171875, -0.3160400390625, -0.3014678955078125, -0.286895751953125, -0.2723236083984375, -0.25775146484375, -0.2431793212890625, -0.228607177734375, -0.2140350341796875, -0.199462890625, -0.1848907470703125, -0.170318603515625, -0.1557464599609375, -0.14117431640625, -0.1266021728515625, -0.112030029296875, -0.0974578857421875, -0.0828857421875, -0.0683135986328125, -0.053741455078125, -0.0391693115234375, -0.02459716796875, -0.0100250244140625, 0.004547119140625, 0.0191192626953125, 0.03369140625, 0.0482635498046875, 0.062835693359375, 0.0774078369140625, 0.09197998046875, 0.1065521240234375, 0.121124267578125, 0.1356964111328125, 0.1502685546875, 0.1648406982421875, 0.179412841796875, 0.1939849853515625, 0.20855712890625, 0.2231292724609375, 0.237701416015625, 0.2522735595703125, 0.266845703125, 0.2814178466796875, 0.295989990234375, 0.3105621337890625, 0.32513427734375, 0.3397064208984375, 0.354278564453125, 0.3688507080078125, 0.3834228515625, 0.3979949951171875, 0.412567138671875, 0.4271392822265625, 0.44171142578125, 0.4562835693359375, 0.470855712890625, 0.4854278564453125, 0.5]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 7.0, 7.0, 11.0, 13.0, 9.0, 11.0, 18.0, 21.0, 26.0, 36.0, 38.0, 44.0, 46.0, 98.0, 149.0, 86.0, 68.0, 69.0, 48.0, 27.0, 29.0, 25.0, 22.0, 12.0, 19.0, 8.0, 10.0, 9.0, 4.0, 6.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0016937255859375, -0.0016447901725769043, -0.0015958547592163086, -0.0015469193458557129, -0.0014979839324951172, -0.0014490485191345215, -0.0014001131057739258, -0.00135117769241333, -0.0013022422790527344, -0.0012533068656921387, -0.001204371452331543, -0.0011554360389709473, -0.0011065006256103516, -0.0010575652122497559, -0.0010086297988891602, -0.0009596943855285645, -0.0009107589721679688, -0.000861823558807373, -0.0008128881454467773, -0.0007639527320861816, -0.0007150173187255859, -0.0006660819053649902, -0.0006171464920043945, -0.0005682110786437988, -0.0005192756652832031, -0.0004703402519226074, -0.0004214048385620117, -0.000372469425201416, -0.0003235340118408203, -0.0002745985984802246, -0.0002256631851196289, -0.0001767277717590332, -0.0001277923583984375, -7.88569450378418e-05, -2.9921531677246094e-05, 1.901388168334961e-05, 6.794929504394531e-05, 0.00011688470840454102, 0.00016582012176513672, 0.00021475553512573242, 0.0002636909484863281, 0.00031262636184692383, 0.00036156177520751953, 0.00041049718856811523, 0.00045943260192871094, 0.0005083680152893066, 0.0005573034286499023, 0.000606238842010498, 0.0006551742553710938, 0.0007041096687316895, 0.0007530450820922852, 0.0008019804954528809, 0.0008509159088134766, 0.0008998513221740723, 0.000948786735534668, 0.0009977221488952637, 0.0010466575622558594, 0.001095592975616455, 0.0011445283889770508, 0.0011934638023376465, 0.0012423992156982422, 0.0012913346290588379, 0.0013402700424194336, 0.0013892054557800293, 0.001438140869140625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 6.0, 10.0, 6.0, 5.0, 15.0, 19.0, 19.0, 34.0, 59.0, 77.0, 125.0, 169.0, 317.0, 534.0, 961.0, 1783.0, 3831.0, 9479.0, 29937.0, 170627.0, 693493.0, 101356.0, 21657.0, 7468.0, 3120.0, 1473.0, 791.0, 424.0, 264.0, 154.0, 101.0, 76.0, 43.0, 33.0, 31.0, 19.0, 8.0, 8.0, 8.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1461181640625, -0.14130783081054688, -0.13649749755859375, -0.13168716430664062, -0.1268768310546875, -0.12206649780273438, -0.11725616455078125, -0.11244583129882812, -0.107635498046875, -0.10282516479492188, -0.09801483154296875, -0.09320449829101562, -0.0883941650390625, -0.08358383178710938, -0.07877349853515625, -0.07396316528320312, -0.06915283203125, -0.06434249877929688, -0.05953216552734375, -0.054721832275390625, -0.0499114990234375, -0.045101165771484375, -0.04029083251953125, -0.035480499267578125, -0.030670166015625, -0.025859832763671875, -0.02104949951171875, -0.016239166259765625, -0.0114288330078125, -0.006618499755859375, -0.00180816650390625, 0.003002166748046875, 0.0078125, 0.012622833251953125, 0.01743316650390625, 0.022243499755859375, 0.0270538330078125, 0.031864166259765625, 0.03667449951171875, 0.041484832763671875, 0.046295166015625, 0.051105499267578125, 0.05591583251953125, 0.060726165771484375, 0.0655364990234375, 0.07034683227539062, 0.07515716552734375, 0.07996749877929688, 0.08477783203125, 0.08958816528320312, 0.09439849853515625, 0.09920883178710938, 0.1040191650390625, 0.10882949829101562, 0.11363983154296875, 0.11845016479492188, 0.123260498046875, 0.12807083129882812, 0.13288116455078125, 0.13769149780273438, 0.1425018310546875, 0.14731216430664062, 0.15212249755859375, 0.15693283081054688, 0.1617431640625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 5.0, 8.0, 11.0, 10.0, 21.0, 20.0, 31.0, 44.0, 43.0, 50.0, 78.0, 102.0, 93.0, 89.0, 72.0, 62.0, 38.0, 35.0, 39.0, 21.0, 14.0, 17.0, 18.0, 10.0, 11.0, 10.0, 5.0, 4.0, 10.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1387939453125, -0.13465118408203125, -0.1305084228515625, -0.12636566162109375, -0.122222900390625, -0.11808013916015625, -0.1139373779296875, -0.10979461669921875, -0.10565185546875, -0.10150909423828125, -0.0973663330078125, -0.09322357177734375, -0.089080810546875, -0.08493804931640625, -0.0807952880859375, -0.07665252685546875, -0.072509765625, -0.06836700439453125, -0.0642242431640625, -0.06008148193359375, -0.055938720703125, -0.05179595947265625, -0.0476531982421875, -0.04351043701171875, -0.03936767578125, -0.03522491455078125, -0.0310821533203125, -0.02693939208984375, -0.022796630859375, -0.01865386962890625, -0.0145111083984375, -0.01036834716796875, -0.0062255859375, -0.00208282470703125, 0.0020599365234375, 0.00620269775390625, 0.010345458984375, 0.01448822021484375, 0.0186309814453125, 0.02277374267578125, 0.02691650390625, 0.03105926513671875, 0.0352020263671875, 0.03934478759765625, 0.043487548828125, 0.04763031005859375, 0.0517730712890625, 0.05591583251953125, 0.06005859375, 0.06420135498046875, 0.0683441162109375, 0.07248687744140625, 0.076629638671875, 0.08077239990234375, 0.0849151611328125, 0.08905792236328125, 0.09320068359375, 0.09734344482421875, 0.1014862060546875, 0.10562896728515625, 0.109771728515625, 0.11391448974609375, 0.1180572509765625, 0.12220001220703125, 0.1263427734375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 3.0, 3.0, 4.0, 9.0, 5.0, 15.0, 11.0, 43.0, 84.0, 188.0, 346.0, 157.0, 57.0, 31.0, 17.0, 10.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.265544891357422, -2.198141574859619, -2.1307382583618164, -2.0633351802825928, -1.99593186378479, -1.9285285472869873, -1.8611253499984741, -1.793722152709961, -1.7263188362121582, -1.6589155197143555, -1.5915123224258423, -1.524109125137329, -1.4567058086395264, -1.3893024921417236, -1.3218992948532104, -1.2544960975646973, -1.1870927810668945, -1.1196894645690918, -1.0522862672805786, -0.9848830103874207, -0.9174797534942627, -0.8500764966011047, -0.7826732397079468, -0.7152699828147888, -0.6478667259216309, -0.5804634690284729, -0.5130602121353149, -0.445656955242157, -0.378253698348999, -0.31085044145584106, -0.2434471845626831, -0.17604392766952515, -0.10864090919494629, -0.04123765230178833, 0.02616560459136963, 0.09356886148452759, 0.16097211837768555, 0.2283753752708435, 0.29577863216400146, 0.3631818890571594, 0.4305851459503174, 0.49798840284347534, 0.5653916597366333, 0.6327949166297913, 0.7001981735229492, 0.7676014304161072, 0.8350046873092651, 0.9024079442024231, 0.969811201095581, 1.0372145175933838, 1.104617714881897, 1.1720209121704102, 1.239424228668213, 1.3068275451660156, 1.3742307424545288, 1.441633939743042, 1.5090372562408447, 1.5764405727386475, 1.6438437700271606, 1.7112469673156738, 1.7786502838134766, 1.8460536003112793, 1.9134567975997925, 1.9808599948883057, 2.0482633113861084]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 9.0, 7.0, 13.0, 13.0, 20.0, 22.0, 64.0, 86.0, 117.0, 168.0, 158.0, 116.0, 60.0, 35.0, 27.0, 16.0, 13.0, 9.0, 8.0, 3.0, 3.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1231069564819336, -2.040691375732422, -1.9582756757736206, -1.8758600950241089, -1.7934445142745972, -1.711028814315796, -1.6286132335662842, -1.5461976528167725, -1.4637820720672607, -1.381366491317749, -1.2989507913589478, -1.216535210609436, -1.1341196298599243, -1.051703929901123, -0.9692883491516113, -0.8868727684020996, -0.8044570684432983, -0.7220414280891418, -0.6396258473396301, -0.5572102069854736, -0.4747945964336395, -0.3923789858818054, -0.3099633455276489, -0.2275477647781372, -0.1451321244239807, -0.06271650642156601, 0.019699111580848694, 0.102114737033844, 0.1845303475856781, 0.2669459581375122, 0.3493615984916687, 0.4317771792411804, 0.5141928195953369, 0.5966084599494934, 0.6790240406990051, 0.7614396810531616, 0.8438552618026733, 0.9262709021568298, 1.0086865425109863, 1.091102123260498, 1.1735177040100098, 1.2559332847595215, 1.3383489847183228, 1.4207645654678345, 1.5031801462173462, 1.5855958461761475, 1.6680114269256592, 1.750427007675171, 1.8328427076339722, 1.9152582883834839, 1.9976739883422852, 2.080089569091797, 2.1625051498413086, 2.2449207305908203, 2.327336311340332, 2.4097518920898438, 2.4921677112579346, 2.5745832920074463, 2.656998872756958, 2.739414691925049, 2.8218302726745605, 2.9042458534240723, 2.986661434173584, 3.0690770149230957, 3.1514925956726074]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 3.0, 5.0, 10.0, 18.0, 26.0, 30.0, 46.0, 111.0, 476.0, 27133.0, 4165389.0, 844.0, 75.0, 37.0, 26.0, 14.0, 13.0, 6.0, 3.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6875, -8.491119384765625, -8.29473876953125, -8.098358154296875, -7.9019775390625, -7.705596923828125, -7.50921630859375, -7.312835693359375, -7.116455078125, -6.920074462890625, -6.72369384765625, -6.527313232421875, -6.3309326171875, -6.134552001953125, -5.93817138671875, -5.741790771484375, -5.54541015625, -5.349029541015625, -5.15264892578125, -4.956268310546875, -4.7598876953125, -4.563507080078125, -4.36712646484375, -4.170745849609375, -3.974365234375, -3.777984619140625, -3.58160400390625, -3.385223388671875, -3.1888427734375, -2.992462158203125, -2.79608154296875, -2.599700927734375, -2.4033203125, -2.206939697265625, -2.01055908203125, -1.814178466796875, -1.6177978515625, -1.421417236328125, -1.22503662109375, -1.028656005859375, -0.832275390625, -0.635894775390625, -0.43951416015625, -0.243133544921875, -0.0467529296875, 0.149627685546875, 0.34600830078125, 0.542388916015625, 0.73876953125, 0.935150146484375, 1.13153076171875, 1.327911376953125, 1.5242919921875, 1.720672607421875, 1.91705322265625, 2.113433837890625, 2.309814453125, 2.506195068359375, 2.70257568359375, 2.898956298828125, 3.0953369140625, 3.291717529296875, 3.48809814453125, 3.684478759765625, 3.880859375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 3.0, 6.0, 16.0, 16.0, 38.0, 57.0, 114.0, 178.0, 199.0, 138.0, 64.0, 41.0, 16.0, 15.0, 10.0, 10.0, 7.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0254364013671875, -0.024671077728271484, -0.02390575408935547, -0.023140430450439453, -0.022375106811523438, -0.021609783172607422, -0.020844459533691406, -0.02007913589477539, -0.019313812255859375, -0.01854848861694336, -0.017783164978027344, -0.017017841339111328, -0.016252517700195312, -0.015487194061279297, -0.014721870422363281, -0.013956546783447266, -0.01319122314453125, -0.012425899505615234, -0.011660575866699219, -0.010895252227783203, -0.010129928588867188, -0.009364604949951172, -0.008599281311035156, -0.00783395767211914, -0.007068634033203125, -0.006303310394287109, -0.005537986755371094, -0.004772663116455078, -0.0040073394775390625, -0.003242015838623047, -0.0024766921997070312, -0.0017113685607910156, -0.000946044921875, -0.00018072128295898438, 0.0005846023559570312, 0.0013499259948730469, 0.0021152496337890625, 0.002880573272705078, 0.0036458969116210938, 0.004411220550537109, 0.005176544189453125, 0.005941867828369141, 0.006707191467285156, 0.007472515106201172, 0.008237838745117188, 0.009003162384033203, 0.009768486022949219, 0.010533809661865234, 0.01129913330078125, 0.012064456939697266, 0.012829780578613281, 0.013595104217529297, 0.014360427856445312, 0.015125751495361328, 0.015891075134277344, 0.01665639877319336, 0.017421722412109375, 0.01818704605102539, 0.018952369689941406, 0.019717693328857422, 0.020483016967773438, 0.021248340606689453, 0.02201366424560547, 0.022778987884521484, 0.0235443115234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 6.0, 1.0, 9.0, 17.0, 29.0, 46.0, 86.0, 231.0, 2059.0, 3775002.0, 414531.0, 1395.0, 283.0, 188.0, 145.0, 100.0, 73.0, 39.0, 35.0, 9.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66162109375, -0.6141128540039062, -0.5666046142578125, -0.5190963745117188, -0.471588134765625, -0.42407989501953125, -0.3765716552734375, -0.32906341552734375, -0.28155517578125, -0.23404693603515625, -0.1865386962890625, -0.13903045654296875, -0.091522216796875, -0.04401397705078125, 0.0034942626953125, 0.05100250244140625, 0.0985107421875, 0.14601898193359375, 0.1935272216796875, 0.24103546142578125, 0.288543701171875, 0.33605194091796875, 0.3835601806640625, 0.43106842041015625, 0.47857666015625, 0.5260848999023438, 0.5735931396484375, 0.6211013793945312, 0.668609619140625, 0.7161178588867188, 0.7636260986328125, 0.8111343383789062, 0.858642578125, 0.9061508178710938, 0.9536590576171875, 1.0011672973632812, 1.048675537109375, 1.0961837768554688, 1.1436920166015625, 1.1912002563476562, 1.23870849609375, 1.2862167358398438, 1.3337249755859375, 1.3812332153320312, 1.428741455078125, 1.4762496948242188, 1.5237579345703125, 1.5712661743164062, 1.6187744140625, 1.6662826538085938, 1.7137908935546875, 1.7612991333007812, 1.808807373046875, 1.8563156127929688, 1.9038238525390625, 1.9513320922851562, 1.99884033203125, 2.0463485717773438, 2.0938568115234375, 2.1413650512695312, 2.188873291015625, 2.2363815307617188, 2.2838897705078125, 2.3313980102539062, 2.37890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 5.0, 11.0, 24.0, 25.0, 29.0, 52.0, 76.0, 146.0, 275.0, 658.0, 1309.0, 752.0, 330.0, 151.0, 68.0, 34.0, 24.0, 18.0, 8.0, 12.0, 9.0, 14.0, 5.0, 5.0, 4.0, 5.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043487548828125, -0.04218769073486328, -0.04088783264160156, -0.039587974548339844, -0.038288116455078125, -0.036988258361816406, -0.03568840026855469, -0.03438854217529297, -0.03308868408203125, -0.03178882598876953, -0.030488967895507812, -0.029189109802246094, -0.027889251708984375, -0.026589393615722656, -0.025289535522460938, -0.02398967742919922, -0.0226898193359375, -0.02138996124267578, -0.020090103149414062, -0.018790245056152344, -0.017490386962890625, -0.016190528869628906, -0.014890670776367188, -0.013590812683105469, -0.01229095458984375, -0.010991096496582031, -0.009691238403320312, -0.008391380310058594, -0.007091522216796875, -0.005791664123535156, -0.0044918060302734375, -0.0031919479370117188, -0.00189208984375, -0.0005922317504882812, 0.0007076263427734375, 0.0020074844360351562, 0.003307342529296875, 0.004607200622558594, 0.0059070587158203125, 0.007206916809082031, 0.00850677490234375, 0.009806632995605469, 0.011106491088867188, 0.012406349182128906, 0.013706207275390625, 0.015006065368652344, 0.016305923461914062, 0.01760578155517578, 0.0189056396484375, 0.02020549774169922, 0.021505355834960938, 0.022805213928222656, 0.024105072021484375, 0.025404930114746094, 0.026704788208007812, 0.02800464630126953, 0.02930450439453125, 0.03060436248779297, 0.03190422058105469, 0.033204078674316406, 0.034503936767578125, 0.035803794860839844, 0.03710365295410156, 0.03840351104736328, 0.039703369140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [778.0, 230.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12951700389385223, 0.027795732021331787, 0.1851084679365158, 0.34242117404937744, 0.49973392486572266, 0.6570466756820679, 0.8143593668937683, 0.9716721177101135, 1.1289849281311035, 1.2862976789474487, 1.443610429763794, 1.6009230613708496, 1.7582359313964844, 1.91554856300354, 2.0728611946105957, 2.2301740646362305, 2.387486696243286, 2.544799327850342, 2.7021121978759766, 2.8594248294830322, 3.016737699508667, 3.1740503311157227, 3.3313632011413574, 3.488675832748413, 3.645988702774048, 3.8033013343811035, 3.9606142044067383, 4.117927074432373, 4.27523946762085, 4.432552337646484, 4.589865207672119, 4.747178077697754, 4.904490947723389, 5.061803817749023, 5.2191162109375, 5.376429080963135, 5.5337419509887695, 5.691054821014404, 5.848367214202881, 6.005680084228516, 6.16299295425415, 6.320305824279785, 6.477618217468262, 6.6349310874938965, 6.792243957519531, 6.949556827545166, 7.106869220733643, 7.264182090759277, 7.421494483947754, 7.578807353973389, 7.736119747161865, 7.8934326171875, 8.050745010375977, 8.20805835723877, 8.365370750427246, 8.522684097290039, 8.679996490478516, 8.837308883666992, 8.994622230529785, 9.151934623718262, 9.309247016906738, 9.466560363769531, 9.623872756958008, 9.781185150146484, 9.938498497009277]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 1.0, 7.0, 6.0, 10.0, 7.0, 22.0, 35.0, 38.0, 47.0, 66.0, 98.0, 83.0, 119.0, 88.0, 87.0, 73.0, 48.0, 43.0, 35.0, 14.0, 17.0, 10.0, 9.0, 4.0, 3.0, 7.0, 4.0, 1.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23453474044799805, -0.22675292193889618, -0.2189711034297943, -0.21118929982185364, -0.20340748131275177, -0.1956256628036499, -0.18784385919570923, -0.18006204068660736, -0.1722802221775055, -0.16449840366840363, -0.15671658515930176, -0.14893478155136108, -0.14115296304225922, -0.13337114453315735, -0.12558934092521667, -0.11780752241611481, -0.11002570390701294, -0.10224388539791107, -0.0944620743393898, -0.08668026328086853, -0.07889844477176666, -0.0711166262626648, -0.06333481520414352, -0.055553000420331955, -0.047771185636520386, -0.039989370852708817, -0.03220755606889725, -0.024425741285085678, -0.01664392650127411, -0.00886211171746254, -0.0010802969336509705, 0.006701517850160599, 0.014483332633972168, 0.022265147417783737, 0.030046962201595306, 0.037828776985406876, 0.045610591769218445, 0.053392406553030014, 0.06117422133684158, 0.06895603239536285, 0.07673785090446472, 0.08451966941356659, 0.09230148047208786, 0.10008329153060913, 0.107865110039711, 0.11564692854881287, 0.12342873960733414, 0.1312105506658554, 0.13899236917495728, 0.14677418768405914, 0.154556006193161, 0.16233780980110168, 0.17011962831020355, 0.17790144681930542, 0.1856832504272461, 0.19346506893634796, 0.20124688744544983, 0.2090287059545517, 0.21681052446365356, 0.22459232807159424, 0.2323741465806961, 0.24015596508979797, 0.24793776869773865, 0.2557196021080017, 0.2635014057159424]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 8.0, 8.0, 12.0, 6.0, 13.0, 22.0, 28.0, 17.0, 38.0, 48.0, 63.0, 145.0, 673.0, 3504.0, 27875.0, 907262.0, 99286.0, 7694.0, 1264.0, 283.0, 74.0, 34.0, 46.0, 23.0, 24.0, 14.0, 9.0, 20.0, 11.0, 12.0, 3.0, 5.0, 4.0, 6.0, 1.0, 8.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.397705078125, -0.38385009765625, -0.3699951171875, -0.35614013671875, -0.34228515625, -0.32843017578125, -0.3145751953125, -0.30072021484375, -0.286865234375, -0.27301025390625, -0.2591552734375, -0.24530029296875, -0.2314453125, -0.21759033203125, -0.2037353515625, -0.18988037109375, -0.176025390625, -0.16217041015625, -0.1483154296875, -0.13446044921875, -0.12060546875, -0.10675048828125, -0.0928955078125, -0.07904052734375, -0.065185546875, -0.05133056640625, -0.0374755859375, -0.02362060546875, -0.009765625, 0.00408935546875, 0.0179443359375, 0.03179931640625, 0.045654296875, 0.05950927734375, 0.0733642578125, 0.08721923828125, 0.10107421875, 0.11492919921875, 0.1287841796875, 0.14263916015625, 0.156494140625, 0.17034912109375, 0.1842041015625, 0.19805908203125, 0.2119140625, 0.22576904296875, 0.2396240234375, 0.25347900390625, 0.267333984375, 0.28118896484375, 0.2950439453125, 0.30889892578125, 0.32275390625, 0.33660888671875, 0.3504638671875, 0.36431884765625, 0.378173828125, 0.39202880859375, 0.4058837890625, 0.41973876953125, 0.43359375, 0.44744873046875, 0.4613037109375, 0.47515869140625, 0.489013671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 10.0, 5.0, 18.0, 19.0, 29.0, 119.0, 275.0, 296.0, 144.0, 30.0, 21.0, 10.0, 13.0, 8.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.07470703125, -0.07324361801147461, -0.07178020477294922, -0.07031679153442383, -0.06885337829589844, -0.06738996505737305, -0.06592655181884766, -0.06446313858032227, -0.06299972534179688, -0.061536312103271484, -0.060072898864746094, -0.0586094856262207, -0.05714607238769531, -0.05568265914916992, -0.05421924591064453, -0.05275583267211914, -0.05129241943359375, -0.04982900619506836, -0.04836559295654297, -0.04690217971801758, -0.04543876647949219, -0.0439753532409668, -0.042511940002441406, -0.041048526763916016, -0.039585113525390625, -0.038121700286865234, -0.036658287048339844, -0.03519487380981445, -0.03373146057128906, -0.03226804733276367, -0.03080463409423828, -0.02934122085571289, -0.0278778076171875, -0.02641439437866211, -0.02495098114013672, -0.023487567901611328, -0.022024154663085938, -0.020560741424560547, -0.019097328186035156, -0.017633914947509766, -0.016170501708984375, -0.014707088470458984, -0.013243675231933594, -0.011780261993408203, -0.010316848754882812, -0.008853435516357422, -0.007390022277832031, -0.005926609039306641, -0.00446319580078125, -0.0029997825622558594, -0.0015363693237304688, -7.295608520507812e-05, 0.0013904571533203125, 0.002853870391845703, 0.004317283630371094, 0.005780696868896484, 0.007244110107421875, 0.008707523345947266, 0.010170936584472656, 0.011634349822998047, 0.013097763061523438, 0.014561176300048828, 0.01602458953857422, 0.01748800277709961, 0.018951416015625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 6.0, 12.0, 17.0, 21.0, 53.0, 127.0, 713.0, 15961.0, 959774.0, 70130.0, 1384.0, 202.0, 55.0, 30.0, 12.0, 13.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6650390625, -0.6468925476074219, -0.6287460327148438, -0.6105995178222656, -0.5924530029296875, -0.5743064880371094, -0.5561599731445312, -0.5380134582519531, -0.519866943359375, -0.5017204284667969, -0.48357391357421875, -0.4654273986816406, -0.4472808837890625, -0.4291343688964844, -0.41098785400390625, -0.3928413391113281, -0.37469482421875, -0.3565483093261719, -0.33840179443359375, -0.3202552795410156, -0.3021087646484375, -0.2839622497558594, -0.26581573486328125, -0.24766921997070312, -0.229522705078125, -0.21137619018554688, -0.19322967529296875, -0.17508316040039062, -0.1569366455078125, -0.13879013061523438, -0.12064361572265625, -0.10249710083007812, -0.0843505859375, -0.06620407104492188, -0.04805755615234375, -0.029911041259765625, -0.0117645263671875, 0.006381988525390625, 0.02452850341796875, 0.042675018310546875, 0.060821533203125, 0.07896804809570312, 0.09711456298828125, 0.11526107788085938, 0.1334075927734375, 0.15155410766601562, 0.16970062255859375, 0.18784713745117188, 0.20599365234375, 0.22414016723632812, 0.24228668212890625, 0.2604331970214844, 0.2785797119140625, 0.2967262268066406, 0.31487274169921875, 0.3330192565917969, 0.351165771484375, 0.3693122863769531, 0.38745880126953125, 0.4056053161621094, 0.4237518310546875, 0.4418983459472656, 0.46004486083984375, 0.4781913757324219, 0.496337890625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 9.0, 3.0, 7.0, 5.0, 5.0, 9.0, 15.0, 22.0, 19.0, 22.0, 25.0, 25.0, 31.0, 32.0, 38.0, 38.0, 41.0, 43.0, 50.0, 41.0, 32.0, 32.0, 33.0, 41.0, 31.0, 29.0, 46.0, 45.0, 31.0, 21.0, 31.0, 33.0, 11.0, 21.0, 14.0, 15.0, 11.0, 11.0, 5.0, 5.0, 3.0, 3.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06683349609375, -0.06458473205566406, -0.062335968017578125, -0.06008720397949219, -0.05783843994140625, -0.05558967590332031, -0.053340911865234375, -0.05109214782714844, -0.0488433837890625, -0.04659461975097656, -0.044345855712890625, -0.04209709167480469, -0.03984832763671875, -0.03759956359863281, -0.035350799560546875, -0.03310203552246094, -0.030853271484375, -0.028604507446289062, -0.026355743408203125, -0.024106979370117188, -0.02185821533203125, -0.019609451293945312, -0.017360687255859375, -0.015111923217773438, -0.0128631591796875, -0.010614395141601562, -0.008365631103515625, -0.0061168670654296875, -0.00386810302734375, -0.0016193389892578125, 0.000629425048828125, 0.0028781890869140625, 0.005126953125, 0.0073757171630859375, 0.009624481201171875, 0.011873245239257812, 0.01412200927734375, 0.016370773315429688, 0.018619537353515625, 0.020868301391601562, 0.0231170654296875, 0.025365829467773438, 0.027614593505859375, 0.029863357543945312, 0.03211212158203125, 0.03436088562011719, 0.036609649658203125, 0.03885841369628906, 0.041107177734375, 0.04335594177246094, 0.045604705810546875, 0.04785346984863281, 0.05010223388671875, 0.05235099792480469, 0.054599761962890625, 0.05684852600097656, 0.0590972900390625, 0.06134605407714844, 0.06359481811523438, 0.06584358215332031, 0.06809234619140625, 0.07034111022949219, 0.07258987426757812, 0.07483863830566406, 0.07708740234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 8.0, 18.0, 56.0, 267.0, 1850.0, 994066.0, 51125.0, 890.0, 152.0, 41.0, 19.0, 9.0, 7.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.005859375, -0.9709930419921875, -0.936126708984375, -0.9012603759765625, -0.86639404296875, -0.8315277099609375, -0.796661376953125, -0.7617950439453125, -0.7269287109375, -0.6920623779296875, -0.657196044921875, -0.6223297119140625, -0.58746337890625, -0.5525970458984375, -0.517730712890625, -0.4828643798828125, -0.447998046875, -0.4131317138671875, -0.378265380859375, -0.3433990478515625, -0.30853271484375, -0.2736663818359375, -0.238800048828125, -0.2039337158203125, -0.1690673828125, -0.1342010498046875, -0.099334716796875, -0.0644683837890625, -0.02960205078125, 0.0052642822265625, 0.040130615234375, 0.0749969482421875, 0.10986328125, 0.1447296142578125, 0.179595947265625, 0.2144622802734375, 0.24932861328125, 0.2841949462890625, 0.319061279296875, 0.3539276123046875, 0.3887939453125, 0.4236602783203125, 0.458526611328125, 0.4933929443359375, 0.52825927734375, 0.5631256103515625, 0.597991943359375, 0.6328582763671875, 0.667724609375, 0.7025909423828125, 0.737457275390625, 0.7723236083984375, 0.80718994140625, 0.8420562744140625, 0.876922607421875, 0.9117889404296875, 0.9466552734375, 0.9815216064453125, 1.016387939453125, 1.0512542724609375, 1.08612060546875, 1.1209869384765625, 1.155853271484375, 1.1907196044921875, 1.2255859375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 3.0, 5.0, 3.0, 11.0, 12.0, 12.0, 25.0, 39.0, 169.0, 544.0, 65.0, 37.0, 22.0, 16.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029354095458984375, -0.0028274953365325928, -0.002719581127166748, -0.0026116669178009033, -0.0025037527084350586, -0.002395838499069214, -0.002287924289703369, -0.0021800100803375244, -0.0020720958709716797, -0.001964181661605835, -0.0018562674522399902, -0.0017483532428741455, -0.0016404390335083008, -0.001532524824142456, -0.0014246106147766113, -0.0013166964054107666, -0.0012087821960449219, -0.0011008679866790771, -0.0009929537773132324, -0.0008850395679473877, -0.000777125358581543, -0.0006692111492156982, -0.0005612969398498535, -0.0004533827304840088, -0.00034546852111816406, -0.00023755431175231934, -0.0001296401023864746, -2.1725893020629883e-05, 8.618831634521484e-05, 0.00019410252571105957, 0.0003020167350769043, 0.000409930944442749, 0.0005178451538085938, 0.0006257593631744385, 0.0007336735725402832, 0.0008415877819061279, 0.0009495019912719727, 0.0010574162006378174, 0.0011653304100036621, 0.0012732446193695068, 0.0013811588287353516, 0.0014890730381011963, 0.001596987247467041, 0.0017049014568328857, 0.0018128156661987305, 0.0019207298755645752, 0.00202864408493042, 0.0021365582942962646, 0.0022444725036621094, 0.002352386713027954, 0.002460300922393799, 0.0025682151317596436, 0.0026761293411254883, 0.002784043550491333, 0.0028919577598571777, 0.0029998719692230225, 0.003107786178588867, 0.003215700387954712, 0.0033236145973205566, 0.0034315288066864014, 0.003539443016052246, 0.003647357225418091, 0.0037552714347839355, 0.0038631856441497803, 0.003971099853515625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 5.0, 2.0, 8.0, 15.0, 22.0, 21.0, 23.0, 35.0, 70.0, 86.0, 134.0, 210.0, 388.0, 799.0, 1922.0, 7112.0, 53185.0, 829934.0, 137549.0, 11981.0, 2942.0, 1039.0, 418.0, 259.0, 139.0, 85.0, 66.0, 33.0, 26.0, 18.0, 9.0, 7.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25244140625, -0.24446487426757812, -0.23648834228515625, -0.22851181030273438, -0.2205352783203125, -0.21255874633789062, -0.20458221435546875, -0.19660568237304688, -0.188629150390625, -0.18065261840820312, -0.17267608642578125, -0.16469955444335938, -0.1567230224609375, -0.14874649047851562, -0.14076995849609375, -0.13279342651367188, -0.12481689453125, -0.11684036254882812, -0.10886383056640625, -0.10088729858398438, -0.0929107666015625, -0.08493423461914062, -0.07695770263671875, -0.06898117065429688, -0.061004638671875, -0.053028106689453125, -0.04505157470703125, -0.037075042724609375, -0.0290985107421875, -0.021121978759765625, -0.01314544677734375, -0.005168914794921875, 0.0028076171875, 0.010784149169921875, 0.01876068115234375, 0.026737213134765625, 0.0347137451171875, 0.042690277099609375, 0.05066680908203125, 0.058643341064453125, 0.066619873046875, 0.07459640502929688, 0.08257293701171875, 0.09054946899414062, 0.0985260009765625, 0.10650253295898438, 0.11447906494140625, 0.12245559692382812, 0.13043212890625, 0.13840866088867188, 0.14638519287109375, 0.15436172485351562, 0.1623382568359375, 0.17031478881835938, 0.17829132080078125, 0.18626785278320312, 0.194244384765625, 0.20222091674804688, 0.21019744873046875, 0.21817398071289062, 0.2261505126953125, 0.23412704467773438, 0.24210357666015625, 0.2500801086425781, 0.258056640625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 2.0, 15.0, 16.0, 24.0, 36.0, 71.0, 107.0, 148.0, 155.0, 130.0, 102.0, 67.0, 44.0, 22.0, 25.0, 8.0, 9.0, 4.0, 4.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.1883544921875, -0.18403053283691406, -0.17970657348632812, -0.1753826141357422, -0.17105865478515625, -0.1667346954345703, -0.16241073608398438, -0.15808677673339844, -0.1537628173828125, -0.14943885803222656, -0.14511489868164062, -0.1407909393310547, -0.13646697998046875, -0.1321430206298828, -0.12781906127929688, -0.12349510192871094, -0.119171142578125, -0.11484718322753906, -0.11052322387695312, -0.10619926452636719, -0.10187530517578125, -0.09755134582519531, -0.09322738647460938, -0.08890342712402344, -0.0845794677734375, -0.08025550842285156, -0.07593154907226562, -0.07160758972167969, -0.06728363037109375, -0.06295967102050781, -0.058635711669921875, -0.05431175231933594, -0.04998779296875, -0.04566383361816406, -0.041339874267578125, -0.03701591491699219, -0.03269195556640625, -0.028367996215820312, -0.024044036865234375, -0.019720077514648438, -0.0153961181640625, -0.011072158813476562, -0.006748199462890625, -0.0024242401123046875, 0.00189971923828125, 0.0062236785888671875, 0.010547637939453125, 0.014871597290039062, 0.019195556640625, 0.023519515991210938, 0.027843475341796875, 0.03216743469238281, 0.03649139404296875, 0.04081535339355469, 0.045139312744140625, 0.04946327209472656, 0.0537872314453125, 0.05811119079589844, 0.062435150146484375, 0.06675910949707031, 0.07108306884765625, 0.07540702819824219, 0.07973098754882812, 0.08405494689941406, 0.08837890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 10.0, 12.0, 18.0, 38.0, 63.0, 105.0, 178.0, 195.0, 153.0, 114.0, 36.0, 27.0, 15.0, 10.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.082637071609497, -1.0558706521987915, -1.029104232788086, -1.00233793258667, -0.9755715131759644, -0.9488050937652588, -0.9220386743545532, -0.8952723145484924, -0.8685059547424316, -0.8417395353317261, -0.8149731755256653, -0.7882067561149597, -0.7614403963088989, -0.7346739768981934, -0.7079075574874878, -0.681141197681427, -0.6543747782707214, -0.6276083588600159, -0.6008419990539551, -0.5740755796432495, -0.5473092198371887, -0.5205428004264832, -0.4937764108181, -0.4670100212097168, -0.4402436316013336, -0.41347724199295044, -0.38671085238456726, -0.3599444627761841, -0.3331780433654785, -0.3064116835594177, -0.27964526414871216, -0.252878874540329, -0.22611242532730103, -0.19934603571891785, -0.17257964611053467, -0.1458132416009903, -0.11904685199260712, -0.09228046238422394, -0.06551405787467957, -0.03874766826629639, -0.011981278657913208, 0.01478511467576027, 0.041551508009433746, 0.06831790506839752, 0.0950842946767807, 0.12185068428516388, 0.14861708879470825, 0.17538347840309143, 0.2021498680114746, 0.2289162576198578, 0.25568264722824097, 0.28244906663894653, 0.3092154264450073, 0.3359818458557129, 0.36274823546409607, 0.38951462507247925, 0.4162810146808624, 0.4430474042892456, 0.4698137938976288, 0.49658018350601196, 0.5233466029167175, 0.5501129627227783, 0.5768793821334839, 0.6036458015441895, 0.6304121613502502]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 11.0, 9.0, 10.0, 13.0, 13.0, 26.0, 46.0, 47.0, 63.0, 105.0, 89.0, 111.0, 112.0, 71.0, 74.0, 51.0, 47.0, 28.0, 19.0, 13.0, 6.0, 8.0, 4.0, 2.0, 3.0, 3.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1939961910247803, -1.161128044128418, -1.1282597780227661, -1.0953916311264038, -1.062523365020752, -1.0296552181243896, -0.9967870712280273, -0.9639188647270203, -0.9310506582260132, -0.8981824517250061, -0.865314245223999, -0.8324460983276367, -0.7995778918266296, -0.7667096853256226, -0.7338415384292603, -0.7009733319282532, -0.6681051254272461, -0.635236918926239, -0.6023687124252319, -0.5695005655288696, -0.5366323590278625, -0.5037641525268555, -0.4708959758281708, -0.4380277991294861, -0.405159592628479, -0.3722913861274719, -0.33942320942878723, -0.30655503273010254, -0.27368682622909546, -0.24081863462924957, -0.2079504430294037, -0.1750822514295578, -0.14221394062042236, -0.10934574902057648, -0.07647755742073059, -0.043609365820884705, -0.010741174221038818, 0.022127017378807068, 0.054995208978652954, 0.08786340057849884, 0.12073159217834473, 0.1535997837781906, 0.1864679753780365, 0.21933616697788239, 0.25220435857772827, 0.28507256507873535, 0.31794074177742004, 0.35080891847610474, 0.3836771249771118, 0.4165453314781189, 0.4494135081768036, 0.4822816848754883, 0.5151498913764954, 0.5480180978775024, 0.5808862447738647, 0.6137544512748718, 0.6466226577758789, 0.679490864276886, 0.7123590707778931, 0.7452272176742554, 0.7780954241752625, 0.8109636306762695, 0.8438317775726318, 0.8766999840736389, 0.909568190574646]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 4.0, 4.0, 4.0, 2.0, 4.0, 6.0, 8.0, 0.0, 6.0, 13.0, 11.0, 15.0, 17.0, 26.0, 21.0, 24.0, 25.0, 33.0, 62.0, 100.0, 533.0, 6077.0, 4161316.0, 24273.0, 1305.0, 194.0, 53.0, 30.0, 24.0, 14.0, 18.0, 10.0, 4.0, 8.0, 2.0, 6.0, 8.0, 0.0, 0.0, 2.0, 6.0, 2.0, 6.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1796875, -2.118560791015625, -2.05743408203125, -1.996307373046875, -1.9351806640625, -1.874053955078125, -1.81292724609375, -1.751800537109375, -1.690673828125, -1.629547119140625, -1.56842041015625, -1.507293701171875, -1.4461669921875, -1.385040283203125, -1.32391357421875, -1.262786865234375, -1.20166015625, -1.140533447265625, -1.07940673828125, -1.018280029296875, -0.9571533203125, -0.896026611328125, -0.83489990234375, -0.773773193359375, -0.712646484375, -0.651519775390625, -0.59039306640625, -0.529266357421875, -0.4681396484375, -0.407012939453125, -0.34588623046875, -0.284759521484375, -0.2236328125, -0.162506103515625, -0.10137939453125, -0.040252685546875, 0.0208740234375, 0.082000732421875, 0.14312744140625, 0.204254150390625, 0.265380859375, 0.326507568359375, 0.38763427734375, 0.448760986328125, 0.5098876953125, 0.571014404296875, 0.63214111328125, 0.693267822265625, 0.75439453125, 0.815521240234375, 0.87664794921875, 0.937774658203125, 0.9989013671875, 1.060028076171875, 1.12115478515625, 1.182281494140625, 1.243408203125, 1.304534912109375, 1.36566162109375, 1.426788330078125, 1.4879150390625, 1.549041748046875, 1.61016845703125, 1.671295166015625, 1.732421875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 5.0, 11.0, 15.0, 26.0, 55.0, 89.0, 145.0, 203.0, 186.0, 109.0, 61.0, 32.0, 18.0, 10.0, 6.0, 7.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0401611328125, -0.03921937942504883, -0.038277626037597656, -0.037335872650146484, -0.03639411926269531, -0.03545236587524414, -0.03451061248779297, -0.0335688591003418, -0.032627105712890625, -0.03168535232543945, -0.03074359893798828, -0.02980184555053711, -0.028860092163085938, -0.027918338775634766, -0.026976585388183594, -0.026034832000732422, -0.02509307861328125, -0.024151325225830078, -0.023209571838378906, -0.022267818450927734, -0.021326065063476562, -0.02038431167602539, -0.01944255828857422, -0.018500804901123047, -0.017559051513671875, -0.016617298126220703, -0.01567554473876953, -0.01473379135131836, -0.013792037963867188, -0.012850284576416016, -0.011908531188964844, -0.010966777801513672, -0.0100250244140625, -0.009083271026611328, -0.008141517639160156, -0.007199764251708984, -0.0062580108642578125, -0.005316257476806641, -0.004374504089355469, -0.003432750701904297, -0.002490997314453125, -0.0015492439270019531, -0.0006074905395507812, 0.0003342628479003906, 0.0012760162353515625, 0.0022177696228027344, 0.0031595230102539062, 0.004101276397705078, 0.00504302978515625, 0.005984783172607422, 0.006926536560058594, 0.007868289947509766, 0.008810043334960938, 0.00975179672241211, 0.010693550109863281, 0.011635303497314453, 0.012577056884765625, 0.013518810272216797, 0.014460563659667969, 0.01540231704711914, 0.016344070434570312, 0.017285823822021484, 0.018227577209472656, 0.019169330596923828, 0.020111083984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 16.0, 99.0, 748.0, 4187702.0, 5509.0, 185.0, 36.0], "bins": [-6.7734375, -6.661884307861328, -6.550331115722656, -6.438777923583984, -6.3272247314453125, -6.215671539306641, -6.104118347167969, -5.992565155029297, -5.881011962890625, -5.769458770751953, -5.657905578613281, -5.546352386474609, -5.4347991943359375, -5.323246002197266, -5.211692810058594, -5.100139617919922, -4.98858642578125, -4.877033233642578, -4.765480041503906, -4.653926849365234, -4.5423736572265625, -4.430820465087891, -4.319267272949219, -4.207714080810547, -4.096160888671875, -3.984607696533203, -3.8730545043945312, -3.7615013122558594, -3.6499481201171875, -3.5383949279785156, -3.4268417358398438, -3.315288543701172, -3.2037353515625, -3.092182159423828, -2.9806289672851562, -2.8690757751464844, -2.7575225830078125, -2.6459693908691406, -2.5344161987304688, -2.422863006591797, -2.311309814453125, -2.199756622314453, -2.0882034301757812, -1.9766502380371094, -1.8650970458984375, -1.7535438537597656, -1.6419906616210938, -1.5304374694824219, -1.41888427734375, -1.3073310852050781, -1.1957778930664062, -1.0842247009277344, -0.9726715087890625, -0.8611183166503906, -0.7495651245117188, -0.6380119323730469, -0.526458740234375, -0.4149055480957031, -0.30335235595703125, -0.19179916381835938, -0.0802459716796875, 0.031307220458984375, 0.14286041259765625, 0.2544136047363281, 0.365966796875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 7.0, 9.0, 15.0, 32.0, 51.0, 174.0, 864.0, 2369.0, 349.0, 109.0, 46.0, 34.0, 12.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1461181640625, -0.1429586410522461, -0.1397991180419922, -0.13663959503173828, -0.13348007202148438, -0.13032054901123047, -0.12716102600097656, -0.12400150299072266, -0.12084197998046875, -0.11768245697021484, -0.11452293395996094, -0.11136341094970703, -0.10820388793945312, -0.10504436492919922, -0.10188484191894531, -0.0987253189086914, -0.0955657958984375, -0.0924062728881836, -0.08924674987792969, -0.08608722686767578, -0.08292770385742188, -0.07976818084716797, -0.07660865783691406, -0.07344913482666016, -0.07028961181640625, -0.06713008880615234, -0.06397056579589844, -0.06081104278564453, -0.057651519775390625, -0.05449199676513672, -0.05133247375488281, -0.048172950744628906, -0.045013427734375, -0.041853904724121094, -0.03869438171386719, -0.03553485870361328, -0.032375335693359375, -0.02921581268310547, -0.026056289672851562, -0.022896766662597656, -0.01973724365234375, -0.016577720642089844, -0.013418197631835938, -0.010258674621582031, -0.007099151611328125, -0.003939628601074219, -0.0007801055908203125, 0.0023794174194335938, 0.0055389404296875, 0.008698463439941406, 0.011857986450195312, 0.015017509460449219, 0.018177032470703125, 0.02133655548095703, 0.024496078491210938, 0.027655601501464844, 0.03081512451171875, 0.033974647521972656, 0.03713417053222656, 0.04029369354248047, 0.043453216552734375, 0.04661273956298828, 0.04977226257324219, 0.052931785583496094, 0.05609130859375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 363.0, 644.0, 8.0, 1.0, 1.0], "bins": [-16.237573623657227, -15.967021942138672, -15.696470260620117, -15.425917625427246, -15.155365943908691, -14.884814262390137, -14.614261627197266, -14.343709945678711, -14.073158264160156, -13.802606582641602, -13.532054901123047, -13.261502265930176, -12.990950584411621, -12.720398902893066, -12.449846267700195, -12.17929458618164, -11.908742904663086, -11.638191223144531, -11.367639541625977, -11.097086906433105, -10.82653522491455, -10.555983543395996, -10.285430908203125, -10.01487922668457, -9.744327545166016, -9.473775863647461, -9.203224182128906, -8.932671546936035, -8.66211986541748, -8.391568183898926, -8.121015548706055, -7.8504638671875, -7.579912185668945, -7.309360504150391, -7.038808345794678, -6.768256187438965, -6.49770450592041, -6.2271528244018555, -5.956600666046143, -5.68604850769043, -5.415496826171875, -5.14494514465332, -4.874392986297607, -4.6038408279418945, -4.33328914642334, -4.062737464904785, -3.7921853065490723, -3.5216333866119385, -3.251081705093384, -2.98052978515625, -2.709977865219116, -2.4394259452819824, -2.1688740253448486, -1.8983221054077148, -1.627770185470581, -1.3572182655334473, -1.0866663455963135, -0.8161144256591797, -0.5455625057220459, -0.2750105857849121, -0.00445866584777832, 0.26609325408935547, 0.5366451740264893, 0.807197093963623, 1.0777490139007568]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 15.0, 30.0, 112.0, 211.0, 282.0, 192.0, 109.0, 40.0, 14.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.9985620975494385, -2.9411702156066895, -2.8837780952453613, -2.8263862133026123, -2.768994092941284, -2.711602210998535, -2.654210329055786, -2.596818208694458, -2.539426326751709, -2.48203444480896, -2.424642324447632, -2.367250442504883, -2.3098583221435547, -2.2524664402008057, -2.1950745582580566, -2.1376824378967285, -2.0802905559539795, -2.0228986740112305, -1.9655065536499023, -1.9081146717071533, -1.8507226705551147, -1.7933306694030762, -1.7359386682510376, -1.678546667098999, -1.6211546659469604, -1.5637626647949219, -1.5063706636428833, -1.4489787817001343, -1.3915867805480957, -1.3341947793960571, -1.2768027782440186, -1.2194108963012695, -1.1620190143585205, -1.104627013206482, -1.0472350120544434, -0.9898430705070496, -0.9324511289596558, -0.8750591278076172, -0.8176671266555786, -0.7602751851081848, -0.7028831243515015, -0.6454911231994629, -0.5880991816520691, -0.5307071805000305, -0.4733152389526367, -0.41592323780059814, -0.35853126645088196, -0.30113929510116577, -0.24374735355377197, -0.1863553822040558, -0.1289634108543396, -0.07157142460346222, -0.014179453253746033, 0.04321253299713135, 0.10060450434684753, 0.15799647569656372, 0.2153884470462799, 0.2727804183959961, 0.3301723897457123, 0.38756436109542847, 0.44495636224746704, 0.5023483037948608, 0.5597403049468994, 0.617132306098938, 0.6745242476463318]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 7.0, 6.0, 5.0, 6.0, 22.0, 13.0, 19.0, 19.0, 24.0, 35.0, 26.0, 29.0, 47.0, 52.0, 37.0, 73.0, 6758.0, 1040878.0, 89.0, 57.0, 59.0, 43.0, 35.0, 38.0, 18.0, 30.0, 20.0, 16.0, 19.0, 12.0, 12.0, 4.0, 9.0, 6.0, 3.0, 4.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.44921875, -3.3311767578125, -3.213134765625, -3.0950927734375, -2.97705078125, -2.8590087890625, -2.740966796875, -2.6229248046875, -2.5048828125, -2.3868408203125, -2.268798828125, -2.1507568359375, -2.03271484375, -1.9146728515625, -1.796630859375, -1.6785888671875, -1.560546875, -1.4425048828125, -1.324462890625, -1.2064208984375, -1.08837890625, -0.9703369140625, -0.852294921875, -0.7342529296875, -0.6162109375, -0.4981689453125, -0.380126953125, -0.2620849609375, -0.14404296875, -0.0260009765625, 0.092041015625, 0.2100830078125, 0.328125, 0.4461669921875, 0.564208984375, 0.6822509765625, 0.80029296875, 0.9183349609375, 1.036376953125, 1.1544189453125, 1.2724609375, 1.3905029296875, 1.508544921875, 1.6265869140625, 1.74462890625, 1.8626708984375, 1.980712890625, 2.0987548828125, 2.216796875, 2.3348388671875, 2.452880859375, 2.5709228515625, 2.68896484375, 2.8070068359375, 2.925048828125, 3.0430908203125, 3.1611328125, 3.2791748046875, 3.397216796875, 3.5152587890625, 3.63330078125, 3.7513427734375, 3.869384765625, 3.9874267578125, 4.10546875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 150.0, 771.0, 95.0, 2.0], "bins": [-0.84716796875, -0.8333635330200195, -0.8195590972900391, -0.8057546615600586, -0.7919502258300781, -0.7781457901000977, -0.7643413543701172, -0.7505369186401367, -0.7367324829101562, -0.7229280471801758, -0.7091236114501953, -0.6953191757202148, -0.6815147399902344, -0.6677103042602539, -0.6539058685302734, -0.640101432800293, -0.6262969970703125, -0.612492561340332, -0.5986881256103516, -0.5848836898803711, -0.5710792541503906, -0.5572748184204102, -0.5434703826904297, -0.5296659469604492, -0.5158615112304688, -0.5020570755004883, -0.4882526397705078, -0.47444820404052734, -0.4606437683105469, -0.4468393325805664, -0.43303489685058594, -0.41923046112060547, -0.405426025390625, -0.39162158966064453, -0.37781715393066406, -0.3640127182006836, -0.3502082824707031, -0.33640384674072266, -0.3225994110107422, -0.3087949752807617, -0.29499053955078125, -0.2811861038208008, -0.2673816680908203, -0.25357723236083984, -0.23977279663085938, -0.2259683609008789, -0.21216392517089844, -0.19835948944091797, -0.1845550537109375, -0.17075061798095703, -0.15694618225097656, -0.1431417465209961, -0.12933731079101562, -0.11553287506103516, -0.10172843933105469, -0.08792400360107422, -0.07411956787109375, -0.06031513214111328, -0.04651069641113281, -0.032706260681152344, -0.018901824951171875, -0.005097389221191406, 0.008707046508789062, 0.02251148223876953, 0.03631591796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 6.0, 10.0, 7.0, 10.0, 9.0, 14.0, 19.0, 26.0, 45.0, 73.0, 157.0, 249.0, 509.0, 1092.0, 2718.0, 7804.0, 29410.0, 173878.0, 704239.0, 98796.0, 19934.0, 5741.0, 2031.0, 814.0, 411.0, 211.0, 111.0, 77.0, 43.0, 43.0, 19.0, 9.0, 9.0, 8.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.73388671875, -0.708892822265625, -0.68389892578125, -0.658905029296875, -0.6339111328125, -0.608917236328125, -0.58392333984375, -0.558929443359375, -0.533935546875, -0.508941650390625, -0.48394775390625, -0.458953857421875, -0.4339599609375, -0.408966064453125, -0.38397216796875, -0.358978271484375, -0.333984375, -0.308990478515625, -0.28399658203125, -0.259002685546875, -0.2340087890625, -0.209014892578125, -0.18402099609375, -0.159027099609375, -0.134033203125, -0.109039306640625, -0.08404541015625, -0.059051513671875, -0.0340576171875, -0.009063720703125, 0.01593017578125, 0.040924072265625, 0.06591796875, 0.090911865234375, 0.11590576171875, 0.140899658203125, 0.1658935546875, 0.190887451171875, 0.21588134765625, 0.240875244140625, 0.265869140625, 0.290863037109375, 0.31585693359375, 0.340850830078125, 0.3658447265625, 0.390838623046875, 0.41583251953125, 0.440826416015625, 0.4658203125, 0.490814208984375, 0.51580810546875, 0.540802001953125, 0.5657958984375, 0.590789794921875, 0.61578369140625, 0.640777587890625, 0.665771484375, 0.690765380859375, 0.71575927734375, 0.740753173828125, 0.7657470703125, 0.790740966796875, 0.81573486328125, 0.840728759765625, 0.86572265625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 7.0, 5.0, 7.0, 13.0, 7.0, 11.0, 11.0, 25.0, 32.0, 38.0, 50.0, 54.0, 50.0, 52.0, 75.0, 80.0, 59.0, 72.0, 71.0, 59.0, 39.0, 29.0, 40.0, 25.0, 25.0, 16.0, 11.0, 10.0, 10.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56201171875, -0.5417861938476562, -0.5215606689453125, -0.5013351440429688, -0.481109619140625, -0.46088409423828125, -0.4406585693359375, -0.42043304443359375, -0.40020751953125, -0.37998199462890625, -0.3597564697265625, -0.33953094482421875, -0.319305419921875, -0.29907989501953125, -0.2788543701171875, -0.25862884521484375, -0.2384033203125, -0.21817779541015625, -0.1979522705078125, -0.17772674560546875, -0.157501220703125, -0.13727569580078125, -0.1170501708984375, -0.09682464599609375, -0.07659912109375, -0.05637359619140625, -0.0361480712890625, -0.01592254638671875, 0.004302978515625, 0.02452850341796875, 0.0447540283203125, 0.06497955322265625, 0.085205078125, 0.10543060302734375, 0.1256561279296875, 0.14588165283203125, 0.166107177734375, 0.18633270263671875, 0.2065582275390625, 0.22678375244140625, 0.24700927734375, 0.26723480224609375, 0.2874603271484375, 0.30768585205078125, 0.327911376953125, 0.34813690185546875, 0.3683624267578125, 0.38858795166015625, 0.4088134765625, 0.42903900146484375, 0.4492645263671875, 0.46949005126953125, 0.489715576171875, 0.5099411010742188, 0.5301666259765625, 0.5503921508789062, 0.57061767578125, 0.5908432006835938, 0.6110687255859375, 0.6312942504882812, 0.651519775390625, 0.6717453002929688, 0.6919708251953125, 0.7121963500976562, 0.732421875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 2.0, 5.0, 8.0, 6.0, 12.0, 12.0, 20.0, 18.0, 32.0, 53.0, 68.0, 149.0, 304.0, 924.0, 4040.0, 52803.0, 932467.0, 52031.0, 4000.0, 865.0, 320.0, 145.0, 69.0, 53.0, 29.0, 21.0, 17.0, 16.0, 14.0, 11.0, 4.0, 2.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.369140625, -1.3270111083984375, -1.284881591796875, -1.2427520751953125, -1.20062255859375, -1.1584930419921875, -1.116363525390625, -1.0742340087890625, -1.0321044921875, -0.9899749755859375, -0.947845458984375, -0.9057159423828125, -0.86358642578125, -0.8214569091796875, -0.779327392578125, -0.7371978759765625, -0.695068359375, -0.6529388427734375, -0.610809326171875, -0.5686798095703125, -0.52655029296875, -0.4844207763671875, -0.442291259765625, -0.4001617431640625, -0.3580322265625, -0.3159027099609375, -0.273773193359375, -0.2316436767578125, -0.18951416015625, -0.1473846435546875, -0.105255126953125, -0.0631256103515625, -0.02099609375, 0.0211334228515625, 0.063262939453125, 0.1053924560546875, 0.14752197265625, 0.1896514892578125, 0.231781005859375, 0.2739105224609375, 0.3160400390625, 0.3581695556640625, 0.400299072265625, 0.4424285888671875, 0.48455810546875, 0.5266876220703125, 0.568817138671875, 0.6109466552734375, 0.653076171875, 0.6952056884765625, 0.737335205078125, 0.7794647216796875, 0.82159423828125, 0.8637237548828125, 0.905853271484375, 0.9479827880859375, 0.9901123046875, 1.0322418212890625, 1.074371337890625, 1.1165008544921875, 1.15863037109375, 1.2007598876953125, 1.242889404296875, 1.2850189208984375, 1.3271484375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 4.0, 3.0, 4.0, 8.0, 10.0, 16.0, 18.0, 21.0, 40.0, 49.0, 82.0, 97.0, 181.0, 155.0, 91.0, 56.0, 46.0, 31.0, 23.0, 18.0, 12.0, 12.0, 2.0, 5.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0008244514465332031, -0.0008032247424125671, -0.0007819980382919312, -0.0007607713341712952, -0.0007395446300506592, -0.0007183179259300232, -0.0006970912218093872, -0.0006758645176887512, -0.0006546378135681152, -0.0006334111094474792, -0.0006121844053268433, -0.0005909577012062073, -0.0005697309970855713, -0.0005485042929649353, -0.0005272775888442993, -0.0005060508847236633, -0.00048482418060302734, -0.00046359747648239136, -0.00044237077236175537, -0.0004211440682411194, -0.0003999173641204834, -0.0003786906599998474, -0.0003574639558792114, -0.00033623725175857544, -0.00031501054763793945, -0.00029378384351730347, -0.0002725571393966675, -0.0002513304352760315, -0.0002301037311553955, -0.00020887702703475952, -0.00018765032291412354, -0.00016642361879348755, -0.00014519691467285156, -0.00012397021055221558, -0.00010274350643157959, -8.15168023109436e-05, -6.029009819030762e-05, -3.906339406967163e-05, -1.7836689949035645e-05, 3.390014171600342e-06, 2.4616718292236328e-05, 4.5843422412872314e-05, 6.70701265335083e-05, 8.829683065414429e-05, 0.00010952353477478027, 0.00013075023889541626, 0.00015197694301605225, 0.00017320364713668823, 0.00019443035125732422, 0.0002156570553779602, 0.0002368837594985962, 0.0002581104636192322, 0.00027933716773986816, 0.00030056387186050415, 0.00032179057598114014, 0.0003430172801017761, 0.0003642439842224121, 0.0003854706883430481, 0.0004066973924636841, 0.00042792409658432007, 0.00044915080070495605, 0.00047037750482559204, 0.000491604208946228, 0.000512830913066864, 0.0005340576171875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 4.0, 5.0, 6.0, 4.0, 11.0, 22.0, 48.0, 81.0, 166.0, 447.0, 1284.0, 4679.0, 25142.0, 690337.0, 302818.0, 17742.0, 3872.0, 1121.0, 406.0, 157.0, 75.0, 45.0, 26.0, 10.0, 7.0, 9.0, 7.0, 5.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1591796875, -1.110687255859375, -1.06219482421875, -1.013702392578125, -0.9652099609375, -0.916717529296875, -0.86822509765625, -0.819732666015625, -0.771240234375, -0.722747802734375, -0.67425537109375, -0.625762939453125, -0.5772705078125, -0.528778076171875, -0.48028564453125, -0.431793212890625, -0.38330078125, -0.334808349609375, -0.28631591796875, -0.237823486328125, -0.1893310546875, -0.140838623046875, -0.09234619140625, -0.043853759765625, 0.004638671875, 0.053131103515625, 0.10162353515625, 0.150115966796875, 0.1986083984375, 0.247100830078125, 0.29559326171875, 0.344085693359375, 0.392578125, 0.441070556640625, 0.48956298828125, 0.538055419921875, 0.5865478515625, 0.635040283203125, 0.68353271484375, 0.732025146484375, 0.780517578125, 0.829010009765625, 0.87750244140625, 0.925994873046875, 0.9744873046875, 1.022979736328125, 1.07147216796875, 1.119964599609375, 1.16845703125, 1.216949462890625, 1.26544189453125, 1.313934326171875, 1.3624267578125, 1.410919189453125, 1.45941162109375, 1.507904052734375, 1.556396484375, 1.604888916015625, 1.65338134765625, 1.701873779296875, 1.7503662109375, 1.798858642578125, 1.84735107421875, 1.895843505859375, 1.9443359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 4.0, 15.0, 12.0, 28.0, 41.0, 64.0, 134.0, 277.0, 157.0, 87.0, 54.0, 32.0, 20.0, 13.0, 5.0, 6.0, 3.0, 4.0, 4.0, 5.0, 3.0, 1.0, 7.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65087890625, -0.6244277954101562, -0.5979766845703125, -0.5715255737304688, -0.545074462890625, -0.5186233520507812, -0.4921722412109375, -0.46572113037109375, -0.43927001953125, -0.41281890869140625, -0.3863677978515625, -0.35991668701171875, -0.333465576171875, -0.30701446533203125, -0.2805633544921875, -0.25411224365234375, -0.2276611328125, -0.20121002197265625, -0.1747589111328125, -0.14830780029296875, -0.121856689453125, -0.09540557861328125, -0.0689544677734375, -0.04250335693359375, -0.01605224609375, 0.01039886474609375, 0.0368499755859375, 0.06330108642578125, 0.089752197265625, 0.11620330810546875, 0.1426544189453125, 0.16910552978515625, 0.195556640625, 0.22200775146484375, 0.2484588623046875, 0.27490997314453125, 0.301361083984375, 0.32781219482421875, 0.3542633056640625, 0.38071441650390625, 0.40716552734375, 0.43361663818359375, 0.4600677490234375, 0.48651885986328125, 0.512969970703125, 0.5394210815429688, 0.5658721923828125, 0.5923233032226562, 0.6187744140625, 0.6452255249023438, 0.6716766357421875, 0.6981277465820312, 0.724578857421875, 0.7510299682617188, 0.7774810791015625, 0.8039321899414062, 0.83038330078125, 0.8568344116210938, 0.8832855224609375, 0.9097366333007812, 0.936187744140625, 0.9626388549804688, 0.9890899658203125, 1.0155410766601562, 1.0419921875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 51.0, 929.0, 32.0, 7.0], "bins": [-121.34996032714844, -119.36675262451172, -117.38353729248047, -115.40032958984375, -113.41712188720703, -111.43391418457031, -109.45069885253906, -107.46749114990234, -105.48428344726562, -103.5010757446289, -101.51786041259766, -99.53465270996094, -97.55144500732422, -95.5682373046875, -93.58502197265625, -91.60181427001953, -89.61859893798828, -87.63539123535156, -85.65217590332031, -83.6689682006836, -81.68576049804688, -79.70254516601562, -77.7193374633789, -75.73612976074219, -73.75291442871094, -71.76970672607422, -69.78649139404297, -67.80328369140625, -65.82007598876953, -63.83686447143555, -61.85365295410156, -59.870445251464844, -57.88724136352539, -55.904029846191406, -53.92082214355469, -51.9376106262207, -49.95439910888672, -47.97119140625, -45.987979888916016, -44.00476837158203, -42.02156066894531, -40.03834915161133, -38.05514144897461, -36.071929931640625, -34.088722229003906, -32.10551071166992, -30.122299194335938, -28.139089584350586, -26.155879974365234, -24.172670364379883, -22.18946075439453, -20.206249237060547, -18.223039627075195, -16.239830017089844, -14.256619453430176, -12.273408889770508, -10.29019832611084, -8.306987762451172, -6.32377815246582, -4.3405680656433105, -2.357357978820801, -0.3741483688354492, 1.6090621948242188, 3.5922727584838867, 5.575482368469238]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 10.0, 23.0, 44.0, 65.0, 77.0, 109.0, 121.0, 132.0, 128.0, 100.0, 82.0, 46.0, 29.0, 24.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-14.445422172546387, -14.167328834533691, -13.889235496520996, -13.611141204833984, -13.333047866821289, -13.054954528808594, -12.776861190795898, -12.498767852783203, -12.220673561096191, -11.942580223083496, -11.6644868850708, -11.386392593383789, -11.108299255371094, -10.830205917358398, -10.552112579345703, -10.274019241333008, -9.995925903320312, -9.717832565307617, -9.439739227294922, -9.16164493560791, -8.883551597595215, -8.60545825958252, -8.327364921569824, -8.049270629882812, -7.771177291870117, -7.493083953857422, -7.214990139007568, -6.936896800994873, -6.6588029861450195, -6.380709648132324, -6.102616310119629, -5.824522495269775, -5.546428680419922, -5.268335342407227, -4.990241527557373, -4.712148189544678, -4.434054374694824, -4.155961036682129, -3.8778674602508545, -3.59977388381958, -3.3216803073883057, -3.0435867309570312, -2.765493154525757, -2.4873995780944824, -2.209306240081787, -1.9312125444412231, -1.6531190872192383, -1.3750255107879639, -1.0969319343566895, -0.818838357925415, -0.5407448410987854, -0.26265132427215576, 0.015442252159118652, 0.29353582859039307, 0.5716292858123779, 0.8497228622436523, 1.1278164386749268, 1.4059100151062012, 1.6840035915374756, 1.9620970487594604, 2.2401905059814453, 2.518284320831299, 2.796377658843994, 3.0744712352752686, 3.352564811706543]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 10.0, 11.0, 12.0, 28.0, 39.0, 44.0, 100.0, 141.0, 357.0, 2312.0, 4190913.0, 251.0, 62.0, 12.0, 3.0], "bins": [-34.4375, -33.85693359375, -33.2763671875, -32.69580078125, -32.115234375, -31.53466796875, -30.9541015625, -30.37353515625, -29.79296875, -29.21240234375, -28.6318359375, -28.05126953125, -27.470703125, -26.89013671875, -26.3095703125, -25.72900390625, -25.1484375, -24.56787109375, -23.9873046875, -23.40673828125, -22.826171875, -22.24560546875, -21.6650390625, -21.08447265625, -20.50390625, -19.92333984375, -19.3427734375, -18.76220703125, -18.181640625, -17.60107421875, -17.0205078125, -16.43994140625, -15.859375, -15.27880859375, -14.6982421875, -14.11767578125, -13.537109375, -12.95654296875, -12.3759765625, -11.79541015625, -11.21484375, -10.63427734375, -10.0537109375, -9.47314453125, -8.892578125, -8.31201171875, -7.7314453125, -7.15087890625, -6.5703125, -5.98974609375, -5.4091796875, -4.82861328125, -4.248046875, -3.66748046875, -3.0869140625, -2.50634765625, -1.92578125, -1.34521484375, -0.7646484375, -0.18408203125, 0.396484375, 0.97705078125, 1.5576171875, 2.13818359375, 2.71875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 16.0, 74.0, 247.0, 383.0, 215.0, 67.0, 13.0, 3.0], "bins": [-0.99462890625, -0.977874755859375, -0.96112060546875, -0.944366455078125, -0.9276123046875, -0.910858154296875, -0.89410400390625, -0.877349853515625, -0.860595703125, -0.843841552734375, -0.82708740234375, -0.810333251953125, -0.7935791015625, -0.776824951171875, -0.76007080078125, -0.743316650390625, -0.7265625, -0.709808349609375, -0.69305419921875, -0.676300048828125, -0.6595458984375, -0.642791748046875, -0.62603759765625, -0.609283447265625, -0.592529296875, -0.575775146484375, -0.55902099609375, -0.542266845703125, -0.5255126953125, -0.508758544921875, -0.49200439453125, -0.475250244140625, -0.45849609375, -0.441741943359375, -0.42498779296875, -0.408233642578125, -0.3914794921875, -0.374725341796875, -0.35797119140625, -0.341217041015625, -0.324462890625, -0.307708740234375, -0.29095458984375, -0.274200439453125, -0.2574462890625, -0.240692138671875, -0.22393798828125, -0.207183837890625, -0.1904296875, -0.173675537109375, -0.15692138671875, -0.140167236328125, -0.1234130859375, -0.106658935546875, -0.08990478515625, -0.073150634765625, -0.056396484375, -0.039642333984375, -0.02288818359375, -0.006134033203125, 0.0106201171875, 0.027374267578125, 0.04412841796875, 0.060882568359375, 0.07763671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 11.0, 21.0, 41.0, 45.0, 80.0, 126.0, 231.0, 675.0, 22648.0, 4167945.0, 1879.0, 331.0, 117.0, 61.0, 28.0, 25.0, 8.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.3125, -20.87042236328125, -20.4283447265625, -19.98626708984375, -19.544189453125, -19.10211181640625, -18.6600341796875, -18.21795654296875, -17.77587890625, -17.33380126953125, -16.8917236328125, -16.44964599609375, -16.007568359375, -15.56549072265625, -15.1234130859375, -14.68133544921875, -14.2392578125, -13.79718017578125, -13.3551025390625, -12.91302490234375, -12.470947265625, -12.02886962890625, -11.5867919921875, -11.14471435546875, -10.70263671875, -10.26055908203125, -9.8184814453125, -9.37640380859375, -8.934326171875, -8.49224853515625, -8.0501708984375, -7.60809326171875, -7.166015625, -6.72393798828125, -6.2818603515625, -5.83978271484375, -5.397705078125, -4.95562744140625, -4.5135498046875, -4.07147216796875, -3.62939453125, -3.18731689453125, -2.7452392578125, -2.30316162109375, -1.861083984375, -1.41900634765625, -0.9769287109375, -0.53485107421875, -0.0927734375, 0.34930419921875, 0.7913818359375, 1.23345947265625, 1.675537109375, 2.11761474609375, 2.5596923828125, 3.00177001953125, 3.44384765625, 3.88592529296875, 4.3280029296875, 4.77008056640625, 5.212158203125, 5.65423583984375, 6.0963134765625, 6.53839111328125, 6.98046875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 32.0, 2979.0, 949.0, 88.0, 22.0, 8.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.990234375, -2.9237060546875, -2.857177734375, -2.7906494140625, -2.72412109375, -2.6575927734375, -2.591064453125, -2.5245361328125, -2.4580078125, -2.3914794921875, -2.324951171875, -2.2584228515625, -2.19189453125, -2.1253662109375, -2.058837890625, -1.9923095703125, -1.92578125, -1.8592529296875, -1.792724609375, -1.7261962890625, -1.65966796875, -1.5931396484375, -1.526611328125, -1.4600830078125, -1.3935546875, -1.3270263671875, -1.260498046875, -1.1939697265625, -1.12744140625, -1.0609130859375, -0.994384765625, -0.9278564453125, -0.861328125, -0.7947998046875, -0.728271484375, -0.6617431640625, -0.59521484375, -0.5286865234375, -0.462158203125, -0.3956298828125, -0.3291015625, -0.2625732421875, -0.196044921875, -0.1295166015625, -0.06298828125, 0.0035400390625, 0.070068359375, 0.1365966796875, 0.203125, 0.2696533203125, 0.336181640625, 0.4027099609375, 0.46923828125, 0.5357666015625, 0.602294921875, 0.6688232421875, 0.7353515625, 0.8018798828125, 0.868408203125, 0.9349365234375, 1.00146484375, 1.0679931640625, 1.134521484375, 1.2010498046875, 1.267578125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 10.0, 77.0, 525.0, 320.0, 42.0, 22.0, 6.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-22.40868377685547, -21.999893188476562, -21.591102600097656, -21.18231201171875, -20.773521423339844, -20.364730834960938, -19.95594024658203, -19.547149658203125, -19.138357162475586, -18.72956657409668, -18.320775985717773, -17.911985397338867, -17.50319480895996, -17.094404220581055, -16.685611724853516, -16.27682113647461, -15.868032455444336, -15.45924186706543, -15.050451278686523, -14.641660690307617, -14.232869148254395, -13.824078559875488, -13.415287971496582, -13.006497383117676, -12.597705841064453, -12.188915252685547, -11.78012466430664, -11.371334075927734, -10.962542533874512, -10.553751945495605, -10.1449613571167, -9.736170768737793, -9.32737922668457, -8.918588638305664, -8.509798049926758, -8.101007461547852, -7.692216396331787, -7.283425331115723, -6.874634742736816, -6.46584415435791, -6.057053565979004, -5.648262977600098, -5.239471912384033, -4.830681324005127, -4.421890735626221, -4.013099670410156, -3.60430908203125, -3.1955184936523438, -2.7867279052734375, -2.377937078475952, -1.969146490097046, -1.5603556632995605, -1.1515649557113647, -0.742774248123169, -0.3339834213256836, 0.07480716705322266, 0.483597993850708, 0.8923887014389038, 1.3011794090270996, 1.709970235824585, 2.1187610626220703, 2.5275516510009766, 2.936342477798462, 3.345133066177368, 3.7539238929748535]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 12.0, 17.0, 44.0, 72.0, 103.0, 149.0, 152.0, 148.0, 115.0, 82.0, 51.0, 23.0, 21.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.61284065246582, -9.29484748840332, -8.97685432434082, -8.65886116027832, -8.34086799621582, -8.02287483215332, -7.704881191253662, -7.386888027191162, -7.068894863128662, -6.750901699066162, -6.432908535003662, -6.114915370941162, -5.796921730041504, -5.478928565979004, -5.160935401916504, -4.842942237854004, -4.524949073791504, -4.206955909729004, -3.888962745666504, -3.570969343185425, -3.252976179122925, -2.934983015060425, -2.6169896125793457, -2.2989964485168457, -1.9810032844543457, -1.6630101203918457, -1.3450168371200562, -1.0270235538482666, -0.7090303897857666, -0.3910372257232666, -0.07304394245147705, 0.2449493408203125, 0.5629415512084961, 0.8809347748756409, 1.1989279985427856, 1.5169212818145752, 1.8349144458770752, 2.152907609939575, 2.4709010124206543, 2.7888941764831543, 3.1068873405456543, 3.4248805046081543, 3.7428736686706543, 4.060866832733154, 4.3788604736328125, 4.6968536376953125, 5.0148468017578125, 5.3328399658203125, 5.6508331298828125, 5.9688262939453125, 6.2868194580078125, 6.6048126220703125, 6.9228057861328125, 7.2407989501953125, 7.558792591094971, 7.876785755157471, 8.194778442382812, 8.512771606445312, 8.830764770507812, 9.148757934570312, 9.466751098632812, 9.784744262695312, 10.102737426757812, 10.420730590820312, 10.738724708557129]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 4.0, 7.0, 3.0, 2.0, 10.0, 16.0, 15.0, 22.0, 26.0, 46.0, 61.0, 105.0, 185.0, 570.0, 2640.0, 54527.0, 971174.0, 16665.0, 1605.0, 419.0, 179.0, 83.0, 51.0, 38.0, 28.0, 16.0, 12.0, 13.0, 9.0, 5.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.37109375, -5.205078125, -5.0390625, -4.873046875, -4.70703125, -4.541015625, -4.375, -4.208984375, -4.04296875, -3.876953125, -3.7109375, -3.544921875, -3.37890625, -3.212890625, -3.046875, -2.880859375, -2.71484375, -2.548828125, -2.3828125, -2.216796875, -2.05078125, -1.884765625, -1.71875, -1.552734375, -1.38671875, -1.220703125, -1.0546875, -0.888671875, -0.72265625, -0.556640625, -0.390625, -0.224609375, -0.05859375, 0.107421875, 0.2734375, 0.439453125, 0.60546875, 0.771484375, 0.9375, 1.103515625, 1.26953125, 1.435546875, 1.6015625, 1.767578125, 1.93359375, 2.099609375, 2.265625, 2.431640625, 2.59765625, 2.763671875, 2.9296875, 3.095703125, 3.26171875, 3.427734375, 3.59375, 3.759765625, 3.92578125, 4.091796875, 4.2578125, 4.423828125, 4.58984375, 4.755859375, 4.921875, 5.087890625, 5.25390625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 23.0, 48.0, 116.0, 176.0, 230.0, 209.0, 116.0, 50.0, 23.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2392578125, -1.2136955261230469, -1.1881332397460938, -1.1625709533691406, -1.1370086669921875, -1.1114463806152344, -1.0858840942382812, -1.0603218078613281, -1.034759521484375, -1.0091972351074219, -0.9836349487304688, -0.9580726623535156, -0.9325103759765625, -0.9069480895996094, -0.8813858032226562, -0.8558235168457031, -0.83026123046875, -0.8046989440917969, -0.7791366577148438, -0.7535743713378906, -0.7280120849609375, -0.7024497985839844, -0.6768875122070312, -0.6513252258300781, -0.625762939453125, -0.6002006530761719, -0.5746383666992188, -0.5490760803222656, -0.5235137939453125, -0.4979515075683594, -0.47238922119140625, -0.4468269348144531, -0.4212646484375, -0.3957023620605469, -0.37014007568359375, -0.3445777893066406, -0.3190155029296875, -0.2934532165527344, -0.26789093017578125, -0.24232864379882812, -0.216766357421875, -0.19120407104492188, -0.16564178466796875, -0.14007949829101562, -0.1145172119140625, -0.08895492553710938, -0.06339263916015625, -0.037830352783203125, -0.01226806640625, 0.013294219970703125, 0.03885650634765625, 0.06441879272460938, 0.0899810791015625, 0.11554336547851562, 0.14110565185546875, 0.16666793823242188, 0.192230224609375, 0.21779251098632812, 0.24335479736328125, 0.2689170837402344, 0.2944793701171875, 0.3200416564941406, 0.34560394287109375, 0.3711662292480469, 0.396728515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 17.0, 14.0, 17.0, 15.0, 30.0, 57.0, 80.0, 232.0, 632.0, 3074.0, 40184.0, 910688.0, 87258.0, 4907.0, 815.0, 259.0, 101.0, 54.0, 17.0, 25.0, 17.0, 13.0, 11.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.544921875, -2.458984375, -2.373046875, -2.287109375, -2.201171875, -2.115234375, -2.029296875, -1.943359375, -1.857421875, -1.771484375, -1.685546875, -1.599609375, -1.513671875, -1.427734375, -1.341796875, -1.255859375, -1.169921875, -1.083984375, -0.998046875, -0.912109375, -0.826171875, -0.740234375, -0.654296875, -0.568359375, -0.482421875, -0.396484375, -0.310546875, -0.224609375, -0.138671875, -0.052734375, 0.033203125, 0.119140625, 0.205078125, 0.291015625, 0.376953125, 0.462890625, 0.548828125, 0.634765625, 0.720703125, 0.806640625, 0.892578125, 0.978515625, 1.064453125, 1.150390625, 1.236328125, 1.322265625, 1.408203125, 1.494140625, 1.580078125, 1.666015625, 1.751953125, 1.837890625, 1.923828125, 2.009765625, 2.095703125, 2.181640625, 2.267578125, 2.353515625, 2.439453125, 2.525390625, 2.611328125, 2.697265625, 2.783203125, 2.869140625, 2.955078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 4.0, 9.0, 9.0, 15.0, 16.0, 21.0, 23.0, 36.0, 31.0, 43.0, 42.0, 53.0, 64.0, 79.0, 73.0, 67.0, 71.0, 61.0, 52.0, 50.0, 37.0, 32.0, 24.0, 21.0, 16.0, 9.0, 13.0, 8.0, 6.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2353515625, -1.19635009765625, -1.1573486328125, -1.11834716796875, -1.079345703125, -1.04034423828125, -1.0013427734375, -0.96234130859375, -0.92333984375, -0.88433837890625, -0.8453369140625, -0.80633544921875, -0.767333984375, -0.72833251953125, -0.6893310546875, -0.65032958984375, -0.611328125, -0.57232666015625, -0.5333251953125, -0.49432373046875, -0.455322265625, -0.41632080078125, -0.3773193359375, -0.33831787109375, -0.29931640625, -0.26031494140625, -0.2213134765625, -0.18231201171875, -0.143310546875, -0.10430908203125, -0.0653076171875, -0.02630615234375, 0.0126953125, 0.05169677734375, 0.0906982421875, 0.12969970703125, 0.168701171875, 0.20770263671875, 0.2467041015625, 0.28570556640625, 0.32470703125, 0.36370849609375, 0.4027099609375, 0.44171142578125, 0.480712890625, 0.51971435546875, 0.5587158203125, 0.59771728515625, 0.63671875, 0.67572021484375, 0.7147216796875, 0.75372314453125, 0.792724609375, 0.83172607421875, 0.8707275390625, 0.90972900390625, 0.94873046875, 0.98773193359375, 1.0267333984375, 1.06573486328125, 1.104736328125, 1.14373779296875, 1.1827392578125, 1.22174072265625, 1.2607421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 12.0, 20.0, 24.0, 48.0, 86.0, 180.0, 373.0, 1053.0, 4308.0, 46893.0, 857943.0, 127333.0, 7764.0, 1549.0, 522.0, 204.0, 109.0, 51.0, 32.0, 16.0, 9.0, 8.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3251953125, -1.2858123779296875, -1.246429443359375, -1.2070465087890625, -1.16766357421875, -1.1282806396484375, -1.088897705078125, -1.0495147705078125, -1.0101318359375, -0.9707489013671875, -0.931365966796875, -0.8919830322265625, -0.85260009765625, -0.8132171630859375, -0.773834228515625, -0.7344512939453125, -0.695068359375, -0.6556854248046875, -0.616302490234375, -0.5769195556640625, -0.53753662109375, -0.4981536865234375, -0.458770751953125, -0.4193878173828125, -0.3800048828125, -0.3406219482421875, -0.301239013671875, -0.2618560791015625, -0.22247314453125, -0.1830902099609375, -0.143707275390625, -0.1043243408203125, -0.06494140625, -0.0255584716796875, 0.013824462890625, 0.0532073974609375, 0.09259033203125, 0.1319732666015625, 0.171356201171875, 0.2107391357421875, 0.2501220703125, 0.2895050048828125, 0.328887939453125, 0.3682708740234375, 0.40765380859375, 0.4470367431640625, 0.486419677734375, 0.5258026123046875, 0.565185546875, 0.6045684814453125, 0.643951416015625, 0.6833343505859375, 0.72271728515625, 0.7621002197265625, 0.801483154296875, 0.8408660888671875, 0.8802490234375, 0.9196319580078125, 0.959014892578125, 0.9983978271484375, 1.03778076171875, 1.0771636962890625, 1.116546630859375, 1.1559295654296875, 1.1953125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 1.0, 6.0, 10.0, 6.0, 9.0, 10.0, 13.0, 14.0, 13.0, 19.0, 27.0, 30.0, 43.0, 54.0, 88.0, 163.0, 132.0, 89.0, 46.0, 23.0, 33.0, 24.0, 19.0, 15.0, 19.0, 14.0, 15.0, 14.0, 4.0, 8.0, 3.0, 4.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0004858970642089844, -0.00047066062688827515, -0.0004554241895675659, -0.0004401877522468567, -0.00042495131492614746, -0.00040971487760543823, -0.000394478440284729, -0.0003792420029640198, -0.00036400556564331055, -0.0003487691283226013, -0.0003335326910018921, -0.00031829625368118286, -0.00030305981636047363, -0.0002878233790397644, -0.0002725869417190552, -0.00025735050439834595, -0.00024211406707763672, -0.0002268776297569275, -0.00021164119243621826, -0.00019640475511550903, -0.0001811683177947998, -0.00016593188047409058, -0.00015069544315338135, -0.00013545900583267212, -0.00012022256851196289, -0.00010498613119125366, -8.974969387054443e-05, -7.45132565498352e-05, -5.9276819229125977e-05, -4.404038190841675e-05, -2.880394458770752e-05, -1.3567507266998291e-05, 1.6689300537109375e-06, 1.6905367374420166e-05, 3.2141804695129395e-05, 4.737824201583862e-05, 6.261467933654785e-05, 7.785111665725708e-05, 9.308755397796631e-05, 0.00010832399129867554, 0.00012356042861938477, 0.000138796865940094, 0.00015403330326080322, 0.00016926974058151245, 0.00018450617790222168, 0.0001997426152229309, 0.00021497905254364014, 0.00023021548986434937, 0.0002454519271850586, 0.0002606883645057678, 0.00027592480182647705, 0.0002911612391471863, 0.0003063976764678955, 0.00032163411378860474, 0.00033687055110931396, 0.0003521069884300232, 0.0003673434257507324, 0.00038257986307144165, 0.0003978163003921509, 0.0004130527377128601, 0.00042828917503356934, 0.00044352561235427856, 0.0004587620496749878, 0.000473998486995697, 0.0004892349243164062]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 15.0, 21.0, 38.0, 81.0, 249.0, 760.0, 2866.0, 24839.0, 865952.0, 144979.0, 6822.0, 1289.0, 377.0, 131.0, 61.0, 31.0, 16.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.203125, -2.1490478515625, -2.094970703125, -2.0408935546875, -1.98681640625, -1.9327392578125, -1.878662109375, -1.8245849609375, -1.7705078125, -1.7164306640625, -1.662353515625, -1.6082763671875, -1.55419921875, -1.5001220703125, -1.446044921875, -1.3919677734375, -1.337890625, -1.2838134765625, -1.229736328125, -1.1756591796875, -1.12158203125, -1.0675048828125, -1.013427734375, -0.9593505859375, -0.9052734375, -0.8511962890625, -0.797119140625, -0.7430419921875, -0.68896484375, -0.6348876953125, -0.580810546875, -0.5267333984375, -0.47265625, -0.4185791015625, -0.364501953125, -0.3104248046875, -0.25634765625, -0.2022705078125, -0.148193359375, -0.0941162109375, -0.0400390625, 0.0140380859375, 0.068115234375, 0.1221923828125, 0.17626953125, 0.2303466796875, 0.284423828125, 0.3385009765625, 0.392578125, 0.4466552734375, 0.500732421875, 0.5548095703125, 0.60888671875, 0.6629638671875, 0.717041015625, 0.7711181640625, 0.8251953125, 0.8792724609375, 0.933349609375, 0.9874267578125, 1.04150390625, 1.0955810546875, 1.149658203125, 1.2037353515625, 1.2578125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 11.0, 22.0, 35.0, 51.0, 77.0, 130.0, 202.0, 167.0, 114.0, 61.0, 48.0, 29.0, 21.0, 10.0, 7.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03125, -1.0053787231445312, -0.9795074462890625, -0.9536361694335938, -0.927764892578125, -0.9018936157226562, -0.8760223388671875, -0.8501510620117188, -0.82427978515625, -0.7984085083007812, -0.7725372314453125, -0.7466659545898438, -0.720794677734375, -0.6949234008789062, -0.6690521240234375, -0.6431808471679688, -0.6173095703125, -0.5914382934570312, -0.5655670166015625, -0.5396957397460938, -0.513824462890625, -0.48795318603515625, -0.4620819091796875, -0.43621063232421875, -0.41033935546875, -0.38446807861328125, -0.3585968017578125, -0.33272552490234375, -0.306854248046875, -0.28098297119140625, -0.2551116943359375, -0.22924041748046875, -0.203369140625, -0.17749786376953125, -0.1516265869140625, -0.12575531005859375, -0.099884033203125, -0.07401275634765625, -0.0481414794921875, -0.02227020263671875, 0.00360107421875, 0.02947235107421875, 0.0553436279296875, 0.08121490478515625, 0.107086181640625, 0.13295745849609375, 0.1588287353515625, 0.18470001220703125, 0.2105712890625, 0.23644256591796875, 0.2623138427734375, 0.28818511962890625, 0.314056396484375, 0.33992767333984375, 0.3657989501953125, 0.39167022705078125, 0.41754150390625, 0.44341278076171875, 0.4692840576171875, 0.49515533447265625, 0.521026611328125, 0.5468978881835938, 0.5727691650390625, 0.5986404418945312, 0.62451171875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 26.0, 99.0, 391.0, 357.0, 92.0, 24.0, 11.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.354442596435547, -19.86855125427246, -19.382659912109375, -18.89676856994629, -18.410877227783203, -17.924985885620117, -17.43909454345703, -16.953205108642578, -16.46731185913086, -15.981420516967773, -15.495529174804688, -15.009637832641602, -14.523746490478516, -14.03785514831543, -13.55196475982666, -13.066073417663574, -12.580183029174805, -12.094291687011719, -11.608400344848633, -11.122509002685547, -10.636617660522461, -10.150726318359375, -9.664835929870605, -9.17894458770752, -8.693053245544434, -8.207161903381348, -7.721270561218262, -7.235379695892334, -6.749488353729248, -6.263597011566162, -5.777706146240234, -5.291814804077148, -4.8059234619140625, -4.320032119750977, -3.8341410160064697, -3.348249912261963, -2.862358570098877, -2.376467227935791, -1.8905761241912842, -1.4046850204467773, -0.9187936782836914, -0.432902455329895, 0.05298876762390137, 0.5388799905776978, 1.0247712135314941, 1.51066255569458, 1.996553659439087, 2.4824447631835938, 2.9683361053466797, 3.4542274475097656, 3.9401185512542725, 4.426009654998779, 4.911900997161865, 5.397792339324951, 5.883683204650879, 6.369574546813965, 6.855465888977051, 7.341357231140137, 7.827248573303223, 8.313139915466309, 8.799030303955078, 9.284921646118164, 9.77081298828125, 10.256704330444336, 10.742595672607422]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 6.0, 18.0, 13.0, 13.0, 25.0, 29.0, 38.0, 52.0, 65.0, 63.0, 58.0, 70.0, 54.0, 59.0, 62.0, 60.0, 57.0, 53.0, 46.0, 35.0, 28.0, 26.0, 22.0, 18.0, 9.0, 7.0, 6.0, 1.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9454803466796875, -6.694910526275635, -6.444340705871582, -6.1937713623046875, -5.943201541900635, -5.692631721496582, -5.442061901092529, -5.191492080688477, -4.940922737121582, -4.690352916717529, -4.439783096313477, -4.189213752746582, -3.9386439323425293, -3.6880741119384766, -3.437504291534424, -3.186934471130371, -2.9363646507263184, -2.6857948303222656, -2.435225248336792, -2.1846554279327393, -1.934085726737976, -1.683516025543213, -1.4329462051391602, -1.182376503944397, -0.9318068027496338, -0.6812371015548706, -0.43066734075546265, -0.1800975799560547, 0.0704721212387085, 0.3210418224334717, 0.5716116428375244, 0.8221813440322876, 1.0727510452270508, 1.323320746421814, 1.5738904476165771, 1.8244602680206299, 2.0750298500061035, 2.3255996704101562, 2.576169490814209, 2.8267393112182617, 3.0773088932037354, 3.327878713607788, 3.5784482955932617, 3.8290181159973145, 4.079587936401367, 4.330157279968262, 4.580727577209473, 4.831296920776367, 5.08186674118042, 5.332436561584473, 5.583006381988525, 5.833576202392578, 6.084145545959473, 6.334715366363525, 6.585285186767578, 6.835855007171631, 7.086424827575684, 7.336994647979736, 7.587564468383789, 7.838133811950684, 8.088704109191895, 8.339273452758789, 8.58984375, 8.840413093566895, 9.090982437133789]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 6.0, 5.0, 6.0, 17.0, 17.0, 23.0, 16.0, 22.0, 33.0, 25.0, 44.0, 53.0, 67.0, 123.0, 192.0, 428.0, 1353.0, 12059.0, 4001603.0, 172674.0, 4670.0, 618.0, 152.0, 54.0, 18.0, 7.0, 3.0, 0.0, 0.0, 2.0], "bins": [-11.2890625, -11.0753173828125, -10.861572265625, -10.6478271484375, -10.43408203125, -10.2203369140625, -10.006591796875, -9.7928466796875, -9.5791015625, -9.3653564453125, -9.151611328125, -8.9378662109375, -8.72412109375, -8.5103759765625, -8.296630859375, -8.0828857421875, -7.869140625, -7.6553955078125, -7.441650390625, -7.2279052734375, -7.01416015625, -6.8004150390625, -6.586669921875, -6.3729248046875, -6.1591796875, -5.9454345703125, -5.731689453125, -5.5179443359375, -5.30419921875, -5.0904541015625, -4.876708984375, -4.6629638671875, -4.44921875, -4.2354736328125, -4.021728515625, -3.8079833984375, -3.59423828125, -3.3804931640625, -3.166748046875, -2.9530029296875, -2.7392578125, -2.5255126953125, -2.311767578125, -2.0980224609375, -1.88427734375, -1.6705322265625, -1.456787109375, -1.2430419921875, -1.029296875, -0.8155517578125, -0.601806640625, -0.3880615234375, -0.17431640625, 0.0394287109375, 0.253173828125, 0.4669189453125, 0.6806640625, 0.8944091796875, 1.108154296875, 1.3218994140625, 1.53564453125, 1.7493896484375, 1.963134765625, 2.1768798828125, 2.390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 12.0, 26.0, 63.0, 98.0, 187.0, 194.0, 182.0, 113.0, 71.0, 25.0, 21.0, 12.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.2275390625, -1.2041969299316406, -1.1808547973632812, -1.1575126647949219, -1.1341705322265625, -1.1108283996582031, -1.0874862670898438, -1.0641441345214844, -1.040802001953125, -1.0174598693847656, -0.9941177368164062, -0.9707756042480469, -0.9474334716796875, -0.9240913391113281, -0.9007492065429688, -0.8774070739746094, -0.85406494140625, -0.8307228088378906, -0.8073806762695312, -0.7840385437011719, -0.7606964111328125, -0.7373542785644531, -0.7140121459960938, -0.6906700134277344, -0.667327880859375, -0.6439857482910156, -0.6206436157226562, -0.5973014831542969, -0.5739593505859375, -0.5506172180175781, -0.5272750854492188, -0.5039329528808594, -0.4805908203125, -0.4572486877441406, -0.43390655517578125, -0.4105644226074219, -0.3872222900390625, -0.3638801574707031, -0.34053802490234375, -0.3171958923339844, -0.293853759765625, -0.2705116271972656, -0.24716949462890625, -0.22382736206054688, -0.2004852294921875, -0.17714309692382812, -0.15380096435546875, -0.13045883178710938, -0.10711669921875, -0.08377456665039062, -0.06043243408203125, -0.037090301513671875, -0.0137481689453125, 0.009593963623046875, 0.03293609619140625, 0.056278228759765625, 0.079620361328125, 0.10296249389648438, 0.12630462646484375, 0.14964675903320312, 0.1729888916015625, 0.19633102416992188, 0.21967315673828125, 0.24301528930664062, 0.266357421875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 3.0, 8.0, 10.0, 14.0, 32.0, 46.0, 92.0, 150.0, 401.0, 2776.0, 4188023.0, 2273.0, 262.0, 87.0, 49.0, 38.0, 17.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.15625, -33.466552734375, -32.77685546875, -32.087158203125, -31.3974609375, -30.707763671875, -30.01806640625, -29.328369140625, -28.638671875, -27.948974609375, -27.25927734375, -26.569580078125, -25.8798828125, -25.190185546875, -24.50048828125, -23.810791015625, -23.12109375, -22.431396484375, -21.74169921875, -21.052001953125, -20.3623046875, -19.672607421875, -18.98291015625, -18.293212890625, -17.603515625, -16.913818359375, -16.22412109375, -15.534423828125, -14.8447265625, -14.155029296875, -13.46533203125, -12.775634765625, -12.0859375, -11.396240234375, -10.70654296875, -10.016845703125, -9.3271484375, -8.637451171875, -7.94775390625, -7.258056640625, -6.568359375, -5.878662109375, -5.18896484375, -4.499267578125, -3.8095703125, -3.119873046875, -2.43017578125, -1.740478515625, -1.05078125, -0.361083984375, 0.32861328125, 1.018310546875, 1.7080078125, 2.397705078125, 3.08740234375, 3.777099609375, 4.466796875, 5.156494140625, 5.84619140625, 6.535888671875, 7.2255859375, 7.915283203125, 8.60498046875, 9.294677734375, 9.984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 9.0, 19.0, 102.0, 3427.0, 453.0, 44.0, 16.0, 8.0, 6.0], "bins": [-4.68359375, -4.6039276123046875, -4.524261474609375, -4.4445953369140625, -4.36492919921875, -4.2852630615234375, -4.205596923828125, -4.1259307861328125, -4.0462646484375, -3.9665985107421875, -3.886932373046875, -3.8072662353515625, -3.72760009765625, -3.6479339599609375, -3.568267822265625, -3.4886016845703125, -3.408935546875, -3.3292694091796875, -3.249603271484375, -3.1699371337890625, -3.09027099609375, -3.0106048583984375, -2.930938720703125, -2.8512725830078125, -2.7716064453125, -2.6919403076171875, -2.612274169921875, -2.5326080322265625, -2.45294189453125, -2.3732757568359375, -2.293609619140625, -2.2139434814453125, -2.13427734375, -2.0546112060546875, -1.974945068359375, -1.8952789306640625, -1.81561279296875, -1.7359466552734375, -1.656280517578125, -1.5766143798828125, -1.4969482421875, -1.4172821044921875, -1.337615966796875, -1.2579498291015625, -1.17828369140625, -1.0986175537109375, -1.018951416015625, -0.9392852783203125, -0.859619140625, -0.7799530029296875, -0.700286865234375, -0.6206207275390625, -0.54095458984375, -0.4612884521484375, -0.381622314453125, -0.3019561767578125, -0.2222900390625, -0.1426239013671875, -0.062957763671875, 0.0167083740234375, 0.09637451171875, 0.1760406494140625, 0.255706787109375, 0.3353729248046875, 0.4150390625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 10.0, 9.0, 22.0, 55.0, 179.0, 476.0, 183.0, 45.0, 8.0, 8.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.767427444458008, -15.442994117736816, -15.118560791015625, -14.794127464294434, -14.469694137573242, -14.145259857177734, -13.820826530456543, -13.496393203735352, -13.17195987701416, -12.847526550292969, -12.523093223571777, -12.198659896850586, -11.874225616455078, -11.549792289733887, -11.225358963012695, -10.900925636291504, -10.576492309570312, -10.252058982849121, -9.92762565612793, -9.603192329406738, -9.278759002685547, -8.954324722290039, -8.629891395568848, -8.305458068847656, -7.981024742126465, -7.656591415405273, -7.332158088684082, -7.007724285125732, -6.683290958404541, -6.35885763168335, -6.034423828125, -5.709990501403809, -5.385556221008301, -5.061122894287109, -4.736689567565918, -4.412255764007568, -4.087822437286377, -3.7633891105651855, -3.438955545425415, -3.1145219802856445, -2.790088653564453, -2.4656553268432617, -2.141221761703491, -1.8167883157730103, -1.4923548698425293, -1.1679214239120483, -0.8434879779815674, -0.5190544128417969, -0.19462108612060547, 0.1298123598098755, 0.45424580574035645, 0.7786792516708374, 1.1031126976013184, 1.4275461435317993, 1.7519795894622803, 2.076413154602051, 2.400846481323242, 2.7252798080444336, 3.049713373184204, 3.3741469383239746, 3.698580265045166, 4.023013591766357, 4.347447395324707, 4.671880722045898, 4.99631404876709]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 2.0, 10.0, 19.0, 35.0, 49.0, 68.0, 93.0, 121.0, 131.0, 118.0, 90.0, 106.0, 64.0, 40.0, 23.0, 14.0, 8.0, 8.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.52816390991211, -10.221487998962402, -9.914811134338379, -9.608135223388672, -9.301459312438965, -8.994783401489258, -8.688106536865234, -8.381430625915527, -8.07475471496582, -7.768078327178955, -7.461402416229248, -7.154726028442383, -6.848050117492676, -6.5413737297058105, -6.234697341918945, -5.928021430969238, -5.621345043182373, -5.314668655395508, -5.007992744445801, -4.7013163566589355, -4.3946404457092285, -4.087964057922363, -3.781287908554077, -3.474611759185791, -3.167935609817505, -2.8612594604492188, -2.5545833110809326, -2.2479071617126465, -1.9412308931350708, -1.6345547437667847, -1.327878475189209, -1.0212023258209229, -0.7145261764526367, -0.4078499972820282, -0.10117381811141968, 0.20550239086151123, 0.5121785402297974, 0.8188546895980835, 1.1255309581756592, 1.4322071075439453, 1.7388832569122314, 2.0455594062805176, 2.3522355556488037, 2.65891170501709, 2.965588092803955, 3.272264003753662, 3.5789403915405273, 3.8856165409088135, 4.1922926902771, 4.498969078063965, 4.805644989013672, 5.112321376800537, 5.418997287750244, 5.725673675537109, 6.032349586486816, 6.339025974273682, 6.645702362060547, 6.952378749847412, 7.259054660797119, 7.565731048583984, 7.872406959533691, 8.179082870483398, 8.485759735107422, 8.792435646057129, 9.099111557006836]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 4.0, 5.0, 8.0, 14.0, 17.0, 15.0, 20.0, 41.0, 45.0, 75.0, 91.0, 135.0, 237.0, 389.0, 839.0, 2351.0, 9018.0, 63009.0, 795173.0, 154951.0, 16090.0, 3551.0, 1163.0, 463.0, 276.0, 174.0, 106.0, 63.0, 56.0, 42.0, 22.0, 28.0, 18.0, 16.0, 13.0, 4.0, 7.0, 5.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.748046875, -3.642974853515625, -3.53790283203125, -3.432830810546875, -3.3277587890625, -3.222686767578125, -3.11761474609375, -3.012542724609375, -2.907470703125, -2.802398681640625, -2.69732666015625, -2.592254638671875, -2.4871826171875, -2.382110595703125, -2.27703857421875, -2.171966552734375, -2.06689453125, -1.961822509765625, -1.85675048828125, -1.751678466796875, -1.6466064453125, -1.541534423828125, -1.43646240234375, -1.331390380859375, -1.226318359375, -1.121246337890625, -1.01617431640625, -0.911102294921875, -0.8060302734375, -0.700958251953125, -0.59588623046875, -0.490814208984375, -0.3857421875, -0.280670166015625, -0.17559814453125, -0.070526123046875, 0.0345458984375, 0.139617919921875, 0.24468994140625, 0.349761962890625, 0.454833984375, 0.559906005859375, 0.66497802734375, 0.770050048828125, 0.8751220703125, 0.980194091796875, 1.08526611328125, 1.190338134765625, 1.29541015625, 1.400482177734375, 1.50555419921875, 1.610626220703125, 1.7156982421875, 1.820770263671875, 1.92584228515625, 2.030914306640625, 2.135986328125, 2.241058349609375, 2.34613037109375, 2.451202392578125, 2.5562744140625, 2.661346435546875, 2.76641845703125, 2.871490478515625, 2.9765625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 7.0, 19.0, 36.0, 53.0, 77.0, 93.0, 138.0, 138.0, 132.0, 102.0, 82.0, 51.0, 39.0, 15.0, 10.0, 5.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.287109375, -1.2581939697265625, -1.229278564453125, -1.2003631591796875, -1.17144775390625, -1.1425323486328125, -1.113616943359375, -1.0847015380859375, -1.0557861328125, -1.0268707275390625, -0.997955322265625, -0.9690399169921875, -0.94012451171875, -0.9112091064453125, -0.882293701171875, -0.8533782958984375, -0.824462890625, -0.7955474853515625, -0.766632080078125, -0.7377166748046875, -0.70880126953125, -0.6798858642578125, -0.650970458984375, -0.6220550537109375, -0.5931396484375, -0.5642242431640625, -0.535308837890625, -0.5063934326171875, -0.47747802734375, -0.4485626220703125, -0.419647216796875, -0.3907318115234375, -0.36181640625, -0.3329010009765625, -0.303985595703125, -0.2750701904296875, -0.24615478515625, -0.2172393798828125, -0.188323974609375, -0.1594085693359375, -0.1304931640625, -0.1015777587890625, -0.072662353515625, -0.0437469482421875, -0.01483154296875, 0.0140838623046875, 0.042999267578125, 0.0719146728515625, 0.100830078125, 0.1297454833984375, 0.158660888671875, 0.1875762939453125, 0.21649169921875, 0.2454071044921875, 0.274322509765625, 0.3032379150390625, 0.3321533203125, 0.3610687255859375, 0.389984130859375, 0.4188995361328125, 0.44781494140625, 0.4767303466796875, 0.505645751953125, 0.5345611572265625, 0.5634765625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 12.0, 12.0, 13.0, 18.0, 29.0, 59.0, 60.0, 109.0, 186.0, 373.0, 706.0, 1826.0, 5173.0, 18923.0, 103757.0, 733511.0, 149160.0, 24376.0, 6258.0, 2078.0, 888.0, 440.0, 215.0, 114.0, 70.0, 45.0, 34.0, 22.0, 24.0, 8.0, 11.0, 6.0, 12.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8046875, -1.741546630859375, -1.67840576171875, -1.615264892578125, -1.5521240234375, -1.488983154296875, -1.42584228515625, -1.362701416015625, -1.299560546875, -1.236419677734375, -1.17327880859375, -1.110137939453125, -1.0469970703125, -0.983856201171875, -0.92071533203125, -0.857574462890625, -0.79443359375, -0.731292724609375, -0.66815185546875, -0.605010986328125, -0.5418701171875, -0.478729248046875, -0.41558837890625, -0.352447509765625, -0.289306640625, -0.226165771484375, -0.16302490234375, -0.099884033203125, -0.0367431640625, 0.026397705078125, 0.08953857421875, 0.152679443359375, 0.2158203125, 0.278961181640625, 0.34210205078125, 0.405242919921875, 0.4683837890625, 0.531524658203125, 0.59466552734375, 0.657806396484375, 0.720947265625, 0.784088134765625, 0.84722900390625, 0.910369873046875, 0.9735107421875, 1.036651611328125, 1.09979248046875, 1.162933349609375, 1.22607421875, 1.289215087890625, 1.35235595703125, 1.415496826171875, 1.4786376953125, 1.541778564453125, 1.60491943359375, 1.668060302734375, 1.731201171875, 1.794342041015625, 1.85748291015625, 1.920623779296875, 1.9837646484375, 2.046905517578125, 2.11004638671875, 2.173187255859375, 2.236328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 7.0, 9.0, 8.0, 11.0, 14.0, 19.0, 23.0, 31.0, 32.0, 29.0, 37.0, 35.0, 53.0, 62.0, 56.0, 63.0, 58.0, 54.0, 55.0, 58.0, 39.0, 41.0, 42.0, 30.0, 23.0, 24.0, 18.0, 15.0, 11.0, 11.0, 5.0, 8.0, 4.0, 7.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.607421875, -1.551849365234375, -1.49627685546875, -1.440704345703125, -1.3851318359375, -1.329559326171875, -1.27398681640625, -1.218414306640625, -1.162841796875, -1.107269287109375, -1.05169677734375, -0.996124267578125, -0.9405517578125, -0.884979248046875, -0.82940673828125, -0.773834228515625, -0.71826171875, -0.662689208984375, -0.60711669921875, -0.551544189453125, -0.4959716796875, -0.440399169921875, -0.38482666015625, -0.329254150390625, -0.273681640625, -0.218109130859375, -0.16253662109375, -0.106964111328125, -0.0513916015625, 0.004180908203125, 0.05975341796875, 0.115325927734375, 0.1708984375, 0.226470947265625, 0.28204345703125, 0.337615966796875, 0.3931884765625, 0.448760986328125, 0.50433349609375, 0.559906005859375, 0.615478515625, 0.671051025390625, 0.72662353515625, 0.782196044921875, 0.8377685546875, 0.893341064453125, 0.94891357421875, 1.004486083984375, 1.06005859375, 1.115631103515625, 1.17120361328125, 1.226776123046875, 1.2823486328125, 1.337921142578125, 1.39349365234375, 1.449066162109375, 1.504638671875, 1.560211181640625, 1.61578369140625, 1.671356201171875, 1.7269287109375, 1.782501220703125, 1.83807373046875, 1.893646240234375, 1.94921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 10.0, 15.0, 13.0, 34.0, 46.0, 98.0, 155.0, 271.0, 594.0, 1257.0, 3050.0, 8924.0, 37875.0, 630545.0, 328150.0, 25985.0, 6880.0, 2478.0, 1111.0, 461.0, 217.0, 128.0, 79.0, 52.0, 38.0, 19.0, 12.0, 11.0, 12.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9375, -0.9071502685546875, -0.876800537109375, -0.8464508056640625, -0.81610107421875, -0.7857513427734375, -0.755401611328125, -0.7250518798828125, -0.6947021484375, -0.6643524169921875, -0.634002685546875, -0.6036529541015625, -0.57330322265625, -0.5429534912109375, -0.512603759765625, -0.4822540283203125, -0.451904296875, -0.4215545654296875, -0.391204833984375, -0.3608551025390625, -0.33050537109375, -0.3001556396484375, -0.269805908203125, -0.2394561767578125, -0.2091064453125, -0.1787567138671875, -0.148406982421875, -0.1180572509765625, -0.08770751953125, -0.0573577880859375, -0.027008056640625, 0.0033416748046875, 0.03369140625, 0.0640411376953125, 0.094390869140625, 0.1247406005859375, 0.15509033203125, 0.1854400634765625, 0.215789794921875, 0.2461395263671875, 0.2764892578125, 0.3068389892578125, 0.337188720703125, 0.3675384521484375, 0.39788818359375, 0.4282379150390625, 0.458587646484375, 0.4889373779296875, 0.519287109375, 0.5496368408203125, 0.579986572265625, 0.6103363037109375, 0.64068603515625, 0.6710357666015625, 0.701385498046875, 0.7317352294921875, 0.7620849609375, 0.7924346923828125, 0.822784423828125, 0.8531341552734375, 0.88348388671875, 0.9138336181640625, 0.944183349609375, 0.9745330810546875, 1.0048828125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 17.0, 26.0, 32.0, 36.0, 74.0, 110.0, 163.0, 164.0, 129.0, 81.0, 52.0, 37.0, 28.0, 10.0, 5.0, 7.0, 8.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003216266632080078, -0.0003131777048110962, -0.00030472874641418457, -0.00029627978801727295, -0.00028783082962036133, -0.0002793818712234497, -0.0002709329128265381, -0.00026248395442962646, -0.00025403499603271484, -0.0002455860376358032, -0.0002371370792388916, -0.00022868812084197998, -0.00022023916244506836, -0.00021179020404815674, -0.00020334124565124512, -0.0001948922872543335, -0.00018644332885742188, -0.00017799437046051025, -0.00016954541206359863, -0.000161096453666687, -0.0001526474952697754, -0.00014419853687286377, -0.00013574957847595215, -0.00012730062007904053, -0.0001188516616821289, -0.00011040270328521729, -0.00010195374488830566, -9.350478649139404e-05, -8.505582809448242e-05, -7.66068696975708e-05, -6.815791130065918e-05, -5.970895290374756e-05, -5.125999450683594e-05, -4.2811036109924316e-05, -3.4362077713012695e-05, -2.5913119316101074e-05, -1.7464160919189453e-05, -9.015202522277832e-06, -5.662441253662109e-07, 7.88271427154541e-06, 1.633167266845703e-05, 2.4780631065368652e-05, 3.3229589462280273e-05, 4.1678547859191895e-05, 5.0127506256103516e-05, 5.857646465301514e-05, 6.702542304992676e-05, 7.547438144683838e-05, 8.392333984375e-05, 9.237229824066162e-05, 0.00010082125663757324, 0.00010927021503448486, 0.00011771917343139648, 0.0001261681318283081, 0.00013461709022521973, 0.00014306604862213135, 0.00015151500701904297, 0.0001599639654159546, 0.0001684129238128662, 0.00017686188220977783, 0.00018531084060668945, 0.00019375979900360107, 0.0002022087574005127, 0.00021065771579742432, 0.00021910667419433594]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 9.0, 7.0, 8.0, 19.0, 27.0, 35.0, 53.0, 92.0, 170.0, 291.0, 484.0, 959.0, 2428.0, 6982.0, 32149.0, 555157.0, 412548.0, 26654.0, 6254.0, 2087.0, 1011.0, 483.0, 252.0, 131.0, 84.0, 55.0, 41.0, 26.0, 16.0, 14.0, 9.0, 9.0, 3.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.189453125, -1.158111572265625, -1.12677001953125, -1.095428466796875, -1.0640869140625, -1.032745361328125, -1.00140380859375, -0.970062255859375, -0.938720703125, -0.907379150390625, -0.87603759765625, -0.844696044921875, -0.8133544921875, -0.782012939453125, -0.75067138671875, -0.719329833984375, -0.68798828125, -0.656646728515625, -0.62530517578125, -0.593963623046875, -0.5626220703125, -0.531280517578125, -0.49993896484375, -0.468597412109375, -0.437255859375, -0.405914306640625, -0.37457275390625, -0.343231201171875, -0.3118896484375, -0.280548095703125, -0.24920654296875, -0.217864990234375, -0.1865234375, -0.155181884765625, -0.12384033203125, -0.092498779296875, -0.0611572265625, -0.029815673828125, 0.00152587890625, 0.032867431640625, 0.064208984375, 0.095550537109375, 0.12689208984375, 0.158233642578125, 0.1895751953125, 0.220916748046875, 0.25225830078125, 0.283599853515625, 0.31494140625, 0.346282958984375, 0.37762451171875, 0.408966064453125, 0.4403076171875, 0.471649169921875, 0.50299072265625, 0.534332275390625, 0.565673828125, 0.597015380859375, 0.62835693359375, 0.659698486328125, 0.6910400390625, 0.722381591796875, 0.75372314453125, 0.785064697265625, 0.81640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 1.0, 4.0, 3.0, 5.0, 8.0, 18.0, 33.0, 39.0, 82.0, 175.0, 175.0, 184.0, 128.0, 67.0, 23.0, 23.0, 12.0, 8.0, 5.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98876953125, -0.9632339477539062, -0.9376983642578125, -0.9121627807617188, -0.886627197265625, -0.8610916137695312, -0.8355560302734375, -0.8100204467773438, -0.78448486328125, -0.7589492797851562, -0.7334136962890625, -0.7078781127929688, -0.682342529296875, -0.6568069458007812, -0.6312713623046875, -0.6057357788085938, -0.5802001953125, -0.5546646118164062, -0.5291290283203125, -0.5035934448242188, -0.478057861328125, -0.45252227783203125, -0.4269866943359375, -0.40145111083984375, -0.37591552734375, -0.35037994384765625, -0.3248443603515625, -0.29930877685546875, -0.273773193359375, -0.24823760986328125, -0.2227020263671875, -0.19716644287109375, -0.171630859375, -0.14609527587890625, -0.1205596923828125, -0.09502410888671875, -0.069488525390625, -0.04395294189453125, -0.0184173583984375, 0.00711822509765625, 0.03265380859375, 0.05818939208984375, 0.0837249755859375, 0.10926055908203125, 0.134796142578125, 0.16033172607421875, 0.1858673095703125, 0.21140289306640625, 0.2369384765625, 0.26247406005859375, 0.2880096435546875, 0.31354522705078125, 0.339080810546875, 0.36461639404296875, 0.3901519775390625, 0.41568756103515625, 0.44122314453125, 0.46675872802734375, 0.4922943115234375, 0.5178298950195312, 0.543365478515625, 0.5689010620117188, 0.5944366455078125, 0.6199722290039062, 0.6455078125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 10.0, 28.0, 125.0, 377.0, 305.0, 105.0, 25.0, 14.0, 8.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.373247146606445, -27.724830627441406, -27.076416015625, -26.42799949645996, -25.779582977294922, -25.131168365478516, -24.482751846313477, -23.834335327148438, -23.18592071533203, -22.537504196166992, -21.889089584350586, -21.240673065185547, -20.592256546020508, -19.94384002685547, -19.295425415039062, -18.647008895874023, -17.998592376708984, -17.350175857543945, -16.70176124572754, -16.0533447265625, -15.404928207397461, -14.756512641906738, -14.108097076416016, -13.459680557250977, -12.811264991760254, -12.162849426269531, -11.514432907104492, -10.86601734161377, -10.217601776123047, -9.569185256958008, -8.920769691467285, -8.272354125976562, -7.623935699462891, -6.97551965713501, -6.327103614807129, -5.678688049316406, -5.030272006988525, -4.3818559646606445, -3.7334401607513428, -3.085024356842041, -2.43660831451416, -1.7881923913955688, -1.1397764682769775, -0.49136054515838623, 0.15705537796020508, 0.8054714202880859, 1.4538872241973877, 2.1023030281066895, 2.7507190704345703, 3.399135112762451, 4.047551155090332, 4.695966720581055, 5.3443827629089355, 5.992798805236816, 6.641214370727539, 7.28963041305542, 7.938046455383301, 8.586462020874023, 9.234878540039062, 9.883294105529785, 10.531709671020508, 11.180126190185547, 11.82854175567627, 12.476957321166992, 13.125373840332031]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 7.0, 8.0, 9.0, 7.0, 6.0, 11.0, 21.0, 29.0, 22.0, 36.0, 30.0, 39.0, 42.0, 48.0, 60.0, 50.0, 58.0, 59.0, 56.0, 51.0, 46.0, 37.0, 28.0, 42.0, 32.0, 38.0, 29.0, 23.0, 16.0, 16.0, 13.0, 13.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.747722625732422, -9.450126647949219, -9.1525297164917, -8.85493278503418, -8.557336807250977, -8.259740829467773, -7.962143898010254, -7.664547443389893, -7.366950988769531, -7.06935453414917, -6.771758079528809, -6.474161624908447, -6.176565170288086, -5.878968715667725, -5.581372261047363, -5.283775806427002, -4.986179351806641, -4.688582897186279, -4.390986442565918, -4.093389987945557, -3.7957935333251953, -3.498197078704834, -3.2006006240844727, -2.9030041694641113, -2.60540771484375, -2.3078112602233887, -2.0102148056030273, -1.712618350982666, -1.4150218963623047, -1.1174254417419434, -0.819828987121582, -0.5222325325012207, -0.22463607788085938, 0.07296037673950195, 0.3705568313598633, 0.6681532859802246, 0.9657497406005859, 1.2633461952209473, 1.5609426498413086, 1.85853910446167, 2.1561355590820312, 2.4537320137023926, 2.751328468322754, 3.0489249229431152, 3.3465213775634766, 3.644117832183838, 3.941714286804199, 4.2393107414245605, 4.536907196044922, 4.834503650665283, 5.1321001052856445, 5.429696559906006, 5.727293014526367, 6.0248894691467285, 6.32248592376709, 6.620082378387451, 6.9176788330078125, 7.215275287628174, 7.512871742248535, 7.8104681968688965, 8.108064651489258, 8.405660629272461, 8.70325756072998, 9.0008544921875, 9.298450469970703]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 6.0, 6.0, 13.0, 11.0, 15.0, 25.0, 28.0, 24.0, 43.0, 53.0, 100.0, 98.0, 176.0, 356.0, 801.0, 2045.0, 7804.0, 69795.0, 4053531.0, 49648.0, 6770.0, 1774.0, 642.0, 249.0, 107.0, 55.0, 31.0, 26.0, 15.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.73828125, -5.59637451171875, -5.4544677734375, -5.31256103515625, -5.170654296875, -5.02874755859375, -4.8868408203125, -4.74493408203125, -4.60302734375, -4.46112060546875, -4.3192138671875, -4.17730712890625, -4.035400390625, -3.89349365234375, -3.7515869140625, -3.60968017578125, -3.4677734375, -3.32586669921875, -3.1839599609375, -3.04205322265625, -2.900146484375, -2.75823974609375, -2.6163330078125, -2.47442626953125, -2.33251953125, -2.19061279296875, -2.0487060546875, -1.90679931640625, -1.764892578125, -1.62298583984375, -1.4810791015625, -1.33917236328125, -1.197265625, -1.05535888671875, -0.9134521484375, -0.77154541015625, -0.629638671875, -0.48773193359375, -0.3458251953125, -0.20391845703125, -0.06201171875, 0.07989501953125, 0.2218017578125, 0.36370849609375, 0.505615234375, 0.64752197265625, 0.7894287109375, 0.93133544921875, 1.0732421875, 1.21514892578125, 1.3570556640625, 1.49896240234375, 1.640869140625, 1.78277587890625, 1.9246826171875, 2.06658935546875, 2.20849609375, 2.35040283203125, 2.4923095703125, 2.63421630859375, 2.776123046875, 2.91802978515625, 3.0599365234375, 3.20184326171875, 3.34375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 7.0, 15.0, 17.0, 43.0, 63.0, 78.0, 124.0, 121.0, 140.0, 100.0, 89.0, 83.0, 46.0, 31.0, 22.0, 12.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3369140625, -1.3079910278320312, -1.2790679931640625, -1.2501449584960938, -1.221221923828125, -1.1922988891601562, -1.1633758544921875, -1.1344528198242188, -1.10552978515625, -1.0766067504882812, -1.0476837158203125, -1.0187606811523438, -0.989837646484375, -0.9609146118164062, -0.9319915771484375, -0.9030685424804688, -0.8741455078125, -0.8452224731445312, -0.8162994384765625, -0.7873764038085938, -0.758453369140625, -0.7295303344726562, -0.7006072998046875, -0.6716842651367188, -0.64276123046875, -0.6138381958007812, -0.5849151611328125, -0.5559921264648438, -0.527069091796875, -0.49814605712890625, -0.4692230224609375, -0.44029998779296875, -0.411376953125, -0.38245391845703125, -0.3535308837890625, -0.32460784912109375, -0.295684814453125, -0.26676177978515625, -0.2378387451171875, -0.20891571044921875, -0.17999267578125, -0.15106964111328125, -0.1221466064453125, -0.09322357177734375, -0.064300537109375, -0.03537750244140625, -0.0064544677734375, 0.02246856689453125, 0.0513916015625, 0.08031463623046875, 0.1092376708984375, 0.13816070556640625, 0.167083740234375, 0.19600677490234375, 0.2249298095703125, 0.25385284423828125, 0.28277587890625, 0.31169891357421875, 0.3406219482421875, 0.36954498291015625, 0.398468017578125, 0.42739105224609375, 0.4563140869140625, 0.48523712158203125, 0.51416015625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 8.0, 11.0, 29.0, 31.0, 64.0, 120.0, 190.0, 387.0, 1505.0, 464747.0, 3724303.0, 1859.0, 500.0, 229.0, 136.0, 73.0, 46.0, 20.0, 19.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.8482666015625, -9.509033203125, -9.1697998046875, -8.83056640625, -8.4913330078125, -8.152099609375, -7.8128662109375, -7.4736328125, -7.1343994140625, -6.795166015625, -6.4559326171875, -6.11669921875, -5.7774658203125, -5.438232421875, -5.0989990234375, -4.759765625, -4.4205322265625, -4.081298828125, -3.7420654296875, -3.40283203125, -3.0635986328125, -2.724365234375, -2.3851318359375, -2.0458984375, -1.7066650390625, -1.367431640625, -1.0281982421875, -0.68896484375, -0.3497314453125, -0.010498046875, 0.3287353515625, 0.66796875, 1.0072021484375, 1.346435546875, 1.6856689453125, 2.02490234375, 2.3641357421875, 2.703369140625, 3.0426025390625, 3.3818359375, 3.7210693359375, 4.060302734375, 4.3995361328125, 4.73876953125, 5.0780029296875, 5.417236328125, 5.7564697265625, 6.095703125, 6.4349365234375, 6.774169921875, 7.1134033203125, 7.45263671875, 7.7918701171875, 8.131103515625, 8.4703369140625, 8.8095703125, 9.1488037109375, 9.488037109375, 9.8272705078125, 10.16650390625, 10.5057373046875, 10.844970703125, 11.1842041015625, 11.5234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 38.0, 178.0, 3619.0, 198.0, 27.0, 17.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.456939697265625, -2.37091064453125, -2.284881591796875, -2.1988525390625, -2.112823486328125, -2.02679443359375, -1.940765380859375, -1.854736328125, -1.768707275390625, -1.68267822265625, -1.596649169921875, -1.5106201171875, -1.424591064453125, -1.33856201171875, -1.252532958984375, -1.16650390625, -1.080474853515625, -0.99444580078125, -0.908416748046875, -0.8223876953125, -0.736358642578125, -0.65032958984375, -0.564300537109375, -0.478271484375, -0.392242431640625, -0.30621337890625, -0.220184326171875, -0.1341552734375, -0.048126220703125, 0.03790283203125, 0.123931884765625, 0.2099609375, 0.295989990234375, 0.38201904296875, 0.468048095703125, 0.5540771484375, 0.640106201171875, 0.72613525390625, 0.812164306640625, 0.898193359375, 0.984222412109375, 1.07025146484375, 1.156280517578125, 1.2423095703125, 1.328338623046875, 1.41436767578125, 1.500396728515625, 1.58642578125, 1.672454833984375, 1.75848388671875, 1.844512939453125, 1.9305419921875, 2.016571044921875, 2.10260009765625, 2.188629150390625, 2.274658203125, 2.360687255859375, 2.44671630859375, 2.532745361328125, 2.6187744140625, 2.704803466796875, 2.79083251953125, 2.876861572265625, 2.962890625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 9.0, 18.0, 71.0, 268.0, 404.0, 170.0, 35.0, 15.0, 5.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.647691249847412, -6.404347896575928, -6.161004066467285, -5.917660713195801, -5.674317359924316, -5.430974006652832, -5.1876301765441895, -4.944286823272705, -4.7009429931640625, -4.457599639892578, -4.2142558097839355, -3.970912456512451, -3.727569103240967, -3.4842255115509033, -3.24088191986084, -2.9975385665893555, -2.754195213317871, -2.5108516216278076, -2.2675082683563232, -2.0241646766662598, -1.7808212041854858, -1.537477731704712, -1.2941341400146484, -1.0507906675338745, -0.8074471950531006, -0.5641037225723267, -0.32076019048690796, -0.07741665840148926, 0.16592681407928467, 0.4092702865600586, 0.6526138782501221, 0.895957350730896, 1.1393003463745117, 1.3826438188552856, 1.6259872913360596, 1.869330883026123, 2.1126742362976074, 2.356017827987671, 2.5993614196777344, 2.8427047729492188, 3.0860483646392822, 3.3293919563293457, 3.57273530960083, 3.8160789012908936, 4.059422492980957, 4.302765846252441, 4.546109199523926, 4.789453029632568, 5.032796382904053, 5.276139736175537, 5.51948356628418, 5.762826919555664, 6.006170272827148, 6.249513626098633, 6.492857456207275, 6.73620080947876, 6.979544639587402, 7.222887992858887, 7.466231822967529, 7.709575176239014, 7.952918529510498, 8.19626235961914, 8.439605712890625, 8.68294906616211, 8.926292419433594]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 3.0, 7.0, 9.0, 26.0, 29.0, 41.0, 66.0, 57.0, 83.0, 96.0, 90.0, 103.0, 90.0, 77.0, 79.0, 46.0, 37.0, 28.0, 9.0, 15.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.543935775756836, -4.413177490234375, -4.282419204711914, -4.151660442352295, -4.020902156829834, -3.890143871307373, -3.759385347366333, -3.628626823425293, -3.497868537902832, -3.367110252380371, -3.236351728439331, -3.105593204498291, -2.97483491897583, -2.844076633453369, -2.713318109512329, -2.582559585571289, -2.451801300048828, -2.321043014526367, -2.190284490585327, -2.059525966644287, -1.9287676811218262, -1.7980092763900757, -1.6672508716583252, -1.5364924669265747, -1.4057340621948242, -1.2749756574630737, -1.1442172527313232, -1.0134588479995728, -0.8827004432678223, -0.7519420385360718, -0.6211836338043213, -0.4904252290725708, -0.3596673011779785, -0.22890889644622803, -0.09815049171447754, 0.03260791301727295, 0.16336631774902344, 0.2941247224807739, 0.4248831272125244, 0.5556415319442749, 0.6863999366760254, 0.8171583414077759, 0.9479167461395264, 1.0786751508712769, 1.2094335556030273, 1.3401919603347778, 1.4709503650665283, 1.6017087697982788, 1.7324671745300293, 1.8632255792617798, 1.9939839839935303, 2.1247425079345703, 2.2555007934570312, 2.386259078979492, 2.5170176029205322, 2.6477761268615723, 2.778534412384033, 2.909292697906494, 3.040051221847534, 3.170809745788574, 3.301568031311035, 3.432326316833496, 3.563084840774536, 3.693843364715576, 3.824601650238037]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 9.0, 6.0, 13.0, 12.0, 13.0, 24.0, 25.0, 52.0, 77.0, 147.0, 200.0, 464.0, 1115.0, 3689.0, 18796.0, 280381.0, 697221.0, 37510.0, 5818.0, 1615.0, 637.0, 298.0, 147.0, 97.0, 64.0, 35.0, 26.0, 18.0, 10.0, 8.0, 4.0, 7.0, 10.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.310546875, -3.200775146484375, -3.09100341796875, -2.981231689453125, -2.8714599609375, -2.761688232421875, -2.65191650390625, -2.542144775390625, -2.432373046875, -2.322601318359375, -2.21282958984375, -2.103057861328125, -1.9932861328125, -1.883514404296875, -1.77374267578125, -1.663970947265625, -1.55419921875, -1.444427490234375, -1.33465576171875, -1.224884033203125, -1.1151123046875, -1.005340576171875, -0.89556884765625, -0.785797119140625, -0.676025390625, -0.566253662109375, -0.45648193359375, -0.346710205078125, -0.2369384765625, -0.127166748046875, -0.01739501953125, 0.092376708984375, 0.2021484375, 0.311920166015625, 0.42169189453125, 0.531463623046875, 0.6412353515625, 0.751007080078125, 0.86077880859375, 0.970550537109375, 1.080322265625, 1.190093994140625, 1.29986572265625, 1.409637451171875, 1.5194091796875, 1.629180908203125, 1.73895263671875, 1.848724365234375, 1.95849609375, 2.068267822265625, 2.17803955078125, 2.287811279296875, 2.3975830078125, 2.507354736328125, 2.61712646484375, 2.726898193359375, 2.836669921875, 2.946441650390625, 3.05621337890625, 3.165985107421875, 3.2757568359375, 3.385528564453125, 3.49530029296875, 3.605072021484375, 3.71484375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 4.0, 12.0, 22.0, 41.0, 47.0, 68.0, 85.0, 109.0, 106.0, 108.0, 97.0, 80.0, 61.0, 65.0, 34.0, 23.0, 15.0, 8.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.1962890625, -1.1702537536621094, -1.1442184448242188, -1.1181831359863281, -1.0921478271484375, -1.0661125183105469, -1.0400772094726562, -1.0140419006347656, -0.988006591796875, -0.9619712829589844, -0.9359359741210938, -0.9099006652832031, -0.8838653564453125, -0.8578300476074219, -0.8317947387695312, -0.8057594299316406, -0.77972412109375, -0.7536888122558594, -0.7276535034179688, -0.7016181945800781, -0.6755828857421875, -0.6495475769042969, -0.6235122680664062, -0.5974769592285156, -0.571441650390625, -0.5454063415527344, -0.5193710327148438, -0.4933357238769531, -0.4673004150390625, -0.4412651062011719, -0.41522979736328125, -0.3891944885253906, -0.3631591796875, -0.3371238708496094, -0.31108856201171875, -0.2850532531738281, -0.2590179443359375, -0.23298263549804688, -0.20694732666015625, -0.18091201782226562, -0.154876708984375, -0.12884140014648438, -0.10280609130859375, -0.07677078247070312, -0.0507354736328125, -0.024700164794921875, 0.00133514404296875, 0.027370452880859375, 0.05340576171875, 0.07944107055664062, 0.10547637939453125, 0.13151168823242188, 0.1575469970703125, 0.18358230590820312, 0.20961761474609375, 0.23565292358398438, 0.261688232421875, 0.2877235412597656, 0.31375885009765625, 0.3397941589355469, 0.3658294677734375, 0.3918647766113281, 0.41790008544921875, 0.4439353942871094, 0.469970703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 8.0, 10.0, 12.0, 13.0, 25.0, 40.0, 44.0, 81.0, 127.0, 272.0, 451.0, 1087.0, 3072.0, 12329.0, 86973.0, 779392.0, 141198.0, 16986.0, 3969.0, 1242.0, 521.0, 256.0, 176.0, 98.0, 38.0, 35.0, 23.0, 17.0, 10.0, 7.0, 6.0, 9.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.291015625, -3.20574951171875, -3.1204833984375, -3.03521728515625, -2.949951171875, -2.86468505859375, -2.7794189453125, -2.69415283203125, -2.60888671875, -2.52362060546875, -2.4383544921875, -2.35308837890625, -2.267822265625, -2.18255615234375, -2.0972900390625, -2.01202392578125, -1.9267578125, -1.84149169921875, -1.7562255859375, -1.67095947265625, -1.585693359375, -1.50042724609375, -1.4151611328125, -1.32989501953125, -1.24462890625, -1.15936279296875, -1.0740966796875, -0.98883056640625, -0.903564453125, -0.81829833984375, -0.7330322265625, -0.64776611328125, -0.5625, -0.47723388671875, -0.3919677734375, -0.30670166015625, -0.221435546875, -0.13616943359375, -0.0509033203125, 0.03436279296875, 0.11962890625, 0.20489501953125, 0.2901611328125, 0.37542724609375, 0.460693359375, 0.54595947265625, 0.6312255859375, 0.71649169921875, 0.8017578125, 0.88702392578125, 0.9722900390625, 1.05755615234375, 1.142822265625, 1.22808837890625, 1.3133544921875, 1.39862060546875, 1.48388671875, 1.56915283203125, 1.6544189453125, 1.73968505859375, 1.824951171875, 1.91021728515625, 1.9954833984375, 2.08074951171875, 2.166015625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 10.0, 3.0, 8.0, 15.0, 18.0, 19.0, 24.0, 28.0, 41.0, 26.0, 58.0, 65.0, 76.0, 63.0, 73.0, 65.0, 80.0, 58.0, 44.0, 40.0, 36.0, 41.0, 27.0, 26.0, 10.0, 9.0, 8.0, 4.0, 2.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-3.271484375, -3.188720703125, -3.10595703125, -3.023193359375, -2.9404296875, -2.857666015625, -2.77490234375, -2.692138671875, -2.609375, -2.526611328125, -2.44384765625, -2.361083984375, -2.2783203125, -2.195556640625, -2.11279296875, -2.030029296875, -1.947265625, -1.864501953125, -1.78173828125, -1.698974609375, -1.6162109375, -1.533447265625, -1.45068359375, -1.367919921875, -1.28515625, -1.202392578125, -1.11962890625, -1.036865234375, -0.9541015625, -0.871337890625, -0.78857421875, -0.705810546875, -0.623046875, -0.540283203125, -0.45751953125, -0.374755859375, -0.2919921875, -0.209228515625, -0.12646484375, -0.043701171875, 0.0390625, 0.121826171875, 0.20458984375, 0.287353515625, 0.3701171875, 0.452880859375, 0.53564453125, 0.618408203125, 0.701171875, 0.783935546875, 0.86669921875, 0.949462890625, 1.0322265625, 1.114990234375, 1.19775390625, 1.280517578125, 1.36328125, 1.446044921875, 1.52880859375, 1.611572265625, 1.6943359375, 1.777099609375, 1.85986328125, 1.942626953125, 2.025390625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 10.0, 12.0, 10.0, 18.0, 27.0, 43.0, 51.0, 77.0, 120.0, 210.0, 302.0, 561.0, 1022.0, 2001.0, 4225.0, 10243.0, 31312.0, 198128.0, 681930.0, 84579.0, 19785.0, 7228.0, 3189.0, 1452.0, 789.0, 474.0, 259.0, 171.0, 91.0, 74.0, 50.0, 31.0, 27.0, 15.0, 10.0, 7.0, 9.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8251953125, -0.7970428466796875, -0.768890380859375, -0.7407379150390625, -0.71258544921875, -0.6844329833984375, -0.656280517578125, -0.6281280517578125, -0.5999755859375, -0.5718231201171875, -0.543670654296875, -0.5155181884765625, -0.48736572265625, -0.4592132568359375, -0.431060791015625, -0.4029083251953125, -0.374755859375, -0.3466033935546875, -0.318450927734375, -0.2902984619140625, -0.26214599609375, -0.2339935302734375, -0.205841064453125, -0.1776885986328125, -0.1495361328125, -0.1213836669921875, -0.093231201171875, -0.0650787353515625, -0.03692626953125, -0.0087738037109375, 0.019378662109375, 0.0475311279296875, 0.07568359375, 0.1038360595703125, 0.131988525390625, 0.1601409912109375, 0.18829345703125, 0.2164459228515625, 0.244598388671875, 0.2727508544921875, 0.3009033203125, 0.3290557861328125, 0.357208251953125, 0.3853607177734375, 0.41351318359375, 0.4416656494140625, 0.469818115234375, 0.4979705810546875, 0.526123046875, 0.5542755126953125, 0.582427978515625, 0.6105804443359375, 0.63873291015625, 0.6668853759765625, 0.695037841796875, 0.7231903076171875, 0.7513427734375, 0.7794952392578125, 0.807647705078125, 0.8358001708984375, 0.86395263671875, 0.8921051025390625, 0.920257568359375, 0.9484100341796875, 0.9765625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 10.0, 6.0, 7.0, 12.0, 9.0, 12.0, 29.0, 32.0, 42.0, 48.0, 50.0, 52.0, 91.0, 85.0, 110.0, 69.0, 69.0, 57.0, 47.0, 40.0, 19.0, 20.0, 19.0, 16.0, 6.0, 9.0, 8.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.00013780593872070312, -0.00013336539268493652, -0.00012892484664916992, -0.00012448430061340332, -0.00012004375457763672, -0.00011560320854187012, -0.00011116266250610352, -0.00010672211647033691, -0.00010228157043457031, -9.784102439880371e-05, -9.340047836303711e-05, -8.895993232727051e-05, -8.45193862915039e-05, -8.00788402557373e-05, -7.56382942199707e-05, -7.11977481842041e-05, -6.67572021484375e-05, -6.23166561126709e-05, -5.78761100769043e-05, -5.3435564041137695e-05, -4.8995018005371094e-05, -4.455447196960449e-05, -4.011392593383789e-05, -3.567337989807129e-05, -3.123283386230469e-05, -2.6792287826538086e-05, -2.2351741790771484e-05, -1.7911195755004883e-05, -1.3470649719238281e-05, -9.03010368347168e-06, -4.589557647705078e-06, -1.4901161193847656e-07, 4.291534423828125e-06, 8.732080459594727e-06, 1.3172626495361328e-05, 1.761317253112793e-05, 2.205371856689453e-05, 2.6494264602661133e-05, 3.0934810638427734e-05, 3.5375356674194336e-05, 3.981590270996094e-05, 4.425644874572754e-05, 4.869699478149414e-05, 5.313754081726074e-05, 5.7578086853027344e-05, 6.201863288879395e-05, 6.645917892456055e-05, 7.089972496032715e-05, 7.534027099609375e-05, 7.978081703186035e-05, 8.422136306762695e-05, 8.866190910339355e-05, 9.310245513916016e-05, 9.754300117492676e-05, 0.00010198354721069336, 0.00010642409324645996, 0.00011086463928222656, 0.00011530518531799316, 0.00011974573135375977, 0.00012418627738952637, 0.00012862682342529297, 0.00013306736946105957, 0.00013750791549682617, 0.00014194846153259277, 0.00014638900756835938]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 2.0, 8.0, 11.0, 20.0, 25.0, 28.0, 44.0, 85.0, 137.0, 225.0, 430.0, 809.0, 1836.0, 5227.0, 21295.0, 322097.0, 652606.0, 32646.0, 6598.0, 2338.0, 960.0, 474.0, 237.0, 141.0, 101.0, 57.0, 38.0, 15.0, 21.0, 12.0, 5.0, 7.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8642578125, -1.81658935546875, -1.7689208984375, -1.72125244140625, -1.673583984375, -1.62591552734375, -1.5782470703125, -1.53057861328125, -1.48291015625, -1.43524169921875, -1.3875732421875, -1.33990478515625, -1.292236328125, -1.24456787109375, -1.1968994140625, -1.14923095703125, -1.1015625, -1.05389404296875, -1.0062255859375, -0.95855712890625, -0.910888671875, -0.86322021484375, -0.8155517578125, -0.76788330078125, -0.72021484375, -0.67254638671875, -0.6248779296875, -0.57720947265625, -0.529541015625, -0.48187255859375, -0.4342041015625, -0.38653564453125, -0.3388671875, -0.29119873046875, -0.2435302734375, -0.19586181640625, -0.148193359375, -0.10052490234375, -0.0528564453125, -0.00518798828125, 0.04248046875, 0.09014892578125, 0.1378173828125, 0.18548583984375, 0.233154296875, 0.28082275390625, 0.3284912109375, 0.37615966796875, 0.423828125, 0.47149658203125, 0.5191650390625, 0.56683349609375, 0.614501953125, 0.66217041015625, 0.7098388671875, 0.75750732421875, 0.80517578125, 0.85284423828125, 0.9005126953125, 0.94818115234375, 0.995849609375, 1.04351806640625, 1.0911865234375, 1.13885498046875, 1.1865234375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 2.0, 6.0, 9.0, 6.0, 7.0, 15.0, 28.0, 39.0, 65.0, 88.0, 161.0, 178.0, 162.0, 100.0, 44.0, 29.0, 12.0, 15.0, 8.0, 7.0, 9.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.33203125, -1.2973098754882812, -1.2625885009765625, -1.2278671264648438, -1.193145751953125, -1.1584243774414062, -1.1237030029296875, -1.0889816284179688, -1.05426025390625, -1.0195388793945312, -0.9848175048828125, -0.9500961303710938, -0.915374755859375, -0.8806533813476562, -0.8459320068359375, -0.8112106323242188, -0.7764892578125, -0.7417678833007812, -0.7070465087890625, -0.6723251342773438, -0.637603759765625, -0.6028823852539062, -0.5681610107421875, -0.5334396362304688, -0.49871826171875, -0.46399688720703125, -0.4292755126953125, -0.39455413818359375, -0.359832763671875, -0.32511138916015625, -0.2903900146484375, -0.25566864013671875, -0.220947265625, -0.18622589111328125, -0.1515045166015625, -0.11678314208984375, -0.082061767578125, -0.04734039306640625, -0.0126190185546875, 0.02210235595703125, 0.05682373046875, 0.09154510498046875, 0.1262664794921875, 0.16098785400390625, 0.195709228515625, 0.23043060302734375, 0.2651519775390625, 0.29987335205078125, 0.3345947265625, 0.36931610107421875, 0.4040374755859375, 0.43875885009765625, 0.473480224609375, 0.5082015991210938, 0.5429229736328125, 0.5776443481445312, 0.61236572265625, 0.6470870971679688, 0.6818084716796875, 0.7165298461914062, 0.751251220703125, 0.7859725952148438, 0.8206939697265625, 0.8554153442382812, 0.89013671875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 8.0, 12.0, 15.0, 41.0, 121.0, 283.0, 303.0, 135.0, 50.0, 24.0, 6.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.609941482543945, -28.949974060058594, -28.29000473022461, -27.630035400390625, -26.970067977905273, -26.310100555419922, -25.650131225585938, -24.990161895751953, -24.3301944732666, -23.67022705078125, -23.010257720947266, -22.35028839111328, -21.69032096862793, -21.030353546142578, -20.370384216308594, -19.71041488647461, -19.050447463989258, -18.390480041503906, -17.730510711669922, -17.070541381835938, -16.410573959350586, -15.750605583190918, -15.09063720703125, -14.430668830871582, -13.770700454711914, -13.110732078552246, -12.450763702392578, -11.79079532623291, -11.130826950073242, -10.470858573913574, -9.810890197753906, -9.150921821594238, -8.490952491760254, -7.830984115600586, -7.171015739440918, -6.51104736328125, -5.851078987121582, -5.191110610961914, -4.531142234802246, -3.871173858642578, -3.21120548248291, -2.551237106323242, -1.8912687301635742, -1.2313003540039062, -0.5713319778442383, 0.08863639831542969, 0.7486047744750977, 1.4085731506347656, 2.0685415267944336, 2.7285099029541016, 3.3884782791137695, 4.0484466552734375, 4.7084150314331055, 5.368383407592773, 6.028351783752441, 6.688320159912109, 7.348288536071777, 8.008256912231445, 8.668225288391113, 9.328193664550781, 9.98816204071045, 10.648130416870117, 11.308098793029785, 11.968067169189453, 12.628035545349121]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 8.0, 12.0, 6.0, 12.0, 16.0, 11.0, 12.0, 20.0, 24.0, 31.0, 39.0, 34.0, 43.0, 45.0, 37.0, 49.0, 56.0, 48.0, 41.0, 54.0, 39.0, 42.0, 31.0, 48.0, 39.0, 33.0, 20.0, 32.0, 17.0, 15.0, 13.0, 15.0, 9.0, 10.0, 8.0, 6.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.417352676391602, -11.057940483093262, -10.698528289794922, -10.339116096496582, -9.979703903198242, -9.620291709899902, -9.260879516601562, -8.901466369628906, -8.542055130004883, -8.182642936706543, -7.823230743408203, -7.463818550109863, -7.104406356811523, -6.744994163513184, -6.3855814933776855, -6.026169300079346, -5.666756629943848, -5.307344436645508, -4.947932243347168, -4.588520050048828, -4.229107856750488, -3.8696954250335693, -3.5102829933166504, -3.1508708000183105, -2.7914586067199707, -2.432046413421631, -2.072634220123291, -1.713221788406372, -1.3538095951080322, -0.9943974018096924, -0.6349849700927734, -0.2755727767944336, 0.08383941650390625, 0.44325166940689087, 0.8026639223098755, 1.1620762348175049, 1.5214884281158447, 1.8809006214141846, 2.2403130531311035, 2.5997252464294434, 2.959137439727783, 3.318549633026123, 3.677961826324463, 4.037374496459961, 4.396786689758301, 4.756198883056641, 5.1156110763549805, 5.47502326965332, 5.83443546295166, 6.19384765625, 6.55325984954834, 6.91267204284668, 7.2720842361450195, 7.631496429443359, 7.990909099578857, 8.350320816040039, 8.709733963012695, 9.069146156311035, 9.428558349609375, 9.787970542907715, 10.147382736206055, 10.506794929504395, 10.866207122802734, 11.22562026977539, 11.585031509399414]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 7.0, 16.0, 17.0, 15.0, 25.0, 37.0, 60.0, 69.0, 127.0, 188.0, 347.0, 702.0, 1724.0, 6845.0, 49182.0, 3996598.0, 123314.0, 11210.0, 2412.0, 776.0, 329.0, 126.0, 68.0, 27.0, 18.0, 13.0, 6.0, 1.0, 4.0, 0.0, 3.0], "bins": [-8.5390625, -8.363525390625, -8.18798828125, -8.012451171875, -7.8369140625, -7.661376953125, -7.48583984375, -7.310302734375, -7.134765625, -6.959228515625, -6.78369140625, -6.608154296875, -6.4326171875, -6.257080078125, -6.08154296875, -5.906005859375, -5.73046875, -5.554931640625, -5.37939453125, -5.203857421875, -5.0283203125, -4.852783203125, -4.67724609375, -4.501708984375, -4.326171875, -4.150634765625, -3.97509765625, -3.799560546875, -3.6240234375, -3.448486328125, -3.27294921875, -3.097412109375, -2.921875, -2.746337890625, -2.57080078125, -2.395263671875, -2.2197265625, -2.044189453125, -1.86865234375, -1.693115234375, -1.517578125, -1.342041015625, -1.16650390625, -0.990966796875, -0.8154296875, -0.639892578125, -0.46435546875, -0.288818359375, -0.11328125, 0.062255859375, 0.23779296875, 0.413330078125, 0.5888671875, 0.764404296875, 0.93994140625, 1.115478515625, 1.291015625, 1.466552734375, 1.64208984375, 1.817626953125, 1.9931640625, 2.168701171875, 2.34423828125, 2.519775390625, 2.6953125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 9.0, 13.0, 18.0, 34.0, 47.0, 45.0, 75.0, 106.0, 83.0, 102.0, 99.0, 86.0, 77.0, 65.0, 49.0, 36.0, 22.0, 13.0, 11.0, 3.0, 2.0, 5.0, 2.0, 1.0, 3.0], "bins": [-1.283203125, -1.2567710876464844, -1.2303390502929688, -1.2039070129394531, -1.1774749755859375, -1.1510429382324219, -1.1246109008789062, -1.0981788635253906, -1.071746826171875, -1.0453147888183594, -1.0188827514648438, -0.9924507141113281, -0.9660186767578125, -0.9395866394042969, -0.9131546020507812, -0.8867225646972656, -0.86029052734375, -0.8338584899902344, -0.8074264526367188, -0.7809944152832031, -0.7545623779296875, -0.7281303405761719, -0.7016983032226562, -0.6752662658691406, -0.648834228515625, -0.6224021911621094, -0.5959701538085938, -0.5695381164550781, -0.5431060791015625, -0.5166740417480469, -0.49024200439453125, -0.4638099670410156, -0.4373779296875, -0.4109458923339844, -0.38451385498046875, -0.3580818176269531, -0.3316497802734375, -0.3052177429199219, -0.27878570556640625, -0.2523536682128906, -0.225921630859375, -0.19948959350585938, -0.17305755615234375, -0.14662551879882812, -0.1201934814453125, -0.09376144409179688, -0.06732940673828125, -0.040897369384765625, -0.01446533203125, 0.011966705322265625, 0.03839874267578125, 0.06483078002929688, 0.0912628173828125, 0.11769485473632812, 0.14412689208984375, 0.17055892944335938, 0.196990966796875, 0.22342300415039062, 0.24985504150390625, 0.2762870788574219, 0.3027191162109375, 0.3291511535644531, 0.35558319091796875, 0.3820152282714844, 0.408447265625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 4.0, 9.0, 21.0, 14.0, 32.0, 34.0, 64.0, 90.0, 149.0, 366.0, 1354.0, 9082.0, 4099535.0, 79038.0, 3487.0, 600.0, 205.0, 83.0, 38.0, 25.0, 19.0, 14.0, 11.0, 12.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.78021240234375, -15.4197998046875, -15.05938720703125, -14.698974609375, -14.33856201171875, -13.9781494140625, -13.61773681640625, -13.25732421875, -12.89691162109375, -12.5364990234375, -12.17608642578125, -11.815673828125, -11.45526123046875, -11.0948486328125, -10.73443603515625, -10.3740234375, -10.01361083984375, -9.6531982421875, -9.29278564453125, -8.932373046875, -8.57196044921875, -8.2115478515625, -7.85113525390625, -7.49072265625, -7.13031005859375, -6.7698974609375, -6.40948486328125, -6.049072265625, -5.68865966796875, -5.3282470703125, -4.96783447265625, -4.607421875, -4.24700927734375, -3.8865966796875, -3.52618408203125, -3.165771484375, -2.80535888671875, -2.4449462890625, -2.08453369140625, -1.72412109375, -1.36370849609375, -1.0032958984375, -0.64288330078125, -0.282470703125, 0.07794189453125, 0.4383544921875, 0.79876708984375, 1.1591796875, 1.51959228515625, 1.8800048828125, 2.24041748046875, 2.600830078125, 2.96124267578125, 3.3216552734375, 3.68206787109375, 4.04248046875, 4.40289306640625, 4.7633056640625, 5.12371826171875, 5.484130859375, 5.84454345703125, 6.2049560546875, 6.56536865234375, 6.92578125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 7.0, 13.0, 26.0, 58.0, 160.0, 2984.0, 664.0, 98.0, 27.0, 17.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-5.34765625, -5.2423553466796875, -5.137054443359375, -5.0317535400390625, -4.92645263671875, -4.8211517333984375, -4.715850830078125, -4.6105499267578125, -4.5052490234375, -4.3999481201171875, -4.294647216796875, -4.1893463134765625, -4.08404541015625, -3.9787445068359375, -3.873443603515625, -3.7681427001953125, -3.662841796875, -3.5575408935546875, -3.452239990234375, -3.3469390869140625, -3.24163818359375, -3.1363372802734375, -3.031036376953125, -2.9257354736328125, -2.8204345703125, -2.7151336669921875, -2.609832763671875, -2.5045318603515625, -2.39923095703125, -2.2939300537109375, -2.188629150390625, -2.0833282470703125, -1.97802734375, -1.8727264404296875, -1.767425537109375, -1.6621246337890625, -1.55682373046875, -1.4515228271484375, -1.346221923828125, -1.2409210205078125, -1.1356201171875, -1.0303192138671875, -0.925018310546875, -0.8197174072265625, -0.71441650390625, -0.6091156005859375, -0.503814697265625, -0.3985137939453125, -0.293212890625, -0.1879119873046875, -0.082611083984375, 0.0226898193359375, 0.12799072265625, 0.2332916259765625, 0.338592529296875, 0.4438934326171875, 0.5491943359375, 0.6544952392578125, 0.759796142578125, 0.8650970458984375, 0.97039794921875, 1.0756988525390625, 1.180999755859375, 1.2863006591796875, 1.3916015625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 5.0, 13.0, 16.0, 27.0, 77.0, 185.0, 294.0, 203.0, 102.0, 37.0, 24.0, 7.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.662993431091309, -11.335687637329102, -11.008380889892578, -10.681075096130371, -10.353768348693848, -10.02646255493164, -9.699155807495117, -9.37185001373291, -9.044544219970703, -8.717238426208496, -8.389931678771973, -8.062625885009766, -7.735319137573242, -7.408013343811035, -7.08070707321167, -6.753400802612305, -6.426094055175781, -6.098787784576416, -5.771481513977051, -5.4441752433776855, -5.11686897277832, -4.789563179016113, -4.462256908416748, -4.134950637817383, -3.8076443672180176, -3.4803380966186523, -3.153031826019287, -2.825725793838501, -2.4984195232391357, -2.1711132526397705, -1.8438071012496948, -1.5165009498596191, -1.1891937255859375, -0.861887514591217, -0.5345813035964966, -0.20727509260177612, 0.12003111839294434, 0.44733738899230957, 0.7746435403823853, 1.101949691772461, 1.4292559623718262, 1.7565622329711914, 2.0838685035705566, 2.4111745357513428, 2.738480806350708, 3.0657870769500732, 3.3930931091308594, 3.7203993797302246, 4.04770565032959, 4.375011920928955, 4.70231819152832, 5.0296244621276855, 5.356930732727051, 5.684236526489258, 6.011542797088623, 6.338849067687988, 6.6661553382873535, 6.993461608886719, 7.320767879486084, 7.648074150085449, 7.975379943847656, 8.30268669128418, 8.629992485046387, 8.957298278808594, 9.284605026245117]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 14.0, 40.0, 59.0, 71.0, 103.0, 127.0, 154.0, 126.0, 114.0, 83.0, 51.0, 27.0, 18.0, 6.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.98848819732666, -12.605815887451172, -12.223142623901367, -11.840470314025879, -11.457797050476074, -11.075124740600586, -10.692451477050781, -10.309779167175293, -9.927106857299805, -9.544434547424316, -9.161761283874512, -8.779088973999023, -8.396415710449219, -8.01374340057373, -7.631070613861084, -7.2483978271484375, -6.865724563598633, -6.483051776885986, -6.10037899017334, -5.717706680297852, -5.335033416748047, -4.952361106872559, -4.569688320159912, -4.187015533447266, -3.804342746734619, -3.4216699600219727, -3.038997173309326, -2.656324625015259, -2.2736518383026123, -1.8909790515899658, -1.5083065032958984, -1.125633716583252, -0.7429599761962891, -0.36028724908828735, 0.022385478019714355, 0.4050581455230713, 0.7877309322357178, 1.1704037189483643, 1.5530762672424316, 1.9357490539550781, 2.3184218406677246, 2.701094627380371, 3.0837674140930176, 3.466439962387085, 3.8491127490997314, 4.231785774230957, 4.614458084106445, 4.997130870819092, 5.379803657531738, 5.762476444244385, 6.145149230957031, 6.5278215408325195, 6.910494804382324, 7.2931671142578125, 7.675839900970459, 8.058512687683105, 8.441184997558594, 8.823857307434082, 9.206530570983887, 9.589202880859375, 9.97187614440918, 10.354548454284668, 10.737220764160156, 11.119894027709961, 11.502567291259766]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 7.0, 6.0, 6.0, 7.0, 14.0, 8.0, 16.0, 22.0, 24.0, 45.0, 61.0, 107.0, 158.0, 238.0, 460.0, 946.0, 2851.0, 13529.0, 109013.0, 756723.0, 142450.0, 16247.0, 3388.0, 1077.0, 443.0, 238.0, 132.0, 99.0, 69.0, 51.0, 35.0, 22.0, 11.0, 8.0, 14.0, 10.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.853515625, -2.7569580078125, -2.660400390625, -2.5638427734375, -2.46728515625, -2.3707275390625, -2.274169921875, -2.1776123046875, -2.0810546875, -1.9844970703125, -1.887939453125, -1.7913818359375, -1.69482421875, -1.5982666015625, -1.501708984375, -1.4051513671875, -1.30859375, -1.2120361328125, -1.115478515625, -1.0189208984375, -0.92236328125, -0.8258056640625, -0.729248046875, -0.6326904296875, -0.5361328125, -0.4395751953125, -0.343017578125, -0.2464599609375, -0.14990234375, -0.0533447265625, 0.043212890625, 0.1397705078125, 0.236328125, 0.3328857421875, 0.429443359375, 0.5260009765625, 0.62255859375, 0.7191162109375, 0.815673828125, 0.9122314453125, 1.0087890625, 1.1053466796875, 1.201904296875, 1.2984619140625, 1.39501953125, 1.4915771484375, 1.588134765625, 1.6846923828125, 1.78125, 1.8778076171875, 1.974365234375, 2.0709228515625, 2.16748046875, 2.2640380859375, 2.360595703125, 2.4571533203125, 2.5537109375, 2.6502685546875, 2.746826171875, 2.8433837890625, 2.93994140625, 3.0364990234375, 3.133056640625, 3.2296142578125, 3.326171875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 16.0, 39.0, 69.0, 83.0, 96.0, 144.0, 135.0, 110.0, 110.0, 82.0, 57.0, 28.0, 9.0, 14.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.630859375, -1.5941162109375, -1.557373046875, -1.5206298828125, -1.48388671875, -1.4471435546875, -1.410400390625, -1.3736572265625, -1.3369140625, -1.3001708984375, -1.263427734375, -1.2266845703125, -1.18994140625, -1.1531982421875, -1.116455078125, -1.0797119140625, -1.04296875, -1.0062255859375, -0.969482421875, -0.9327392578125, -0.89599609375, -0.8592529296875, -0.822509765625, -0.7857666015625, -0.7490234375, -0.7122802734375, -0.675537109375, -0.6387939453125, -0.60205078125, -0.5653076171875, -0.528564453125, -0.4918212890625, -0.455078125, -0.4183349609375, -0.381591796875, -0.3448486328125, -0.30810546875, -0.2713623046875, -0.234619140625, -0.1978759765625, -0.1611328125, -0.1243896484375, -0.087646484375, -0.0509033203125, -0.01416015625, 0.0225830078125, 0.059326171875, 0.0960693359375, 0.1328125, 0.1695556640625, 0.206298828125, 0.2430419921875, 0.27978515625, 0.3165283203125, 0.353271484375, 0.3900146484375, 0.4267578125, 0.4635009765625, 0.500244140625, 0.5369873046875, 0.57373046875, 0.6104736328125, 0.647216796875, 0.6839599609375, 0.720703125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 3.0, 6.0, 5.0, 6.0, 8.0, 7.0, 14.0, 15.0, 24.0, 21.0, 30.0, 38.0, 48.0, 113.0, 163.0, 317.0, 605.0, 1263.0, 2622.0, 5878.0, 14161.0, 37566.0, 118598.0, 417280.0, 316550.0, 85016.0, 27894.0, 11026.0, 4776.0, 2123.0, 1061.0, 511.0, 286.0, 165.0, 104.0, 67.0, 38.0, 29.0, 24.0, 27.0, 19.0, 10.0, 12.0, 9.0, 8.0, 3.0, 6.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-1.27734375, -1.2384796142578125, -1.199615478515625, -1.1607513427734375, -1.12188720703125, -1.0830230712890625, -1.044158935546875, -1.0052947998046875, -0.9664306640625, -0.9275665283203125, -0.888702392578125, -0.8498382568359375, -0.81097412109375, -0.7721099853515625, -0.733245849609375, -0.6943817138671875, -0.655517578125, -0.6166534423828125, -0.577789306640625, -0.5389251708984375, -0.50006103515625, -0.4611968994140625, -0.422332763671875, -0.3834686279296875, -0.3446044921875, -0.3057403564453125, -0.266876220703125, -0.2280120849609375, -0.18914794921875, -0.1502838134765625, -0.111419677734375, -0.0725555419921875, -0.03369140625, 0.0051727294921875, 0.044036865234375, 0.0829010009765625, 0.12176513671875, 0.1606292724609375, 0.199493408203125, 0.2383575439453125, 0.2772216796875, 0.3160858154296875, 0.354949951171875, 0.3938140869140625, 0.43267822265625, 0.4715423583984375, 0.510406494140625, 0.5492706298828125, 0.588134765625, 0.6269989013671875, 0.665863037109375, 0.7047271728515625, 0.74359130859375, 0.7824554443359375, 0.821319580078125, 0.8601837158203125, 0.8990478515625, 0.9379119873046875, 0.976776123046875, 1.0156402587890625, 1.05450439453125, 1.0933685302734375, 1.132232666015625, 1.1710968017578125, 1.2099609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 3.0, 5.0, 7.0, 6.0, 13.0, 18.0, 16.0, 36.0, 24.0, 20.0, 24.0, 32.0, 29.0, 46.0, 45.0, 40.0, 47.0, 45.0, 47.0, 52.0, 49.0, 48.0, 38.0, 51.0, 40.0, 28.0, 23.0, 27.0, 21.0, 22.0, 16.0, 14.0, 17.0, 7.0, 7.0, 7.0, 4.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.83203125, -1.7748565673828125, -1.717681884765625, -1.6605072021484375, -1.60333251953125, -1.5461578369140625, -1.488983154296875, -1.4318084716796875, -1.3746337890625, -1.3174591064453125, -1.260284423828125, -1.2031097412109375, -1.14593505859375, -1.0887603759765625, -1.031585693359375, -0.9744110107421875, -0.917236328125, -0.8600616455078125, -0.802886962890625, -0.7457122802734375, -0.68853759765625, -0.6313629150390625, -0.574188232421875, -0.5170135498046875, -0.4598388671875, -0.4026641845703125, -0.345489501953125, -0.2883148193359375, -0.23114013671875, -0.1739654541015625, -0.116790771484375, -0.0596160888671875, -0.00244140625, 0.0547332763671875, 0.111907958984375, 0.1690826416015625, 0.22625732421875, 0.2834320068359375, 0.340606689453125, 0.3977813720703125, 0.4549560546875, 0.5121307373046875, 0.569305419921875, 0.6264801025390625, 0.68365478515625, 0.7408294677734375, 0.798004150390625, 0.8551788330078125, 0.912353515625, 0.9695281982421875, 1.026702880859375, 1.0838775634765625, 1.14105224609375, 1.1982269287109375, 1.255401611328125, 1.3125762939453125, 1.3697509765625, 1.4269256591796875, 1.484100341796875, 1.5412750244140625, 1.59844970703125, 1.6556243896484375, 1.712799072265625, 1.7699737548828125, 1.8271484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 8.0, 3.0, 9.0, 15.0, 19.0, 18.0, 25.0, 40.0, 56.0, 94.0, 150.0, 215.0, 354.0, 663.0, 1215.0, 2788.0, 6446.0, 18023.0, 71780.0, 481864.0, 381435.0, 57066.0, 15452.0, 5651.0, 2500.0, 1136.0, 617.0, 314.0, 206.0, 107.0, 73.0, 72.0, 44.0, 37.0, 13.0, 15.0, 10.0, 7.0, 6.0, 3.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.79345703125, -0.7660293579101562, -0.7386016845703125, -0.7111740112304688, -0.683746337890625, -0.6563186645507812, -0.6288909912109375, -0.6014633178710938, -0.57403564453125, -0.5466079711914062, -0.5191802978515625, -0.49175262451171875, -0.464324951171875, -0.43689727783203125, -0.4094696044921875, -0.38204193115234375, -0.3546142578125, -0.32718658447265625, -0.2997589111328125, -0.27233123779296875, -0.244903564453125, -0.21747589111328125, -0.1900482177734375, -0.16262054443359375, -0.13519287109375, -0.10776519775390625, -0.0803375244140625, -0.05290985107421875, -0.025482177734375, 0.00194549560546875, 0.0293731689453125, 0.05680084228515625, 0.084228515625, 0.11165618896484375, 0.1390838623046875, 0.16651153564453125, 0.193939208984375, 0.22136688232421875, 0.2487945556640625, 0.27622222900390625, 0.30364990234375, 0.33107757568359375, 0.3585052490234375, 0.38593292236328125, 0.413360595703125, 0.44078826904296875, 0.4682159423828125, 0.49564361572265625, 0.5230712890625, 0.5504989624023438, 0.5779266357421875, 0.6053543090820312, 0.632781982421875, 0.6602096557617188, 0.6876373291015625, 0.7150650024414062, 0.74249267578125, 0.7699203491210938, 0.7973480224609375, 0.8247756958007812, 0.852203369140625, 0.8796310424804688, 0.9070587158203125, 0.9344863891601562, 0.9619140625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 12.0, 9.0, 31.0, 32.0, 60.0, 88.0, 206.0, 246.0, 135.0, 57.0, 49.0, 19.0, 22.0, 15.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004286766052246094, -0.000416487455368042, -0.0004042983055114746, -0.0003921091556549072, -0.00037992000579833984, -0.00036773085594177246, -0.0003555417060852051, -0.0003433525562286377, -0.0003311634063720703, -0.00031897425651550293, -0.00030678510665893555, -0.00029459595680236816, -0.0002824068069458008, -0.0002702176570892334, -0.000258028507232666, -0.00024583935737609863, -0.00023365020751953125, -0.00022146105766296387, -0.00020927190780639648, -0.0001970827579498291, -0.00018489360809326172, -0.00017270445823669434, -0.00016051530838012695, -0.00014832615852355957, -0.0001361370086669922, -0.0001239478588104248, -0.00011175870895385742, -9.956955909729004e-05, -8.738040924072266e-05, -7.519125938415527e-05, -6.300210952758789e-05, -5.081295967102051e-05, -3.8623809814453125e-05, -2.6434659957885742e-05, -1.424551010131836e-05, -2.0563602447509766e-06, 1.0132789611816406e-05, 2.232193946838379e-05, 3.451108932495117e-05, 4.6700239181518555e-05, 5.888938903808594e-05, 7.107853889465332e-05, 8.32676887512207e-05, 9.545683860778809e-05, 0.00010764598846435547, 0.00011983513832092285, 0.00013202428817749023, 0.00014421343803405762, 0.000156402587890625, 0.00016859173774719238, 0.00018078088760375977, 0.00019297003746032715, 0.00020515918731689453, 0.00021734833717346191, 0.0002295374870300293, 0.00024172663688659668, 0.00025391578674316406, 0.00026610493659973145, 0.00027829408645629883, 0.0002904832363128662, 0.0003026723861694336, 0.000314861536026001, 0.00032705068588256836, 0.00033923983573913574, 0.0003514289855957031]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 5.0, 15.0, 24.0, 42.0, 56.0, 84.0, 185.0, 416.0, 843.0, 2026.0, 5914.0, 25157.0, 253649.0, 686537.0, 57966.0, 10190.0, 3147.0, 1250.0, 511.0, 253.0, 126.0, 56.0, 34.0, 23.0, 15.0, 6.0, 6.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.00738525390625, -0.9639892578125, -0.92059326171875, -0.877197265625, -0.83380126953125, -0.7904052734375, -0.74700927734375, -0.70361328125, -0.66021728515625, -0.6168212890625, -0.57342529296875, -0.530029296875, -0.48663330078125, -0.4432373046875, -0.39984130859375, -0.3564453125, -0.31304931640625, -0.2696533203125, -0.22625732421875, -0.182861328125, -0.13946533203125, -0.0960693359375, -0.05267333984375, -0.00927734375, 0.03411865234375, 0.0775146484375, 0.12091064453125, 0.164306640625, 0.20770263671875, 0.2510986328125, 0.29449462890625, 0.337890625, 0.38128662109375, 0.4246826171875, 0.46807861328125, 0.511474609375, 0.55487060546875, 0.5982666015625, 0.64166259765625, 0.68505859375, 0.72845458984375, 0.7718505859375, 0.81524658203125, 0.858642578125, 0.90203857421875, 0.9454345703125, 0.98883056640625, 1.0322265625, 1.07562255859375, 1.1190185546875, 1.16241455078125, 1.205810546875, 1.24920654296875, 1.2926025390625, 1.33599853515625, 1.37939453125, 1.42279052734375, 1.4661865234375, 1.50958251953125, 1.552978515625, 1.59637451171875, 1.6397705078125, 1.68316650390625, 1.7265625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 6.0, 7.0, 10.0, 12.0, 27.0, 36.0, 67.0, 80.0, 109.0, 144.0, 119.0, 100.0, 82.0, 61.0, 46.0, 25.0, 17.0, 12.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88623046875, -0.8558883666992188, -0.8255462646484375, -0.7952041625976562, -0.764862060546875, -0.7345199584960938, -0.7041778564453125, -0.6738357543945312, -0.64349365234375, -0.6131515502929688, -0.5828094482421875, -0.5524673461914062, -0.522125244140625, -0.49178314208984375, -0.4614410400390625, -0.43109893798828125, -0.4007568359375, -0.37041473388671875, -0.3400726318359375, -0.30973052978515625, -0.279388427734375, -0.24904632568359375, -0.2187042236328125, -0.18836212158203125, -0.15802001953125, -0.12767791748046875, -0.0973358154296875, -0.06699371337890625, -0.036651611328125, -0.00630950927734375, 0.0240325927734375, 0.05437469482421875, 0.084716796875, 0.11505889892578125, 0.1454010009765625, 0.17574310302734375, 0.206085205078125, 0.23642730712890625, 0.2667694091796875, 0.29711151123046875, 0.32745361328125, 0.35779571533203125, 0.3881378173828125, 0.41847991943359375, 0.448822021484375, 0.47916412353515625, 0.5095062255859375, 0.5398483276367188, 0.5701904296875, 0.6005325317382812, 0.6308746337890625, 0.6612167358398438, 0.691558837890625, 0.7219009399414062, 0.7522430419921875, 0.7825851440429688, 0.81292724609375, 0.8432693481445312, 0.8736114501953125, 0.9039535522460938, 0.934295654296875, 0.9646377563476562, 0.9949798583984375, 1.0253219604492188, 1.0556640625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 25.0, 68.0, 235.0, 440.0, 179.0, 43.0, 16.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.55865478515625, -44.59474563598633, -43.630836486816406, -42.666927337646484, -41.70301818847656, -40.73910903930664, -39.77519989013672, -38.8112907409668, -37.847381591796875, -36.88347244262695, -35.91956329345703, -34.95565414428711, -33.99174499511719, -33.027835845947266, -32.063926696777344, -31.100017547607422, -30.1361083984375, -29.172199249267578, -28.208290100097656, -27.244380950927734, -26.280471801757812, -25.31656265258789, -24.35265350341797, -23.388744354248047, -22.424835205078125, -21.460926055908203, -20.49701690673828, -19.53310775756836, -18.569198608398438, -17.605289459228516, -16.641380310058594, -15.677471160888672, -14.713560104370117, -13.749650955200195, -12.785741806030273, -11.821832656860352, -10.85792350769043, -9.894014358520508, -8.930105209350586, -7.966196060180664, -7.002286911010742, -6.03837776184082, -5.074468612670898, -4.110559463500977, -3.1466503143310547, -2.182741165161133, -1.218832015991211, -0.25492286682128906, 0.7089862823486328, 1.6728954315185547, 2.6368045806884766, 3.6007137298583984, 4.56462287902832, 5.528532028198242, 6.492441177368164, 7.456350326538086, 8.420259475708008, 9.38416862487793, 10.348077774047852, 11.311986923217773, 12.275896072387695, 13.239805221557617, 14.203714370727539, 15.167623519897461, 16.131532669067383]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 7.0, 6.0, 8.0, 17.0, 22.0, 19.0, 16.0, 21.0, 24.0, 33.0, 43.0, 28.0, 48.0, 47.0, 40.0, 35.0, 44.0, 46.0, 59.0, 40.0, 56.0, 38.0, 44.0, 32.0, 38.0, 29.0, 30.0, 31.0, 20.0, 9.0, 13.0, 13.0, 12.0, 4.0, 4.0, 7.0, 7.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.683826446533203, -11.341886520385742, -10.999945640563965, -10.658005714416504, -10.316064834594727, -9.974124908447266, -9.632184982299805, -9.290244102478027, -8.94830322265625, -8.606363296508789, -8.264422416687012, -7.922482490539551, -7.580541610717773, -7.2386016845703125, -6.896661281585693, -6.554720878601074, -6.212780952453613, -5.870840549468994, -5.528900146484375, -5.186960220336914, -4.845019340515137, -4.503079414367676, -4.161139011383057, -3.8191986083984375, -3.4772582054138184, -3.135317802429199, -2.79337739944458, -2.45143723487854, -2.109496831893921, -1.7675564289093018, -1.4256162643432617, -1.0836758613586426, -0.7417354583740234, -0.3997951149940491, -0.05785477161407471, 0.2840855121612549, 0.626025915145874, 0.9679663181304932, 1.3099064826965332, 1.6518468856811523, 1.9937872886657715, 2.3357276916503906, 2.6776680946350098, 3.01960825920105, 3.361548662185669, 3.703489065170288, 4.045429229736328, 4.387369632720947, 4.729310035705566, 5.0712504386901855, 5.413190841674805, 5.755130767822266, 6.097071647644043, 6.439011573791504, 6.780951976776123, 7.122892379760742, 7.464832782745361, 7.8067731857299805, 8.148713111877441, 8.490653991699219, 8.83259391784668, 9.174534797668457, 9.516474723815918, 9.858415603637695, 10.200355529785156]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 7.0, 7.0, 12.0, 14.0, 17.0, 27.0, 29.0, 53.0, 79.0, 115.0, 260.0, 594.0, 2170.0, 10669.0, 196800.0, 3957790.0, 20591.0, 3399.0, 910.0, 333.0, 156.0, 88.0, 48.0, 34.0, 18.0, 9.0, 13.0, 7.0, 4.0, 4.0, 7.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.72064208984375, -4.5936279296875, -4.46661376953125, -4.339599609375, -4.21258544921875, -4.0855712890625, -3.95855712890625, -3.83154296875, -3.70452880859375, -3.5775146484375, -3.45050048828125, -3.323486328125, -3.19647216796875, -3.0694580078125, -2.94244384765625, -2.8154296875, -2.68841552734375, -2.5614013671875, -2.43438720703125, -2.307373046875, -2.18035888671875, -2.0533447265625, -1.92633056640625, -1.79931640625, -1.67230224609375, -1.5452880859375, -1.41827392578125, -1.291259765625, -1.16424560546875, -1.0372314453125, -0.91021728515625, -0.783203125, -0.65618896484375, -0.5291748046875, -0.40216064453125, -0.275146484375, -0.14813232421875, -0.0211181640625, 0.10589599609375, 0.23291015625, 0.35992431640625, 0.4869384765625, 0.61395263671875, 0.740966796875, 0.86798095703125, 0.9949951171875, 1.12200927734375, 1.2490234375, 1.37603759765625, 1.5030517578125, 1.63006591796875, 1.757080078125, 1.88409423828125, 2.0111083984375, 2.13812255859375, 2.26513671875, 2.39215087890625, 2.5191650390625, 2.64617919921875, 2.773193359375, 2.90020751953125, 3.0272216796875, 3.15423583984375, 3.28125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 16.0, 19.0, 32.0, 59.0, 71.0, 107.0, 119.0, 108.0, 102.0, 111.0, 94.0, 69.0, 47.0, 27.0, 5.0, 5.0, 6.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.625, -1.5894317626953125, -1.553863525390625, -1.5182952880859375, -1.48272705078125, -1.4471588134765625, -1.411590576171875, -1.3760223388671875, -1.3404541015625, -1.3048858642578125, -1.269317626953125, -1.2337493896484375, -1.19818115234375, -1.1626129150390625, -1.127044677734375, -1.0914764404296875, -1.055908203125, -1.0203399658203125, -0.984771728515625, -0.9492034912109375, -0.91363525390625, -0.8780670166015625, -0.842498779296875, -0.8069305419921875, -0.7713623046875, -0.7357940673828125, -0.700225830078125, -0.6646575927734375, -0.62908935546875, -0.5935211181640625, -0.557952880859375, -0.5223846435546875, -0.48681640625, -0.4512481689453125, -0.415679931640625, -0.3801116943359375, -0.34454345703125, -0.3089752197265625, -0.273406982421875, -0.2378387451171875, -0.2022705078125, -0.1667022705078125, -0.131134033203125, -0.0955657958984375, -0.05999755859375, -0.0244293212890625, 0.011138916015625, 0.0467071533203125, 0.082275390625, 0.1178436279296875, 0.153411865234375, 0.1889801025390625, 0.22454833984375, 0.2601165771484375, 0.295684814453125, 0.3312530517578125, 0.3668212890625, 0.4023895263671875, 0.437957763671875, 0.4735260009765625, 0.50909423828125, 0.5446624755859375, 0.580230712890625, 0.6157989501953125, 0.6513671875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 4.0, 12.0, 20.0, 25.0, 44.0, 62.0, 103.0, 179.0, 832.0, 10789.0, 4129143.0, 50494.0, 1831.0, 316.0, 150.0, 111.0, 67.0, 40.0, 20.0, 22.0, 11.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.224609375, -3.005035400390625, -2.78546142578125, -2.565887451171875, -2.3463134765625, -2.126739501953125, -1.90716552734375, -1.687591552734375, -1.468017578125, -1.248443603515625, -1.02886962890625, -0.809295654296875, -0.5897216796875, -0.370147705078125, -0.15057373046875, 0.069000244140625, 0.28857421875, 0.508148193359375, 0.72772216796875, 0.947296142578125, 1.1668701171875, 1.386444091796875, 1.60601806640625, 1.825592041015625, 2.045166015625, 2.264739990234375, 2.48431396484375, 2.703887939453125, 2.9234619140625, 3.143035888671875, 3.36260986328125, 3.582183837890625, 3.8017578125, 4.021331787109375, 4.24090576171875, 4.460479736328125, 4.6800537109375, 4.899627685546875, 5.11920166015625, 5.338775634765625, 5.558349609375, 5.777923583984375, 5.99749755859375, 6.217071533203125, 6.4366455078125, 6.656219482421875, 6.87579345703125, 7.095367431640625, 7.31494140625, 7.534515380859375, 7.75408935546875, 7.973663330078125, 8.1932373046875, 8.412811279296875, 8.63238525390625, 8.851959228515625, 9.071533203125, 9.291107177734375, 9.51068115234375, 9.730255126953125, 9.9498291015625, 10.169403076171875, 10.38897705078125, 10.608551025390625, 10.828125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 7.0, 8.0, 10.0, 25.0, 68.0, 229.0, 3060.0, 479.0, 93.0, 42.0, 20.0, 19.0, 10.0, 3.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68310546875, -0.6365432739257812, -0.5899810791015625, -0.5434188842773438, -0.496856689453125, -0.45029449462890625, -0.4037322998046875, -0.35717010498046875, -0.31060791015625, -0.26404571533203125, -0.2174835205078125, -0.17092132568359375, -0.124359130859375, -0.07779693603515625, -0.0312347412109375, 0.01532745361328125, 0.0618896484375, 0.10845184326171875, 0.1550140380859375, 0.20157623291015625, 0.248138427734375, 0.29470062255859375, 0.3412628173828125, 0.38782501220703125, 0.43438720703125, 0.48094940185546875, 0.5275115966796875, 0.5740737915039062, 0.620635986328125, 0.6671981811523438, 0.7137603759765625, 0.7603225708007812, 0.806884765625, 0.8534469604492188, 0.9000091552734375, 0.9465713500976562, 0.993133544921875, 1.0396957397460938, 1.0862579345703125, 1.1328201293945312, 1.17938232421875, 1.2259445190429688, 1.2725067138671875, 1.3190689086914062, 1.365631103515625, 1.4121932983398438, 1.4587554931640625, 1.5053176879882812, 1.5518798828125, 1.5984420776367188, 1.6450042724609375, 1.6915664672851562, 1.738128662109375, 1.7846908569335938, 1.8312530517578125, 1.8778152465820312, 1.92437744140625, 1.9709396362304688, 2.0175018310546875, 2.0640640258789062, 2.110626220703125, 2.1571884155273438, 2.2037506103515625, 2.2503128051757812, 2.296875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 22.0, 89.0, 305.0, 334.0, 160.0, 62.0, 20.0, 8.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.603825569152832, -6.2742085456848145, -5.944591522216797, -5.614974498748779, -5.285357475280762, -4.955740451812744, -4.626123428344727, -4.296506404876709, -3.9668893814086914, -3.637272357940674, -3.3076553344726562, -2.9780383110046387, -2.648421287536621, -2.3188042640686035, -1.989187240600586, -1.6595702171325684, -1.3299531936645508, -1.0003361701965332, -0.6707191467285156, -0.34110212326049805, -0.011485099792480469, 0.3181319236755371, 0.6477489471435547, 0.9773659706115723, 1.3069829940795898, 1.6366000175476074, 1.966217041015625, 2.2958340644836426, 2.62545108795166, 2.9550681114196777, 3.2846851348876953, 3.614302158355713, 3.943918228149414, 4.273535251617432, 4.603152275085449, 4.932769298553467, 5.262386322021484, 5.592003345489502, 5.9216203689575195, 6.251237392425537, 6.580854415893555, 6.910471439361572, 7.24008846282959, 7.569705486297607, 7.899322509765625, 8.228939056396484, 8.55855655670166, 8.888174057006836, 9.217790603637695, 9.547407150268555, 9.87702465057373, 10.206642150878906, 10.536258697509766, 10.865875244140625, 11.1954927444458, 11.525110244750977, 11.854726791381836, 12.184343338012695, 12.513960838317871, 12.843578338623047, 13.173194885253906, 13.502811431884766, 13.832428932189941, 14.162046432495117, 14.491662979125977]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 3.0, 11.0, 13.0, 14.0, 22.0, 43.0, 42.0, 48.0, 69.0, 65.0, 84.0, 76.0, 75.0, 80.0, 64.0, 64.0, 53.0, 47.0, 31.0, 27.0, 21.0, 21.0, 11.0, 9.0, 5.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.327057361602783, -3.1848394870758057, -3.042621612548828, -2.9004037380218506, -2.758185863494873, -2.6159679889678955, -2.473750114440918, -2.3315322399139404, -2.189314365386963, -2.0470964908599854, -1.9048786163330078, -1.7626607418060303, -1.6204428672790527, -1.4782249927520752, -1.3360071182250977, -1.1937892436981201, -1.0515713691711426, -0.909353494644165, -0.7671356201171875, -0.62491774559021, -0.4826998710632324, -0.3404819965362549, -0.19826412200927734, -0.056046247482299805, 0.08617162704467773, 0.22838950157165527, 0.3706073760986328, 0.5128252506256104, 0.6550431251525879, 0.7972609996795654, 0.939478874206543, 1.0816967487335205, 1.2239151000976562, 1.3661329746246338, 1.5083508491516113, 1.6505687236785889, 1.7927865982055664, 1.935004472732544, 2.0772223472595215, 2.219440221786499, 2.3616580963134766, 2.503875970840454, 2.6460938453674316, 2.788311719894409, 2.9305295944213867, 3.0727474689483643, 3.214965343475342, 3.3571832180023193, 3.499401092529297, 3.6416189670562744, 3.783836841583252, 3.9260547161102295, 4.068272590637207, 4.2104902267456055, 4.352708339691162, 4.494926452636719, 4.637144088745117, 4.779361724853516, 4.921579837799072, 5.063797950744629, 5.206015586853027, 5.348233222961426, 5.490451335906982, 5.632669448852539, 5.7748870849609375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 9.0, 7.0, 19.0, 17.0, 24.0, 43.0, 83.0, 129.0, 266.0, 696.0, 2266.0, 10709.0, 85363.0, 780939.0, 147612.0, 15814.0, 3022.0, 832.0, 309.0, 153.0, 77.0, 60.0, 28.0, 29.0, 13.0, 9.0, 10.0, 3.0, 7.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.471466064453125, -2.36676025390625, -2.262054443359375, -2.1573486328125, -2.052642822265625, -1.94793701171875, -1.843231201171875, -1.738525390625, -1.633819580078125, -1.52911376953125, -1.424407958984375, -1.3197021484375, -1.214996337890625, -1.11029052734375, -1.005584716796875, -0.90087890625, -0.796173095703125, -0.69146728515625, -0.586761474609375, -0.4820556640625, -0.377349853515625, -0.27264404296875, -0.167938232421875, -0.063232421875, 0.041473388671875, 0.14617919921875, 0.250885009765625, 0.3555908203125, 0.460296630859375, 0.56500244140625, 0.669708251953125, 0.7744140625, 0.879119873046875, 0.98382568359375, 1.088531494140625, 1.1932373046875, 1.297943115234375, 1.40264892578125, 1.507354736328125, 1.612060546875, 1.716766357421875, 1.82147216796875, 1.926177978515625, 2.0308837890625, 2.135589599609375, 2.24029541015625, 2.345001220703125, 2.44970703125, 2.554412841796875, 2.65911865234375, 2.763824462890625, 2.8685302734375, 2.973236083984375, 3.07794189453125, 3.182647705078125, 3.287353515625, 3.392059326171875, 3.49676513671875, 3.601470947265625, 3.7061767578125, 3.810882568359375, 3.91558837890625, 4.020294189453125, 4.125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 10.0, 7.0, 25.0, 29.0, 45.0, 64.0, 68.0, 89.0, 99.0, 91.0, 118.0, 81.0, 73.0, 77.0, 46.0, 36.0, 18.0, 11.0, 9.0, 0.0, 4.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.361328125, -1.3308029174804688, -1.3002777099609375, -1.2697525024414062, -1.239227294921875, -1.2087020874023438, -1.1781768798828125, -1.1476516723632812, -1.11712646484375, -1.0866012573242188, -1.0560760498046875, -1.0255508422851562, -0.995025634765625, -0.9645004272460938, -0.9339752197265625, -0.9034500122070312, -0.8729248046875, -0.8423995971679688, -0.8118743896484375, -0.7813491821289062, -0.750823974609375, -0.7202987670898438, -0.6897735595703125, -0.6592483520507812, -0.62872314453125, -0.5981979370117188, -0.5676727294921875, -0.5371475219726562, -0.506622314453125, -0.47609710693359375, -0.4455718994140625, -0.41504669189453125, -0.384521484375, -0.35399627685546875, -0.3234710693359375, -0.29294586181640625, -0.262420654296875, -0.23189544677734375, -0.2013702392578125, -0.17084503173828125, -0.14031982421875, -0.10979461669921875, -0.0792694091796875, -0.04874420166015625, -0.018218994140625, 0.01230621337890625, 0.0428314208984375, 0.07335662841796875, 0.1038818359375, 0.13440704345703125, 0.1649322509765625, 0.19545745849609375, 0.225982666015625, 0.25650787353515625, 0.2870330810546875, 0.31755828857421875, 0.34808349609375, 0.37860870361328125, 0.4091339111328125, 0.43965911865234375, 0.470184326171875, 0.5007095336914062, 0.5312347412109375, 0.5617599487304688, 0.59228515625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 10.0, 9.0, 13.0, 22.0, 22.0, 40.0, 80.0, 143.0, 235.0, 508.0, 1243.0, 3151.0, 8399.0, 26891.0, 124451.0, 644572.0, 186303.0, 35493.0, 10295.0, 3806.0, 1487.0, 607.0, 338.0, 173.0, 84.0, 45.0, 32.0, 23.0, 13.0, 9.0, 10.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9580078125, -1.8940277099609375, -1.830047607421875, -1.7660675048828125, -1.70208740234375, -1.6381072998046875, -1.574127197265625, -1.5101470947265625, -1.4461669921875, -1.3821868896484375, -1.318206787109375, -1.2542266845703125, -1.19024658203125, -1.1262664794921875, -1.062286376953125, -0.9983062744140625, -0.934326171875, -0.8703460693359375, -0.806365966796875, -0.7423858642578125, -0.67840576171875, -0.6144256591796875, -0.550445556640625, -0.4864654541015625, -0.4224853515625, -0.3585052490234375, -0.294525146484375, -0.2305450439453125, -0.16656494140625, -0.1025848388671875, -0.038604736328125, 0.0253753662109375, 0.08935546875, 0.1533355712890625, 0.217315673828125, 0.2812957763671875, 0.34527587890625, 0.4092559814453125, 0.473236083984375, 0.5372161865234375, 0.6011962890625, 0.6651763916015625, 0.729156494140625, 0.7931365966796875, 0.85711669921875, 0.9210968017578125, 0.985076904296875, 1.0490570068359375, 1.113037109375, 1.1770172119140625, 1.240997314453125, 1.3049774169921875, 1.36895751953125, 1.4329376220703125, 1.496917724609375, 1.5608978271484375, 1.6248779296875, 1.6888580322265625, 1.752838134765625, 1.8168182373046875, 1.88079833984375, 1.9447784423828125, 2.008758544921875, 2.0727386474609375, 2.13671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 4.0, 10.0, 11.0, 8.0, 11.0, 13.0, 14.0, 30.0, 30.0, 38.0, 47.0, 30.0, 47.0, 49.0, 55.0, 59.0, 70.0, 61.0, 39.0, 55.0, 45.0, 41.0, 50.0, 32.0, 36.0, 24.0, 28.0, 16.0, 15.0, 12.0, 7.0, 2.0, 6.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.96466064453125, -1.8863525390625, -1.80804443359375, -1.729736328125, -1.65142822265625, -1.5731201171875, -1.49481201171875, -1.41650390625, -1.33819580078125, -1.2598876953125, -1.18157958984375, -1.103271484375, -1.02496337890625, -0.9466552734375, -0.86834716796875, -0.7900390625, -0.71173095703125, -0.6334228515625, -0.55511474609375, -0.476806640625, -0.39849853515625, -0.3201904296875, -0.24188232421875, -0.16357421875, -0.08526611328125, -0.0069580078125, 0.07135009765625, 0.149658203125, 0.22796630859375, 0.3062744140625, 0.38458251953125, 0.462890625, 0.54119873046875, 0.6195068359375, 0.69781494140625, 0.776123046875, 0.85443115234375, 0.9327392578125, 1.01104736328125, 1.08935546875, 1.16766357421875, 1.2459716796875, 1.32427978515625, 1.402587890625, 1.48089599609375, 1.5592041015625, 1.63751220703125, 1.7158203125, 1.79412841796875, 1.8724365234375, 1.95074462890625, 2.029052734375, 2.10736083984375, 2.1856689453125, 2.26397705078125, 2.34228515625, 2.42059326171875, 2.4989013671875, 2.57720947265625, 2.655517578125, 2.73382568359375, 2.8121337890625, 2.89044189453125, 2.96875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 6.0, 3.0, 18.0, 18.0, 28.0, 35.0, 51.0, 79.0, 145.0, 195.0, 292.0, 592.0, 1151.0, 2244.0, 5259.0, 14951.0, 67772.0, 674813.0, 233042.0, 31745.0, 8976.0, 3490.0, 1625.0, 830.0, 441.0, 271.0, 172.0, 93.0, 69.0, 48.0, 21.0, 19.0, 18.0, 15.0, 7.0, 7.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5732421875, -1.529266357421875, -1.48529052734375, -1.441314697265625, -1.3973388671875, -1.353363037109375, -1.30938720703125, -1.265411376953125, -1.221435546875, -1.177459716796875, -1.13348388671875, -1.089508056640625, -1.0455322265625, -1.001556396484375, -0.95758056640625, -0.913604736328125, -0.86962890625, -0.825653076171875, -0.78167724609375, -0.737701416015625, -0.6937255859375, -0.649749755859375, -0.60577392578125, -0.561798095703125, -0.517822265625, -0.473846435546875, -0.42987060546875, -0.385894775390625, -0.3419189453125, -0.297943115234375, -0.25396728515625, -0.209991455078125, -0.166015625, -0.122039794921875, -0.07806396484375, -0.034088134765625, 0.0098876953125, 0.053863525390625, 0.09783935546875, 0.141815185546875, 0.185791015625, 0.229766845703125, 0.27374267578125, 0.317718505859375, 0.3616943359375, 0.405670166015625, 0.44964599609375, 0.493621826171875, 0.53759765625, 0.581573486328125, 0.62554931640625, 0.669525146484375, 0.7135009765625, 0.757476806640625, 0.80145263671875, 0.845428466796875, 0.889404296875, 0.933380126953125, 0.97735595703125, 1.021331787109375, 1.0653076171875, 1.109283447265625, 1.15325927734375, 1.197235107421875, 1.2412109375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 8.0, 8.0, 17.0, 23.0, 26.0, 49.0, 57.0, 96.0, 191.0, 188.0, 89.0, 51.0, 42.0, 42.0, 23.0, 16.0, 18.0, 12.0, 9.0, 5.0, 2.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00036072731018066406, -0.0003509595990180969, -0.0003411918878555298, -0.00033142417669296265, -0.0003216564655303955, -0.00031188875436782837, -0.00030212104320526123, -0.0002923533320426941, -0.00028258562088012695, -0.0002728179097175598, -0.0002630501985549927, -0.00025328248739242554, -0.0002435147762298584, -0.00023374706506729126, -0.00022397935390472412, -0.00021421164274215698, -0.00020444393157958984, -0.0001946762204170227, -0.00018490850925445557, -0.00017514079809188843, -0.0001653730869293213, -0.00015560537576675415, -0.000145837664604187, -0.00013606995344161987, -0.00012630224227905273, -0.0001165345311164856, -0.00010676681995391846, -9.699910879135132e-05, -8.723139762878418e-05, -7.746368646621704e-05, -6.76959753036499e-05, -5.7928264141082764e-05, -4.8160552978515625e-05, -3.8392841815948486e-05, -2.8625130653381348e-05, -1.885741949081421e-05, -9.08970832824707e-06, 6.780028343200684e-07, 1.0445713996887207e-05, 2.0213425159454346e-05, 2.9981136322021484e-05, 3.974884748458862e-05, 4.951655864715576e-05, 5.92842698097229e-05, 6.905198097229004e-05, 7.881969213485718e-05, 8.858740329742432e-05, 9.835511445999146e-05, 0.0001081228256225586, 0.00011789053678512573, 0.00012765824794769287, 0.00013742595911026, 0.00014719367027282715, 0.0001569613814353943, 0.00016672909259796143, 0.00017649680376052856, 0.0001862645149230957, 0.00019603222608566284, 0.00020579993724822998, 0.00021556764841079712, 0.00022533535957336426, 0.0002351030707359314, 0.00024487078189849854, 0.0002546384930610657, 0.0002644062042236328]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 10.0, 21.0, 24.0, 41.0, 92.0, 172.0, 336.0, 813.0, 2260.0, 6865.0, 30144.0, 443537.0, 519536.0, 33293.0, 7642.0, 2225.0, 849.0, 333.0, 158.0, 71.0, 53.0, 31.0, 13.0, 9.0, 9.0, 9.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.14208984375, -2.0751953125, -2.00830078125, -1.94140625, -1.87451171875, -1.8076171875, -1.74072265625, -1.673828125, -1.60693359375, -1.5400390625, -1.47314453125, -1.40625, -1.33935546875, -1.2724609375, -1.20556640625, -1.138671875, -1.07177734375, -1.0048828125, -0.93798828125, -0.87109375, -0.80419921875, -0.7373046875, -0.67041015625, -0.603515625, -0.53662109375, -0.4697265625, -0.40283203125, -0.3359375, -0.26904296875, -0.2021484375, -0.13525390625, -0.068359375, -0.00146484375, 0.0654296875, 0.13232421875, 0.19921875, 0.26611328125, 0.3330078125, 0.39990234375, 0.466796875, 0.53369140625, 0.6005859375, 0.66748046875, 0.734375, 0.80126953125, 0.8681640625, 0.93505859375, 1.001953125, 1.06884765625, 1.1357421875, 1.20263671875, 1.26953125, 1.33642578125, 1.4033203125, 1.47021484375, 1.537109375, 1.60400390625, 1.6708984375, 1.73779296875, 1.8046875, 1.87158203125, 1.9384765625, 2.00537109375, 2.072265625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 13.0, 7.0, 13.0, 16.0, 21.0, 32.0, 39.0, 87.0, 92.0, 150.0, 162.0, 109.0, 73.0, 48.0, 40.0, 24.0, 19.0, 12.0, 14.0, 11.0, 7.0, 8.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.611328125, -1.5677490234375, -1.524169921875, -1.4805908203125, -1.43701171875, -1.3934326171875, -1.349853515625, -1.3062744140625, -1.2626953125, -1.2191162109375, -1.175537109375, -1.1319580078125, -1.08837890625, -1.0447998046875, -1.001220703125, -0.9576416015625, -0.9140625, -0.8704833984375, -0.826904296875, -0.7833251953125, -0.73974609375, -0.6961669921875, -0.652587890625, -0.6090087890625, -0.5654296875, -0.5218505859375, -0.478271484375, -0.4346923828125, -0.39111328125, -0.3475341796875, -0.303955078125, -0.2603759765625, -0.216796875, -0.1732177734375, -0.129638671875, -0.0860595703125, -0.04248046875, 0.0010986328125, 0.044677734375, 0.0882568359375, 0.1318359375, 0.1754150390625, 0.218994140625, 0.2625732421875, 0.30615234375, 0.3497314453125, 0.393310546875, 0.4368896484375, 0.48046875, 0.5240478515625, 0.567626953125, 0.6112060546875, 0.65478515625, 0.6983642578125, 0.741943359375, 0.7855224609375, 0.8291015625, 0.8726806640625, 0.916259765625, 0.9598388671875, 1.00341796875, 1.0469970703125, 1.090576171875, 1.1341552734375, 1.177734375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 12.0, 26.0, 39.0, 70.0, 115.0, 199.0, 192.0, 131.0, 89.0, 51.0, 36.0, 22.0, 9.0, 4.0, 3.0, 4.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.77408504486084, -14.223430633544922, -13.672775268554688, -13.12212085723877, -12.571466445922852, -12.020811080932617, -11.4701566696167, -10.919502258300781, -10.368846893310547, -9.818192481994629, -9.267537117004395, -8.716882705688477, -8.166228294372559, -7.615573406219482, -7.064918518066406, -6.514264106750488, -5.96360969543457, -5.412954807281494, -4.862300395965576, -4.3116455078125, -3.760990858078003, -3.210336208343506, -2.6596813201904297, -2.1090266704559326, -1.5583720207214355, -1.0077173709869385, -0.45706260204315186, 0.09359216690063477, 0.6442468166351318, 1.194901466369629, 1.745556354522705, 2.296211004257202, 2.8468666076660156, 3.3975212574005127, 3.9481759071350098, 4.498830795288086, 5.049485206604004, 5.60014009475708, 6.150794982910156, 6.701449394226074, 7.25210428237915, 7.802759170532227, 8.353413581848145, 8.904067993164062, 9.454723358154297, 10.005377769470215, 10.556032180786133, 11.106687545776367, 11.657341957092285, 12.207996368408203, 12.758651733398438, 13.309306144714355, 13.859960556030273, 14.410615921020508, 14.961270332336426, 15.511924743652344, 16.062580108642578, 16.613235473632812, 17.163888931274414, 17.71454429626465, 18.265199661254883, 18.815853118896484, 19.36650848388672, 19.917163848876953, 20.467817306518555]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 9.0, 13.0, 10.0, 17.0, 24.0, 20.0, 32.0, 27.0, 42.0, 52.0, 64.0, 68.0, 61.0, 63.0, 46.0, 70.0, 56.0, 58.0, 44.0, 36.0, 44.0, 26.0, 29.0, 25.0, 20.0, 12.0, 16.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.967788696289062, -14.452939987182617, -13.938092231750488, -13.423243522644043, -12.908395767211914, -12.393547058105469, -11.878698348999023, -11.363850593566895, -10.849002838134766, -10.33415412902832, -9.819306373596191, -9.304457664489746, -8.789609909057617, -8.274761199951172, -7.759912967681885, -7.245064735412598, -6.730216026306152, -6.215367794036865, -5.700519561767578, -5.185670852661133, -4.670823097229004, -4.155974388122559, -3.6411261558532715, -3.1262779235839844, -2.6114296913146973, -2.09658145904541, -1.5817331075668335, -1.0668847560882568, -0.5520365238189697, -0.03718829154968262, 0.4776601791381836, 0.9925084114074707, 1.5073566436767578, 2.022204875946045, 2.537053108215332, 3.0519015789031982, 3.5667498111724854, 4.081598281860352, 4.596446514129639, 5.111294746398926, 5.626142978668213, 6.1409912109375, 6.655839443206787, 7.170687675476074, 7.6855363845825195, 8.200384140014648, 8.715232849121094, 9.230081558227539, 9.744929313659668, 10.259778022766113, 10.774625778198242, 11.289474487304688, 11.804322242736816, 12.319170951843262, 12.83401870727539, 13.348867416381836, 13.863716125488281, 14.378564834594727, 14.893412590026855, 15.4082612991333, 15.92310905456543, 16.437957763671875, 16.95280647277832, 17.467655181884766, 17.982501983642578]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 12.0, 13.0, 11.0, 26.0, 46.0, 79.0, 155.0, 265.0, 612.0, 1729.0, 6494.0, 54550.0, 4093707.0, 29534.0, 4703.0, 1328.0, 487.0, 257.0, 124.0, 56.0, 30.0, 28.0, 11.0, 8.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.40625, -7.21826171875, -7.0302734375, -6.84228515625, -6.654296875, -6.46630859375, -6.2783203125, -6.09033203125, -5.90234375, -5.71435546875, -5.5263671875, -5.33837890625, -5.150390625, -4.96240234375, -4.7744140625, -4.58642578125, -4.3984375, -4.21044921875, -4.0224609375, -3.83447265625, -3.646484375, -3.45849609375, -3.2705078125, -3.08251953125, -2.89453125, -2.70654296875, -2.5185546875, -2.33056640625, -2.142578125, -1.95458984375, -1.7666015625, -1.57861328125, -1.390625, -1.20263671875, -1.0146484375, -0.82666015625, -0.638671875, -0.45068359375, -0.2626953125, -0.07470703125, 0.11328125, 0.30126953125, 0.4892578125, 0.67724609375, 0.865234375, 1.05322265625, 1.2412109375, 1.42919921875, 1.6171875, 1.80517578125, 1.9931640625, 2.18115234375, 2.369140625, 2.55712890625, 2.7451171875, 2.93310546875, 3.12109375, 3.30908203125, 3.4970703125, 3.68505859375, 3.873046875, 4.06103515625, 4.2490234375, 4.43701171875, 4.625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 16.0, 14.0, 29.0, 31.0, 37.0, 50.0, 67.0, 59.0, 89.0, 84.0, 91.0, 79.0, 73.0, 71.0, 48.0, 43.0, 42.0, 28.0, 20.0, 13.0, 4.0, 3.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.353515625, -1.3221664428710938, -1.2908172607421875, -1.2594680786132812, -1.228118896484375, -1.1967697143554688, -1.1654205322265625, -1.1340713500976562, -1.10272216796875, -1.0713729858398438, -1.0400238037109375, -1.0086746215820312, -0.977325439453125, -0.9459762573242188, -0.9146270751953125, -0.8832778930664062, -0.8519287109375, -0.8205795288085938, -0.7892303466796875, -0.7578811645507812, -0.726531982421875, -0.6951828002929688, -0.6638336181640625, -0.6324844360351562, -0.60113525390625, -0.5697860717773438, -0.5384368896484375, -0.5070877075195312, -0.475738525390625, -0.44438934326171875, -0.4130401611328125, -0.38169097900390625, -0.350341796875, -0.31899261474609375, -0.2876434326171875, -0.25629425048828125, -0.224945068359375, -0.19359588623046875, -0.1622467041015625, -0.13089752197265625, -0.09954833984375, -0.06819915771484375, -0.0368499755859375, -0.00550079345703125, 0.025848388671875, 0.05719757080078125, 0.0885467529296875, 0.11989593505859375, 0.1512451171875, 0.18259429931640625, 0.2139434814453125, 0.24529266357421875, 0.276641845703125, 0.30799102783203125, 0.3393402099609375, 0.37068939208984375, 0.40203857421875, 0.43338775634765625, 0.4647369384765625, 0.49608612060546875, 0.527435302734375, 0.5587844848632812, 0.5901336669921875, 0.6214828491210938, 0.65283203125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 8.0, 22.0, 41.0, 57.0, 111.0, 282.0, 1603.0, 28359.0, 4147012.0, 15166.0, 1207.0, 224.0, 94.0, 44.0, 26.0, 21.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5546875, -13.2274169921875, -12.900146484375, -12.5728759765625, -12.24560546875, -11.9183349609375, -11.591064453125, -11.2637939453125, -10.9365234375, -10.6092529296875, -10.281982421875, -9.9547119140625, -9.62744140625, -9.3001708984375, -8.972900390625, -8.6456298828125, -8.318359375, -7.9910888671875, -7.663818359375, -7.3365478515625, -7.00927734375, -6.6820068359375, -6.354736328125, -6.0274658203125, -5.7001953125, -5.3729248046875, -5.045654296875, -4.7183837890625, -4.39111328125, -4.0638427734375, -3.736572265625, -3.4093017578125, -3.08203125, -2.7547607421875, -2.427490234375, -2.1002197265625, -1.77294921875, -1.4456787109375, -1.118408203125, -0.7911376953125, -0.4638671875, -0.1365966796875, 0.190673828125, 0.5179443359375, 0.84521484375, 1.1724853515625, 1.499755859375, 1.8270263671875, 2.154296875, 2.4815673828125, 2.808837890625, 3.1361083984375, 3.46337890625, 3.7906494140625, 4.117919921875, 4.4451904296875, 4.7724609375, 5.0997314453125, 5.427001953125, 5.7542724609375, 6.08154296875, 6.4088134765625, 6.736083984375, 7.0633544921875, 7.390625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 12.0, 5.0, 13.0, 36.0, 57.0, 157.0, 2196.0, 1378.0, 120.0, 38.0, 27.0, 15.0, 8.0, 2.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.197265625, -3.1210784912109375, -3.044891357421875, -2.9687042236328125, -2.89251708984375, -2.8163299560546875, -2.740142822265625, -2.6639556884765625, -2.5877685546875, -2.5115814208984375, -2.435394287109375, -2.3592071533203125, -2.28302001953125, -2.2068328857421875, -2.130645751953125, -2.0544586181640625, -1.978271484375, -1.9020843505859375, -1.825897216796875, -1.7497100830078125, -1.67352294921875, -1.5973358154296875, -1.521148681640625, -1.4449615478515625, -1.3687744140625, -1.2925872802734375, -1.216400146484375, -1.1402130126953125, -1.06402587890625, -0.9878387451171875, -0.911651611328125, -0.8354644775390625, -0.75927734375, -0.6830902099609375, -0.606903076171875, -0.5307159423828125, -0.45452880859375, -0.3783416748046875, -0.302154541015625, -0.2259674072265625, -0.1497802734375, -0.0735931396484375, 0.002593994140625, 0.0787811279296875, 0.15496826171875, 0.2311553955078125, 0.307342529296875, 0.3835296630859375, 0.459716796875, 0.5359039306640625, 0.612091064453125, 0.6882781982421875, 0.76446533203125, 0.8406524658203125, 0.916839599609375, 0.9930267333984375, 1.0692138671875, 1.1454010009765625, 1.221588134765625, 1.2977752685546875, 1.37396240234375, 1.4501495361328125, 1.526336669921875, 1.6025238037109375, 1.6787109375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 10.0, 13.0, 16.0, 25.0, 46.0, 64.0, 95.0, 128.0, 171.0, 154.0, 107.0, 65.0, 34.0, 21.0, 17.0, 6.0, 6.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3805065155029297, -3.1994922161102295, -3.0184779167175293, -2.837463855743408, -2.656449317932129, -2.475435256958008, -2.2944209575653076, -2.1134066581726074, -1.9323923587799072, -1.751378059387207, -1.5703637599945068, -1.3893495798110962, -1.208335280418396, -1.0273209810256958, -0.8463068008422852, -0.665292501449585, -0.48427820205688477, -0.30326393246650696, -0.12224966287612915, 0.05876457691192627, 0.23977887630462646, 0.42079317569732666, 0.6018073558807373, 0.7828216552734375, 0.9638359546661377, 1.144850254058838, 1.325864553451538, 1.5068787336349487, 1.687893033027649, 1.8689073324203491, 2.0499215126037598, 2.23093581199646, 2.41195011138916, 2.5929644107818604, 2.7739787101745605, 2.9549927711486816, 3.136007308959961, 3.317021369934082, 3.4980356693267822, 3.6790499687194824, 3.8600642681121826, 4.041078567504883, 4.222092628479004, 4.403107166290283, 4.584121227264404, 4.765135765075684, 4.946149826049805, 5.127163887023926, 5.308178424835205, 5.489192485809326, 5.6702070236206055, 5.851221084594727, 6.032235622406006, 6.213249683380127, 6.394264221191406, 6.575278282165527, 6.756292343139648, 6.9373064041137695, 7.118320941925049, 7.29933500289917, 7.480349540710449, 7.66136360168457, 7.842377662658691, 8.023391723632812, 8.20440673828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 11.0, 4.0, 9.0, 14.0, 22.0, 19.0, 26.0, 25.0, 22.0, 28.0, 48.0, 50.0, 45.0, 35.0, 48.0, 49.0, 37.0, 45.0, 64.0, 42.0, 52.0, 34.0, 43.0, 39.0, 30.0, 27.0, 22.0, 21.0, 22.0, 11.0, 14.0, 7.0, 9.0, 6.0, 5.0, 2.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.015883445739746, -2.8940465450286865, -2.772209882736206, -2.6503729820251465, -2.528536319732666, -2.4066994190216064, -2.284862518310547, -2.1630258560180664, -2.041188955307007, -1.9193521738052368, -1.7975153923034668, -1.6756784915924072, -1.5538417100906372, -1.4320049285888672, -1.3101680278778076, -1.1883312463760376, -1.0664944648742676, -0.9446576833724976, -0.8228208422660828, -0.700984001159668, -0.579147219657898, -0.45731043815612793, -0.33547359704971313, -0.21363675594329834, -0.09179997444152832, 0.030036836862564087, 0.1518736481666565, 0.2737104594707489, 0.3955472707748413, 0.5173840522766113, 0.6392208933830261, 0.7610577344894409, 0.8828945159912109, 1.004731297492981, 1.126568078994751, 1.2484049797058105, 1.3702417612075806, 1.4920785427093506, 1.6139154434204102, 1.7357522249221802, 1.8575890064239502, 1.9794257879257202, 2.1012625694274902, 2.22309947013855, 2.3449363708496094, 2.46677303314209, 2.5886099338531494, 2.710446834564209, 2.8322834968566895, 2.954120397567749, 3.0759570598602295, 3.197793960571289, 3.3196306228637695, 3.441467523574829, 3.5633044242858887, 3.685141086578369, 3.8069779872894287, 3.9288148880004883, 4.050651550292969, 4.172488212585449, 4.294325351715088, 4.416162014007568, 4.537998676300049, 4.6598358154296875, 4.781672477722168]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 0.0, 4.0, 5.0, 13.0, 29.0, 48.0, 89.0, 183.0, 405.0, 1057.0, 3092.0, 13443.0, 148372.0, 810001.0, 60219.0, 8095.0, 2096.0, 770.0, 326.0, 138.0, 69.0, 44.0, 22.0, 12.0, 9.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.9139404296875, -3.765380859375, -3.6168212890625, -3.46826171875, -3.3197021484375, -3.171142578125, -3.0225830078125, -2.8740234375, -2.7254638671875, -2.576904296875, -2.4283447265625, -2.27978515625, -2.1312255859375, -1.982666015625, -1.8341064453125, -1.685546875, -1.5369873046875, -1.388427734375, -1.2398681640625, -1.09130859375, -0.9427490234375, -0.794189453125, -0.6456298828125, -0.4970703125, -0.3485107421875, -0.199951171875, -0.0513916015625, 0.09716796875, 0.2457275390625, 0.394287109375, 0.5428466796875, 0.69140625, 0.8399658203125, 0.988525390625, 1.1370849609375, 1.28564453125, 1.4342041015625, 1.582763671875, 1.7313232421875, 1.8798828125, 2.0284423828125, 2.177001953125, 2.3255615234375, 2.47412109375, 2.6226806640625, 2.771240234375, 2.9197998046875, 3.068359375, 3.2169189453125, 3.365478515625, 3.5140380859375, 3.66259765625, 3.8111572265625, 3.959716796875, 4.1082763671875, 4.2568359375, 4.4053955078125, 4.553955078125, 4.7025146484375, 4.85107421875, 4.9996337890625, 5.148193359375, 5.2967529296875, 5.4453125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 5.0, 10.0, 16.0, 23.0, 39.0, 36.0, 53.0, 56.0, 50.0, 70.0, 89.0, 73.0, 80.0, 58.0, 76.0, 72.0, 48.0, 37.0, 40.0, 25.0, 17.0, 6.0, 7.0, 7.0, 2.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.2919921875, -1.2610397338867188, -1.2300872802734375, -1.1991348266601562, -1.168182373046875, -1.1372299194335938, -1.1062774658203125, -1.0753250122070312, -1.04437255859375, -1.0134201049804688, -0.9824676513671875, -0.9515151977539062, -0.920562744140625, -0.8896102905273438, -0.8586578369140625, -0.8277053833007812, -0.7967529296875, -0.7658004760742188, -0.7348480224609375, -0.7038955688476562, -0.672943115234375, -0.6419906616210938, -0.6110382080078125, -0.5800857543945312, -0.54913330078125, -0.5181808471679688, -0.4872283935546875, -0.45627593994140625, -0.425323486328125, -0.39437103271484375, -0.3634185791015625, -0.33246612548828125, -0.301513671875, -0.27056121826171875, -0.2396087646484375, -0.20865631103515625, -0.177703857421875, -0.14675140380859375, -0.1157989501953125, -0.08484649658203125, -0.05389404296875, -0.02294158935546875, 0.0080108642578125, 0.03896331787109375, 0.069915771484375, 0.10086822509765625, 0.1318206787109375, 0.16277313232421875, 0.1937255859375, 0.22467803955078125, 0.2556304931640625, 0.28658294677734375, 0.317535400390625, 0.34848785400390625, 0.3794403076171875, 0.41039276123046875, 0.44134521484375, 0.47229766845703125, 0.5032501220703125, 0.5342025756835938, 0.565155029296875, 0.5961074829101562, 0.6270599365234375, 0.6580123901367188, 0.68896484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 8.0, 11.0, 28.0, 75.0, 132.0, 293.0, 638.0, 2085.0, 9884.0, 155936.0, 837044.0, 35802.0, 4545.0, 1192.0, 417.0, 208.0, 102.0, 57.0, 26.0, 29.0, 9.0, 9.0, 7.0, 4.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.99822998046875, -4.8480224609375, -4.69781494140625, -4.547607421875, -4.39739990234375, -4.2471923828125, -4.09698486328125, -3.94677734375, -3.79656982421875, -3.6463623046875, -3.49615478515625, -3.345947265625, -3.19573974609375, -3.0455322265625, -2.89532470703125, -2.7451171875, -2.59490966796875, -2.4447021484375, -2.29449462890625, -2.144287109375, -1.99407958984375, -1.8438720703125, -1.69366455078125, -1.54345703125, -1.39324951171875, -1.2430419921875, -1.09283447265625, -0.942626953125, -0.79241943359375, -0.6422119140625, -0.49200439453125, -0.341796875, -0.19158935546875, -0.0413818359375, 0.10882568359375, 0.259033203125, 0.40924072265625, 0.5594482421875, 0.70965576171875, 0.85986328125, 1.01007080078125, 1.1602783203125, 1.31048583984375, 1.460693359375, 1.61090087890625, 1.7611083984375, 1.91131591796875, 2.0615234375, 2.21173095703125, 2.3619384765625, 2.51214599609375, 2.662353515625, 2.81256103515625, 2.9627685546875, 3.11297607421875, 3.26318359375, 3.41339111328125, 3.5635986328125, 3.71380615234375, 3.864013671875, 4.01422119140625, 4.1644287109375, 4.31463623046875, 4.46484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 1.0, 5.0, 10.0, 13.0, 13.0, 23.0, 21.0, 34.0, 33.0, 58.0, 55.0, 72.0, 51.0, 69.0, 62.0, 76.0, 62.0, 55.0, 46.0, 48.0, 29.0, 25.0, 30.0, 23.0, 21.0, 10.0, 11.0, 15.0, 6.0, 4.0, 2.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.80859375, -3.7020263671875, -3.595458984375, -3.4888916015625, -3.38232421875, -3.2757568359375, -3.169189453125, -3.0626220703125, -2.9560546875, -2.8494873046875, -2.742919921875, -2.6363525390625, -2.52978515625, -2.4232177734375, -2.316650390625, -2.2100830078125, -2.103515625, -1.9969482421875, -1.890380859375, -1.7838134765625, -1.67724609375, -1.5706787109375, -1.464111328125, -1.3575439453125, -1.2509765625, -1.1444091796875, -1.037841796875, -0.9312744140625, -0.82470703125, -0.7181396484375, -0.611572265625, -0.5050048828125, -0.3984375, -0.2918701171875, -0.185302734375, -0.0787353515625, 0.02783203125, 0.1343994140625, 0.240966796875, 0.3475341796875, 0.4541015625, 0.5606689453125, 0.667236328125, 0.7738037109375, 0.88037109375, 0.9869384765625, 1.093505859375, 1.2000732421875, 1.306640625, 1.4132080078125, 1.519775390625, 1.6263427734375, 1.73291015625, 1.8394775390625, 1.946044921875, 2.0526123046875, 2.1591796875, 2.2657470703125, 2.372314453125, 2.4788818359375, 2.58544921875, 2.6920166015625, 2.798583984375, 2.9051513671875, 3.01171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 7.0, 18.0, 40.0, 61.0, 178.0, 533.0, 2137.0, 11839.0, 898996.0, 126127.0, 6672.0, 1330.0, 393.0, 103.0, 52.0, 30.0, 18.0, 7.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.47265625, -5.282958984375, -5.09326171875, -4.903564453125, -4.7138671875, -4.524169921875, -4.33447265625, -4.144775390625, -3.955078125, -3.765380859375, -3.57568359375, -3.385986328125, -3.1962890625, -3.006591796875, -2.81689453125, -2.627197265625, -2.4375, -2.247802734375, -2.05810546875, -1.868408203125, -1.6787109375, -1.489013671875, -1.29931640625, -1.109619140625, -0.919921875, -0.730224609375, -0.54052734375, -0.350830078125, -0.1611328125, 0.028564453125, 0.21826171875, 0.407958984375, 0.59765625, 0.787353515625, 0.97705078125, 1.166748046875, 1.3564453125, 1.546142578125, 1.73583984375, 1.925537109375, 2.115234375, 2.304931640625, 2.49462890625, 2.684326171875, 2.8740234375, 3.063720703125, 3.25341796875, 3.443115234375, 3.6328125, 3.822509765625, 4.01220703125, 4.201904296875, 4.3916015625, 4.581298828125, 4.77099609375, 4.960693359375, 5.150390625, 5.340087890625, 5.52978515625, 5.719482421875, 5.9091796875, 6.098876953125, 6.28857421875, 6.478271484375, 6.66796875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 12.0, 19.0, 37.0, 79.0, 192.0, 388.0, 157.0, 60.0, 32.0, 15.0, 3.0, 9.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007786750793457031, -0.0007607340812683105, -0.000742793083190918, -0.0007248520851135254, -0.0007069110870361328, -0.0006889700889587402, -0.0006710290908813477, -0.0006530880928039551, -0.0006351470947265625, -0.0006172060966491699, -0.0005992650985717773, -0.0005813241004943848, -0.0005633831024169922, -0.0005454421043395996, -0.000527501106262207, -0.0005095601081848145, -0.0004916191101074219, -0.0004736781120300293, -0.0004557371139526367, -0.00043779611587524414, -0.00041985511779785156, -0.000401914119720459, -0.0003839731216430664, -0.00036603212356567383, -0.00034809112548828125, -0.00033015012741088867, -0.0003122091293334961, -0.0002942681312561035, -0.00027632713317871094, -0.00025838613510131836, -0.00024044513702392578, -0.0002225041389465332, -0.00020456314086914062, -0.00018662214279174805, -0.00016868114471435547, -0.0001507401466369629, -0.0001327991485595703, -0.00011485815048217773, -9.691715240478516e-05, -7.897615432739258e-05, -6.103515625e-05, -4.309415817260742e-05, -2.5153160095214844e-05, -7.212162017822266e-06, 1.0728836059570312e-05, 2.866983413696289e-05, 4.661083221435547e-05, 6.455183029174805e-05, 8.249282836914062e-05, 0.0001004338264465332, 0.00011837482452392578, 0.00013631582260131836, 0.00015425682067871094, 0.00017219781875610352, 0.0001901388168334961, 0.00020807981491088867, 0.00022602081298828125, 0.00024396181106567383, 0.0002619028091430664, 0.000279843807220459, 0.00029778480529785156, 0.00031572580337524414, 0.0003336668014526367, 0.0003516077995300293, 0.0003695487976074219]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 15.0, 21.0, 30.0, 68.0, 155.0, 368.0, 1256.0, 9466.0, 959681.0, 72635.0, 3700.0, 717.0, 244.0, 82.0, 40.0, 26.0, 13.0, 11.0, 5.0, 9.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.2890625, -9.05560302734375, -8.8221435546875, -8.58868408203125, -8.355224609375, -8.12176513671875, -7.8883056640625, -7.65484619140625, -7.42138671875, -7.18792724609375, -6.9544677734375, -6.72100830078125, -6.487548828125, -6.25408935546875, -6.0206298828125, -5.78717041015625, -5.5537109375, -5.32025146484375, -5.0867919921875, -4.85333251953125, -4.619873046875, -4.38641357421875, -4.1529541015625, -3.91949462890625, -3.68603515625, -3.45257568359375, -3.2191162109375, -2.98565673828125, -2.752197265625, -2.51873779296875, -2.2852783203125, -2.05181884765625, -1.818359375, -1.58489990234375, -1.3514404296875, -1.11798095703125, -0.884521484375, -0.65106201171875, -0.4176025390625, -0.18414306640625, 0.04931640625, 0.28277587890625, 0.5162353515625, 0.74969482421875, 0.983154296875, 1.21661376953125, 1.4500732421875, 1.68353271484375, 1.9169921875, 2.15045166015625, 2.3839111328125, 2.61737060546875, 2.850830078125, 3.08428955078125, 3.3177490234375, 3.55120849609375, 3.78466796875, 4.01812744140625, 4.2515869140625, 4.48504638671875, 4.718505859375, 4.95196533203125, 5.1854248046875, 5.41888427734375, 5.65234375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 8.0, 6.0, 14.0, 16.0, 74.0, 412.0, 371.0, 51.0, 20.0, 13.0, 10.0, 7.0, 3.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.34375, -8.1400146484375, -7.936279296875, -7.7325439453125, -7.52880859375, -7.3250732421875, -7.121337890625, -6.9176025390625, -6.7138671875, -6.5101318359375, -6.306396484375, -6.1026611328125, -5.89892578125, -5.6951904296875, -5.491455078125, -5.2877197265625, -5.083984375, -4.8802490234375, -4.676513671875, -4.4727783203125, -4.26904296875, -4.0653076171875, -3.861572265625, -3.6578369140625, -3.4541015625, -3.2503662109375, -3.046630859375, -2.8428955078125, -2.63916015625, -2.4354248046875, -2.231689453125, -2.0279541015625, -1.82421875, -1.6204833984375, -1.416748046875, -1.2130126953125, -1.00927734375, -0.8055419921875, -0.601806640625, -0.3980712890625, -0.1943359375, 0.0093994140625, 0.213134765625, 0.4168701171875, 0.62060546875, 0.8243408203125, 1.028076171875, 1.2318115234375, 1.435546875, 1.6392822265625, 1.843017578125, 2.0467529296875, 2.25048828125, 2.4542236328125, 2.657958984375, 2.8616943359375, 3.0654296875, 3.2691650390625, 3.472900390625, 3.6766357421875, 3.88037109375, 4.0841064453125, 4.287841796875, 4.4915771484375, 4.6953125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 10.0, 3.0, 14.0, 25.0, 61.0, 106.0, 185.0, 266.0, 195.0, 83.0, 36.0, 12.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.32080078125, -40.34654235839844, -39.372283935546875, -38.39802551269531, -37.42376708984375, -36.44950866699219, -35.475250244140625, -34.50099182128906, -33.5267333984375, -32.55247497558594, -31.578216552734375, -30.603958129882812, -29.62969970703125, -28.655441284179688, -27.681182861328125, -26.706924438476562, -25.732666015625, -24.758407592773438, -23.784149169921875, -22.809890747070312, -21.83563232421875, -20.861373901367188, -19.887115478515625, -18.912857055664062, -17.9385986328125, -16.964340209960938, -15.990081787109375, -15.015823364257812, -14.04156494140625, -13.067306518554688, -12.093048095703125, -11.118789672851562, -10.144533157348633, -9.17027473449707, -8.196016311645508, -7.221757888793945, -6.247499465942383, -5.27324104309082, -4.298982620239258, -3.3247241973876953, -2.350465774536133, -1.3762073516845703, -0.4019489288330078, 0.5723094940185547, 1.5465679168701172, 2.5208263397216797, 3.495084762573242, 4.469343185424805, 5.443601608276367, 6.41786003112793, 7.392118453979492, 8.366376876831055, 9.340635299682617, 10.31489372253418, 11.289152145385742, 12.263410568237305, 13.237668991088867, 14.21192741394043, 15.186185836791992, 16.160444259643555, 17.134702682495117, 18.10896110534668, 19.083219528198242, 20.057477951049805, 21.031736373901367]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 7.0, 5.0, 8.0, 5.0, 11.0, 9.0, 13.0, 22.0, 20.0, 25.0, 25.0, 25.0, 33.0, 35.0, 35.0, 22.0, 40.0, 35.0, 59.0, 41.0, 39.0, 54.0, 34.0, 42.0, 37.0, 33.0, 35.0, 35.0, 29.0, 24.0, 31.0, 20.0, 19.0, 13.0, 9.0, 13.0, 16.0, 10.0, 8.0, 6.0, 9.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-14.256242752075195, -13.861167907714844, -13.466093063354492, -13.07101821899414, -12.675944328308105, -12.280869483947754, -11.885794639587402, -11.49071979522705, -11.0956449508667, -10.700570106506348, -10.305495262145996, -9.910421371459961, -9.51534652709961, -9.120271682739258, -8.725196838378906, -8.330121994018555, -7.935047626495361, -7.53997278213501, -7.144898414611816, -6.749823570251465, -6.354748725891113, -5.959673881530762, -5.564599514007568, -5.169524669647217, -4.774450302124023, -4.379375457763672, -3.9843008518218994, -3.589226245880127, -3.1941514015197754, -2.799076795578003, -2.4040021896362305, -2.008927345275879, -1.6138525009155273, -1.2187777757644653, -0.8237031102180481, -0.42862844467163086, -0.03355371952056885, 0.36152100563049316, 0.7565956115722656, 1.1516704559326172, 1.5467450618743896, 1.9418197870254517, 2.3368945121765137, 2.731969118118286, 3.1270437240600586, 3.52211856842041, 3.9171931743621826, 4.312268257141113, 4.707342624664307, 5.102417469024658, 5.497491836547852, 5.892566680908203, 6.287641525268555, 6.682716369628906, 7.0777907371521, 7.472865581512451, 7.8679399490356445, 8.263014793395996, 8.658089637756348, 9.053163528442383, 9.448238372802734, 9.843313217163086, 10.238388061523438, 10.633462905883789, 11.02853775024414]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 7.0, 10.0, 13.0, 14.0, 16.0, 25.0, 31.0, 29.0, 50.0, 81.0, 155.0, 293.0, 882.0, 3727.0, 31740.0, 4126162.0, 26118.0, 3365.0, 826.0, 304.0, 143.0, 90.0, 58.0, 31.0, 28.0, 19.0, 16.0, 9.0, 11.0, 9.0, 8.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.59765625, -7.409912109375, -7.22216796875, -7.034423828125, -6.8466796875, -6.658935546875, -6.47119140625, -6.283447265625, -6.095703125, -5.907958984375, -5.72021484375, -5.532470703125, -5.3447265625, -5.156982421875, -4.96923828125, -4.781494140625, -4.59375, -4.406005859375, -4.21826171875, -4.030517578125, -3.8427734375, -3.655029296875, -3.46728515625, -3.279541015625, -3.091796875, -2.904052734375, -2.71630859375, -2.528564453125, -2.3408203125, -2.153076171875, -1.96533203125, -1.777587890625, -1.58984375, -1.402099609375, -1.21435546875, -1.026611328125, -0.8388671875, -0.651123046875, -0.46337890625, -0.275634765625, -0.087890625, 0.099853515625, 0.28759765625, 0.475341796875, 0.6630859375, 0.850830078125, 1.03857421875, 1.226318359375, 1.4140625, 1.601806640625, 1.78955078125, 1.977294921875, 2.1650390625, 2.352783203125, 2.54052734375, 2.728271484375, 2.916015625, 3.103759765625, 3.29150390625, 3.479248046875, 3.6669921875, 3.854736328125, 4.04248046875, 4.230224609375, 4.41796875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 17.0, 15.0, 17.0, 29.0, 29.0, 59.0, 55.0, 61.0, 74.0, 78.0, 76.0, 86.0, 73.0, 72.0, 64.0, 61.0, 52.0, 23.0, 21.0, 15.0, 8.0, 7.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.568359375, -1.5324478149414062, -1.4965362548828125, -1.4606246948242188, -1.424713134765625, -1.3888015747070312, -1.3528900146484375, -1.3169784545898438, -1.28106689453125, -1.2451553344726562, -1.2092437744140625, -1.1733322143554688, -1.137420654296875, -1.1015090942382812, -1.0655975341796875, -1.0296859741210938, -0.9937744140625, -0.9578628540039062, -0.9219512939453125, -0.8860397338867188, -0.850128173828125, -0.8142166137695312, -0.7783050537109375, -0.7423934936523438, -0.70648193359375, -0.6705703735351562, -0.6346588134765625, -0.5987472534179688, -0.562835693359375, -0.5269241333007812, -0.4910125732421875, -0.45510101318359375, -0.419189453125, -0.38327789306640625, -0.3473663330078125, -0.31145477294921875, -0.275543212890625, -0.23963165283203125, -0.2037200927734375, -0.16780853271484375, -0.13189697265625, -0.09598541259765625, -0.0600738525390625, -0.02416229248046875, 0.011749267578125, 0.04766082763671875, 0.0835723876953125, 0.11948394775390625, 0.1553955078125, 0.19130706787109375, 0.2272186279296875, 0.26313018798828125, 0.299041748046875, 0.33495330810546875, 0.3708648681640625, 0.40677642822265625, 0.44268798828125, 0.47859954833984375, 0.5145111083984375, 0.5504226684570312, 0.586334228515625, 0.6222457885742188, 0.6581573486328125, 0.6940689086914062, 0.72998046875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 21.0, 30.0, 82.0, 126.0, 292.0, 915.0, 7068.0, 4116433.0, 65471.0, 2908.0, 526.0, 198.0, 95.0, 47.0, 29.0, 15.0, 12.0, 10.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.008544921875, -5.68896484375, -5.369384765625, -5.0498046875, -4.730224609375, -4.41064453125, -4.091064453125, -3.771484375, -3.451904296875, -3.13232421875, -2.812744140625, -2.4931640625, -2.173583984375, -1.85400390625, -1.534423828125, -1.21484375, -0.895263671875, -0.57568359375, -0.256103515625, 0.0634765625, 0.383056640625, 0.70263671875, 1.022216796875, 1.341796875, 1.661376953125, 1.98095703125, 2.300537109375, 2.6201171875, 2.939697265625, 3.25927734375, 3.578857421875, 3.8984375, 4.218017578125, 4.53759765625, 4.857177734375, 5.1767578125, 5.496337890625, 5.81591796875, 6.135498046875, 6.455078125, 6.774658203125, 7.09423828125, 7.413818359375, 7.7333984375, 8.052978515625, 8.37255859375, 8.692138671875, 9.01171875, 9.331298828125, 9.65087890625, 9.970458984375, 10.2900390625, 10.609619140625, 10.92919921875, 11.248779296875, 11.568359375, 11.887939453125, 12.20751953125, 12.527099609375, 12.8466796875, 13.166259765625, 13.48583984375, 13.805419921875, 14.125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 10.0, 29.0, 31.0, 170.0, 3222.0, 498.0, 56.0, 14.0, 15.0, 7.0, 8.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3125, -2.234893798828125, -2.15728759765625, -2.079681396484375, -2.0020751953125, -1.924468994140625, -1.84686279296875, -1.769256591796875, -1.691650390625, -1.614044189453125, -1.53643798828125, -1.458831787109375, -1.3812255859375, -1.303619384765625, -1.22601318359375, -1.148406982421875, -1.07080078125, -0.993194580078125, -0.91558837890625, -0.837982177734375, -0.7603759765625, -0.682769775390625, -0.60516357421875, -0.527557373046875, -0.449951171875, -0.372344970703125, -0.29473876953125, -0.217132568359375, -0.1395263671875, -0.061920166015625, 0.01568603515625, 0.093292236328125, 0.1708984375, 0.248504638671875, 0.32611083984375, 0.403717041015625, 0.4813232421875, 0.558929443359375, 0.63653564453125, 0.714141845703125, 0.791748046875, 0.869354248046875, 0.94696044921875, 1.024566650390625, 1.1021728515625, 1.179779052734375, 1.25738525390625, 1.334991455078125, 1.41259765625, 1.490203857421875, 1.56781005859375, 1.645416259765625, 1.7230224609375, 1.800628662109375, 1.87823486328125, 1.955841064453125, 2.033447265625, 2.111053466796875, 2.18865966796875, 2.266265869140625, 2.3438720703125, 2.421478271484375, 2.49908447265625, 2.576690673828125, 2.654296875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 5.0, 10.0, 8.0, 13.0, 36.0, 70.0, 119.0, 177.0, 207.0, 140.0, 100.0, 48.0, 29.0, 16.0, 11.0, 6.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.163535118103027, -7.940217971801758, -7.71690034866333, -7.493582725524902, -7.270265579223633, -7.046948432922363, -6.8236308097839355, -6.600313186645508, -6.376996040344238, -6.153678894042969, -5.930361270904541, -5.707043647766113, -5.483726501464844, -5.260409355163574, -5.0370917320251465, -4.813774108886719, -4.590456962585449, -4.36713981628418, -4.143822193145752, -3.9205048084259033, -3.6971874237060547, -3.473870038986206, -3.2505526542663574, -3.027235269546509, -2.80391788482666, -2.5806005001068115, -2.357283115386963, -2.1339657306671143, -1.9106483459472656, -1.687330961227417, -1.4640135765075684, -1.2406961917877197, -1.017378330230713, -0.7940609455108643, -0.5707435607910156, -0.347426176071167, -0.12410879135131836, 0.09920859336853027, 0.3225259780883789, 0.5458433628082275, 0.7691607475280762, 0.9924781322479248, 1.2157955169677734, 1.439112901687622, 1.6624302864074707, 1.8857476711273193, 2.109065055847168, 2.3323824405670166, 2.5556998252868652, 2.779017210006714, 3.0023345947265625, 3.225651979446411, 3.4489693641662598, 3.6722867488861084, 3.895604133605957, 4.118921279907227, 4.342238903045654, 4.565556526184082, 4.788873672485352, 5.012190818786621, 5.235508441925049, 5.458826065063477, 5.682143211364746, 5.905460357666016, 6.128777980804443]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 13.0, 7.0, 2.0, 13.0, 20.0, 17.0, 20.0, 21.0, 30.0, 30.0, 38.0, 40.0, 34.0, 37.0, 57.0, 44.0, 54.0, 43.0, 39.0, 51.0, 40.0, 40.0, 50.0, 32.0, 35.0, 36.0, 26.0, 14.0, 17.0, 15.0, 19.0, 15.0, 14.0, 8.0, 4.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-3.828338384628296, -3.725740432739258, -3.623142719268799, -3.5205447673797607, -3.4179468154907227, -3.3153488636016846, -3.2127509117126465, -3.1101531982421875, -3.0075552463531494, -2.9049572944641113, -2.8023595809936523, -2.6997616291046143, -2.597163677215576, -2.494565725326538, -2.3919677734375, -2.289370059967041, -2.186772108078003, -2.084174156188965, -1.9815763235092163, -1.8789784908294678, -1.7763805389404297, -1.6737825870513916, -1.571184754371643, -1.4685869216918945, -1.3659889698028564, -1.2633910179138184, -1.1607931852340698, -1.0581953525543213, -0.9555974006652832, -0.8529995083808899, -0.7504016160964966, -0.6478037238121033, -0.5452060699462891, -0.44260817766189575, -0.34001028537750244, -0.23741239309310913, -0.13481450080871582, -0.03221660852432251, 0.0703812837600708, 0.1729791760444641, 0.2755770683288574, 0.37817496061325073, 0.48077285289764404, 0.5833707451820374, 0.6859686374664307, 0.788566529750824, 0.8911644220352173, 0.9937623143196106, 1.096360206604004, 1.198958158493042, 1.3015559911727905, 1.404153823852539, 1.5067517757415771, 1.6093497276306152, 1.7119475603103638, 1.8145453929901123, 1.9171433448791504, 2.0197412967681885, 2.1223392486572266, 2.2249369621276855, 2.3275349140167236, 2.4301328659057617, 2.5327305793762207, 2.635328531265259, 2.737926483154297]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 15.0, 2.0, 14.0, 18.0, 37.0, 60.0, 79.0, 213.0, 415.0, 912.0, 2277.0, 5841.0, 18191.0, 75007.0, 503634.0, 363877.0, 55300.0, 14394.0, 4851.0, 1886.0, 815.0, 330.0, 163.0, 72.0, 34.0, 25.0, 16.0, 14.0, 14.0, 11.0, 3.0, 3.0, 2.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.876953125, -2.789520263671875, -2.70208740234375, -2.614654541015625, -2.5272216796875, -2.439788818359375, -2.35235595703125, -2.264923095703125, -2.177490234375, -2.090057373046875, -2.00262451171875, -1.915191650390625, -1.8277587890625, -1.740325927734375, -1.65289306640625, -1.565460205078125, -1.47802734375, -1.390594482421875, -1.30316162109375, -1.215728759765625, -1.1282958984375, -1.040863037109375, -0.95343017578125, -0.865997314453125, -0.778564453125, -0.691131591796875, -0.60369873046875, -0.516265869140625, -0.4288330078125, -0.341400146484375, -0.25396728515625, -0.166534423828125, -0.0791015625, 0.008331298828125, 0.09576416015625, 0.183197021484375, 0.2706298828125, 0.358062744140625, 0.44549560546875, 0.532928466796875, 0.620361328125, 0.707794189453125, 0.79522705078125, 0.882659912109375, 0.9700927734375, 1.057525634765625, 1.14495849609375, 1.232391357421875, 1.31982421875, 1.407257080078125, 1.49468994140625, 1.582122802734375, 1.6695556640625, 1.756988525390625, 1.84442138671875, 1.931854248046875, 2.019287109375, 2.106719970703125, 2.19415283203125, 2.281585693359375, 2.3690185546875, 2.456451416015625, 2.54388427734375, 2.631317138671875, 2.71875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 7.0, 5.0, 14.0, 14.0, 17.0, 28.0, 33.0, 36.0, 56.0, 60.0, 75.0, 65.0, 85.0, 76.0, 76.0, 82.0, 57.0, 69.0, 46.0, 30.0, 31.0, 25.0, 5.0, 7.0, 6.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0], "bins": [-1.666015625, -1.6298446655273438, -1.5936737060546875, -1.5575027465820312, -1.521331787109375, -1.4851608276367188, -1.4489898681640625, -1.4128189086914062, -1.37664794921875, -1.3404769897460938, -1.3043060302734375, -1.2681350708007812, -1.231964111328125, -1.1957931518554688, -1.1596221923828125, -1.1234512329101562, -1.0872802734375, -1.0511093139648438, -1.0149383544921875, -0.9787673950195312, -0.942596435546875, -0.9064254760742188, -0.8702545166015625, -0.8340835571289062, -0.79791259765625, -0.7617416381835938, -0.7255706787109375, -0.6893997192382812, -0.653228759765625, -0.6170578002929688, -0.5808868408203125, -0.5447158813476562, -0.508544921875, -0.47237396240234375, -0.4362030029296875, -0.40003204345703125, -0.363861083984375, -0.32769012451171875, -0.2915191650390625, -0.25534820556640625, -0.21917724609375, -0.18300628662109375, -0.1468353271484375, -0.11066436767578125, -0.074493408203125, -0.03832244873046875, -0.0021514892578125, 0.03401947021484375, 0.0701904296875, 0.10636138916015625, 0.1425323486328125, 0.17870330810546875, 0.214874267578125, 0.25104522705078125, 0.2872161865234375, 0.32338714599609375, 0.35955810546875, 0.39572906494140625, 0.4319000244140625, 0.46807098388671875, 0.504241943359375, 0.5404129028320312, 0.5765838623046875, 0.6127548217773438, 0.64892578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 7.0, 10.0, 9.0, 11.0, 28.0, 36.0, 91.0, 257.0, 934.0, 4712.0, 39167.0, 841086.0, 149284.0, 10450.0, 1679.0, 477.0, 137.0, 57.0, 29.0, 17.0, 11.0, 10.0, 6.0, 5.0, 8.0, 6.0, 4.0, 5.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.37109375, -6.2021484375, -6.033203125, -5.8642578125, -5.6953125, -5.5263671875, -5.357421875, -5.1884765625, -5.01953125, -4.8505859375, -4.681640625, -4.5126953125, -4.34375, -4.1748046875, -4.005859375, -3.8369140625, -3.66796875, -3.4990234375, -3.330078125, -3.1611328125, -2.9921875, -2.8232421875, -2.654296875, -2.4853515625, -2.31640625, -2.1474609375, -1.978515625, -1.8095703125, -1.640625, -1.4716796875, -1.302734375, -1.1337890625, -0.96484375, -0.7958984375, -0.626953125, -0.4580078125, -0.2890625, -0.1201171875, 0.048828125, 0.2177734375, 0.38671875, 0.5556640625, 0.724609375, 0.8935546875, 1.0625, 1.2314453125, 1.400390625, 1.5693359375, 1.73828125, 1.9072265625, 2.076171875, 2.2451171875, 2.4140625, 2.5830078125, 2.751953125, 2.9208984375, 3.08984375, 3.2587890625, 3.427734375, 3.5966796875, 3.765625, 3.9345703125, 4.103515625, 4.2724609375, 4.44140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 7.0, 3.0, 8.0, 8.0, 12.0, 19.0, 26.0, 28.0, 18.0, 27.0, 32.0, 48.0, 53.0, 50.0, 70.0, 56.0, 58.0, 61.0, 55.0, 46.0, 66.0, 34.0, 31.0, 32.0, 30.0, 20.0, 28.0, 22.0, 11.0, 11.0, 9.0, 15.0, 6.0, 5.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-4.5546875, -4.4451904296875, -4.335693359375, -4.2261962890625, -4.11669921875, -4.0072021484375, -3.897705078125, -3.7882080078125, -3.6787109375, -3.5692138671875, -3.459716796875, -3.3502197265625, -3.24072265625, -3.1312255859375, -3.021728515625, -2.9122314453125, -2.802734375, -2.6932373046875, -2.583740234375, -2.4742431640625, -2.36474609375, -2.2552490234375, -2.145751953125, -2.0362548828125, -1.9267578125, -1.8172607421875, -1.707763671875, -1.5982666015625, -1.48876953125, -1.3792724609375, -1.269775390625, -1.1602783203125, -1.05078125, -0.9412841796875, -0.831787109375, -0.7222900390625, -0.61279296875, -0.5032958984375, -0.393798828125, -0.2843017578125, -0.1748046875, -0.0653076171875, 0.044189453125, 0.1536865234375, 0.26318359375, 0.3726806640625, 0.482177734375, 0.5916748046875, 0.701171875, 0.8106689453125, 0.920166015625, 1.0296630859375, 1.13916015625, 1.2486572265625, 1.358154296875, 1.4676513671875, 1.5771484375, 1.6866455078125, 1.796142578125, 1.9056396484375, 2.01513671875, 2.1246337890625, 2.234130859375, 2.3436279296875, 2.453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 11.0, 7.0, 11.0, 16.0, 22.0, 37.0, 48.0, 103.0, 232.0, 571.0, 1850.0, 8409.0, 954097.0, 77241.0, 4003.0, 1124.0, 403.0, 154.0, 76.0, 46.0, 27.0, 20.0, 18.0, 13.0, 6.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-9.0546875, -8.8525390625, -8.650390625, -8.4482421875, -8.24609375, -8.0439453125, -7.841796875, -7.6396484375, -7.4375, -7.2353515625, -7.033203125, -6.8310546875, -6.62890625, -6.4267578125, -6.224609375, -6.0224609375, -5.8203125, -5.6181640625, -5.416015625, -5.2138671875, -5.01171875, -4.8095703125, -4.607421875, -4.4052734375, -4.203125, -4.0009765625, -3.798828125, -3.5966796875, -3.39453125, -3.1923828125, -2.990234375, -2.7880859375, -2.5859375, -2.3837890625, -2.181640625, -1.9794921875, -1.77734375, -1.5751953125, -1.373046875, -1.1708984375, -0.96875, -0.7666015625, -0.564453125, -0.3623046875, -0.16015625, 0.0419921875, 0.244140625, 0.4462890625, 0.6484375, 0.8505859375, 1.052734375, 1.2548828125, 1.45703125, 1.6591796875, 1.861328125, 2.0634765625, 2.265625, 2.4677734375, 2.669921875, 2.8720703125, 3.07421875, 3.2763671875, 3.478515625, 3.6806640625, 3.8828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 4.0, 2.0, 11.0, 17.0, 28.0, 43.0, 107.0, 234.0, 311.0, 133.0, 46.0, 31.0, 13.0, 4.0, 9.0, 3.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0006165504455566406, -0.0006031878292560577, -0.0005898252129554749, -0.000576462596654892, -0.0005630999803543091, -0.0005497373640537262, -0.0005363747477531433, -0.0005230121314525604, -0.0005096495151519775, -0.0004962868988513947, -0.00048292428255081177, -0.0004695616662502289, -0.000456199049949646, -0.0004428364336490631, -0.0004294738173484802, -0.00041611120104789734, -0.00040274858474731445, -0.00038938596844673157, -0.0003760233521461487, -0.0003626607358455658, -0.0003492981195449829, -0.0003359355032444, -0.00032257288694381714, -0.00030921027064323425, -0.00029584765434265137, -0.0002824850380420685, -0.0002691224217414856, -0.0002557598054409027, -0.00024239718914031982, -0.00022903457283973694, -0.00021567195653915405, -0.00020230934023857117, -0.00018894672393798828, -0.0001755841076374054, -0.0001622214913368225, -0.00014885887503623962, -0.00013549625873565674, -0.00012213364243507385, -0.00010877102613449097, -9.540840983390808e-05, -8.20457935333252e-05, -6.868317723274231e-05, -5.5320560932159424e-05, -4.195794463157654e-05, -2.8595328330993652e-05, -1.5232712030410767e-05, -1.8700957298278809e-06, 1.1492520570755005e-05, 2.485513687133789e-05, 3.8217753171920776e-05, 5.158036947250366e-05, 6.494298577308655e-05, 7.830560207366943e-05, 9.166821837425232e-05, 0.0001050308346748352, 0.00011839345097541809, 0.00013175606727600098, 0.00014511868357658386, 0.00015848129987716675, 0.00017184391617774963, 0.00018520653247833252, 0.0001985691487789154, 0.0002119317650794983, 0.00022529438138008118, 0.00023865699768066406]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 10.0, 10.0, 45.0, 88.0, 307.0, 934.0, 3448.0, 58840.0, 974307.0, 8035.0, 1730.0, 521.0, 180.0, 50.0, 25.0, 5.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8125, -5.60662841796875, -5.4007568359375, -5.19488525390625, -4.989013671875, -4.78314208984375, -4.5772705078125, -4.37139892578125, -4.16552734375, -3.95965576171875, -3.7537841796875, -3.54791259765625, -3.342041015625, -3.13616943359375, -2.9302978515625, -2.72442626953125, -2.5185546875, -2.31268310546875, -2.1068115234375, -1.90093994140625, -1.695068359375, -1.48919677734375, -1.2833251953125, -1.07745361328125, -0.87158203125, -0.66571044921875, -0.4598388671875, -0.25396728515625, -0.048095703125, 0.15777587890625, 0.3636474609375, 0.56951904296875, 0.775390625, 0.98126220703125, 1.1871337890625, 1.39300537109375, 1.598876953125, 1.80474853515625, 2.0106201171875, 2.21649169921875, 2.42236328125, 2.62823486328125, 2.8341064453125, 3.03997802734375, 3.245849609375, 3.45172119140625, 3.6575927734375, 3.86346435546875, 4.0693359375, 4.27520751953125, 4.4810791015625, 4.68695068359375, 4.892822265625, 5.09869384765625, 5.3045654296875, 5.51043701171875, 5.71630859375, 5.92218017578125, 6.1280517578125, 6.33392333984375, 6.539794921875, 6.74566650390625, 6.9515380859375, 7.15740966796875, 7.36328125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 8.0, 12.0, 13.0, 31.0, 91.0, 170.0, 256.0, 194.0, 87.0, 48.0, 27.0, 23.0, 11.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.130859375, -2.053802490234375, -1.97674560546875, -1.899688720703125, -1.8226318359375, -1.745574951171875, -1.66851806640625, -1.591461181640625, -1.514404296875, -1.437347412109375, -1.36029052734375, -1.283233642578125, -1.2061767578125, -1.129119873046875, -1.05206298828125, -0.975006103515625, -0.89794921875, -0.820892333984375, -0.74383544921875, -0.666778564453125, -0.5897216796875, -0.512664794921875, -0.43560791015625, -0.358551025390625, -0.281494140625, -0.204437255859375, -0.12738037109375, -0.050323486328125, 0.0267333984375, 0.103790283203125, 0.18084716796875, 0.257904052734375, 0.3349609375, 0.412017822265625, 0.48907470703125, 0.566131591796875, 0.6431884765625, 0.720245361328125, 0.79730224609375, 0.874359130859375, 0.951416015625, 1.028472900390625, 1.10552978515625, 1.182586669921875, 1.2596435546875, 1.336700439453125, 1.41375732421875, 1.490814208984375, 1.56787109375, 1.644927978515625, 1.72198486328125, 1.799041748046875, 1.8760986328125, 1.953155517578125, 2.03021240234375, 2.107269287109375, 2.184326171875, 2.261383056640625, 2.33843994140625, 2.415496826171875, 2.4925537109375, 2.569610595703125, 2.64666748046875, 2.723724365234375, 2.80078125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 12.0, 33.0, 109.0, 317.0, 324.0, 155.0, 36.0, 14.0, 7.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.81879806518555, -32.27683639526367, -30.734874725341797, -29.192913055419922, -27.650951385498047, -26.108989715576172, -24.56702995300293, -23.025068283081055, -21.48310661315918, -19.941144943237305, -18.39918327331543, -16.857223510742188, -15.315260887145996, -13.773299217224121, -12.231338500976562, -10.689376831054688, -9.147415161132812, -7.6054534912109375, -6.063492298126221, -4.521531105041504, -2.979569435119629, -1.437607765197754, 0.10435295104980469, 1.6463146209716797, 3.1882762908935547, 4.73023796081543, 6.2721991539001465, 7.814160346984863, 9.356122016906738, 10.898083686828613, 12.440044403076172, 13.982006072998047, 15.523971557617188, 17.065933227539062, 18.607894897460938, 20.149856567382812, 21.691818237304688, 23.233779907226562, 24.775739669799805, 26.31770133972168, 27.859663009643555, 29.40162467956543, 30.943586349487305, 32.48554611206055, 34.02750778198242, 35.5694694519043, 37.11143112182617, 38.65339279174805, 40.19535446166992, 41.7373161315918, 43.27927780151367, 44.82123947143555, 46.36320114135742, 47.9051628112793, 49.447120666503906, 50.98908233642578, 52.531044006347656, 54.07300567626953, 55.614967346191406, 57.15692901611328, 58.698890686035156, 60.24085235595703, 61.782814025878906, 63.32477569580078, 64.86673736572266]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 5.0, 5.0, 9.0, 10.0, 9.0, 20.0, 20.0, 14.0, 15.0, 18.0, 34.0, 36.0, 32.0, 49.0, 43.0, 41.0, 34.0, 47.0, 56.0, 59.0, 44.0, 46.0, 36.0, 51.0, 30.0, 36.0, 35.0, 34.0, 24.0, 16.0, 17.0, 19.0, 11.0, 11.0, 11.0, 11.0, 7.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.812686920166016, -12.33586597442627, -11.859044075012207, -11.382223129272461, -10.905401229858398, -10.428580284118652, -9.951759338378906, -9.474937438964844, -8.998116493225098, -8.521295547485352, -8.044473648071289, -7.567652702331543, -7.090831279754639, -6.614009857177734, -6.137188911437988, -5.660367488861084, -5.18354606628418, -4.706724643707275, -4.229903221130371, -3.753082275390625, -3.2762608528137207, -2.7994394302368164, -2.322618246078491, -1.845797061920166, -1.3689756393432617, -0.892154335975647, -0.4153330326080322, 0.06148827075958252, 0.5383095741271973, 1.0151309967041016, 1.4919521808624268, 1.968773365020752, 2.4455947875976562, 2.9224162101745605, 3.3992373943328857, 3.876058578491211, 4.352880001068115, 4.8297014236450195, 5.306522369384766, 5.78334379196167, 6.260165214538574, 6.7369866371154785, 7.213808059692383, 7.690629005432129, 8.167449951171875, 8.644271850585938, 9.121092796325684, 9.59791374206543, 10.074735641479492, 10.551556587219238, 11.0283784866333, 11.505199432373047, 11.98202133178711, 12.458842277526855, 12.935663223266602, 13.412485122680664, 13.88930606842041, 14.366127014160156, 14.842948913574219, 15.319769859313965, 15.796590805053711, 16.273412704467773, 16.750234603881836, 17.227054595947266, 17.703876495361328]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 7.0, 5.0, 10.0, 17.0, 24.0, 45.0, 61.0, 66.0, 109.0, 198.0, 278.0, 383.0, 662.0, 1093.0, 1973.0, 3533.0, 7884.0, 24721.0, 419602.0, 3684803.0, 30691.0, 8811.0, 3821.0, 2090.0, 1262.0, 703.0, 489.0, 321.0, 216.0, 121.0, 87.0, 61.0, 32.0, 21.0, 23.0, 17.0, 10.0, 11.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.59375, -4.4698486328125, -4.345947265625, -4.2220458984375, -4.09814453125, -3.9742431640625, -3.850341796875, -3.7264404296875, -3.6025390625, -3.4786376953125, -3.354736328125, -3.2308349609375, -3.10693359375, -2.9830322265625, -2.859130859375, -2.7352294921875, -2.611328125, -2.4874267578125, -2.363525390625, -2.2396240234375, -2.11572265625, -1.9918212890625, -1.867919921875, -1.7440185546875, -1.6201171875, -1.4962158203125, -1.372314453125, -1.2484130859375, -1.12451171875, -1.0006103515625, -0.876708984375, -0.7528076171875, -0.62890625, -0.5050048828125, -0.381103515625, -0.2572021484375, -0.13330078125, -0.0093994140625, 0.114501953125, 0.2384033203125, 0.3623046875, 0.4862060546875, 0.610107421875, 0.7340087890625, 0.85791015625, 0.9818115234375, 1.105712890625, 1.2296142578125, 1.353515625, 1.4774169921875, 1.601318359375, 1.7252197265625, 1.84912109375, 1.9730224609375, 2.096923828125, 2.2208251953125, 2.3447265625, 2.4686279296875, 2.592529296875, 2.7164306640625, 2.84033203125, 2.9642333984375, 3.088134765625, 3.2120361328125, 3.3359375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 3.0, 4.0, 6.0, 6.0, 10.0, 9.0, 30.0, 27.0, 36.0, 46.0, 58.0, 44.0, 63.0, 62.0, 64.0, 66.0, 50.0, 73.0, 61.0, 40.0, 50.0, 46.0, 34.0, 26.0, 25.0, 21.0, 10.0, 17.0, 6.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.3984375, -1.3647994995117188, -1.3311614990234375, -1.2975234985351562, -1.263885498046875, -1.2302474975585938, -1.1966094970703125, -1.1629714965820312, -1.12933349609375, -1.0956954956054688, -1.0620574951171875, -1.0284194946289062, -0.994781494140625, -0.9611434936523438, -0.9275054931640625, -0.8938674926757812, -0.8602294921875, -0.8265914916992188, -0.7929534912109375, -0.7593154907226562, -0.725677490234375, -0.6920394897460938, -0.6584014892578125, -0.6247634887695312, -0.59112548828125, -0.5574874877929688, -0.5238494873046875, -0.49021148681640625, -0.456573486328125, -0.42293548583984375, -0.3892974853515625, -0.35565948486328125, -0.322021484375, -0.28838348388671875, -0.2547454833984375, -0.22110748291015625, -0.187469482421875, -0.15383148193359375, -0.1201934814453125, -0.08655548095703125, -0.05291748046875, -0.01927947998046875, 0.0143585205078125, 0.04799652099609375, 0.081634521484375, 0.11527252197265625, 0.1489105224609375, 0.18254852294921875, 0.2161865234375, 0.24982452392578125, 0.2834625244140625, 0.31710052490234375, 0.350738525390625, 0.38437652587890625, 0.4180145263671875, 0.45165252685546875, 0.48529052734375, 0.5189285278320312, 0.5525665283203125, 0.5862045288085938, 0.619842529296875, 0.6534805297851562, 0.6871185302734375, 0.7207565307617188, 0.75439453125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 5.0, 5.0, 19.0, 40.0, 51.0, 89.0, 201.0, 453.0, 1223.0, 4012.0, 20497.0, 4088218.0, 69242.0, 6974.0, 1959.0, 686.0, 271.0, 143.0, 85.0, 42.0, 30.0, 17.0, 7.0, 3.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.21875, -5.9564208984375, -5.694091796875, -5.4317626953125, -5.16943359375, -4.9071044921875, -4.644775390625, -4.3824462890625, -4.1201171875, -3.8577880859375, -3.595458984375, -3.3331298828125, -3.07080078125, -2.8084716796875, -2.546142578125, -2.2838134765625, -2.021484375, -1.7591552734375, -1.496826171875, -1.2344970703125, -0.97216796875, -0.7098388671875, -0.447509765625, -0.1851806640625, 0.0771484375, 0.3394775390625, 0.601806640625, 0.8641357421875, 1.12646484375, 1.3887939453125, 1.651123046875, 1.9134521484375, 2.17578125, 2.4381103515625, 2.700439453125, 2.9627685546875, 3.22509765625, 3.4874267578125, 3.749755859375, 4.0120849609375, 4.2744140625, 4.5367431640625, 4.799072265625, 5.0614013671875, 5.32373046875, 5.5860595703125, 5.848388671875, 6.1107177734375, 6.373046875, 6.6353759765625, 6.897705078125, 7.1600341796875, 7.42236328125, 7.6846923828125, 7.947021484375, 8.2093505859375, 8.4716796875, 8.7340087890625, 8.996337890625, 9.2586669921875, 9.52099609375, 9.7833251953125, 10.045654296875, 10.3079833984375, 10.5703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 5.0, 1.0, 6.0, 10.0, 15.0, 24.0, 47.0, 171.0, 3415.0, 243.0, 70.0, 21.0, 14.0, 9.0, 10.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.22265625, -1.13897705078125, -1.0552978515625, -0.97161865234375, -0.887939453125, -0.80426025390625, -0.7205810546875, -0.63690185546875, -0.55322265625, -0.46954345703125, -0.3858642578125, -0.30218505859375, -0.218505859375, -0.13482666015625, -0.0511474609375, 0.03253173828125, 0.1162109375, 0.19989013671875, 0.2835693359375, 0.36724853515625, 0.450927734375, 0.53460693359375, 0.6182861328125, 0.70196533203125, 0.78564453125, 0.86932373046875, 0.9530029296875, 1.03668212890625, 1.120361328125, 1.20404052734375, 1.2877197265625, 1.37139892578125, 1.455078125, 1.53875732421875, 1.6224365234375, 1.70611572265625, 1.789794921875, 1.87347412109375, 1.9571533203125, 2.04083251953125, 2.12451171875, 2.20819091796875, 2.2918701171875, 2.37554931640625, 2.459228515625, 2.54290771484375, 2.6265869140625, 2.71026611328125, 2.7939453125, 2.87762451171875, 2.9613037109375, 3.04498291015625, 3.128662109375, 3.21234130859375, 3.2960205078125, 3.37969970703125, 3.46337890625, 3.54705810546875, 3.6307373046875, 3.71441650390625, 3.798095703125, 3.88177490234375, 3.9654541015625, 4.04913330078125, 4.1328125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 7.0, 4.0, 3.0, 7.0, 21.0, 48.0, 100.0, 172.0, 239.0, 190.0, 106.0, 45.0, 20.0, 14.0, 8.0, 6.0, 4.0, 5.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.624087810516357, -5.3508381843566895, -5.077588081359863, -4.804338455200195, -4.531088352203369, -4.257838726043701, -3.984588861465454, -3.711338996887207, -3.43808913230896, -3.164839267730713, -2.891589403152466, -2.6183395385742188, -2.345089912414551, -2.0718398094177246, -1.7985901832580566, -1.5253403186798096, -1.2520904541015625, -0.9788405895233154, -0.7055907845497131, -0.43234097957611084, -0.15909111499786377, 0.1141587495803833, 0.3874084949493408, 0.6606583595275879, 0.933908224105835, 1.207158088684082, 1.480407953262329, 1.7536576986312866, 2.026907444000244, 2.3001575469970703, 2.5734071731567383, 2.8466570377349854, 3.119906425476074, 3.3931562900543213, 3.6664061546325684, 3.9396557807922363, 4.2129058837890625, 4.4861555099487305, 4.759405136108398, 5.032655239105225, 5.305905342102051, 5.579154968261719, 5.852405071258545, 6.125654697418213, 6.398904800415039, 6.672154426574707, 6.945404052734375, 7.218654155731201, 7.491903781890869, 7.765153408050537, 8.038403511047363, 8.311653137207031, 8.5849027633667, 8.858153343200684, 9.131402969360352, 9.40465259552002, 9.677902221679688, 9.951151847839355, 10.224401473999023, 10.497652053833008, 10.770901679992676, 11.044151306152344, 11.317400932312012, 11.59065055847168, 11.863901138305664]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 7.0, 12.0, 16.0, 14.0, 21.0, 29.0, 30.0, 28.0, 30.0, 33.0, 53.0, 60.0, 73.0, 57.0, 62.0, 61.0, 58.0, 52.0, 41.0, 39.0, 48.0, 36.0, 29.0, 29.0, 26.0, 15.0, 8.0, 12.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.688807487487793, -4.528800964355469, -4.3687944412231445, -4.208787441253662, -4.048780918121338, -3.8887743949890137, -3.7287676334381104, -3.568760871887207, -3.408754348754883, -3.2487478256225586, -3.0887410640716553, -2.928734302520752, -2.7687277793884277, -2.6087212562561035, -2.4487144947052, -2.288707733154297, -2.1287012100219727, -1.9686945676803589, -1.8086879253387451, -1.6486812829971313, -1.4886746406555176, -1.3286679983139038, -1.16866135597229, -1.0086547136306763, -0.8486480712890625, -0.6886414289474487, -0.528634786605835, -0.3686281442642212, -0.20862150192260742, -0.04861485958099365, 0.11139178276062012, 0.2713984251022339, 0.43140506744384766, 0.5914117097854614, 0.7514183521270752, 0.911424994468689, 1.0714316368103027, 1.2314382791519165, 1.3914449214935303, 1.551451563835144, 1.7114582061767578, 1.8714648485183716, 2.0314714908599854, 2.1914782524108887, 2.351484775543213, 2.511491298675537, 2.6714980602264404, 2.8315048217773438, 2.991511344909668, 3.151517868041992, 3.3115246295928955, 3.471531391143799, 3.631537914276123, 3.7915444374084473, 3.9515511989593506, 4.111557960510254, 4.271564483642578, 4.431571006774902, 4.591577529907227, 4.751584529876709, 4.911591053009033, 5.071597576141357, 5.23160457611084, 5.391611099243164, 5.551617622375488]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 8.0, 17.0, 23.0, 34.0, 66.0, 87.0, 167.0, 261.0, 569.0, 1177.0, 2296.0, 5013.0, 11864.0, 29687.0, 82193.0, 241705.0, 401015.0, 174228.0, 59538.0, 21735.0, 9007.0, 3980.0, 1838.0, 981.0, 466.0, 232.0, 132.0, 79.0, 50.0, 40.0, 28.0, 16.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7763671875, -1.7158355712890625, -1.655303955078125, -1.5947723388671875, -1.53424072265625, -1.4737091064453125, -1.413177490234375, -1.3526458740234375, -1.2921142578125, -1.2315826416015625, -1.171051025390625, -1.1105194091796875, -1.04998779296875, -0.9894561767578125, -0.928924560546875, -0.8683929443359375, -0.807861328125, -0.7473297119140625, -0.686798095703125, -0.6262664794921875, -0.56573486328125, -0.5052032470703125, -0.444671630859375, -0.3841400146484375, -0.3236083984375, -0.2630767822265625, -0.202545166015625, -0.1420135498046875, -0.08148193359375, -0.0209503173828125, 0.039581298828125, 0.1001129150390625, 0.16064453125, 0.2211761474609375, 0.281707763671875, 0.3422393798828125, 0.40277099609375, 0.4633026123046875, 0.523834228515625, 0.5843658447265625, 0.6448974609375, 0.7054290771484375, 0.765960693359375, 0.8264923095703125, 0.88702392578125, 0.9475555419921875, 1.008087158203125, 1.0686187744140625, 1.129150390625, 1.1896820068359375, 1.250213623046875, 1.3107452392578125, 1.37127685546875, 1.4318084716796875, 1.492340087890625, 1.5528717041015625, 1.6134033203125, 1.6739349365234375, 1.734466552734375, 1.7949981689453125, 1.85552978515625, 1.9160614013671875, 1.976593017578125, 2.0371246337890625, 2.09765625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 0.0, 7.0, 1.0, 10.0, 13.0, 19.0, 20.0, 26.0, 30.0, 25.0, 29.0, 39.0, 46.0, 61.0, 63.0, 52.0, 77.0, 60.0, 56.0, 47.0, 41.0, 50.0, 32.0, 38.0, 30.0, 19.0, 36.0, 20.0, 18.0, 10.0, 11.0, 6.0, 4.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.3525390625, -1.3187103271484375, -1.284881591796875, -1.2510528564453125, -1.21722412109375, -1.1833953857421875, -1.149566650390625, -1.1157379150390625, -1.0819091796875, -1.0480804443359375, -1.014251708984375, -0.9804229736328125, -0.94659423828125, -0.9127655029296875, -0.878936767578125, -0.8451080322265625, -0.811279296875, -0.7774505615234375, -0.743621826171875, -0.7097930908203125, -0.67596435546875, -0.6421356201171875, -0.608306884765625, -0.5744781494140625, -0.5406494140625, -0.5068206787109375, -0.472991943359375, -0.4391632080078125, -0.40533447265625, -0.3715057373046875, -0.337677001953125, -0.3038482666015625, -0.27001953125, -0.2361907958984375, -0.202362060546875, -0.1685333251953125, -0.13470458984375, -0.1008758544921875, -0.067047119140625, -0.0332183837890625, 0.0006103515625, 0.0344390869140625, 0.068267822265625, 0.1020965576171875, 0.13592529296875, 0.1697540283203125, 0.203582763671875, 0.2374114990234375, 0.271240234375, 0.3050689697265625, 0.338897705078125, 0.3727264404296875, 0.40655517578125, 0.4403839111328125, 0.474212646484375, 0.5080413818359375, 0.5418701171875, 0.5756988525390625, 0.609527587890625, 0.6433563232421875, 0.67718505859375, 0.7110137939453125, 0.744842529296875, 0.7786712646484375, 0.8125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 7.0, 1.0, 3.0, 6.0, 9.0, 6.0, 21.0, 16.0, 26.0, 33.0, 46.0, 69.0, 102.0, 167.0, 337.0, 644.0, 1817.0, 7729.0, 48830.0, 562887.0, 382283.0, 34749.0, 5966.0, 1455.0, 579.0, 251.0, 168.0, 117.0, 62.0, 43.0, 29.0, 18.0, 15.0, 15.0, 11.0, 11.0, 10.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.9453125, -3.81768798828125, -3.6900634765625, -3.56243896484375, -3.434814453125, -3.30718994140625, -3.1795654296875, -3.05194091796875, -2.92431640625, -2.79669189453125, -2.6690673828125, -2.54144287109375, -2.413818359375, -2.28619384765625, -2.1585693359375, -2.03094482421875, -1.9033203125, -1.77569580078125, -1.6480712890625, -1.52044677734375, -1.392822265625, -1.26519775390625, -1.1375732421875, -1.00994873046875, -0.88232421875, -0.75469970703125, -0.6270751953125, -0.49945068359375, -0.371826171875, -0.24420166015625, -0.1165771484375, 0.01104736328125, 0.138671875, 0.26629638671875, 0.3939208984375, 0.52154541015625, 0.649169921875, 0.77679443359375, 0.9044189453125, 1.03204345703125, 1.15966796875, 1.28729248046875, 1.4149169921875, 1.54254150390625, 1.670166015625, 1.79779052734375, 1.9254150390625, 2.05303955078125, 2.1806640625, 2.30828857421875, 2.4359130859375, 2.56353759765625, 2.691162109375, 2.81878662109375, 2.9464111328125, 3.07403564453125, 3.20166015625, 3.32928466796875, 3.4569091796875, 3.58453369140625, 3.712158203125, 3.83978271484375, 3.9674072265625, 4.09503173828125, 4.22265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 9.0, 12.0, 15.0, 11.0, 12.0, 20.0, 21.0, 27.0, 31.0, 42.0, 32.0, 46.0, 41.0, 57.0, 42.0, 54.0, 50.0, 45.0, 53.0, 42.0, 37.0, 42.0, 37.0, 33.0, 25.0, 40.0, 14.0, 18.0, 18.0, 14.0, 13.0, 11.0, 7.0, 8.0, 10.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.794921875, -3.656402587890625, -3.51788330078125, -3.379364013671875, -3.2408447265625, -3.102325439453125, -2.96380615234375, -2.825286865234375, -2.686767578125, -2.548248291015625, -2.40972900390625, -2.271209716796875, -2.1326904296875, -1.994171142578125, -1.85565185546875, -1.717132568359375, -1.57861328125, -1.440093994140625, -1.30157470703125, -1.163055419921875, -1.0245361328125, -0.886016845703125, -0.74749755859375, -0.608978271484375, -0.470458984375, -0.331939697265625, -0.19342041015625, -0.054901123046875, 0.0836181640625, 0.222137451171875, 0.36065673828125, 0.499176025390625, 0.6376953125, 0.776214599609375, 0.91473388671875, 1.053253173828125, 1.1917724609375, 1.330291748046875, 1.46881103515625, 1.607330322265625, 1.745849609375, 1.884368896484375, 2.02288818359375, 2.161407470703125, 2.2999267578125, 2.438446044921875, 2.57696533203125, 2.715484619140625, 2.85400390625, 2.992523193359375, 3.13104248046875, 3.269561767578125, 3.4080810546875, 3.546600341796875, 3.68511962890625, 3.823638916015625, 3.962158203125, 4.100677490234375, 4.23919677734375, 4.377716064453125, 4.5162353515625, 4.654754638671875, 4.79327392578125, 4.931793212890625, 5.0703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 12.0, 26.0, 41.0, 72.0, 169.0, 434.0, 1826.0, 13867.0, 883879.0, 140612.0, 6078.0, 1019.0, 256.0, 108.0, 68.0, 40.0, 17.0, 8.0, 5.0, 0.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.984375, -4.82769775390625, -4.6710205078125, -4.51434326171875, -4.357666015625, -4.20098876953125, -4.0443115234375, -3.88763427734375, -3.73095703125, -3.57427978515625, -3.4176025390625, -3.26092529296875, -3.104248046875, -2.94757080078125, -2.7908935546875, -2.63421630859375, -2.4775390625, -2.32086181640625, -2.1641845703125, -2.00750732421875, -1.850830078125, -1.69415283203125, -1.5374755859375, -1.38079833984375, -1.22412109375, -1.06744384765625, -0.9107666015625, -0.75408935546875, -0.597412109375, -0.44073486328125, -0.2840576171875, -0.12738037109375, 0.029296875, 0.18597412109375, 0.3426513671875, 0.49932861328125, 0.656005859375, 0.81268310546875, 0.9693603515625, 1.12603759765625, 1.28271484375, 1.43939208984375, 1.5960693359375, 1.75274658203125, 1.909423828125, 2.06610107421875, 2.2227783203125, 2.37945556640625, 2.5361328125, 2.69281005859375, 2.8494873046875, 3.00616455078125, 3.162841796875, 3.31951904296875, 3.4761962890625, 3.63287353515625, 3.78955078125, 3.94622802734375, 4.1029052734375, 4.25958251953125, 4.416259765625, 4.57293701171875, 4.7296142578125, 4.88629150390625, 5.04296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 4.0, 6.0, 8.0, 14.0, 13.0, 17.0, 26.0, 33.0, 55.0, 63.0, 120.0, 152.0, 148.0, 95.0, 70.0, 42.0, 41.0, 21.0, 16.0, 10.0, 13.0, 12.0, 3.0, 3.0, 0.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00032210350036621094, -0.00031422078609466553, -0.0003063380718231201, -0.0002984553575515747, -0.0002905726432800293, -0.0002826899290084839, -0.0002748072147369385, -0.00026692450046539307, -0.00025904178619384766, -0.00025115907192230225, -0.00024327635765075684, -0.00023539364337921143, -0.00022751092910766602, -0.0002196282148361206, -0.0002117455005645752, -0.00020386278629302979, -0.00019598007202148438, -0.00018809735774993896, -0.00018021464347839355, -0.00017233192920684814, -0.00016444921493530273, -0.00015656650066375732, -0.00014868378639221191, -0.0001408010721206665, -0.0001329183578491211, -0.00012503564357757568, -0.00011715292930603027, -0.00010927021503448486, -0.00010138750076293945, -9.350478649139404e-05, -8.562207221984863e-05, -7.773935794830322e-05, -6.985664367675781e-05, -6.19739294052124e-05, -5.409121513366699e-05, -4.620850086212158e-05, -3.832578659057617e-05, -3.0443072319030762e-05, -2.256035804748535e-05, -1.4677643775939941e-05, -6.794929504394531e-06, 1.087784767150879e-06, 8.970499038696289e-06, 1.68532133102417e-05, 2.473592758178711e-05, 3.261864185333252e-05, 4.050135612487793e-05, 4.838407039642334e-05, 5.626678466796875e-05, 6.414949893951416e-05, 7.203221321105957e-05, 7.991492748260498e-05, 8.779764175415039e-05, 9.56803560256958e-05, 0.00010356307029724121, 0.00011144578456878662, 0.00011932849884033203, 0.00012721121311187744, 0.00013509392738342285, 0.00014297664165496826, 0.00015085935592651367, 0.00015874207019805908, 0.0001666247844696045, 0.0001745074987411499, 0.0001823902130126953]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 10.0, 7.0, 16.0, 12.0, 33.0, 35.0, 51.0, 82.0, 211.0, 518.0, 1596.0, 6964.0, 59822.0, 868570.0, 98293.0, 9159.0, 2024.0, 608.0, 257.0, 122.0, 45.0, 33.0, 18.0, 19.0, 19.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.83984375, -2.71942138671875, -2.5989990234375, -2.47857666015625, -2.358154296875, -2.23773193359375, -2.1173095703125, -1.99688720703125, -1.87646484375, -1.75604248046875, -1.6356201171875, -1.51519775390625, -1.394775390625, -1.27435302734375, -1.1539306640625, -1.03350830078125, -0.9130859375, -0.79266357421875, -0.6722412109375, -0.55181884765625, -0.431396484375, -0.31097412109375, -0.1905517578125, -0.07012939453125, 0.05029296875, 0.17071533203125, 0.2911376953125, 0.41156005859375, 0.531982421875, 0.65240478515625, 0.7728271484375, 0.89324951171875, 1.013671875, 1.13409423828125, 1.2545166015625, 1.37493896484375, 1.495361328125, 1.61578369140625, 1.7362060546875, 1.85662841796875, 1.97705078125, 2.09747314453125, 2.2178955078125, 2.33831787109375, 2.458740234375, 2.57916259765625, 2.6995849609375, 2.82000732421875, 2.9404296875, 3.06085205078125, 3.1812744140625, 3.30169677734375, 3.422119140625, 3.54254150390625, 3.6629638671875, 3.78338623046875, 3.90380859375, 4.02423095703125, 4.1446533203125, 4.26507568359375, 4.385498046875, 4.50592041015625, 4.6263427734375, 4.74676513671875, 4.8671875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 8.0, 12.0, 15.0, 16.0, 16.0, 20.0, 37.0, 44.0, 56.0, 56.0, 62.0, 97.0, 98.0, 71.0, 78.0, 71.0, 38.0, 34.0, 34.0, 30.0, 22.0, 10.0, 15.0, 9.0, 10.0, 1.0, 3.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4931640625, -1.438690185546875, -1.38421630859375, -1.329742431640625, -1.2752685546875, -1.220794677734375, -1.16632080078125, -1.111846923828125, -1.057373046875, -1.002899169921875, -0.94842529296875, -0.893951416015625, -0.8394775390625, -0.785003662109375, -0.73052978515625, -0.676055908203125, -0.62158203125, -0.567108154296875, -0.51263427734375, -0.458160400390625, -0.4036865234375, -0.349212646484375, -0.29473876953125, -0.240264892578125, -0.185791015625, -0.131317138671875, -0.07684326171875, -0.022369384765625, 0.0321044921875, 0.086578369140625, 0.14105224609375, 0.195526123046875, 0.25, 0.304473876953125, 0.35894775390625, 0.413421630859375, 0.4678955078125, 0.522369384765625, 0.57684326171875, 0.631317138671875, 0.685791015625, 0.740264892578125, 0.79473876953125, 0.849212646484375, 0.9036865234375, 0.958160400390625, 1.01263427734375, 1.067108154296875, 1.12158203125, 1.176055908203125, 1.23052978515625, 1.285003662109375, 1.3394775390625, 1.393951416015625, 1.44842529296875, 1.502899169921875, 1.557373046875, 1.611846923828125, 1.66632080078125, 1.720794677734375, 1.7752685546875, 1.829742431640625, 1.88421630859375, 1.938690185546875, 1.9931640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 13.0, 52.0, 268.0, 458.0, 171.0, 37.0, 9.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.21356201171875, -79.81673431396484, -77.41991424560547, -75.02308654785156, -72.62626647949219, -70.22943878173828, -67.83261108398438, -65.435791015625, -63.038963317871094, -60.64213943481445, -58.24531555175781, -55.848487854003906, -53.451663970947266, -51.054840087890625, -48.65801239013672, -46.26118850708008, -43.86436462402344, -41.4675407409668, -39.070716857910156, -36.67388916015625, -34.27706527709961, -31.88024139404297, -29.483415603637695, -27.086589813232422, -24.68976593017578, -22.29294204711914, -19.896116256713867, -17.499290466308594, -15.102466583251953, -12.705641746520996, -10.308816909790039, -7.911991119384766, -5.515174865722656, -3.118350028991699, -0.7215251922607422, 1.6752996444702148, 4.072124481201172, 6.468949317932129, 8.865774154663086, 11.26259994506836, 13.659423828125, 16.05624771118164, 18.453073501586914, 20.849899291992188, 23.246723175048828, 25.64354705810547, 28.040372848510742, 30.437198638916016, 32.834022521972656, 35.2308464050293, 37.62767028808594, 40.024497985839844, 42.421321868896484, 44.818145751953125, 47.21497344970703, 49.61179733276367, 52.00862121582031, 54.40544509887695, 56.802268981933594, 59.1990966796875, 61.59592056274414, 63.99274444580078, 66.38957214355469, 68.78639221191406, 71.18321990966797]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 10.0, 5.0, 11.0, 18.0, 13.0, 23.0, 16.0, 19.0, 36.0, 24.0, 27.0, 40.0, 27.0, 35.0, 40.0, 45.0, 35.0, 49.0, 46.0, 51.0, 42.0, 42.0, 36.0, 35.0, 38.0, 25.0, 37.0, 23.0, 27.0, 20.0, 14.0, 19.0, 9.0, 14.0, 9.0, 7.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.294517517089844, -18.607702255249023, -17.920886993408203, -17.234071731567383, -16.547256469726562, -15.860441207885742, -15.173625946044922, -14.486810684204102, -13.799995422363281, -13.113180160522461, -12.42636489868164, -11.73954963684082, -11.052734375, -10.36591911315918, -9.67910385131836, -8.992288589477539, -8.305474281311035, -7.618659019470215, -6.9318437576293945, -6.245028495788574, -5.558213233947754, -4.871397972106934, -4.1845831871032715, -3.497767925262451, -2.810952663421631, -2.1241374015808105, -1.4373222589492798, -0.750507116317749, -0.06369185447692871, 0.6231234073638916, 1.3099384307861328, 1.9967536926269531, 2.6835689544677734, 3.3703842163085938, 4.057199478149414, 4.744014739990234, 5.430830001831055, 6.117645263671875, 6.804460048675537, 7.491275310516357, 8.178091049194336, 8.864906311035156, 9.551721572875977, 10.238536834716797, 10.925352096557617, 11.612167358398438, 12.298982620239258, 12.985797882080078, 13.672612190246582, 14.359427452087402, 15.046242713928223, 15.733057975769043, 16.419872283935547, 17.106687545776367, 17.793502807617188, 18.480318069458008, 19.167133331298828, 19.85394859313965, 20.54076385498047, 21.22757911682129, 21.91439437866211, 22.60120964050293, 23.28802490234375, 23.97484016418457, 24.66165542602539]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 10.0, 13.0, 17.0, 28.0, 37.0, 66.0, 86.0, 160.0, 244.0, 440.0, 888.0, 1721.0, 3717.0, 9080.0, 33498.0, 2874147.0, 1222851.0, 31664.0, 8592.0, 3391.0, 1614.0, 829.0, 457.0, 278.0, 160.0, 94.0, 77.0, 43.0, 28.0, 16.0, 8.0, 11.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.015625, -3.900848388671875, -3.78607177734375, -3.671295166015625, -3.5565185546875, -3.441741943359375, -3.32696533203125, -3.212188720703125, -3.097412109375, -2.982635498046875, -2.86785888671875, -2.753082275390625, -2.6383056640625, -2.523529052734375, -2.40875244140625, -2.293975830078125, -2.17919921875, -2.064422607421875, -1.94964599609375, -1.834869384765625, -1.7200927734375, -1.605316162109375, -1.49053955078125, -1.375762939453125, -1.260986328125, -1.146209716796875, -1.03143310546875, -0.916656494140625, -0.8018798828125, -0.687103271484375, -0.57232666015625, -0.457550048828125, -0.3427734375, -0.227996826171875, -0.11322021484375, 0.001556396484375, 0.1163330078125, 0.231109619140625, 0.34588623046875, 0.460662841796875, 0.575439453125, 0.690216064453125, 0.80499267578125, 0.919769287109375, 1.0345458984375, 1.149322509765625, 1.26409912109375, 1.378875732421875, 1.49365234375, 1.608428955078125, 1.72320556640625, 1.837982177734375, 1.9527587890625, 2.067535400390625, 2.18231201171875, 2.297088623046875, 2.411865234375, 2.526641845703125, 2.64141845703125, 2.756195068359375, 2.8709716796875, 2.985748291015625, 3.10052490234375, 3.215301513671875, 3.330078125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 10.0, 10.0, 12.0, 16.0, 18.0, 24.0, 31.0, 20.0, 37.0, 29.0, 41.0, 46.0, 47.0, 40.0, 52.0, 61.0, 59.0, 47.0, 47.0, 40.0, 51.0, 41.0, 37.0, 27.0, 27.0, 20.0, 21.0, 11.0, 17.0, 15.0, 16.0, 11.0, 6.0, 5.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1884765625, -1.151519775390625, -1.11456298828125, -1.077606201171875, -1.0406494140625, -1.003692626953125, -0.96673583984375, -0.929779052734375, -0.892822265625, -0.855865478515625, -0.81890869140625, -0.781951904296875, -0.7449951171875, -0.708038330078125, -0.67108154296875, -0.634124755859375, -0.59716796875, -0.560211181640625, -0.52325439453125, -0.486297607421875, -0.4493408203125, -0.412384033203125, -0.37542724609375, -0.338470458984375, -0.301513671875, -0.264556884765625, -0.22760009765625, -0.190643310546875, -0.1536865234375, -0.116729736328125, -0.07977294921875, -0.042816162109375, -0.005859375, 0.031097412109375, 0.06805419921875, 0.105010986328125, 0.1419677734375, 0.178924560546875, 0.21588134765625, 0.252838134765625, 0.289794921875, 0.326751708984375, 0.36370849609375, 0.400665283203125, 0.4376220703125, 0.474578857421875, 0.51153564453125, 0.548492431640625, 0.58544921875, 0.622406005859375, 0.65936279296875, 0.696319580078125, 0.7332763671875, 0.770233154296875, 0.80718994140625, 0.844146728515625, 0.881103515625, 0.918060302734375, 0.95501708984375, 0.991973876953125, 1.0289306640625, 1.065887451171875, 1.10284423828125, 1.139801025390625, 1.1767578125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 19.0, 20.0, 27.0, 66.0, 102.0, 234.0, 501.0, 1402.0, 4923.0, 55906.0, 4102352.0, 23654.0, 3261.0, 1037.0, 402.0, 162.0, 99.0, 52.0, 29.0, 17.0, 3.0, 9.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.84375, -8.5787353515625, -8.313720703125, -8.0487060546875, -7.78369140625, -7.5186767578125, -7.253662109375, -6.9886474609375, -6.7236328125, -6.4586181640625, -6.193603515625, -5.9285888671875, -5.66357421875, -5.3985595703125, -5.133544921875, -4.8685302734375, -4.603515625, -4.3385009765625, -4.073486328125, -3.8084716796875, -3.54345703125, -3.2784423828125, -3.013427734375, -2.7484130859375, -2.4833984375, -2.2183837890625, -1.953369140625, -1.6883544921875, -1.42333984375, -1.1583251953125, -0.893310546875, -0.6282958984375, -0.36328125, -0.0982666015625, 0.166748046875, 0.4317626953125, 0.69677734375, 0.9617919921875, 1.226806640625, 1.4918212890625, 1.7568359375, 2.0218505859375, 2.286865234375, 2.5518798828125, 2.81689453125, 3.0819091796875, 3.346923828125, 3.6119384765625, 3.876953125, 4.1419677734375, 4.406982421875, 4.6719970703125, 4.93701171875, 5.2020263671875, 5.467041015625, 5.7320556640625, 5.9970703125, 6.2620849609375, 6.527099609375, 6.7921142578125, 7.05712890625, 7.3221435546875, 7.587158203125, 7.8521728515625, 8.1171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 16.0, 17.0, 38.0, 52.0, 104.0, 1047.0, 2517.0, 112.0, 61.0, 26.0, 26.0, 11.0, 10.0, 5.0, 9.0, 0.0, 4.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.816436767578125, -2.72857666015625, -2.640716552734375, -2.5528564453125, -2.464996337890625, -2.37713623046875, -2.289276123046875, -2.201416015625, -2.113555908203125, -2.02569580078125, -1.937835693359375, -1.8499755859375, -1.762115478515625, -1.67425537109375, -1.586395263671875, -1.49853515625, -1.410675048828125, -1.32281494140625, -1.234954833984375, -1.1470947265625, -1.059234619140625, -0.97137451171875, -0.883514404296875, -0.795654296875, -0.707794189453125, -0.61993408203125, -0.532073974609375, -0.4442138671875, -0.356353759765625, -0.26849365234375, -0.180633544921875, -0.0927734375, -0.004913330078125, 0.08294677734375, 0.170806884765625, 0.2586669921875, 0.346527099609375, 0.43438720703125, 0.522247314453125, 0.610107421875, 0.697967529296875, 0.78582763671875, 0.873687744140625, 0.9615478515625, 1.049407958984375, 1.13726806640625, 1.225128173828125, 1.31298828125, 1.400848388671875, 1.48870849609375, 1.576568603515625, 1.6644287109375, 1.752288818359375, 1.84014892578125, 1.928009033203125, 2.015869140625, 2.103729248046875, 2.19158935546875, 2.279449462890625, 2.3673095703125, 2.455169677734375, 2.54302978515625, 2.630889892578125, 2.71875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 15.0, 30.0, 130.0, 366.0, 306.0, 104.0, 26.0, 10.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.114532470703125, -26.49797821044922, -25.881423950195312, -25.26487159729004, -24.648317337036133, -24.031763076782227, -23.41520881652832, -22.798654556274414, -22.18210220336914, -21.565547943115234, -20.948993682861328, -20.332441329956055, -19.71588706970215, -19.099332809448242, -18.482778549194336, -17.86622428894043, -17.249670028686523, -16.633115768432617, -16.01656150817871, -15.400008201599121, -14.783454895019531, -14.166900634765625, -13.550346374511719, -12.933792114257812, -12.317238807678223, -11.700684547424316, -11.084131240844727, -10.46757698059082, -9.851022720336914, -9.234469413757324, -8.617915153503418, -8.001361846923828, -7.384807586669922, -6.768253803253174, -6.151700019836426, -5.5351457595825195, -4.9185919761657715, -4.302038192749023, -3.6854841709136963, -3.068930149078369, -2.452376365661621, -1.8358224630355835, -1.219268560409546, -0.6027146577835083, 0.013839244842529297, 0.6303930282592773, 1.2469470500946045, 1.8635010719299316, 2.4800548553466797, 3.0966086387634277, 3.713162660598755, 4.329716682434082, 4.94627046585083, 5.562824249267578, 6.179378509521484, 6.795932292938232, 7.4124860763549805, 8.029040336608887, 8.645593643188477, 9.262147903442383, 9.878702163696289, 10.495255470275879, 11.111809730529785, 11.728363037109375, 12.344917297363281]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 1.0, 5.0, 7.0, 3.0, 7.0, 11.0, 17.0, 12.0, 24.0, 22.0, 15.0, 34.0, 39.0, 24.0, 31.0, 44.0, 47.0, 53.0, 44.0, 31.0, 55.0, 44.0, 52.0, 57.0, 55.0, 50.0, 26.0, 21.0, 27.0, 28.0, 16.0, 17.0, 23.0, 14.0, 12.0, 10.0, 6.0, 5.0, 2.0, 0.0, 6.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0], "bins": [-5.83771276473999, -5.674121379852295, -5.5105299949646, -5.346938610076904, -5.183347225189209, -5.019755840301514, -4.856164455413818, -4.692573070526123, -4.528981685638428, -4.365390300750732, -4.201798915863037, -4.038207530975342, -3.8746161460876465, -3.711024761199951, -3.547433376312256, -3.3838419914245605, -3.2202506065368652, -3.05665922164917, -2.8930678367614746, -2.7294764518737793, -2.565885066986084, -2.4022936820983887, -2.2387022972106934, -2.075110912322998, -1.9115195274353027, -1.7479281425476074, -1.584336757659912, -1.4207453727722168, -1.2571539878845215, -1.0935626029968262, -0.9299712181091309, -0.7663798332214355, -0.6027884483337402, -0.4391970634460449, -0.2756056785583496, -0.1120142936706543, 0.051577091217041016, 0.21516847610473633, 0.37875986099243164, 0.542351245880127, 0.7059426307678223, 0.8695340156555176, 1.033125400543213, 1.1967167854309082, 1.3603081703186035, 1.5238995552062988, 1.6874909400939941, 1.8510823249816895, 2.0146737098693848, 2.17826509475708, 2.3418564796447754, 2.5054478645324707, 2.669039249420166, 2.8326306343078613, 2.9962220191955566, 3.159813404083252, 3.3234047889709473, 3.4869961738586426, 3.650587558746338, 3.814178943634033, 3.9777703285217285, 4.141361713409424, 4.304953098297119, 4.4685444831848145, 4.63213586807251]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 9.0, 3.0, 3.0, 10.0, 21.0, 19.0, 21.0, 23.0, 43.0, 52.0, 68.0, 134.0, 290.0, 652.0, 1614.0, 4202.0, 13513.0, 52453.0, 260075.0, 537779.0, 133871.0, 30123.0, 8629.0, 2800.0, 1107.0, 471.0, 257.0, 86.0, 73.0, 35.0, 29.0, 20.0, 20.0, 9.0, 7.0, 11.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.51953125, -2.430511474609375, -2.34149169921875, -2.252471923828125, -2.1634521484375, -2.074432373046875, -1.98541259765625, -1.896392822265625, -1.807373046875, -1.718353271484375, -1.62933349609375, -1.540313720703125, -1.4512939453125, -1.362274169921875, -1.27325439453125, -1.184234619140625, -1.09521484375, -1.006195068359375, -0.91717529296875, -0.828155517578125, -0.7391357421875, -0.650115966796875, -0.56109619140625, -0.472076416015625, -0.383056640625, -0.294036865234375, -0.20501708984375, -0.115997314453125, -0.0269775390625, 0.062042236328125, 0.15106201171875, 0.240081787109375, 0.3291015625, 0.418121337890625, 0.50714111328125, 0.596160888671875, 0.6851806640625, 0.774200439453125, 0.86322021484375, 0.952239990234375, 1.041259765625, 1.130279541015625, 1.21929931640625, 1.308319091796875, 1.3973388671875, 1.486358642578125, 1.57537841796875, 1.664398193359375, 1.75341796875, 1.842437744140625, 1.93145751953125, 2.020477294921875, 2.1094970703125, 2.198516845703125, 2.28753662109375, 2.376556396484375, 2.465576171875, 2.554595947265625, 2.64361572265625, 2.732635498046875, 2.8216552734375, 2.910675048828125, 2.99969482421875, 3.088714599609375, 3.177734375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 3.0, 4.0, 4.0, 13.0, 14.0, 13.0, 19.0, 22.0, 22.0, 29.0, 31.0, 45.0, 35.0, 51.0, 47.0, 50.0, 50.0, 63.0, 52.0, 52.0, 49.0, 51.0, 31.0, 40.0, 40.0, 28.0, 18.0, 28.0, 20.0, 15.0, 14.0, 15.0, 7.0, 7.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.263671875, -1.2228240966796875, -1.181976318359375, -1.1411285400390625, -1.10028076171875, -1.0594329833984375, -1.018585205078125, -0.9777374267578125, -0.9368896484375, -0.8960418701171875, -0.855194091796875, -0.8143463134765625, -0.77349853515625, -0.7326507568359375, -0.691802978515625, -0.6509552001953125, -0.610107421875, -0.5692596435546875, -0.528411865234375, -0.4875640869140625, -0.44671630859375, -0.4058685302734375, -0.365020751953125, -0.3241729736328125, -0.2833251953125, -0.2424774169921875, -0.201629638671875, -0.1607818603515625, -0.11993408203125, -0.0790863037109375, -0.038238525390625, 0.0026092529296875, 0.04345703125, 0.0843048095703125, 0.125152587890625, 0.1660003662109375, 0.20684814453125, 0.2476959228515625, 0.288543701171875, 0.3293914794921875, 0.3702392578125, 0.4110870361328125, 0.451934814453125, 0.4927825927734375, 0.53363037109375, 0.5744781494140625, 0.615325927734375, 0.6561737060546875, 0.697021484375, 0.7378692626953125, 0.778717041015625, 0.8195648193359375, 0.86041259765625, 0.9012603759765625, 0.942108154296875, 0.9829559326171875, 1.0238037109375, 1.0646514892578125, 1.105499267578125, 1.1463470458984375, 1.18719482421875, 1.2280426025390625, 1.268890380859375, 1.3097381591796875, 1.3505859375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 6.0, 10.0, 19.0, 21.0, 27.0, 47.0, 52.0, 97.0, 135.0, 185.0, 306.0, 573.0, 1812.0, 8194.0, 68654.0, 815204.0, 136474.0, 12598.0, 2336.0, 763.0, 361.0, 198.0, 130.0, 89.0, 67.0, 42.0, 41.0, 13.0, 23.0, 21.0, 9.0, 9.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.0625, -4.91192626953125, -4.7613525390625, -4.61077880859375, -4.460205078125, -4.30963134765625, -4.1590576171875, -4.00848388671875, -3.85791015625, -3.70733642578125, -3.5567626953125, -3.40618896484375, -3.255615234375, -3.10504150390625, -2.9544677734375, -2.80389404296875, -2.6533203125, -2.50274658203125, -2.3521728515625, -2.20159912109375, -2.051025390625, -1.90045166015625, -1.7498779296875, -1.59930419921875, -1.44873046875, -1.29815673828125, -1.1475830078125, -0.99700927734375, -0.846435546875, -0.69586181640625, -0.5452880859375, -0.39471435546875, -0.244140625, -0.09356689453125, 0.0570068359375, 0.20758056640625, 0.358154296875, 0.50872802734375, 0.6593017578125, 0.80987548828125, 0.96044921875, 1.11102294921875, 1.2615966796875, 1.41217041015625, 1.562744140625, 1.71331787109375, 1.8638916015625, 2.01446533203125, 2.1650390625, 2.31561279296875, 2.4661865234375, 2.61676025390625, 2.767333984375, 2.91790771484375, 3.0684814453125, 3.21905517578125, 3.36962890625, 3.52020263671875, 3.6707763671875, 3.82135009765625, 3.971923828125, 4.12249755859375, 4.2730712890625, 4.42364501953125, 4.57421875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 7.0, 12.0, 3.0, 6.0, 7.0, 10.0, 10.0, 21.0, 31.0, 29.0, 36.0, 42.0, 34.0, 38.0, 40.0, 58.0, 48.0, 59.0, 63.0, 67.0, 62.0, 57.0, 46.0, 53.0, 34.0, 30.0, 15.0, 20.0, 20.0, 12.0, 10.0, 13.0, 6.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-8.484375, -8.27679443359375, -8.0692138671875, -7.86163330078125, -7.654052734375, -7.44647216796875, -7.2388916015625, -7.03131103515625, -6.82373046875, -6.61614990234375, -6.4085693359375, -6.20098876953125, -5.993408203125, -5.78582763671875, -5.5782470703125, -5.37066650390625, -5.1630859375, -4.95550537109375, -4.7479248046875, -4.54034423828125, -4.332763671875, -4.12518310546875, -3.9176025390625, -3.71002197265625, -3.50244140625, -3.29486083984375, -3.0872802734375, -2.87969970703125, -2.672119140625, -2.46453857421875, -2.2569580078125, -2.04937744140625, -1.841796875, -1.63421630859375, -1.4266357421875, -1.21905517578125, -1.011474609375, -0.80389404296875, -0.5963134765625, -0.38873291015625, -0.18115234375, 0.02642822265625, 0.2340087890625, 0.44158935546875, 0.649169921875, 0.85675048828125, 1.0643310546875, 1.27191162109375, 1.4794921875, 1.68707275390625, 1.8946533203125, 2.10223388671875, 2.309814453125, 2.51739501953125, 2.7249755859375, 2.93255615234375, 3.14013671875, 3.34771728515625, 3.5552978515625, 3.76287841796875, 3.970458984375, 4.17803955078125, 4.3856201171875, 4.59320068359375, 4.80078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 2.0, 11.0, 10.0, 15.0, 31.0, 33.0, 54.0, 119.0, 164.0, 341.0, 666.0, 1302.0, 3120.0, 8257.0, 34987.0, 576962.0, 381984.0, 27929.0, 7191.0, 2808.0, 1244.0, 601.0, 327.0, 143.0, 79.0, 58.0, 40.0, 25.0, 12.0, 12.0, 7.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.951629638671875, -1.88177490234375, -1.811920166015625, -1.7420654296875, -1.672210693359375, -1.60235595703125, -1.532501220703125, -1.462646484375, -1.392791748046875, -1.32293701171875, -1.253082275390625, -1.1832275390625, -1.113372802734375, -1.04351806640625, -0.973663330078125, -0.90380859375, -0.833953857421875, -0.76409912109375, -0.694244384765625, -0.6243896484375, -0.554534912109375, -0.48468017578125, -0.414825439453125, -0.344970703125, -0.275115966796875, -0.20526123046875, -0.135406494140625, -0.0655517578125, 0.004302978515625, 0.07415771484375, 0.144012451171875, 0.2138671875, 0.283721923828125, 0.35357666015625, 0.423431396484375, 0.4932861328125, 0.563140869140625, 0.63299560546875, 0.702850341796875, 0.772705078125, 0.842559814453125, 0.91241455078125, 0.982269287109375, 1.0521240234375, 1.121978759765625, 1.19183349609375, 1.261688232421875, 1.33154296875, 1.401397705078125, 1.47125244140625, 1.541107177734375, 1.6109619140625, 1.680816650390625, 1.75067138671875, 1.820526123046875, 1.890380859375, 1.960235595703125, 2.03009033203125, 2.099945068359375, 2.1697998046875, 2.239654541015625, 2.30950927734375, 2.379364013671875, 2.44921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 10.0, 13.0, 22.0, 74.0, 200.0, 346.0, 189.0, 75.0, 28.0, 15.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00033783912658691406, -0.00032046064734458923, -0.0003030821681022644, -0.0002857036888599396, -0.00026832520961761475, -0.0002509467303752899, -0.0002335682511329651, -0.00021618977189064026, -0.00019881129264831543, -0.0001814328134059906, -0.00016405433416366577, -0.00014667585492134094, -0.0001292973756790161, -0.00011191889643669128, -9.454041719436646e-05, -7.716193795204163e-05, -5.97834587097168e-05, -4.240497946739197e-05, -2.502650022506714e-05, -7.64802098274231e-06, 9.73045825958252e-06, 2.710893750190735e-05, 4.448741674423218e-05, 6.186589598655701e-05, 7.924437522888184e-05, 9.662285447120667e-05, 0.0001140013337135315, 0.00013137981295585632, 0.00014875829219818115, 0.00016613677144050598, 0.0001835152506828308, 0.00020089372992515564, 0.00021827220916748047, 0.0002356506884098053, 0.0002530291676521301, 0.00027040764689445496, 0.0002877861261367798, 0.0003051646053791046, 0.00032254308462142944, 0.00033992156386375427, 0.0003573000431060791, 0.00037467852234840393, 0.00039205700159072876, 0.0004094354808330536, 0.0004268139600753784, 0.00044419243931770325, 0.0004615709185600281, 0.0004789493978023529, 0.0004963278770446777, 0.0005137063562870026, 0.0005310848355293274, 0.0005484633147716522, 0.000565841794013977, 0.0005832202732563019, 0.0006005987524986267, 0.0006179772317409515, 0.0006353557109832764, 0.0006527341902256012, 0.000670112669467926, 0.0006874911487102509, 0.0007048696279525757, 0.0007222481071949005, 0.0007396265864372253, 0.0007570050656795502, 0.000774383544921875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 0.0, 6.0, 5.0, 7.0, 10.0, 22.0, 22.0, 30.0, 41.0, 54.0, 83.0, 160.0, 334.0, 673.0, 1256.0, 2620.0, 6390.0, 20361.0, 183399.0, 752431.0, 60560.0, 11849.0, 4306.0, 1891.0, 941.0, 443.0, 268.0, 130.0, 74.0, 54.0, 40.0, 28.0, 19.0, 17.0, 11.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.1484375, -2.0775146484375, -2.006591796875, -1.9356689453125, -1.86474609375, -1.7938232421875, -1.722900390625, -1.6519775390625, -1.5810546875, -1.5101318359375, -1.439208984375, -1.3682861328125, -1.29736328125, -1.2264404296875, -1.155517578125, -1.0845947265625, -1.013671875, -0.9427490234375, -0.871826171875, -0.8009033203125, -0.72998046875, -0.6590576171875, -0.588134765625, -0.5172119140625, -0.4462890625, -0.3753662109375, -0.304443359375, -0.2335205078125, -0.16259765625, -0.0916748046875, -0.020751953125, 0.0501708984375, 0.12109375, 0.1920166015625, 0.262939453125, 0.3338623046875, 0.40478515625, 0.4757080078125, 0.546630859375, 0.6175537109375, 0.6884765625, 0.7593994140625, 0.830322265625, 0.9012451171875, 0.97216796875, 1.0430908203125, 1.114013671875, 1.1849365234375, 1.255859375, 1.3267822265625, 1.397705078125, 1.4686279296875, 1.53955078125, 1.6104736328125, 1.681396484375, 1.7523193359375, 1.8232421875, 1.8941650390625, 1.965087890625, 2.0360107421875, 2.10693359375, 2.1778564453125, 2.248779296875, 2.3197021484375, 2.390625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 1.0, 2.0, 5.0, 16.0, 8.0, 16.0, 21.0, 44.0, 61.0, 96.0, 139.0, 211.0, 129.0, 76.0, 43.0, 37.0, 32.0, 16.0, 23.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.724609375, -3.63677978515625, -3.5489501953125, -3.46112060546875, -3.373291015625, -3.28546142578125, -3.1976318359375, -3.10980224609375, -3.02197265625, -2.93414306640625, -2.8463134765625, -2.75848388671875, -2.670654296875, -2.58282470703125, -2.4949951171875, -2.40716552734375, -2.3193359375, -2.23150634765625, -2.1436767578125, -2.05584716796875, -1.968017578125, -1.88018798828125, -1.7923583984375, -1.70452880859375, -1.61669921875, -1.52886962890625, -1.4410400390625, -1.35321044921875, -1.265380859375, -1.17755126953125, -1.0897216796875, -1.00189208984375, -0.9140625, -0.82623291015625, -0.7384033203125, -0.65057373046875, -0.562744140625, -0.47491455078125, -0.3870849609375, -0.29925537109375, -0.21142578125, -0.12359619140625, -0.0357666015625, 0.05206298828125, 0.139892578125, 0.22772216796875, 0.3155517578125, 0.40338134765625, 0.4912109375, 0.57904052734375, 0.6668701171875, 0.75469970703125, 0.842529296875, 0.93035888671875, 1.0181884765625, 1.10601806640625, 1.19384765625, 1.28167724609375, 1.3695068359375, 1.45733642578125, 1.545166015625, 1.63299560546875, 1.7208251953125, 1.80865478515625, 1.896484375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 12.0, 91.0, 445.0, 366.0, 73.0, 12.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.65074157714844, -34.00177764892578, -31.352811813354492, -28.703847885131836, -26.054882049560547, -23.40591812133789, -20.756954193115234, -18.107988357543945, -15.459024429321289, -12.810059547424316, -10.161094665527344, -7.5121307373046875, -4.863165855407715, -2.214200973510742, 0.43476295471191406, 3.083728790283203, 5.732692718505859, 8.381657600402832, 11.030622482299805, 13.679586410522461, 16.32855224609375, 18.977516174316406, 21.626480102539062, 24.27544593811035, 26.924409866333008, 29.573373794555664, 32.22233963012695, 34.87130355834961, 37.520267486572266, 40.16923522949219, 42.818199157714844, 45.4671630859375, 48.116127014160156, 50.76509094238281, 53.41405487060547, 56.063018798828125, 58.71198654174805, 61.3609504699707, 64.00991821289062, 66.65888214111328, 69.30784606933594, 71.9568099975586, 74.60577392578125, 77.2547378540039, 79.90370178222656, 82.55267333984375, 85.20162963867188, 87.85060119628906, 90.49955749511719, 93.14852142333984, 95.7974853515625, 98.44644927978516, 101.09541320800781, 103.744384765625, 106.39334106445312, 109.04231262207031, 111.69127655029297, 114.34024047851562, 116.98920440673828, 119.63816833496094, 122.2871322631836, 124.93609619140625, 127.58506774902344, 130.23402404785156, 132.88299560546875]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 15.0, 22.0, 21.0, 20.0, 21.0, 28.0, 30.0, 34.0, 31.0, 43.0, 51.0, 42.0, 42.0, 58.0, 41.0, 42.0, 50.0, 53.0, 44.0, 36.0, 31.0, 33.0, 27.0, 27.0, 35.0, 30.0, 21.0, 11.0, 6.0, 8.0, 4.0, 3.0, 8.0, 6.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-27.014636993408203, -26.159589767456055, -25.30454444885254, -24.44949722290039, -23.594451904296875, -22.739404678344727, -21.884357452392578, -21.029312133789062, -20.174264907836914, -19.319217681884766, -18.46417236328125, -17.6091251373291, -16.754077911376953, -15.899032592773438, -15.043985366821289, -14.188939094543457, -13.333892822265625, -12.478846549987793, -11.623800277709961, -10.768753051757812, -9.91370677947998, -9.058660507202148, -8.20361328125, -7.348567008972168, -6.493520736694336, -5.638474464416504, -4.783427715301514, -3.9283812046051025, -3.0733346939086914, -2.2182884216308594, -1.3632416725158691, -0.5081949234008789, 0.3468494415283203, 1.2018959522247314, 2.0569424629211426, 2.9119889736175537, 3.767035484313965, 4.622081756591797, 5.477128505706787, 6.332175254821777, 7.187221527099609, 8.042267799377441, 8.897314071655273, 9.752361297607422, 10.607407569885254, 11.462453842163086, 12.317501068115234, 13.172547340393066, 14.027593612670898, 14.88263988494873, 15.737686157226562, 16.59273338317871, 17.44778060913086, 18.302825927734375, 19.157873153686523, 20.012920379638672, 20.867965698242188, 21.723012924194336, 22.57805824279785, 23.43310546875, 24.288150787353516, 25.143198013305664, 25.998245239257812, 26.853290557861328, 27.708337783813477]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 7.0, 6.0, 12.0, 18.0, 14.0, 19.0, 23.0, 32.0, 31.0, 32.0, 47.0, 51.0, 67.0, 97.0, 134.0, 265.0, 618.0, 1880.0, 7617.0, 3979910.0, 193902.0, 6394.0, 1720.0, 538.0, 260.0, 135.0, 79.0, 60.0, 49.0, 50.0, 40.0, 30.0, 26.0, 24.0, 17.0, 18.0, 10.0, 10.0, 10.0, 6.0, 6.0, 1.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7265625, -4.56329345703125, -4.4000244140625, -4.23675537109375, -4.073486328125, -3.91021728515625, -3.7469482421875, -3.58367919921875, -3.42041015625, -3.25714111328125, -3.0938720703125, -2.93060302734375, -2.767333984375, -2.60406494140625, -2.4407958984375, -2.27752685546875, -2.1142578125, -1.95098876953125, -1.7877197265625, -1.62445068359375, -1.461181640625, -1.29791259765625, -1.1346435546875, -0.97137451171875, -0.80810546875, -0.64483642578125, -0.4815673828125, -0.31829833984375, -0.155029296875, 0.00823974609375, 0.1715087890625, 0.33477783203125, 0.498046875, 0.66131591796875, 0.8245849609375, 0.98785400390625, 1.151123046875, 1.31439208984375, 1.4776611328125, 1.64093017578125, 1.80419921875, 1.96746826171875, 2.1307373046875, 2.29400634765625, 2.457275390625, 2.62054443359375, 2.7838134765625, 2.94708251953125, 3.1103515625, 3.27362060546875, 3.4368896484375, 3.60015869140625, 3.763427734375, 3.92669677734375, 4.0899658203125, 4.25323486328125, 4.41650390625, 4.57977294921875, 4.7430419921875, 4.90631103515625, 5.069580078125, 5.23284912109375, 5.3961181640625, 5.55938720703125, 5.72265625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 0.0, 0.0, 5.0, 3.0, 2.0, 8.0, 7.0, 7.0, 8.0, 8.0, 14.0, 8.0, 18.0, 23.0, 29.0, 30.0, 34.0, 43.0, 44.0, 41.0, 34.0, 41.0, 37.0, 40.0, 43.0, 52.0, 51.0, 37.0, 42.0, 26.0, 32.0, 32.0, 20.0, 28.0, 35.0, 15.0, 20.0, 21.0, 14.0, 13.0, 10.0, 13.0, 5.0, 2.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1826171875, -1.1425018310546875, -1.102386474609375, -1.0622711181640625, -1.02215576171875, -0.9820404052734375, -0.941925048828125, -0.9018096923828125, -0.8616943359375, -0.8215789794921875, -0.781463623046875, -0.7413482666015625, -0.70123291015625, -0.6611175537109375, -0.621002197265625, -0.5808868408203125, -0.540771484375, -0.5006561279296875, -0.460540771484375, -0.4204254150390625, -0.38031005859375, -0.3401947021484375, -0.300079345703125, -0.2599639892578125, -0.2198486328125, -0.1797332763671875, -0.139617919921875, -0.0995025634765625, -0.05938720703125, -0.0192718505859375, 0.020843505859375, 0.0609588623046875, 0.10107421875, 0.1411895751953125, 0.181304931640625, 0.2214202880859375, 0.26153564453125, 0.3016510009765625, 0.341766357421875, 0.3818817138671875, 0.4219970703125, 0.4621124267578125, 0.502227783203125, 0.5423431396484375, 0.58245849609375, 0.6225738525390625, 0.662689208984375, 0.7028045654296875, 0.742919921875, 0.7830352783203125, 0.823150634765625, 0.8632659912109375, 0.90338134765625, 0.9434967041015625, 0.983612060546875, 1.0237274169921875, 1.0638427734375, 1.1039581298828125, 1.144073486328125, 1.1841888427734375, 1.22430419921875, 1.2644195556640625, 1.304534912109375, 1.3446502685546875, 1.384765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 4.0, 9.0, 11.0, 8.0, 15.0, 29.0, 34.0, 36.0, 49.0, 75.0, 141.0, 269.0, 684.0, 2846.0, 4069245.0, 116796.0, 2552.0, 743.0, 265.0, 145.0, 87.0, 73.0, 47.0, 38.0, 16.0, 15.0, 15.0, 14.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.359375, -8.96875, -8.578125, -8.1875, -7.796875, -7.40625, -7.015625, -6.625, -6.234375, -5.84375, -5.453125, -5.0625, -4.671875, -4.28125, -3.890625, -3.5, -3.109375, -2.71875, -2.328125, -1.9375, -1.546875, -1.15625, -0.765625, -0.375, 0.015625, 0.40625, 0.796875, 1.1875, 1.578125, 1.96875, 2.359375, 2.75, 3.140625, 3.53125, 3.921875, 4.3125, 4.703125, 5.09375, 5.484375, 5.875, 6.265625, 6.65625, 7.046875, 7.4375, 7.828125, 8.21875, 8.609375, 9.0, 9.390625, 9.78125, 10.171875, 10.5625, 10.953125, 11.34375, 11.734375, 12.125, 12.515625, 12.90625, 13.296875, 13.6875, 14.078125, 14.46875, 14.859375, 15.25, 15.640625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 29.0, 3911.0, 105.0, 13.0, 3.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5517578125, -1.4595794677734375, -1.367401123046875, -1.2752227783203125, -1.18304443359375, -1.0908660888671875, -0.998687744140625, -0.9065093994140625, -0.8143310546875, -0.7221527099609375, -0.629974365234375, -0.5377960205078125, -0.44561767578125, -0.3534393310546875, -0.261260986328125, -0.1690826416015625, -0.076904296875, 0.0152740478515625, 0.107452392578125, 0.1996307373046875, 0.29180908203125, 0.3839874267578125, 0.476165771484375, 0.5683441162109375, 0.6605224609375, 0.7527008056640625, 0.844879150390625, 0.9370574951171875, 1.02923583984375, 1.1214141845703125, 1.213592529296875, 1.3057708740234375, 1.39794921875, 1.4901275634765625, 1.582305908203125, 1.6744842529296875, 1.76666259765625, 1.8588409423828125, 1.951019287109375, 2.0431976318359375, 2.1353759765625, 2.2275543212890625, 2.319732666015625, 2.4119110107421875, 2.50408935546875, 2.5962677001953125, 2.688446044921875, 2.7806243896484375, 2.872802734375, 2.9649810791015625, 3.057159423828125, 3.1493377685546875, 3.24151611328125, 3.3336944580078125, 3.425872802734375, 3.5180511474609375, 3.6102294921875, 3.7024078369140625, 3.794586181640625, 3.8867645263671875, 3.97894287109375, 4.0711212158203125, 4.163299560546875, 4.2554779052734375, 4.34765625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 4.0, 17.0, 33.0, 69.0, 203.0, 252.0, 205.0, 107.0, 45.0, 32.0, 13.0, 8.0, 6.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4273147583007812, -3.2193522453308105, -3.01138973236084, -2.80342698097229, -2.5954644680023193, -2.3875019550323486, -2.179539203643799, -1.9715766906738281, -1.7636141777038574, -1.5556516647338867, -1.3476890325546265, -1.1397264003753662, -0.9317638874053955, -0.7238013744354248, -0.5158387422561646, -0.3078761100769043, -0.0999135971069336, 0.10804897546768188, 0.31601154804229736, 0.5239741206169128, 0.7319366931915283, 0.939899206161499, 1.1478618383407593, 1.3558244705200195, 1.5637869834899902, 1.771749496459961, 1.9797121286392212, 2.1876747608184814, 2.395637273788452, 2.603599786758423, 2.8115625381469727, 3.0195250511169434, 3.227487564086914, 3.4354500770568848, 3.6434125900268555, 3.8513753414154053, 4.059337615966797, 4.267300605773926, 4.4752631187438965, 4.683225631713867, 4.891188144683838, 5.099150657653809, 5.307113170623779, 5.51507568359375, 5.723038673400879, 5.931000709533691, 6.13896369934082, 6.346926212310791, 6.554888725280762, 6.762851238250732, 6.970813751220703, 7.178776264190674, 7.3867387771606445, 7.594701766967773, 7.802664279937744, 8.010626792907715, 8.218589782714844, 8.426552772521973, 8.634514808654785, 8.842477798461914, 9.050439834594727, 9.258402824401855, 9.466364860534668, 9.674327850341797, 9.88228988647461]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 5.0, 5.0, 11.0, 12.0, 6.0, 14.0, 21.0, 18.0, 21.0, 32.0, 21.0, 29.0, 32.0, 38.0, 47.0, 38.0, 56.0, 55.0, 48.0, 46.0, 58.0, 41.0, 38.0, 35.0, 44.0, 37.0, 32.0, 24.0, 21.0, 22.0, 16.0, 17.0, 12.0, 8.0, 13.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.9107766151428223, -3.8045763969421387, -3.698376178741455, -3.5921757221221924, -3.485975503921509, -3.379775285720825, -3.2735750675201416, -3.167374610900879, -3.0611743927001953, -2.9549741744995117, -2.848773956298828, -2.7425734996795654, -2.636373281478882, -2.5301730632781982, -2.4239728450775146, -2.317772388458252, -2.2115721702575684, -2.1053719520568848, -1.9991716146469116, -1.892971396446228, -1.7867710590362549, -1.6805708408355713, -1.5743706226348877, -1.4681702852249146, -1.3619701862335205, -1.255769968032837, -1.1495696306228638, -1.0433694124221802, -0.937169075012207, -0.8309688568115234, -0.7247685790061951, -0.6185683012008667, -0.5123679637908936, -0.4061676859855652, -0.2999674081802368, -0.19376716017723083, -0.08756688237190247, 0.018633365631103516, 0.12483364343643188, 0.23103392124176025, 0.3372341990470886, 0.443434476852417, 0.5496347546577454, 0.6558350324630737, 0.7620352506637573, 0.8682355284690857, 0.9744358062744141, 1.0806360244750977, 1.1868363618850708, 1.2930365800857544, 1.3992369174957275, 1.5054371356964111, 1.6116374731063843, 1.7178376913070679, 1.824038028717041, 1.9302382469177246, 2.036438465118408, 2.142638683319092, 2.2488389015197754, 2.355039358139038, 2.4612395763397217, 2.5674397945404053, 2.673640012741089, 2.7798404693603516, 2.886040687561035]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 5.0, 11.0, 8.0, 11.0, 6.0, 15.0, 14.0, 13.0, 19.0, 30.0, 31.0, 45.0, 59.0, 80.0, 131.0, 243.0, 480.0, 973.0, 2007.0, 4522.0, 10643.0, 27504.0, 77509.0, 234945.0, 401447.0, 187374.0, 61734.0, 22371.0, 8877.0, 3754.0, 1762.0, 806.0, 436.0, 232.0, 143.0, 70.0, 43.0, 44.0, 22.0, 25.0, 23.0, 22.0, 10.0, 13.0, 10.0, 7.0, 4.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0], "bins": [-2.341796875, -2.273712158203125, -2.20562744140625, -2.137542724609375, -2.0694580078125, -2.001373291015625, -1.93328857421875, -1.865203857421875, -1.797119140625, -1.729034423828125, -1.66094970703125, -1.592864990234375, -1.5247802734375, -1.456695556640625, -1.38861083984375, -1.320526123046875, -1.25244140625, -1.184356689453125, -1.11627197265625, -1.048187255859375, -0.9801025390625, -0.912017822265625, -0.84393310546875, -0.775848388671875, -0.707763671875, -0.639678955078125, -0.57159423828125, -0.503509521484375, -0.4354248046875, -0.367340087890625, -0.29925537109375, -0.231170654296875, -0.1630859375, -0.095001220703125, -0.02691650390625, 0.041168212890625, 0.1092529296875, 0.177337646484375, 0.24542236328125, 0.313507080078125, 0.381591796875, 0.449676513671875, 0.51776123046875, 0.585845947265625, 0.6539306640625, 0.722015380859375, 0.79010009765625, 0.858184814453125, 0.92626953125, 0.994354248046875, 1.06243896484375, 1.130523681640625, 1.1986083984375, 1.266693115234375, 1.33477783203125, 1.402862548828125, 1.470947265625, 1.539031982421875, 1.60711669921875, 1.675201416015625, 1.7432861328125, 1.811370849609375, 1.87945556640625, 1.947540283203125, 2.015625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 7.0, 9.0, 10.0, 11.0, 10.0, 17.0, 14.0, 12.0, 19.0, 23.0, 35.0, 32.0, 25.0, 34.0, 36.0, 36.0, 39.0, 55.0, 37.0, 31.0, 39.0, 51.0, 45.0, 36.0, 41.0, 37.0, 24.0, 31.0, 19.0, 29.0, 29.0, 17.0, 18.0, 19.0, 10.0, 13.0, 8.0, 5.0, 8.0, 9.0, 7.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.390625, -1.343994140625, -1.29736328125, -1.250732421875, -1.2041015625, -1.157470703125, -1.11083984375, -1.064208984375, -1.017578125, -0.970947265625, -0.92431640625, -0.877685546875, -0.8310546875, -0.784423828125, -0.73779296875, -0.691162109375, -0.64453125, -0.597900390625, -0.55126953125, -0.504638671875, -0.4580078125, -0.411376953125, -0.36474609375, -0.318115234375, -0.271484375, -0.224853515625, -0.17822265625, -0.131591796875, -0.0849609375, -0.038330078125, 0.00830078125, 0.054931640625, 0.1015625, 0.148193359375, 0.19482421875, 0.241455078125, 0.2880859375, 0.334716796875, 0.38134765625, 0.427978515625, 0.474609375, 0.521240234375, 0.56787109375, 0.614501953125, 0.6611328125, 0.707763671875, 0.75439453125, 0.801025390625, 0.84765625, 0.894287109375, 0.94091796875, 0.987548828125, 1.0341796875, 1.080810546875, 1.12744140625, 1.174072265625, 1.220703125, 1.267333984375, 1.31396484375, 1.360595703125, 1.4072265625, 1.453857421875, 1.50048828125, 1.547119140625, 1.59375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 1.0, 6.0, 4.0, 6.0, 10.0, 9.0, 20.0, 18.0, 26.0, 43.0, 62.0, 91.0, 124.0, 183.0, 270.0, 565.0, 1372.0, 5665.0, 49725.0, 800144.0, 174153.0, 11964.0, 2267.0, 742.0, 368.0, 235.0, 129.0, 89.0, 65.0, 50.0, 34.0, 26.0, 24.0, 18.0, 12.0, 10.0, 2.0, 7.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.67578125, -6.493896484375, -6.31201171875, -6.130126953125, -5.9482421875, -5.766357421875, -5.58447265625, -5.402587890625, -5.220703125, -5.038818359375, -4.85693359375, -4.675048828125, -4.4931640625, -4.311279296875, -4.12939453125, -3.947509765625, -3.765625, -3.583740234375, -3.40185546875, -3.219970703125, -3.0380859375, -2.856201171875, -2.67431640625, -2.492431640625, -2.310546875, -2.128662109375, -1.94677734375, -1.764892578125, -1.5830078125, -1.401123046875, -1.21923828125, -1.037353515625, -0.85546875, -0.673583984375, -0.49169921875, -0.309814453125, -0.1279296875, 0.053955078125, 0.23583984375, 0.417724609375, 0.599609375, 0.781494140625, 0.96337890625, 1.145263671875, 1.3271484375, 1.509033203125, 1.69091796875, 1.872802734375, 2.0546875, 2.236572265625, 2.41845703125, 2.600341796875, 2.7822265625, 2.964111328125, 3.14599609375, 3.327880859375, 3.509765625, 3.691650390625, 3.87353515625, 4.055419921875, 4.2373046875, 4.419189453125, 4.60107421875, 4.782958984375, 4.96484375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 4.0, 8.0, 9.0, 4.0, 11.0, 13.0, 13.0, 14.0, 26.0, 26.0, 23.0, 35.0, 32.0, 31.0, 30.0, 36.0, 40.0, 43.0, 42.0, 53.0, 49.0, 43.0, 55.0, 38.0, 48.0, 29.0, 39.0, 23.0, 13.0, 31.0, 21.0, 18.0, 14.0, 19.0, 20.0, 10.0, 8.0, 9.0, 2.0, 6.0, 5.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.93359375, -5.70587158203125, -5.4781494140625, -5.25042724609375, -5.022705078125, -4.79498291015625, -4.5672607421875, -4.33953857421875, -4.11181640625, -3.88409423828125, -3.6563720703125, -3.42864990234375, -3.200927734375, -2.97320556640625, -2.7454833984375, -2.51776123046875, -2.2900390625, -2.06231689453125, -1.8345947265625, -1.60687255859375, -1.379150390625, -1.15142822265625, -0.9237060546875, -0.69598388671875, -0.46826171875, -0.24053955078125, -0.0128173828125, 0.21490478515625, 0.442626953125, 0.67034912109375, 0.8980712890625, 1.12579345703125, 1.353515625, 1.58123779296875, 1.8089599609375, 2.03668212890625, 2.264404296875, 2.49212646484375, 2.7198486328125, 2.94757080078125, 3.17529296875, 3.40301513671875, 3.6307373046875, 3.85845947265625, 4.086181640625, 4.31390380859375, 4.5416259765625, 4.76934814453125, 4.9970703125, 5.22479248046875, 5.4525146484375, 5.68023681640625, 5.907958984375, 6.13568115234375, 6.3634033203125, 6.59112548828125, 6.81884765625, 7.04656982421875, 7.2742919921875, 7.50201416015625, 7.729736328125, 7.95745849609375, 8.1851806640625, 8.41290283203125, 8.640625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 7.0, 11.0, 17.0, 16.0, 28.0, 43.0, 82.0, 155.0, 355.0, 868.0, 2958.0, 14288.0, 280541.0, 719706.0, 23390.0, 4096.0, 1175.0, 401.0, 167.0, 101.0, 50.0, 40.0, 23.0, 12.0, 12.0, 1.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.142578125, -3.05047607421875, -2.9583740234375, -2.86627197265625, -2.774169921875, -2.68206787109375, -2.5899658203125, -2.49786376953125, -2.40576171875, -2.31365966796875, -2.2215576171875, -2.12945556640625, -2.037353515625, -1.94525146484375, -1.8531494140625, -1.76104736328125, -1.6689453125, -1.57684326171875, -1.4847412109375, -1.39263916015625, -1.300537109375, -1.20843505859375, -1.1163330078125, -1.02423095703125, -0.93212890625, -0.84002685546875, -0.7479248046875, -0.65582275390625, -0.563720703125, -0.47161865234375, -0.3795166015625, -0.28741455078125, -0.1953125, -0.10321044921875, -0.0111083984375, 0.08099365234375, 0.173095703125, 0.26519775390625, 0.3572998046875, 0.44940185546875, 0.54150390625, 0.63360595703125, 0.7257080078125, 0.81781005859375, 0.909912109375, 1.00201416015625, 1.0941162109375, 1.18621826171875, 1.2783203125, 1.37042236328125, 1.4625244140625, 1.55462646484375, 1.646728515625, 1.73883056640625, 1.8309326171875, 1.92303466796875, 2.01513671875, 2.10723876953125, 2.1993408203125, 2.29144287109375, 2.383544921875, 2.47564697265625, 2.5677490234375, 2.65985107421875, 2.751953125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 5.0, 8.0, 8.0, 14.0, 19.0, 34.0, 44.0, 107.0, 164.0, 191.0, 151.0, 108.0, 61.0, 26.0, 20.0, 17.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001786947250366211, -0.000169483944773674, -0.00016027316451072693, -0.00015106238424777985, -0.00014185160398483276, -0.00013264082372188568, -0.0001234300434589386, -0.00011421926319599152, -0.00010500848293304443, -9.579770267009735e-05, -8.658692240715027e-05, -7.737614214420319e-05, -6.81653618812561e-05, -5.895458161830902e-05, -4.974380135536194e-05, -4.0533021092414856e-05, -3.1322240829467773e-05, -2.211146056652069e-05, -1.2900680303573608e-05, -3.689900040626526e-06, 5.520880222320557e-06, 1.473166048526764e-05, 2.394244074821472e-05, 3.3153221011161804e-05, 4.236400127410889e-05, 5.157478153705597e-05, 6.078556180000305e-05, 6.999634206295013e-05, 7.920712232589722e-05, 8.84179025888443e-05, 9.762868285179138e-05, 0.00010683946311473846, 0.00011605024337768555, 0.00012526102364063263, 0.0001344718039035797, 0.0001436825841665268, 0.00015289336442947388, 0.00016210414469242096, 0.00017131492495536804, 0.00018052570521831512, 0.0001897364854812622, 0.0001989472657442093, 0.00020815804600715637, 0.00021736882627010345, 0.00022657960653305054, 0.00023579038679599762, 0.0002450011670589447, 0.0002542119473218918, 0.00026342272758483887, 0.00027263350784778595, 0.00028184428811073303, 0.0002910550683736801, 0.0003002658486366272, 0.0003094766288995743, 0.00031868740916252136, 0.00032789818942546844, 0.00033710896968841553, 0.0003463197499513626, 0.0003555305302143097, 0.0003647413104772568, 0.00037395209074020386, 0.00038316287100315094, 0.000392373651266098, 0.0004015844315290451, 0.0004107952117919922]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 8.0, 11.0, 12.0, 33.0, 25.0, 71.0, 124.0, 370.0, 1174.0, 6035.0, 106597.0, 904899.0, 24966.0, 3051.0, 722.0, 229.0, 96.0, 47.0, 29.0, 25.0, 10.0, 6.0, 5.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.01953125, -2.895263671875, -2.77099609375, -2.646728515625, -2.5224609375, -2.398193359375, -2.27392578125, -2.149658203125, -2.025390625, -1.901123046875, -1.77685546875, -1.652587890625, -1.5283203125, -1.404052734375, -1.27978515625, -1.155517578125, -1.03125, -0.906982421875, -0.78271484375, -0.658447265625, -0.5341796875, -0.409912109375, -0.28564453125, -0.161376953125, -0.037109375, 0.087158203125, 0.21142578125, 0.335693359375, 0.4599609375, 0.584228515625, 0.70849609375, 0.832763671875, 0.95703125, 1.081298828125, 1.20556640625, 1.329833984375, 1.4541015625, 1.578369140625, 1.70263671875, 1.826904296875, 1.951171875, 2.075439453125, 2.19970703125, 2.323974609375, 2.4482421875, 2.572509765625, 2.69677734375, 2.821044921875, 2.9453125, 3.069580078125, 3.19384765625, 3.318115234375, 3.4423828125, 3.566650390625, 3.69091796875, 3.815185546875, 3.939453125, 4.063720703125, 4.18798828125, 4.312255859375, 4.4365234375, 4.560791015625, 4.68505859375, 4.809326171875, 4.93359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 8.0, 6.0, 13.0, 16.0, 29.0, 43.0, 68.0, 105.0, 150.0, 148.0, 159.0, 84.0, 56.0, 40.0, 19.0, 14.0, 17.0, 7.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.603515625, -2.50115966796875, -2.3988037109375, -2.29644775390625, -2.194091796875, -2.09173583984375, -1.9893798828125, -1.88702392578125, -1.78466796875, -1.68231201171875, -1.5799560546875, -1.47760009765625, -1.375244140625, -1.27288818359375, -1.1705322265625, -1.06817626953125, -0.9658203125, -0.86346435546875, -0.7611083984375, -0.65875244140625, -0.556396484375, -0.45404052734375, -0.3516845703125, -0.24932861328125, -0.14697265625, -0.04461669921875, 0.0577392578125, 0.16009521484375, 0.262451171875, 0.36480712890625, 0.4671630859375, 0.56951904296875, 0.671875, 0.77423095703125, 0.8765869140625, 0.97894287109375, 1.081298828125, 1.18365478515625, 1.2860107421875, 1.38836669921875, 1.49072265625, 1.59307861328125, 1.6954345703125, 1.79779052734375, 1.900146484375, 2.00250244140625, 2.1048583984375, 2.20721435546875, 2.3095703125, 2.41192626953125, 2.5142822265625, 2.61663818359375, 2.718994140625, 2.82135009765625, 2.9237060546875, 3.02606201171875, 3.12841796875, 3.23077392578125, 3.3331298828125, 3.43548583984375, 3.537841796875, 3.64019775390625, 3.7425537109375, 3.84490966796875, 3.947265625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 35.0, 81.0, 162.0, 253.0, 204.0, 135.0, 66.0, 42.0, 9.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-75.76907348632812, -74.25141906738281, -72.7337646484375, -71.21611022949219, -69.69845581054688, -68.18080139160156, -66.66314697265625, -65.14550018310547, -63.627845764160156, -62.110191345214844, -60.59253692626953, -59.07488250732422, -57.55723190307617, -56.03957748413086, -54.52192306518555, -53.004268646240234, -51.48661422729492, -49.96895980834961, -48.4513053894043, -46.93365478515625, -45.41600036621094, -43.898345947265625, -42.38069152832031, -40.863037109375, -39.34538269042969, -37.827728271484375, -36.31007385253906, -34.79241943359375, -33.2747688293457, -31.75711441040039, -30.239459991455078, -28.721805572509766, -27.204158782958984, -25.686504364013672, -24.168851852416992, -22.65119743347168, -21.133544921875, -19.615890502929688, -18.098236083984375, -16.580581665039062, -15.062929153442383, -13.545275688171387, -12.02762222290039, -10.509967803955078, -8.992314338684082, -7.474660873413086, -5.957006454467773, -4.439352989196777, -2.9216995239257812, -1.404045820236206, 0.11360788345336914, 1.6312618255615234, 3.1489152908325195, 4.666568756103516, 6.184223175048828, 7.701876640319824, 9.21953010559082, 10.737183570861816, 12.254837036132812, 13.772491455078125, 15.290144920349121, 16.807798385620117, 18.32545280456543, 19.84310531616211, 21.360759735107422]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 3.0, 6.0, 6.0, 12.0, 7.0, 7.0, 15.0, 18.0, 14.0, 27.0, 20.0, 20.0, 23.0, 39.0, 38.0, 51.0, 39.0, 52.0, 41.0, 59.0, 55.0, 47.0, 51.0, 44.0, 47.0, 32.0, 29.0, 29.0, 16.0, 26.0, 32.0, 16.0, 20.0, 5.0, 12.0, 8.0, 13.0, 8.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.92325210571289, -31.663043975830078, -30.402835845947266, -29.142629623413086, -27.882421493530273, -26.62221336364746, -25.36200714111328, -24.10179901123047, -22.841590881347656, -21.581382751464844, -20.32117462158203, -19.06096839904785, -17.80076026916504, -16.540552139282227, -15.28034496307373, -14.020137786865234, -12.759929656982422, -11.49972152709961, -10.239514350891113, -8.979307174682617, -7.719099044799805, -6.45889139175415, -5.198683738708496, -3.9384765625, -2.6782684326171875, -1.4180607795715332, -0.1578531265258789, 1.1023545265197754, 2.3625621795654297, 3.622769832611084, 4.882977485656738, 6.143184661865234, 7.4033966064453125, 8.663604736328125, 9.923811912536621, 11.184019088745117, 12.44422721862793, 13.704435348510742, 14.964642524719238, 16.224849700927734, 17.485057830810547, 18.74526596069336, 20.005474090576172, 21.26568031311035, 22.525888442993164, 23.786096572875977, 25.046302795410156, 26.30651092529297, 27.56671905517578, 28.826927185058594, 30.087135314941406, 31.347341537475586, 32.60755157470703, 33.86775588989258, 35.12796401977539, 36.3881721496582, 37.648380279541016, 38.90858840942383, 40.16879653930664, 41.42900466918945, 42.689208984375, 43.94941711425781, 45.209625244140625, 46.46983337402344, 47.73004150390625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 7.0, 18.0, 23.0, 21.0, 25.0, 34.0, 42.0, 52.0, 79.0, 98.0, 208.0, 334.0, 635.0, 1418.0, 3683.0, 18747.0, 4100149.0, 58710.0, 6192.0, 1910.0, 825.0, 393.0, 209.0, 124.0, 80.0, 64.0, 44.0, 33.0, 27.0, 19.0, 15.0, 9.0, 15.0, 10.0, 4.0, 2.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.814453125, -2.71282958984375, -2.6112060546875, -2.50958251953125, -2.407958984375, -2.30633544921875, -2.2047119140625, -2.10308837890625, -2.00146484375, -1.89984130859375, -1.7982177734375, -1.69659423828125, -1.594970703125, -1.49334716796875, -1.3917236328125, -1.29010009765625, -1.1884765625, -1.08685302734375, -0.9852294921875, -0.88360595703125, -0.781982421875, -0.68035888671875, -0.5787353515625, -0.47711181640625, -0.37548828125, -0.27386474609375, -0.1722412109375, -0.07061767578125, 0.031005859375, 0.13262939453125, 0.2342529296875, 0.33587646484375, 0.4375, 0.53912353515625, 0.6407470703125, 0.74237060546875, 0.843994140625, 0.94561767578125, 1.0472412109375, 1.14886474609375, 1.25048828125, 1.35211181640625, 1.4537353515625, 1.55535888671875, 1.656982421875, 1.75860595703125, 1.8602294921875, 1.96185302734375, 2.0634765625, 2.16510009765625, 2.2667236328125, 2.36834716796875, 2.469970703125, 2.57159423828125, 2.6732177734375, 2.77484130859375, 2.87646484375, 2.97808837890625, 3.0797119140625, 3.18133544921875, 3.282958984375, 3.38458251953125, 3.4862060546875, 3.58782958984375, 3.689453125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 2.0, 12.0, 9.0, 8.0, 12.0, 17.0, 19.0, 18.0, 28.0, 36.0, 25.0, 31.0, 35.0, 41.0, 50.0, 35.0, 51.0, 44.0, 48.0, 48.0, 43.0, 29.0, 46.0, 42.0, 27.0, 30.0, 33.0, 27.0, 20.0, 23.0, 28.0, 11.0, 15.0, 8.0, 16.0, 7.0, 5.0, 2.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6650390625, -1.611846923828125, -1.55865478515625, -1.505462646484375, -1.4522705078125, -1.399078369140625, -1.34588623046875, -1.292694091796875, -1.239501953125, -1.186309814453125, -1.13311767578125, -1.079925537109375, -1.0267333984375, -0.973541259765625, -0.92034912109375, -0.867156982421875, -0.81396484375, -0.760772705078125, -0.70758056640625, -0.654388427734375, -0.6011962890625, -0.548004150390625, -0.49481201171875, -0.441619873046875, -0.388427734375, -0.335235595703125, -0.28204345703125, -0.228851318359375, -0.1756591796875, -0.122467041015625, -0.06927490234375, -0.016082763671875, 0.037109375, 0.090301513671875, 0.14349365234375, 0.196685791015625, 0.2498779296875, 0.303070068359375, 0.35626220703125, 0.409454345703125, 0.462646484375, 0.515838623046875, 0.56903076171875, 0.622222900390625, 0.6754150390625, 0.728607177734375, 0.78179931640625, 0.834991455078125, 0.88818359375, 0.941375732421875, 0.99456787109375, 1.047760009765625, 1.1009521484375, 1.154144287109375, 1.20733642578125, 1.260528564453125, 1.313720703125, 1.366912841796875, 1.42010498046875, 1.473297119140625, 1.5264892578125, 1.579681396484375, 1.63287353515625, 1.686065673828125, 1.7392578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 6.0, 10.0, 9.0, 8.0, 18.0, 19.0, 20.0, 23.0, 21.0, 26.0, 27.0, 35.0, 42.0, 38.0, 45.0, 135.0, 493.0, 9253.0, 4181518.0, 1860.0, 256.0, 80.0, 58.0, 40.0, 37.0, 37.0, 32.0, 27.0, 24.0, 22.0, 14.0, 20.0, 8.0, 6.0, 6.0, 7.0, 3.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.34375, -15.837890625, -15.33203125, -14.826171875, -14.3203125, -13.814453125, -13.30859375, -12.802734375, -12.296875, -11.791015625, -11.28515625, -10.779296875, -10.2734375, -9.767578125, -9.26171875, -8.755859375, -8.25, -7.744140625, -7.23828125, -6.732421875, -6.2265625, -5.720703125, -5.21484375, -4.708984375, -4.203125, -3.697265625, -3.19140625, -2.685546875, -2.1796875, -1.673828125, -1.16796875, -0.662109375, -0.15625, 0.349609375, 0.85546875, 1.361328125, 1.8671875, 2.373046875, 2.87890625, 3.384765625, 3.890625, 4.396484375, 4.90234375, 5.408203125, 5.9140625, 6.419921875, 6.92578125, 7.431640625, 7.9375, 8.443359375, 8.94921875, 9.455078125, 9.9609375, 10.466796875, 10.97265625, 11.478515625, 11.984375, 12.490234375, 12.99609375, 13.501953125, 14.0078125, 14.513671875, 15.01953125, 15.525390625, 16.03125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 21.0, 180.0, 3855.0, 21.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80859375, -0.67779541015625, -0.5469970703125, -0.41619873046875, -0.285400390625, -0.15460205078125, -0.0238037109375, 0.10699462890625, 0.23779296875, 0.36859130859375, 0.4993896484375, 0.63018798828125, 0.760986328125, 0.89178466796875, 1.0225830078125, 1.15338134765625, 1.2841796875, 1.41497802734375, 1.5457763671875, 1.67657470703125, 1.807373046875, 1.93817138671875, 2.0689697265625, 2.19976806640625, 2.33056640625, 2.46136474609375, 2.5921630859375, 2.72296142578125, 2.853759765625, 2.98455810546875, 3.1153564453125, 3.24615478515625, 3.376953125, 3.50775146484375, 3.6385498046875, 3.76934814453125, 3.900146484375, 4.03094482421875, 4.1617431640625, 4.29254150390625, 4.42333984375, 4.55413818359375, 4.6849365234375, 4.81573486328125, 4.946533203125, 5.07733154296875, 5.2081298828125, 5.33892822265625, 5.4697265625, 5.60052490234375, 5.7313232421875, 5.86212158203125, 5.992919921875, 6.12371826171875, 6.2545166015625, 6.38531494140625, 6.51611328125, 6.64691162109375, 6.7777099609375, 6.90850830078125, 7.039306640625, 7.17010498046875, 7.3009033203125, 7.43170166015625, 7.5625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 8.0, 20.0, 70.0, 414.0, 346.0, 103.0, 26.0, 20.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.981804847717285, -2.3991165161132812, -1.8164284229278564, -1.233740210533142, -0.6510519981384277, -0.06836366653442383, 0.514324426651001, 1.0970125198364258, 1.6797008514404297, 2.2623891830444336, 2.8450772762298584, 3.427765369415283, 4.010453701019287, 4.593142032623291, 5.175829887390137, 5.758518218994141, 6.3412065505981445, 6.923894882202148, 7.506583213806152, 8.089271545410156, 8.671958923339844, 9.254648208618164, 9.837335586547852, 10.420023918151855, 11.00271224975586, 11.585400581359863, 12.168088912963867, 12.750777244567871, 13.333465576171875, 13.916152954101562, 14.498841285705566, 15.08152961730957, 15.66421890258789, 16.246906280517578, 16.8295955657959, 17.412282943725586, 17.994972229003906, 18.577659606933594, 19.160348892211914, 19.7430362701416, 20.325725555419922, 20.90841293334961, 21.49110221862793, 22.073789596557617, 22.656478881835938, 23.239166259765625, 23.821855545043945, 24.404542922973633, 24.98723030090332, 25.569917678833008, 26.152606964111328, 26.735294342041016, 27.317983627319336, 27.900671005249023, 28.483360290527344, 29.06604766845703, 29.64873504638672, 30.231422424316406, 30.814111709594727, 31.396799087524414, 31.979488372802734, 32.56217575073242, 33.14486312866211, 33.72755432128906, 34.31024169921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 4.0, 11.0, 12.0, 10.0, 13.0, 12.0, 26.0, 16.0, 21.0, 28.0, 36.0, 28.0, 39.0, 44.0, 35.0, 39.0, 55.0, 51.0, 49.0, 40.0, 30.0, 52.0, 40.0, 42.0, 36.0, 36.0, 28.0, 22.0, 23.0, 17.0, 18.0, 14.0, 11.0, 13.0, 10.0, 8.0, 4.0, 7.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.090295314788818, -3.941415786743164, -3.792536497116089, -3.6436569690704346, -3.4947776794433594, -3.345898151397705, -3.197018623352051, -3.0481393337249756, -2.8992600440979004, -2.750380516052246, -2.601501226425171, -2.4526216983795166, -2.3037424087524414, -2.154862880706787, -2.005983352661133, -1.8571040630340576, -1.7082245349884033, -1.5593451261520386, -1.4104657173156738, -1.2615861892700195, -1.1127068996429443, -0.9638274312019348, -0.8149479627609253, -0.6660685539245605, -0.5171891450881958, -0.36830973625183105, -0.21943029761314392, -0.07055085897445679, 0.07832854986190796, 0.2272079586982727, 0.3760874271392822, 0.524966835975647, 0.6738462448120117, 0.8227256536483765, 0.9716050624847412, 1.1204845905303955, 1.2693638801574707, 1.418243408203125, 1.5671228170394897, 1.7160022258758545, 1.8648816347122192, 2.013761043548584, 2.1626405715942383, 2.3115198612213135, 2.4603993892669678, 2.609278678894043, 2.7581582069396973, 2.9070377349853516, 3.0559170246124268, 3.204796552658081, 3.3536758422851562, 3.5025553703308105, 3.6514346599578857, 3.80031418800354, 3.9491934776306152, 4.0980730056762695, 4.246952533721924, 4.395832061767578, 4.544711589813232, 4.6935906410217285, 4.842470169067383, 4.991349697113037, 5.140229225158691, 5.2891082763671875, 5.437987804412842]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 7.0, 15.0, 12.0, 14.0, 24.0, 34.0, 22.0, 48.0, 72.0, 91.0, 105.0, 208.0, 325.0, 632.0, 1167.0, 2668.0, 6301.0, 16624.0, 46503.0, 144732.0, 390998.0, 292608.0, 94042.0, 31108.0, 11496.0, 4458.0, 2019.0, 897.0, 470.0, 262.0, 165.0, 105.0, 83.0, 72.0, 27.0, 25.0, 22.0, 17.0, 18.0, 19.0, 10.0, 4.0, 8.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.13671875, -2.06256103515625, -1.9884033203125, -1.91424560546875, -1.840087890625, -1.76593017578125, -1.6917724609375, -1.61761474609375, -1.54345703125, -1.46929931640625, -1.3951416015625, -1.32098388671875, -1.246826171875, -1.17266845703125, -1.0985107421875, -1.02435302734375, -0.9501953125, -0.87603759765625, -0.8018798828125, -0.72772216796875, -0.653564453125, -0.57940673828125, -0.5052490234375, -0.43109130859375, -0.35693359375, -0.28277587890625, -0.2086181640625, -0.13446044921875, -0.060302734375, 0.01385498046875, 0.0880126953125, 0.16217041015625, 0.236328125, 0.31048583984375, 0.3846435546875, 0.45880126953125, 0.532958984375, 0.60711669921875, 0.6812744140625, 0.75543212890625, 0.82958984375, 0.90374755859375, 0.9779052734375, 1.05206298828125, 1.126220703125, 1.20037841796875, 1.2745361328125, 1.34869384765625, 1.4228515625, 1.49700927734375, 1.5711669921875, 1.64532470703125, 1.719482421875, 1.79364013671875, 1.8677978515625, 1.94195556640625, 2.01611328125, 2.09027099609375, 2.1644287109375, 2.23858642578125, 2.312744140625, 2.38690185546875, 2.4610595703125, 2.53521728515625, 2.609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 1.0, 1.0, 5.0, 4.0, 6.0, 6.0, 12.0, 13.0, 8.0, 19.0, 27.0, 21.0, 32.0, 33.0, 32.0, 30.0, 42.0, 40.0, 46.0, 48.0, 50.0, 45.0, 50.0, 39.0, 46.0, 47.0, 34.0, 30.0, 28.0, 34.0, 27.0, 25.0, 27.0, 14.0, 15.0, 18.0, 16.0, 4.0, 10.0, 4.0, 3.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.380859375, -2.3139495849609375, -2.247039794921875, -2.1801300048828125, -2.11322021484375, -2.0463104248046875, -1.979400634765625, -1.9124908447265625, -1.8455810546875, -1.7786712646484375, -1.711761474609375, -1.6448516845703125, -1.57794189453125, -1.5110321044921875, -1.444122314453125, -1.3772125244140625, -1.310302734375, -1.2433929443359375, -1.176483154296875, -1.1095733642578125, -1.04266357421875, -0.9757537841796875, -0.908843994140625, -0.8419342041015625, -0.7750244140625, -0.7081146240234375, -0.641204833984375, -0.5742950439453125, -0.50738525390625, -0.4404754638671875, -0.373565673828125, -0.3066558837890625, -0.23974609375, -0.1728363037109375, -0.105926513671875, -0.0390167236328125, 0.02789306640625, 0.0948028564453125, 0.161712646484375, 0.2286224365234375, 0.2955322265625, 0.3624420166015625, 0.429351806640625, 0.4962615966796875, 0.56317138671875, 0.6300811767578125, 0.696990966796875, 0.7639007568359375, 0.830810546875, 0.8977203369140625, 0.964630126953125, 1.0315399169921875, 1.09844970703125, 1.1653594970703125, 1.232269287109375, 1.2991790771484375, 1.3660888671875, 1.4329986572265625, 1.499908447265625, 1.5668182373046875, 1.63372802734375, 1.7006378173828125, 1.767547607421875, 1.8344573974609375, 1.9013671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 6.0, 7.0, 8.0, 13.0, 13.0, 20.0, 32.0, 34.0, 55.0, 65.0, 85.0, 146.0, 227.0, 449.0, 1015.0, 3452.0, 30894.0, 798764.0, 199535.0, 10250.0, 1883.0, 637.0, 313.0, 201.0, 129.0, 79.0, 57.0, 45.0, 28.0, 19.0, 22.0, 13.0, 17.0, 8.0, 11.0, 8.0, 4.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9765625, -6.7498779296875, -6.523193359375, -6.2965087890625, -6.06982421875, -5.8431396484375, -5.616455078125, -5.3897705078125, -5.1630859375, -4.9364013671875, -4.709716796875, -4.4830322265625, -4.25634765625, -4.0296630859375, -3.802978515625, -3.5762939453125, -3.349609375, -3.1229248046875, -2.896240234375, -2.6695556640625, -2.44287109375, -2.2161865234375, -1.989501953125, -1.7628173828125, -1.5361328125, -1.3094482421875, -1.082763671875, -0.8560791015625, -0.62939453125, -0.4027099609375, -0.176025390625, 0.0506591796875, 0.27734375, 0.5040283203125, 0.730712890625, 0.9573974609375, 1.18408203125, 1.4107666015625, 1.637451171875, 1.8641357421875, 2.0908203125, 2.3175048828125, 2.544189453125, 2.7708740234375, 2.99755859375, 3.2242431640625, 3.450927734375, 3.6776123046875, 3.904296875, 4.1309814453125, 4.357666015625, 4.5843505859375, 4.81103515625, 5.0377197265625, 5.264404296875, 5.4910888671875, 5.7177734375, 5.9444580078125, 6.171142578125, 6.3978271484375, 6.62451171875, 6.8511962890625, 7.077880859375, 7.3045654296875, 7.53125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 12.0, 15.0, 16.0, 29.0, 25.0, 31.0, 49.0, 43.0, 58.0, 66.0, 82.0, 60.0, 61.0, 82.0, 74.0, 53.0, 53.0, 45.0, 33.0, 31.0, 19.0, 14.0, 10.0, 6.0, 5.0, 6.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.6640625, -15.224609375, -14.78515625, -14.345703125, -13.90625, -13.466796875, -13.02734375, -12.587890625, -12.1484375, -11.708984375, -11.26953125, -10.830078125, -10.390625, -9.951171875, -9.51171875, -9.072265625, -8.6328125, -8.193359375, -7.75390625, -7.314453125, -6.875, -6.435546875, -5.99609375, -5.556640625, -5.1171875, -4.677734375, -4.23828125, -3.798828125, -3.359375, -2.919921875, -2.48046875, -2.041015625, -1.6015625, -1.162109375, -0.72265625, -0.283203125, 0.15625, 0.595703125, 1.03515625, 1.474609375, 1.9140625, 2.353515625, 2.79296875, 3.232421875, 3.671875, 4.111328125, 4.55078125, 4.990234375, 5.4296875, 5.869140625, 6.30859375, 6.748046875, 7.1875, 7.626953125, 8.06640625, 8.505859375, 8.9453125, 9.384765625, 9.82421875, 10.263671875, 10.703125, 11.142578125, 11.58203125, 12.021484375, 12.4609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 7.0, 6.0, 9.0, 25.0, 60.0, 224.0, 3422.0, 1040811.0, 3625.0, 263.0, 62.0, 23.0, 10.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-19.984375, -19.5546875, -19.125, -18.6953125, -18.265625, -17.8359375, -17.40625, -16.9765625, -16.546875, -16.1171875, -15.6875, -15.2578125, -14.828125, -14.3984375, -13.96875, -13.5390625, -13.109375, -12.6796875, -12.25, -11.8203125, -11.390625, -10.9609375, -10.53125, -10.1015625, -9.671875, -9.2421875, -8.8125, -8.3828125, -7.953125, -7.5234375, -7.09375, -6.6640625, -6.234375, -5.8046875, -5.375, -4.9453125, -4.515625, -4.0859375, -3.65625, -3.2265625, -2.796875, -2.3671875, -1.9375, -1.5078125, -1.078125, -0.6484375, -0.21875, 0.2109375, 0.640625, 1.0703125, 1.5, 1.9296875, 2.359375, 2.7890625, 3.21875, 3.6484375, 4.078125, 4.5078125, 4.9375, 5.3671875, 5.796875, 6.2265625, 6.65625, 7.0859375, 7.515625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 16.0, 23.0, 28.0, 54.0, 103.0, 128.0, 185.0, 183.0, 102.0, 59.0, 44.0, 12.0, 14.0, 12.0, 8.0, 4.0, 1.0, 5.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031447410583496094, -0.0003067515790462494, -0.00029902905225753784, -0.0002913065254688263, -0.00028358399868011475, -0.0002758614718914032, -0.00026813894510269165, -0.0002604164183139801, -0.00025269389152526855, -0.000244971364736557, -0.00023724883794784546, -0.0002295263111591339, -0.00022180378437042236, -0.00021408125758171082, -0.00020635873079299927, -0.00019863620400428772, -0.00019091367721557617, -0.00018319115042686462, -0.00017546862363815308, -0.00016774609684944153, -0.00016002357006072998, -0.00015230104327201843, -0.00014457851648330688, -0.00013685598969459534, -0.0001291334629058838, -0.00012141093611717224, -0.0001136884093284607, -0.00010596588253974915, -9.82433557510376e-05, -9.052082896232605e-05, -8.27983021736145e-05, -7.507577538490295e-05, -6.73532485961914e-05, -5.963072180747986e-05, -5.190819501876831e-05, -4.418566823005676e-05, -3.6463141441345215e-05, -2.8740614652633667e-05, -2.101808786392212e-05, -1.3295561075210571e-05, -5.5730342864990234e-06, 2.1494925022125244e-06, 9.872019290924072e-06, 1.759454607963562e-05, 2.5317072868347168e-05, 3.3039599657058716e-05, 4.0762126445770264e-05, 4.848465323448181e-05, 5.620718002319336e-05, 6.392970681190491e-05, 7.165223360061646e-05, 7.9374760389328e-05, 8.709728717803955e-05, 9.48198139667511e-05, 0.00010254234075546265, 0.0001102648675441742, 0.00011798739433288574, 0.0001257099211215973, 0.00013343244791030884, 0.00014115497469902039, 0.00014887750148773193, 0.00015660002827644348, 0.00016432255506515503, 0.00017204508185386658, 0.00017976760864257812]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 11.0, 18.0, 46.0, 105.0, 362.0, 1217.0, 46448.0, 995563.0, 3885.0, 560.0, 180.0, 82.0, 25.0, 19.0, 11.0, 4.0, 6.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.50390625, -6.2813720703125, -6.058837890625, -5.8363037109375, -5.61376953125, -5.3912353515625, -5.168701171875, -4.9461669921875, -4.7236328125, -4.5010986328125, -4.278564453125, -4.0560302734375, -3.83349609375, -3.6109619140625, -3.388427734375, -3.1658935546875, -2.943359375, -2.7208251953125, -2.498291015625, -2.2757568359375, -2.05322265625, -1.8306884765625, -1.608154296875, -1.3856201171875, -1.1630859375, -0.9405517578125, -0.718017578125, -0.4954833984375, -0.27294921875, -0.0504150390625, 0.172119140625, 0.3946533203125, 0.6171875, 0.8397216796875, 1.062255859375, 1.2847900390625, 1.50732421875, 1.7298583984375, 1.952392578125, 2.1749267578125, 2.3974609375, 2.6199951171875, 2.842529296875, 3.0650634765625, 3.28759765625, 3.5101318359375, 3.732666015625, 3.9552001953125, 4.177734375, 4.4002685546875, 4.622802734375, 4.8453369140625, 5.06787109375, 5.2904052734375, 5.512939453125, 5.7354736328125, 5.9580078125, 6.1805419921875, 6.403076171875, 6.6256103515625, 6.84814453125, 7.0706787109375, 7.293212890625, 7.5157470703125, 7.73828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 8.0, 18.0, 63.0, 232.0, 471.0, 154.0, 35.0, 14.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -2.964324951171875, -2.67669677734375, -2.389068603515625, -2.1014404296875, -1.813812255859375, -1.52618408203125, -1.238555908203125, -0.950927734375, -0.663299560546875, -0.37567138671875, -0.088043212890625, 0.1995849609375, 0.487213134765625, 0.77484130859375, 1.062469482421875, 1.35009765625, 1.637725830078125, 1.92535400390625, 2.212982177734375, 2.5006103515625, 2.788238525390625, 3.07586669921875, 3.363494873046875, 3.651123046875, 3.938751220703125, 4.22637939453125, 4.514007568359375, 4.8016357421875, 5.089263916015625, 5.37689208984375, 5.664520263671875, 5.9521484375, 6.239776611328125, 6.52740478515625, 6.815032958984375, 7.1026611328125, 7.390289306640625, 7.67791748046875, 7.965545654296875, 8.253173828125, 8.540802001953125, 8.82843017578125, 9.116058349609375, 9.4036865234375, 9.691314697265625, 9.97894287109375, 10.266571044921875, 10.55419921875, 10.841827392578125, 11.12945556640625, 11.417083740234375, 11.7047119140625, 11.992340087890625, 12.27996826171875, 12.567596435546875, 12.855224609375, 13.142852783203125, 13.43048095703125, 13.718109130859375, 14.0057373046875, 14.293365478515625, 14.58099365234375, 14.868621826171875, 15.15625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 9.0, 44.0, 571.0, 327.0, 38.0, 10.0, 9.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.04873657226562, -164.12355041503906, -158.19834899902344, -152.27316284179688, -146.34796142578125, -140.4227752685547, -134.49758911132812, -128.5723876953125, -122.6471939086914, -116.72200012207031, -110.79680633544922, -104.87161254882812, -98.94642639160156, -93.02122497558594, -87.09603881835938, -81.17084503173828, -75.24565124511719, -69.3204574584961, -63.395263671875, -57.47007369995117, -51.54487991333008, -45.619686126708984, -39.694496154785156, -33.76930236816406, -27.84410858154297, -21.918914794921875, -15.993722915649414, -10.068531036376953, -4.143337249755859, 1.7818565368652344, 7.7070465087890625, 13.632240295410156, 19.55743408203125, 25.482627868652344, 31.407819747924805, 37.333011627197266, 43.25820541381836, 49.18339920043945, 55.10858917236328, 61.033782958984375, 66.95897674560547, 72.88417053222656, 78.80936431884766, 84.73455810546875, 90.65974426269531, 96.58494567871094, 102.5101318359375, 108.4353256225586, 114.36051940917969, 120.28571319580078, 126.21090698242188, 132.13609313964844, 138.06129455566406, 143.98648071289062, 149.91168212890625, 155.8368682861328, 161.76205444335938, 167.68724060058594, 173.61244201660156, 179.53762817382812, 185.46282958984375, 191.3880157470703, 197.31320190429688, 203.2384033203125, 209.16360473632812]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 10.0, 9.0, 12.0, 16.0, 11.0, 15.0, 12.0, 19.0, 21.0, 23.0, 38.0, 44.0, 36.0, 36.0, 52.0, 52.0, 47.0, 52.0, 47.0, 45.0, 60.0, 43.0, 43.0, 37.0, 37.0, 31.0, 13.0, 25.0, 25.0, 19.0, 12.0, 11.0, 8.0, 7.0, 11.0, 4.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.665367126464844, -42.15768814086914, -40.6500129699707, -39.142333984375, -37.6346549987793, -36.126976013183594, -34.619300842285156, -33.11162185668945, -31.60394287109375, -30.09626579284668, -28.588586807250977, -27.080909729003906, -25.573230743408203, -24.065553665161133, -22.557876586914062, -21.05019760131836, -19.54252052307129, -18.03484344482422, -16.527164459228516, -15.019487380981445, -13.511808395385742, -12.004131317138672, -10.496453285217285, -8.988775253295898, -7.481097221374512, -5.973419189453125, -4.465741157531738, -2.9580636024475098, -1.450385570526123, 0.05729246139526367, 1.5649700164794922, 3.072648048400879, 4.580326080322266, 6.088004112243652, 7.595682144165039, 9.10335922241211, 10.611038208007812, 12.118715286254883, 13.62639331817627, 15.134071350097656, 16.64175033569336, 18.14942741394043, 19.657106399536133, 21.164783477783203, 22.672462463378906, 24.180139541625977, 25.687816619873047, 27.19549560546875, 28.70317268371582, 30.21084976196289, 31.718528747558594, 33.2262077331543, 34.733882904052734, 36.24156188964844, 37.74924087524414, 39.256919860839844, 40.76459503173828, 42.272274017333984, 43.77994918823242, 45.287628173828125, 46.79530715942383, 48.30298614501953, 49.81066131591797, 51.31834030151367, 52.826019287109375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 9.0, 12.0, 15.0, 13.0, 29.0, 20.0, 42.0, 53.0, 70.0, 89.0, 125.0, 175.0, 213.0, 254.0, 372.0, 528.0, 1039.0, 2122.0, 8154.0, 179746.0, 3985410.0, 10103.0, 2487.0, 1067.0, 563.0, 367.0, 276.0, 222.0, 156.0, 134.0, 116.0, 80.0, 67.0, 30.0, 35.0, 27.0, 21.0, 15.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.548828125, -3.43817138671875, -3.3275146484375, -3.21685791015625, -3.106201171875, -2.99554443359375, -2.8848876953125, -2.77423095703125, -2.66357421875, -2.55291748046875, -2.4422607421875, -2.33160400390625, -2.220947265625, -2.11029052734375, -1.9996337890625, -1.88897705078125, -1.7783203125, -1.66766357421875, -1.5570068359375, -1.44635009765625, -1.335693359375, -1.22503662109375, -1.1143798828125, -1.00372314453125, -0.89306640625, -0.78240966796875, -0.6717529296875, -0.56109619140625, -0.450439453125, -0.33978271484375, -0.2291259765625, -0.11846923828125, -0.0078125, 0.10284423828125, 0.2135009765625, 0.32415771484375, 0.434814453125, 0.54547119140625, 0.6561279296875, 0.76678466796875, 0.87744140625, 0.98809814453125, 1.0987548828125, 1.20941162109375, 1.320068359375, 1.43072509765625, 1.5413818359375, 1.65203857421875, 1.7626953125, 1.87335205078125, 1.9840087890625, 2.09466552734375, 2.205322265625, 2.31597900390625, 2.4266357421875, 2.53729248046875, 2.64794921875, 2.75860595703125, 2.8692626953125, 2.97991943359375, 3.090576171875, 3.20123291015625, 3.3118896484375, 3.42254638671875, 3.533203125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 2.0, 7.0, 8.0, 8.0, 8.0, 10.0, 14.0, 12.0, 15.0, 20.0, 22.0, 32.0, 26.0, 32.0, 44.0, 50.0, 60.0, 57.0, 56.0, 52.0, 67.0, 48.0, 44.0, 31.0, 35.0, 28.0, 30.0, 41.0, 26.0, 23.0, 28.0, 16.0, 12.0, 9.0, 6.0, 6.0, 7.0, 8.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.68359375, -2.598236083984375, -2.51287841796875, -2.427520751953125, -2.3421630859375, -2.256805419921875, -2.17144775390625, -2.086090087890625, -2.000732421875, -1.915374755859375, -1.83001708984375, -1.744659423828125, -1.6593017578125, -1.573944091796875, -1.48858642578125, -1.403228759765625, -1.31787109375, -1.232513427734375, -1.14715576171875, -1.061798095703125, -0.9764404296875, -0.891082763671875, -0.80572509765625, -0.720367431640625, -0.635009765625, -0.549652099609375, -0.46429443359375, -0.378936767578125, -0.2935791015625, -0.208221435546875, -0.12286376953125, -0.037506103515625, 0.0478515625, 0.133209228515625, 0.21856689453125, 0.303924560546875, 0.3892822265625, 0.474639892578125, 0.55999755859375, 0.645355224609375, 0.730712890625, 0.816070556640625, 0.90142822265625, 0.986785888671875, 1.0721435546875, 1.157501220703125, 1.24285888671875, 1.328216552734375, 1.41357421875, 1.498931884765625, 1.58428955078125, 1.669647216796875, 1.7550048828125, 1.840362548828125, 1.92572021484375, 2.011077880859375, 2.096435546875, 2.181793212890625, 2.26715087890625, 2.352508544921875, 2.4378662109375, 2.523223876953125, 2.60858154296875, 2.693939208984375, 2.779296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 9.0, 5.0, 9.0, 17.0, 10.0, 23.0, 38.0, 56.0, 62.0, 86.0, 122.0, 128.0, 160.0, 226.0, 420.0, 1589.0, 20497.0, 4164701.0, 4233.0, 811.0, 292.0, 195.0, 136.0, 98.0, 101.0, 72.0, 54.0, 46.0, 32.0, 19.0, 12.0, 11.0, 12.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1484375, -11.8133544921875, -11.478271484375, -11.1431884765625, -10.80810546875, -10.4730224609375, -10.137939453125, -9.8028564453125, -9.4677734375, -9.1326904296875, -8.797607421875, -8.4625244140625, -8.12744140625, -7.7923583984375, -7.457275390625, -7.1221923828125, -6.787109375, -6.4520263671875, -6.116943359375, -5.7818603515625, -5.44677734375, -5.1116943359375, -4.776611328125, -4.4415283203125, -4.1064453125, -3.7713623046875, -3.436279296875, -3.1011962890625, -2.76611328125, -2.4310302734375, -2.095947265625, -1.7608642578125, -1.42578125, -1.0906982421875, -0.755615234375, -0.4205322265625, -0.08544921875, 0.2496337890625, 0.584716796875, 0.9197998046875, 1.2548828125, 1.5899658203125, 1.925048828125, 2.2601318359375, 2.59521484375, 2.9302978515625, 3.265380859375, 3.6004638671875, 3.935546875, 4.2706298828125, 4.605712890625, 4.9407958984375, 5.27587890625, 5.6109619140625, 5.946044921875, 6.2811279296875, 6.6162109375, 6.9512939453125, 7.286376953125, 7.6214599609375, 7.95654296875, 8.2916259765625, 8.626708984375, 8.9617919921875, 9.296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 43.0, 3993.0, 28.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.47265625, -4.3468017578125, -4.220947265625, -4.0950927734375, -3.96923828125, -3.8433837890625, -3.717529296875, -3.5916748046875, -3.4658203125, -3.3399658203125, -3.214111328125, -3.0882568359375, -2.96240234375, -2.8365478515625, -2.710693359375, -2.5848388671875, -2.458984375, -2.3331298828125, -2.207275390625, -2.0814208984375, -1.95556640625, -1.8297119140625, -1.703857421875, -1.5780029296875, -1.4521484375, -1.3262939453125, -1.200439453125, -1.0745849609375, -0.94873046875, -0.8228759765625, -0.697021484375, -0.5711669921875, -0.4453125, -0.3194580078125, -0.193603515625, -0.0677490234375, 0.05810546875, 0.1839599609375, 0.309814453125, 0.4356689453125, 0.5615234375, 0.6873779296875, 0.813232421875, 0.9390869140625, 1.06494140625, 1.1907958984375, 1.316650390625, 1.4425048828125, 1.568359375, 1.6942138671875, 1.820068359375, 1.9459228515625, 2.07177734375, 2.1976318359375, 2.323486328125, 2.4493408203125, 2.5751953125, 2.7010498046875, 2.826904296875, 2.9527587890625, 3.07861328125, 3.2044677734375, 3.330322265625, 3.4561767578125, 3.58203125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 28.0, 87.0, 306.0, 435.0, 119.0, 20.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.674741744995117, -13.319316864013672, -12.963892936706543, -12.608469009399414, -12.253044128417969, -11.897619247436523, -11.542195320129395, -11.186771392822266, -10.83134651184082, -10.475921630859375, -10.120497703552246, -9.765073776245117, -9.409648895263672, -9.054224014282227, -8.698800086975098, -8.343376159667969, -7.987951278686523, -7.632526874542236, -7.277102470397949, -6.921678066253662, -6.566253662109375, -6.210829257965088, -5.855404853820801, -5.499980449676514, -5.144556045532227, -4.7891316413879395, -4.433707237243652, -4.078282833099365, -3.722858428955078, -3.367434024810791, -3.012009620666504, -2.656585216522217, -2.301161766052246, -1.945737361907959, -1.5903129577636719, -1.2348885536193848, -0.8794641494750977, -0.5240397453308105, -0.16861534118652344, 0.18680906295776367, 0.5422334671020508, 0.8976578712463379, 1.253082275390625, 1.608506679534912, 1.9639310836791992, 2.3193554878234863, 2.6747798919677734, 3.0302042961120605, 3.3856287002563477, 3.7410531044006348, 4.096477508544922, 4.451901912689209, 4.807326316833496, 5.162750720977783, 5.51817512512207, 5.873599529266357, 6.2290239334106445, 6.584448337554932, 6.939872741699219, 7.295297145843506, 7.650721549987793, 8.006145477294922, 8.361570358276367, 8.716995239257812, 9.072419166564941]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 5.0, 7.0, 13.0, 7.0, 7.0, 19.0, 15.0, 19.0, 22.0, 16.0, 25.0, 31.0, 26.0, 26.0, 33.0, 38.0, 28.0, 34.0, 31.0, 40.0, 37.0, 50.0, 41.0, 33.0, 46.0, 43.0, 41.0, 35.0, 26.0, 26.0, 29.0, 24.0, 23.0, 15.0, 15.0, 12.0, 12.0, 9.0, 10.0, 3.0, 5.0, 5.0, 7.0, 2.0, 5.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.5065388679504395, -2.421565294265747, -2.3365917205810547, -2.251617908477783, -2.166644334793091, -2.0816707611083984, -1.996697187423706, -1.9117236137390137, -1.8267499208450317, -1.7417763471603394, -1.6568026542663574, -1.571829080581665, -1.4868555068969727, -1.4018818140029907, -1.3169082403182983, -1.2319345474243164, -1.146960973739624, -1.0619874000549316, -0.9770137071609497, -0.8920401334762573, -0.8070665001869202, -0.722092866897583, -0.6371192932128906, -0.5521456599235535, -0.4671720266342163, -0.38219839334487915, -0.2972247898578644, -0.2122511863708496, -0.12727755308151245, -0.04230391979217529, 0.04266965389251709, 0.12764328718185425, 0.2126169204711914, 0.29759055376052856, 0.38256415724754333, 0.4675377607345581, 0.5525113940238953, 0.6374850273132324, 0.7224586009979248, 0.807432234287262, 0.8924058675765991, 0.9773795008659363, 1.0623531341552734, 1.1473267078399658, 1.2323002815246582, 1.3172739744186401, 1.4022475481033325, 1.4872212409973145, 1.5721948146820068, 1.6571683883666992, 1.7421420812606812, 1.8271156549453735, 1.9120893478393555, 1.9970629215240479, 2.0820364952087402, 2.1670100688934326, 2.251983642578125, 2.3369572162628174, 2.4219307899475098, 2.5069046020507812, 2.5918781757354736, 2.676851749420166, 2.7618253231048584, 2.846798896789551, 2.9317727088928223]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 9.0, 17.0, 20.0, 27.0, 33.0, 61.0, 98.0, 174.0, 274.0, 440.0, 719.0, 1354.0, 2441.0, 4501.0, 8541.0, 16709.0, 35764.0, 83154.0, 212828.0, 356388.0, 186964.0, 73723.0, 32120.0, 15018.0, 7821.0, 4161.0, 2214.0, 1285.0, 665.0, 389.0, 226.0, 141.0, 92.0, 53.0, 37.0, 30.0, 22.0, 11.0, 6.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.939453125, -1.87774658203125, -1.8160400390625, -1.75433349609375, -1.692626953125, -1.63092041015625, -1.5692138671875, -1.50750732421875, -1.44580078125, -1.38409423828125, -1.3223876953125, -1.26068115234375, -1.198974609375, -1.13726806640625, -1.0755615234375, -1.01385498046875, -0.9521484375, -0.89044189453125, -0.8287353515625, -0.76702880859375, -0.705322265625, -0.64361572265625, -0.5819091796875, -0.52020263671875, -0.45849609375, -0.39678955078125, -0.3350830078125, -0.27337646484375, -0.211669921875, -0.14996337890625, -0.0882568359375, -0.02655029296875, 0.03515625, 0.09686279296875, 0.1585693359375, 0.22027587890625, 0.281982421875, 0.34368896484375, 0.4053955078125, 0.46710205078125, 0.52880859375, 0.59051513671875, 0.6522216796875, 0.71392822265625, 0.775634765625, 0.83734130859375, 0.8990478515625, 0.96075439453125, 1.0224609375, 1.08416748046875, 1.1458740234375, 1.20758056640625, 1.269287109375, 1.33099365234375, 1.3927001953125, 1.45440673828125, 1.51611328125, 1.57781982421875, 1.6395263671875, 1.70123291015625, 1.762939453125, 1.82464599609375, 1.8863525390625, 1.94805908203125, 2.009765625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 3.0, 5.0, 10.0, 7.0, 11.0, 8.0, 10.0, 16.0, 15.0, 25.0, 26.0, 31.0, 32.0, 26.0, 47.0, 43.0, 54.0, 61.0, 61.0, 53.0, 51.0, 52.0, 42.0, 34.0, 40.0, 27.0, 24.0, 31.0, 25.0, 23.0, 28.0, 20.0, 17.0, 8.0, 15.0, 6.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.208984375, -2.12786865234375, -2.0467529296875, -1.96563720703125, -1.884521484375, -1.80340576171875, -1.7222900390625, -1.64117431640625, -1.56005859375, -1.47894287109375, -1.3978271484375, -1.31671142578125, -1.235595703125, -1.15447998046875, -1.0733642578125, -0.99224853515625, -0.9111328125, -0.83001708984375, -0.7489013671875, -0.66778564453125, -0.586669921875, -0.50555419921875, -0.4244384765625, -0.34332275390625, -0.26220703125, -0.18109130859375, -0.0999755859375, -0.01885986328125, 0.062255859375, 0.14337158203125, 0.2244873046875, 0.30560302734375, 0.38671875, 0.46783447265625, 0.5489501953125, 0.63006591796875, 0.711181640625, 0.79229736328125, 0.8734130859375, 0.95452880859375, 1.03564453125, 1.11676025390625, 1.1978759765625, 1.27899169921875, 1.360107421875, 1.44122314453125, 1.5223388671875, 1.60345458984375, 1.6845703125, 1.76568603515625, 1.8468017578125, 1.92791748046875, 2.009033203125, 2.09014892578125, 2.1712646484375, 2.25238037109375, 2.33349609375, 2.41461181640625, 2.4957275390625, 2.57684326171875, 2.657958984375, 2.73907470703125, 2.8201904296875, 2.90130615234375, 2.982421875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 12.0, 6.0, 7.0, 10.0, 11.0, 14.0, 19.0, 23.0, 37.0, 47.0, 60.0, 73.0, 114.0, 155.0, 245.0, 617.0, 1275.0, 3655.0, 17394.0, 190536.0, 762252.0, 59248.0, 8367.0, 2325.0, 873.0, 398.0, 238.0, 153.0, 93.0, 69.0, 49.0, 50.0, 27.0, 23.0, 14.0, 14.0, 8.0, 14.0, 8.0, 4.0, 8.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.99609375, -5.81597900390625, -5.6358642578125, -5.45574951171875, -5.275634765625, -5.09552001953125, -4.9154052734375, -4.73529052734375, -4.55517578125, -4.37506103515625, -4.1949462890625, -4.01483154296875, -3.834716796875, -3.65460205078125, -3.4744873046875, -3.29437255859375, -3.1142578125, -2.93414306640625, -2.7540283203125, -2.57391357421875, -2.393798828125, -2.21368408203125, -2.0335693359375, -1.85345458984375, -1.67333984375, -1.49322509765625, -1.3131103515625, -1.13299560546875, -0.952880859375, -0.77276611328125, -0.5926513671875, -0.41253662109375, -0.232421875, -0.05230712890625, 0.1278076171875, 0.30792236328125, 0.488037109375, 0.66815185546875, 0.8482666015625, 1.02838134765625, 1.20849609375, 1.38861083984375, 1.5687255859375, 1.74884033203125, 1.928955078125, 2.10906982421875, 2.2891845703125, 2.46929931640625, 2.6494140625, 2.82952880859375, 3.0096435546875, 3.18975830078125, 3.369873046875, 3.54998779296875, 3.7301025390625, 3.91021728515625, 4.09033203125, 4.27044677734375, 4.4505615234375, 4.63067626953125, 4.810791015625, 4.99090576171875, 5.1710205078125, 5.35113525390625, 5.53125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 7.0, 3.0, 9.0, 7.0, 9.0, 14.0, 20.0, 22.0, 29.0, 42.0, 40.0, 44.0, 54.0, 72.0, 56.0, 64.0, 75.0, 55.0, 59.0, 50.0, 49.0, 47.0, 36.0, 26.0, 26.0, 23.0, 22.0, 13.0, 7.0, 7.0, 7.0, 3.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.25, -16.7860107421875, -16.322021484375, -15.8580322265625, -15.39404296875, -14.9300537109375, -14.466064453125, -14.0020751953125, -13.5380859375, -13.0740966796875, -12.610107421875, -12.1461181640625, -11.68212890625, -11.2181396484375, -10.754150390625, -10.2901611328125, -9.826171875, -9.3621826171875, -8.898193359375, -8.4342041015625, -7.97021484375, -7.5062255859375, -7.042236328125, -6.5782470703125, -6.1142578125, -5.6502685546875, -5.186279296875, -4.7222900390625, -4.25830078125, -3.7943115234375, -3.330322265625, -2.8663330078125, -2.40234375, -1.9383544921875, -1.474365234375, -1.0103759765625, -0.54638671875, -0.0823974609375, 0.381591796875, 0.8455810546875, 1.3095703125, 1.7735595703125, 2.237548828125, 2.7015380859375, 3.16552734375, 3.6295166015625, 4.093505859375, 4.5574951171875, 5.021484375, 5.4854736328125, 5.949462890625, 6.4134521484375, 6.87744140625, 7.3414306640625, 7.805419921875, 8.2694091796875, 8.7333984375, 9.1973876953125, 9.661376953125, 10.1253662109375, 10.58935546875, 11.0533447265625, 11.517333984375, 11.9813232421875, 12.4453125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 10.0, 7.0, 41.0, 180.0, 2551.0, 1043661.0, 1847.0, 168.0, 44.0, 17.0, 4.0, 8.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6328125, -8.1893310546875, -7.745849609375, -7.3023681640625, -6.85888671875, -6.4154052734375, -5.971923828125, -5.5284423828125, -5.0849609375, -4.6414794921875, -4.197998046875, -3.7545166015625, -3.31103515625, -2.8675537109375, -2.424072265625, -1.9805908203125, -1.537109375, -1.0936279296875, -0.650146484375, -0.2066650390625, 0.23681640625, 0.6802978515625, 1.123779296875, 1.5672607421875, 2.0107421875, 2.4542236328125, 2.897705078125, 3.3411865234375, 3.78466796875, 4.2281494140625, 4.671630859375, 5.1151123046875, 5.55859375, 6.0020751953125, 6.445556640625, 6.8890380859375, 7.33251953125, 7.7760009765625, 8.219482421875, 8.6629638671875, 9.1064453125, 9.5499267578125, 9.993408203125, 10.4368896484375, 10.88037109375, 11.3238525390625, 11.767333984375, 12.2108154296875, 12.654296875, 13.0977783203125, 13.541259765625, 13.9847412109375, 14.42822265625, 14.8717041015625, 15.315185546875, 15.7586669921875, 16.2021484375, 16.6456298828125, 17.089111328125, 17.5325927734375, 17.97607421875, 18.4195556640625, 18.863037109375, 19.3065185546875, 19.75]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 6.0, 11.0, 11.0, 17.0, 17.0, 31.0, 33.0, 61.0, 80.0, 91.0, 104.0, 111.0, 97.0, 81.0, 62.0, 49.0, 30.0, 32.0, 23.0, 13.0, 11.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00016427040100097656, -0.00015943869948387146, -0.00015460699796676636, -0.00014977529644966125, -0.00014494359493255615, -0.00014011189341545105, -0.00013528019189834595, -0.00013044849038124084, -0.00012561678886413574, -0.00012078508734703064, -0.00011595338582992554, -0.00011112168431282043, -0.00010628998279571533, -0.00010145828127861023, -9.662657976150513e-05, -9.179487824440002e-05, -8.696317672729492e-05, -8.213147521018982e-05, -7.729977369308472e-05, -7.246807217597961e-05, -6.763637065887451e-05, -6.280466914176941e-05, -5.797296762466431e-05, -5.3141266107559204e-05, -4.83095645904541e-05, -4.3477863073349e-05, -3.8646161556243896e-05, -3.3814460039138794e-05, -2.898275852203369e-05, -2.415105700492859e-05, -1.9319355487823486e-05, -1.4487653970718384e-05, -9.655952453613281e-06, -4.824250936508179e-06, 7.450580596923828e-09, 4.839152097702026e-06, 9.670853614807129e-06, 1.4502555131912231e-05, 1.9334256649017334e-05, 2.4165958166122437e-05, 2.899765968322754e-05, 3.382936120033264e-05, 3.8661062717437744e-05, 4.349276423454285e-05, 4.832446575164795e-05, 5.315616726875305e-05, 5.7987868785858154e-05, 6.281957030296326e-05, 6.765127182006836e-05, 7.248297333717346e-05, 7.731467485427856e-05, 8.214637637138367e-05, 8.697807788848877e-05, 9.180977940559387e-05, 9.664148092269897e-05, 0.00010147318243980408, 0.00010630488395690918, 0.00011113658547401428, 0.00011596828699111938, 0.00012079998850822449, 0.0001256316900253296, 0.0001304633915424347, 0.0001352950930595398, 0.0001401267945766449, 0.00014495849609375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 2.0, 7.0, 10.0, 15.0, 28.0, 57.0, 87.0, 218.0, 586.0, 2440.0, 29598.0, 979641.0, 32280.0, 2520.0, 607.0, 218.0, 106.0, 49.0, 24.0, 22.0, 14.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.79608154296875, -2.6820068359375, -2.56793212890625, -2.453857421875, -2.33978271484375, -2.2257080078125, -2.11163330078125, -1.99755859375, -1.88348388671875, -1.7694091796875, -1.65533447265625, -1.541259765625, -1.42718505859375, -1.3131103515625, -1.19903564453125, -1.0849609375, -0.97088623046875, -0.8568115234375, -0.74273681640625, -0.628662109375, -0.51458740234375, -0.4005126953125, -0.28643798828125, -0.17236328125, -0.05828857421875, 0.0557861328125, 0.16986083984375, 0.283935546875, 0.39801025390625, 0.5120849609375, 0.62615966796875, 0.740234375, 0.85430908203125, 0.9683837890625, 1.08245849609375, 1.196533203125, 1.31060791015625, 1.4246826171875, 1.53875732421875, 1.65283203125, 1.76690673828125, 1.8809814453125, 1.99505615234375, 2.109130859375, 2.22320556640625, 2.3372802734375, 2.45135498046875, 2.5654296875, 2.67950439453125, 2.7935791015625, 2.90765380859375, 3.021728515625, 3.13580322265625, 3.2498779296875, 3.36395263671875, 3.47802734375, 3.59210205078125, 3.7061767578125, 3.82025146484375, 3.934326171875, 4.04840087890625, 4.1624755859375, 4.27655029296875, 4.390625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 15.0, 18.0, 97.0, 186.0, 268.0, 217.0, 107.0, 44.0, 12.0, 12.0, 1.0, 7.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.951171875, -3.750518798828125, -3.54986572265625, -3.349212646484375, -3.1485595703125, -2.947906494140625, -2.74725341796875, -2.546600341796875, -2.345947265625, -2.145294189453125, -1.94464111328125, -1.743988037109375, -1.5433349609375, -1.342681884765625, -1.14202880859375, -0.941375732421875, -0.74072265625, -0.540069580078125, -0.33941650390625, -0.138763427734375, 0.0618896484375, 0.262542724609375, 0.46319580078125, 0.663848876953125, 0.864501953125, 1.065155029296875, 1.26580810546875, 1.466461181640625, 1.6671142578125, 1.867767333984375, 2.06842041015625, 2.269073486328125, 2.4697265625, 2.670379638671875, 2.87103271484375, 3.071685791015625, 3.2723388671875, 3.472991943359375, 3.67364501953125, 3.874298095703125, 4.074951171875, 4.275604248046875, 4.47625732421875, 4.676910400390625, 4.8775634765625, 5.078216552734375, 5.27886962890625, 5.479522705078125, 5.68017578125, 5.880828857421875, 6.08148193359375, 6.282135009765625, 6.4827880859375, 6.683441162109375, 6.88409423828125, 7.084747314453125, 7.285400390625, 7.486053466796875, 7.68670654296875, 7.887359619140625, 8.0880126953125, 8.288665771484375, 8.48931884765625, 8.689971923828125, 8.890625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 21.0, 83.0, 296.0, 448.0, 114.0, 26.0, 7.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.44511413574219, -82.52705383300781, -79.60899353027344, -76.69093322753906, -73.77287292480469, -70.85481262207031, -67.93675231933594, -65.01869201660156, -62.10062789916992, -59.18256759643555, -56.26450729370117, -53.34644317626953, -50.428382873535156, -47.51032257080078, -44.592262268066406, -41.67420196533203, -38.756141662597656, -35.83808135986328, -32.920021057128906, -30.0019588470459, -27.083898544311523, -24.16583824157715, -21.24777603149414, -18.329715728759766, -15.41165542602539, -12.493595123291016, -9.575533866882324, -6.657472610473633, -3.739412307739258, -0.8213520050048828, 2.096710205078125, 5.0147705078125, 7.932823181152344, 10.850883483886719, 13.76894474029541, 16.6870059967041, 19.605066299438477, 22.52312660217285, 25.44118881225586, 28.359249114990234, 31.27730941772461, 34.195369720458984, 37.11343002319336, 40.031494140625, 42.949554443359375, 45.86761474609375, 48.785675048828125, 51.7037353515625, 54.621795654296875, 57.53985595703125, 60.457916259765625, 63.3759765625, 66.29403686523438, 69.21209716796875, 72.13015747070312, 75.0482177734375, 77.96627807617188, 80.88433837890625, 83.80239868164062, 86.720458984375, 89.63851928710938, 92.55657958984375, 95.47463989257812, 98.3927001953125, 101.3107681274414]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 9.0, 9.0, 8.0, 11.0, 15.0, 15.0, 11.0, 10.0, 27.0, 31.0, 26.0, 20.0, 33.0, 48.0, 41.0, 42.0, 46.0, 53.0, 47.0, 58.0, 43.0, 48.0, 41.0, 27.0, 30.0, 19.0, 37.0, 31.0, 19.0, 21.0, 23.0, 15.0, 17.0, 8.0, 7.0, 11.0, 7.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-48.65369415283203, -47.24525451660156, -45.83681106567383, -44.42837142944336, -43.019927978515625, -41.611488342285156, -40.20304870605469, -38.79460525512695, -37.386165618896484, -35.977725982666016, -34.56928253173828, -33.16084289550781, -31.75240135192871, -30.34395980834961, -28.935518264770508, -27.527076721191406, -26.118635177612305, -24.710193634033203, -23.3017520904541, -21.893310546875, -20.48487091064453, -19.07642936706543, -17.667987823486328, -16.25954818725586, -14.851105690002441, -13.44266414642334, -12.034223556518555, -10.625782012939453, -9.217340469360352, -7.808899879455566, -6.400458335876465, -4.99201774597168, -3.583576202392578, -2.1751351356506348, -0.7666938304901123, 0.6417474746704102, 2.0501885414123535, 3.458629608154297, 4.867071151733398, 6.275511741638184, 7.683953285217285, 9.092394828796387, 10.500835418701172, 11.909276962280273, 13.317718505859375, 14.72615909576416, 16.134601593017578, 17.543041229248047, 18.95148277282715, 20.35992431640625, 21.76836585998535, 23.176807403564453, 24.585247039794922, 25.993688583374023, 27.402130126953125, 28.810569763183594, 30.219013214111328, 31.62745475769043, 33.03589630126953, 34.4443359375, 35.852779388427734, 37.2612190246582, 38.66966247558594, 40.078102111816406, 41.486541748046875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 5.0, 4.0, 6.0, 21.0, 17.0, 31.0, 43.0, 69.0, 86.0, 118.0, 187.0, 252.0, 520.0, 1177.0, 3758.0, 50091.0, 4120692.0, 13294.0, 2058.0, 732.0, 376.0, 238.0, 163.0, 100.0, 64.0, 52.0, 36.0, 26.0, 18.0, 11.0, 9.0, 10.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.8671875, -6.68316650390625, -6.4991455078125, -6.31512451171875, -6.131103515625, -5.94708251953125, -5.7630615234375, -5.57904052734375, -5.39501953125, -5.21099853515625, -5.0269775390625, -4.84295654296875, -4.658935546875, -4.47491455078125, -4.2908935546875, -4.10687255859375, -3.9228515625, -3.73883056640625, -3.5548095703125, -3.37078857421875, -3.186767578125, -3.00274658203125, -2.8187255859375, -2.63470458984375, -2.45068359375, -2.26666259765625, -2.0826416015625, -1.89862060546875, -1.714599609375, -1.53057861328125, -1.3465576171875, -1.16253662109375, -0.978515625, -0.79449462890625, -0.6104736328125, -0.42645263671875, -0.242431640625, -0.05841064453125, 0.1256103515625, 0.30963134765625, 0.49365234375, 0.67767333984375, 0.8616943359375, 1.04571533203125, 1.229736328125, 1.41375732421875, 1.5977783203125, 1.78179931640625, 1.9658203125, 2.14984130859375, 2.3338623046875, 2.51788330078125, 2.701904296875, 2.88592529296875, 3.0699462890625, 3.25396728515625, 3.43798828125, 3.62200927734375, 3.8060302734375, 3.99005126953125, 4.174072265625, 4.35809326171875, 4.5421142578125, 4.72613525390625, 4.91015625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 4.0, 7.0, 4.0, 7.0, 16.0, 16.0, 14.0, 20.0, 21.0, 22.0, 27.0, 36.0, 48.0, 28.0, 45.0, 60.0, 55.0, 55.0, 53.0, 60.0, 49.0, 54.0, 42.0, 28.0, 27.0, 28.0, 36.0, 32.0, 21.0, 17.0, 16.0, 9.0, 8.0, 8.0, 5.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.1640625, -3.08050537109375, -2.9969482421875, -2.91339111328125, -2.829833984375, -2.74627685546875, -2.6627197265625, -2.57916259765625, -2.49560546875, -2.41204833984375, -2.3284912109375, -2.24493408203125, -2.161376953125, -2.07781982421875, -1.9942626953125, -1.91070556640625, -1.8271484375, -1.74359130859375, -1.6600341796875, -1.57647705078125, -1.492919921875, -1.40936279296875, -1.3258056640625, -1.24224853515625, -1.15869140625, -1.07513427734375, -0.9915771484375, -0.90802001953125, -0.824462890625, -0.74090576171875, -0.6573486328125, -0.57379150390625, -0.490234375, -0.40667724609375, -0.3231201171875, -0.23956298828125, -0.156005859375, -0.07244873046875, 0.0111083984375, 0.09466552734375, 0.17822265625, 0.26177978515625, 0.3453369140625, 0.42889404296875, 0.512451171875, 0.59600830078125, 0.6795654296875, 0.76312255859375, 0.8466796875, 0.93023681640625, 1.0137939453125, 1.09735107421875, 1.180908203125, 1.26446533203125, 1.3480224609375, 1.43157958984375, 1.51513671875, 1.59869384765625, 1.6822509765625, 1.76580810546875, 1.849365234375, 1.93292236328125, 2.0164794921875, 2.10003662109375, 2.18359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 6.0, 6.0, 9.0, 11.0, 20.0, 22.0, 17.0, 15.0, 18.0, 20.0, 31.0, 23.0, 36.0, 39.0, 49.0, 74.0, 125.0, 181.0, 309.0, 1046.0, 4165054.0, 25504.0, 653.0, 283.0, 182.0, 131.0, 71.0, 48.0, 33.0, 35.0, 20.0, 33.0, 24.0, 23.0, 15.0, 18.0, 14.0, 15.0, 20.0, 8.0, 7.0, 5.0, 7.0, 7.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.515625, -25.597412109375, -24.67919921875, -23.760986328125, -22.8427734375, -21.924560546875, -21.00634765625, -20.088134765625, -19.169921875, -18.251708984375, -17.33349609375, -16.415283203125, -15.4970703125, -14.578857421875, -13.66064453125, -12.742431640625, -11.82421875, -10.906005859375, -9.98779296875, -9.069580078125, -8.1513671875, -7.233154296875, -6.31494140625, -5.396728515625, -4.478515625, -3.560302734375, -2.64208984375, -1.723876953125, -0.8056640625, 0.112548828125, 1.03076171875, 1.948974609375, 2.8671875, 3.785400390625, 4.70361328125, 5.621826171875, 6.5400390625, 7.458251953125, 8.37646484375, 9.294677734375, 10.212890625, 11.131103515625, 12.04931640625, 12.967529296875, 13.8857421875, 14.803955078125, 15.72216796875, 16.640380859375, 17.55859375, 18.476806640625, 19.39501953125, 20.313232421875, 21.2314453125, 22.149658203125, 23.06787109375, 23.986083984375, 24.904296875, 25.822509765625, 26.74072265625, 27.658935546875, 28.5771484375, 29.495361328125, 30.41357421875, 31.331787109375, 32.25]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [4.0, 3.0, 21.0, 4040.0, 22.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.654296875, -1.910675048828125, -1.16705322265625, -0.423431396484375, 0.3201904296875, 1.063812255859375, 1.80743408203125, 2.551055908203125, 3.294677734375, 4.038299560546875, 4.78192138671875, 5.525543212890625, 6.2691650390625, 7.012786865234375, 7.75640869140625, 8.500030517578125, 9.24365234375, 9.987274169921875, 10.73089599609375, 11.474517822265625, 12.2181396484375, 12.961761474609375, 13.70538330078125, 14.449005126953125, 15.192626953125, 15.936248779296875, 16.67987060546875, 17.423492431640625, 18.1671142578125, 18.910736083984375, 19.65435791015625, 20.397979736328125, 21.1416015625, 21.885223388671875, 22.62884521484375, 23.372467041015625, 24.1160888671875, 24.859710693359375, 25.60333251953125, 26.346954345703125, 27.090576171875, 27.834197998046875, 28.57781982421875, 29.321441650390625, 30.0650634765625, 30.808685302734375, 31.55230712890625, 32.295928955078125, 33.03955078125, 33.783172607421875, 34.52679443359375, 35.270416259765625, 36.0140380859375, 36.757659912109375, 37.50128173828125, 38.244903564453125, 38.988525390625, 39.732147216796875, 40.47576904296875, 41.219390869140625, 41.9630126953125, 42.706634521484375, 43.45025634765625, 44.193878173828125, 44.9375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 6.0, 46.0, 727.0, 216.0, 15.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.04730224609375, -60.826637268066406, -57.60597229003906, -54.38530731201172, -51.164642333984375, -47.94397735595703, -44.72331619262695, -41.50265121459961, -38.281986236572266, -35.06132125854492, -31.840656280517578, -28.619993209838867, -25.399328231811523, -22.17866325378418, -18.95800018310547, -15.737335205078125, -12.516670227050781, -9.296005249023438, -6.07534122467041, -2.854677200317383, 0.36598777770996094, 3.5866527557373047, 6.807315826416016, 10.02798080444336, 13.248645782470703, 16.469310760498047, 19.68997573852539, 22.9106388092041, 26.131303787231445, 29.35196876525879, 32.5726318359375, 35.793296813964844, 39.01396179199219, 42.23462677001953, 45.455291748046875, 48.67595672607422, 51.89662170410156, 55.117286682128906, 58.337947845458984, 61.55861282348633, 64.77928161621094, 67.99994659423828, 71.22061157226562, 74.44127655029297, 77.66194152832031, 80.88260650634766, 84.103271484375, 87.32392883300781, 90.54459381103516, 93.7652587890625, 96.98592376708984, 100.20658874511719, 103.42725372314453, 106.64791870117188, 109.86857604980469, 113.08924865722656, 116.30990600585938, 119.53057098388672, 122.75123596191406, 125.9719009399414, 129.19256591796875, 132.41322326660156, 135.63389587402344, 138.85455322265625, 142.07522583007812]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 12.0, 26.0, 23.0, 35.0, 79.0, 135.0, 169.0, 185.0, 141.0, 80.0, 51.0, 29.0, 18.0, 8.0, 10.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-89.52603149414062, -87.03592681884766, -84.54582214355469, -82.05570983886719, -79.56560516357422, -77.07550048828125, -74.58539581298828, -72.09529113769531, -69.60518646240234, -67.11508178710938, -64.6249771118164, -62.13486862182617, -59.6447639465332, -57.15465545654297, -54.66455078125, -52.17444610595703, -49.6843376159668, -47.19423294067383, -44.704124450683594, -42.214019775390625, -39.723915100097656, -37.23381042480469, -34.74370193481445, -32.253597259521484, -29.763490676879883, -27.27338409423828, -24.783279418945312, -22.29317283630371, -19.80306625366211, -17.31296157836914, -14.822854995727539, -12.33275032043457, -9.842643737792969, -7.352538108825684, -4.86243200302124, -2.372325897216797, 0.11777973175048828, 2.6078853607177734, 5.097991943359375, 7.588096618652344, 10.078203201293945, 12.56830883026123, 15.058414459228516, 17.548521041870117, 20.03862762451172, 22.528732299804688, 25.01883888244629, 27.508943557739258, 29.99905014038086, 32.48915481567383, 34.97926330566406, 37.46936798095703, 39.95947265625, 42.44957733154297, 44.9396858215332, 47.42979049682617, 49.919898986816406, 52.410003662109375, 54.90011215209961, 57.39021682739258, 59.88032150268555, 62.37042999267578, 64.86053466796875, 67.35063934326172, 69.84074401855469]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 12.0, 15.0, 16.0, 17.0, 22.0, 41.0, 69.0, 109.0, 182.0, 339.0, 737.0, 1844.0, 5381.0, 21508.0, 148840.0, 727702.0, 115812.0, 18130.0, 4617.0, 1610.0, 706.0, 356.0, 173.0, 106.0, 69.0, 41.0, 29.0, 20.0, 15.0, 5.0, 10.0, 6.0, 4.0, 7.0, 2.0, 0.0, 2.0], "bins": [-8.5, -8.29974365234375, -8.0994873046875, -7.89923095703125, -7.698974609375, -7.49871826171875, -7.2984619140625, -7.09820556640625, -6.89794921875, -6.69769287109375, -6.4974365234375, -6.29718017578125, -6.096923828125, -5.89666748046875, -5.6964111328125, -5.49615478515625, -5.2958984375, -5.09564208984375, -4.8953857421875, -4.69512939453125, -4.494873046875, -4.29461669921875, -4.0943603515625, -3.89410400390625, -3.69384765625, -3.49359130859375, -3.2933349609375, -3.09307861328125, -2.892822265625, -2.69256591796875, -2.4923095703125, -2.29205322265625, -2.091796875, -1.89154052734375, -1.6912841796875, -1.49102783203125, -1.290771484375, -1.09051513671875, -0.8902587890625, -0.69000244140625, -0.48974609375, -0.28948974609375, -0.0892333984375, 0.11102294921875, 0.311279296875, 0.51153564453125, 0.7117919921875, 0.91204833984375, 1.1123046875, 1.31256103515625, 1.5128173828125, 1.71307373046875, 1.913330078125, 2.11358642578125, 2.3138427734375, 2.51409912109375, 2.71435546875, 2.91461181640625, 3.1148681640625, 3.31512451171875, 3.515380859375, 3.71563720703125, 3.9158935546875, 4.11614990234375, 4.31640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 1.0, 10.0, 12.0, 11.0, 16.0, 28.0, 39.0, 37.0, 55.0, 54.0, 83.0, 68.0, 90.0, 92.0, 73.0, 56.0, 74.0, 43.0, 42.0, 31.0, 16.0, 14.0, 8.0, 11.0, 5.0, 9.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 4.0], "bins": [-6.8828125, -6.72552490234375, -6.5682373046875, -6.41094970703125, -6.253662109375, -6.09637451171875, -5.9390869140625, -5.78179931640625, -5.62451171875, -5.46722412109375, -5.3099365234375, -5.15264892578125, -4.995361328125, -4.83807373046875, -4.6807861328125, -4.52349853515625, -4.3662109375, -4.20892333984375, -4.0516357421875, -3.89434814453125, -3.737060546875, -3.57977294921875, -3.4224853515625, -3.26519775390625, -3.10791015625, -2.95062255859375, -2.7933349609375, -2.63604736328125, -2.478759765625, -2.32147216796875, -2.1641845703125, -2.00689697265625, -1.849609375, -1.69232177734375, -1.5350341796875, -1.37774658203125, -1.220458984375, -1.06317138671875, -0.9058837890625, -0.74859619140625, -0.59130859375, -0.43402099609375, -0.2767333984375, -0.11944580078125, 0.037841796875, 0.19512939453125, 0.3524169921875, 0.50970458984375, 0.6669921875, 0.82427978515625, 0.9815673828125, 1.13885498046875, 1.296142578125, 1.45343017578125, 1.6107177734375, 1.76800537109375, 1.92529296875, 2.08258056640625, 2.2398681640625, 2.39715576171875, 2.554443359375, 2.71173095703125, 2.8690185546875, 3.02630615234375, 3.18359375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 11.0, 20.0, 34.0, 73.0, 149.0, 445.0, 1560.0, 360419.0, 683267.0, 1840.0, 437.0, 148.0, 71.0, 29.0, 21.0, 11.0, 7.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.234375, -25.33056640625, -24.4267578125, -23.52294921875, -22.619140625, -21.71533203125, -20.8115234375, -19.90771484375, -19.00390625, -18.10009765625, -17.1962890625, -16.29248046875, -15.388671875, -14.48486328125, -13.5810546875, -12.67724609375, -11.7734375, -10.86962890625, -9.9658203125, -9.06201171875, -8.158203125, -7.25439453125, -6.3505859375, -5.44677734375, -4.54296875, -3.63916015625, -2.7353515625, -1.83154296875, -0.927734375, -0.02392578125, 0.8798828125, 1.78369140625, 2.6875, 3.59130859375, 4.4951171875, 5.39892578125, 6.302734375, 7.20654296875, 8.1103515625, 9.01416015625, 9.91796875, 10.82177734375, 11.7255859375, 12.62939453125, 13.533203125, 14.43701171875, 15.3408203125, 16.24462890625, 17.1484375, 18.05224609375, 18.9560546875, 19.85986328125, 20.763671875, 21.66748046875, 22.5712890625, 23.47509765625, 24.37890625, 25.28271484375, 26.1865234375, 27.09033203125, 27.994140625, 28.89794921875, 29.8017578125, 30.70556640625, 31.609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 14.0, 38.0, 133.0, 226.0, 255.0, 197.0, 94.0, 36.0, 9.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.40625, -33.47802734375, -31.5498046875, -29.62158203125, -27.693359375, -25.76513671875, -23.8369140625, -21.90869140625, -19.98046875, -18.05224609375, -16.1240234375, -14.19580078125, -12.267578125, -10.33935546875, -8.4111328125, -6.48291015625, -4.5546875, -2.62646484375, -0.6982421875, 1.22998046875, 3.158203125, 5.08642578125, 7.0146484375, 8.94287109375, 10.87109375, 12.79931640625, 14.7275390625, 16.65576171875, 18.583984375, 20.51220703125, 22.4404296875, 24.36865234375, 26.296875, 28.22509765625, 30.1533203125, 32.08154296875, 34.009765625, 35.93798828125, 37.8662109375, 39.79443359375, 41.72265625, 43.65087890625, 45.5791015625, 47.50732421875, 49.435546875, 51.36376953125, 53.2919921875, 55.22021484375, 57.1484375, 59.07666015625, 61.0048828125, 62.93310546875, 64.861328125, 66.78955078125, 68.7177734375, 70.64599609375, 72.57421875, 74.50244140625, 76.4306640625, 78.35888671875, 80.287109375, 82.21533203125, 84.1435546875, 86.07177734375, 88.0]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 12.0, 20.0, 41.0, 142.0, 931.0, 1033163.0, 13737.0, 382.0, 79.0, 31.0, 11.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.953125, -9.495849609375, -9.03857421875, -8.581298828125, -8.1240234375, -7.666748046875, -7.20947265625, -6.752197265625, -6.294921875, -5.837646484375, -5.38037109375, -4.923095703125, -4.4658203125, -4.008544921875, -3.55126953125, -3.093994140625, -2.63671875, -2.179443359375, -1.72216796875, -1.264892578125, -0.8076171875, -0.350341796875, 0.10693359375, 0.564208984375, 1.021484375, 1.478759765625, 1.93603515625, 2.393310546875, 2.8505859375, 3.307861328125, 3.76513671875, 4.222412109375, 4.6796875, 5.136962890625, 5.59423828125, 6.051513671875, 6.5087890625, 6.966064453125, 7.42333984375, 7.880615234375, 8.337890625, 8.795166015625, 9.25244140625, 9.709716796875, 10.1669921875, 10.624267578125, 11.08154296875, 11.538818359375, 11.99609375, 12.453369140625, 12.91064453125, 13.367919921875, 13.8251953125, 14.282470703125, 14.73974609375, 15.197021484375, 15.654296875, 16.111572265625, 16.56884765625, 17.026123046875, 17.4833984375, 17.940673828125, 18.39794921875, 18.855224609375, 19.3125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 7.0, 8.0, 9.0, 17.0, 14.0, 31.0, 29.0, 53.0, 77.0, 114.0, 149.0, 146.0, 93.0, 73.0, 45.0, 35.0, 22.0, 12.0, 13.0, 8.0, 11.0, 6.0, 6.0, 3.0, 2.0, 7.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001894235610961914, -0.00018262676894664764, -0.00017582997679710388, -0.00016903318464756012, -0.00016223639249801636, -0.0001554396003484726, -0.00014864280819892883, -0.00014184601604938507, -0.0001350492238998413, -0.00012825243175029755, -0.00012145563960075378, -0.00011465884745121002, -0.00010786205530166626, -0.0001010652631521225, -9.426847100257874e-05, -8.747167885303497e-05, -8.067488670349121e-05, -7.387809455394745e-05, -6.708130240440369e-05, -6.0284510254859924e-05, -5.348771810531616e-05, -4.66909259557724e-05, -3.989413380622864e-05, -3.3097341656684875e-05, -2.6300549507141113e-05, -1.950375735759735e-05, -1.2706965208053589e-05, -5.910173058509827e-06, 8.866190910339355e-07, 7.683411240577698e-06, 1.448020339012146e-05, 2.1276995539665222e-05, 2.8073787689208984e-05, 3.4870579838752747e-05, 4.166737198829651e-05, 4.846416413784027e-05, 5.526095628738403e-05, 6.20577484369278e-05, 6.885454058647156e-05, 7.565133273601532e-05, 8.244812488555908e-05, 8.924491703510284e-05, 9.60417091846466e-05, 0.00010283850133419037, 0.00010963529348373413, 0.00011643208563327789, 0.00012322887778282166, 0.00013002566993236542, 0.00013682246208190918, 0.00014361925423145294, 0.0001504160463809967, 0.00015721283853054047, 0.00016400963068008423, 0.000170806422829628, 0.00017760321497917175, 0.00018440000712871552, 0.00019119679927825928, 0.00019799359142780304, 0.0002047903835773468, 0.00021158717572689056, 0.00021838396787643433, 0.0002251807600259781, 0.00023197755217552185, 0.0002387743443250656, 0.0002455711364746094]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 7.0, 24.0, 48.0, 166.0, 642.0, 35337.0, 1010495.0, 1487.0, 231.0, 58.0, 32.0, 14.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.28125, -15.8951416015625, -15.509033203125, -15.1229248046875, -14.73681640625, -14.3507080078125, -13.964599609375, -13.5784912109375, -13.1923828125, -12.8062744140625, -12.420166015625, -12.0340576171875, -11.64794921875, -11.2618408203125, -10.875732421875, -10.4896240234375, -10.103515625, -9.7174072265625, -9.331298828125, -8.9451904296875, -8.55908203125, -8.1729736328125, -7.786865234375, -7.4007568359375, -7.0146484375, -6.6285400390625, -6.242431640625, -5.8563232421875, -5.47021484375, -5.0841064453125, -4.697998046875, -4.3118896484375, -3.92578125, -3.5396728515625, -3.153564453125, -2.7674560546875, -2.38134765625, -1.9952392578125, -1.609130859375, -1.2230224609375, -0.8369140625, -0.4508056640625, -0.064697265625, 0.3214111328125, 0.70751953125, 1.0936279296875, 1.479736328125, 1.8658447265625, 2.251953125, 2.6380615234375, 3.024169921875, 3.4102783203125, 3.79638671875, 4.1824951171875, 4.568603515625, 4.9547119140625, 5.3408203125, 5.7269287109375, 6.113037109375, 6.4991455078125, 6.88525390625, 7.2713623046875, 7.657470703125, 8.0435791015625, 8.4296875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 10.0, 28.0, 76.0, 421.0, 367.0, 64.0, 17.0, 12.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.5, -16.0970458984375, -15.694091796875, -15.2911376953125, -14.88818359375, -14.4852294921875, -14.082275390625, -13.6793212890625, -13.2763671875, -12.8734130859375, -12.470458984375, -12.0675048828125, -11.66455078125, -11.2615966796875, -10.858642578125, -10.4556884765625, -10.052734375, -9.6497802734375, -9.246826171875, -8.8438720703125, -8.44091796875, -8.0379638671875, -7.635009765625, -7.2320556640625, -6.8291015625, -6.4261474609375, -6.023193359375, -5.6202392578125, -5.21728515625, -4.8143310546875, -4.411376953125, -4.0084228515625, -3.60546875, -3.2025146484375, -2.799560546875, -2.3966064453125, -1.99365234375, -1.5906982421875, -1.187744140625, -0.7847900390625, -0.3818359375, 0.0211181640625, 0.424072265625, 0.8270263671875, 1.22998046875, 1.6329345703125, 2.035888671875, 2.4388427734375, 2.841796875, 3.2447509765625, 3.647705078125, 4.0506591796875, 4.45361328125, 4.8565673828125, 5.259521484375, 5.6624755859375, 6.0654296875, 6.4683837890625, 6.871337890625, 7.2742919921875, 7.67724609375, 8.0802001953125, 8.483154296875, 8.8861083984375, 9.2890625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 7.0, 5.0, 28.0, 156.0, 492.0, 222.0, 60.0, 17.0, 10.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-256.1046447753906, -250.3303985595703, -244.55615234375, -238.7819061279297, -233.00765991210938, -227.23341369628906, -221.45916748046875, -215.6849365234375, -209.91067504882812, -204.1364288330078, -198.3621826171875, -192.5879364013672, -186.81369018554688, -181.03944396972656, -175.26519775390625, -169.490966796875, -163.7167205810547, -157.94247436523438, -152.16822814941406, -146.39398193359375, -140.61973571777344, -134.84548950195312, -129.07125854492188, -123.29700469970703, -117.52275848388672, -111.7485122680664, -105.9742660522461, -100.20002746582031, -94.42578125, -88.65153503417969, -82.87728881835938, -77.10304260253906, -71.32878875732422, -65.5545425415039, -59.780296325683594, -54.00605392456055, -48.231807708740234, -42.45756149291992, -36.683319091796875, -30.909072875976562, -25.13482666015625, -19.360580444335938, -13.586336135864258, -7.812091827392578, -2.0378456115722656, 3.736400604248047, 9.510643005371094, 15.284889221191406, 21.05913543701172, 26.83338165283203, 32.607627868652344, 38.38187026977539, 44.1561164855957, 49.930362701416016, 55.70460510253906, 61.478851318359375, 67.25309753417969, 73.02734375, 78.80158996582031, 84.57583618164062, 90.35008239746094, 96.12432861328125, 101.89856719970703, 107.67281341552734, 113.44705963134766]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 10.0, 13.0, 13.0, 15.0, 21.0, 25.0, 34.0, 33.0, 44.0, 46.0, 60.0, 72.0, 82.0, 76.0, 66.0, 71.0, 64.0, 43.0, 45.0, 48.0, 31.0, 24.0, 11.0, 17.0, 13.0, 10.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.9471435546875, -77.71564483642578, -73.48414611816406, -69.25264739990234, -65.02114868164062, -60.789649963378906, -56.55815505981445, -52.326656341552734, -48.095157623291016, -43.8636589050293, -39.63216018676758, -35.400665283203125, -31.169164657592773, -26.937665939331055, -22.70616912841797, -18.47467041015625, -14.243171691894531, -10.011672973632812, -5.78017520904541, -1.5486774444580078, 2.682821273803711, 6.91431999206543, 11.145816802978516, 15.377315521240234, 19.608814239501953, 23.840312957763672, 28.07181167602539, 32.303306579589844, 36.53480529785156, 40.76630401611328, 44.997802734375, 49.22930145263672, 53.46080017089844, 57.692298889160156, 61.923797607421875, 66.1552963256836, 70.38679504394531, 74.61829376220703, 78.84979248046875, 83.08128356933594, 87.31278991699219, 91.5442886352539, 95.77578735351562, 100.00728607177734, 104.23878479003906, 108.47028350830078, 112.7017822265625, 116.93327331542969, 121.1647720336914, 125.39627075195312, 129.6277618408203, 133.85926818847656, 138.09075927734375, 142.322265625, 146.5537567138672, 150.78526306152344, 155.01675415039062, 159.2482452392578, 163.47975158691406, 167.71124267578125, 171.9427490234375, 176.1742401123047, 180.40574645996094, 184.63723754882812, 188.86874389648438]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 11.0, 9.0, 7.0, 26.0, 27.0, 47.0, 79.0, 91.0, 144.0, 252.0, 404.0, 733.0, 1210.0, 2190.0, 4264.0, 8955.0, 27393.0, 210128.0, 3373499.0, 496189.0, 44862.0, 12310.0, 5392.0, 2725.0, 1405.0, 796.0, 464.0, 260.0, 147.0, 99.0, 47.0, 34.0, 21.0, 23.0, 9.0, 11.0, 7.0, 7.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.759765625, -2.66668701171875, -2.5736083984375, -2.48052978515625, -2.387451171875, -2.29437255859375, -2.2012939453125, -2.10821533203125, -2.01513671875, -1.92205810546875, -1.8289794921875, -1.73590087890625, -1.642822265625, -1.54974365234375, -1.4566650390625, -1.36358642578125, -1.2705078125, -1.17742919921875, -1.0843505859375, -0.99127197265625, -0.898193359375, -0.80511474609375, -0.7120361328125, -0.61895751953125, -0.52587890625, -0.43280029296875, -0.3397216796875, -0.24664306640625, -0.153564453125, -0.06048583984375, 0.0325927734375, 0.12567138671875, 0.21875, 0.31182861328125, 0.4049072265625, 0.49798583984375, 0.591064453125, 0.68414306640625, 0.7772216796875, 0.87030029296875, 0.96337890625, 1.05645751953125, 1.1495361328125, 1.24261474609375, 1.335693359375, 1.42877197265625, 1.5218505859375, 1.61492919921875, 1.7080078125, 1.80108642578125, 1.8941650390625, 1.98724365234375, 2.080322265625, 2.17340087890625, 2.2664794921875, 2.35955810546875, 2.45263671875, 2.54571533203125, 2.6387939453125, 2.73187255859375, 2.824951171875, 2.91802978515625, 3.0111083984375, 3.10418701171875, 3.197265625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 6.0, 7.0, 9.0, 11.0, 8.0, 10.0, 16.0, 12.0, 27.0, 34.0, 33.0, 24.0, 44.0, 39.0, 46.0, 53.0, 59.0, 56.0, 57.0, 58.0, 60.0, 46.0, 38.0, 45.0, 32.0, 27.0, 19.0, 23.0, 14.0, 11.0, 16.0, 14.0, 14.0, 6.0, 4.0, 4.0, 6.0, 6.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.873046875, -2.78851318359375, -2.7039794921875, -2.61944580078125, -2.534912109375, -2.45037841796875, -2.3658447265625, -2.28131103515625, -2.19677734375, -2.11224365234375, -2.0277099609375, -1.94317626953125, -1.858642578125, -1.77410888671875, -1.6895751953125, -1.60504150390625, -1.5205078125, -1.43597412109375, -1.3514404296875, -1.26690673828125, -1.182373046875, -1.09783935546875, -1.0133056640625, -0.92877197265625, -0.84423828125, -0.75970458984375, -0.6751708984375, -0.59063720703125, -0.506103515625, -0.42156982421875, -0.3370361328125, -0.25250244140625, -0.16796875, -0.08343505859375, 0.0010986328125, 0.08563232421875, 0.170166015625, 0.25469970703125, 0.3392333984375, 0.42376708984375, 0.50830078125, 0.59283447265625, 0.6773681640625, 0.76190185546875, 0.846435546875, 0.93096923828125, 1.0155029296875, 1.10003662109375, 1.1845703125, 1.26910400390625, 1.3536376953125, 1.43817138671875, 1.522705078125, 1.60723876953125, 1.6917724609375, 1.77630615234375, 1.86083984375, 1.94537353515625, 2.0299072265625, 2.11444091796875, 2.198974609375, 2.28350830078125, 2.3680419921875, 2.45257568359375, 2.537109375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 9.0, 13.0, 25.0, 55.0, 142.0, 600.0, 49322.0, 4141759.0, 1955.0, 240.0, 91.0, 44.0, 23.0, 7.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.625, -26.766845703125, -25.90869140625, -25.050537109375, -24.1923828125, -23.334228515625, -22.47607421875, -21.617919921875, -20.759765625, -19.901611328125, -19.04345703125, -18.185302734375, -17.3271484375, -16.468994140625, -15.61083984375, -14.752685546875, -13.89453125, -13.036376953125, -12.17822265625, -11.320068359375, -10.4619140625, -9.603759765625, -8.74560546875, -7.887451171875, -7.029296875, -6.171142578125, -5.31298828125, -4.454833984375, -3.5966796875, -2.738525390625, -1.88037109375, -1.022216796875, -0.1640625, 0.694091796875, 1.55224609375, 2.410400390625, 3.2685546875, 4.126708984375, 4.98486328125, 5.843017578125, 6.701171875, 7.559326171875, 8.41748046875, 9.275634765625, 10.1337890625, 10.991943359375, 11.85009765625, 12.708251953125, 13.56640625, 14.424560546875, 15.28271484375, 16.140869140625, 16.9990234375, 17.857177734375, 18.71533203125, 19.573486328125, 20.431640625, 21.289794921875, 22.14794921875, 23.006103515625, 23.8642578125, 24.722412109375, 25.58056640625, 26.438720703125, 27.296875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 13.0, 6.0, 12.0, 26.0, 38.0, 73.0, 239.0, 2233.0, 1199.0, 114.0, 40.0, 24.0, 22.0, 13.0, 6.0, 4.0, 7.0, 2.0, 0.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.33203125, -6.98052978515625, -6.6290283203125, -6.27752685546875, -5.926025390625, -5.57452392578125, -5.2230224609375, -4.87152099609375, -4.52001953125, -4.16851806640625, -3.8170166015625, -3.46551513671875, -3.114013671875, -2.76251220703125, -2.4110107421875, -2.05950927734375, -1.7080078125, -1.35650634765625, -1.0050048828125, -0.65350341796875, -0.302001953125, 0.04949951171875, 0.4010009765625, 0.75250244140625, 1.10400390625, 1.45550537109375, 1.8070068359375, 2.15850830078125, 2.510009765625, 2.86151123046875, 3.2130126953125, 3.56451416015625, 3.916015625, 4.26751708984375, 4.6190185546875, 4.97052001953125, 5.322021484375, 5.67352294921875, 6.0250244140625, 6.37652587890625, 6.72802734375, 7.07952880859375, 7.4310302734375, 7.78253173828125, 8.134033203125, 8.48553466796875, 8.8370361328125, 9.18853759765625, 9.5400390625, 9.89154052734375, 10.2430419921875, 10.59454345703125, 10.946044921875, 11.29754638671875, 11.6490478515625, 12.00054931640625, 12.35205078125, 12.70355224609375, 13.0550537109375, 13.40655517578125, 13.758056640625, 14.10955810546875, 14.4610595703125, 14.81256103515625, 15.1640625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 8.0, 10.0, 13.0, 14.0, 33.0, 74.0, 158.0, 280.0, 220.0, 120.0, 35.0, 12.0, 4.0, 2.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.198890686035156, -51.682254791259766, -50.165618896484375, -48.648983001708984, -47.132347106933594, -45.6157112121582, -44.09907531738281, -42.582435607910156, -41.06580352783203, -39.54916763305664, -38.03253173828125, -36.51589584350586, -34.99925994873047, -33.48262405395508, -31.965986251831055, -30.449350357055664, -28.93271255493164, -27.41607666015625, -25.89944076538086, -24.38280487060547, -22.866168975830078, -21.349533081054688, -19.832895278930664, -18.316259384155273, -16.799623489379883, -15.282987594604492, -13.766351699829102, -12.249714851379395, -10.733078956604004, -9.216443061828613, -7.699806213378906, -6.183170318603516, -4.666538238525391, -3.149902105331421, -1.6332659721374512, -0.11662960052490234, 1.4000062942504883, 2.916642189025879, 4.433279037475586, 5.949914932250977, 7.466550827026367, 8.983186721801758, 10.499822616577148, 12.016459465026855, 13.533095359802246, 15.049731254577637, 16.566368103027344, 18.083003997802734, 19.599639892578125, 21.116275787353516, 22.632911682128906, 24.149547576904297, 25.666183471679688, 27.182819366455078, 28.6994571685791, 30.216093063354492, 31.732728958129883, 33.249366760253906, 34.7660026550293, 36.28263854980469, 37.79927444458008, 39.31591033935547, 40.83254623413086, 42.34918212890625, 43.86581802368164]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 12.0, 11.0, 13.0, 12.0, 27.0, 27.0, 27.0, 43.0, 40.0, 48.0, 36.0, 50.0, 53.0, 56.0, 56.0, 42.0, 55.0, 49.0, 40.0, 43.0, 44.0, 38.0, 34.0, 19.0, 22.0, 12.0, 11.0, 10.0, 6.0, 8.0, 10.0, 4.0, 7.0, 4.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-25.131750106811523, -24.353090286254883, -23.574432373046875, -22.795772552490234, -22.017112731933594, -21.238452911376953, -20.459794998168945, -19.681135177612305, -18.902477264404297, -18.123817443847656, -17.34515953063965, -16.566499710083008, -15.787839889526367, -15.009181022644043, -14.230522155761719, -13.451862335205078, -12.673202514648438, -11.894543647766113, -11.115883827209473, -10.337224960327148, -9.558565139770508, -8.779906272888184, -8.00124740600586, -7.222588062286377, -6.4439287185668945, -5.665269374847412, -4.88661003112793, -4.1079511642456055, -3.329291820526123, -2.5506324768066406, -1.7719736099243164, -0.993314266204834, -0.21465301513671875, 0.5640062093734741, 1.342665433883667, 2.1213245391845703, 2.8999838829040527, 3.678643226623535, 4.457302093505859, 5.235961437225342, 6.014620780944824, 6.793280124664307, 7.571939468383789, 8.350598335266113, 9.129257202148438, 9.907917022705078, 10.686575889587402, 11.465234756469727, 12.243894577026367, 13.022553443908691, 13.801213264465332, 14.579872131347656, 15.358531951904297, 16.137191772460938, 16.915849685668945, 17.694509506225586, 18.473167419433594, 19.251827239990234, 20.030485153198242, 20.809144973754883, 21.587804794311523, 22.36646270751953, 23.145122528076172, 23.923782348632812, 24.702442169189453]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 7.0, 8.0, 14.0, 21.0, 44.0, 46.0, 54.0, 95.0, 153.0, 244.0, 376.0, 544.0, 991.0, 1625.0, 2797.0, 4769.0, 9001.0, 16655.0, 34067.0, 74287.0, 170938.0, 323030.0, 222401.0, 96970.0, 43443.0, 21037.0, 10959.0, 5844.0, 3223.0, 1899.0, 1070.0, 652.0, 435.0, 291.0, 206.0, 114.0, 82.0, 41.0, 28.0, 27.0, 19.0, 8.0, 8.0, 7.0, 5.0, 5.0, 1.0, 5.0, 3.0, 3.0], "bins": [-2.12109375, -2.061614990234375, -2.00213623046875, -1.942657470703125, -1.8831787109375, -1.823699951171875, -1.76422119140625, -1.704742431640625, -1.645263671875, -1.585784912109375, -1.52630615234375, -1.466827392578125, -1.4073486328125, -1.347869873046875, -1.28839111328125, -1.228912353515625, -1.16943359375, -1.109954833984375, -1.05047607421875, -0.990997314453125, -0.9315185546875, -0.872039794921875, -0.81256103515625, -0.753082275390625, -0.693603515625, -0.634124755859375, -0.57464599609375, -0.515167236328125, -0.4556884765625, -0.396209716796875, -0.33673095703125, -0.277252197265625, -0.2177734375, -0.158294677734375, -0.09881591796875, -0.039337158203125, 0.0201416015625, 0.079620361328125, 0.13909912109375, 0.198577880859375, 0.258056640625, 0.317535400390625, 0.37701416015625, 0.436492919921875, 0.4959716796875, 0.555450439453125, 0.61492919921875, 0.674407958984375, 0.73388671875, 0.793365478515625, 0.85284423828125, 0.912322998046875, 0.9718017578125, 1.031280517578125, 1.09075927734375, 1.150238037109375, 1.209716796875, 1.269195556640625, 1.32867431640625, 1.388153076171875, 1.4476318359375, 1.507110595703125, 1.56658935546875, 1.626068115234375, 1.685546875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 5.0, 2.0, 8.0, 11.0, 12.0, 16.0, 8.0, 17.0, 10.0, 26.0, 26.0, 20.0, 20.0, 37.0, 39.0, 46.0, 45.0, 31.0, 37.0, 53.0, 41.0, 46.0, 55.0, 40.0, 43.0, 40.0, 42.0, 26.0, 31.0, 26.0, 15.0, 17.0, 20.0, 11.0, 15.0, 12.0, 8.0, 4.0, 4.0, 10.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-2.265625, -2.19573974609375, -2.1258544921875, -2.05596923828125, -1.986083984375, -1.91619873046875, -1.8463134765625, -1.77642822265625, -1.70654296875, -1.63665771484375, -1.5667724609375, -1.49688720703125, -1.427001953125, -1.35711669921875, -1.2872314453125, -1.21734619140625, -1.1474609375, -1.07757568359375, -1.0076904296875, -0.93780517578125, -0.867919921875, -0.79803466796875, -0.7281494140625, -0.65826416015625, -0.58837890625, -0.51849365234375, -0.4486083984375, -0.37872314453125, -0.308837890625, -0.23895263671875, -0.1690673828125, -0.09918212890625, -0.029296875, 0.04058837890625, 0.1104736328125, 0.18035888671875, 0.250244140625, 0.32012939453125, 0.3900146484375, 0.45989990234375, 0.52978515625, 0.59967041015625, 0.6695556640625, 0.73944091796875, 0.809326171875, 0.87921142578125, 0.9490966796875, 1.01898193359375, 1.0888671875, 1.15875244140625, 1.2286376953125, 1.29852294921875, 1.368408203125, 1.43829345703125, 1.5081787109375, 1.57806396484375, 1.64794921875, 1.71783447265625, 1.7877197265625, 1.85760498046875, 1.927490234375, 1.99737548828125, 2.0672607421875, 2.13714599609375, 2.20703125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 5.0, 0.0, 2.0, 2.0, 11.0, 12.0, 9.0, 25.0, 40.0, 67.0, 81.0, 135.0, 213.0, 388.0, 730.0, 1928.0, 9508.0, 412215.0, 607978.0, 11285.0, 2070.0, 807.0, 438.0, 243.0, 136.0, 79.0, 45.0, 36.0, 22.0, 17.0, 10.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 3.0, 1.0], "bins": [-13.6484375, -13.32373046875, -12.9990234375, -12.67431640625, -12.349609375, -12.02490234375, -11.7001953125, -11.37548828125, -11.05078125, -10.72607421875, -10.4013671875, -10.07666015625, -9.751953125, -9.42724609375, -9.1025390625, -8.77783203125, -8.453125, -8.12841796875, -7.8037109375, -7.47900390625, -7.154296875, -6.82958984375, -6.5048828125, -6.18017578125, -5.85546875, -5.53076171875, -5.2060546875, -4.88134765625, -4.556640625, -4.23193359375, -3.9072265625, -3.58251953125, -3.2578125, -2.93310546875, -2.6083984375, -2.28369140625, -1.958984375, -1.63427734375, -1.3095703125, -0.98486328125, -0.66015625, -0.33544921875, -0.0107421875, 0.31396484375, 0.638671875, 0.96337890625, 1.2880859375, 1.61279296875, 1.9375, 2.26220703125, 2.5869140625, 2.91162109375, 3.236328125, 3.56103515625, 3.8857421875, 4.21044921875, 4.53515625, 4.85986328125, 5.1845703125, 5.50927734375, 5.833984375, 6.15869140625, 6.4833984375, 6.80810546875, 7.1328125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 6.0, 12.0, 6.0, 11.0, 8.0, 4.0, 17.0, 26.0, 27.0, 32.0, 42.0, 46.0, 56.0, 60.0, 63.0, 52.0, 57.0, 58.0, 56.0, 57.0, 64.0, 42.0, 40.0, 40.0, 24.0, 24.0, 18.0, 15.0, 9.0, 8.0, 8.0, 5.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-15.1484375, -14.7421875, -14.3359375, -13.9296875, -13.5234375, -13.1171875, -12.7109375, -12.3046875, -11.8984375, -11.4921875, -11.0859375, -10.6796875, -10.2734375, -9.8671875, -9.4609375, -9.0546875, -8.6484375, -8.2421875, -7.8359375, -7.4296875, -7.0234375, -6.6171875, -6.2109375, -5.8046875, -5.3984375, -4.9921875, -4.5859375, -4.1796875, -3.7734375, -3.3671875, -2.9609375, -2.5546875, -2.1484375, -1.7421875, -1.3359375, -0.9296875, -0.5234375, -0.1171875, 0.2890625, 0.6953125, 1.1015625, 1.5078125, 1.9140625, 2.3203125, 2.7265625, 3.1328125, 3.5390625, 3.9453125, 4.3515625, 4.7578125, 5.1640625, 5.5703125, 5.9765625, 6.3828125, 6.7890625, 7.1953125, 7.6015625, 8.0078125, 8.4140625, 8.8203125, 9.2265625, 9.6328125, 10.0390625, 10.4453125, 10.8515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 9.0, 18.0, 20.0, 23.0, 35.0, 47.0, 97.0, 179.0, 347.0, 1081.0, 4270.0, 40886.0, 945830.0, 49286.0, 4503.0, 1054.0, 403.0, 189.0, 89.0, 55.0, 47.0, 22.0, 6.0, 14.0, 6.0, 7.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.896484375, -2.812591552734375, -2.72869873046875, -2.644805908203125, -2.5609130859375, -2.477020263671875, -2.39312744140625, -2.309234619140625, -2.225341796875, -2.141448974609375, -2.05755615234375, -1.973663330078125, -1.8897705078125, -1.805877685546875, -1.72198486328125, -1.638092041015625, -1.55419921875, -1.470306396484375, -1.38641357421875, -1.302520751953125, -1.2186279296875, -1.134735107421875, -1.05084228515625, -0.966949462890625, -0.883056640625, -0.799163818359375, -0.71527099609375, -0.631378173828125, -0.5474853515625, -0.463592529296875, -0.37969970703125, -0.295806884765625, -0.2119140625, -0.128021240234375, -0.04412841796875, 0.039764404296875, 0.1236572265625, 0.207550048828125, 0.29144287109375, 0.375335693359375, 0.459228515625, 0.543121337890625, 0.62701416015625, 0.710906982421875, 0.7947998046875, 0.878692626953125, 0.96258544921875, 1.046478271484375, 1.13037109375, 1.214263916015625, 1.29815673828125, 1.382049560546875, 1.4659423828125, 1.549835205078125, 1.63372802734375, 1.717620849609375, 1.801513671875, 1.885406494140625, 1.96929931640625, 2.053192138671875, 2.1370849609375, 2.220977783203125, 2.30487060546875, 2.388763427734375, 2.47265625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 3.0, 7.0, 12.0, 12.0, 16.0, 24.0, 32.0, 46.0, 49.0, 110.0, 125.0, 146.0, 120.0, 76.0, 77.0, 48.0, 19.0, 26.0, 18.0, 9.0, 8.0, 8.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00028324127197265625, -0.00027640722692012787, -0.0002695731818675995, -0.0002627391368150711, -0.0002559050917625427, -0.00024907104671001434, -0.00024223700165748596, -0.00023540295660495758, -0.0002285689115524292, -0.00022173486649990082, -0.00021490082144737244, -0.00020806677639484406, -0.00020123273134231567, -0.0001943986862897873, -0.0001875646412372589, -0.00018073059618473053, -0.00017389655113220215, -0.00016706250607967377, -0.00016022846102714539, -0.000153394415974617, -0.00014656037092208862, -0.00013972632586956024, -0.00013289228081703186, -0.00012605823576450348, -0.0001192241907119751, -0.00011239014565944672, -0.00010555610060691833, -9.872205555438995e-05, -9.188801050186157e-05, -8.505396544933319e-05, -7.821992039680481e-05, -7.138587534427643e-05, -6.455183029174805e-05, -5.7717785239219666e-05, -5.0883740186691284e-05, -4.40496951341629e-05, -3.721565008163452e-05, -3.038160502910614e-05, -2.354755997657776e-05, -1.6713514924049377e-05, -9.879469871520996e-06, -3.0454248189926147e-06, 3.7886202335357666e-06, 1.0622665286064148e-05, 1.745671033859253e-05, 2.429075539112091e-05, 3.112480044364929e-05, 3.795884549617767e-05, 4.4792890548706055e-05, 5.1626935601234436e-05, 5.846098065376282e-05, 6.52950257062912e-05, 7.212907075881958e-05, 7.896311581134796e-05, 8.579716086387634e-05, 9.263120591640472e-05, 9.94652509689331e-05, 0.00010629929602146149, 0.00011313334107398987, 0.00011996738612651825, 0.00012680143117904663, 0.000133635476231575, 0.0001404695212841034, 0.00014730356633663177, 0.00015413761138916016]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 5.0, 13.0, 27.0, 27.0, 50.0, 85.0, 178.0, 379.0, 871.0, 3369.0, 31457.0, 954189.0, 51844.0, 4097.0, 1115.0, 408.0, 189.0, 116.0, 43.0, 27.0, 20.0, 11.0, 11.0, 6.0, 3.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.330078125, -3.233734130859375, -3.13739013671875, -3.041046142578125, -2.9447021484375, -2.848358154296875, -2.75201416015625, -2.655670166015625, -2.559326171875, -2.462982177734375, -2.36663818359375, -2.270294189453125, -2.1739501953125, -2.077606201171875, -1.98126220703125, -1.884918212890625, -1.78857421875, -1.692230224609375, -1.59588623046875, -1.499542236328125, -1.4031982421875, -1.306854248046875, -1.21051025390625, -1.114166259765625, -1.017822265625, -0.921478271484375, -0.82513427734375, -0.728790283203125, -0.6324462890625, -0.536102294921875, -0.43975830078125, -0.343414306640625, -0.2470703125, -0.150726318359375, -0.05438232421875, 0.041961669921875, 0.1383056640625, 0.234649658203125, 0.33099365234375, 0.427337646484375, 0.523681640625, 0.620025634765625, 0.71636962890625, 0.812713623046875, 0.9090576171875, 1.005401611328125, 1.10174560546875, 1.198089599609375, 1.29443359375, 1.390777587890625, 1.48712158203125, 1.583465576171875, 1.6798095703125, 1.776153564453125, 1.87249755859375, 1.968841552734375, 2.065185546875, 2.161529541015625, 2.25787353515625, 2.354217529296875, 2.4505615234375, 2.546905517578125, 2.64324951171875, 2.739593505859375, 2.8359375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 13.0, 14.0, 15.0, 23.0, 36.0, 45.0, 51.0, 67.0, 72.0, 81.0, 81.0, 76.0, 76.0, 71.0, 59.0, 49.0, 35.0, 28.0, 28.0, 14.0, 13.0, 7.0, 4.0, 7.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8017578125, -1.7408905029296875, -1.680023193359375, -1.6191558837890625, -1.55828857421875, -1.4974212646484375, -1.436553955078125, -1.3756866455078125, -1.3148193359375, -1.2539520263671875, -1.193084716796875, -1.1322174072265625, -1.07135009765625, -1.0104827880859375, -0.949615478515625, -0.8887481689453125, -0.827880859375, -0.7670135498046875, -0.706146240234375, -0.6452789306640625, -0.58441162109375, -0.5235443115234375, -0.462677001953125, -0.4018096923828125, -0.3409423828125, -0.2800750732421875, -0.219207763671875, -0.1583404541015625, -0.09747314453125, -0.0366058349609375, 0.024261474609375, 0.0851287841796875, 0.14599609375, 0.2068634033203125, 0.267730712890625, 0.3285980224609375, 0.38946533203125, 0.4503326416015625, 0.511199951171875, 0.5720672607421875, 0.6329345703125, 0.6938018798828125, 0.754669189453125, 0.8155364990234375, 0.87640380859375, 0.9372711181640625, 0.998138427734375, 1.0590057373046875, 1.119873046875, 1.1807403564453125, 1.241607666015625, 1.3024749755859375, 1.36334228515625, 1.4242095947265625, 1.485076904296875, 1.5459442138671875, 1.6068115234375, 1.6676788330078125, 1.728546142578125, 1.7894134521484375, 1.85028076171875, 1.9111480712890625, 1.972015380859375, 2.0328826904296875, 2.09375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 21.0, 141.0, 650.0, 170.0, 14.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.50665283203125, -45.238956451416016, -40.97126007080078, -36.70356369018555, -32.43586730957031, -28.168170928955078, -23.900474548339844, -19.63277816772461, -15.365081787109375, -11.09738540649414, -6.829689025878906, -2.561992645263672, 1.7057037353515625, 5.973400115966797, 10.241096496582031, 14.508792877197266, 18.7764892578125, 23.044185638427734, 27.31188201904297, 31.579578399658203, 35.84727478027344, 40.11497116088867, 44.382667541503906, 48.65036392211914, 52.918060302734375, 57.18575668334961, 61.453453063964844, 65.72114562988281, 69.98884582519531, 74.25654602050781, 78.52423858642578, 82.79193115234375, 87.05961608886719, 91.32731628417969, 95.59500885009766, 99.86270141601562, 104.13040161132812, 108.39810180664062, 112.6657943725586, 116.93348693847656, 121.20118713378906, 125.46888732910156, 129.736572265625, 134.0042724609375, 138.27197265625, 142.5396728515625, 146.807373046875, 151.07505798339844, 155.34275817871094, 159.61045837402344, 163.87814331054688, 168.14584350585938, 172.41354370117188, 176.68124389648438, 180.94894409179688, 185.2166290283203, 189.4843292236328, 193.7520294189453, 198.01971435546875, 202.28741455078125, 206.55511474609375, 210.82281494140625, 215.09051513671875, 219.3582000732422, 223.6259002685547]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 12.0, 12.0, 17.0, 20.0, 27.0, 31.0, 31.0, 40.0, 53.0, 56.0, 62.0, 77.0, 81.0, 73.0, 59.0, 54.0, 64.0, 54.0, 35.0, 22.0, 29.0, 16.0, 7.0, 13.0, 13.0, 9.0, 10.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.91963195800781, -62.166988372802734, -60.41434860229492, -58.661705017089844, -56.909061431884766, -55.15641784667969, -53.403778076171875, -51.6511344909668, -49.89849090576172, -48.14584732055664, -46.39320755004883, -44.64056396484375, -42.88792037963867, -41.135276794433594, -39.38263702392578, -37.6299934387207, -35.87735366821289, -34.12471008300781, -32.3720703125, -30.619426727294922, -28.866783142089844, -27.1141414642334, -25.361499786376953, -23.608856201171875, -21.85621452331543, -20.103572845458984, -18.350929260253906, -16.59828758239746, -14.8456449508667, -13.093002319335938, -11.340360641479492, -9.58771800994873, -7.835079193115234, -6.082436561584473, -4.329794406890869, -2.5771522521972656, -0.8245096206665039, 0.9281330108642578, 2.680774688720703, 4.433417320251465, 6.186059951782227, 7.938702583312988, 9.69134521484375, 11.443986892700195, 13.196629524230957, 14.949272155761719, 16.701913833618164, 18.45455551147461, 20.207199096679688, 21.959840774536133, 23.71248435974121, 25.465126037597656, 27.217769622802734, 28.97041130065918, 30.723052978515625, 32.4756965637207, 34.22834014892578, 35.98098373413086, 37.73362350463867, 39.48626708984375, 41.23891067504883, 42.991554260253906, 44.74419403076172, 46.4968376159668, 48.24947738647461]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0, 8.0, 4.0, 12.0, 14.0, 9.0, 15.0, 27.0, 45.0, 47.0, 63.0, 94.0, 132.0, 185.0, 476.0, 3225.0, 2468854.0, 1716041.0, 3918.0, 510.0, 190.0, 119.0, 74.0, 55.0, 45.0, 31.0, 18.0, 23.0, 13.0, 9.0, 8.0, 5.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.75, -13.3201904296875, -12.890380859375, -12.4605712890625, -12.03076171875, -11.6009521484375, -11.171142578125, -10.7413330078125, -10.3115234375, -9.8817138671875, -9.451904296875, -9.0220947265625, -8.59228515625, -8.1624755859375, -7.732666015625, -7.3028564453125, -6.873046875, -6.4432373046875, -6.013427734375, -5.5836181640625, -5.15380859375, -4.7239990234375, -4.294189453125, -3.8643798828125, -3.4345703125, -3.0047607421875, -2.574951171875, -2.1451416015625, -1.71533203125, -1.2855224609375, -0.855712890625, -0.4259033203125, 0.00390625, 0.4337158203125, 0.863525390625, 1.2933349609375, 1.72314453125, 2.1529541015625, 2.582763671875, 3.0125732421875, 3.4423828125, 3.8721923828125, 4.302001953125, 4.7318115234375, 5.16162109375, 5.5914306640625, 6.021240234375, 6.4510498046875, 6.880859375, 7.3106689453125, 7.740478515625, 8.1702880859375, 8.60009765625, 9.0299072265625, 9.459716796875, 9.8895263671875, 10.3193359375, 10.7491455078125, 11.178955078125, 11.6087646484375, 12.03857421875, 12.4683837890625, 12.898193359375, 13.3280029296875, 13.7578125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 9.0, 15.0, 34.0, 43.0, 56.0, 104.0, 125.0, 136.0, 150.0, 118.0, 71.0, 60.0, 41.0, 24.0, 11.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -9.1396484375, -8.935546875, -8.7314453125, -8.52734375, -8.3232421875, -8.119140625, -7.9150390625, -7.7109375, -7.5068359375, -7.302734375, -7.0986328125, -6.89453125, -6.6904296875, -6.486328125, -6.2822265625, -6.078125, -5.8740234375, -5.669921875, -5.4658203125, -5.26171875, -5.0576171875, -4.853515625, -4.6494140625, -4.4453125, -4.2412109375, -4.037109375, -3.8330078125, -3.62890625, -3.4248046875, -3.220703125, -3.0166015625, -2.8125, -2.6083984375, -2.404296875, -2.2001953125, -1.99609375, -1.7919921875, -1.587890625, -1.3837890625, -1.1796875, -0.9755859375, -0.771484375, -0.5673828125, -0.36328125, -0.1591796875, 0.044921875, 0.2490234375, 0.453125, 0.6572265625, 0.861328125, 1.0654296875, 1.26953125, 1.4736328125, 1.677734375, 1.8818359375, 2.0859375, 2.2900390625, 2.494140625, 2.6982421875, 2.90234375, 3.1064453125, 3.310546875, 3.5146484375, 3.71875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 14.0, 25.0, 47.0, 58.0, 77.0, 315.0, 61885.0, 4131003.0, 472.0, 137.0, 89.0, 75.0, 43.0, 21.0, 12.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.734375, -30.518798828125, -29.30322265625, -28.087646484375, -26.8720703125, -25.656494140625, -24.44091796875, -23.225341796875, -22.009765625, -20.794189453125, -19.57861328125, -18.363037109375, -17.1474609375, -15.931884765625, -14.71630859375, -13.500732421875, -12.28515625, -11.069580078125, -9.85400390625, -8.638427734375, -7.4228515625, -6.207275390625, -4.99169921875, -3.776123046875, -2.560546875, -1.344970703125, -0.12939453125, 1.086181640625, 2.3017578125, 3.517333984375, 4.73291015625, 5.948486328125, 7.1640625, 8.379638671875, 9.59521484375, 10.810791015625, 12.0263671875, 13.241943359375, 14.45751953125, 15.673095703125, 16.888671875, 18.104248046875, 19.31982421875, 20.535400390625, 21.7509765625, 22.966552734375, 24.18212890625, 25.397705078125, 26.61328125, 27.828857421875, 29.04443359375, 30.260009765625, 31.4755859375, 32.691162109375, 33.90673828125, 35.122314453125, 36.337890625, 37.553466796875, 38.76904296875, 39.984619140625, 41.2001953125, 42.415771484375, 43.63134765625, 44.846923828125, 46.0625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 14.0, 20.0, 88.0, 3067.0, 805.0, 59.0, 12.0, 11.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.953125, -10.260498046875, -9.56787109375, -8.875244140625, -8.1826171875, -7.489990234375, -6.79736328125, -6.104736328125, -5.412109375, -4.719482421875, -4.02685546875, -3.334228515625, -2.6416015625, -1.948974609375, -1.25634765625, -0.563720703125, 0.12890625, 0.821533203125, 1.51416015625, 2.206787109375, 2.8994140625, 3.592041015625, 4.28466796875, 4.977294921875, 5.669921875, 6.362548828125, 7.05517578125, 7.747802734375, 8.4404296875, 9.133056640625, 9.82568359375, 10.518310546875, 11.2109375, 11.903564453125, 12.59619140625, 13.288818359375, 13.9814453125, 14.674072265625, 15.36669921875, 16.059326171875, 16.751953125, 17.444580078125, 18.13720703125, 18.829833984375, 19.5224609375, 20.215087890625, 20.90771484375, 21.600341796875, 22.29296875, 22.985595703125, 23.67822265625, 24.370849609375, 25.0634765625, 25.756103515625, 26.44873046875, 27.141357421875, 27.833984375, 28.526611328125, 29.21923828125, 29.911865234375, 30.6044921875, 31.297119140625, 31.98974609375, 32.682373046875, 33.375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 13.0, 21.0, 47.0, 148.0, 332.0, 260.0, 103.0, 39.0, 19.0, 8.0, 5.0, 2.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.54374313354492, -59.61746597290039, -57.69118881225586, -55.764915466308594, -53.83863830566406, -51.91236114501953, -49.986083984375, -48.05980682373047, -46.13352966308594, -44.207252502441406, -42.280975341796875, -40.354698181152344, -38.42842483520508, -36.50214767456055, -34.575870513916016, -32.649593353271484, -30.723318099975586, -28.797040939331055, -26.870765686035156, -24.944488525390625, -23.018211364746094, -21.091934204101562, -19.165658950805664, -17.239381790161133, -15.313105583190918, -13.386829376220703, -11.460552215576172, -9.534276008605957, -7.607999324798584, -5.681722640991211, -3.755446434020996, -1.8291692733764648, 0.09710693359375, 2.023383617401123, 3.949660062789917, 5.875936508178711, 7.802213191986084, 9.728489875793457, 11.654766082763672, 13.581043243408203, 15.507319450378418, 17.433595657348633, 19.359872817993164, 21.286148071289062, 23.212425231933594, 25.138702392578125, 27.064979553222656, 28.991256713867188, 30.917531967163086, 32.843807220458984, 34.770084381103516, 36.69636154174805, 38.62263870239258, 40.54891586303711, 42.475189208984375, 44.401466369628906, 46.32774353027344, 48.25402069091797, 50.1802978515625, 52.10657501220703, 54.0328483581543, 55.95912551879883, 57.88540267944336, 59.81167984008789, 61.73795700073242]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 8.0, 14.0, 8.0, 12.0, 13.0, 30.0, 40.0, 48.0, 58.0, 47.0, 56.0, 69.0, 69.0, 84.0, 65.0, 57.0, 49.0, 53.0, 44.0, 35.0, 30.0, 19.0, 24.0, 21.0, 11.0, 12.0, 8.0, 3.0, 6.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.435894012451172, -25.313499450683594, -24.19110679626465, -23.06871223449707, -21.946319580078125, -20.823925018310547, -19.70153045654297, -18.57913589477539, -17.456743240356445, -16.334348678588867, -15.211956024169922, -14.089561462402344, -12.967167854309082, -11.84477424621582, -10.722379684448242, -9.59998607635498, -8.477592468261719, -7.355198860168457, -6.232804775238037, -5.110410690307617, -3.9880170822143555, -2.8656234741210938, -1.7432293891906738, -0.6208353042602539, 0.5015583038330078, 1.6239521503448486, 2.7463459968566895, 3.8687398433685303, 4.991133689880371, 6.113527297973633, 7.235921382904053, 8.358315467834473, 9.480705261230469, 10.60309886932373, 11.725492477416992, 12.84788703918457, 13.970280647277832, 15.092674255371094, 16.215068817138672, 17.33746337890625, 18.459856033325195, 19.582250595092773, 20.70464324951172, 21.827037811279297, 22.949432373046875, 24.07182502746582, 25.1942195892334, 26.316612243652344, 27.439006805419922, 28.5614013671875, 29.683794021606445, 30.806188583374023, 31.92858123779297, 33.05097579956055, 34.173370361328125, 35.2957649230957, 36.41815948486328, 37.54055404663086, 38.66294860839844, 39.78533935546875, 40.90773391723633, 42.030128479003906, 43.152523040771484, 44.27491760253906, 45.397308349609375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 12.0, 14.0, 26.0, 21.0, 57.0, 65.0, 101.0, 158.0, 224.0, 343.0, 583.0, 953.0, 1637.0, 2937.0, 5598.0, 12571.0, 30210.0, 82537.0, 258010.0, 413011.0, 150723.0, 50925.0, 19540.0, 8673.0, 4078.0, 2194.0, 1261.0, 789.0, 424.0, 303.0, 171.0, 121.0, 88.0, 67.0, 41.0, 27.0, 20.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.943359375, -2.8392333984375, -2.735107421875, -2.6309814453125, -2.52685546875, -2.4227294921875, -2.318603515625, -2.2144775390625, -2.1103515625, -2.0062255859375, -1.902099609375, -1.7979736328125, -1.69384765625, -1.5897216796875, -1.485595703125, -1.3814697265625, -1.27734375, -1.1732177734375, -1.069091796875, -0.9649658203125, -0.86083984375, -0.7567138671875, -0.652587890625, -0.5484619140625, -0.4443359375, -0.3402099609375, -0.236083984375, -0.1319580078125, -0.02783203125, 0.0762939453125, 0.180419921875, 0.2845458984375, 0.388671875, 0.4927978515625, 0.596923828125, 0.7010498046875, 0.80517578125, 0.9093017578125, 1.013427734375, 1.1175537109375, 1.2216796875, 1.3258056640625, 1.429931640625, 1.5340576171875, 1.63818359375, 1.7423095703125, 1.846435546875, 1.9505615234375, 2.0546875, 2.1588134765625, 2.262939453125, 2.3670654296875, 2.47119140625, 2.5753173828125, 2.679443359375, 2.7835693359375, 2.8876953125, 2.9918212890625, 3.095947265625, 3.2000732421875, 3.30419921875, 3.4083251953125, 3.512451171875, 3.6165771484375, 3.720703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 9.0, 4.0, 4.0, 10.0, 12.0, 14.0, 14.0, 19.0, 29.0, 22.0, 46.0, 41.0, 50.0, 53.0, 57.0, 61.0, 60.0, 69.0, 59.0, 47.0, 49.0, 46.0, 41.0, 39.0, 46.0, 26.0, 21.0, 13.0, 14.0, 4.0, 7.0, 10.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.69140625, -3.58258056640625, -3.4737548828125, -3.36492919921875, -3.256103515625, -3.14727783203125, -3.0384521484375, -2.92962646484375, -2.82080078125, -2.71197509765625, -2.6031494140625, -2.49432373046875, -2.385498046875, -2.27667236328125, -2.1678466796875, -2.05902099609375, -1.9501953125, -1.84136962890625, -1.7325439453125, -1.62371826171875, -1.514892578125, -1.40606689453125, -1.2972412109375, -1.18841552734375, -1.07958984375, -0.97076416015625, -0.8619384765625, -0.75311279296875, -0.644287109375, -0.53546142578125, -0.4266357421875, -0.31781005859375, -0.208984375, -0.10015869140625, 0.0086669921875, 0.11749267578125, 0.226318359375, 0.33514404296875, 0.4439697265625, 0.55279541015625, 0.66162109375, 0.77044677734375, 0.8792724609375, 0.98809814453125, 1.096923828125, 1.20574951171875, 1.3145751953125, 1.42340087890625, 1.5322265625, 1.64105224609375, 1.7498779296875, 1.85870361328125, 1.967529296875, 2.07635498046875, 2.1851806640625, 2.29400634765625, 2.40283203125, 2.51165771484375, 2.6204833984375, 2.72930908203125, 2.838134765625, 2.94696044921875, 3.0557861328125, 3.16461181640625, 3.2734375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 5.0, 5.0, 16.0, 17.0, 21.0, 41.0, 72.0, 127.0, 206.0, 413.0, 931.0, 2729.0, 18301.0, 764250.0, 247872.0, 9950.0, 2011.0, 766.0, 319.0, 176.0, 111.0, 68.0, 44.0, 30.0, 12.0, 20.0, 10.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.3203125, -11.9337158203125, -11.547119140625, -11.1605224609375, -10.77392578125, -10.3873291015625, -10.000732421875, -9.6141357421875, -9.2275390625, -8.8409423828125, -8.454345703125, -8.0677490234375, -7.68115234375, -7.2945556640625, -6.907958984375, -6.5213623046875, -6.134765625, -5.7481689453125, -5.361572265625, -4.9749755859375, -4.58837890625, -4.2017822265625, -3.815185546875, -3.4285888671875, -3.0419921875, -2.6553955078125, -2.268798828125, -1.8822021484375, -1.49560546875, -1.1090087890625, -0.722412109375, -0.3358154296875, 0.05078125, 0.4373779296875, 0.823974609375, 1.2105712890625, 1.59716796875, 1.9837646484375, 2.370361328125, 2.7569580078125, 3.1435546875, 3.5301513671875, 3.916748046875, 4.3033447265625, 4.68994140625, 5.0765380859375, 5.463134765625, 5.8497314453125, 6.236328125, 6.6229248046875, 7.009521484375, 7.3961181640625, 7.78271484375, 8.1693115234375, 8.555908203125, 8.9425048828125, 9.3291015625, 9.7156982421875, 10.102294921875, 10.4888916015625, 10.87548828125, 11.2620849609375, 11.648681640625, 12.0352783203125, 12.421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 7.0, 6.0, 10.0, 21.0, 21.0, 36.0, 48.0, 67.0, 74.0, 114.0, 109.0, 107.0, 98.0, 76.0, 72.0, 54.0, 26.0, 28.0, 10.0, 8.0, 7.0, 9.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.484375, -15.763916015625, -15.04345703125, -14.322998046875, -13.6025390625, -12.882080078125, -12.16162109375, -11.441162109375, -10.720703125, -10.000244140625, -9.27978515625, -8.559326171875, -7.8388671875, -7.118408203125, -6.39794921875, -5.677490234375, -4.95703125, -4.236572265625, -3.51611328125, -2.795654296875, -2.0751953125, -1.354736328125, -0.63427734375, 0.086181640625, 0.806640625, 1.527099609375, 2.24755859375, 2.968017578125, 3.6884765625, 4.408935546875, 5.12939453125, 5.849853515625, 6.5703125, 7.290771484375, 8.01123046875, 8.731689453125, 9.4521484375, 10.172607421875, 10.89306640625, 11.613525390625, 12.333984375, 13.054443359375, 13.77490234375, 14.495361328125, 15.2158203125, 15.936279296875, 16.65673828125, 17.377197265625, 18.09765625, 18.818115234375, 19.53857421875, 20.259033203125, 20.9794921875, 21.699951171875, 22.42041015625, 23.140869140625, 23.861328125, 24.581787109375, 25.30224609375, 26.022705078125, 26.7431640625, 27.463623046875, 28.18408203125, 28.904541015625, 29.625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 14.0, 7.0, 16.0, 17.0, 36.0, 79.0, 123.0, 245.0, 781.0, 3413.0, 35880.0, 928791.0, 72393.0, 5046.0, 1028.0, 314.0, 149.0, 69.0, 46.0, 26.0, 18.0, 15.0, 8.0, 4.0, 5.0, 6.0, 6.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.078125, -3.956756591796875, -3.83538818359375, -3.714019775390625, -3.5926513671875, -3.471282958984375, -3.34991455078125, -3.228546142578125, -3.107177734375, -2.985809326171875, -2.86444091796875, -2.743072509765625, -2.6217041015625, -2.500335693359375, -2.37896728515625, -2.257598876953125, -2.13623046875, -2.014862060546875, -1.89349365234375, -1.772125244140625, -1.6507568359375, -1.529388427734375, -1.40802001953125, -1.286651611328125, -1.165283203125, -1.043914794921875, -0.92254638671875, -0.801177978515625, -0.6798095703125, -0.558441162109375, -0.43707275390625, -0.315704345703125, -0.1943359375, -0.072967529296875, 0.04840087890625, 0.169769287109375, 0.2911376953125, 0.412506103515625, 0.53387451171875, 0.655242919921875, 0.776611328125, 0.897979736328125, 1.01934814453125, 1.140716552734375, 1.2620849609375, 1.383453369140625, 1.50482177734375, 1.626190185546875, 1.74755859375, 1.868927001953125, 1.99029541015625, 2.111663818359375, 2.2330322265625, 2.354400634765625, 2.47576904296875, 2.597137451171875, 2.718505859375, 2.839874267578125, 2.96124267578125, 3.082611083984375, 3.2039794921875, 3.325347900390625, 3.44671630859375, 3.568084716796875, 3.689453125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 3.0, 5.0, 5.0, 12.0, 13.0, 15.0, 15.0, 39.0, 61.0, 83.0, 131.0, 168.0, 141.0, 98.0, 53.0, 45.0, 29.0, 23.0, 16.0, 10.0, 6.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00042366981506347656, -0.00041301921010017395, -0.00040236860513687134, -0.0003917180001735687, -0.0003810673952102661, -0.0003704167902469635, -0.0003597661852836609, -0.0003491155803203583, -0.00033846497535705566, -0.00032781437039375305, -0.00031716376543045044, -0.00030651316046714783, -0.0002958625555038452, -0.0002852119505405426, -0.00027456134557724, -0.0002639107406139374, -0.00025326013565063477, -0.00024260953068733215, -0.00023195892572402954, -0.00022130832076072693, -0.00021065771579742432, -0.0002000071108341217, -0.0001893565058708191, -0.00017870590090751648, -0.00016805529594421387, -0.00015740469098091125, -0.00014675408601760864, -0.00013610348105430603, -0.00012545287609100342, -0.0001148022711277008, -0.0001041516661643982, -9.350106120109558e-05, -8.285045623779297e-05, -7.219985127449036e-05, -6.154924631118774e-05, -5.089864134788513e-05, -4.024803638458252e-05, -2.9597431421279907e-05, -1.8946826457977295e-05, -8.296221494674683e-06, 2.3543834686279297e-06, 1.3004988431930542e-05, 2.3655593395233154e-05, 3.4306198358535767e-05, 4.495680332183838e-05, 5.560740828514099e-05, 6.62580132484436e-05, 7.690861821174622e-05, 8.755922317504883e-05, 9.820982813835144e-05, 0.00010886043310165405, 0.00011951103806495667, 0.00013016164302825928, 0.0001408122479915619, 0.0001514628529548645, 0.00016211345791816711, 0.00017276406288146973, 0.00018341466784477234, 0.00019406527280807495, 0.00020471587777137756, 0.00021536648273468018, 0.0002260170876979828, 0.0002366676926612854, 0.000247318297624588, 0.0002579689025878906]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 5.0, 1.0, 3.0, 6.0, 6.0, 9.0, 6.0, 9.0, 25.0, 25.0, 31.0, 54.0, 94.0, 137.0, 225.0, 455.0, 1015.0, 2460.0, 8382.0, 56525.0, 775435.0, 179849.0, 17096.0, 3909.0, 1398.0, 599.0, 271.0, 167.0, 104.0, 77.0, 42.0, 38.0, 19.0, 25.0, 17.0, 10.0, 9.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.744140625, -2.66729736328125, -2.5904541015625, -2.51361083984375, -2.436767578125, -2.35992431640625, -2.2830810546875, -2.20623779296875, -2.12939453125, -2.05255126953125, -1.9757080078125, -1.89886474609375, -1.822021484375, -1.74517822265625, -1.6683349609375, -1.59149169921875, -1.5146484375, -1.43780517578125, -1.3609619140625, -1.28411865234375, -1.207275390625, -1.13043212890625, -1.0535888671875, -0.97674560546875, -0.89990234375, -0.82305908203125, -0.7462158203125, -0.66937255859375, -0.592529296875, -0.51568603515625, -0.4388427734375, -0.36199951171875, -0.28515625, -0.20831298828125, -0.1314697265625, -0.05462646484375, 0.022216796875, 0.09906005859375, 0.1759033203125, 0.25274658203125, 0.32958984375, 0.40643310546875, 0.4832763671875, 0.56011962890625, 0.636962890625, 0.71380615234375, 0.7906494140625, 0.86749267578125, 0.9443359375, 1.02117919921875, 1.0980224609375, 1.17486572265625, 1.251708984375, 1.32855224609375, 1.4053955078125, 1.48223876953125, 1.55908203125, 1.63592529296875, 1.7127685546875, 1.78961181640625, 1.866455078125, 1.94329833984375, 2.0201416015625, 2.09698486328125, 2.173828125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 5.0, 17.0, 12.0, 12.0, 27.0, 27.0, 29.0, 36.0, 52.0, 52.0, 71.0, 78.0, 86.0, 90.0, 65.0, 69.0, 42.0, 41.0, 32.0, 27.0, 24.0, 18.0, 20.0, 10.0, 14.0, 4.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.044921875, -1.98590087890625, -1.9268798828125, -1.86785888671875, -1.808837890625, -1.74981689453125, -1.6907958984375, -1.63177490234375, -1.57275390625, -1.51373291015625, -1.4547119140625, -1.39569091796875, -1.336669921875, -1.27764892578125, -1.2186279296875, -1.15960693359375, -1.1005859375, -1.04156494140625, -0.9825439453125, -0.92352294921875, -0.864501953125, -0.80548095703125, -0.7464599609375, -0.68743896484375, -0.62841796875, -0.56939697265625, -0.5103759765625, -0.45135498046875, -0.392333984375, -0.33331298828125, -0.2742919921875, -0.21527099609375, -0.15625, -0.09722900390625, -0.0382080078125, 0.02081298828125, 0.079833984375, 0.13885498046875, 0.1978759765625, 0.25689697265625, 0.31591796875, 0.37493896484375, 0.4339599609375, 0.49298095703125, 0.552001953125, 0.61102294921875, 0.6700439453125, 0.72906494140625, 0.7880859375, 0.84710693359375, 0.9061279296875, 0.96514892578125, 1.024169921875, 1.08319091796875, 1.1422119140625, 1.20123291015625, 1.26025390625, 1.31927490234375, 1.3782958984375, 1.43731689453125, 1.496337890625, 1.55535888671875, 1.6143798828125, 1.67340087890625, 1.732421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 29.0, 156.0, 594.0, 168.0, 37.0, 7.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.571998596191406, -44.29484939575195, -40.017696380615234, -35.74054718017578, -31.463396072387695, -27.18624496459961, -22.909095764160156, -18.63194465637207, -14.354793548583984, -10.077642440795898, -5.800492286682129, -1.5233421325683594, 2.7538089752197266, 7.0309600830078125, 11.308109283447266, 15.585260391235352, 19.862411499023438, 24.139562606811523, 28.41671371459961, 32.69386291503906, 36.97101593017578, 41.248165130615234, 45.52531433105469, 49.802467346191406, 54.07961654663086, 58.35676574707031, 62.63391876220703, 66.91107177734375, 71.18821716308594, 75.46537017822266, 79.74252319335938, 84.01966857910156, 88.29682922363281, 92.57398223876953, 96.85112762451172, 101.12828063964844, 105.40543365478516, 109.68258666992188, 113.95973205566406, 118.23688507080078, 122.5140380859375, 126.79119110107422, 131.06834411621094, 135.34548950195312, 139.6226348876953, 143.89979553222656, 148.17694091796875, 152.45408630371094, 156.73123168945312, 161.0083770751953, 165.28553771972656, 169.56268310546875, 173.83982849121094, 178.1169891357422, 182.39413452148438, 186.67127990722656, 190.9484405517578, 195.2255859375, 199.50274658203125, 203.77989196777344, 208.05703735351562, 212.33419799804688, 216.61134338378906, 220.88848876953125, 225.1656494140625]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 7.0, 13.0, 12.0, 25.0, 26.0, 37.0, 35.0, 51.0, 51.0, 61.0, 78.0, 87.0, 89.0, 87.0, 53.0, 53.0, 57.0, 43.0, 31.0, 30.0, 22.0, 17.0, 12.0, 5.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.364501953125, -78.12635803222656, -75.88821411132812, -73.65007019042969, -71.41192626953125, -69.17378234863281, -66.93563842773438, -64.69750213623047, -62.45935821533203, -60.221214294433594, -57.983070373535156, -55.74492645263672, -53.50678634643555, -51.26864242553711, -49.03049850463867, -46.792354583740234, -44.5542106628418, -42.31606674194336, -40.07792282104492, -37.83978271484375, -35.60163879394531, -33.363494873046875, -31.125350952148438, -28.88720703125, -26.649065017700195, -24.410921096801758, -22.172779083251953, -19.934635162353516, -17.696491241455078, -15.458349227905273, -13.220205307006836, -10.982062339782715, -8.743919372558594, -6.505776405334473, -4.267632961273193, -2.029489517211914, 0.20865345001220703, 2.446796417236328, 4.684940338134766, 6.923083305358887, 9.161226272583008, 11.399369239807129, 13.63751220703125, 15.875656127929688, 18.113800048828125, 20.35194206237793, 22.590085983276367, 24.828227996826172, 27.06637191772461, 29.304515838623047, 31.54265785217285, 33.780799865722656, 36.018943786621094, 38.25708770751953, 40.49523162841797, 42.733375549316406, 44.971519470214844, 47.20966339111328, 49.44780731201172, 51.685951232910156, 53.92409133911133, 56.162235260009766, 58.4003791809082, 60.63852310180664, 62.87666320800781]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 3.0, 6.0, 6.0, 13.0, 21.0, 19.0, 30.0, 55.0, 83.0, 117.0, 219.0, 470.0, 976.0, 2348.0, 5781.0, 19803.0, 185796.0, 3316025.0, 608068.0, 38834.0, 9233.0, 3658.0, 1452.0, 604.0, 282.0, 140.0, 96.0, 54.0, 40.0, 16.0, 15.0, 10.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.44921875, -5.315277099609375, -5.18133544921875, -5.047393798828125, -4.9134521484375, -4.779510498046875, -4.64556884765625, -4.511627197265625, -4.377685546875, -4.243743896484375, -4.10980224609375, -3.975860595703125, -3.8419189453125, -3.707977294921875, -3.57403564453125, -3.440093994140625, -3.30615234375, -3.172210693359375, -3.03826904296875, -2.904327392578125, -2.7703857421875, -2.636444091796875, -2.50250244140625, -2.368560791015625, -2.234619140625, -2.100677490234375, -1.96673583984375, -1.832794189453125, -1.6988525390625, -1.564910888671875, -1.43096923828125, -1.297027587890625, -1.1630859375, -1.029144287109375, -0.89520263671875, -0.761260986328125, -0.6273193359375, -0.493377685546875, -0.35943603515625, -0.225494384765625, -0.091552734375, 0.042388916015625, 0.17633056640625, 0.310272216796875, 0.4442138671875, 0.578155517578125, 0.71209716796875, 0.846038818359375, 0.97998046875, 1.113922119140625, 1.24786376953125, 1.381805419921875, 1.5157470703125, 1.649688720703125, 1.78363037109375, 1.917572021484375, 2.051513671875, 2.185455322265625, 2.31939697265625, 2.453338623046875, 2.5872802734375, 2.721221923828125, 2.85516357421875, 2.989105224609375, 3.123046875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 13.0, 14.0, 28.0, 27.0, 26.0, 42.0, 57.0, 61.0, 74.0, 72.0, 71.0, 72.0, 70.0, 77.0, 72.0, 53.0, 44.0, 38.0, 36.0, 9.0, 16.0, 6.0, 9.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0], "bins": [-5.83984375, -5.713043212890625, -5.58624267578125, -5.459442138671875, -5.3326416015625, -5.205841064453125, -5.07904052734375, -4.952239990234375, -4.825439453125, -4.698638916015625, -4.57183837890625, -4.445037841796875, -4.3182373046875, -4.191436767578125, -4.06463623046875, -3.937835693359375, -3.81103515625, -3.684234619140625, -3.55743408203125, -3.430633544921875, -3.3038330078125, -3.177032470703125, -3.05023193359375, -2.923431396484375, -2.796630859375, -2.669830322265625, -2.54302978515625, -2.416229248046875, -2.2894287109375, -2.162628173828125, -2.03582763671875, -1.909027099609375, -1.7822265625, -1.655426025390625, -1.52862548828125, -1.401824951171875, -1.2750244140625, -1.148223876953125, -1.02142333984375, -0.894622802734375, -0.767822265625, -0.641021728515625, -0.51422119140625, -0.387420654296875, -0.2606201171875, -0.133819580078125, -0.00701904296875, 0.119781494140625, 0.24658203125, 0.373382568359375, 0.50018310546875, 0.626983642578125, 0.7537841796875, 0.880584716796875, 1.00738525390625, 1.134185791015625, 1.260986328125, 1.387786865234375, 1.51458740234375, 1.641387939453125, 1.7681884765625, 1.894989013671875, 2.02178955078125, 2.148590087890625, 2.275390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 9.0, 4.0, 8.0, 9.0, 12.0, 23.0, 31.0, 43.0, 114.0, 220.0, 640.0, 1967.0, 9382.0, 108312.0, 4013312.0, 52378.0, 5723.0, 1299.0, 435.0, 170.0, 78.0, 43.0, 20.0, 14.0, 12.0, 11.0, 7.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.859375, -10.5435791015625, -10.227783203125, -9.9119873046875, -9.59619140625, -9.2803955078125, -8.964599609375, -8.6488037109375, -8.3330078125, -8.0172119140625, -7.701416015625, -7.3856201171875, -7.06982421875, -6.7540283203125, -6.438232421875, -6.1224365234375, -5.806640625, -5.4908447265625, -5.175048828125, -4.8592529296875, -4.54345703125, -4.2276611328125, -3.911865234375, -3.5960693359375, -3.2802734375, -2.9644775390625, -2.648681640625, -2.3328857421875, -2.01708984375, -1.7012939453125, -1.385498046875, -1.0697021484375, -0.75390625, -0.4381103515625, -0.122314453125, 0.1934814453125, 0.50927734375, 0.8250732421875, 1.140869140625, 1.4566650390625, 1.7724609375, 2.0882568359375, 2.404052734375, 2.7198486328125, 3.03564453125, 3.3514404296875, 3.667236328125, 3.9830322265625, 4.298828125, 4.6146240234375, 4.930419921875, 5.2462158203125, 5.56201171875, 5.8778076171875, 6.193603515625, 6.5093994140625, 6.8251953125, 7.1409912109375, 7.456787109375, 7.7725830078125, 8.08837890625, 8.4041748046875, 8.719970703125, 9.0357666015625, 9.3515625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 2.0, 2.0, 9.0, 6.0, 8.0, 6.0, 15.0, 9.0, 13.0, 33.0, 41.0, 58.0, 86.0, 214.0, 560.0, 1224.0, 978.0, 388.0, 139.0, 69.0, 42.0, 32.0, 33.0, 28.0, 15.0, 11.0, 9.0, 4.0, 4.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.30859375, -6.1220703125, -5.935546875, -5.7490234375, -5.5625, -5.3759765625, -5.189453125, -5.0029296875, -4.81640625, -4.6298828125, -4.443359375, -4.2568359375, -4.0703125, -3.8837890625, -3.697265625, -3.5107421875, -3.32421875, -3.1376953125, -2.951171875, -2.7646484375, -2.578125, -2.3916015625, -2.205078125, -2.0185546875, -1.83203125, -1.6455078125, -1.458984375, -1.2724609375, -1.0859375, -0.8994140625, -0.712890625, -0.5263671875, -0.33984375, -0.1533203125, 0.033203125, 0.2197265625, 0.40625, 0.5927734375, 0.779296875, 0.9658203125, 1.15234375, 1.3388671875, 1.525390625, 1.7119140625, 1.8984375, 2.0849609375, 2.271484375, 2.4580078125, 2.64453125, 2.8310546875, 3.017578125, 3.2041015625, 3.390625, 3.5771484375, 3.763671875, 3.9501953125, 4.13671875, 4.3232421875, 4.509765625, 4.6962890625, 4.8828125, 5.0693359375, 5.255859375, 5.4423828125, 5.62890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 9.0, 11.0, 34.0, 63.0, 175.0, 380.0, 219.0, 73.0, 25.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.22975158691406, -105.90928649902344, -103.58881378173828, -101.26834106445312, -98.9478759765625, -96.62741088867188, -94.30693817138672, -91.98646545410156, -89.66600036621094, -87.34553527832031, -85.02506256103516, -82.70458984375, -80.38412475585938, -78.06365966796875, -75.7431869506836, -73.42271423339844, -71.10224914550781, -68.78178405761719, -66.46131134033203, -64.14083862304688, -61.82037353515625, -59.49990463256836, -57.17943572998047, -54.85896682739258, -52.53849792480469, -50.2180290222168, -47.897560119628906, -45.577091217041016, -43.256622314453125, -40.936153411865234, -38.615684509277344, -36.29521560668945, -33.97475051879883, -31.654281616210938, -29.333812713623047, -27.013343811035156, -24.692874908447266, -22.372406005859375, -20.051937103271484, -17.731468200683594, -15.410999298095703, -13.090530395507812, -10.770061492919922, -8.449592590332031, -6.129123687744141, -3.80865478515625, -1.4881858825683594, 0.8322830200195312, 3.152751922607422, 5.4732208251953125, 7.793689727783203, 10.114158630371094, 12.434627532958984, 14.755096435546875, 17.075565338134766, 19.396034240722656, 21.716503143310547, 24.036972045898438, 26.357440948486328, 28.67790985107422, 30.99837875366211, 33.31884765625, 35.63931655883789, 37.95978546142578, 40.28025436401367]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 5.0, 5.0, 10.0, 12.0, 9.0, 17.0, 23.0, 19.0, 43.0, 38.0, 50.0, 52.0, 50.0, 72.0, 72.0, 51.0, 65.0, 53.0, 68.0, 54.0, 34.0, 42.0, 30.0, 25.0, 22.0, 19.0, 9.0, 18.0, 11.0, 7.0, 7.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.516937255859375, -22.50958824157715, -21.502241134643555, -20.494892120361328, -19.487545013427734, -18.480195999145508, -17.47284698486328, -16.465499877929688, -15.458151817321777, -14.450803756713867, -13.443455696105957, -12.436107635498047, -11.42875862121582, -10.421411514282227, -9.4140625, -8.40671443939209, -7.39936637878418, -6.3920183181762695, -5.384670257568359, -4.377321720123291, -3.369973659515381, -2.3626255989074707, -1.3552770614624023, -0.3479290008544922, 0.659419059753418, 1.6667672395706177, 2.6741154193878174, 3.6814637184143066, 4.688811779022217, 5.696159839630127, 6.703508377075195, 7.7108564376831055, 8.718204498291016, 9.725552558898926, 10.732900619506836, 11.740249633789062, 12.747596740722656, 13.754945755004883, 14.762293815612793, 15.769641876220703, 16.776988983154297, 17.784337997436523, 18.791685104370117, 19.799034118652344, 20.806381225585938, 21.813730239868164, 22.82107925415039, 23.828426361083984, 24.83577537536621, 25.843124389648438, 26.85047149658203, 27.857820510864258, 28.86516761779785, 29.872516632080078, 30.879863739013672, 31.8872127532959, 32.894561767578125, 33.90190887451172, 34.90925979614258, 35.91660690307617, 36.923954010009766, 37.93130111694336, 38.93865203857422, 39.94599914550781, 40.953346252441406]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 18.0, 18.0, 25.0, 36.0, 48.0, 60.0, 84.0, 109.0, 176.0, 280.0, 464.0, 709.0, 1200.0, 2166.0, 3887.0, 7362.0, 14148.0, 29520.0, 67191.0, 163588.0, 330653.0, 241782.0, 100400.0, 42805.0, 19809.0, 9854.0, 5179.0, 2842.0, 1559.0, 945.0, 570.0, 338.0, 225.0, 141.0, 115.0, 67.0, 66.0, 28.0, 24.0, 15.0, 15.0, 5.0, 9.0, 1.0, 9.0, 1.0, 0.0, 2.0, 2.0, 1.0], "bins": [-2.68359375, -2.6063232421875, -2.529052734375, -2.4517822265625, -2.37451171875, -2.2972412109375, -2.219970703125, -2.1427001953125, -2.0654296875, -1.9881591796875, -1.910888671875, -1.8336181640625, -1.75634765625, -1.6790771484375, -1.601806640625, -1.5245361328125, -1.447265625, -1.3699951171875, -1.292724609375, -1.2154541015625, -1.13818359375, -1.0609130859375, -0.983642578125, -0.9063720703125, -0.8291015625, -0.7518310546875, -0.674560546875, -0.5972900390625, -0.52001953125, -0.4427490234375, -0.365478515625, -0.2882080078125, -0.2109375, -0.1336669921875, -0.056396484375, 0.0208740234375, 0.09814453125, 0.1754150390625, 0.252685546875, 0.3299560546875, 0.4072265625, 0.4844970703125, 0.561767578125, 0.6390380859375, 0.71630859375, 0.7935791015625, 0.870849609375, 0.9481201171875, 1.025390625, 1.1026611328125, 1.179931640625, 1.2572021484375, 1.33447265625, 1.4117431640625, 1.489013671875, 1.5662841796875, 1.6435546875, 1.7208251953125, 1.798095703125, 1.8753662109375, 1.95263671875, 2.0299072265625, 2.107177734375, 2.1844482421875, 2.26171875]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 6.0, 5.0, 2.0, 3.0, 12.0, 8.0, 14.0, 14.0, 6.0, 22.0, 22.0, 20.0, 35.0, 25.0, 38.0, 32.0, 33.0, 43.0, 44.0, 40.0, 50.0, 41.0, 54.0, 34.0, 55.0, 45.0, 48.0, 43.0, 34.0, 25.0, 27.0, 29.0, 17.0, 14.0, 23.0, 12.0, 7.0, 6.0, 10.0, 4.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.524078369140625, -2.44659423828125, -2.369110107421875, -2.2916259765625, -2.214141845703125, -2.13665771484375, -2.059173583984375, -1.981689453125, -1.904205322265625, -1.82672119140625, -1.749237060546875, -1.6717529296875, -1.594268798828125, -1.51678466796875, -1.439300537109375, -1.36181640625, -1.284332275390625, -1.20684814453125, -1.129364013671875, -1.0518798828125, -0.974395751953125, -0.89691162109375, -0.819427490234375, -0.741943359375, -0.664459228515625, -0.58697509765625, -0.509490966796875, -0.4320068359375, -0.354522705078125, -0.27703857421875, -0.199554443359375, -0.1220703125, -0.044586181640625, 0.03289794921875, 0.110382080078125, 0.1878662109375, 0.265350341796875, 0.34283447265625, 0.420318603515625, 0.497802734375, 0.575286865234375, 0.65277099609375, 0.730255126953125, 0.8077392578125, 0.885223388671875, 0.96270751953125, 1.040191650390625, 1.11767578125, 1.195159912109375, 1.27264404296875, 1.350128173828125, 1.4276123046875, 1.505096435546875, 1.58258056640625, 1.660064697265625, 1.737548828125, 1.815032958984375, 1.89251708984375, 1.970001220703125, 2.0474853515625, 2.124969482421875, 2.20245361328125, 2.279937744140625, 2.357421875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 10.0, 12.0, 7.0, 9.0, 24.0, 25.0, 29.0, 45.0, 52.0, 82.0, 104.0, 159.0, 217.0, 317.0, 438.0, 653.0, 1116.0, 2666.0, 10656.0, 111091.0, 840115.0, 67500.0, 8048.0, 2179.0, 987.0, 607.0, 380.0, 294.0, 179.0, 150.0, 109.0, 79.0, 65.0, 35.0, 33.0, 24.0, 12.0, 13.0, 5.0, 12.0, 3.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0859375, -7.820068359375, -7.55419921875, -7.288330078125, -7.0224609375, -6.756591796875, -6.49072265625, -6.224853515625, -5.958984375, -5.693115234375, -5.42724609375, -5.161376953125, -4.8955078125, -4.629638671875, -4.36376953125, -4.097900390625, -3.83203125, -3.566162109375, -3.30029296875, -3.034423828125, -2.7685546875, -2.502685546875, -2.23681640625, -1.970947265625, -1.705078125, -1.439208984375, -1.17333984375, -0.907470703125, -0.6416015625, -0.375732421875, -0.10986328125, 0.156005859375, 0.421875, 0.687744140625, 0.95361328125, 1.219482421875, 1.4853515625, 1.751220703125, 2.01708984375, 2.282958984375, 2.548828125, 2.814697265625, 3.08056640625, 3.346435546875, 3.6123046875, 3.878173828125, 4.14404296875, 4.409912109375, 4.67578125, 4.941650390625, 5.20751953125, 5.473388671875, 5.7392578125, 6.005126953125, 6.27099609375, 6.536865234375, 6.802734375, 7.068603515625, 7.33447265625, 7.600341796875, 7.8662109375, 8.132080078125, 8.39794921875, 8.663818359375, 8.9296875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 1.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 6.0, 10.0, 14.0, 18.0, 20.0, 25.0, 28.0, 28.0, 30.0, 39.0, 47.0, 39.0, 51.0, 53.0, 48.0, 59.0, 50.0, 51.0, 48.0, 56.0, 35.0, 39.0, 33.0, 25.0, 23.0, 25.0, 21.0, 12.0, 13.0, 8.0, 4.0, 5.0, 12.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.6796875, -12.3231201171875, -11.966552734375, -11.6099853515625, -11.25341796875, -10.8968505859375, -10.540283203125, -10.1837158203125, -9.8271484375, -9.4705810546875, -9.114013671875, -8.7574462890625, -8.40087890625, -8.0443115234375, -7.687744140625, -7.3311767578125, -6.974609375, -6.6180419921875, -6.261474609375, -5.9049072265625, -5.54833984375, -5.1917724609375, -4.835205078125, -4.4786376953125, -4.1220703125, -3.7655029296875, -3.408935546875, -3.0523681640625, -2.69580078125, -2.3392333984375, -1.982666015625, -1.6260986328125, -1.26953125, -0.9129638671875, -0.556396484375, -0.1998291015625, 0.15673828125, 0.5133056640625, 0.869873046875, 1.2264404296875, 1.5830078125, 1.9395751953125, 2.296142578125, 2.6527099609375, 3.00927734375, 3.3658447265625, 3.722412109375, 4.0789794921875, 4.435546875, 4.7921142578125, 5.148681640625, 5.5052490234375, 5.86181640625, 6.2183837890625, 6.574951171875, 6.9315185546875, 7.2880859375, 7.6446533203125, 8.001220703125, 8.3577880859375, 8.71435546875, 9.0709228515625, 9.427490234375, 9.7840576171875, 10.140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 8.0, 15.0, 17.0, 21.0, 57.0, 108.0, 200.0, 587.0, 2048.0, 13204.0, 250180.0, 754201.0, 23415.0, 3120.0, 798.0, 304.0, 126.0, 70.0, 31.0, 15.0, 15.0, 6.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.142578125, -3.047698974609375, -2.95281982421875, -2.857940673828125, -2.7630615234375, -2.668182373046875, -2.57330322265625, -2.478424072265625, -2.383544921875, -2.288665771484375, -2.19378662109375, -2.098907470703125, -2.0040283203125, -1.909149169921875, -1.81427001953125, -1.719390869140625, -1.62451171875, -1.529632568359375, -1.43475341796875, -1.339874267578125, -1.2449951171875, -1.150115966796875, -1.05523681640625, -0.960357666015625, -0.865478515625, -0.770599365234375, -0.67572021484375, -0.580841064453125, -0.4859619140625, -0.391082763671875, -0.29620361328125, -0.201324462890625, -0.1064453125, -0.011566162109375, 0.08331298828125, 0.178192138671875, 0.2730712890625, 0.367950439453125, 0.46282958984375, 0.557708740234375, 0.652587890625, 0.747467041015625, 0.84234619140625, 0.937225341796875, 1.0321044921875, 1.126983642578125, 1.22186279296875, 1.316741943359375, 1.41162109375, 1.506500244140625, 1.60137939453125, 1.696258544921875, 1.7911376953125, 1.886016845703125, 1.98089599609375, 2.075775146484375, 2.170654296875, 2.265533447265625, 2.36041259765625, 2.455291748046875, 2.5501708984375, 2.645050048828125, 2.73992919921875, 2.834808349609375, 2.9296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 8.0, 15.0, 13.0, 27.0, 37.0, 43.0, 97.0, 178.0, 202.0, 142.0, 70.0, 46.0, 34.0, 28.0, 17.0, 15.0, 10.0, 2.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0007724761962890625, -0.0007554627954959869, -0.0007384493947029114, -0.0007214359939098358, -0.0007044225931167603, -0.0006874091923236847, -0.0006703957915306091, -0.0006533823907375336, -0.000636368989944458, -0.0006193555891513824, -0.0006023421883583069, -0.0005853287875652313, -0.0005683153867721558, -0.0005513019859790802, -0.0005342885851860046, -0.0005172751843929291, -0.0005002617835998535, -0.00048324838280677795, -0.0004662349820137024, -0.00044922158122062683, -0.00043220818042755127, -0.0004151947796344757, -0.00039818137884140015, -0.0003811679780483246, -0.000364154577255249, -0.00034714117646217346, -0.0003301277756690979, -0.00031311437487602234, -0.0002961009740829468, -0.0002790875732898712, -0.00026207417249679565, -0.0002450607717037201, -0.00022804737091064453, -0.00021103397011756897, -0.0001940205693244934, -0.00017700716853141785, -0.00015999376773834229, -0.00014298036694526672, -0.00012596696615219116, -0.0001089535653591156, -9.194016456604004e-05, -7.492676377296448e-05, -5.7913362979888916e-05, -4.0899962186813354e-05, -2.3886561393737793e-05, -6.8731606006622314e-06, 1.014024019241333e-05, 2.715364098548889e-05, 4.416704177856445e-05, 6.118044257164001e-05, 7.819384336471558e-05, 9.520724415779114e-05, 0.0001122206449508667, 0.00012923404574394226, 0.00014624744653701782, 0.00016326084733009338, 0.00018027424812316895, 0.0001972876489162445, 0.00021430104970932007, 0.00023131445050239563, 0.0002483278512954712, 0.00026534125208854675, 0.0002823546528816223, 0.0002993680536746979, 0.00031638145446777344]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 9.0, 10.0, 14.0, 6.0, 26.0, 22.0, 37.0, 87.0, 77.0, 120.0, 161.0, 324.0, 566.0, 1122.0, 2865.0, 10519.0, 77504.0, 819816.0, 115360.0, 13569.0, 3407.0, 1331.0, 614.0, 360.0, 167.0, 152.0, 89.0, 52.0, 46.0, 28.0, 21.0, 21.0, 6.0, 10.0, 11.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.490234375, -2.4239654541015625, -2.357696533203125, -2.2914276123046875, -2.22515869140625, -2.1588897705078125, -2.092620849609375, -2.0263519287109375, -1.9600830078125, -1.8938140869140625, -1.827545166015625, -1.7612762451171875, -1.69500732421875, -1.6287384033203125, -1.562469482421875, -1.4962005615234375, -1.429931640625, -1.3636627197265625, -1.297393798828125, -1.2311248779296875, -1.16485595703125, -1.0985870361328125, -1.032318115234375, -0.9660491943359375, -0.8997802734375, -0.8335113525390625, -0.767242431640625, -0.7009735107421875, -0.63470458984375, -0.5684356689453125, -0.502166748046875, -0.4358978271484375, -0.36962890625, -0.3033599853515625, -0.237091064453125, -0.1708221435546875, -0.10455322265625, -0.0382843017578125, 0.027984619140625, 0.0942535400390625, 0.1605224609375, 0.2267913818359375, 0.293060302734375, 0.3593292236328125, 0.42559814453125, 0.4918670654296875, 0.558135986328125, 0.6244049072265625, 0.690673828125, 0.7569427490234375, 0.823211669921875, 0.8894805908203125, 0.95574951171875, 1.0220184326171875, 1.088287353515625, 1.1545562744140625, 1.2208251953125, 1.2870941162109375, 1.353363037109375, 1.4196319580078125, 1.48590087890625, 1.5521697998046875, 1.618438720703125, 1.6847076416015625, 1.7509765625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 4.0, 4.0, 8.0, 9.0, 4.0, 12.0, 13.0, 19.0, 23.0, 33.0, 21.0, 36.0, 44.0, 63.0, 58.0, 79.0, 77.0, 75.0, 74.0, 67.0, 53.0, 38.0, 40.0, 30.0, 17.0, 21.0, 9.0, 17.0, 8.0, 10.0, 9.0, 5.0, 5.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8720703125, -1.8163909912109375, -1.760711669921875, -1.7050323486328125, -1.64935302734375, -1.5936737060546875, -1.537994384765625, -1.4823150634765625, -1.4266357421875, -1.3709564208984375, -1.315277099609375, -1.2595977783203125, -1.20391845703125, -1.1482391357421875, -1.092559814453125, -1.0368804931640625, -0.981201171875, -0.9255218505859375, -0.869842529296875, -0.8141632080078125, -0.75848388671875, -0.7028045654296875, -0.647125244140625, -0.5914459228515625, -0.5357666015625, -0.4800872802734375, -0.424407958984375, -0.3687286376953125, -0.31304931640625, -0.2573699951171875, -0.201690673828125, -0.1460113525390625, -0.09033203125, -0.0346527099609375, 0.021026611328125, 0.0767059326171875, 0.13238525390625, 0.1880645751953125, 0.243743896484375, 0.2994232177734375, 0.3551025390625, 0.4107818603515625, 0.466461181640625, 0.5221405029296875, 0.57781982421875, 0.6334991455078125, 0.689178466796875, 0.7448577880859375, 0.800537109375, 0.8562164306640625, 0.911895751953125, 0.9675750732421875, 1.02325439453125, 1.0789337158203125, 1.134613037109375, 1.1902923583984375, 1.2459716796875, 1.3016510009765625, 1.357330322265625, 1.4130096435546875, 1.46868896484375, 1.5243682861328125, 1.580047607421875, 1.6357269287109375, 1.69140625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 7.0, 2.0, 1.0, 4.0, 9.0, 18.0, 39.0, 96.0, 213.0, 393.0, 146.0, 49.0, 21.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-104.24934387207031, -101.89994812011719, -99.55055236816406, -97.20115661621094, -94.85176086425781, -92.50237274169922, -90.1529769897461, -87.80358123779297, -85.45418548583984, -83.10478973388672, -80.7553939819336, -78.40599822998047, -76.05661010742188, -73.70721435546875, -71.35781860351562, -69.0084228515625, -66.65902709960938, -64.30963134765625, -61.960235595703125, -59.610843658447266, -57.26144790649414, -54.912052154541016, -52.562660217285156, -50.21326446533203, -47.863868713378906, -45.51447296142578, -43.165077209472656, -40.8156852722168, -38.46628952026367, -36.11689376831055, -33.76750183105469, -31.418106079101562, -29.06871795654297, -26.719322204589844, -24.36992835998535, -22.02053451538086, -19.671138763427734, -17.32174301147461, -14.972349166870117, -12.622955322265625, -10.2735595703125, -7.924164772033691, -5.574769973754883, -3.225375175476074, -0.8759803771972656, 1.473414421081543, 3.8228092193603516, 6.172203063964844, 8.521598815917969, 10.870993614196777, 13.220388412475586, 15.569783210754395, 17.919178009033203, 20.268573760986328, 22.61796760559082, 24.967361450195312, 27.316757202148438, 29.666152954101562, 32.01554870605469, 34.36494064331055, 36.71433639526367, 39.0637321472168, 41.413124084472656, 43.76251983642578, 46.111915588378906]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 6.0, 7.0, 10.0, 7.0, 13.0, 21.0, 22.0, 21.0, 17.0, 23.0, 28.0, 31.0, 29.0, 41.0, 36.0, 45.0, 46.0, 87.0, 62.0, 70.0, 44.0, 35.0, 27.0, 39.0, 28.0, 27.0, 28.0, 27.0, 19.0, 11.0, 21.0, 12.0, 9.0, 7.0, 5.0, 3.0, 9.0, 5.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-41.66759490966797, -40.36654281616211, -39.06549072265625, -37.764434814453125, -36.463382720947266, -35.162330627441406, -33.86127853393555, -32.56022644042969, -31.259172439575195, -29.958120346069336, -28.657066345214844, -27.356014251708984, -26.054962158203125, -24.753908157348633, -23.452856063842773, -22.15180206298828, -20.850749969482422, -19.549697875976562, -18.24864387512207, -16.94759178161621, -15.646538734436035, -14.34548568725586, -13.04443359375, -11.743380546569824, -10.442327499389648, -9.141274452209473, -7.840221881866455, -6.5391693115234375, -5.238116264343262, -3.937063217163086, -2.6360106468200684, -1.3349580764770508, -0.033901214599609375, 1.2671515941619873, 2.568204402923584, 3.8692572116851807, 5.170310020446777, 6.471363067626953, 7.772415637969971, 9.073468208312988, 10.374521255493164, 11.67557430267334, 12.976627349853516, 14.277679443359375, 15.57873249053955, 16.879785537719727, 18.180837631225586, 19.481891632080078, 20.782943725585938, 22.083995819091797, 23.38504981994629, 24.68610191345215, 25.98715591430664, 27.2882080078125, 28.58926010131836, 29.89031219482422, 31.19136619567871, 32.4924201965332, 33.79347229003906, 35.09452438354492, 36.39557647705078, 37.696632385253906, 38.997684478759766, 40.298736572265625, 41.599788665771484]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 4.0, 9.0, 15.0, 11.0, 17.0, 26.0, 49.0, 38.0, 65.0, 98.0, 110.0, 150.0, 185.0, 302.0, 466.0, 687.0, 1165.0, 2221.0, 4368.0, 10617.0, 39666.0, 229933.0, 1908455.0, 1721703.0, 217115.0, 37598.0, 9783.0, 4026.0, 2074.0, 1141.0, 729.0, 400.0, 297.0, 186.0, 130.0, 118.0, 82.0, 65.0, 40.0, 37.0, 26.0, 18.0, 15.0, 16.0, 9.0, 9.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.275390625, -2.201934814453125, -2.12847900390625, -2.055023193359375, -1.9815673828125, -1.908111572265625, -1.83465576171875, -1.761199951171875, -1.687744140625, -1.614288330078125, -1.54083251953125, -1.467376708984375, -1.3939208984375, -1.320465087890625, -1.24700927734375, -1.173553466796875, -1.10009765625, -1.026641845703125, -0.95318603515625, -0.879730224609375, -0.8062744140625, -0.732818603515625, -0.65936279296875, -0.585906982421875, -0.512451171875, -0.438995361328125, -0.36553955078125, -0.292083740234375, -0.2186279296875, -0.145172119140625, -0.07171630859375, 0.001739501953125, 0.0751953125, 0.148651123046875, 0.22210693359375, 0.295562744140625, 0.3690185546875, 0.442474365234375, 0.51593017578125, 0.589385986328125, 0.662841796875, 0.736297607421875, 0.80975341796875, 0.883209228515625, 0.9566650390625, 1.030120849609375, 1.10357666015625, 1.177032470703125, 1.25048828125, 1.323944091796875, 1.39739990234375, 1.470855712890625, 1.5443115234375, 1.617767333984375, 1.69122314453125, 1.764678955078125, 1.838134765625, 1.911590576171875, 1.98504638671875, 2.058502197265625, 2.1319580078125, 2.205413818359375, 2.27886962890625, 2.352325439453125, 2.42578125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 10.0, 12.0, 7.0, 15.0, 20.0, 26.0, 26.0, 33.0, 38.0, 36.0, 36.0, 52.0, 63.0, 46.0, 64.0, 66.0, 59.0, 58.0, 53.0, 44.0, 37.0, 35.0, 46.0, 22.0, 18.0, 13.0, 17.0, 16.0, 11.0, 12.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.177734375, -2.09381103515625, -2.0098876953125, -1.92596435546875, -1.842041015625, -1.75811767578125, -1.6741943359375, -1.59027099609375, -1.50634765625, -1.42242431640625, -1.3385009765625, -1.25457763671875, -1.170654296875, -1.08673095703125, -1.0028076171875, -0.91888427734375, -0.8349609375, -0.75103759765625, -0.6671142578125, -0.58319091796875, -0.499267578125, -0.41534423828125, -0.3314208984375, -0.24749755859375, -0.16357421875, -0.07965087890625, 0.0042724609375, 0.08819580078125, 0.172119140625, 0.25604248046875, 0.3399658203125, 0.42388916015625, 0.5078125, 0.59173583984375, 0.6756591796875, 0.75958251953125, 0.843505859375, 0.92742919921875, 1.0113525390625, 1.09527587890625, 1.17919921875, 1.26312255859375, 1.3470458984375, 1.43096923828125, 1.514892578125, 1.59881591796875, 1.6827392578125, 1.76666259765625, 1.8505859375, 1.93450927734375, 2.0184326171875, 2.10235595703125, 2.186279296875, 2.27020263671875, 2.3541259765625, 2.43804931640625, 2.52197265625, 2.60589599609375, 2.6898193359375, 2.77374267578125, 2.857666015625, 2.94158935546875, 3.0255126953125, 3.10943603515625, 3.193359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 5.0, 12.0, 10.0, 30.0, 44.0, 56.0, 121.0, 261.0, 529.0, 1341.0, 4761.0, 45941.0, 4003990.0, 125818.0, 8080.0, 1747.0, 705.0, 315.0, 207.0, 98.0, 58.0, 52.0, 32.0, 15.0, 15.0, 12.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.94140625, -6.65972900390625, -6.3780517578125, -6.09637451171875, -5.814697265625, -5.53302001953125, -5.2513427734375, -4.96966552734375, -4.68798828125, -4.40631103515625, -4.1246337890625, -3.84295654296875, -3.561279296875, -3.27960205078125, -2.9979248046875, -2.71624755859375, -2.4345703125, -2.15289306640625, -1.8712158203125, -1.58953857421875, -1.307861328125, -1.02618408203125, -0.7445068359375, -0.46282958984375, -0.18115234375, 0.10052490234375, 0.3822021484375, 0.66387939453125, 0.945556640625, 1.22723388671875, 1.5089111328125, 1.79058837890625, 2.072265625, 2.35394287109375, 2.6356201171875, 2.91729736328125, 3.198974609375, 3.48065185546875, 3.7623291015625, 4.04400634765625, 4.32568359375, 4.60736083984375, 4.8890380859375, 5.17071533203125, 5.452392578125, 5.73406982421875, 6.0157470703125, 6.29742431640625, 6.5791015625, 6.86077880859375, 7.1424560546875, 7.42413330078125, 7.705810546875, 7.98748779296875, 8.2691650390625, 8.55084228515625, 8.83251953125, 9.11419677734375, 9.3958740234375, 9.67755126953125, 9.959228515625, 10.24090576171875, 10.5225830078125, 10.80426025390625, 11.0859375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 19.0, 19.0, 34.0, 78.0, 136.0, 544.0, 1962.0, 919.0, 185.0, 64.0, 38.0, 26.0, 13.0, 16.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8203125, -8.5123291015625, -8.204345703125, -7.8963623046875, -7.58837890625, -7.2803955078125, -6.972412109375, -6.6644287109375, -6.3564453125, -6.0484619140625, -5.740478515625, -5.4324951171875, -5.12451171875, -4.8165283203125, -4.508544921875, -4.2005615234375, -3.892578125, -3.5845947265625, -3.276611328125, -2.9686279296875, -2.66064453125, -2.3526611328125, -2.044677734375, -1.7366943359375, -1.4287109375, -1.1207275390625, -0.812744140625, -0.5047607421875, -0.19677734375, 0.1112060546875, 0.419189453125, 0.7271728515625, 1.03515625, 1.3431396484375, 1.651123046875, 1.9591064453125, 2.26708984375, 2.5750732421875, 2.883056640625, 3.1910400390625, 3.4990234375, 3.8070068359375, 4.114990234375, 4.4229736328125, 4.73095703125, 5.0389404296875, 5.346923828125, 5.6549072265625, 5.962890625, 6.2708740234375, 6.578857421875, 6.8868408203125, 7.19482421875, 7.5028076171875, 7.810791015625, 8.1187744140625, 8.4267578125, 8.7347412109375, 9.042724609375, 9.3507080078125, 9.65869140625, 9.9666748046875, 10.274658203125, 10.5826416015625, 10.890625]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 5.0, 8.0, 23.0, 53.0, 175.0, 322.0, 267.0, 96.0, 28.0, 12.0, 3.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-67.02936553955078, -65.0513687133789, -63.0733642578125, -61.09536361694336, -59.11736297607422, -57.13936233520508, -55.16136169433594, -53.18336486816406, -51.205360412597656, -49.227359771728516, -47.249359130859375, -45.271358489990234, -43.293357849121094, -41.31535720825195, -39.33735656738281, -37.35935974121094, -35.3813591003418, -33.403358459472656, -31.425357818603516, -29.447357177734375, -27.469356536865234, -25.491355895996094, -23.513357162475586, -21.535356521606445, -19.557355880737305, -17.579355239868164, -15.601354598999023, -13.6233549118042, -11.645354270935059, -9.667353630065918, -7.689353942871094, -5.711353302001953, -3.733348846435547, -1.7553484439849854, 0.22265195846557617, 2.2006521224975586, 4.178652763366699, 6.15665340423584, 8.134653091430664, 10.112653732299805, 12.090654373168945, 14.068655014038086, 16.046655654907227, 18.024654388427734, 20.002655029296875, 21.980655670166016, 23.958656311035156, 25.936656951904297, 27.914657592773438, 29.892658233642578, 31.87065887451172, 33.84865951538086, 35.82666015625, 37.80466079711914, 39.78266143798828, 41.760658264160156, 43.73866271972656, 45.7166633605957, 47.694664001464844, 49.672664642333984, 51.650665283203125, 53.628665924072266, 55.606666564941406, 57.58466339111328, 59.56266403198242]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 7.0, 2.0, 2.0, 8.0, 16.0, 10.0, 11.0, 17.0, 24.0, 18.0, 38.0, 25.0, 36.0, 45.0, 35.0, 56.0, 48.0, 44.0, 47.0, 45.0, 52.0, 60.0, 41.0, 28.0, 40.0, 47.0, 29.0, 25.0, 23.0, 28.0, 18.0, 13.0, 16.0, 16.0, 8.0, 7.0, 4.0, 4.0, 6.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.314449310302734, -22.59934425354004, -21.884241104125977, -21.16913604736328, -20.45403289794922, -19.738927841186523, -19.023822784423828, -18.308719635009766, -17.59361457824707, -16.878509521484375, -16.163406372070312, -15.448301315307617, -14.733197212219238, -14.01809310913086, -13.302988052368164, -12.587883949279785, -11.872779846191406, -11.157675743103027, -10.442571640014648, -9.727466583251953, -9.012362480163574, -8.297258377075195, -7.582153797149658, -6.867049217224121, -6.151945114135742, -5.436841011047363, -4.721736431121826, -4.006631851196289, -3.29152774810791, -2.576423406600952, -1.8613190650939941, -1.146214485168457, -0.4311103820800781, 0.2839939594268799, 0.9990983009338379, 1.714202642440796, 2.429306983947754, 3.144411325454712, 3.85951566696167, 4.574620246887207, 5.289724349975586, 6.004828453063965, 6.719933032989502, 7.435037612915039, 8.150141716003418, 8.865245819091797, 9.580350875854492, 10.295454978942871, 11.01055908203125, 11.725663185119629, 12.440767288208008, 13.155872344970703, 13.870976448059082, 14.586080551147461, 15.301185607910156, 16.01628875732422, 16.731393814086914, 17.44649887084961, 18.161602020263672, 18.876707077026367, 19.591812133789062, 20.306915283203125, 21.02202033996582, 21.737125396728516, 22.452228546142578]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 9.0, 11.0, 7.0, 7.0, 20.0, 39.0, 43.0, 78.0, 99.0, 141.0, 206.0, 311.0, 450.0, 665.0, 1088.0, 1704.0, 2717.0, 4793.0, 8983.0, 18398.0, 41313.0, 105249.0, 292736.0, 343680.0, 130103.0, 49712.0, 21614.0, 10455.0, 5541.0, 3044.0, 1849.0, 1180.0, 730.0, 526.0, 330.0, 222.0, 165.0, 86.0, 74.0, 52.0, 47.0, 26.0, 24.0, 13.0, 7.0, 4.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.04296875, -2.9510498046875, -2.859130859375, -2.7672119140625, -2.67529296875, -2.5833740234375, -2.491455078125, -2.3995361328125, -2.3076171875, -2.2156982421875, -2.123779296875, -2.0318603515625, -1.93994140625, -1.8480224609375, -1.756103515625, -1.6641845703125, -1.572265625, -1.4803466796875, -1.388427734375, -1.2965087890625, -1.20458984375, -1.1126708984375, -1.020751953125, -0.9288330078125, -0.8369140625, -0.7449951171875, -0.653076171875, -0.5611572265625, -0.46923828125, -0.3773193359375, -0.285400390625, -0.1934814453125, -0.1015625, -0.0096435546875, 0.082275390625, 0.1741943359375, 0.26611328125, 0.3580322265625, 0.449951171875, 0.5418701171875, 0.6337890625, 0.7257080078125, 0.817626953125, 0.9095458984375, 1.00146484375, 1.0933837890625, 1.185302734375, 1.2772216796875, 1.369140625, 1.4610595703125, 1.552978515625, 1.6448974609375, 1.73681640625, 1.8287353515625, 1.920654296875, 2.0125732421875, 2.1044921875, 2.1964111328125, 2.288330078125, 2.3802490234375, 2.47216796875, 2.5640869140625, 2.656005859375, 2.7479248046875, 2.83984375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 14.0, 6.0, 9.0, 13.0, 15.0, 14.0, 11.0, 18.0, 28.0, 31.0, 29.0, 31.0, 32.0, 34.0, 38.0, 39.0, 43.0, 42.0, 37.0, 42.0, 46.0, 35.0, 36.0, 43.0, 33.0, 37.0, 37.0, 24.0, 23.0, 18.0, 21.0, 16.0, 15.0, 16.0, 11.0, 13.0, 6.0, 7.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.0859375, -2.0243988037109375, -1.962860107421875, -1.9013214111328125, -1.83978271484375, -1.7782440185546875, -1.716705322265625, -1.6551666259765625, -1.5936279296875, -1.5320892333984375, -1.470550537109375, -1.4090118408203125, -1.34747314453125, -1.2859344482421875, -1.224395751953125, -1.1628570556640625, -1.101318359375, -1.0397796630859375, -0.978240966796875, -0.9167022705078125, -0.85516357421875, -0.7936248779296875, -0.732086181640625, -0.6705474853515625, -0.6090087890625, -0.5474700927734375, -0.485931396484375, -0.4243927001953125, -0.36285400390625, -0.3013153076171875, -0.239776611328125, -0.1782379150390625, -0.11669921875, -0.0551605224609375, 0.006378173828125, 0.0679168701171875, 0.12945556640625, 0.1909942626953125, 0.252532958984375, 0.3140716552734375, 0.3756103515625, 0.4371490478515625, 0.498687744140625, 0.5602264404296875, 0.62176513671875, 0.6833038330078125, 0.744842529296875, 0.8063812255859375, 0.867919921875, 0.9294586181640625, 0.990997314453125, 1.0525360107421875, 1.11407470703125, 1.1756134033203125, 1.237152099609375, 1.2986907958984375, 1.3602294921875, 1.4217681884765625, 1.483306884765625, 1.5448455810546875, 1.60638427734375, 1.6679229736328125, 1.729461669921875, 1.7910003662109375, 1.8525390625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 2.0, 13.0, 14.0, 17.0, 37.0, 40.0, 52.0, 91.0, 166.0, 245.0, 388.0, 622.0, 1172.0, 3225.0, 15422.0, 276710.0, 718270.0, 24328.0, 4349.0, 1467.0, 662.0, 441.0, 257.0, 195.0, 105.0, 76.0, 73.0, 33.0, 26.0, 18.0, 10.0, 9.0, 4.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.40625, -12.0806884765625, -11.755126953125, -11.4295654296875, -11.10400390625, -10.7784423828125, -10.452880859375, -10.1273193359375, -9.8017578125, -9.4761962890625, -9.150634765625, -8.8250732421875, -8.49951171875, -8.1739501953125, -7.848388671875, -7.5228271484375, -7.197265625, -6.8717041015625, -6.546142578125, -6.2205810546875, -5.89501953125, -5.5694580078125, -5.243896484375, -4.9183349609375, -4.5927734375, -4.2672119140625, -3.941650390625, -3.6160888671875, -3.29052734375, -2.9649658203125, -2.639404296875, -2.3138427734375, -1.98828125, -1.6627197265625, -1.337158203125, -1.0115966796875, -0.68603515625, -0.3604736328125, -0.034912109375, 0.2906494140625, 0.6162109375, 0.9417724609375, 1.267333984375, 1.5928955078125, 1.91845703125, 2.2440185546875, 2.569580078125, 2.8951416015625, 3.220703125, 3.5462646484375, 3.871826171875, 4.1973876953125, 4.52294921875, 4.8485107421875, 5.174072265625, 5.4996337890625, 5.8251953125, 6.1507568359375, 6.476318359375, 6.8018798828125, 7.12744140625, 7.4530029296875, 7.778564453125, 8.1041259765625, 8.4296875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 5.0, 5.0, 1.0, 7.0, 18.0, 10.0, 13.0, 24.0, 23.0, 34.0, 32.0, 37.0, 41.0, 58.0, 44.0, 50.0, 52.0, 59.0, 49.0, 45.0, 64.0, 31.0, 40.0, 55.0, 38.0, 30.0, 23.0, 23.0, 23.0, 18.0, 13.0, 9.0, 6.0, 8.0, 2.0, 6.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5390625, -9.2264404296875, -8.913818359375, -8.6011962890625, -8.28857421875, -7.9759521484375, -7.663330078125, -7.3507080078125, -7.0380859375, -6.7254638671875, -6.412841796875, -6.1002197265625, -5.78759765625, -5.4749755859375, -5.162353515625, -4.8497314453125, -4.537109375, -4.2244873046875, -3.911865234375, -3.5992431640625, -3.28662109375, -2.9739990234375, -2.661376953125, -2.3487548828125, -2.0361328125, -1.7235107421875, -1.410888671875, -1.0982666015625, -0.78564453125, -0.4730224609375, -0.160400390625, 0.1522216796875, 0.46484375, 0.7774658203125, 1.090087890625, 1.4027099609375, 1.71533203125, 2.0279541015625, 2.340576171875, 2.6531982421875, 2.9658203125, 3.2784423828125, 3.591064453125, 3.9036865234375, 4.21630859375, 4.5289306640625, 4.841552734375, 5.1541748046875, 5.466796875, 5.7794189453125, 6.092041015625, 6.4046630859375, 6.71728515625, 7.0299072265625, 7.342529296875, 7.6551513671875, 7.9677734375, 8.2803955078125, 8.593017578125, 8.9056396484375, 9.21826171875, 9.5308837890625, 9.843505859375, 10.1561279296875, 10.46875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 11.0, 5.0, 6.0, 8.0, 10.0, 17.0, 16.0, 21.0, 30.0, 41.0, 89.0, 147.0, 254.0, 696.0, 1848.0, 6453.0, 36541.0, 712886.0, 261128.0, 21321.0, 4548.0, 1336.0, 537.0, 232.0, 125.0, 81.0, 39.0, 23.0, 18.0, 16.0, 14.0, 10.0, 5.0, 4.0, 5.0, 5.0, 5.0, 2.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-2.53125, -2.458648681640625, -2.38604736328125, -2.313446044921875, -2.2408447265625, -2.168243408203125, -2.09564208984375, -2.023040771484375, -1.950439453125, -1.877838134765625, -1.80523681640625, -1.732635498046875, -1.6600341796875, -1.587432861328125, -1.51483154296875, -1.442230224609375, -1.36962890625, -1.297027587890625, -1.22442626953125, -1.151824951171875, -1.0792236328125, -1.006622314453125, -0.93402099609375, -0.861419677734375, -0.788818359375, -0.716217041015625, -0.64361572265625, -0.571014404296875, -0.4984130859375, -0.425811767578125, -0.35321044921875, -0.280609130859375, -0.2080078125, -0.135406494140625, -0.06280517578125, 0.009796142578125, 0.0823974609375, 0.154998779296875, 0.22760009765625, 0.300201416015625, 0.372802734375, 0.445404052734375, 0.51800537109375, 0.590606689453125, 0.6632080078125, 0.735809326171875, 0.80841064453125, 0.881011962890625, 0.95361328125, 1.026214599609375, 1.09881591796875, 1.171417236328125, 1.2440185546875, 1.316619873046875, 1.38922119140625, 1.461822509765625, 1.534423828125, 1.607025146484375, 1.67962646484375, 1.752227783203125, 1.8248291015625, 1.897430419921875, 1.97003173828125, 2.042633056640625, 2.115234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 9.0, 7.0, 6.0, 13.0, 8.0, 21.0, 28.0, 39.0, 47.0, 86.0, 132.0, 165.0, 141.0, 90.0, 55.0, 49.0, 17.0, 24.0, 11.0, 10.0, 15.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0004911422729492188, -0.000477377325296402, -0.0004636123776435852, -0.00044984742999076843, -0.00043608248233795166, -0.0004223175346851349, -0.0004085525870323181, -0.00039478763937950134, -0.00038102269172668457, -0.0003672577440738678, -0.000353492796421051, -0.00033972784876823425, -0.0003259629011154175, -0.0003121979534626007, -0.00029843300580978394, -0.00028466805815696716, -0.0002709031105041504, -0.0002571381628513336, -0.00024337321519851685, -0.00022960826754570007, -0.0002158433198928833, -0.00020207837224006653, -0.00018831342458724976, -0.00017454847693443298, -0.0001607835292816162, -0.00014701858162879944, -0.00013325363397598267, -0.0001194886863231659, -0.00010572373867034912, -9.195879101753235e-05, -7.819384336471558e-05, -6.44288957118988e-05, -5.066394805908203e-05, -3.689900040626526e-05, -2.3134052753448486e-05, -9.369105100631714e-06, 4.395842552185059e-06, 1.816079020500183e-05, 3.1925737857818604e-05, 4.5690685510635376e-05, 5.945563316345215e-05, 7.322058081626892e-05, 8.69855284690857e-05, 0.00010075047612190247, 0.00011451542377471924, 0.000128280371427536, 0.00014204531908035278, 0.00015581026673316956, 0.00016957521438598633, 0.0001833401620388031, 0.00019710510969161987, 0.00021087005734443665, 0.00022463500499725342, 0.0002383999526500702, 0.00025216490030288696, 0.00026592984795570374, 0.0002796947956085205, 0.0002934597432613373, 0.00030722469091415405, 0.0003209896385669708, 0.0003347545862197876, 0.00034851953387260437, 0.00036228448152542114, 0.0003760494291782379, 0.0003898143768310547]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 7.0, 4.0, 5.0, 10.0, 12.0, 23.0, 35.0, 54.0, 78.0, 162.0, 379.0, 1024.0, 4208.0, 47216.0, 944927.0, 44560.0, 4029.0, 1053.0, 373.0, 183.0, 76.0, 46.0, 26.0, 19.0, 15.0, 11.0, 3.0, 4.0, 3.0, 0.0, 4.0, 1.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.0078125, -2.898406982421875, -2.78900146484375, -2.679595947265625, -2.5701904296875, -2.460784912109375, -2.35137939453125, -2.241973876953125, -2.132568359375, -2.023162841796875, -1.91375732421875, -1.804351806640625, -1.6949462890625, -1.585540771484375, -1.47613525390625, -1.366729736328125, -1.25732421875, -1.147918701171875, -1.03851318359375, -0.929107666015625, -0.8197021484375, -0.710296630859375, -0.60089111328125, -0.491485595703125, -0.382080078125, -0.272674560546875, -0.16326904296875, -0.053863525390625, 0.0555419921875, 0.164947509765625, 0.27435302734375, 0.383758544921875, 0.4931640625, 0.602569580078125, 0.71197509765625, 0.821380615234375, 0.9307861328125, 1.040191650390625, 1.14959716796875, 1.259002685546875, 1.368408203125, 1.477813720703125, 1.58721923828125, 1.696624755859375, 1.8060302734375, 1.915435791015625, 2.02484130859375, 2.134246826171875, 2.24365234375, 2.353057861328125, 2.46246337890625, 2.571868896484375, 2.6812744140625, 2.790679931640625, 2.90008544921875, 3.009490966796875, 3.118896484375, 3.228302001953125, 3.33770751953125, 3.447113037109375, 3.5565185546875, 3.665924072265625, 3.77532958984375, 3.884735107421875, 3.994140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 8.0, 9.0, 9.0, 13.0, 16.0, 23.0, 37.0, 58.0, 62.0, 78.0, 113.0, 99.0, 87.0, 96.0, 72.0, 69.0, 47.0, 22.0, 26.0, 16.0, 13.0, 8.0, 3.0, 9.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84765625, -1.784027099609375, -1.72039794921875, -1.656768798828125, -1.5931396484375, -1.529510498046875, -1.46588134765625, -1.402252197265625, -1.338623046875, -1.274993896484375, -1.21136474609375, -1.147735595703125, -1.0841064453125, -1.020477294921875, -0.95684814453125, -0.893218994140625, -0.82958984375, -0.765960693359375, -0.70233154296875, -0.638702392578125, -0.5750732421875, -0.511444091796875, -0.44781494140625, -0.384185791015625, -0.320556640625, -0.256927490234375, -0.19329833984375, -0.129669189453125, -0.0660400390625, -0.002410888671875, 0.06121826171875, 0.124847412109375, 0.1884765625, 0.252105712890625, 0.31573486328125, 0.379364013671875, 0.4429931640625, 0.506622314453125, 0.57025146484375, 0.633880615234375, 0.697509765625, 0.761138916015625, 0.82476806640625, 0.888397216796875, 0.9520263671875, 1.015655517578125, 1.07928466796875, 1.142913818359375, 1.20654296875, 1.270172119140625, 1.33380126953125, 1.397430419921875, 1.4610595703125, 1.524688720703125, 1.58831787109375, 1.651947021484375, 1.715576171875, 1.779205322265625, 1.84283447265625, 1.906463623046875, 1.9700927734375, 2.033721923828125, 2.09735107421875, 2.160980224609375, 2.224609375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 15.0, 19.0, 53.0, 135.0, 314.0, 253.0, 118.0, 55.0, 15.0, 16.0, 8.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.48570251464844, -93.44749450683594, -91.40928649902344, -89.37107849121094, -87.3328628540039, -85.2946548461914, -83.2564468383789, -81.2182388305664, -79.1800308227539, -77.1418228149414, -75.1036148071289, -73.06539916992188, -71.02719116210938, -68.98898315429688, -66.95077514648438, -64.91256713867188, -62.87435531616211, -60.83614730834961, -58.797935485839844, -56.759727478027344, -54.721519470214844, -52.683311462402344, -50.64509963989258, -48.60689163208008, -46.56867980957031, -44.53047180175781, -42.49225997924805, -40.45405197143555, -38.41584396362305, -36.37763214111328, -34.33942413330078, -32.30121612548828, -30.26300811767578, -28.22479820251465, -26.18659019470215, -24.148380279541016, -22.110172271728516, -20.071962356567383, -18.03375244140625, -15.995543479919434, -13.957334518432617, -11.9191255569458, -9.880916595458984, -7.842706680297852, -5.804497718811035, -3.7662887573242188, -1.728078842163086, 0.31013011932373047, 2.348339080810547, 4.386548042297363, 6.424757480621338, 8.462966918945312, 10.501175880432129, 12.539384841918945, 14.577594757080078, 16.615802764892578, 18.65401268005371, 20.692222595214844, 22.730430603027344, 24.768640518188477, 26.80685043334961, 28.84505844116211, 30.883268356323242, 32.921478271484375, 34.959686279296875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 5.0, 3.0, 5.0, 4.0, 4.0, 10.0, 5.0, 14.0, 17.0, 17.0, 23.0, 18.0, 28.0, 24.0, 18.0, 23.0, 30.0, 27.0, 39.0, 43.0, 51.0, 70.0, 62.0, 60.0, 65.0, 40.0, 33.0, 27.0, 32.0, 30.0, 25.0, 25.0, 32.0, 18.0, 16.0, 16.0, 9.0, 12.0, 14.0, 5.0, 6.0, 4.0, 4.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-42.14063262939453, -41.03972625732422, -39.93881607055664, -38.83790588378906, -37.73699951171875, -36.63609313964844, -35.53518295288086, -34.43427276611328, -33.33336639404297, -32.232460021972656, -31.131549835205078, -30.030641555786133, -28.929733276367188, -27.828824996948242, -26.727916717529297, -25.62700843811035, -24.526100158691406, -23.42519187927246, -22.324283599853516, -21.22337532043457, -20.122467041015625, -19.02155876159668, -17.920650482177734, -16.81974220275879, -15.718833923339844, -14.617925643920898, -13.517017364501953, -12.416109085083008, -11.315200805664062, -10.214292526245117, -9.113384246826172, -8.012475967407227, -6.911571502685547, -5.810663223266602, -4.709754943847656, -3.608846664428711, -2.5079383850097656, -1.4070301055908203, -0.306121826171875, 0.7947864532470703, 1.8956947326660156, 2.996603012084961, 4.097511291503906, 5.198419570922852, 6.299327850341797, 7.400236129760742, 8.501144409179688, 9.602052688598633, 10.702960968017578, 11.803869247436523, 12.904777526855469, 14.005685806274414, 15.10659408569336, 16.207502365112305, 17.30841064453125, 18.409318923950195, 19.51022720336914, 20.611135482788086, 21.71204376220703, 22.812952041625977, 23.913860321044922, 25.014768600463867, 26.115676879882812, 27.216585159301758, 28.317493438720703]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 7.0, 7.0, 11.0, 10.0, 13.0, 15.0, 27.0, 53.0, 59.0, 92.0, 136.0, 168.0, 278.0, 420.0, 581.0, 1110.0, 1988.0, 4219.0, 10944.0, 57172.0, 583740.0, 2982275.0, 481912.0, 50001.0, 10367.0, 3802.0, 1856.0, 1076.0, 607.0, 406.0, 258.0, 198.0, 140.0, 98.0, 63.0, 48.0, 24.0, 23.0, 19.0, 14.0, 12.0, 9.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.65625, -2.569061279296875, -2.48187255859375, -2.394683837890625, -2.3074951171875, -2.220306396484375, -2.13311767578125, -2.045928955078125, -1.958740234375, -1.871551513671875, -1.78436279296875, -1.697174072265625, -1.6099853515625, -1.522796630859375, -1.43560791015625, -1.348419189453125, -1.26123046875, -1.174041748046875, -1.08685302734375, -0.999664306640625, -0.9124755859375, -0.825286865234375, -0.73809814453125, -0.650909423828125, -0.563720703125, -0.476531982421875, -0.38934326171875, -0.302154541015625, -0.2149658203125, -0.127777099609375, -0.04058837890625, 0.046600341796875, 0.1337890625, 0.220977783203125, 0.30816650390625, 0.395355224609375, 0.4825439453125, 0.569732666015625, 0.65692138671875, 0.744110107421875, 0.831298828125, 0.918487548828125, 1.00567626953125, 1.092864990234375, 1.1800537109375, 1.267242431640625, 1.35443115234375, 1.441619873046875, 1.52880859375, 1.615997314453125, 1.70318603515625, 1.790374755859375, 1.8775634765625, 1.964752197265625, 2.05194091796875, 2.139129638671875, 2.226318359375, 2.313507080078125, 2.40069580078125, 2.487884521484375, 2.5750732421875, 2.662261962890625, 2.74945068359375, 2.836639404296875, 2.923828125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 7.0, 8.0, 8.0, 7.0, 12.0, 11.0, 10.0, 9.0, 19.0, 18.0, 22.0, 21.0, 18.0, 29.0, 38.0, 36.0, 38.0, 40.0, 44.0, 42.0, 56.0, 43.0, 34.0, 40.0, 40.0, 44.0, 33.0, 37.0, 35.0, 20.0, 23.0, 20.0, 19.0, 30.0, 11.0, 21.0, 12.0, 7.0, 10.0, 10.0, 13.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-2.044921875, -1.9871978759765625, -1.929473876953125, -1.8717498779296875, -1.81402587890625, -1.7563018798828125, -1.698577880859375, -1.6408538818359375, -1.5831298828125, -1.5254058837890625, -1.467681884765625, -1.4099578857421875, -1.35223388671875, -1.2945098876953125, -1.236785888671875, -1.1790618896484375, -1.121337890625, -1.0636138916015625, -1.005889892578125, -0.9481658935546875, -0.89044189453125, -0.8327178955078125, -0.774993896484375, -0.7172698974609375, -0.6595458984375, -0.6018218994140625, -0.544097900390625, -0.4863739013671875, -0.42864990234375, -0.3709259033203125, -0.313201904296875, -0.2554779052734375, -0.19775390625, -0.1400299072265625, -0.082305908203125, -0.0245819091796875, 0.03314208984375, 0.0908660888671875, 0.148590087890625, 0.2063140869140625, 0.2640380859375, 0.3217620849609375, 0.379486083984375, 0.4372100830078125, 0.49493408203125, 0.5526580810546875, 0.610382080078125, 0.6681060791015625, 0.725830078125, 0.7835540771484375, 0.841278076171875, 0.8990020751953125, 0.95672607421875, 1.0144500732421875, 1.072174072265625, 1.1298980712890625, 1.1876220703125, 1.2453460693359375, 1.303070068359375, 1.3607940673828125, 1.41851806640625, 1.4762420654296875, 1.533966064453125, 1.5916900634765625, 1.6494140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 3.0, 6.0, 16.0, 15.0, 31.0, 42.0, 93.0, 147.0, 341.0, 789.0, 2153.0, 8058.0, 71334.0, 4018471.0, 80266.0, 8740.0, 2220.0, 785.0, 369.0, 166.0, 93.0, 38.0, 28.0, 23.0, 8.0, 11.0, 8.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-9.3203125, -9.0650634765625, -8.809814453125, -8.5545654296875, -8.29931640625, -8.0440673828125, -7.788818359375, -7.5335693359375, -7.2783203125, -7.0230712890625, -6.767822265625, -6.5125732421875, -6.25732421875, -6.0020751953125, -5.746826171875, -5.4915771484375, -5.236328125, -4.9810791015625, -4.725830078125, -4.4705810546875, -4.21533203125, -3.9600830078125, -3.704833984375, -3.4495849609375, -3.1943359375, -2.9390869140625, -2.683837890625, -2.4285888671875, -2.17333984375, -1.9180908203125, -1.662841796875, -1.4075927734375, -1.15234375, -0.8970947265625, -0.641845703125, -0.3865966796875, -0.13134765625, 0.1239013671875, 0.379150390625, 0.6343994140625, 0.8896484375, 1.1448974609375, 1.400146484375, 1.6553955078125, 1.91064453125, 2.1658935546875, 2.421142578125, 2.6763916015625, 2.931640625, 3.1868896484375, 3.442138671875, 3.6973876953125, 3.95263671875, 4.2078857421875, 4.463134765625, 4.7183837890625, 4.9736328125, 5.2288818359375, 5.484130859375, 5.7393798828125, 5.99462890625, 6.2498779296875, 6.505126953125, 6.7603759765625, 7.015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 7.0, 3.0, 3.0, 2.0, 10.0, 7.0, 10.0, 18.0, 32.0, 38.0, 75.0, 201.0, 574.0, 1329.0, 1079.0, 363.0, 139.0, 65.0, 36.0, 23.0, 16.0, 12.0, 8.0, 10.0, 2.0, 3.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.8828125, -6.6905517578125, -6.498291015625, -6.3060302734375, -6.11376953125, -5.9215087890625, -5.729248046875, -5.5369873046875, -5.3447265625, -5.1524658203125, -4.960205078125, -4.7679443359375, -4.57568359375, -4.3834228515625, -4.191162109375, -3.9989013671875, -3.806640625, -3.6143798828125, -3.422119140625, -3.2298583984375, -3.03759765625, -2.8453369140625, -2.653076171875, -2.4608154296875, -2.2685546875, -2.0762939453125, -1.884033203125, -1.6917724609375, -1.49951171875, -1.3072509765625, -1.114990234375, -0.9227294921875, -0.73046875, -0.5382080078125, -0.345947265625, -0.1536865234375, 0.03857421875, 0.2308349609375, 0.423095703125, 0.6153564453125, 0.8076171875, 0.9998779296875, 1.192138671875, 1.3843994140625, 1.57666015625, 1.7689208984375, 1.961181640625, 2.1534423828125, 2.345703125, 2.5379638671875, 2.730224609375, 2.9224853515625, 3.11474609375, 3.3070068359375, 3.499267578125, 3.6915283203125, 3.8837890625, 4.0760498046875, 4.268310546875, 4.4605712890625, 4.65283203125, 4.8450927734375, 5.037353515625, 5.2296142578125, 5.421875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 6.0, 13.0, 30.0, 77.0, 185.0, 293.0, 231.0, 94.0, 36.0, 19.0, 10.0, 4.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-81.15202331542969, -79.45350646972656, -77.75498962402344, -76.05647277832031, -74.35795593261719, -72.65943908691406, -70.96092224121094, -69.26241302490234, -67.56389617919922, -65.8653793334961, -64.16686248779297, -62.468345642089844, -60.769832611083984, -59.07131576538086, -57.372798919677734, -55.67428207397461, -53.975765228271484, -52.27724838256836, -50.578731536865234, -48.880218505859375, -47.18170166015625, -45.483184814453125, -43.78466796875, -42.086151123046875, -40.38763427734375, -38.689117431640625, -36.9906005859375, -35.292083740234375, -33.593570709228516, -31.89505386352539, -30.196537017822266, -28.49802017211914, -26.799510955810547, -25.100994110107422, -23.40247917175293, -21.703962326049805, -20.005447387695312, -18.306930541992188, -16.608413696289062, -14.909897804260254, -13.211381912231445, -11.512866020202637, -9.814350128173828, -8.115833282470703, -6.4173173904418945, -4.718801498413086, -3.020284652709961, -1.3217687606811523, 0.37674713134765625, 2.075263261795044, 3.7737793922424316, 5.472295761108398, 7.170811653137207, 8.869327545166016, 10.56784439086914, 12.26636028289795, 13.964876174926758, 15.663392066955566, 17.361907958984375, 19.0604248046875, 20.758941650390625, 22.457456588745117, 24.155973434448242, 25.854488372802734, 27.55300521850586]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 7.0, 5.0, 7.0, 16.0, 18.0, 20.0, 18.0, 22.0, 24.0, 25.0, 34.0, 32.0, 38.0, 49.0, 43.0, 43.0, 51.0, 44.0, 36.0, 43.0, 36.0, 32.0, 33.0, 48.0, 34.0, 31.0, 28.0, 26.0, 18.0, 19.0, 16.0, 18.0, 17.0, 11.0, 7.0, 9.0, 9.0, 5.0, 6.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-16.52326774597168, -16.01232147216797, -15.501375198364258, -14.990428924560547, -14.479482650756836, -13.968536376953125, -13.457590103149414, -12.946643829345703, -12.435697555541992, -11.924751281738281, -11.41380500793457, -10.90285873413086, -10.391912460327148, -9.880966186523438, -9.370019912719727, -8.859073638916016, -8.348127365112305, -7.837181091308594, -7.326234817504883, -6.815288543701172, -6.304342269897461, -5.79339599609375, -5.282449722290039, -4.771503448486328, -4.260557174682617, -3.7496109008789062, -3.2386646270751953, -2.7277183532714844, -2.2167720794677734, -1.7058258056640625, -1.1948795318603516, -0.6839332580566406, -0.1729888916015625, 0.33795738220214844, 0.8489036560058594, 1.3598499298095703, 1.8707962036132812, 2.381742477416992, 2.892688751220703, 3.403635025024414, 3.914581298828125, 4.425527572631836, 4.936473846435547, 5.447420120239258, 5.958366394042969, 6.46931266784668, 6.980258941650391, 7.491205215454102, 8.002151489257812, 8.513097763061523, 9.024044036865234, 9.534990310668945, 10.045936584472656, 10.556882858276367, 11.067829132080078, 11.578775405883789, 12.0897216796875, 12.600667953491211, 13.111614227294922, 13.622560501098633, 14.133506774902344, 14.644453048706055, 15.155399322509766, 15.666345596313477, 16.177291870117188]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 2.0, 14.0, 16.0, 36.0, 27.0, 71.0, 96.0, 126.0, 174.0, 319.0, 459.0, 742.0, 1061.0, 1837.0, 2861.0, 4902.0, 9090.0, 16730.0, 33995.0, 76467.0, 181675.0, 329842.0, 214747.0, 89926.0, 39608.0, 19241.0, 10118.0, 5734.0, 3248.0, 2013.0, 1215.0, 699.0, 554.0, 340.0, 211.0, 117.0, 79.0, 59.0, 32.0, 26.0, 16.0, 9.0, 7.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.078125, -2.012359619140625, -1.94659423828125, -1.880828857421875, -1.8150634765625, -1.749298095703125, -1.68353271484375, -1.617767333984375, -1.552001953125, -1.486236572265625, -1.42047119140625, -1.354705810546875, -1.2889404296875, -1.223175048828125, -1.15740966796875, -1.091644287109375, -1.02587890625, -0.960113525390625, -0.89434814453125, -0.828582763671875, -0.7628173828125, -0.697052001953125, -0.63128662109375, -0.565521240234375, -0.499755859375, -0.433990478515625, -0.36822509765625, -0.302459716796875, -0.2366943359375, -0.170928955078125, -0.10516357421875, -0.039398193359375, 0.0263671875, 0.092132568359375, 0.15789794921875, 0.223663330078125, 0.2894287109375, 0.355194091796875, 0.42095947265625, 0.486724853515625, 0.552490234375, 0.618255615234375, 0.68402099609375, 0.749786376953125, 0.8155517578125, 0.881317138671875, 0.94708251953125, 1.012847900390625, 1.07861328125, 1.144378662109375, 1.21014404296875, 1.275909423828125, 1.3416748046875, 1.407440185546875, 1.47320556640625, 1.538970947265625, 1.604736328125, 1.670501708984375, 1.73626708984375, 1.802032470703125, 1.8677978515625, 1.933563232421875, 1.99932861328125, 2.065093994140625, 2.130859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 4.0, 5.0, 14.0, 14.0, 18.0, 16.0, 17.0, 19.0, 18.0, 26.0, 19.0, 38.0, 29.0, 42.0, 30.0, 41.0, 50.0, 43.0, 51.0, 42.0, 46.0, 40.0, 42.0, 33.0, 41.0, 29.0, 34.0, 22.0, 27.0, 33.0, 21.0, 17.0, 18.0, 5.0, 11.0, 9.0, 10.0, 7.0, 4.0, 7.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.248046875, -2.1855010986328125, -2.122955322265625, -2.0604095458984375, -1.99786376953125, -1.9353179931640625, -1.872772216796875, -1.8102264404296875, -1.7476806640625, -1.6851348876953125, -1.622589111328125, -1.5600433349609375, -1.49749755859375, -1.4349517822265625, -1.372406005859375, -1.3098602294921875, -1.247314453125, -1.1847686767578125, -1.122222900390625, -1.0596771240234375, -0.99713134765625, -0.9345855712890625, -0.872039794921875, -0.8094940185546875, -0.7469482421875, -0.6844024658203125, -0.621856689453125, -0.5593109130859375, -0.49676513671875, -0.4342193603515625, -0.371673583984375, -0.3091278076171875, -0.24658203125, -0.1840362548828125, -0.121490478515625, -0.0589447021484375, 0.00360107421875, 0.0661468505859375, 0.128692626953125, 0.1912384033203125, 0.2537841796875, 0.3163299560546875, 0.378875732421875, 0.4414215087890625, 0.50396728515625, 0.5665130615234375, 0.629058837890625, 0.6916046142578125, 0.754150390625, 0.8166961669921875, 0.879241943359375, 0.9417877197265625, 1.00433349609375, 1.0668792724609375, 1.129425048828125, 1.1919708251953125, 1.2545166015625, 1.3170623779296875, 1.379608154296875, 1.4421539306640625, 1.50469970703125, 1.5672454833984375, 1.629791259765625, 1.6923370361328125, 1.7548828125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 0.0, 4.0, 5.0, 6.0, 11.0, 9.0, 10.0, 15.0, 16.0, 26.0, 27.0, 50.0, 45.0, 64.0, 110.0, 192.0, 322.0, 587.0, 1388.0, 3988.0, 16974.0, 113776.0, 758383.0, 126857.0, 18557.0, 4199.0, 1397.0, 619.0, 312.0, 186.0, 105.0, 88.0, 40.0, 46.0, 27.0, 29.0, 15.0, 17.0, 10.0, 10.0, 5.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-5.58984375, -5.4005126953125, -5.211181640625, -5.0218505859375, -4.83251953125, -4.6431884765625, -4.453857421875, -4.2645263671875, -4.0751953125, -3.8858642578125, -3.696533203125, -3.5072021484375, -3.31787109375, -3.1285400390625, -2.939208984375, -2.7498779296875, -2.560546875, -2.3712158203125, -2.181884765625, -1.9925537109375, -1.80322265625, -1.6138916015625, -1.424560546875, -1.2352294921875, -1.0458984375, -0.8565673828125, -0.667236328125, -0.4779052734375, -0.28857421875, -0.0992431640625, 0.090087890625, 0.2794189453125, 0.46875, 0.6580810546875, 0.847412109375, 1.0367431640625, 1.22607421875, 1.4154052734375, 1.604736328125, 1.7940673828125, 1.9833984375, 2.1727294921875, 2.362060546875, 2.5513916015625, 2.74072265625, 2.9300537109375, 3.119384765625, 3.3087158203125, 3.498046875, 3.6873779296875, 3.876708984375, 4.0660400390625, 4.25537109375, 4.4447021484375, 4.634033203125, 4.8233642578125, 5.0126953125, 5.2020263671875, 5.391357421875, 5.5806884765625, 5.77001953125, 5.9593505859375, 6.148681640625, 6.3380126953125, 6.52734375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 5.0, 4.0, 9.0, 9.0, 7.0, 16.0, 15.0, 17.0, 12.0, 22.0, 17.0, 19.0, 24.0, 24.0, 27.0, 47.0, 32.0, 37.0, 40.0, 41.0, 32.0, 35.0, 35.0, 51.0, 38.0, 36.0, 49.0, 30.0, 34.0, 30.0, 20.0, 21.0, 27.0, 24.0, 16.0, 13.0, 13.0, 17.0, 14.0, 6.0, 13.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0], "bins": [-6.640625, -6.44354248046875, -6.2464599609375, -6.04937744140625, -5.852294921875, -5.65521240234375, -5.4581298828125, -5.26104736328125, -5.06396484375, -4.86688232421875, -4.6697998046875, -4.47271728515625, -4.275634765625, -4.07855224609375, -3.8814697265625, -3.68438720703125, -3.4873046875, -3.29022216796875, -3.0931396484375, -2.89605712890625, -2.698974609375, -2.50189208984375, -2.3048095703125, -2.10772705078125, -1.91064453125, -1.71356201171875, -1.5164794921875, -1.31939697265625, -1.122314453125, -0.92523193359375, -0.7281494140625, -0.53106689453125, -0.333984375, -0.13690185546875, 0.0601806640625, 0.25726318359375, 0.454345703125, 0.65142822265625, 0.8485107421875, 1.04559326171875, 1.24267578125, 1.43975830078125, 1.6368408203125, 1.83392333984375, 2.031005859375, 2.22808837890625, 2.4251708984375, 2.62225341796875, 2.8193359375, 3.01641845703125, 3.2135009765625, 3.41058349609375, 3.607666015625, 3.80474853515625, 4.0018310546875, 4.19891357421875, 4.39599609375, 4.59307861328125, 4.7901611328125, 4.98724365234375, 5.184326171875, 5.38140869140625, 5.5784912109375, 5.77557373046875, 5.97265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 3.0, 7.0, 5.0, 11.0, 10.0, 15.0, 17.0, 23.0, 41.0, 66.0, 80.0, 126.0, 267.0, 412.0, 839.0, 1952.0, 5140.0, 16675.0, 72800.0, 619060.0, 267654.0, 45069.0, 11442.0, 3737.0, 1524.0, 664.0, 340.0, 214.0, 120.0, 74.0, 46.0, 29.0, 22.0, 16.0, 14.0, 6.0, 11.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-1.580078125, -1.5334014892578125, -1.486724853515625, -1.4400482177734375, -1.39337158203125, -1.3466949462890625, -1.300018310546875, -1.2533416748046875, -1.2066650390625, -1.1599884033203125, -1.113311767578125, -1.0666351318359375, -1.01995849609375, -0.9732818603515625, -0.926605224609375, -0.8799285888671875, -0.833251953125, -0.7865753173828125, -0.739898681640625, -0.6932220458984375, -0.64654541015625, -0.5998687744140625, -0.553192138671875, -0.5065155029296875, -0.4598388671875, -0.4131622314453125, -0.366485595703125, -0.3198089599609375, -0.27313232421875, -0.2264556884765625, -0.179779052734375, -0.1331024169921875, -0.08642578125, -0.0397491455078125, 0.006927490234375, 0.0536041259765625, 0.10028076171875, 0.1469573974609375, 0.193634033203125, 0.2403106689453125, 0.2869873046875, 0.3336639404296875, 0.380340576171875, 0.4270172119140625, 0.47369384765625, 0.5203704833984375, 0.567047119140625, 0.6137237548828125, 0.660400390625, 0.7070770263671875, 0.753753662109375, 0.8004302978515625, 0.84710693359375, 0.8937835693359375, 0.940460205078125, 0.9871368408203125, 1.0338134765625, 1.0804901123046875, 1.127166748046875, 1.1738433837890625, 1.22052001953125, 1.2671966552734375, 1.313873291015625, 1.3605499267578125, 1.4072265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 5.0, 22.0, 22.0, 35.0, 53.0, 71.0, 95.0, 148.0, 149.0, 108.0, 73.0, 65.0, 39.0, 31.0, 18.0, 16.0, 12.0, 11.0, 8.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004520416259765625, -0.0004402250051498413, -0.0004284083843231201, -0.0004165917634963989, -0.00040477514266967773, -0.00039295852184295654, -0.00038114190101623535, -0.00036932528018951416, -0.00035750865936279297, -0.0003456920385360718, -0.0003338754177093506, -0.0003220587968826294, -0.0003102421760559082, -0.000298425555229187, -0.0002866089344024658, -0.00027479231357574463, -0.00026297569274902344, -0.00025115907192230225, -0.00023934245109558105, -0.00022752583026885986, -0.00021570920944213867, -0.00020389258861541748, -0.0001920759677886963, -0.0001802593469619751, -0.0001684427261352539, -0.00015662610530853271, -0.00014480948448181152, -0.00013299286365509033, -0.00012117624282836914, -0.00010935962200164795, -9.754300117492676e-05, -8.572638034820557e-05, -7.390975952148438e-05, -6.209313869476318e-05, -5.027651786804199e-05, -3.84598970413208e-05, -2.664327621459961e-05, -1.4826655387878418e-05, -3.0100345611572266e-06, 8.806586265563965e-06, 2.0623207092285156e-05, 3.243982791900635e-05, 4.425644874572754e-05, 5.607306957244873e-05, 6.788969039916992e-05, 7.970631122589111e-05, 9.15229320526123e-05, 0.0001033395528793335, 0.00011515617370605469, 0.00012697279453277588, 0.00013878941535949707, 0.00015060603618621826, 0.00016242265701293945, 0.00017423927783966064, 0.00018605589866638184, 0.00019787251949310303, 0.00020968914031982422, 0.0002215057611465454, 0.0002333223819732666, 0.0002451390027999878, 0.000256955623626709, 0.0002687722444534302, 0.00028058886528015137, 0.00029240548610687256, 0.00030422210693359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 10.0, 12.0, 19.0, 24.0, 35.0, 67.0, 112.0, 164.0, 311.0, 633.0, 1489.0, 4663.0, 19040.0, 149140.0, 779518.0, 75398.0, 12371.0, 3218.0, 1162.0, 509.0, 248.0, 134.0, 91.0, 68.0, 39.0, 19.0, 16.0, 16.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.931640625, -1.863525390625, -1.79541015625, -1.727294921875, -1.6591796875, -1.591064453125, -1.52294921875, -1.454833984375, -1.38671875, -1.318603515625, -1.25048828125, -1.182373046875, -1.1142578125, -1.046142578125, -0.97802734375, -0.909912109375, -0.841796875, -0.773681640625, -0.70556640625, -0.637451171875, -0.5693359375, -0.501220703125, -0.43310546875, -0.364990234375, -0.296875, -0.228759765625, -0.16064453125, -0.092529296875, -0.0244140625, 0.043701171875, 0.11181640625, 0.179931640625, 0.248046875, 0.316162109375, 0.38427734375, 0.452392578125, 0.5205078125, 0.588623046875, 0.65673828125, 0.724853515625, 0.79296875, 0.861083984375, 0.92919921875, 0.997314453125, 1.0654296875, 1.133544921875, 1.20166015625, 1.269775390625, 1.337890625, 1.406005859375, 1.47412109375, 1.542236328125, 1.6103515625, 1.678466796875, 1.74658203125, 1.814697265625, 1.8828125, 1.950927734375, 2.01904296875, 2.087158203125, 2.1552734375, 2.223388671875, 2.29150390625, 2.359619140625, 2.427734375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 7.0, 6.0, 12.0, 14.0, 33.0, 24.0, 35.0, 24.0, 45.0, 54.0, 65.0, 108.0, 101.0, 100.0, 86.0, 65.0, 53.0, 34.0, 29.0, 29.0, 22.0, 11.0, 9.0, 11.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.548828125, -1.4963531494140625, -1.443878173828125, -1.3914031982421875, -1.33892822265625, -1.2864532470703125, -1.233978271484375, -1.1815032958984375, -1.1290283203125, -1.0765533447265625, -1.024078369140625, -0.9716033935546875, -0.91912841796875, -0.8666534423828125, -0.814178466796875, -0.7617034912109375, -0.709228515625, -0.6567535400390625, -0.604278564453125, -0.5518035888671875, -0.49932861328125, -0.4468536376953125, -0.394378662109375, -0.3419036865234375, -0.2894287109375, -0.2369537353515625, -0.184478759765625, -0.1320037841796875, -0.07952880859375, -0.0270538330078125, 0.025421142578125, 0.0778961181640625, 0.13037109375, 0.1828460693359375, 0.235321044921875, 0.2877960205078125, 0.34027099609375, 0.3927459716796875, 0.445220947265625, 0.4976959228515625, 0.5501708984375, 0.6026458740234375, 0.655120849609375, 0.7075958251953125, 0.76007080078125, 0.8125457763671875, 0.865020751953125, 0.9174957275390625, 0.969970703125, 1.0224456787109375, 1.074920654296875, 1.1273956298828125, 1.17987060546875, 1.2323455810546875, 1.284820556640625, 1.3372955322265625, 1.3897705078125, 1.4422454833984375, 1.494720458984375, 1.5471954345703125, 1.59967041015625, 1.6521453857421875, 1.704620361328125, 1.7570953369140625, 1.8095703125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 10.0, 13.0, 21.0, 73.0, 143.0, 341.0, 188.0, 108.0, 43.0, 23.0, 12.0, 9.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.65494155883789, -26.091903686523438, -24.528865814208984, -22.96582794189453, -21.402790069580078, -19.839752197265625, -18.276716232299805, -16.71367835998535, -15.150640487670898, -13.587602615356445, -12.024564743041992, -10.461527824401855, -8.898489952087402, -7.335452079772949, -5.7724151611328125, -4.209377288818359, -2.6463394165039062, -1.0833017826080322, 0.4797358512878418, 2.0427732467651367, 3.60581111907959, 5.168848991394043, 6.73188591003418, 8.294923782348633, 9.857961654663086, 11.420999526977539, 12.984037399291992, 14.547074317932129, 16.110111236572266, 17.67314910888672, 19.236186981201172, 20.799224853515625, 22.362258911132812, 23.925296783447266, 25.48833465576172, 27.051372528076172, 28.614410400390625, 30.177448272705078, 31.7404842376709, 33.30352020263672, 34.86656188964844, 36.42959976196289, 37.992637634277344, 39.5556755065918, 41.11871337890625, 42.6817512512207, 44.244789123535156, 45.807823181152344, 47.3708610534668, 48.93389892578125, 50.4969367980957, 52.059974670410156, 53.62301254272461, 55.18605041503906, 56.74908447265625, 58.31212615966797, 59.875160217285156, 61.43819808959961, 63.00123596191406, 64.56427001953125, 66.12731170654297, 67.69034576416016, 69.25338745117188, 70.81642150878906, 72.37946319580078]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 6.0, 10.0, 9.0, 10.0, 12.0, 13.0, 18.0, 15.0, 14.0, 20.0, 27.0, 27.0, 26.0, 29.0, 43.0, 34.0, 40.0, 48.0, 67.0, 65.0, 75.0, 53.0, 38.0, 30.0, 31.0, 25.0, 29.0, 25.0, 23.0, 20.0, 18.0, 16.0, 10.0, 9.0, 13.0, 10.0, 8.0, 2.0, 8.0, 4.0, 2.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.214447021484375, -22.41911506652832, -21.623783111572266, -20.82845115661621, -20.033119201660156, -19.2377872467041, -18.442455291748047, -17.647123336791992, -16.851791381835938, -16.056459426879883, -15.261127471923828, -14.465795516967773, -13.670463562011719, -12.875131607055664, -12.07979965209961, -11.284467697143555, -10.4891357421875, -9.693803787231445, -8.89847183227539, -8.103139877319336, -7.307807922363281, -6.512475967407227, -5.717144012451172, -4.921812057495117, -4.1264801025390625, -3.331148147583008, -2.535816192626953, -1.7404842376708984, -0.9451522827148438, -0.14982032775878906, 0.6455116271972656, 1.4408435821533203, 2.236173629760742, 3.031505584716797, 3.8268375396728516, 4.622169494628906, 5.417501449584961, 6.212833404541016, 7.00816535949707, 7.803497314453125, 8.59882926940918, 9.394161224365234, 10.189493179321289, 10.984825134277344, 11.780157089233398, 12.575489044189453, 13.370820999145508, 14.166152954101562, 14.961484909057617, 15.756816864013672, 16.552148818969727, 17.34748077392578, 18.142812728881836, 18.93814468383789, 19.733476638793945, 20.52880859375, 21.324140548706055, 22.11947250366211, 22.914804458618164, 23.71013641357422, 24.505468368530273, 25.300800323486328, 26.096132278442383, 26.891464233398438, 27.686796188354492]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 12.0, 9.0, 7.0, 18.0, 28.0, 54.0, 57.0, 83.0, 159.0, 182.0, 262.0, 368.0, 534.0, 951.0, 1308.0, 2236.0, 4040.0, 8803.0, 26296.0, 98901.0, 473016.0, 2012369.0, 1226519.0, 247187.0, 58714.0, 17474.0, 6334.0, 3180.0, 1777.0, 1071.0, 724.0, 482.0, 337.0, 229.0, 157.0, 129.0, 93.0, 49.0, 37.0, 30.0, 18.0, 15.0, 13.0, 8.0, 10.0, 5.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.7392578125, -1.690673828125, -1.64208984375, -1.593505859375, -1.544921875, -1.496337890625, -1.44775390625, -1.399169921875, -1.3505859375, -1.302001953125, -1.25341796875, -1.204833984375, -1.15625, -1.107666015625, -1.05908203125, -1.010498046875, -0.9619140625, -0.913330078125, -0.86474609375, -0.816162109375, -0.767578125, -0.718994140625, -0.67041015625, -0.621826171875, -0.5732421875, -0.524658203125, -0.47607421875, -0.427490234375, -0.37890625, -0.330322265625, -0.28173828125, -0.233154296875, -0.1845703125, -0.135986328125, -0.08740234375, -0.038818359375, 0.009765625, 0.058349609375, 0.10693359375, 0.155517578125, 0.2041015625, 0.252685546875, 0.30126953125, 0.349853515625, 0.3984375, 0.447021484375, 0.49560546875, 0.544189453125, 0.5927734375, 0.641357421875, 0.68994140625, 0.738525390625, 0.787109375, 0.835693359375, 0.88427734375, 0.932861328125, 0.9814453125, 1.030029296875, 1.07861328125, 1.127197265625, 1.17578125, 1.224365234375, 1.27294921875, 1.321533203125, 1.3701171875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 8.0, 10.0, 16.0, 17.0, 16.0, 13.0, 20.0, 23.0, 13.0, 26.0, 36.0, 33.0, 39.0, 43.0, 49.0, 47.0, 62.0, 44.0, 46.0, 38.0, 45.0, 37.0, 38.0, 35.0, 39.0, 31.0, 32.0, 27.0, 30.0, 12.0, 19.0, 11.0, 8.0, 8.0, 7.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.046234130859375, -1.98504638671875, -1.923858642578125, -1.8626708984375, -1.801483154296875, -1.74029541015625, -1.679107666015625, -1.617919921875, -1.556732177734375, -1.49554443359375, -1.434356689453125, -1.3731689453125, -1.311981201171875, -1.25079345703125, -1.189605712890625, -1.12841796875, -1.067230224609375, -1.00604248046875, -0.944854736328125, -0.8836669921875, -0.822479248046875, -0.76129150390625, -0.700103759765625, -0.638916015625, -0.577728271484375, -0.51654052734375, -0.455352783203125, -0.3941650390625, -0.332977294921875, -0.27178955078125, -0.210601806640625, -0.1494140625, -0.088226318359375, -0.02703857421875, 0.034149169921875, 0.0953369140625, 0.156524658203125, 0.21771240234375, 0.278900146484375, 0.340087890625, 0.401275634765625, 0.46246337890625, 0.523651123046875, 0.5848388671875, 0.646026611328125, 0.70721435546875, 0.768402099609375, 0.82958984375, 0.890777587890625, 0.95196533203125, 1.013153076171875, 1.0743408203125, 1.135528564453125, 1.19671630859375, 1.257904052734375, 1.319091796875, 1.380279541015625, 1.44146728515625, 1.502655029296875, 1.5638427734375, 1.625030517578125, 1.68621826171875, 1.747406005859375, 1.80859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 9.0, 5.0, 11.0, 18.0, 34.0, 56.0, 121.0, 299.0, 1305.0, 26377.0, 4142510.0, 21632.0, 1345.0, 280.0, 122.0, 70.0, 47.0, 25.0, 14.0, 3.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.1796875, -10.7728271484375, -10.365966796875, -9.9591064453125, -9.55224609375, -9.1453857421875, -8.738525390625, -8.3316650390625, -7.9248046875, -7.5179443359375, -7.111083984375, -6.7042236328125, -6.29736328125, -5.8905029296875, -5.483642578125, -5.0767822265625, -4.669921875, -4.2630615234375, -3.856201171875, -3.4493408203125, -3.04248046875, -2.6356201171875, -2.228759765625, -1.8218994140625, -1.4150390625, -1.0081787109375, -0.601318359375, -0.1944580078125, 0.21240234375, 0.6192626953125, 1.026123046875, 1.4329833984375, 1.83984375, 2.2467041015625, 2.653564453125, 3.0604248046875, 3.46728515625, 3.8741455078125, 4.281005859375, 4.6878662109375, 5.0947265625, 5.5015869140625, 5.908447265625, 6.3153076171875, 6.72216796875, 7.1290283203125, 7.535888671875, 7.9427490234375, 8.349609375, 8.7564697265625, 9.163330078125, 9.5701904296875, 9.97705078125, 10.3839111328125, 10.790771484375, 11.1976318359375, 11.6044921875, 12.0113525390625, 12.418212890625, 12.8250732421875, 13.23193359375, 13.6387939453125, 14.045654296875, 14.4525146484375, 14.859375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 4.0, 4.0, 7.0, 10.0, 15.0, 21.0, 43.0, 78.0, 197.0, 513.0, 1290.0, 1131.0, 440.0, 160.0, 74.0, 30.0, 25.0, 13.0, 7.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.826171875, -3.643341064453125, -3.46051025390625, -3.277679443359375, -3.0948486328125, -2.912017822265625, -2.72918701171875, -2.546356201171875, -2.363525390625, -2.180694580078125, -1.99786376953125, -1.815032958984375, -1.6322021484375, -1.449371337890625, -1.26654052734375, -1.083709716796875, -0.90087890625, -0.718048095703125, -0.53521728515625, -0.352386474609375, -0.1695556640625, 0.013275146484375, 0.19610595703125, 0.378936767578125, 0.561767578125, 0.744598388671875, 0.92742919921875, 1.110260009765625, 1.2930908203125, 1.475921630859375, 1.65875244140625, 1.841583251953125, 2.0244140625, 2.207244873046875, 2.39007568359375, 2.572906494140625, 2.7557373046875, 2.938568115234375, 3.12139892578125, 3.304229736328125, 3.487060546875, 3.669891357421875, 3.85272216796875, 4.035552978515625, 4.2183837890625, 4.401214599609375, 4.58404541015625, 4.766876220703125, 4.94970703125, 5.132537841796875, 5.31536865234375, 5.498199462890625, 5.6810302734375, 5.863861083984375, 6.04669189453125, 6.229522705078125, 6.412353515625, 6.595184326171875, 6.77801513671875, 6.960845947265625, 7.1436767578125, 7.326507568359375, 7.50933837890625, 7.692169189453125, 7.875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 10.0, 20.0, 65.0, 162.0, 355.0, 251.0, 98.0, 27.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.03592681884766, -69.33355712890625, -67.63119506835938, -65.92882537841797, -64.2264633178711, -62.52409744262695, -60.82173156738281, -59.11936569213867, -57.41699981689453, -55.71463394165039, -54.01226806640625, -52.30990219116211, -50.60753631591797, -48.90517044067383, -47.20280456542969, -45.50043869018555, -43.798072814941406, -42.095706939697266, -40.393341064453125, -38.690975189208984, -36.988609313964844, -35.2862434387207, -33.58387756347656, -31.881511688232422, -30.179141998291016, -28.476776123046875, -26.774410247802734, -25.072044372558594, -23.369678497314453, -21.667312622070312, -19.964946746826172, -18.26258087158203, -16.56021499633789, -14.85784912109375, -13.15548324584961, -11.453117370605469, -9.750751495361328, -8.048384666442871, -6.3460187911987305, -4.64365291595459, -2.941287040710449, -1.238921046257019, 0.46344494819641113, 2.165811061859131, 3.8681769371032715, 5.57054328918457, 7.272909164428711, 8.975275039672852, 10.677640914916992, 12.380006790161133, 14.082372665405273, 15.784738540649414, 17.487104415893555, 19.189472198486328, 20.89183807373047, 22.59420394897461, 24.29656982421875, 25.99893569946289, 27.70130157470703, 29.403667449951172, 31.106033325195312, 32.80839920043945, 34.510765075683594, 36.213130950927734, 37.915496826171875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 7.0, 6.0, 9.0, 7.0, 5.0, 8.0, 12.0, 11.0, 14.0, 23.0, 18.0, 28.0, 33.0, 36.0, 29.0, 38.0, 50.0, 32.0, 47.0, 32.0, 38.0, 38.0, 49.0, 32.0, 43.0, 31.0, 37.0, 33.0, 38.0, 25.0, 29.0, 28.0, 25.0, 19.0, 13.0, 10.0, 13.0, 12.0, 5.0, 6.0, 9.0, 4.0, 6.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-14.523801803588867, -14.1176176071167, -13.711434364318848, -13.30525016784668, -12.899065971374512, -12.492881774902344, -12.086698532104492, -11.680514335632324, -11.274330139160156, -10.868145942687988, -10.461962699890137, -10.055778503417969, -9.6495943069458, -9.243410110473633, -8.837226867675781, -8.431042671203613, -8.024859428405762, -7.618675708770752, -7.212491512298584, -6.806307792663574, -6.400123596191406, -5.9939398765563965, -5.587756156921387, -5.181571960449219, -4.775388240814209, -4.369204521179199, -3.9630203247070312, -3.5568366050720215, -3.1506526470184326, -2.7444686889648438, -2.338284969329834, -1.9321010112762451, -1.5259160995483398, -1.119732141494751, -0.7135483026504517, -0.30736446380615234, 0.09881949424743652, 0.5050034523010254, 0.9111871719360352, 1.317371129989624, 1.723555088043213, 2.1297390460968018, 2.5359230041503906, 2.9421067237854004, 3.3482906818389893, 3.754474639892578, 4.160658359527588, 4.566842079162598, 4.973026275634766, 5.379209995269775, 5.785394191741943, 6.191577911376953, 6.597762107849121, 7.003945827484131, 7.410129547119141, 7.816313743591309, 8.222497940063477, 8.628682136535645, 9.034865379333496, 9.441049575805664, 9.847233772277832, 10.25341796875, 10.659601211547852, 11.06578540802002, 11.471968650817871]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 9.0, 3.0, 6.0, 5.0, 11.0, 8.0, 18.0, 31.0, 37.0, 47.0, 68.0, 86.0, 167.0, 209.0, 300.0, 491.0, 808.0, 1279.0, 2249.0, 4080.0, 7837.0, 15612.0, 33644.0, 78697.0, 204745.0, 378786.0, 185222.0, 71700.0, 30972.0, 14520.0, 7443.0, 3924.0, 2126.0, 1230.0, 758.0, 473.0, 302.0, 182.0, 123.0, 103.0, 69.0, 48.0, 43.0, 31.0, 14.0, 16.0, 11.0, 8.0, 5.0, 0.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.234375, -2.163330078125, -2.09228515625, -2.021240234375, -1.9501953125, -1.879150390625, -1.80810546875, -1.737060546875, -1.666015625, -1.594970703125, -1.52392578125, -1.452880859375, -1.3818359375, -1.310791015625, -1.23974609375, -1.168701171875, -1.09765625, -1.026611328125, -0.95556640625, -0.884521484375, -0.8134765625, -0.742431640625, -0.67138671875, -0.600341796875, -0.529296875, -0.458251953125, -0.38720703125, -0.316162109375, -0.2451171875, -0.174072265625, -0.10302734375, -0.031982421875, 0.0390625, 0.110107421875, 0.18115234375, 0.252197265625, 0.3232421875, 0.394287109375, 0.46533203125, 0.536376953125, 0.607421875, 0.678466796875, 0.74951171875, 0.820556640625, 0.8916015625, 0.962646484375, 1.03369140625, 1.104736328125, 1.17578125, 1.246826171875, 1.31787109375, 1.388916015625, 1.4599609375, 1.531005859375, 1.60205078125, 1.673095703125, 1.744140625, 1.815185546875, 1.88623046875, 1.957275390625, 2.0283203125, 2.099365234375, 2.17041015625, 2.241455078125, 2.3125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 8.0, 10.0, 12.0, 9.0, 10.0, 17.0, 14.0, 13.0, 16.0, 35.0, 26.0, 21.0, 31.0, 28.0, 37.0, 38.0, 51.0, 47.0, 47.0, 46.0, 35.0, 52.0, 36.0, 40.0, 42.0, 27.0, 32.0, 36.0, 27.0, 22.0, 24.0, 22.0, 16.0, 12.0, 11.0, 8.0, 9.0, 7.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.07421875, -2.015533447265625, -1.95684814453125, -1.898162841796875, -1.8394775390625, -1.780792236328125, -1.72210693359375, -1.663421630859375, -1.604736328125, -1.546051025390625, -1.48736572265625, -1.428680419921875, -1.3699951171875, -1.311309814453125, -1.25262451171875, -1.193939208984375, -1.13525390625, -1.076568603515625, -1.01788330078125, -0.959197998046875, -0.9005126953125, -0.841827392578125, -0.78314208984375, -0.724456787109375, -0.665771484375, -0.607086181640625, -0.54840087890625, -0.489715576171875, -0.4310302734375, -0.372344970703125, -0.31365966796875, -0.254974365234375, -0.1962890625, -0.137603759765625, -0.07891845703125, -0.020233154296875, 0.0384521484375, 0.097137451171875, 0.15582275390625, 0.214508056640625, 0.273193359375, 0.331878662109375, 0.39056396484375, 0.449249267578125, 0.5079345703125, 0.566619873046875, 0.62530517578125, 0.683990478515625, 0.74267578125, 0.801361083984375, 0.86004638671875, 0.918731689453125, 0.9774169921875, 1.036102294921875, 1.09478759765625, 1.153472900390625, 1.212158203125, 1.270843505859375, 1.32952880859375, 1.388214111328125, 1.4468994140625, 1.505584716796875, 1.56427001953125, 1.622955322265625, 1.681640625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 0.0, 4.0, 3.0, 2.0, 6.0, 8.0, 16.0, 8.0, 16.0, 25.0, 29.0, 36.0, 50.0, 72.0, 107.0, 155.0, 189.0, 304.0, 532.0, 1212.0, 3262.0, 14097.0, 116343.0, 824770.0, 71858.0, 10237.0, 2655.0, 1030.0, 520.0, 303.0, 183.0, 154.0, 101.0, 63.0, 55.0, 43.0, 28.0, 14.0, 9.0, 15.0, 10.0, 5.0, 5.0, 7.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.3984375, -6.20098876953125, -6.0035400390625, -5.80609130859375, -5.608642578125, -5.41119384765625, -5.2137451171875, -5.01629638671875, -4.81884765625, -4.62139892578125, -4.4239501953125, -4.22650146484375, -4.029052734375, -3.83160400390625, -3.6341552734375, -3.43670654296875, -3.2392578125, -3.04180908203125, -2.8443603515625, -2.64691162109375, -2.449462890625, -2.25201416015625, -2.0545654296875, -1.85711669921875, -1.65966796875, -1.46221923828125, -1.2647705078125, -1.06732177734375, -0.869873046875, -0.67242431640625, -0.4749755859375, -0.27752685546875, -0.080078125, 0.11737060546875, 0.3148193359375, 0.51226806640625, 0.709716796875, 0.90716552734375, 1.1046142578125, 1.30206298828125, 1.49951171875, 1.69696044921875, 1.8944091796875, 2.09185791015625, 2.289306640625, 2.48675537109375, 2.6842041015625, 2.88165283203125, 3.0791015625, 3.27655029296875, 3.4739990234375, 3.67144775390625, 3.868896484375, 4.06634521484375, 4.2637939453125, 4.46124267578125, 4.65869140625, 4.85614013671875, 5.0535888671875, 5.25103759765625, 5.448486328125, 5.64593505859375, 5.8433837890625, 6.04083251953125, 6.23828125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 17.0, 21.0, 19.0, 22.0, 23.0, 29.0, 32.0, 38.0, 44.0, 54.0, 56.0, 76.0, 66.0, 58.0, 68.0, 51.0, 60.0, 42.0, 39.0, 32.0, 23.0, 24.0, 18.0, 12.0, 18.0, 12.0, 11.0, 6.0, 7.0, 2.0, 6.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.953125, -8.67236328125, -8.3916015625, -8.11083984375, -7.830078125, -7.54931640625, -7.2685546875, -6.98779296875, -6.70703125, -6.42626953125, -6.1455078125, -5.86474609375, -5.583984375, -5.30322265625, -5.0224609375, -4.74169921875, -4.4609375, -4.18017578125, -3.8994140625, -3.61865234375, -3.337890625, -3.05712890625, -2.7763671875, -2.49560546875, -2.21484375, -1.93408203125, -1.6533203125, -1.37255859375, -1.091796875, -0.81103515625, -0.5302734375, -0.24951171875, 0.03125, 0.31201171875, 0.5927734375, 0.87353515625, 1.154296875, 1.43505859375, 1.7158203125, 1.99658203125, 2.27734375, 2.55810546875, 2.8388671875, 3.11962890625, 3.400390625, 3.68115234375, 3.9619140625, 4.24267578125, 4.5234375, 4.80419921875, 5.0849609375, 5.36572265625, 5.646484375, 5.92724609375, 6.2080078125, 6.48876953125, 6.76953125, 7.05029296875, 7.3310546875, 7.61181640625, 7.892578125, 8.17333984375, 8.4541015625, 8.73486328125, 9.015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 7.0, 9.0, 19.0, 51.0, 72.0, 115.0, 315.0, 838.0, 2913.0, 13064.0, 123833.0, 858595.0, 39501.0, 6606.0, 1616.0, 556.0, 198.0, 90.0, 45.0, 36.0, 22.0, 7.0, 5.0, 5.0, 7.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.29296875, -3.19964599609375, -3.1063232421875, -3.01300048828125, -2.919677734375, -2.82635498046875, -2.7330322265625, -2.63970947265625, -2.54638671875, -2.45306396484375, -2.3597412109375, -2.26641845703125, -2.173095703125, -2.07977294921875, -1.9864501953125, -1.89312744140625, -1.7998046875, -1.70648193359375, -1.6131591796875, -1.51983642578125, -1.426513671875, -1.33319091796875, -1.2398681640625, -1.14654541015625, -1.05322265625, -0.95989990234375, -0.8665771484375, -0.77325439453125, -0.679931640625, -0.58660888671875, -0.4932861328125, -0.39996337890625, -0.306640625, -0.21331787109375, -0.1199951171875, -0.02667236328125, 0.066650390625, 0.15997314453125, 0.2532958984375, 0.34661865234375, 0.43994140625, 0.53326416015625, 0.6265869140625, 0.71990966796875, 0.813232421875, 0.90655517578125, 0.9998779296875, 1.09320068359375, 1.1865234375, 1.27984619140625, 1.3731689453125, 1.46649169921875, 1.559814453125, 1.65313720703125, 1.7464599609375, 1.83978271484375, 1.93310546875, 2.02642822265625, 2.1197509765625, 2.21307373046875, 2.306396484375, 2.39971923828125, 2.4930419921875, 2.58636474609375, 2.6796875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 6.0, 3.0, 12.0, 12.0, 24.0, 29.0, 51.0, 110.0, 225.0, 217.0, 124.0, 65.0, 40.0, 18.0, 15.0, 11.0, 10.0, 5.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006418228149414062, -0.0006218254566192627, -0.0006018280982971191, -0.0005818307399749756, -0.000561833381652832, -0.0005418360233306885, -0.0005218386650085449, -0.0005018413066864014, -0.0004818439483642578, -0.00046184659004211426, -0.0004418492317199707, -0.00042185187339782715, -0.0004018545150756836, -0.00038185715675354004, -0.0003618597984313965, -0.00034186244010925293, -0.0003218650817871094, -0.0003018677234649658, -0.00028187036514282227, -0.0002618730068206787, -0.00024187564849853516, -0.0002218782901763916, -0.00020188093185424805, -0.0001818835735321045, -0.00016188621520996094, -0.00014188885688781738, -0.00012189149856567383, -0.00010189414024353027, -8.189678192138672e-05, -6.189942359924316e-05, -4.190206527709961e-05, -2.1904706954956055e-05, -1.9073486328125e-06, 1.8090009689331055e-05, 3.808736801147461e-05, 5.8084726333618164e-05, 7.808208465576172e-05, 9.807944297790527e-05, 0.00011807680130004883, 0.00013807415962219238, 0.00015807151794433594, 0.0001780688762664795, 0.00019806623458862305, 0.0002180635929107666, 0.00023806095123291016, 0.0002580583095550537, 0.00027805566787719727, 0.0002980530261993408, 0.0003180503845214844, 0.00033804774284362793, 0.0003580451011657715, 0.00037804245948791504, 0.0003980398178100586, 0.00041803717613220215, 0.0004380345344543457, 0.00045803189277648926, 0.0004780292510986328, 0.0004980266094207764, 0.0005180239677429199, 0.0005380213260650635, 0.000558018684387207, 0.0005780160427093506, 0.0005980134010314941, 0.0006180107593536377, 0.0006380081176757812]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 7.0, 7.0, 8.0, 10.0, 11.0, 35.0, 62.0, 126.0, 386.0, 1863.0, 33641.0, 997700.0, 13011.0, 1158.0, 288.0, 110.0, 39.0, 35.0, 19.0, 10.0, 12.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265625, -5.07330322265625, -4.8809814453125, -4.68865966796875, -4.496337890625, -4.30401611328125, -4.1116943359375, -3.91937255859375, -3.72705078125, -3.53472900390625, -3.3424072265625, -3.15008544921875, -2.957763671875, -2.76544189453125, -2.5731201171875, -2.38079833984375, -2.1884765625, -1.99615478515625, -1.8038330078125, -1.61151123046875, -1.419189453125, -1.22686767578125, -1.0345458984375, -0.84222412109375, -0.64990234375, -0.45758056640625, -0.2652587890625, -0.07293701171875, 0.119384765625, 0.31170654296875, 0.5040283203125, 0.69635009765625, 0.888671875, 1.08099365234375, 1.2733154296875, 1.46563720703125, 1.657958984375, 1.85028076171875, 2.0426025390625, 2.23492431640625, 2.42724609375, 2.61956787109375, 2.8118896484375, 3.00421142578125, 3.196533203125, 3.38885498046875, 3.5811767578125, 3.77349853515625, 3.9658203125, 4.15814208984375, 4.3504638671875, 4.54278564453125, 4.735107421875, 4.92742919921875, 5.1197509765625, 5.31207275390625, 5.50439453125, 5.69671630859375, 5.8890380859375, 6.08135986328125, 6.273681640625, 6.46600341796875, 6.6583251953125, 6.85064697265625, 7.04296875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 9.0, 8.0, 16.0, 20.0, 46.0, 83.0, 146.0, 239.0, 205.0, 79.0, 52.0, 33.0, 28.0, 14.0, 7.0, 7.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.615234375, -3.508087158203125, -3.40093994140625, -3.293792724609375, -3.1866455078125, -3.079498291015625, -2.97235107421875, -2.865203857421875, -2.758056640625, -2.650909423828125, -2.54376220703125, -2.436614990234375, -2.3294677734375, -2.222320556640625, -2.11517333984375, -2.008026123046875, -1.90087890625, -1.793731689453125, -1.68658447265625, -1.579437255859375, -1.4722900390625, -1.365142822265625, -1.25799560546875, -1.150848388671875, -1.043701171875, -0.936553955078125, -0.82940673828125, -0.722259521484375, -0.6151123046875, -0.507965087890625, -0.40081787109375, -0.293670654296875, -0.1865234375, -0.079376220703125, 0.02777099609375, 0.134918212890625, 0.2420654296875, 0.349212646484375, 0.45635986328125, 0.563507080078125, 0.670654296875, 0.777801513671875, 0.88494873046875, 0.992095947265625, 1.0992431640625, 1.206390380859375, 1.31353759765625, 1.420684814453125, 1.52783203125, 1.634979248046875, 1.74212646484375, 1.849273681640625, 1.9564208984375, 2.063568115234375, 2.17071533203125, 2.277862548828125, 2.385009765625, 2.492156982421875, 2.59930419921875, 2.706451416015625, 2.8135986328125, 2.920745849609375, 3.02789306640625, 3.135040283203125, 3.2421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 11.0, 16.0, 35.0, 49.0, 112.0, 258.0, 253.0, 130.0, 67.0, 30.0, 13.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.383201599121094, -34.07194519042969, -32.76069259643555, -31.44943618774414, -30.138181686401367, -28.826927185058594, -27.515670776367188, -26.204416275024414, -24.89316177368164, -23.581907272338867, -22.270652770996094, -20.959396362304688, -19.648141860961914, -18.33688735961914, -17.025630950927734, -15.714376449584961, -14.403121948242188, -13.091867446899414, -11.780611991882324, -10.469356536865234, -9.158102035522461, -7.846847057342529, -6.535592079162598, -5.224336624145508, -3.9130821228027344, -2.6018271446228027, -1.290572166442871, 0.020682811737060547, 1.3319377899169922, 2.643192768096924, 3.9544477462768555, 5.265703201293945, 6.576953887939453, 7.888208866119385, 9.199463844299316, 10.510719299316406, 11.82197380065918, 13.133228302001953, 14.444483757019043, 15.755739212036133, 17.066993713378906, 18.37824821472168, 19.689502716064453, 21.00075912475586, 22.312013626098633, 23.623268127441406, 24.934524536132812, 26.245779037475586, 27.55703353881836, 28.868288040161133, 30.179542541503906, 31.490798950195312, 32.80205535888672, 34.11330795288086, 35.424564361572266, 36.735816955566406, 38.04707336425781, 39.35832977294922, 40.66958236694336, 41.980838775634766, 43.292091369628906, 44.60334777832031, 45.91460418701172, 47.225860595703125, 48.537113189697266]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 3.0, 3.0, 5.0, 2.0, 4.0, 4.0, 9.0, 2.0, 12.0, 11.0, 13.0, 8.0, 11.0, 15.0, 16.0, 16.0, 26.0, 35.0, 34.0, 37.0, 44.0, 62.0, 60.0, 94.0, 96.0, 60.0, 40.0, 38.0, 34.0, 25.0, 25.0, 15.0, 34.0, 17.0, 20.0, 16.0, 11.0, 11.0, 6.0, 11.0, 2.0, 9.0, 2.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.35497283935547, -22.480236053466797, -21.605499267578125, -20.730762481689453, -19.856027603149414, -18.981290817260742, -18.10655403137207, -17.2318172454834, -16.35708236694336, -15.482345581054688, -14.607609748840332, -13.73287296295166, -12.858137130737305, -11.983400344848633, -11.108663558959961, -10.233926773071289, -9.359189987182617, -8.484453201293945, -7.60971736907959, -6.734980583190918, -5.860244274139404, -4.985507965087891, -4.110771179199219, -3.236034870147705, -2.3612985610961914, -1.4865621328353882, -0.611825704574585, 0.2629108428955078, 1.1376471519470215, 2.012383460998535, 2.887120246887207, 3.7618565559387207, 4.636592864990234, 5.511329174041748, 6.386065483093262, 7.260802268981934, 8.135538101196289, 9.010274887084961, 9.885011672973633, 10.759748458862305, 11.63448429107666, 12.509221076965332, 13.383956909179688, 14.25869369506836, 15.133430480957031, 16.008167266845703, 16.882904052734375, 17.757638931274414, 18.632375717163086, 19.507112503051758, 20.38184928894043, 21.25658416748047, 22.13132095336914, 23.006057739257812, 23.880794525146484, 24.755531311035156, 25.630268096923828, 26.5050048828125, 27.379741668701172, 28.254478454589844, 29.129213333129883, 30.003950119018555, 30.878686904907227, 31.7534236907959, 32.62815856933594]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 10.0, 9.0, 12.0, 16.0, 33.0, 33.0, 39.0, 63.0, 102.0, 124.0, 195.0, 286.0, 430.0, 806.0, 1367.0, 2509.0, 5398.0, 15743.0, 114157.0, 1818787.0, 2070663.0, 133683.0, 17650.0, 5709.0, 2667.0, 1451.0, 823.0, 534.0, 334.0, 183.0, 134.0, 85.0, 58.0, 50.0, 30.0, 36.0, 13.0, 19.0, 9.0, 12.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09765625, -2.9945068359375, -2.891357421875, -2.7882080078125, -2.68505859375, -2.5819091796875, -2.478759765625, -2.3756103515625, -2.2724609375, -2.1693115234375, -2.066162109375, -1.9630126953125, -1.85986328125, -1.7567138671875, -1.653564453125, -1.5504150390625, -1.447265625, -1.3441162109375, -1.240966796875, -1.1378173828125, -1.03466796875, -0.9315185546875, -0.828369140625, -0.7252197265625, -0.6220703125, -0.5189208984375, -0.415771484375, -0.3126220703125, -0.20947265625, -0.1063232421875, -0.003173828125, 0.0999755859375, 0.203125, 0.3062744140625, 0.409423828125, 0.5125732421875, 0.61572265625, 0.7188720703125, 0.822021484375, 0.9251708984375, 1.0283203125, 1.1314697265625, 1.234619140625, 1.3377685546875, 1.44091796875, 1.5440673828125, 1.647216796875, 1.7503662109375, 1.853515625, 1.9566650390625, 2.059814453125, 2.1629638671875, 2.26611328125, 2.3692626953125, 2.472412109375, 2.5755615234375, 2.6787109375, 2.7818603515625, 2.885009765625, 2.9881591796875, 3.09130859375, 3.1944580078125, 3.297607421875, 3.4007568359375, 3.50390625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 15.0, 20.0, 11.0, 17.0, 19.0, 22.0, 27.0, 24.0, 25.0, 29.0, 40.0, 40.0, 50.0, 35.0, 56.0, 57.0, 31.0, 42.0, 48.0, 61.0, 36.0, 42.0, 33.0, 36.0, 31.0, 25.0, 23.0, 14.0, 10.0, 8.0, 10.0, 12.0, 9.0, 4.0, 4.0, 6.0, 2.0, 1.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.07421875, -2.0109405517578125, -1.947662353515625, -1.8843841552734375, -1.82110595703125, -1.7578277587890625, -1.694549560546875, -1.6312713623046875, -1.5679931640625, -1.5047149658203125, -1.441436767578125, -1.3781585693359375, -1.31488037109375, -1.2516021728515625, -1.188323974609375, -1.1250457763671875, -1.061767578125, -0.9984893798828125, -0.935211181640625, -0.8719329833984375, -0.80865478515625, -0.7453765869140625, -0.682098388671875, -0.6188201904296875, -0.5555419921875, -0.4922637939453125, -0.428985595703125, -0.3657073974609375, -0.30242919921875, -0.2391510009765625, -0.175872802734375, -0.1125946044921875, -0.04931640625, 0.0139617919921875, 0.077239990234375, 0.1405181884765625, 0.20379638671875, 0.2670745849609375, 0.330352783203125, 0.3936309814453125, 0.4569091796875, 0.5201873779296875, 0.583465576171875, 0.6467437744140625, 0.71002197265625, 0.7733001708984375, 0.836578369140625, 0.8998565673828125, 0.963134765625, 1.0264129638671875, 1.089691162109375, 1.1529693603515625, 1.21624755859375, 1.2795257568359375, 1.342803955078125, 1.4060821533203125, 1.4693603515625, 1.5326385498046875, 1.595916748046875, 1.6591949462890625, 1.72247314453125, 1.7857513427734375, 1.849029541015625, 1.9123077392578125, 1.9755859375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 13.0, 12.0, 16.0, 20.0, 32.0, 54.0, 118.0, 277.0, 939.0, 3303.0, 28301.0, 4079854.0, 74315.0, 5089.0, 1245.0, 385.0, 142.0, 56.0, 29.0, 24.0, 17.0, 7.0, 10.0, 3.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-12.2421875, -11.8985595703125, -11.554931640625, -11.2113037109375, -10.86767578125, -10.5240478515625, -10.180419921875, -9.8367919921875, -9.4931640625, -9.1495361328125, -8.805908203125, -8.4622802734375, -8.11865234375, -7.7750244140625, -7.431396484375, -7.0877685546875, -6.744140625, -6.4005126953125, -6.056884765625, -5.7132568359375, -5.36962890625, -5.0260009765625, -4.682373046875, -4.3387451171875, -3.9951171875, -3.6514892578125, -3.307861328125, -2.9642333984375, -2.62060546875, -2.2769775390625, -1.933349609375, -1.5897216796875, -1.24609375, -0.9024658203125, -0.558837890625, -0.2152099609375, 0.12841796875, 0.4720458984375, 0.815673828125, 1.1593017578125, 1.5029296875, 1.8465576171875, 2.190185546875, 2.5338134765625, 2.87744140625, 3.2210693359375, 3.564697265625, 3.9083251953125, 4.251953125, 4.5955810546875, 4.939208984375, 5.2828369140625, 5.62646484375, 5.9700927734375, 6.313720703125, 6.6573486328125, 7.0009765625, 7.3446044921875, 7.688232421875, 8.0318603515625, 8.37548828125, 8.7191162109375, 9.062744140625, 9.4063720703125, 9.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 14.0, 19.0, 30.0, 45.0, 70.0, 176.0, 463.0, 1066.0, 1175.0, 550.0, 225.0, 87.0, 46.0, 36.0, 16.0, 8.0, 5.0, 2.0, 4.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.21875, -7.01318359375, -6.8076171875, -6.60205078125, -6.396484375, -6.19091796875, -5.9853515625, -5.77978515625, -5.57421875, -5.36865234375, -5.1630859375, -4.95751953125, -4.751953125, -4.54638671875, -4.3408203125, -4.13525390625, -3.9296875, -3.72412109375, -3.5185546875, -3.31298828125, -3.107421875, -2.90185546875, -2.6962890625, -2.49072265625, -2.28515625, -2.07958984375, -1.8740234375, -1.66845703125, -1.462890625, -1.25732421875, -1.0517578125, -0.84619140625, -0.640625, -0.43505859375, -0.2294921875, -0.02392578125, 0.181640625, 0.38720703125, 0.5927734375, 0.79833984375, 1.00390625, 1.20947265625, 1.4150390625, 1.62060546875, 1.826171875, 2.03173828125, 2.2373046875, 2.44287109375, 2.6484375, 2.85400390625, 3.0595703125, 3.26513671875, 3.470703125, 3.67626953125, 3.8818359375, 4.08740234375, 4.29296875, 4.49853515625, 4.7041015625, 4.90966796875, 5.115234375, 5.32080078125, 5.5263671875, 5.73193359375, 5.9375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 15.0, 14.0, 25.0, 60.0, 115.0, 198.0, 216.0, 178.0, 81.0, 47.0, 22.0, 9.0, 2.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.022735595703125, -39.759361267089844, -38.49598693847656, -37.23261260986328, -35.969242095947266, -34.705867767333984, -33.4424934387207, -32.17911911010742, -30.91574478149414, -29.65237045288086, -28.38899803161621, -27.12562370300293, -25.86224937438965, -24.598876953125, -23.33550262451172, -22.072128295898438, -20.80875587463379, -19.545381546020508, -18.28200912475586, -17.018634796142578, -15.755260467529297, -14.491887092590332, -13.228513717651367, -11.965139389038086, -10.701766014099121, -9.438392639160156, -8.175018310546875, -6.91164493560791, -5.648271083831787, -4.384897232055664, -3.121523857116699, -1.858149528503418, -0.5947761535644531, 0.6685975790023804, 1.9319713115692139, 3.195344924926758, 4.458718776702881, 5.722092628479004, 6.985466003417969, 8.24884033203125, 9.512213706970215, 10.77558708190918, 12.038961410522461, 13.302334785461426, 14.56570816040039, 15.829082489013672, 17.092456817626953, 18.355831146240234, 19.619203567504883, 20.882577896118164, 22.145950317382812, 23.409324645996094, 24.672698974609375, 25.936073303222656, 27.199445724487305, 28.462820053100586, 29.726192474365234, 30.989566802978516, 32.2529411315918, 33.51631164550781, 34.779685974121094, 36.043060302734375, 37.306434631347656, 38.56980895996094, 39.83318328857422]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 1.0, 2.0, 8.0, 4.0, 14.0, 9.0, 20.0, 18.0, 21.0, 25.0, 28.0, 35.0, 54.0, 41.0, 51.0, 57.0, 59.0, 64.0, 63.0, 54.0, 66.0, 47.0, 41.0, 28.0, 36.0, 27.0, 27.0, 27.0, 23.0, 13.0, 12.0, 10.0, 9.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.63462257385254, -22.92302894592285, -22.211435317993164, -21.499841690063477, -20.78824806213379, -20.076656341552734, -19.365062713623047, -18.65346908569336, -17.941875457763672, -17.230281829833984, -16.518688201904297, -15.80709457397461, -15.095501899719238, -14.38390827178955, -13.672314643859863, -12.960721969604492, -12.249127388000488, -11.5375337600708, -10.825940132141113, -10.114347457885742, -9.402753829956055, -8.691160202026367, -7.97956657409668, -7.26797342300415, -6.556379795074463, -5.844786167144775, -5.133193016052246, -4.421599388122559, -3.71000599861145, -2.998412609100342, -2.2868189811706543, -1.575225830078125, -0.8636322021484375, -0.15203875303268433, 0.5595546960830688, 1.2711482048034668, 1.9827415943145752, 2.6943349838256836, 3.405928611755371, 4.1175217628479, 4.829115390777588, 5.540709018707275, 6.252302169799805, 6.963895797729492, 7.67548942565918, 8.387083053588867, 9.098676681518555, 9.810269355773926, 10.521862983703613, 11.2334566116333, 11.945050239562988, 12.65664291381836, 13.368236541748047, 14.079830169677734, 14.791423797607422, 15.50301742553711, 16.214611053466797, 16.926204681396484, 17.637798309326172, 18.34939193725586, 19.060985565185547, 19.772579193115234, 20.484172821044922, 21.195764541625977, 21.907358169555664]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 9.0, 12.0, 11.0, 28.0, 39.0, 49.0, 57.0, 110.0, 158.0, 237.0, 323.0, 493.0, 818.0, 1394.0, 2210.0, 4003.0, 7215.0, 14233.0, 32509.0, 92184.0, 335651.0, 382829.0, 104260.0, 35990.0, 15409.0, 7735.0, 4280.0, 2365.0, 1470.0, 856.0, 531.0, 341.0, 262.0, 147.0, 110.0, 75.0, 51.0, 22.0, 21.0, 24.0, 10.0, 4.0, 7.0, 8.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.564453125, -3.4627685546875, -3.361083984375, -3.2593994140625, -3.15771484375, -3.0560302734375, -2.954345703125, -2.8526611328125, -2.7509765625, -2.6492919921875, -2.547607421875, -2.4459228515625, -2.34423828125, -2.2425537109375, -2.140869140625, -2.0391845703125, -1.9375, -1.8358154296875, -1.734130859375, -1.6324462890625, -1.53076171875, -1.4290771484375, -1.327392578125, -1.2257080078125, -1.1240234375, -1.0223388671875, -0.920654296875, -0.8189697265625, -0.71728515625, -0.6156005859375, -0.513916015625, -0.4122314453125, -0.310546875, -0.2088623046875, -0.107177734375, -0.0054931640625, 0.09619140625, 0.1978759765625, 0.299560546875, 0.4012451171875, 0.5029296875, 0.6046142578125, 0.706298828125, 0.8079833984375, 0.90966796875, 1.0113525390625, 1.113037109375, 1.2147216796875, 1.31640625, 1.4180908203125, 1.519775390625, 1.6214599609375, 1.72314453125, 1.8248291015625, 1.926513671875, 2.0281982421875, 2.1298828125, 2.2315673828125, 2.333251953125, 2.4349365234375, 2.53662109375, 2.6383056640625, 2.739990234375, 2.8416748046875, 2.943359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 3.0, 5.0, 6.0, 14.0, 18.0, 12.0, 15.0, 27.0, 28.0, 28.0, 46.0, 23.0, 28.0, 34.0, 41.0, 44.0, 41.0, 71.0, 46.0, 53.0, 53.0, 45.0, 49.0, 42.0, 32.0, 30.0, 32.0, 22.0, 26.0, 19.0, 11.0, 15.0, 11.0, 6.0, 7.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.359375, -2.288238525390625, -2.21710205078125, -2.145965576171875, -2.0748291015625, -2.003692626953125, -1.93255615234375, -1.861419677734375, -1.790283203125, -1.719146728515625, -1.64801025390625, -1.576873779296875, -1.5057373046875, -1.434600830078125, -1.36346435546875, -1.292327880859375, -1.22119140625, -1.150054931640625, -1.07891845703125, -1.007781982421875, -0.9366455078125, -0.865509033203125, -0.79437255859375, -0.723236083984375, -0.652099609375, -0.580963134765625, -0.50982666015625, -0.438690185546875, -0.3675537109375, -0.296417236328125, -0.22528076171875, -0.154144287109375, -0.0830078125, -0.011871337890625, 0.05926513671875, 0.130401611328125, 0.2015380859375, 0.272674560546875, 0.34381103515625, 0.414947509765625, 0.486083984375, 0.557220458984375, 0.62835693359375, 0.699493408203125, 0.7706298828125, 0.841766357421875, 0.91290283203125, 0.984039306640625, 1.05517578125, 1.126312255859375, 1.19744873046875, 1.268585205078125, 1.3397216796875, 1.410858154296875, 1.48199462890625, 1.553131103515625, 1.624267578125, 1.695404052734375, 1.76654052734375, 1.837677001953125, 1.9088134765625, 1.979949951171875, 2.05108642578125, 2.122222900390625, 2.193359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 11.0, 5.0, 11.0, 16.0, 21.0, 25.0, 32.0, 39.0, 48.0, 81.0, 91.0, 157.0, 219.0, 236.0, 484.0, 724.0, 1518.0, 4794.0, 37224.0, 909881.0, 81230.0, 7232.0, 1928.0, 929.0, 526.0, 310.0, 218.0, 138.0, 134.0, 60.0, 57.0, 43.0, 38.0, 19.0, 17.0, 17.0, 13.0, 5.0, 2.0, 8.0, 2.0, 8.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.09375, -7.820556640625, -7.54736328125, -7.274169921875, -7.0009765625, -6.727783203125, -6.45458984375, -6.181396484375, -5.908203125, -5.635009765625, -5.36181640625, -5.088623046875, -4.8154296875, -4.542236328125, -4.26904296875, -3.995849609375, -3.72265625, -3.449462890625, -3.17626953125, -2.903076171875, -2.6298828125, -2.356689453125, -2.08349609375, -1.810302734375, -1.537109375, -1.263916015625, -0.99072265625, -0.717529296875, -0.4443359375, -0.171142578125, 0.10205078125, 0.375244140625, 0.6484375, 0.921630859375, 1.19482421875, 1.468017578125, 1.7412109375, 2.014404296875, 2.28759765625, 2.560791015625, 2.833984375, 3.107177734375, 3.38037109375, 3.653564453125, 3.9267578125, 4.199951171875, 4.47314453125, 4.746337890625, 5.01953125, 5.292724609375, 5.56591796875, 5.839111328125, 6.1123046875, 6.385498046875, 6.65869140625, 6.931884765625, 7.205078125, 7.478271484375, 7.75146484375, 8.024658203125, 8.2978515625, 8.571044921875, 8.84423828125, 9.117431640625, 9.390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 14.0, 9.0, 8.0, 15.0, 17.0, 18.0, 15.0, 37.0, 41.0, 44.0, 59.0, 67.0, 69.0, 52.0, 66.0, 54.0, 70.0, 49.0, 47.0, 38.0, 40.0, 31.0, 28.0, 19.0, 19.0, 21.0, 11.0, 4.0, 10.0, 4.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-10.9921875, -10.68994140625, -10.3876953125, -10.08544921875, -9.783203125, -9.48095703125, -9.1787109375, -8.87646484375, -8.57421875, -8.27197265625, -7.9697265625, -7.66748046875, -7.365234375, -7.06298828125, -6.7607421875, -6.45849609375, -6.15625, -5.85400390625, -5.5517578125, -5.24951171875, -4.947265625, -4.64501953125, -4.3427734375, -4.04052734375, -3.73828125, -3.43603515625, -3.1337890625, -2.83154296875, -2.529296875, -2.22705078125, -1.9248046875, -1.62255859375, -1.3203125, -1.01806640625, -0.7158203125, -0.41357421875, -0.111328125, 0.19091796875, 0.4931640625, 0.79541015625, 1.09765625, 1.39990234375, 1.7021484375, 2.00439453125, 2.306640625, 2.60888671875, 2.9111328125, 3.21337890625, 3.515625, 3.81787109375, 4.1201171875, 4.42236328125, 4.724609375, 5.02685546875, 5.3291015625, 5.63134765625, 5.93359375, 6.23583984375, 6.5380859375, 6.84033203125, 7.142578125, 7.44482421875, 7.7470703125, 8.04931640625, 8.3515625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 3.0, 2.0, 5.0, 5.0, 13.0, 12.0, 11.0, 22.0, 37.0, 50.0, 52.0, 74.0, 137.0, 225.0, 447.0, 889.0, 2170.0, 6268.0, 23531.0, 166804.0, 772259.0, 57083.0, 11949.0, 3596.0, 1403.0, 661.0, 286.0, 154.0, 122.0, 76.0, 63.0, 31.0, 22.0, 8.0, 10.0, 9.0, 7.0, 14.0, 11.0, 8.0, 5.0, 6.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2216796875, -1.183807373046875, -1.14593505859375, -1.108062744140625, -1.0701904296875, -1.032318115234375, -0.99444580078125, -0.956573486328125, -0.918701171875, -0.880828857421875, -0.84295654296875, -0.805084228515625, -0.7672119140625, -0.729339599609375, -0.69146728515625, -0.653594970703125, -0.61572265625, -0.577850341796875, -0.53997802734375, -0.502105712890625, -0.4642333984375, -0.426361083984375, -0.38848876953125, -0.350616455078125, -0.312744140625, -0.274871826171875, -0.23699951171875, -0.199127197265625, -0.1612548828125, -0.123382568359375, -0.08551025390625, -0.047637939453125, -0.009765625, 0.028106689453125, 0.06597900390625, 0.103851318359375, 0.1417236328125, 0.179595947265625, 0.21746826171875, 0.255340576171875, 0.293212890625, 0.331085205078125, 0.36895751953125, 0.406829833984375, 0.4447021484375, 0.482574462890625, 0.52044677734375, 0.558319091796875, 0.59619140625, 0.634063720703125, 0.67193603515625, 0.709808349609375, 0.7476806640625, 0.785552978515625, 0.82342529296875, 0.861297607421875, 0.899169921875, 0.937042236328125, 0.97491455078125, 1.012786865234375, 1.0506591796875, 1.088531494140625, 1.12640380859375, 1.164276123046875, 1.2021484375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 6.0, 15.0, 14.0, 26.0, 44.0, 89.0, 152.0, 257.0, 171.0, 96.0, 51.0, 29.0, 16.0, 12.0, 6.0, 2.0, 0.0, 6.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043272972106933594, -0.0004170127213001251, -0.0004012957215309143, -0.0003855787217617035, -0.0003698617219924927, -0.00035414472222328186, -0.00033842772245407104, -0.00032271072268486023, -0.0003069937229156494, -0.0002912767231464386, -0.0002755597233772278, -0.00025984272360801697, -0.00024412572383880615, -0.00022840872406959534, -0.00021269172430038452, -0.0001969747245311737, -0.0001812577247619629, -0.00016554072499275208, -0.00014982372522354126, -0.00013410672545433044, -0.00011838972568511963, -0.00010267272591590881, -8.6955726146698e-05, -7.123872637748718e-05, -5.552172660827637e-05, -3.980472683906555e-05, -2.4087727069854736e-05, -8.370727300643921e-06, 7.3462724685668945e-06, 2.306327223777771e-05, 3.8780272006988525e-05, 5.449727177619934e-05, 7.021427154541016e-05, 8.593127131462097e-05, 0.00010164827108383179, 0.0001173652708530426, 0.00013308227062225342, 0.00014879927039146423, 0.00016451627016067505, 0.00018023326992988586, 0.00019595026969909668, 0.0002116672694683075, 0.0002273842692375183, 0.00024310126900672913, 0.00025881826877593994, 0.00027453526854515076, 0.00029025226831436157, 0.0003059692680835724, 0.0003216862678527832, 0.000337403267621994, 0.00035312026739120483, 0.00036883726716041565, 0.00038455426692962646, 0.0004002712666988373, 0.0004159882664680481, 0.0004317052662372589, 0.0004474222660064697, 0.00046313926577568054, 0.00047885626554489136, 0.0004945732653141022, 0.000510290265083313, 0.0005260072648525238, 0.0005417242646217346, 0.0005574412643909454, 0.0005731582641601562]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 4.0, 9.0, 4.0, 11.0, 19.0, 22.0, 27.0, 27.0, 45.0, 76.0, 104.0, 141.0, 239.0, 408.0, 801.0, 1970.0, 6436.0, 43362.0, 812947.0, 160779.0, 15013.0, 3360.0, 1269.0, 586.0, 291.0, 189.0, 143.0, 69.0, 49.0, 48.0, 28.0, 19.0, 15.0, 8.0, 6.0, 9.0, 4.0, 9.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4140625, -1.3695220947265625, -1.324981689453125, -1.2804412841796875, -1.23590087890625, -1.1913604736328125, -1.146820068359375, -1.1022796630859375, -1.0577392578125, -1.0131988525390625, -0.968658447265625, -0.9241180419921875, -0.87957763671875, -0.8350372314453125, -0.790496826171875, -0.7459564208984375, -0.701416015625, -0.6568756103515625, -0.612335205078125, -0.5677947998046875, -0.52325439453125, -0.4787139892578125, -0.434173583984375, -0.3896331787109375, -0.3450927734375, -0.3005523681640625, -0.256011962890625, -0.2114715576171875, -0.16693115234375, -0.1223907470703125, -0.077850341796875, -0.0333099365234375, 0.01123046875, 0.0557708740234375, 0.100311279296875, 0.1448516845703125, 0.18939208984375, 0.2339324951171875, 0.278472900390625, 0.3230133056640625, 0.3675537109375, 0.4120941162109375, 0.456634521484375, 0.5011749267578125, 0.54571533203125, 0.5902557373046875, 0.634796142578125, 0.6793365478515625, 0.723876953125, 0.7684173583984375, 0.812957763671875, 0.8574981689453125, 0.90203857421875, 0.9465789794921875, 0.991119384765625, 1.0356597900390625, 1.0802001953125, 1.1247406005859375, 1.169281005859375, 1.2138214111328125, 1.25836181640625, 1.3029022216796875, 1.347442626953125, 1.3919830322265625, 1.4365234375]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 6.0, 5.0, 8.0, 8.0, 15.0, 19.0, 18.0, 21.0, 25.0, 35.0, 45.0, 56.0, 64.0, 73.0, 75.0, 89.0, 81.0, 66.0, 55.0, 37.0, 43.0, 31.0, 30.0, 17.0, 17.0, 14.0, 9.0, 10.0, 6.0, 5.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.025390625, -0.9953994750976562, -0.9654083251953125, -0.9354171752929688, -0.905426025390625, -0.8754348754882812, -0.8454437255859375, -0.8154525756835938, -0.78546142578125, -0.7554702758789062, -0.7254791259765625, -0.6954879760742188, -0.665496826171875, -0.6355056762695312, -0.6055145263671875, -0.5755233764648438, -0.5455322265625, -0.5155410766601562, -0.4855499267578125, -0.45555877685546875, -0.425567626953125, -0.39557647705078125, -0.3655853271484375, -0.33559417724609375, -0.30560302734375, -0.27561187744140625, -0.2456207275390625, -0.21562957763671875, -0.185638427734375, -0.15564727783203125, -0.1256561279296875, -0.09566497802734375, -0.065673828125, -0.03568267822265625, -0.0056915283203125, 0.02429962158203125, 0.054290771484375, 0.08428192138671875, 0.1142730712890625, 0.14426422119140625, 0.17425537109375, 0.20424652099609375, 0.2342376708984375, 0.26422882080078125, 0.294219970703125, 0.32421112060546875, 0.3542022705078125, 0.38419342041015625, 0.4141845703125, 0.44417572021484375, 0.4741668701171875, 0.5041580200195312, 0.534149169921875, 0.5641403198242188, 0.5941314697265625, 0.6241226196289062, 0.65411376953125, 0.6841049194335938, 0.7140960693359375, 0.7440872192382812, 0.774078369140625, 0.8040695190429688, 0.8340606689453125, 0.8640518188476562, 0.89404296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 11.0, 22.0, 40.0, 94.0, 352.0, 208.0, 113.0, 73.0, 29.0, 17.0, 16.0, 14.0, 1.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.13120651245117, -41.9272346496582, -40.723262786865234, -39.519290924072266, -38.31532287597656, -37.111351013183594, -35.907379150390625, -34.703407287597656, -33.49943542480469, -32.29546356201172, -31.09149169921875, -29.887521743774414, -28.683549880981445, -27.479578018188477, -26.27560806274414, -25.071636199951172, -23.867664337158203, -22.663692474365234, -21.459720611572266, -20.25575065612793, -19.05177879333496, -17.847806930541992, -16.643836975097656, -15.439865112304688, -14.235893249511719, -13.03192138671875, -11.827950477600098, -10.623979568481445, -9.420007705688477, -8.216035842895508, -7.0120649337768555, -5.808094024658203, -4.6041259765625, -3.4001545906066895, -2.196183204650879, -0.9922118186950684, 0.2117595672607422, 1.4157309532165527, 2.6197023391723633, 3.8236732482910156, 5.027645111083984, 6.231616497039795, 7.4355878829956055, 8.639558792114258, 9.843530654907227, 11.047502517700195, 12.251473426818848, 13.4554443359375, 14.659416198730469, 15.863388061523438, 17.067359924316406, 18.271329879760742, 19.47530174255371, 20.67927360534668, 21.883243560791016, 23.087215423583984, 24.291187286376953, 25.495159149169922, 26.69913101196289, 27.903100967407227, 29.107072830200195, 30.311044692993164, 31.5150146484375, 32.71898651123047, 33.92295837402344]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 8.0, 6.0, 6.0, 13.0, 8.0, 15.0, 14.0, 15.0, 28.0, 18.0, 28.0, 34.0, 46.0, 29.0, 51.0, 77.0, 175.0, 112.0, 54.0, 30.0, 20.0, 26.0, 26.0, 31.0, 26.0, 17.0, 14.0, 12.0, 6.0, 13.0, 6.0, 5.0, 3.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-33.129966735839844, -32.083683013916016, -31.037399291992188, -29.991113662719727, -28.9448299407959, -27.89854621887207, -26.85226058959961, -25.80597686767578, -24.759693145751953, -23.713409423828125, -22.667125701904297, -21.620840072631836, -20.574556350708008, -19.52827262878418, -18.48198699951172, -17.43570327758789, -16.389419555664062, -15.343135833740234, -14.29685115814209, -13.250566482543945, -12.204282760620117, -11.157999038696289, -10.111714363098145, -9.0654296875, -8.019145965576172, -6.9728617668151855, -5.926577568054199, -4.880293369293213, -3.8340091705322266, -2.7877249717712402, -1.741440773010254, -0.6951565742492676, 0.35112762451171875, 1.397411823272705, 2.4436960220336914, 3.4899802207946777, 4.536264419555664, 5.58254861831665, 6.628832817077637, 7.675117015838623, 8.72140121459961, 9.767684936523438, 10.813969612121582, 11.860254287719727, 12.906538009643555, 13.952821731567383, 14.999106407165527, 16.045391082763672, 17.0916748046875, 18.137958526611328, 19.184242248535156, 20.230527877807617, 21.276811599731445, 22.323095321655273, 23.369380950927734, 24.415664672851562, 25.46194839477539, 26.50823211669922, 27.554515838623047, 28.600801467895508, 29.647085189819336, 30.693368911743164, 31.739654541015625, 32.78593826293945, 33.83222198486328]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 26.0, 25.0, 41.0, 51.0, 65.0, 88.0, 116.0, 146.0, 235.0, 366.0, 557.0, 897.0, 1623.0, 3174.0, 7105.0, 22003.0, 142993.0, 1277523.0, 2300143.0, 373849.0, 42865.0, 10699.0, 4436.0, 2108.0, 1134.0, 677.0, 422.0, 246.0, 176.0, 141.0, 90.0, 54.0, 53.0, 43.0, 34.0, 22.0, 10.0, 10.0, 9.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37109375, -3.259490966796875, -3.14788818359375, -3.036285400390625, -2.9246826171875, -2.813079833984375, -2.70147705078125, -2.589874267578125, -2.478271484375, -2.366668701171875, -2.25506591796875, -2.143463134765625, -2.0318603515625, -1.920257568359375, -1.80865478515625, -1.697052001953125, -1.58544921875, -1.473846435546875, -1.36224365234375, -1.250640869140625, -1.1390380859375, -1.027435302734375, -0.91583251953125, -0.804229736328125, -0.692626953125, -0.581024169921875, -0.46942138671875, -0.357818603515625, -0.2462158203125, -0.134613037109375, -0.02301025390625, 0.088592529296875, 0.2001953125, 0.311798095703125, 0.42340087890625, 0.535003662109375, 0.6466064453125, 0.758209228515625, 0.86981201171875, 0.981414794921875, 1.093017578125, 1.204620361328125, 1.31622314453125, 1.427825927734375, 1.5394287109375, 1.651031494140625, 1.76263427734375, 1.874237060546875, 1.98583984375, 2.097442626953125, 2.20904541015625, 2.320648193359375, 2.4322509765625, 2.543853759765625, 2.65545654296875, 2.767059326171875, 2.878662109375, 2.990264892578125, 3.10186767578125, 3.213470458984375, 3.3250732421875, 3.436676025390625, 3.54827880859375, 3.659881591796875, 3.771484375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 5.0, 7.0, 15.0, 15.0, 25.0, 28.0, 30.0, 31.0, 26.0, 36.0, 39.0, 40.0, 53.0, 47.0, 59.0, 59.0, 51.0, 47.0, 47.0, 54.0, 53.0, 35.0, 27.0, 26.0, 15.0, 16.0, 32.0, 16.0, 16.0, 11.0, 10.0, 4.0, 4.0, 4.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.33984375, -2.269866943359375, -2.19989013671875, -2.129913330078125, -2.0599365234375, -1.989959716796875, -1.91998291015625, -1.850006103515625, -1.780029296875, -1.710052490234375, -1.64007568359375, -1.570098876953125, -1.5001220703125, -1.430145263671875, -1.36016845703125, -1.290191650390625, -1.22021484375, -1.150238037109375, -1.08026123046875, -1.010284423828125, -0.9403076171875, -0.870330810546875, -0.80035400390625, -0.730377197265625, -0.660400390625, -0.590423583984375, -0.52044677734375, -0.450469970703125, -0.3804931640625, -0.310516357421875, -0.24053955078125, -0.170562744140625, -0.1005859375, -0.030609130859375, 0.03936767578125, 0.109344482421875, 0.1793212890625, 0.249298095703125, 0.31927490234375, 0.389251708984375, 0.459228515625, 0.529205322265625, 0.59918212890625, 0.669158935546875, 0.7391357421875, 0.809112548828125, 0.87908935546875, 0.949066162109375, 1.01904296875, 1.089019775390625, 1.15899658203125, 1.228973388671875, 1.2989501953125, 1.368927001953125, 1.43890380859375, 1.508880615234375, 1.578857421875, 1.648834228515625, 1.71881103515625, 1.788787841796875, 1.8587646484375, 1.928741455078125, 1.99871826171875, 2.068695068359375, 2.138671875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 10.0, 14.0, 12.0, 21.0, 27.0, 46.0, 96.0, 146.0, 249.0, 397.0, 917.0, 2339.0, 11238.0, 1075574.0, 3086019.0, 13149.0, 2251.0, 815.0, 358.0, 210.0, 129.0, 88.0, 43.0, 36.0, 24.0, 21.0, 8.0, 8.0, 7.0, 12.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2421875, -10.8680419921875, -10.493896484375, -10.1197509765625, -9.74560546875, -9.3714599609375, -8.997314453125, -8.6231689453125, -8.2490234375, -7.8748779296875, -7.500732421875, -7.1265869140625, -6.75244140625, -6.3782958984375, -6.004150390625, -5.6300048828125, -5.255859375, -4.8817138671875, -4.507568359375, -4.1334228515625, -3.75927734375, -3.3851318359375, -3.010986328125, -2.6368408203125, -2.2626953125, -1.8885498046875, -1.514404296875, -1.1402587890625, -0.76611328125, -0.3919677734375, -0.017822265625, 0.3563232421875, 0.73046875, 1.1046142578125, 1.478759765625, 1.8529052734375, 2.22705078125, 2.6011962890625, 2.975341796875, 3.3494873046875, 3.7236328125, 4.0977783203125, 4.471923828125, 4.8460693359375, 5.22021484375, 5.5943603515625, 5.968505859375, 6.3426513671875, 6.716796875, 7.0909423828125, 7.465087890625, 7.8392333984375, 8.21337890625, 8.5875244140625, 8.961669921875, 9.3358154296875, 9.7099609375, 10.0841064453125, 10.458251953125, 10.8323974609375, 11.20654296875, 11.5806884765625, 11.954833984375, 12.3289794921875, 12.703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 8.0, 4.0, 6.0, 9.0, 17.0, 28.0, 31.0, 38.0, 55.0, 78.0, 92.0, 154.0, 266.0, 479.0, 729.0, 729.0, 530.0, 307.0, 182.0, 98.0, 79.0, 50.0, 35.0, 30.0, 9.0, 5.0, 5.0, 7.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-7.078125, -6.87115478515625, -6.6641845703125, -6.45721435546875, -6.250244140625, -6.04327392578125, -5.8363037109375, -5.62933349609375, -5.42236328125, -5.21539306640625, -5.0084228515625, -4.80145263671875, -4.594482421875, -4.38751220703125, -4.1805419921875, -3.97357177734375, -3.7666015625, -3.55963134765625, -3.3526611328125, -3.14569091796875, -2.938720703125, -2.73175048828125, -2.5247802734375, -2.31781005859375, -2.11083984375, -1.90386962890625, -1.6968994140625, -1.48992919921875, -1.282958984375, -1.07598876953125, -0.8690185546875, -0.66204833984375, -0.455078125, -0.24810791015625, -0.0411376953125, 0.16583251953125, 0.372802734375, 0.57977294921875, 0.7867431640625, 0.99371337890625, 1.20068359375, 1.40765380859375, 1.6146240234375, 1.82159423828125, 2.028564453125, 2.23553466796875, 2.4425048828125, 2.64947509765625, 2.8564453125, 3.06341552734375, 3.2703857421875, 3.47735595703125, 3.684326171875, 3.89129638671875, 4.0982666015625, 4.30523681640625, 4.51220703125, 4.71917724609375, 4.9261474609375, 5.13311767578125, 5.340087890625, 5.54705810546875, 5.7540283203125, 5.96099853515625, 6.16796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 13.0, 35.0, 54.0, 111.0, 201.0, 255.0, 179.0, 77.0, 41.0, 14.0, 6.0, 4.0, 7.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-134.59930419921875, -131.98284912109375, -129.3664093017578, -126.74996185302734, -124.13351440429688, -121.5170669555664, -118.90061950683594, -116.28417205810547, -113.667724609375, -111.05127716064453, -108.43482971191406, -105.8183822631836, -103.20193481445312, -100.58548736572266, -97.96903991699219, -95.35259246826172, -92.73614501953125, -90.11969757080078, -87.50325012207031, -84.88680267333984, -82.27035522460938, -79.6539077758789, -77.03746032714844, -74.42101287841797, -71.80455780029297, -69.1881103515625, -66.57166290283203, -63.95521545410156, -61.338768005371094, -58.722320556640625, -56.105873107910156, -53.48942565917969, -50.87297821044922, -48.25653076171875, -45.64008331298828, -43.02363586425781, -40.407188415527344, -37.790740966796875, -35.174293518066406, -32.55784606933594, -29.941396713256836, -27.324949264526367, -24.7085018157959, -22.092052459716797, -19.475605010986328, -16.85915756225586, -14.24271011352539, -11.626262664794922, -9.009815216064453, -6.393367767333984, -3.7769198417663574, -1.1604719161987305, 1.4559755325317383, 4.072422981262207, 6.688871383666992, 9.305318832397461, 11.92176628112793, 14.538213729858398, 17.154661178588867, 19.77111053466797, 22.387557983398438, 25.004005432128906, 27.620452880859375, 30.236900329589844, 32.85334777832031]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 6.0, 6.0, 9.0, 10.0, 19.0, 14.0, 25.0, 27.0, 30.0, 31.0, 42.0, 49.0, 42.0, 45.0, 63.0, 75.0, 57.0, 57.0, 47.0, 46.0, 53.0, 38.0, 43.0, 34.0, 23.0, 23.0, 14.0, 15.0, 23.0, 13.0, 6.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.91107177734375, -30.740110397338867, -29.569149017333984, -28.398189544677734, -27.22722816467285, -26.05626678466797, -24.88530731201172, -23.714345932006836, -22.543384552001953, -21.37242317199707, -20.201461791992188, -19.030502319335938, -17.859540939331055, -16.688579559326172, -15.517619132995605, -14.346658706665039, -13.175697326660156, -12.004735946655273, -10.833775520324707, -9.66281509399414, -8.491853713989258, -7.320892810821533, -6.149931907653809, -4.978971481323242, -3.8080101013183594, -2.6370491981506348, -1.4660882949829102, -0.29512739181518555, 0.8758335113525391, 2.0467944145202637, 3.2177553176879883, 4.388715744018555, 5.559680938720703, 6.730641841888428, 7.901602745056152, 9.072563171386719, 10.243524551391602, 11.414485931396484, 12.58544635772705, 13.756406784057617, 14.9273681640625, 16.098329544067383, 17.269290924072266, 18.440250396728516, 19.6112117767334, 20.78217315673828, 21.95313262939453, 23.124094009399414, 24.295055389404297, 25.46601676940918, 26.636978149414062, 27.807937622070312, 28.978899002075195, 30.149860382080078, 31.320819854736328, 32.491783142089844, 33.662742614746094, 34.833702087402344, 36.00466537475586, 37.17562484741211, 38.346588134765625, 39.517547607421875, 40.688507080078125, 41.859466552734375, 43.03042984008789]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 6.0, 10.0, 10.0, 11.0, 21.0, 24.0, 33.0, 34.0, 87.0, 130.0, 247.0, 444.0, 864.0, 1677.0, 3853.0, 8613.0, 21944.0, 75806.0, 629409.0, 235798.0, 43270.0, 14577.0, 6162.0, 2736.0, 1261.0, 622.0, 353.0, 201.0, 87.0, 81.0, 56.0, 44.0, 24.0, 17.0, 10.0, 8.0, 7.0, 6.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-3.71875, -3.6148681640625, -3.510986328125, -3.4071044921875, -3.30322265625, -3.1993408203125, -3.095458984375, -2.9915771484375, -2.8876953125, -2.7838134765625, -2.679931640625, -2.5760498046875, -2.47216796875, -2.3682861328125, -2.264404296875, -2.1605224609375, -2.056640625, -1.9527587890625, -1.848876953125, -1.7449951171875, -1.64111328125, -1.5372314453125, -1.433349609375, -1.3294677734375, -1.2255859375, -1.1217041015625, -1.017822265625, -0.9139404296875, -0.81005859375, -0.7061767578125, -0.602294921875, -0.4984130859375, -0.39453125, -0.2906494140625, -0.186767578125, -0.0828857421875, 0.02099609375, 0.1248779296875, 0.228759765625, 0.3326416015625, 0.4365234375, 0.5404052734375, 0.644287109375, 0.7481689453125, 0.85205078125, 0.9559326171875, 1.059814453125, 1.1636962890625, 1.267578125, 1.3714599609375, 1.475341796875, 1.5792236328125, 1.68310546875, 1.7869873046875, 1.890869140625, 1.9947509765625, 2.0986328125, 2.2025146484375, 2.306396484375, 2.4102783203125, 2.51416015625, 2.6180419921875, 2.721923828125, 2.8258056640625, 2.9296875]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 6.0, 10.0, 14.0, 24.0, 22.0, 37.0, 24.0, 44.0, 53.0, 75.0, 75.0, 80.0, 76.0, 59.0, 79.0, 60.0, 67.0, 47.0, 45.0, 31.0, 23.0, 15.0, 14.0, 12.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.072265625, -2.957305908203125, -2.84234619140625, -2.727386474609375, -2.6124267578125, -2.497467041015625, -2.38250732421875, -2.267547607421875, -2.152587890625, -2.037628173828125, -1.92266845703125, -1.807708740234375, -1.6927490234375, -1.577789306640625, -1.46282958984375, -1.347869873046875, -1.23291015625, -1.117950439453125, -1.00299072265625, -0.888031005859375, -0.7730712890625, -0.658111572265625, -0.54315185546875, -0.428192138671875, -0.313232421875, -0.198272705078125, -0.08331298828125, 0.031646728515625, 0.1466064453125, 0.261566162109375, 0.37652587890625, 0.491485595703125, 0.6064453125, 0.721405029296875, 0.83636474609375, 0.951324462890625, 1.0662841796875, 1.181243896484375, 1.29620361328125, 1.411163330078125, 1.526123046875, 1.641082763671875, 1.75604248046875, 1.871002197265625, 1.9859619140625, 2.100921630859375, 2.21588134765625, 2.330841064453125, 2.44580078125, 2.560760498046875, 2.67572021484375, 2.790679931640625, 2.9056396484375, 3.020599365234375, 3.13555908203125, 3.250518798828125, 3.365478515625, 3.480438232421875, 3.59539794921875, 3.710357666015625, 3.8253173828125, 3.940277099609375, 4.05523681640625, 4.170196533203125, 4.28515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 3.0, 10.0, 17.0, 15.0, 24.0, 38.0, 55.0, 79.0, 133.0, 212.0, 365.0, 777.0, 2146.0, 12351.0, 885701.0, 136510.0, 7125.0, 1572.0, 620.0, 306.0, 163.0, 130.0, 73.0, 37.0, 29.0, 10.0, 22.0, 6.0, 12.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.48828125, -7.2672119140625, -7.046142578125, -6.8250732421875, -6.60400390625, -6.3829345703125, -6.161865234375, -5.9407958984375, -5.7197265625, -5.4986572265625, -5.277587890625, -5.0565185546875, -4.83544921875, -4.6143798828125, -4.393310546875, -4.1722412109375, -3.951171875, -3.7301025390625, -3.509033203125, -3.2879638671875, -3.06689453125, -2.8458251953125, -2.624755859375, -2.4036865234375, -2.1826171875, -1.9615478515625, -1.740478515625, -1.5194091796875, -1.29833984375, -1.0772705078125, -0.856201171875, -0.6351318359375, -0.4140625, -0.1929931640625, 0.028076171875, 0.2491455078125, 0.47021484375, 0.6912841796875, 0.912353515625, 1.1334228515625, 1.3544921875, 1.5755615234375, 1.796630859375, 2.0177001953125, 2.23876953125, 2.4598388671875, 2.680908203125, 2.9019775390625, 3.123046875, 3.3441162109375, 3.565185546875, 3.7862548828125, 4.00732421875, 4.2283935546875, 4.449462890625, 4.6705322265625, 4.8916015625, 5.1126708984375, 5.333740234375, 5.5548095703125, 5.77587890625, 5.9969482421875, 6.218017578125, 6.4390869140625, 6.66015625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 6.0, 14.0, 20.0, 18.0, 14.0, 36.0, 33.0, 48.0, 51.0, 63.0, 94.0, 96.0, 101.0, 84.0, 63.0, 47.0, 45.0, 48.0, 27.0, 23.0, 22.0, 10.0, 10.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.40625, -13.983642578125, -13.56103515625, -13.138427734375, -12.7158203125, -12.293212890625, -11.87060546875, -11.447998046875, -11.025390625, -10.602783203125, -10.18017578125, -9.757568359375, -9.3349609375, -8.912353515625, -8.48974609375, -8.067138671875, -7.64453125, -7.221923828125, -6.79931640625, -6.376708984375, -5.9541015625, -5.531494140625, -5.10888671875, -4.686279296875, -4.263671875, -3.841064453125, -3.41845703125, -2.995849609375, -2.5732421875, -2.150634765625, -1.72802734375, -1.305419921875, -0.8828125, -0.460205078125, -0.03759765625, 0.385009765625, 0.8076171875, 1.230224609375, 1.65283203125, 2.075439453125, 2.498046875, 2.920654296875, 3.34326171875, 3.765869140625, 4.1884765625, 4.611083984375, 5.03369140625, 5.456298828125, 5.87890625, 6.301513671875, 6.72412109375, 7.146728515625, 7.5693359375, 7.991943359375, 8.41455078125, 8.837158203125, 9.259765625, 9.682373046875, 10.10498046875, 10.527587890625, 10.9501953125, 11.372802734375, 11.79541015625, 12.218017578125, 12.640625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 4.0, 2.0, 7.0, 8.0, 15.0, 16.0, 24.0, 30.0, 58.0, 83.0, 116.0, 211.0, 379.0, 814.0, 2289.0, 8471.0, 69601.0, 927399.0, 30512.0, 5402.0, 1621.0, 644.0, 327.0, 185.0, 111.0, 68.0, 56.0, 25.0, 22.0, 15.0, 14.0, 6.0, 9.0, 7.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.1396484375, -1.1082916259765625, -1.076934814453125, -1.0455780029296875, -1.01422119140625, -0.9828643798828125, -0.951507568359375, -0.9201507568359375, -0.8887939453125, -0.8574371337890625, -0.826080322265625, -0.7947235107421875, -0.76336669921875, -0.7320098876953125, -0.700653076171875, -0.6692962646484375, -0.637939453125, -0.6065826416015625, -0.575225830078125, -0.5438690185546875, -0.51251220703125, -0.4811553955078125, -0.449798583984375, -0.4184417724609375, -0.3870849609375, -0.3557281494140625, -0.324371337890625, -0.2930145263671875, -0.26165771484375, -0.2303009033203125, -0.198944091796875, -0.1675872802734375, -0.13623046875, -0.1048736572265625, -0.073516845703125, -0.0421600341796875, -0.01080322265625, 0.0205535888671875, 0.051910400390625, 0.0832672119140625, 0.1146240234375, 0.1459808349609375, 0.177337646484375, 0.2086944580078125, 0.24005126953125, 0.2714080810546875, 0.302764892578125, 0.3341217041015625, 0.365478515625, 0.3968353271484375, 0.428192138671875, 0.4595489501953125, 0.49090576171875, 0.5222625732421875, 0.553619384765625, 0.5849761962890625, 0.6163330078125, 0.6476898193359375, 0.679046630859375, 0.7104034423828125, 0.74176025390625, 0.7731170654296875, 0.804473876953125, 0.8358306884765625, 0.8671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 7.0, 8.0, 13.0, 13.0, 28.0, 31.0, 41.0, 73.0, 107.0, 180.0, 139.0, 109.0, 65.0, 38.0, 31.0, 18.0, 21.0, 14.0, 7.0, 8.0, 3.0, 1.0, 5.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 3.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020122528076171875, -0.0001951083540916443, -0.00018899142742156982, -0.00018287450075149536, -0.0001767575740814209, -0.00017064064741134644, -0.00016452372074127197, -0.0001584067940711975, -0.00015228986740112305, -0.00014617294073104858, -0.00014005601406097412, -0.00013393908739089966, -0.0001278221607208252, -0.00012170523405075073, -0.00011558830738067627, -0.0001094713807106018, -0.00010335445404052734, -9.723752737045288e-05, -9.112060070037842e-05, -8.500367403030396e-05, -7.888674736022949e-05, -7.276982069015503e-05, -6.665289402008057e-05, -6.0535967350006104e-05, -5.441904067993164e-05, -4.830211400985718e-05, -4.2185187339782715e-05, -3.606826066970825e-05, -2.995133399963379e-05, -2.3834407329559326e-05, -1.7717480659484863e-05, -1.16005539894104e-05, -5.4836273193359375e-06, 6.332993507385254e-07, 6.750226020812988e-06, 1.2867152690887451e-05, 1.8984079360961914e-05, 2.5101006031036377e-05, 3.121793270111084e-05, 3.73348593711853e-05, 4.3451786041259766e-05, 4.956871271133423e-05, 5.568563938140869e-05, 6.180256605148315e-05, 6.791949272155762e-05, 7.403641939163208e-05, 8.015334606170654e-05, 8.6270272731781e-05, 9.238719940185547e-05, 9.850412607192993e-05, 0.0001046210527420044, 0.00011073797941207886, 0.00011685490608215332, 0.00012297183275222778, 0.00012908875942230225, 0.0001352056860923767, 0.00014132261276245117, 0.00014743953943252563, 0.0001535564661026001, 0.00015967339277267456, 0.00016579031944274902, 0.00017190724611282349, 0.00017802417278289795, 0.0001841410994529724, 0.00019025802612304688]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 13.0, 11.0, 18.0, 20.0, 27.0, 63.0, 81.0, 156.0, 388.0, 1019.0, 3483.0, 19167.0, 897338.0, 113720.0, 9529.0, 2098.0, 683.0, 322.0, 152.0, 83.0, 38.0, 38.0, 17.0, 17.0, 11.0, 12.0, 5.0, 9.0, 7.0, 5.0, 5.0, 1.0, 4.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.779296875, -0.7435760498046875, -0.707855224609375, -0.6721343994140625, -0.63641357421875, -0.6006927490234375, -0.564971923828125, -0.5292510986328125, -0.4935302734375, -0.4578094482421875, -0.422088623046875, -0.3863677978515625, -0.35064697265625, -0.3149261474609375, -0.279205322265625, -0.2434844970703125, -0.207763671875, -0.1720428466796875, -0.136322021484375, -0.1006011962890625, -0.06488037109375, -0.0291595458984375, 0.006561279296875, 0.0422821044921875, 0.0780029296875, 0.1137237548828125, 0.149444580078125, 0.1851654052734375, 0.22088623046875, 0.2566070556640625, 0.292327880859375, 0.3280487060546875, 0.36376953125, 0.3994903564453125, 0.435211181640625, 0.4709320068359375, 0.50665283203125, 0.5423736572265625, 0.578094482421875, 0.6138153076171875, 0.6495361328125, 0.6852569580078125, 0.720977783203125, 0.7566986083984375, 0.79241943359375, 0.8281402587890625, 0.863861083984375, 0.8995819091796875, 0.935302734375, 0.9710235595703125, 1.006744384765625, 1.0424652099609375, 1.07818603515625, 1.1139068603515625, 1.149627685546875, 1.1853485107421875, 1.2210693359375, 1.2567901611328125, 1.292510986328125, 1.3282318115234375, 1.36395263671875, 1.3996734619140625, 1.435394287109375, 1.4711151123046875, 1.5068359375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 2.0, 4.0, 15.0, 15.0, 17.0, 22.0, 42.0, 36.0, 72.0, 110.0, 181.0, 145.0, 108.0, 67.0, 41.0, 28.0, 23.0, 20.0, 17.0, 7.0, 10.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.685546875, -0.65277099609375, -0.6199951171875, -0.58721923828125, -0.554443359375, -0.52166748046875, -0.4888916015625, -0.45611572265625, -0.42333984375, -0.39056396484375, -0.3577880859375, -0.32501220703125, -0.292236328125, -0.25946044921875, -0.2266845703125, -0.19390869140625, -0.1611328125, -0.12835693359375, -0.0955810546875, -0.06280517578125, -0.030029296875, 0.00274658203125, 0.0355224609375, 0.06829833984375, 0.10107421875, 0.13385009765625, 0.1666259765625, 0.19940185546875, 0.232177734375, 0.26495361328125, 0.2977294921875, 0.33050537109375, 0.36328125, 0.39605712890625, 0.4288330078125, 0.46160888671875, 0.494384765625, 0.52716064453125, 0.5599365234375, 0.59271240234375, 0.62548828125, 0.65826416015625, 0.6910400390625, 0.72381591796875, 0.756591796875, 0.78936767578125, 0.8221435546875, 0.85491943359375, 0.8876953125, 0.92047119140625, 0.9532470703125, 0.98602294921875, 1.018798828125, 1.05157470703125, 1.0843505859375, 1.11712646484375, 1.14990234375, 1.18267822265625, 1.2154541015625, 1.24822998046875, 1.281005859375, 1.31378173828125, 1.3465576171875, 1.37933349609375, 1.412109375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 14.0, 37.0, 83.0, 631.0, 163.0, 41.0, 22.0, 9.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.5894775390625, -42.42793273925781, -40.26639175415039, -38.10485076904297, -35.94330596923828, -33.781761169433594, -31.620220184326172, -29.458677291870117, -27.297134399414062, -25.135591506958008, -22.974048614501953, -20.8125057220459, -18.650962829589844, -16.48941993713379, -14.327877044677734, -12.16633415222168, -10.004791259765625, -7.84324836730957, -5.681705474853516, -3.520162582397461, -1.3586196899414062, 0.8029232025146484, 2.964466094970703, 5.126008987426758, 7.2875518798828125, 9.449094772338867, 11.610637664794922, 13.772180557250977, 15.933723449707031, 18.095266342163086, 20.25680923461914, 22.418352127075195, 24.57988739013672, 26.741430282592773, 28.902973175048828, 31.064516067504883, 33.22605895996094, 35.387603759765625, 37.54914474487305, 39.71068572998047, 41.872230529785156, 44.033775329589844, 46.195316314697266, 48.35685729980469, 50.518402099609375, 52.67994689941406, 54.841487884521484, 57.003028869628906, 59.164573669433594, 61.32611846923828, 63.4876594543457, 65.64920043945312, 67.81074523925781, 69.9722900390625, 72.13383483886719, 74.29537200927734, 76.45691680908203, 78.61846160888672, 80.77999877929688, 82.94154357910156, 85.10308837890625, 87.26463317871094, 89.42617797851562, 91.58771514892578, 93.74925994873047]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 3.0, 7.0, 7.0, 10.0, 11.0, 15.0, 14.0, 8.0, 17.0, 21.0, 26.0, 22.0, 22.0, 24.0, 30.0, 96.0, 323.0, 92.0, 38.0, 28.0, 34.0, 19.0, 25.0, 15.0, 17.0, 18.0, 17.0, 3.0, 8.0, 6.0, 8.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.01758575439453, -29.12090301513672, -28.224220275878906, -27.32753562927246, -26.43085289001465, -25.534170150756836, -24.63748550415039, -23.740802764892578, -22.844120025634766, -21.947437286376953, -21.05075454711914, -20.154069900512695, -19.257387161254883, -18.36070442199707, -17.464019775390625, -16.567337036132812, -15.670654296875, -14.773971557617188, -13.877287864685059, -12.98060417175293, -12.083921432495117, -11.187238693237305, -10.290555000305176, -9.393871307373047, -8.497188568115234, -7.600505352020264, -6.703822135925293, -5.807138919830322, -4.910455703735352, -4.013772487640381, -3.11708927154541, -2.2204060554504395, -1.3237247467041016, -0.42704153060913086, 0.46964168548583984, 1.3663249015808105, 2.2630081176757812, 3.159691333770752, 4.056374549865723, 4.953057765960693, 5.849740982055664, 6.746424198150635, 7.6431074142456055, 8.539791107177734, 9.436473846435547, 10.33315658569336, 11.229840278625488, 12.126523971557617, 13.02320671081543, 13.919889450073242, 14.816573143005371, 15.7132568359375, 16.609939575195312, 17.506622314453125, 18.403305053710938, 19.299989700317383, 20.196672439575195, 21.093355178833008, 21.990039825439453, 22.886722564697266, 23.783405303955078, 24.68008804321289, 25.576770782470703, 26.47345542907715, 27.37013816833496]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 8.0, 4.0, 10.0, 8.0, 6.0, 12.0, 8.0, 15.0, 16.0, 15.0, 16.0, 28.0, 26.0, 34.0, 25.0, 38.0, 111.0, 229.0, 95.0, 48.0, 28.0, 32.0, 30.0, 19.0, 21.0, 20.0, 13.0, 16.0, 7.0, 9.0, 14.0, 11.0, 3.0, 6.0, 6.0, 2.0, 8.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.05859375, -1.994842529296875, -1.93109130859375, -1.867340087890625, -1.8035888671875, -1.739837646484375, -1.67608642578125, -1.612335205078125, -1.548583984375, -1.484832763671875, -1.42108154296875, -1.357330322265625, -1.2935791015625, -1.229827880859375, -1.16607666015625, -1.102325439453125, -1.03857421875, -0.974822998046875, -0.91107177734375, -0.847320556640625, -0.7835693359375, -0.719818115234375, -0.65606689453125, -0.592315673828125, -0.528564453125, -0.464813232421875, -0.40106201171875, -0.337310791015625, -0.2735595703125, -0.209808349609375, -0.14605712890625, -0.082305908203125, -0.0185546875, 0.045196533203125, 0.10894775390625, 0.172698974609375, 0.2364501953125, 0.300201416015625, 0.36395263671875, 0.427703857421875, 0.491455078125, 0.555206298828125, 0.61895751953125, 0.682708740234375, 0.7464599609375, 0.810211181640625, 0.87396240234375, 0.937713623046875, 1.00146484375, 1.065216064453125, 1.12896728515625, 1.192718505859375, 1.2564697265625, 1.320220947265625, 1.38397216796875, 1.447723388671875, 1.511474609375, 1.575225830078125, 1.63897705078125, 1.702728271484375, 1.7664794921875, 1.830230712890625, 1.89398193359375, 1.957733154296875, 2.021484375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 1.0, 4.0, 1.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 0.0, 1.0, 0.0, 4.0, 6.0, 9.0, 6.0, 4.0, 10.0, 29.0, 15.0, 31.0, 34.0, 52.0, 72.0, 152.0, 287.0, 766.0, 2809.0, 24296.0, 8348573.0, 8645.0, 1647.0, 513.0, 200.0, 138.0, 77.0, 50.0, 38.0, 19.0, 4.0, 12.0, 8.0, 3.0, 15.0, 1.0, 3.0, 8.0, 9.0, 3.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 3.0], "bins": [-25.266550064086914, -24.57072639465332, -23.874900817871094, -23.1790771484375, -22.483253479003906, -21.78742790222168, -21.091604232788086, -20.39577865600586, -19.699954986572266, -19.004131317138672, -18.308305740356445, -17.61248207092285, -16.916658401489258, -16.22083282470703, -15.525009155273438, -14.829184532165527, -14.133360862731934, -13.437536239624023, -12.74171257019043, -12.04588794708252, -11.35006332397461, -10.654239654541016, -9.958415031433105, -9.262590408325195, -8.566766738891602, -7.87094259262085, -7.1751179695129395, -6.4792938232421875, -5.783469200134277, -5.087645053863525, -4.391820907592773, -3.6959962844848633, -3.000171661376953, -2.304347276687622, -1.6085230112075806, -0.9126987457275391, -0.216874361038208, 0.47895002365112305, 1.174774169921875, 1.8705987930297852, 2.566422939300537, 3.262247323989868, 3.958071708679199, 4.653895854949951, 5.349720001220703, 6.045544624328613, 6.741368770599365, 7.437193393707275, 8.133017539978027, 8.828842163085938, 9.524665832519531, 10.220490455627441, 10.916315078735352, 11.612138748168945, 12.307963371276855, 13.003787994384766, 13.69961166381836, 14.39543628692627, 15.091259956359863, 15.787084579467773, 16.482908248901367, 17.178733825683594, 17.874557495117188, 18.57038116455078, 19.266206741333008]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 2.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 5.0, 2.0, 5.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.274808406829834, -6.750971794128418, -6.227134704589844, -5.7032976150512695, -5.1794610023498535, -4.6556243896484375, -4.131787300109863, -3.607950448989868, -3.084113597869873, -2.560276746749878, -2.036439895629883, -1.5126030445098877, -0.9887661933898926, -0.46492934226989746, 0.058907508850097656, 0.5827443599700928, 1.106581211090088, 1.630418062210083, 2.154254913330078, 2.6780917644500732, 3.2019286155700684, 3.7257654666900635, 4.249602317810059, 4.773439407348633, 5.297276020050049, 5.821112632751465, 6.344949722290039, 6.868786811828613, 7.392623424530029, 7.916460037231445, 8.44029712677002, 8.964134216308594, 9.487972259521484, 10.011809349060059, 10.535646438598633, 11.05948257446289, 11.583319664001465, 12.107156753540039, 12.630992889404297, 13.154829978942871, 13.678667068481445, 14.20250415802002, 14.726341247558594, 15.250177383422852, 15.774014472961426, 16.2978515625, 16.821687698364258, 17.34552574157715, 17.869361877441406, 18.393198013305664, 18.917036056518555, 19.440872192382812, 19.964710235595703, 20.48854637145996, 21.01238250732422, 21.53622055053711, 22.060056686401367, 22.583892822265625, 23.107730865478516, 23.631567001342773, 24.15540313720703, 24.679241180419922, 25.20307731628418, 25.72691535949707, 26.250751495361328]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 7.0, 6.0, 8.0, 12.0, 21.0, 39.0, 68.0, 105.0, 201.0, 438.0, 1033.0, 3259.0, 14337.0, 114720.0, 335215.0, 44581.0, 7056.0, 1803.0, 675.0, 291.0, 156.0, 85.0, 51.0, 38.0, 18.0, 21.0, 6.0, 8.0, 1.0, 6.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.078125, -22.128173828125, -21.17822265625, -20.228271484375, -19.2783203125, -18.328369140625, -17.37841796875, -16.428466796875, -15.478515625, -14.528564453125, -13.57861328125, -12.628662109375, -11.6787109375, -10.728759765625, -9.77880859375, -8.828857421875, -7.87890625, -6.928955078125, -5.97900390625, -5.029052734375, -4.0791015625, -3.129150390625, -2.17919921875, -1.229248046875, -0.279296875, 0.670654296875, 1.62060546875, 2.570556640625, 3.5205078125, 4.470458984375, 5.42041015625, 6.370361328125, 7.3203125, 8.270263671875, 9.22021484375, 10.170166015625, 11.1201171875, 12.070068359375, 13.02001953125, 13.969970703125, 14.919921875, 15.869873046875, 16.81982421875, 17.769775390625, 18.7197265625, 19.669677734375, 20.61962890625, 21.569580078125, 22.51953125, 23.469482421875, 24.41943359375, 25.369384765625, 26.3193359375, 27.269287109375, 28.21923828125, 29.169189453125, 30.119140625, 31.069091796875, 32.01904296875, 32.968994140625, 33.9189453125, 34.868896484375, 35.81884765625, 36.768798828125, 37.71875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 4.0, 6.0, 13.0, 13.0, 17.0, 17.0, 22.0, 23.0, 27.0, 35.0, 54.0, 55.0, 63.0, 71.0, 62.0, 83.0, 64.0, 54.0, 59.0, 53.0, 44.0, 37.0, 29.0, 20.0, 22.0, 7.0, 13.0, 10.0, 3.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.060546875, -1.975677490234375, -1.89080810546875, -1.805938720703125, -1.7210693359375, -1.636199951171875, -1.55133056640625, -1.466461181640625, -1.381591796875, -1.296722412109375, -1.21185302734375, -1.126983642578125, -1.0421142578125, -0.957244873046875, -0.87237548828125, -0.787506103515625, -0.70263671875, -0.617767333984375, -0.53289794921875, -0.448028564453125, -0.3631591796875, -0.278289794921875, -0.19342041015625, -0.108551025390625, -0.023681640625, 0.061187744140625, 0.14605712890625, 0.230926513671875, 0.3157958984375, 0.400665283203125, 0.48553466796875, 0.570404052734375, 0.6552734375, 0.740142822265625, 0.82501220703125, 0.909881591796875, 0.9947509765625, 1.079620361328125, 1.16448974609375, 1.249359130859375, 1.334228515625, 1.419097900390625, 1.50396728515625, 1.588836669921875, 1.6737060546875, 1.758575439453125, 1.84344482421875, 1.928314208984375, 2.01318359375, 2.098052978515625, 2.18292236328125, 2.267791748046875, 2.3526611328125, 2.437530517578125, 2.52239990234375, 2.607269287109375, 2.692138671875, 2.777008056640625, 2.86187744140625, 2.946746826171875, 3.0316162109375, 3.116485595703125, 3.20135498046875, 3.286224365234375, 3.37109375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 5.0, 11.0, 24.0, 69.0, 119.0, 118.0, 52.0, 28.0, 17.0, 11.0, 5.0, 6.0, 5.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-36.02106857299805, -35.294490814208984, -34.567909240722656, -33.841331481933594, -33.11475372314453, -32.3881721496582, -31.66159439086914, -30.935014724731445, -30.20843505859375, -29.481855392456055, -28.755277633666992, -28.028697967529297, -27.3021183013916, -26.575538635253906, -25.848960876464844, -25.12238121032715, -24.395803451538086, -23.66922378540039, -22.942646026611328, -22.216066360473633, -21.489486694335938, -20.762908935546875, -20.03632926940918, -19.309749603271484, -18.583171844482422, -17.856592178344727, -17.130014419555664, -16.40343475341797, -15.676855087280273, -14.950276374816895, -14.223697662353516, -13.49711799621582, -12.770537376403809, -12.04395866394043, -11.317378997802734, -10.590800285339355, -9.864221572875977, -9.137641906738281, -8.411063194274902, -7.684484004974365, -6.957904815673828, -6.231325626373291, -5.504746437072754, -4.778167724609375, -4.051588535308838, -3.325009346008301, -2.598430633544922, -1.8718514442443848, -1.1452722549438477, -0.4186931848526001, 0.30788588523864746, 1.0344648361206055, 1.7610440254211426, 2.4876232147216797, 3.2142019271850586, 3.9407811164855957, 4.667360305786133, 5.39393949508667, 6.120518684387207, 6.847097396850586, 7.573676586151123, 8.30025577545166, 9.026834487915039, 9.753414154052734, 10.479992866516113]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 6.0, 12.0, 13.0, 38.0, 73.0, 116.0, 75.0, 48.0, 30.0, 14.0, 9.0, 11.0, 1.0, 7.0, 3.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.470895767211914, -10.993066787719727, -10.515237808227539, -10.037407875061035, -9.559578895568848, -9.08174991607666, -8.603920936584473, -8.126091003417969, -7.648262023925781, -7.170433044433594, -6.692603588104248, -6.2147746086120605, -5.736945152282715, -5.259116172790527, -4.78128719329834, -4.303457736968994, -3.8256287574768066, -3.34779953956604, -2.8699703216552734, -2.392141342163086, -1.9143120050430298, -1.4364829063415527, -0.9586536884307861, -0.48082447052001953, -0.0029952526092529297, 0.4748339354991913, 0.9526631236076355, 1.4304922819137573, 1.908321499824524, 2.386150598526001, 2.8639798164367676, 3.341809034347534, 3.819638252258301, 4.297467231750488, 4.775296688079834, 5.2531256675720215, 5.730955123901367, 6.208784103393555, 6.686613082885742, 7.164442539215088, 7.642271995544434, 8.120100975036621, 8.597929954528809, 9.075759887695312, 9.5535888671875, 10.031417846679688, 10.509246826171875, 10.987075805664062, 11.46490478515625, 11.942733764648438, 12.420562744140625, 12.898392677307129, 13.376221656799316, 13.854050636291504, 14.331879615783691, 14.809709548950195, 15.287538528442383, 15.76536750793457, 16.243196487426758, 16.721025466918945, 17.198854446411133, 17.676685333251953, 18.15451431274414, 18.632343292236328, 19.110172271728516]}, "train/train_runtime": 4813.5869, "train/train_samples_per_second": 5.929, "train/train_steps_per_second": 0.062, "train/total_flos": 0.0, "train/train_loss": 4.3407110846805255, "eval/loss": 4.175893783569336, "eval/wer": 2.4477588258627527, "eval/runtime": 935.1251, "eval/samples_per_second": 2.825, "eval/steps_per_second": 0.236, "_wandb": {"runtime": 6088}} \ No newline at end of file