diff --git "a/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" "b/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" --- "a/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" +++ "b/wandb/run-20220228_093705-yn2gmwrw/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.5732, "train/learning_rate": 3.1152647975077883e-08, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 10136, "_timestamp": 1646051161, "_step": 1788, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 9.0, 346.0, 631.0, 30.0, 2.0, 1.0], "bins": [-641.971923828125, -631.305908203125, -620.639892578125, -609.973876953125, -599.307861328125, -588.641845703125, -577.975830078125, -567.309814453125, -556.643798828125, -545.977783203125, -535.311767578125, -524.645751953125, -513.979736328125, -503.313720703125, -492.647705078125, -481.981689453125, -471.315673828125, -460.649658203125, -449.983642578125, -439.317626953125, -428.651611328125, -417.985595703125, -407.319580078125, -396.653564453125, -385.987548828125, -375.321533203125, -364.655517578125, -353.989501953125, -343.323486328125, -332.657470703125, -321.991455078125, -311.325439453125, -300.6593933105469, -289.9933776855469, -279.3273620605469, -268.6613464355469, -257.9953308105469, -247.32931518554688, -236.66329956054688, -225.99728393554688, -215.33126831054688, -204.66525268554688, -193.99923706054688, -183.33322143554688, -172.66720581054688, -162.00119018554688, -151.33517456054688, -140.66915893554688, -130.00314331054688, -119.33712768554688, -108.67111206054688, -98.00509643554688, -87.33908081054688, -76.67306518554688, -66.00704956054688, -55.341033935546875, -44.67502212524414, -34.00900650024414, -23.34299087524414, -12.67697525024414, -2.0109596252441406, 8.65505599975586, 19.32107162475586, 29.98708724975586, 40.65310287475586]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 10.0, 8.0, 10.0, 19.0, 21.0, 16.0, 27.0, 24.0, 29.0, 34.0, 38.0, 42.0, 38.0, 39.0, 44.0, 47.0, 51.0, 52.0, 45.0, 44.0, 38.0, 46.0, 33.0, 29.0, 45.0, 18.0, 31.0, 22.0, 13.0, 15.0, 10.0, 20.0, 11.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.822509765625, -73.62486267089844, -71.4272232055664, -69.22957611083984, -67.03193664550781, -64.83428955078125, -62.63664627075195, -60.439002990722656, -58.24135971069336, -56.04371643066406, -53.846073150634766, -51.64842987060547, -49.450782775878906, -47.253143310546875, -45.05549621582031, -42.857852935791016, -40.66020965576172, -38.46256637573242, -36.264923095703125, -34.06727981567383, -31.8696346282959, -29.6719913482666, -27.474346160888672, -25.276702880859375, -23.079059600830078, -20.88141632080078, -18.683773040771484, -16.486127853393555, -14.288484573364258, -12.090841293334961, -9.893197059631348, -7.695552825927734, -5.4979095458984375, -3.3002657890319824, -1.1026220321655273, 1.0950217247009277, 3.292665481567383, 5.49030876159668, 7.687952995300293, 9.885597229003906, 12.083240509033203, 14.2808837890625, 16.478527069091797, 18.676172256469727, 20.873815536499023, 23.07145881652832, 25.26910400390625, 27.466747283935547, 29.664390563964844, 31.86203384399414, 34.05967712402344, 36.257320404052734, 38.45496368408203, 40.652610778808594, 42.85025405883789, 45.04789733886719, 47.245540618896484, 49.44318389892578, 51.64082717895508, 53.838470458984375, 56.03611755371094, 58.23375701904297, 60.43140411376953, 62.62904739379883, 64.82669067382812]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 11.0, 16.0, 21.0, 32.0, 31.0, 38.0, 38.0, 50.0, 49.0, 55.0, 53.0, 54.0, 61.0, 48.0, 71.0, 50.0, 42.0, 49.0, 33.0, 43.0, 48.0, 24.0, 18.0, 14.0, 15.0, 7.0, 8.0, 7.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.375, -8.1734619140625, -7.971923828125, -7.7703857421875, -7.56884765625, -7.3673095703125, -7.165771484375, -6.9642333984375, -6.7626953125, -6.5611572265625, -6.359619140625, -6.1580810546875, -5.95654296875, -5.7550048828125, -5.553466796875, -5.3519287109375, -5.150390625, -4.9488525390625, -4.747314453125, -4.5457763671875, -4.34423828125, -4.1427001953125, -3.941162109375, -3.7396240234375, -3.5380859375, -3.3365478515625, -3.135009765625, -2.9334716796875, -2.73193359375, -2.5303955078125, -2.328857421875, -2.1273193359375, -1.92578125, -1.7242431640625, -1.522705078125, -1.3211669921875, -1.11962890625, -0.9180908203125, -0.716552734375, -0.5150146484375, -0.3134765625, -0.1119384765625, 0.089599609375, 0.2911376953125, 0.49267578125, 0.6942138671875, 0.895751953125, 1.0972900390625, 1.298828125, 1.5003662109375, 1.701904296875, 1.9034423828125, 2.10498046875, 2.3065185546875, 2.508056640625, 2.7095947265625, 2.9111328125, 3.1126708984375, 3.314208984375, 3.5157470703125, 3.71728515625, 3.9188232421875, 4.120361328125, 4.3218994140625, 4.5234375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 9.0, 6.0, 10.0, 12.0, 25.0, 27.0, 37.0, 68.0, 93.0, 165.0, 224.0, 442.0, 815.0, 1724.0, 4296.0, 14068.0, 99545.0, 2388338.0, 1594739.0, 70897.0, 11734.0, 3624.0, 1570.0, 781.0, 417.0, 250.0, 135.0, 84.0, 51.0, 38.0, 25.0, 10.0, 11.0, 3.0, 5.0, 3.0, 0.0, 2.0], "bins": [-27.78125, -27.148681640625, -26.51611328125, -25.883544921875, -25.2509765625, -24.618408203125, -23.98583984375, -23.353271484375, -22.720703125, -22.088134765625, -21.45556640625, -20.822998046875, -20.1904296875, -19.557861328125, -18.92529296875, -18.292724609375, -17.66015625, -17.027587890625, -16.39501953125, -15.762451171875, -15.1298828125, -14.497314453125, -13.86474609375, -13.232177734375, -12.599609375, -11.967041015625, -11.33447265625, -10.701904296875, -10.0693359375, -9.436767578125, -8.80419921875, -8.171630859375, -7.5390625, -6.906494140625, -6.27392578125, -5.641357421875, -5.0087890625, -4.376220703125, -3.74365234375, -3.111083984375, -2.478515625, -1.845947265625, -1.21337890625, -0.580810546875, 0.0517578125, 0.684326171875, 1.31689453125, 1.949462890625, 2.58203125, 3.214599609375, 3.84716796875, 4.479736328125, 5.1123046875, 5.744873046875, 6.37744140625, 7.010009765625, 7.642578125, 8.275146484375, 8.90771484375, 9.540283203125, 10.1728515625, 10.805419921875, 11.43798828125, 12.070556640625, 12.703125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 11.0, 23.0, 24.0, 57.0, 84.0, 139.0, 236.0, 372.0, 679.0, 886.0, 624.0, 364.0, 231.0, 126.0, 80.0, 38.0, 22.0, 20.0, 24.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.734375, -22.9287109375, -22.123046875, -21.3173828125, -20.51171875, -19.7060546875, -18.900390625, -18.0947265625, -17.2890625, -16.4833984375, -15.677734375, -14.8720703125, -14.06640625, -13.2607421875, -12.455078125, -11.6494140625, -10.84375, -10.0380859375, -9.232421875, -8.4267578125, -7.62109375, -6.8154296875, -6.009765625, -5.2041015625, -4.3984375, -3.5927734375, -2.787109375, -1.9814453125, -1.17578125, -0.3701171875, 0.435546875, 1.2412109375, 2.046875, 2.8525390625, 3.658203125, 4.4638671875, 5.26953125, 6.0751953125, 6.880859375, 7.6865234375, 8.4921875, 9.2978515625, 10.103515625, 10.9091796875, 11.71484375, 12.5205078125, 13.326171875, 14.1318359375, 14.9375, 15.7431640625, 16.548828125, 17.3544921875, 18.16015625, 18.9658203125, 19.771484375, 20.5771484375, 21.3828125, 22.1884765625, 22.994140625, 23.7998046875, 24.60546875, 25.4111328125, 26.216796875, 27.0224609375, 27.828125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 16.0, 14.0, 22.0, 40.0, 66.0, 96.0, 225.0, 408.0, 869.0, 2223.0, 22720.0, 4086441.0, 76007.0, 2997.0, 1028.0, 486.0, 245.0, 123.0, 97.0, 56.0, 23.0, 17.0, 15.0, 8.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0625, -71.3798828125, -68.697265625, -66.0146484375, -63.33203125, -60.6494140625, -57.966796875, -55.2841796875, -52.6015625, -49.9189453125, -47.236328125, -44.5537109375, -41.87109375, -39.1884765625, -36.505859375, -33.8232421875, -31.140625, -28.4580078125, -25.775390625, -23.0927734375, -20.41015625, -17.7275390625, -15.044921875, -12.3623046875, -9.6796875, -6.9970703125, -4.314453125, -1.6318359375, 1.05078125, 3.7333984375, 6.416015625, 9.0986328125, 11.78125, 14.4638671875, 17.146484375, 19.8291015625, 22.51171875, 25.1943359375, 27.876953125, 30.5595703125, 33.2421875, 35.9248046875, 38.607421875, 41.2900390625, 43.97265625, 46.6552734375, 49.337890625, 52.0205078125, 54.703125, 57.3857421875, 60.068359375, 62.7509765625, 65.43359375, 68.1162109375, 70.798828125, 73.4814453125, 76.1640625, 78.8466796875, 81.529296875, 84.2119140625, 86.89453125, 89.5771484375, 92.259765625, 94.9423828125, 97.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 81.0, 553.0, 353.0, 21.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.17755126953125, -262.1882629394531, -254.198974609375, -246.20968627929688, -238.22039794921875, -230.23110961914062, -222.2418212890625, -214.25253295898438, -206.26324462890625, -198.27395629882812, -190.28466796875, -182.29537963867188, -174.30609130859375, -166.31680297851562, -158.3275146484375, -150.33822631835938, -142.3489532470703, -134.3596649169922, -126.37037658691406, -118.38108825683594, -110.39179992675781, -102.40251159667969, -94.4132308959961, -86.42394256591797, -78.43465423583984, -70.44536590576172, -62.456077575683594, -54.466793060302734, -46.47750473022461, -38.488216400146484, -30.498931884765625, -22.5096435546875, -14.520339965820312, -6.531052589416504, 1.4582347869873047, 9.447521209716797, 17.436809539794922, 25.426097869873047, 33.415382385253906, 41.40467071533203, 49.393959045410156, 57.38324737548828, 65.3725357055664, 73.36181640625, 81.35110473632812, 89.34039306640625, 97.32968139648438, 105.3189697265625, 113.30825805664062, 121.29754638671875, 129.28683471679688, 137.276123046875, 145.26541137695312, 153.25469970703125, 161.24398803710938, 169.2332763671875, 177.22256469726562, 185.21185302734375, 193.20114135742188, 201.1904296875, 209.17971801757812, 217.16900634765625, 225.15829467773438, 233.1475830078125, 241.13685607910156]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 4.0, 3.0, 2.0, 10.0, 9.0, 4.0, 8.0, 8.0, 9.0, 15.0, 16.0, 7.0, 27.0, 25.0, 17.0, 24.0, 28.0, 22.0, 29.0, 36.0, 44.0, 38.0, 38.0, 34.0, 32.0, 49.0, 38.0, 45.0, 48.0, 40.0, 34.0, 32.0, 24.0, 24.0, 18.0, 21.0, 26.0, 16.0, 12.0, 20.0, 11.0, 14.0, 9.0, 8.0, 5.0, 4.0, 9.0, 6.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-49.61613464355469, -48.13227462768555, -46.64841842651367, -45.16455841064453, -43.68069839477539, -42.19683837890625, -40.712982177734375, -39.229122161865234, -37.745262145996094, -36.26140213012695, -34.77754592895508, -33.29368591308594, -31.809825897216797, -30.32596778869629, -28.84210968017578, -27.35824966430664, -25.874391555786133, -24.390533447265625, -22.906673431396484, -21.422815322875977, -19.938955307006836, -18.455097198486328, -16.971237182617188, -15.48737907409668, -14.003520011901855, -12.519660949707031, -11.035801887512207, -9.551942825317383, -8.068084716796875, -6.584225177764893, -5.100366592407227, -3.6165075302124023, -2.132648468017578, -0.6487895250320435, 0.8350694179534912, 2.3189282417297363, 3.8027873039245605, 5.286646366119385, 6.770504951477051, 8.254364013671875, 9.7382230758667, 11.222082138061523, 12.705941200256348, 14.189800262451172, 15.67365837097168, 17.15751838684082, 18.641376495361328, 20.12523651123047, 21.609094619750977, 23.092952728271484, 24.576812744140625, 26.060670852661133, 27.544530868530273, 29.02838897705078, 30.512248992919922, 31.99610710144043, 33.47996520996094, 34.96382522583008, 36.44768142700195, 37.931541442871094, 39.415401458740234, 40.899261474609375, 42.38311767578125, 43.86697769165039, 45.35083770751953]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 10.0, 12.0, 17.0, 25.0, 24.0, 32.0, 29.0, 34.0, 53.0, 54.0, 40.0, 52.0, 48.0, 64.0, 45.0, 62.0, 44.0, 41.0, 58.0, 35.0, 41.0, 39.0, 40.0, 27.0, 13.0, 16.0, 17.0, 12.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.24139404296875, -7.0335693359375, -6.82574462890625, -6.617919921875, -6.41009521484375, -6.2022705078125, -5.99444580078125, -5.78662109375, -5.57879638671875, -5.3709716796875, -5.16314697265625, -4.955322265625, -4.74749755859375, -4.5396728515625, -4.33184814453125, -4.1240234375, -3.91619873046875, -3.7083740234375, -3.50054931640625, -3.292724609375, -3.08489990234375, -2.8770751953125, -2.66925048828125, -2.46142578125, -2.25360107421875, -2.0457763671875, -1.83795166015625, -1.630126953125, -1.42230224609375, -1.2144775390625, -1.00665283203125, -0.798828125, -0.59100341796875, -0.3831787109375, -0.17535400390625, 0.032470703125, 0.24029541015625, 0.4481201171875, 0.65594482421875, 0.86376953125, 1.07159423828125, 1.2794189453125, 1.48724365234375, 1.695068359375, 1.90289306640625, 2.1107177734375, 2.31854248046875, 2.5263671875, 2.73419189453125, 2.9420166015625, 3.14984130859375, 3.357666015625, 3.56549072265625, 3.7733154296875, 3.98114013671875, 4.18896484375, 4.39678955078125, 4.6046142578125, 4.81243896484375, 5.020263671875, 5.22808837890625, 5.4359130859375, 5.64373779296875, 5.8515625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 9.0, 10.0, 16.0, 22.0, 27.0, 41.0, 78.0, 98.0, 160.0, 212.0, 344.0, 494.0, 814.0, 1440.0, 2241.0, 3882.0, 6698.0, 11812.0, 20901.0, 36784.0, 65891.0, 114348.0, 199263.0, 246334.0, 144137.0, 82930.0, 47360.0, 26393.0, 14927.0, 8406.0, 5019.0, 2796.0, 1710.0, 1104.0, 640.0, 434.0, 259.0, 164.0, 142.0, 81.0, 39.0, 29.0, 21.0, 17.0, 14.0, 13.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8323135375976562, -0.8047637939453125, -0.7772140502929688, -0.749664306640625, -0.7221145629882812, -0.6945648193359375, -0.6670150756835938, -0.63946533203125, -0.6119155883789062, -0.5843658447265625, -0.5568161010742188, -0.529266357421875, -0.5017166137695312, -0.4741668701171875, -0.44661712646484375, -0.4190673828125, -0.39151763916015625, -0.3639678955078125, -0.33641815185546875, -0.308868408203125, -0.28131866455078125, -0.2537689208984375, -0.22621917724609375, -0.19866943359375, -0.17111968994140625, -0.1435699462890625, -0.11602020263671875, -0.088470458984375, -0.06092071533203125, -0.0333709716796875, -0.00582122802734375, 0.021728515625, 0.04927825927734375, 0.0768280029296875, 0.10437774658203125, 0.131927490234375, 0.15947723388671875, 0.1870269775390625, 0.21457672119140625, 0.24212646484375, 0.26967620849609375, 0.2972259521484375, 0.32477569580078125, 0.352325439453125, 0.37987518310546875, 0.4074249267578125, 0.43497467041015625, 0.4625244140625, 0.49007415771484375, 0.5176239013671875, 0.5451736450195312, 0.572723388671875, 0.6002731323242188, 0.6278228759765625, 0.6553726196289062, 0.68292236328125, 0.7104721069335938, 0.7380218505859375, 0.7655715942382812, 0.793121337890625, 0.8206710815429688, 0.8482208251953125, 0.8757705688476562, 0.9033203125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 5.0, 2.0, 11.0, 7.0, 16.0, 15.0, 13.0, 7.0, 16.0, 20.0, 19.0, 31.0, 23.0, 25.0, 29.0, 27.0, 39.0, 34.0, 46.0, 43.0, 34.0, 1062.0, 40.0, 44.0, 37.0, 30.0, 31.0, 32.0, 26.0, 35.0, 26.0, 21.0, 25.0, 16.0, 18.0, 23.0, 15.0, 14.0, 5.0, 10.0, 7.0, 5.0, 5.0, 7.0, 8.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.92578125, -2.833282470703125, -2.74078369140625, -2.648284912109375, -2.5557861328125, -2.463287353515625, -2.37078857421875, -2.278289794921875, -2.185791015625, -2.093292236328125, -2.00079345703125, -1.908294677734375, -1.8157958984375, -1.723297119140625, -1.63079833984375, -1.538299560546875, -1.44580078125, -1.353302001953125, -1.26080322265625, -1.168304443359375, -1.0758056640625, -0.983306884765625, -0.89080810546875, -0.798309326171875, -0.705810546875, -0.613311767578125, -0.52081298828125, -0.428314208984375, -0.3358154296875, -0.243316650390625, -0.15081787109375, -0.058319091796875, 0.0341796875, 0.126678466796875, 0.21917724609375, 0.311676025390625, 0.4041748046875, 0.496673583984375, 0.58917236328125, 0.681671142578125, 0.774169921875, 0.866668701171875, 0.95916748046875, 1.051666259765625, 1.1441650390625, 1.236663818359375, 1.32916259765625, 1.421661376953125, 1.51416015625, 1.606658935546875, 1.69915771484375, 1.791656494140625, 1.8841552734375, 1.976654052734375, 2.06915283203125, 2.161651611328125, 2.254150390625, 2.346649169921875, 2.43914794921875, 2.531646728515625, 2.6241455078125, 2.716644287109375, 2.80914306640625, 2.901641845703125, 2.994140625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 8.0, 11.0, 12.0, 26.0, 32.0, 55.0, 75.0, 105.0, 198.0, 248.0, 379.0, 566.0, 840.0, 1308.0, 1928.0, 2883.0, 4379.0, 7044.0, 10684.0, 16859.0, 26844.0, 42249.0, 67583.0, 108797.0, 176921.0, 1259102.0, 137087.0, 85135.0, 53181.0, 33406.0, 21081.0, 13297.0, 8725.0, 5455.0, 3610.0, 2356.0, 1571.0, 1032.0, 685.0, 476.0, 294.0, 196.0, 142.0, 101.0, 58.0, 40.0, 23.0, 15.0, 9.0, 16.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.66650390625, -0.646453857421875, -0.62640380859375, -0.606353759765625, -0.5863037109375, -0.566253662109375, -0.54620361328125, -0.526153564453125, -0.506103515625, -0.486053466796875, -0.46600341796875, -0.445953369140625, -0.4259033203125, -0.405853271484375, -0.38580322265625, -0.365753173828125, -0.345703125, -0.325653076171875, -0.30560302734375, -0.285552978515625, -0.2655029296875, -0.245452880859375, -0.22540283203125, -0.205352783203125, -0.185302734375, -0.165252685546875, -0.14520263671875, -0.125152587890625, -0.1051025390625, -0.085052490234375, -0.06500244140625, -0.044952392578125, -0.02490234375, -0.004852294921875, 0.01519775390625, 0.035247802734375, 0.0552978515625, 0.075347900390625, 0.09539794921875, 0.115447998046875, 0.135498046875, 0.155548095703125, 0.17559814453125, 0.195648193359375, 0.2156982421875, 0.235748291015625, 0.25579833984375, 0.275848388671875, 0.2958984375, 0.315948486328125, 0.33599853515625, 0.356048583984375, 0.3760986328125, 0.396148681640625, 0.41619873046875, 0.436248779296875, 0.456298828125, 0.476348876953125, 0.49639892578125, 0.516448974609375, 0.5364990234375, 0.556549072265625, 0.57659912109375, 0.596649169921875, 0.61669921875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 4.0, 4.0, 5.0, 12.0, 8.0, 8.0, 16.0, 23.0, 19.0, 27.0, 33.0, 36.0, 41.0, 54.0, 46.0, 49.0, 63.0, 69.0, 63.0, 51.0, 59.0, 31.0, 43.0, 31.0, 39.0, 18.0, 27.0, 21.0, 31.0, 12.0, 10.0, 9.0, 8.0, 8.0, 8.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001129150390625, -0.0010925531387329102, -0.0010559558868408203, -0.0010193586349487305, -0.0009827613830566406, -0.0009461641311645508, -0.0009095668792724609, -0.0008729696273803711, -0.0008363723754882812, -0.0007997751235961914, -0.0007631778717041016, -0.0007265806198120117, -0.0006899833679199219, -0.000653386116027832, -0.0006167888641357422, -0.0005801916122436523, -0.0005435943603515625, -0.0005069971084594727, -0.0004703998565673828, -0.00043380260467529297, -0.0003972053527832031, -0.0003606081008911133, -0.00032401084899902344, -0.0002874135971069336, -0.00025081634521484375, -0.0002142190933227539, -0.00017762184143066406, -0.00014102458953857422, -0.00010442733764648438, -6.783008575439453e-05, -3.123283386230469e-05, 5.364418029785156e-06, 4.1961669921875e-05, 7.855892181396484e-05, 0.00011515617370605469, 0.00015175342559814453, 0.00018835067749023438, 0.00022494792938232422, 0.00026154518127441406, 0.0002981424331665039, 0.00033473968505859375, 0.0003713369369506836, 0.00040793418884277344, 0.0004445314407348633, 0.0004811286926269531, 0.000517725944519043, 0.0005543231964111328, 0.0005909204483032227, 0.0006275177001953125, 0.0006641149520874023, 0.0007007122039794922, 0.000737309455871582, 0.0007739067077636719, 0.0008105039596557617, 0.0008471012115478516, 0.0008836984634399414, 0.0009202957153320312, 0.0009568929672241211, 0.000993490219116211, 0.0010300874710083008, 0.0010666847229003906, 0.0011032819747924805, 0.0011398792266845703, 0.0011764764785766602, 0.00121307373046875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 7.0, 18.0, 20.0, 14.0, 23.0, 27.0, 41.0, 48.0, 68.0, 75.0, 117.0, 129.0, 200.0, 225.0, 287.0, 558.0, 1094.0, 968621.0, 74439.0, 819.0, 463.0, 256.0, 220.0, 149.0, 134.0, 119.0, 85.0, 66.0, 50.0, 35.0, 19.0, 24.0, 19.0, 13.0, 14.0, 4.0, 7.0, 11.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02197265625, -0.02128291130065918, -0.02059316635131836, -0.01990342140197754, -0.01921367645263672, -0.0185239315032959, -0.017834186553955078, -0.017144441604614258, -0.016454696655273438, -0.015764951705932617, -0.015075206756591797, -0.014385461807250977, -0.013695716857910156, -0.013005971908569336, -0.012316226959228516, -0.011626482009887695, -0.010936737060546875, -0.010246992111206055, -0.009557247161865234, -0.008867502212524414, -0.008177757263183594, -0.0074880123138427734, -0.006798267364501953, -0.006108522415161133, -0.0054187774658203125, -0.004729032516479492, -0.004039287567138672, -0.0033495426177978516, -0.0026597976684570312, -0.001970052719116211, -0.0012803077697753906, -0.0005905628204345703, 9.918212890625e-05, 0.0007889270782470703, 0.0014786720275878906, 0.002168416976928711, 0.0028581619262695312, 0.0035479068756103516, 0.004237651824951172, 0.004927396774291992, 0.0056171417236328125, 0.006306886672973633, 0.006996631622314453, 0.0076863765716552734, 0.008376121520996094, 0.009065866470336914, 0.009755611419677734, 0.010445356369018555, 0.011135101318359375, 0.011824846267700195, 0.012514591217041016, 0.013204336166381836, 0.013894081115722656, 0.014583826065063477, 0.015273571014404297, 0.015963315963745117, 0.016653060913085938, 0.017342805862426758, 0.018032550811767578, 0.0187222957611084, 0.01941204071044922, 0.02010178565979004, 0.02079153060913086, 0.02148127555847168, 0.0221710205078125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 8.0, 160.0, 786.0, 61.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006038642022758722, -0.0004914011806249619, -0.000378938129870221, -0.0002664750791154802, -0.0001540120574645698, -4.154903581365943e-05, 7.091404404491186e-05, 0.00018337706569582224, 0.0002958400873467326, 0.000408303108997643, 0.0005207661306485534, 0.0006332292105071247, 0.000745692232158035, 0.0008581552538089454, 0.0009706183336675167, 0.001083081355318427, 0.0011955443769693375, 0.0013080073986202478, 0.0014204704202711582, 0.0015329334419220686, 0.001645396463572979, 0.0017578594852238894, 0.0018703226232901216, 0.0019827857613563538, 0.0020952485501766205, 0.002207711571827531, 0.0023201745934784412, 0.0024326376151293516, 0.002545100636780262, 0.0026575636584311724, 0.0027700266800820827, 0.0028824899345636368, 0.0029949527233839035, 0.003107415745034814, 0.0032198787666857243, 0.0033323417883366346, 0.003444804809987545, 0.0035572678316384554, 0.0036697308532893658, 0.00378219410777092, 0.0038946568965911865, 0.0040071201510727406, 0.004119582939893007, 0.004232046194374561, 0.004344508983194828, 0.004456972237676382, 0.004569435026496649, 0.004681898280978203, 0.0047943610697984695, 0.004906824324280024, 0.00501928711310029, 0.005131750367581844, 0.005244213156402111, 0.005356676410883665, 0.005469139199703932, 0.005581602454185486, 0.00569406570866704, 0.005806528963148594, 0.005918991751968861, 0.006031455006450415, 0.006143917795270681, 0.006256381049752235, 0.006368843838572502, 0.006481307093054056, 0.006593769881874323]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 7.0, 2.0, 5.0, 6.0, 10.0, 19.0, 15.0, 19.0, 20.0, 24.0, 24.0, 33.0, 40.0, 43.0, 44.0, 39.0, 44.0, 46.0, 53.0, 55.0, 47.0, 53.0, 53.0, 34.0, 32.0, 35.0, 23.0, 32.0, 24.0, 19.0, 23.0, 19.0, 19.0, 10.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005924105644226074, -0.0005711764097213745, -0.0005499422550201416, -0.0005287081003189087, -0.0005074739456176758, -0.00048623979091644287, -0.00046500563621520996, -0.00044377148151397705, -0.00042253732681274414, -0.00040130317211151123, -0.0003800690174102783, -0.0003588348627090454, -0.0003376007080078125, -0.0003163665533065796, -0.0002951323986053467, -0.00027389824390411377, -0.00025266408920288086, -0.00023142993450164795, -0.00021019577980041504, -0.00018896162509918213, -0.00016772747039794922, -0.0001464933156967163, -0.0001252591609954834, -0.00010402500629425049, -8.279085159301758e-05, -6.155669689178467e-05, -4.032254219055176e-05, -1.9088387489318848e-05, 2.1457672119140625e-06, 2.3379921913146973e-05, 4.461407661437988e-05, 6.584823131561279e-05, 8.70823860168457e-05, 0.00010831654071807861, 0.00012955069541931152, 0.00015078485012054443, 0.00017201900482177734, 0.00019325315952301025, 0.00021448731422424316, 0.00023572146892547607, 0.000256955623626709, 0.0002781897783279419, 0.0002994239330291748, 0.0003206580877304077, 0.0003418922424316406, 0.00036312639713287354, 0.00038436055183410645, 0.00040559470653533936, 0.00042682886123657227, 0.0004480630159378052, 0.0004692971706390381, 0.000490531325340271, 0.0005117654800415039, 0.0005329996347427368, 0.0005542337894439697, 0.0005754679441452026, 0.0005967020988464355, 0.0006179362535476685, 0.0006391704082489014, 0.0006604045629501343, 0.0006816387176513672, 0.0007028728723526001, 0.000724107027053833, 0.0007453411817550659, 0.0007665753364562988]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 10.0, 12.0, 17.0, 25.0, 24.0, 32.0, 29.0, 34.0, 53.0, 54.0, 40.0, 52.0, 48.0, 64.0, 45.0, 62.0, 44.0, 41.0, 58.0, 35.0, 41.0, 39.0, 40.0, 27.0, 13.0, 16.0, 17.0, 12.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.24139404296875, -7.0335693359375, -6.82574462890625, -6.617919921875, -6.41009521484375, -6.2022705078125, -5.99444580078125, -5.78662109375, -5.57879638671875, -5.3709716796875, -5.16314697265625, -4.955322265625, -4.74749755859375, -4.5396728515625, -4.33184814453125, -4.1240234375, -3.91619873046875, -3.7083740234375, -3.50054931640625, -3.292724609375, -3.08489990234375, -2.8770751953125, -2.66925048828125, -2.46142578125, -2.25360107421875, -2.0457763671875, -1.83795166015625, -1.630126953125, -1.42230224609375, -1.2144775390625, -1.00665283203125, -0.798828125, -0.59100341796875, -0.3831787109375, -0.17535400390625, 0.032470703125, 0.24029541015625, 0.4481201171875, 0.65594482421875, 0.86376953125, 1.07159423828125, 1.2794189453125, 1.48724365234375, 1.695068359375, 1.90289306640625, 2.1107177734375, 2.31854248046875, 2.5263671875, 2.73419189453125, 2.9420166015625, 3.14984130859375, 3.357666015625, 3.56549072265625, 3.7733154296875, 3.98114013671875, 4.18896484375, 4.39678955078125, 4.6046142578125, 4.81243896484375, 5.020263671875, 5.22808837890625, 5.4359130859375, 5.64373779296875, 5.8515625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 10.0, 24.0, 35.0, 36.0, 50.0, 85.0, 115.0, 160.0, 244.0, 363.0, 486.0, 791.0, 1204.0, 2002.0, 3282.0, 5929.0, 13351.0, 58343.0, 879129.0, 55084.0, 13095.0, 5950.0, 3223.0, 1927.0, 1235.0, 733.0, 528.0, 341.0, 224.0, 173.0, 114.0, 72.0, 60.0, 33.0, 34.0, 21.0, 16.0, 12.0, 7.0, 8.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.22509765625, -34.1064453125, -32.98779296875, -31.869140625, -30.75048828125, -29.6318359375, -28.51318359375, -27.39453125, -26.27587890625, -25.1572265625, -24.03857421875, -22.919921875, -21.80126953125, -20.6826171875, -19.56396484375, -18.4453125, -17.32666015625, -16.2080078125, -15.08935546875, -13.970703125, -12.85205078125, -11.7333984375, -10.61474609375, -9.49609375, -8.37744140625, -7.2587890625, -6.14013671875, -5.021484375, -3.90283203125, -2.7841796875, -1.66552734375, -0.546875, 0.57177734375, 1.6904296875, 2.80908203125, 3.927734375, 5.04638671875, 6.1650390625, 7.28369140625, 8.40234375, 9.52099609375, 10.6396484375, 11.75830078125, 12.876953125, 13.99560546875, 15.1142578125, 16.23291015625, 17.3515625, 18.47021484375, 19.5888671875, 20.70751953125, 21.826171875, 22.94482421875, 24.0634765625, 25.18212890625, 26.30078125, 27.41943359375, 28.5380859375, 29.65673828125, 30.775390625, 31.89404296875, 33.0126953125, 34.13134765625, 35.25]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 2.0, 5.0, 8.0, 15.0, 17.0, 14.0, 13.0, 26.0, 26.0, 33.0, 24.0, 41.0, 38.0, 59.0, 50.0, 43.0, 103.0, 299.0, 1620.0, 179.0, 62.0, 51.0, 40.0, 44.0, 39.0, 29.0, 32.0, 20.0, 18.0, 17.0, 22.0, 10.0, 7.0, 14.0, 7.0, 5.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-20.0625, -19.524169921875, -18.98583984375, -18.447509765625, -17.9091796875, -17.370849609375, -16.83251953125, -16.294189453125, -15.755859375, -15.217529296875, -14.67919921875, -14.140869140625, -13.6025390625, -13.064208984375, -12.52587890625, -11.987548828125, -11.44921875, -10.910888671875, -10.37255859375, -9.834228515625, -9.2958984375, -8.757568359375, -8.21923828125, -7.680908203125, -7.142578125, -6.604248046875, -6.06591796875, -5.527587890625, -4.9892578125, -4.450927734375, -3.91259765625, -3.374267578125, -2.8359375, -2.297607421875, -1.75927734375, -1.220947265625, -0.6826171875, -0.144287109375, 0.39404296875, 0.932373046875, 1.470703125, 2.009033203125, 2.54736328125, 3.085693359375, 3.6240234375, 4.162353515625, 4.70068359375, 5.239013671875, 5.77734375, 6.315673828125, 6.85400390625, 7.392333984375, 7.9306640625, 8.468994140625, 9.00732421875, 9.545654296875, 10.083984375, 10.622314453125, 11.16064453125, 11.698974609375, 12.2373046875, 12.775634765625, 13.31396484375, 13.852294921875, 14.390625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 11.0, 9.0, 12.0, 14.0, 16.0, 18.0, 28.0, 31.0, 27.0, 42.0, 55.0, 59.0, 140.0, 396.0, 2664.0, 3119780.0, 20947.0, 750.0, 229.0, 101.0, 79.0, 56.0, 35.0, 29.0, 29.0, 19.0, 18.0, 21.0, 14.0, 16.0, 15.0, 7.0, 7.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.9375, -63.556640625, -61.17578125, -58.794921875, -56.4140625, -54.033203125, -51.65234375, -49.271484375, -46.890625, -44.509765625, -42.12890625, -39.748046875, -37.3671875, -34.986328125, -32.60546875, -30.224609375, -27.84375, -25.462890625, -23.08203125, -20.701171875, -18.3203125, -15.939453125, -13.55859375, -11.177734375, -8.796875, -6.416015625, -4.03515625, -1.654296875, 0.7265625, 3.107421875, 5.48828125, 7.869140625, 10.25, 12.630859375, 15.01171875, 17.392578125, 19.7734375, 22.154296875, 24.53515625, 26.916015625, 29.296875, 31.677734375, 34.05859375, 36.439453125, 38.8203125, 41.201171875, 43.58203125, 45.962890625, 48.34375, 50.724609375, 53.10546875, 55.486328125, 57.8671875, 60.248046875, 62.62890625, 65.009765625, 67.390625, 69.771484375, 72.15234375, 74.533203125, 76.9140625, 79.294921875, 81.67578125, 84.056640625, 86.4375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 134.0, 874.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.75433349609375, -229.62741088867188, -222.50048828125, -215.37355041503906, -208.2466278076172, -201.1197052001953, -193.99276733398438, -186.8658447265625, -179.73892211914062, -172.61199951171875, -165.48507690429688, -158.35813903808594, -151.23121643066406, -144.1042938232422, -136.97735595703125, -129.85043334960938, -122.7235107421875, -115.59658813476562, -108.46965789794922, -101.34272766113281, -94.21580505371094, -87.08888244628906, -79.96195220947266, -72.83502197265625, -65.70809936523438, -58.581172943115234, -51.454246520996094, -44.32732009887695, -37.20039367675781, -30.073467254638672, -22.94654083251953, -15.81961441040039, -8.692672729492188, -1.5657463073730469, 5.561180114746094, 12.688106536865234, 19.815032958984375, 26.941959381103516, 34.068885803222656, 41.1958122253418, 48.32273864746094, 55.44966506958008, 62.57659149169922, 69.70352172851562, 76.8304443359375, 83.95736694335938, 91.08429718017578, 98.21122741699219, 105.33815002441406, 112.46507263183594, 119.59200286865234, 126.71893310546875, 133.84585571289062, 140.9727783203125, 148.09970092773438, 155.2266387939453, 162.3535614013672, 169.48048400878906, 176.607421875, 183.73434448242188, 190.86126708984375, 197.98818969726562, 205.1151123046875, 212.24205017089844, 219.3689727783203]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 17.0, 5.0, 16.0, 10.0, 17.0, 21.0, 20.0, 31.0, 32.0, 16.0, 27.0, 25.0, 26.0, 54.0, 40.0, 53.0, 33.0, 51.0, 33.0, 35.0, 42.0, 40.0, 33.0, 29.0, 52.0, 38.0, 28.0, 26.0, 22.0, 17.0, 19.0, 13.0, 12.0, 9.0, 13.0, 6.0, 5.0, 6.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-66.52519226074219, -64.83065032958984, -63.13611602783203, -61.44157409667969, -59.74703598022461, -58.05249786376953, -56.35795593261719, -54.66341781616211, -52.96887969970703, -51.27434158325195, -49.579803466796875, -47.88526153564453, -46.19072341918945, -44.496185302734375, -42.80164337158203, -41.10710525512695, -39.412567138671875, -37.7180290222168, -36.02349090576172, -34.328948974609375, -32.6344108581543, -30.93987274169922, -29.245332717895508, -27.550792694091797, -25.85625457763672, -24.16171646118164, -22.46717643737793, -20.77263641357422, -19.07809829711914, -17.383560180664062, -15.689020156860352, -13.994481086730957, -12.299945831298828, -10.605406761169434, -8.910867691040039, -7.2163286209106445, -5.52178955078125, -3.8272504806518555, -2.132711410522461, -0.4381723403930664, 1.2563667297363281, 2.9509057998657227, 4.645444869995117, 6.339983940124512, 8.034523010253906, 9.7290620803833, 11.423601150512695, 13.11814022064209, 14.812679290771484, 16.507217407226562, 18.201757431030273, 19.896297454833984, 21.590835571289062, 23.28537368774414, 24.97991371154785, 26.674453735351562, 28.36899185180664, 30.06352996826172, 31.75806999206543, 33.45261001586914, 35.14714813232422, 36.8416862487793, 38.536224365234375, 40.23076629638672, 41.9253044128418]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 15.0, 11.0, 13.0, 26.0, 20.0, 37.0, 27.0, 41.0, 45.0, 32.0, 55.0, 52.0, 40.0, 45.0, 57.0, 61.0, 49.0, 36.0, 53.0, 35.0, 51.0, 37.0, 27.0, 33.0, 25.0, 19.0, 11.0, 16.0, 11.0, 5.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.22265625, -7.01123046875, -6.7998046875, -6.58837890625, -6.376953125, -6.16552734375, -5.9541015625, -5.74267578125, -5.53125, -5.31982421875, -5.1083984375, -4.89697265625, -4.685546875, -4.47412109375, -4.2626953125, -4.05126953125, -3.83984375, -3.62841796875, -3.4169921875, -3.20556640625, -2.994140625, -2.78271484375, -2.5712890625, -2.35986328125, -2.1484375, -1.93701171875, -1.7255859375, -1.51416015625, -1.302734375, -1.09130859375, -0.8798828125, -0.66845703125, -0.45703125, -0.24560546875, -0.0341796875, 0.17724609375, 0.388671875, 0.60009765625, 0.8115234375, 1.02294921875, 1.234375, 1.44580078125, 1.6572265625, 1.86865234375, 2.080078125, 2.29150390625, 2.5029296875, 2.71435546875, 2.92578125, 3.13720703125, 3.3486328125, 3.56005859375, 3.771484375, 3.98291015625, 4.1943359375, 4.40576171875, 4.6171875, 4.82861328125, 5.0400390625, 5.25146484375, 5.462890625, 5.67431640625, 5.8857421875, 6.09716796875, 6.30859375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 11.0, 15.0, 22.0, 32.0, 45.0, 81.0, 132.0, 239.0, 383.0, 819.0, 1857.0, 4844.0, 15047.0, 81848.0, 3400880.0, 640020.0, 33620.0, 8549.0, 3156.0, 1293.0, 598.0, 309.0, 175.0, 107.0, 64.0, 41.0, 27.0, 17.0, 18.0, 5.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.3125, -41.095703125, -39.87890625, -38.662109375, -37.4453125, -36.228515625, -35.01171875, -33.794921875, -32.578125, -31.361328125, -30.14453125, -28.927734375, -27.7109375, -26.494140625, -25.27734375, -24.060546875, -22.84375, -21.626953125, -20.41015625, -19.193359375, -17.9765625, -16.759765625, -15.54296875, -14.326171875, -13.109375, -11.892578125, -10.67578125, -9.458984375, -8.2421875, -7.025390625, -5.80859375, -4.591796875, -3.375, -2.158203125, -0.94140625, 0.275390625, 1.4921875, 2.708984375, 3.92578125, 5.142578125, 6.359375, 7.576171875, 8.79296875, 10.009765625, 11.2265625, 12.443359375, 13.66015625, 14.876953125, 16.09375, 17.310546875, 18.52734375, 19.744140625, 20.9609375, 22.177734375, 23.39453125, 24.611328125, 25.828125, 27.044921875, 28.26171875, 29.478515625, 30.6953125, 31.912109375, 33.12890625, 34.345703125, 35.5625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 11.0, 21.0, 19.0, 40.0, 55.0, 101.0, 160.0, 253.0, 427.0, 704.0, 828.0, 590.0, 332.0, 201.0, 121.0, 64.0, 40.0, 30.0, 29.0, 15.0, 8.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.25, -33.221435546875, -32.19287109375, -31.164306640625, -30.1357421875, -29.107177734375, -28.07861328125, -27.050048828125, -26.021484375, -24.992919921875, -23.96435546875, -22.935791015625, -21.9072265625, -20.878662109375, -19.85009765625, -18.821533203125, -17.79296875, -16.764404296875, -15.73583984375, -14.707275390625, -13.6787109375, -12.650146484375, -11.62158203125, -10.593017578125, -9.564453125, -8.535888671875, -7.50732421875, -6.478759765625, -5.4501953125, -4.421630859375, -3.39306640625, -2.364501953125, -1.3359375, -0.307373046875, 0.72119140625, 1.749755859375, 2.7783203125, 3.806884765625, 4.83544921875, 5.864013671875, 6.892578125, 7.921142578125, 8.94970703125, 9.978271484375, 11.0068359375, 12.035400390625, 13.06396484375, 14.092529296875, 15.12109375, 16.149658203125, 17.17822265625, 18.206787109375, 19.2353515625, 20.263916015625, 21.29248046875, 22.321044921875, 23.349609375, 24.378173828125, 25.40673828125, 26.435302734375, 27.4638671875, 28.492431640625, 29.52099609375, 30.549560546875, 31.578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 8.0, 5.0, 11.0, 18.0, 19.0, 25.0, 51.0, 85.0, 118.0, 208.0, 425.0, 1958.0, 3494723.0, 694082.0, 1523.0, 433.0, 216.0, 133.0, 71.0, 59.0, 23.0, 31.0, 17.0, 15.0, 5.0, 5.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.125, -93.845703125, -89.56640625, -85.287109375, -81.0078125, -76.728515625, -72.44921875, -68.169921875, -63.890625, -59.611328125, -55.33203125, -51.052734375, -46.7734375, -42.494140625, -38.21484375, -33.935546875, -29.65625, -25.376953125, -21.09765625, -16.818359375, -12.5390625, -8.259765625, -3.98046875, 0.298828125, 4.578125, 8.857421875, 13.13671875, 17.416015625, 21.6953125, 25.974609375, 30.25390625, 34.533203125, 38.8125, 43.091796875, 47.37109375, 51.650390625, 55.9296875, 60.208984375, 64.48828125, 68.767578125, 73.046875, 77.326171875, 81.60546875, 85.884765625, 90.1640625, 94.443359375, 98.72265625, 103.001953125, 107.28125, 111.560546875, 115.83984375, 120.119140625, 124.3984375, 128.677734375, 132.95703125, 137.236328125, 141.515625, 145.794921875, 150.07421875, 154.353515625, 158.6328125, 162.912109375, 167.19140625, 171.470703125, 175.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 82.0, 619.0, 298.0, 12.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-526.989501953125, -517.1840209960938, -507.37847900390625, -497.5729675292969, -487.7674560546875, -477.9619445800781, -468.15643310546875, -458.3509521484375, -448.54541015625, -438.7398986816406, -428.93438720703125, -419.1288757324219, -409.3233642578125, -399.5178527832031, -389.71234130859375, -379.9068603515625, -370.1013488769531, -360.29583740234375, -350.4903259277344, -340.684814453125, -330.8793029785156, -321.07379150390625, -311.2682800292969, -301.4627685546875, -291.65728759765625, -281.8517761230469, -272.0462646484375, -262.2407531738281, -252.43524169921875, -242.62973022460938, -232.82423400878906, -223.0187225341797, -213.2132110595703, -203.40769958496094, -193.60218811035156, -183.7966766357422, -173.99118041992188, -164.1856689453125, -154.38015747070312, -144.57464599609375, -134.76913452148438, -124.963623046875, -115.15811157226562, -105.35260772705078, -95.5470962524414, -85.74158477783203, -75.93608093261719, -66.13056945800781, -56.32505798339844, -46.51954650878906, -36.71403884887695, -26.90852928161621, -17.10301971435547, -7.297508239746094, 2.5079994201660156, 12.313507080078125, 22.1190185546875, 31.924528121948242, 41.730037689208984, 51.535545349121094, 61.34105682373047, 71.14656829833984, 80.95207214355469, 90.75758361816406, 100.56309509277344]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 5.0, 4.0, 5.0, 7.0, 11.0, 22.0, 24.0, 18.0, 30.0, 25.0, 38.0, 40.0, 42.0, 41.0, 45.0, 55.0, 54.0, 46.0, 43.0, 50.0, 53.0, 42.0, 34.0, 43.0, 25.0, 32.0, 20.0, 31.0, 24.0, 21.0, 22.0, 12.0, 7.0, 7.0, 4.0, 10.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.2261962890625, -72.79197692871094, -70.35775756835938, -67.92353057861328, -65.48931121826172, -63.055091857910156, -60.620872497558594, -58.18665313720703, -55.7524299621582, -53.31821060180664, -50.88398742675781, -48.44976806640625, -46.01554870605469, -43.58132553100586, -41.1471061706543, -38.71288299560547, -36.278663635253906, -33.844444274902344, -31.410221099853516, -28.976001739501953, -26.541780471801758, -24.107559204101562, -21.67333984375, -19.239118576049805, -16.80489730834961, -14.370676040649414, -11.936455726623535, -9.502235412597656, -7.068014144897461, -4.633792877197266, -2.1995725631713867, 0.2346477508544922, 2.6688613891601562, 5.103082180023193, 7.5373029708862305, 9.97152328491211, 12.405744552612305, 14.8399658203125, 17.274185180664062, 19.708406448364258, 22.142627716064453, 24.57684898376465, 27.011070251464844, 29.445289611816406, 31.8795108795166, 34.3137321472168, 36.74795150756836, 39.18217468261719, 41.61639404296875, 44.05061340332031, 46.48483657836914, 48.9190559387207, 51.35327911376953, 53.787498474121094, 56.221717834472656, 58.65593719482422, 61.09016036987305, 63.52437973022461, 65.95860290527344, 68.392822265625, 70.82704162597656, 73.26126098632812, 75.69548797607422, 78.12970733642578, 80.56392669677734]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 16.0, 17.0, 17.0, 23.0, 19.0, 19.0, 27.0, 38.0, 34.0, 41.0, 47.0, 43.0, 43.0, 36.0, 49.0, 52.0, 64.0, 41.0, 48.0, 41.0, 42.0, 36.0, 36.0, 25.0, 34.0, 22.0, 16.0, 16.0, 19.0, 9.0, 7.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.01800537109375, -5.8172607421875, -5.61651611328125, -5.415771484375, -5.21502685546875, -5.0142822265625, -4.81353759765625, -4.61279296875, -4.41204833984375, -4.2113037109375, -4.01055908203125, -3.809814453125, -3.60906982421875, -3.4083251953125, -3.20758056640625, -3.0068359375, -2.80609130859375, -2.6053466796875, -2.40460205078125, -2.203857421875, -2.00311279296875, -1.8023681640625, -1.60162353515625, -1.40087890625, -1.20013427734375, -0.9993896484375, -0.79864501953125, -0.597900390625, -0.39715576171875, -0.1964111328125, 0.00433349609375, 0.205078125, 0.40582275390625, 0.6065673828125, 0.80731201171875, 1.008056640625, 1.20880126953125, 1.4095458984375, 1.61029052734375, 1.81103515625, 2.01177978515625, 2.2125244140625, 2.41326904296875, 2.614013671875, 2.81475830078125, 3.0155029296875, 3.21624755859375, 3.4169921875, 3.61773681640625, 3.8184814453125, 4.01922607421875, 4.219970703125, 4.42071533203125, 4.6214599609375, 4.82220458984375, 5.02294921875, 5.22369384765625, 5.4244384765625, 5.62518310546875, 5.825927734375, 6.02667236328125, 6.2274169921875, 6.42816162109375, 6.62890625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 14.0, 11.0, 26.0, 49.0, 61.0, 105.0, 136.0, 232.0, 335.0, 551.0, 846.0, 1300.0, 2074.0, 3348.0, 5380.0, 8925.0, 14475.0, 24006.0, 39963.0, 66798.0, 109409.0, 176064.0, 225560.0, 144446.0, 88432.0, 53493.0, 32439.0, 19450.0, 11754.0, 7115.0, 4385.0, 2761.0, 1677.0, 1039.0, 665.0, 408.0, 253.0, 196.0, 111.0, 67.0, 54.0, 48.0, 24.0, 20.0, 18.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.85546875, -0.8289718627929688, -0.8024749755859375, -0.7759780883789062, -0.749481201171875, -0.7229843139648438, -0.6964874267578125, -0.6699905395507812, -0.64349365234375, -0.6169967651367188, -0.5904998779296875, -0.5640029907226562, -0.537506103515625, -0.5110092163085938, -0.4845123291015625, -0.45801544189453125, -0.4315185546875, -0.40502166748046875, -0.3785247802734375, -0.35202789306640625, -0.325531005859375, -0.29903411865234375, -0.2725372314453125, -0.24604034423828125, -0.21954345703125, -0.19304656982421875, -0.1665496826171875, -0.14005279541015625, -0.113555908203125, -0.08705902099609375, -0.0605621337890625, -0.03406524658203125, -0.007568359375, 0.01892852783203125, 0.0454254150390625, 0.07192230224609375, 0.098419189453125, 0.12491607666015625, 0.1514129638671875, 0.17790985107421875, 0.20440673828125, 0.23090362548828125, 0.2574005126953125, 0.28389739990234375, 0.310394287109375, 0.33689117431640625, 0.3633880615234375, 0.38988494873046875, 0.4163818359375, 0.44287872314453125, 0.4693756103515625, 0.49587249755859375, 0.522369384765625, 0.5488662719726562, 0.5753631591796875, 0.6018600463867188, 0.62835693359375, 0.6548538208007812, 0.6813507080078125, 0.7078475952148438, 0.734344482421875, 0.7608413696289062, 0.7873382568359375, 0.8138351440429688, 0.84033203125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 1.0, 6.0, 3.0, 8.0, 15.0, 7.0, 17.0, 10.0, 14.0, 25.0, 33.0, 34.0, 19.0, 26.0, 34.0, 40.0, 35.0, 39.0, 47.0, 36.0, 1061.0, 51.0, 46.0, 40.0, 45.0, 42.0, 42.0, 32.0, 29.0, 29.0, 18.0, 20.0, 19.0, 23.0, 16.0, 10.0, 15.0, 7.0, 5.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.576171875, -3.466796875, -3.357421875, -3.248046875, -3.138671875, -3.029296875, -2.919921875, -2.810546875, -2.701171875, -2.591796875, -2.482421875, -2.373046875, -2.263671875, -2.154296875, -2.044921875, -1.935546875, -1.826171875, -1.716796875, -1.607421875, -1.498046875, -1.388671875, -1.279296875, -1.169921875, -1.060546875, -0.951171875, -0.841796875, -0.732421875, -0.623046875, -0.513671875, -0.404296875, -0.294921875, -0.185546875, -0.076171875, 0.033203125, 0.142578125, 0.251953125, 0.361328125, 0.470703125, 0.580078125, 0.689453125, 0.798828125, 0.908203125, 1.017578125, 1.126953125, 1.236328125, 1.345703125, 1.455078125, 1.564453125, 1.673828125, 1.783203125, 1.892578125, 2.001953125, 2.111328125, 2.220703125, 2.330078125, 2.439453125, 2.548828125, 2.658203125, 2.767578125, 2.876953125, 2.986328125, 3.095703125, 3.205078125, 3.314453125, 3.423828125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 2.0, 8.0, 6.0, 14.0, 21.0, 32.0, 40.0, 60.0, 104.0, 150.0, 224.0, 330.0, 512.0, 776.0, 1231.0, 1898.0, 2983.0, 4656.0, 7609.0, 11910.0, 19415.0, 31709.0, 51009.0, 83708.0, 133248.0, 1253794.0, 185341.0, 116215.0, 72561.0, 44711.0, 27564.0, 16985.0, 10397.0, 6547.0, 4056.0, 2569.0, 1624.0, 1060.0, 692.0, 474.0, 299.0, 212.0, 136.0, 87.0, 47.0, 40.0, 24.0, 17.0, 18.0, 9.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6337966918945312, -0.6118316650390625, -0.5898666381835938, -0.567901611328125, -0.5459365844726562, -0.5239715576171875, -0.5020065307617188, -0.48004150390625, -0.45807647705078125, -0.4361114501953125, -0.41414642333984375, -0.392181396484375, -0.37021636962890625, -0.3482513427734375, -0.32628631591796875, -0.3043212890625, -0.28235626220703125, -0.2603912353515625, -0.23842620849609375, -0.216461181640625, -0.19449615478515625, -0.1725311279296875, -0.15056610107421875, -0.12860107421875, -0.10663604736328125, -0.0846710205078125, -0.06270599365234375, -0.040740966796875, -0.01877593994140625, 0.0031890869140625, 0.02515411376953125, 0.047119140625, 0.06908416748046875, 0.0910491943359375, 0.11301422119140625, 0.134979248046875, 0.15694427490234375, 0.1789093017578125, 0.20087432861328125, 0.22283935546875, 0.24480438232421875, 0.2667694091796875, 0.28873443603515625, 0.310699462890625, 0.33266448974609375, 0.3546295166015625, 0.37659454345703125, 0.3985595703125, 0.42052459716796875, 0.4424896240234375, 0.46445465087890625, 0.486419677734375, 0.5083847045898438, 0.5303497314453125, 0.5523147583007812, 0.57427978515625, 0.5962448120117188, 0.6182098388671875, 0.6401748657226562, 0.662139892578125, 0.6841049194335938, 0.7060699462890625, 0.7280349731445312, 0.75]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 8.0, 8.0, 9.0, 17.0, 14.0, 25.0, 18.0, 33.0, 46.0, 50.0, 73.0, 59.0, 70.0, 85.0, 88.0, 79.0, 60.0, 51.0, 45.0, 36.0, 27.0, 17.0, 11.0, 19.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0014743804931640625, -0.001429229974746704, -0.0013840794563293457, -0.0013389289379119873, -0.001293778419494629, -0.0012486279010772705, -0.0012034773826599121, -0.0011583268642425537, -0.0011131763458251953, -0.001068025827407837, -0.0010228753089904785, -0.0009777247905731201, -0.0009325742721557617, -0.0008874237537384033, -0.0008422732353210449, -0.0007971227169036865, -0.0007519721984863281, -0.0007068216800689697, -0.0006616711616516113, -0.0006165206432342529, -0.0005713701248168945, -0.0005262196063995361, -0.00048106908798217773, -0.00043591856956481934, -0.00039076805114746094, -0.00034561753273010254, -0.00030046701431274414, -0.00025531649589538574, -0.00021016597747802734, -0.00016501545906066895, -0.00011986494064331055, -7.471442222595215e-05, -2.956390380859375e-05, 1.558661460876465e-05, 6.073713302612305e-05, 0.00010588765144348145, 0.00015103816986083984, 0.00019618868827819824, 0.00024133920669555664, 0.00028648972511291504, 0.00033164024353027344, 0.00037679076194763184, 0.00042194128036499023, 0.00046709179878234863, 0.000512242317199707, 0.0005573928356170654, 0.0006025433540344238, 0.0006476938724517822, 0.0006928443908691406, 0.000737994909286499, 0.0007831454277038574, 0.0008282959461212158, 0.0008734464645385742, 0.0009185969829559326, 0.000963747501373291, 0.0010088980197906494, 0.0010540485382080078, 0.0010991990566253662, 0.0011443495750427246, 0.001189500093460083, 0.0012346506118774414, 0.0012798011302947998, 0.0013249516487121582, 0.0013701021671295166, 0.001415252685546875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 7.0, 12.0, 20.0, 14.0, 19.0, 22.0, 34.0, 43.0, 48.0, 69.0, 123.0, 164.0, 181.0, 264.0, 642.0, 8181.0, 1034501.0, 2754.0, 499.0, 268.0, 199.0, 116.0, 86.0, 74.0, 47.0, 35.0, 23.0, 14.0, 17.0, 12.0, 12.0, 18.0, 7.0, 6.0, 1.0, 6.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025634765625, -0.024762630462646484, -0.02389049530029297, -0.023018360137939453, -0.022146224975585938, -0.021274089813232422, -0.020401954650878906, -0.01952981948852539, -0.018657684326171875, -0.01778554916381836, -0.016913414001464844, -0.016041278839111328, -0.015169143676757812, -0.014297008514404297, -0.013424873352050781, -0.012552738189697266, -0.01168060302734375, -0.010808467864990234, -0.009936332702636719, -0.009064197540283203, -0.008192062377929688, -0.007319927215576172, -0.006447792053222656, -0.005575656890869141, -0.004703521728515625, -0.0038313865661621094, -0.0029592514038085938, -0.002087116241455078, -0.0012149810791015625, -0.0003428459167480469, 0.0005292892456054688, 0.0014014244079589844, 0.0022735595703125, 0.0031456947326660156, 0.004017829895019531, 0.004889965057373047, 0.0057621002197265625, 0.006634235382080078, 0.007506370544433594, 0.00837850570678711, 0.009250640869140625, 0.01012277603149414, 0.010994911193847656, 0.011867046356201172, 0.012739181518554688, 0.013611316680908203, 0.014483451843261719, 0.015355587005615234, 0.01622772216796875, 0.017099857330322266, 0.01797199249267578, 0.018844127655029297, 0.019716262817382812, 0.020588397979736328, 0.021460533142089844, 0.02233266830444336, 0.023204803466796875, 0.02407693862915039, 0.024949073791503906, 0.025821208953857422, 0.026693344116210938, 0.027565479278564453, 0.02843761444091797, 0.029309749603271484, 0.030181884765625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 47.0, 370.0, 497.0, 81.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0035810621920973063, -0.0034896391443908215, -0.0033982160966843367, -0.003306793048977852, -0.0032153702341020107, -0.003123947186395526, -0.003032524138689041, -0.0029411010909825563, -0.0028496780432760715, -0.0027582549955695868, -0.002666831947863102, -0.002575408900156617, -0.0024839858524501324, -0.0023925630375742912, -0.0023011399898678064, -0.0022097169421613216, -0.002118293894454837, -0.002026870846748352, -0.0019354477990418673, -0.0018440248677507043, -0.0017526018200442195, -0.0016611787723377347, -0.0015697558410465717, -0.001478332793340087, -0.0013869097456336021, -0.0012954866979271173, -0.0012040636502206326, -0.0011126407189294696, -0.0010212176712229848, -0.0009297946235165, -0.0008383716340176761, -0.0007469486445188522, -0.0006555255968123674, -0.0005641025491058826, -0.00047267955960705876, -0.0003812565410044044, -0.0002898335224017501, -0.00019841050379909575, -0.00010698748519644141, -1.556449569761753e-05, 7.585855200886726e-05, 0.0001672815706115216, 0.00025870458921417594, 0.0003501276078168303, 0.0004415506264194846, 0.0005329736741259694, 0.0006243966636247933, 0.0007158196531236172, 0.000807242700830102, 0.0008986657485365868, 0.0009900887962430716, 0.0010815117275342345, 0.0011729347752407193, 0.0012643578229472041, 0.001355780754238367, 0.0014472038019448519, 0.0015386268496513367, 0.0016300498973578215, 0.0017214729450643063, 0.0018128958763554692, 0.001904318924061954, 0.001995741855353117, 0.002087164903059602, 0.0021785879507660866, 0.0022700109984725714]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 4.0, 12.0, 9.0, 11.0, 17.0, 18.0, 22.0, 22.0, 41.0, 27.0, 26.0, 21.0, 39.0, 29.0, 40.0, 38.0, 45.0, 46.0, 47.0, 53.0, 49.0, 40.0, 29.0, 37.0, 24.0, 34.0, 37.0, 24.0, 22.0, 21.0, 15.0, 21.0, 10.0, 12.0, 9.0, 9.0, 6.0, 11.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005835890769958496, -0.0005641374737024307, -0.0005446858704090118, -0.000525234267115593, -0.0005057826638221741, -0.0004863310605287552, -0.0004668794572353363, -0.0004474278539419174, -0.00042797625064849854, -0.00040852464735507965, -0.00038907304406166077, -0.0003696214407682419, -0.000350169837474823, -0.0003307182341814041, -0.00031126663088798523, -0.00029181502759456635, -0.00027236342430114746, -0.0002529118210077286, -0.0002334602177143097, -0.0002140086144208908, -0.00019455701112747192, -0.00017510540783405304, -0.00015565380454063416, -0.00013620220124721527, -0.00011675059795379639, -9.72989946603775e-05, -7.784739136695862e-05, -5.8395788073539734e-05, -3.894418478012085e-05, -1.9492581486701965e-05, -4.0978193283081055e-08, 1.9410625100135803e-05, 3.886222839355469e-05, 5.831383168697357e-05, 7.776543498039246e-05, 9.721703827381134e-05, 0.00011666864156723022, 0.0001361202448606491, 0.000155571848154068, 0.00017502345144748688, 0.00019447505474090576, 0.00021392665803432465, 0.00023337826132774353, 0.0002528298646211624, 0.0002722814679145813, 0.0002917330712080002, 0.00031118467450141907, 0.00033063627779483795, 0.00035008788108825684, 0.0003695394843816757, 0.0003889910876750946, 0.0004084426909685135, 0.0004278942942619324, 0.00044734589755535126, 0.00046679750084877014, 0.000486249104142189, 0.0005057007074356079, 0.0005251523107290268, 0.0005446039140224457, 0.0005640555173158646, 0.0005835071206092834, 0.0006029587239027023, 0.0006224103271961212, 0.0006418619304895401, 0.000661313533782959]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 16.0, 17.0, 17.0, 23.0, 19.0, 19.0, 27.0, 38.0, 34.0, 41.0, 47.0, 43.0, 43.0, 36.0, 49.0, 52.0, 64.0, 41.0, 48.0, 41.0, 42.0, 36.0, 36.0, 25.0, 34.0, 22.0, 16.0, 16.0, 19.0, 9.0, 7.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.01800537109375, -5.8172607421875, -5.61651611328125, -5.415771484375, -5.21502685546875, -5.0142822265625, -4.81353759765625, -4.61279296875, -4.41204833984375, -4.2113037109375, -4.01055908203125, -3.809814453125, -3.60906982421875, -3.4083251953125, -3.20758056640625, -3.0068359375, -2.80609130859375, -2.6053466796875, -2.40460205078125, -2.203857421875, -2.00311279296875, -1.8023681640625, -1.60162353515625, -1.40087890625, -1.20013427734375, -0.9993896484375, -0.79864501953125, -0.597900390625, -0.39715576171875, -0.1964111328125, 0.00433349609375, 0.205078125, 0.40582275390625, 0.6065673828125, 0.80731201171875, 1.008056640625, 1.20880126953125, 1.4095458984375, 1.61029052734375, 1.81103515625, 2.01177978515625, 2.2125244140625, 2.41326904296875, 2.614013671875, 2.81475830078125, 3.0155029296875, 3.21624755859375, 3.4169921875, 3.61773681640625, 3.8184814453125, 4.01922607421875, 4.219970703125, 4.42071533203125, 4.6214599609375, 4.82220458984375, 5.02294921875, 5.22369384765625, 5.4244384765625, 5.62518310546875, 5.825927734375, 6.02667236328125, 6.2274169921875, 6.42816162109375, 6.62890625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 13.0, 10.0, 22.0, 32.0, 47.0, 61.0, 85.0, 132.0, 197.0, 293.0, 442.0, 809.0, 1523.0, 3349.0, 9449.0, 33706.0, 160917.0, 589902.0, 190129.0, 39143.0, 10620.0, 3719.0, 1649.0, 835.0, 518.0, 293.0, 203.0, 138.0, 101.0, 70.0, 46.0, 24.0, 20.0, 19.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.28515625, -6.0859375, -5.88671875, -5.6875, -5.48828125, -5.2890625, -5.08984375, -4.890625, -4.69140625, -4.4921875, -4.29296875, -4.09375, -3.89453125, -3.6953125, -3.49609375, -3.296875, -3.09765625, -2.8984375, -2.69921875, -2.5, -2.30078125, -2.1015625, -1.90234375, -1.703125, -1.50390625, -1.3046875, -1.10546875, -0.90625, -0.70703125, -0.5078125, -0.30859375, -0.109375, 0.08984375, 0.2890625, 0.48828125, 0.6875, 0.88671875, 1.0859375, 1.28515625, 1.484375, 1.68359375, 1.8828125, 2.08203125, 2.28125, 2.48046875, 2.6796875, 2.87890625, 3.078125, 3.27734375, 3.4765625, 3.67578125, 3.875, 4.07421875, 4.2734375, 4.47265625, 4.671875, 4.87109375, 5.0703125, 5.26953125, 5.46875, 5.66796875, 5.8671875, 6.06640625, 6.265625, 6.46484375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 2.0, 9.0, 9.0, 4.0, 14.0, 13.0, 21.0, 18.0, 18.0, 26.0, 40.0, 29.0, 45.0, 48.0, 47.0, 51.0, 64.0, 354.0, 1728.0, 91.0, 63.0, 40.0, 23.0, 52.0, 41.0, 34.0, 25.0, 26.0, 18.0, 16.0, 18.0, 16.0, 9.0, 6.0, 7.0, 8.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.890625, -22.219970703125, -21.54931640625, -20.878662109375, -20.2080078125, -19.537353515625, -18.86669921875, -18.196044921875, -17.525390625, -16.854736328125, -16.18408203125, -15.513427734375, -14.8427734375, -14.172119140625, -13.50146484375, -12.830810546875, -12.16015625, -11.489501953125, -10.81884765625, -10.148193359375, -9.4775390625, -8.806884765625, -8.13623046875, -7.465576171875, -6.794921875, -6.124267578125, -5.45361328125, -4.782958984375, -4.1123046875, -3.441650390625, -2.77099609375, -2.100341796875, -1.4296875, -0.759033203125, -0.08837890625, 0.582275390625, 1.2529296875, 1.923583984375, 2.59423828125, 3.264892578125, 3.935546875, 4.606201171875, 5.27685546875, 5.947509765625, 6.6181640625, 7.288818359375, 7.95947265625, 8.630126953125, 9.30078125, 9.971435546875, 10.64208984375, 11.312744140625, 11.9833984375, 12.654052734375, 13.32470703125, 13.995361328125, 14.666015625, 15.336669921875, 16.00732421875, 16.677978515625, 17.3486328125, 18.019287109375, 18.68994140625, 19.360595703125, 20.03125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 5.0, 8.0, 7.0, 13.0, 14.0, 15.0, 12.0, 20.0, 24.0, 22.0, 48.0, 50.0, 74.0, 68.0, 127.0, 356.0, 1040.0, 47212.0, 3092069.0, 3242.0, 563.0, 218.0, 108.0, 81.0, 64.0, 40.0, 40.0, 28.0, 23.0, 20.0, 16.0, 12.0, 17.0, 8.0, 5.0, 6.0, 6.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.6875, -42.24365234375, -40.7998046875, -39.35595703125, -37.912109375, -36.46826171875, -35.0244140625, -33.58056640625, -32.13671875, -30.69287109375, -29.2490234375, -27.80517578125, -26.361328125, -24.91748046875, -23.4736328125, -22.02978515625, -20.5859375, -19.14208984375, -17.6982421875, -16.25439453125, -14.810546875, -13.36669921875, -11.9228515625, -10.47900390625, -9.03515625, -7.59130859375, -6.1474609375, -4.70361328125, -3.259765625, -1.81591796875, -0.3720703125, 1.07177734375, 2.515625, 3.95947265625, 5.4033203125, 6.84716796875, 8.291015625, 9.73486328125, 11.1787109375, 12.62255859375, 14.06640625, 15.51025390625, 16.9541015625, 18.39794921875, 19.841796875, 21.28564453125, 22.7294921875, 24.17333984375, 25.6171875, 27.06103515625, 28.5048828125, 29.94873046875, 31.392578125, 32.83642578125, 34.2802734375, 35.72412109375, 37.16796875, 38.61181640625, 40.0556640625, 41.49951171875, 42.943359375, 44.38720703125, 45.8310546875, 47.27490234375, 48.71875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 778.0, 207.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.676727294921875, -34.175716400146484, -30.674705505371094, -27.17369270324707, -23.67268180847168, -20.17167091369629, -16.670658111572266, -13.169647216796875, -9.668636322021484, -6.1676249504089355, -2.6666135787963867, 0.8343982696533203, 4.335409164428711, 7.836420059204102, 11.337432861328125, 14.838443756103516, 18.339454650878906, 21.840465545654297, 25.341476440429688, 28.84248924255371, 32.34349822998047, 35.844512939453125, 39.345523834228516, 42.846534729003906, 46.3475456237793, 49.84855651855469, 53.34956741333008, 56.85057830810547, 60.351593017578125, 63.85260009765625, 67.3536148071289, 70.85462951660156, 74.35563659667969, 77.85665130615234, 81.35765838623047, 84.85867309570312, 88.35968017578125, 91.8606948852539, 95.36170959472656, 98.86271667480469, 102.36372375488281, 105.86473846435547, 109.3657455444336, 112.86676025390625, 116.36776733398438, 119.86878204345703, 123.36979675292969, 126.87080383300781, 130.371826171875, 133.87283325195312, 137.3738555908203, 140.87486267089844, 144.37586975097656, 147.8768768310547, 151.37789916992188, 154.87890625, 158.37991333007812, 161.88092041015625, 165.38194274902344, 168.88294982910156, 172.3839569091797, 175.8849639892578, 179.385986328125, 182.88699340820312, 186.38800048828125]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 8.0, 9.0, 7.0, 16.0, 19.0, 18.0, 19.0, 27.0, 25.0, 38.0, 44.0, 38.0, 41.0, 46.0, 54.0, 30.0, 51.0, 53.0, 47.0, 39.0, 52.0, 50.0, 28.0, 40.0, 36.0, 37.0, 21.0, 18.0, 16.0, 12.0, 18.0, 9.0, 3.0, 8.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.67066955566406, -55.525943756103516, -53.38121795654297, -51.23649215698242, -49.091766357421875, -46.94703674316406, -44.802310943603516, -42.65758514404297, -40.51285934448242, -38.368133544921875, -36.22340774536133, -34.07868194580078, -31.9339542388916, -29.789228439331055, -27.644500732421875, -25.499774932861328, -23.35504913330078, -21.210323333740234, -19.065597534179688, -16.920869827270508, -14.776144027709961, -12.631418228149414, -10.48669147491455, -8.341964721679688, -6.197238922119141, -4.0525126457214355, -1.9077863693237305, 0.2369399070739746, 2.3816661834716797, 4.526391983032227, 6.67111873626709, 8.815845489501953, 10.9605712890625, 13.105297088623047, 15.25002384185791, 17.394750595092773, 19.53947639465332, 21.684202194213867, 23.828929901123047, 25.973655700683594, 28.11838150024414, 30.263107299804688, 32.407833099365234, 34.55255889892578, 36.697288513183594, 38.842010498046875, 40.98674011230469, 43.131465911865234, 45.27619171142578, 47.42091751098633, 49.565643310546875, 51.71036911010742, 53.85509490966797, 55.99982452392578, 58.14455032348633, 60.289276123046875, 62.43400192260742, 64.57872772216797, 66.72345733642578, 68.86817932128906, 71.01290893554688, 73.15763092041016, 75.30236053466797, 77.44708251953125, 79.59181213378906]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 8.0, 18.0, 13.0, 17.0, 22.0, 21.0, 20.0, 25.0, 33.0, 48.0, 30.0, 49.0, 45.0, 40.0, 38.0, 52.0, 62.0, 44.0, 46.0, 43.0, 55.0, 34.0, 42.0, 31.0, 29.0, 27.0, 27.0, 13.0, 13.0, 17.0, 9.0, 11.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.11328125, -5.90863037109375, -5.7039794921875, -5.49932861328125, -5.294677734375, -5.09002685546875, -4.8853759765625, -4.68072509765625, -4.47607421875, -4.27142333984375, -4.0667724609375, -3.86212158203125, -3.657470703125, -3.45281982421875, -3.2481689453125, -3.04351806640625, -2.8388671875, -2.63421630859375, -2.4295654296875, -2.22491455078125, -2.020263671875, -1.81561279296875, -1.6109619140625, -1.40631103515625, -1.20166015625, -0.99700927734375, -0.7923583984375, -0.58770751953125, -0.383056640625, -0.17840576171875, 0.0262451171875, 0.23089599609375, 0.435546875, 0.64019775390625, 0.8448486328125, 1.04949951171875, 1.254150390625, 1.45880126953125, 1.6634521484375, 1.86810302734375, 2.07275390625, 2.27740478515625, 2.4820556640625, 2.68670654296875, 2.891357421875, 3.09600830078125, 3.3006591796875, 3.50531005859375, 3.7099609375, 3.91461181640625, 4.1192626953125, 4.32391357421875, 4.528564453125, 4.73321533203125, 4.9378662109375, 5.14251708984375, 5.34716796875, 5.55181884765625, 5.7564697265625, 5.96112060546875, 6.165771484375, 6.37042236328125, 6.5750732421875, 6.77972412109375, 6.984375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 8.0, 13.0, 5.0, 15.0, 22.0, 25.0, 37.0, 41.0, 65.0, 100.0, 141.0, 274.0, 667.0, 2686.0, 21747.0, 643685.0, 3342953.0, 169786.0, 9406.0, 1518.0, 476.0, 212.0, 121.0, 73.0, 47.0, 30.0, 35.0, 27.0, 19.0, 10.0, 9.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.4375, -24.696533203125, -23.95556640625, -23.214599609375, -22.4736328125, -21.732666015625, -20.99169921875, -20.250732421875, -19.509765625, -18.768798828125, -18.02783203125, -17.286865234375, -16.5458984375, -15.804931640625, -15.06396484375, -14.322998046875, -13.58203125, -12.841064453125, -12.10009765625, -11.359130859375, -10.6181640625, -9.877197265625, -9.13623046875, -8.395263671875, -7.654296875, -6.913330078125, -6.17236328125, -5.431396484375, -4.6904296875, -3.949462890625, -3.20849609375, -2.467529296875, -1.7265625, -0.985595703125, -0.24462890625, 0.496337890625, 1.2373046875, 1.978271484375, 2.71923828125, 3.460205078125, 4.201171875, 4.942138671875, 5.68310546875, 6.424072265625, 7.1650390625, 7.906005859375, 8.64697265625, 9.387939453125, 10.12890625, 10.869873046875, 11.61083984375, 12.351806640625, 13.0927734375, 13.833740234375, 14.57470703125, 15.315673828125, 16.056640625, 16.797607421875, 17.53857421875, 18.279541015625, 19.0205078125, 19.761474609375, 20.50244140625, 21.243408203125, 21.984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 14.0, 25.0, 32.0, 53.0, 89.0, 115.0, 180.0, 268.0, 407.0, 607.0, 660.0, 523.0, 354.0, 265.0, 156.0, 95.0, 75.0, 47.0, 32.0, 17.0, 15.0, 12.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.34375, -24.560546875, -23.77734375, -22.994140625, -22.2109375, -21.427734375, -20.64453125, -19.861328125, -19.078125, -18.294921875, -17.51171875, -16.728515625, -15.9453125, -15.162109375, -14.37890625, -13.595703125, -12.8125, -12.029296875, -11.24609375, -10.462890625, -9.6796875, -8.896484375, -8.11328125, -7.330078125, -6.546875, -5.763671875, -4.98046875, -4.197265625, -3.4140625, -2.630859375, -1.84765625, -1.064453125, -0.28125, 0.501953125, 1.28515625, 2.068359375, 2.8515625, 3.634765625, 4.41796875, 5.201171875, 5.984375, 6.767578125, 7.55078125, 8.333984375, 9.1171875, 9.900390625, 10.68359375, 11.466796875, 12.25, 13.033203125, 13.81640625, 14.599609375, 15.3828125, 16.166015625, 16.94921875, 17.732421875, 18.515625, 19.298828125, 20.08203125, 20.865234375, 21.6484375, 22.431640625, 23.21484375, 23.998046875, 24.78125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 12.0, 10.0, 31.0, 52.0, 77.0, 122.0, 208.0, 359.0, 780.0, 4845.0, 1651574.0, 2528988.0, 5417.0, 868.0, 365.0, 207.0, 121.0, 75.0, 53.0, 36.0, 22.0, 14.0, 12.0, 7.0, 4.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.25, -56.6767578125, -54.103515625, -51.5302734375, -48.95703125, -46.3837890625, -43.810546875, -41.2373046875, -38.6640625, -36.0908203125, -33.517578125, -30.9443359375, -28.37109375, -25.7978515625, -23.224609375, -20.6513671875, -18.078125, -15.5048828125, -12.931640625, -10.3583984375, -7.78515625, -5.2119140625, -2.638671875, -0.0654296875, 2.5078125, 5.0810546875, 7.654296875, 10.2275390625, 12.80078125, 15.3740234375, 17.947265625, 20.5205078125, 23.09375, 25.6669921875, 28.240234375, 30.8134765625, 33.38671875, 35.9599609375, 38.533203125, 41.1064453125, 43.6796875, 46.2529296875, 48.826171875, 51.3994140625, 53.97265625, 56.5458984375, 59.119140625, 61.6923828125, 64.265625, 66.8388671875, 69.412109375, 71.9853515625, 74.55859375, 77.1318359375, 79.705078125, 82.2783203125, 84.8515625, 87.4248046875, 89.998046875, 92.5712890625, 95.14453125, 97.7177734375, 100.291015625, 102.8642578125, 105.4375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 106.0, 490.0, 356.0, 59.0, 5.0], "bins": [-534.0560302734375, -525.2754516601562, -516.494873046875, -507.71429443359375, -498.9337158203125, -490.15313720703125, -481.37255859375, -472.5919494628906, -463.8113708496094, -455.0307922363281, -446.2502136230469, -437.4696350097656, -428.6890563964844, -419.908447265625, -411.12786865234375, -402.3472900390625, -393.56671142578125, -384.7861328125, -376.00555419921875, -367.2249755859375, -358.44439697265625, -349.663818359375, -340.88323974609375, -332.1026306152344, -323.32208251953125, -314.54150390625, -305.76092529296875, -296.9803466796875, -288.19976806640625, -279.419189453125, -270.63861083984375, -261.8580017089844, -253.0774383544922, -244.29685974121094, -235.5162811279297, -226.73568725585938, -217.95510864257812, -209.17453002929688, -200.39395141601562, -191.61337280273438, -182.83277893066406, -174.0522003173828, -165.27162170410156, -156.49102783203125, -147.71044921875, -138.92987060546875, -130.1492919921875, -121.36871337890625, -112.58812713623047, -103.80754852294922, -95.02696228027344, -86.24638366699219, -77.46580505371094, -68.68521881103516, -59.904640197753906, -51.12405776977539, -42.343475341796875, -33.56289291381836, -24.782312393188477, -16.001731872558594, -7.221149444580078, 1.5594329833984375, 10.340011596679688, 19.120594024658203, 27.901174545288086]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 2.0, 4.0, 3.0, 3.0, 8.0, 14.0, 8.0, 8.0, 17.0, 18.0, 27.0, 20.0, 37.0, 24.0, 37.0, 33.0, 17.0, 32.0, 38.0, 27.0, 46.0, 34.0, 41.0, 41.0, 28.0, 35.0, 41.0, 48.0, 38.0, 26.0, 26.0, 29.0, 24.0, 26.0, 16.0, 20.0, 15.0, 10.0, 11.0, 17.0, 6.0, 7.0, 10.0, 6.0, 10.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-62.429046630859375, -60.59641647338867, -58.76378631591797, -56.93115997314453, -55.09852981567383, -53.265899658203125, -51.43326950073242, -49.60063934326172, -47.76801300048828, -45.93538284301758, -44.102752685546875, -42.27012634277344, -40.437496185302734, -38.60486602783203, -36.77223587036133, -34.939605712890625, -33.10697555541992, -31.27434539794922, -29.44171714782715, -27.609086990356445, -25.776458740234375, -23.943828582763672, -22.11119842529297, -20.278568267822266, -18.445940017700195, -16.613309860229492, -14.780681610107422, -12.948051452636719, -11.115422248840332, -9.282793045043945, -7.450162887573242, -5.6175336837768555, -3.7849044799804688, -1.952275037765503, -0.11964559555053711, 1.7129840850830078, 3.5456132888793945, 5.378242492675781, 7.210872650146484, 9.043501853942871, 10.876131057739258, 12.708760261535645, 14.541389465332031, 16.374019622802734, 18.206649780273438, 20.039278030395508, 21.87190818786621, 23.70453643798828, 25.537166595458984, 27.369796752929688, 29.202425003051758, 31.03505516052246, 32.86768341064453, 34.700313568115234, 36.53294372558594, 38.36557388305664, 40.198204040527344, 42.03083419799805, 43.86346435546875, 45.69609069824219, 47.52872085571289, 49.361351013183594, 51.1939811706543, 53.026611328125, 54.85923767089844]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 14.0, 10.0, 9.0, 17.0, 10.0, 25.0, 24.0, 27.0, 27.0, 30.0, 32.0, 32.0, 44.0, 43.0, 46.0, 49.0, 45.0, 44.0, 46.0, 57.0, 42.0, 37.0, 49.0, 37.0, 32.0, 34.0, 23.0, 20.0, 23.0, 14.0, 14.0, 8.0, 9.0, 11.0, 6.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.7542724609375, -5.555419921875, -5.3565673828125, -5.15771484375, -4.9588623046875, -4.760009765625, -4.5611572265625, -4.3623046875, -4.1634521484375, -3.964599609375, -3.7657470703125, -3.56689453125, -3.3680419921875, -3.169189453125, -2.9703369140625, -2.771484375, -2.5726318359375, -2.373779296875, -2.1749267578125, -1.97607421875, -1.7772216796875, -1.578369140625, -1.3795166015625, -1.1806640625, -0.9818115234375, -0.782958984375, -0.5841064453125, -0.38525390625, -0.1864013671875, 0.012451171875, 0.2113037109375, 0.41015625, 0.6090087890625, 0.807861328125, 1.0067138671875, 1.20556640625, 1.4044189453125, 1.603271484375, 1.8021240234375, 2.0009765625, 2.1998291015625, 2.398681640625, 2.5975341796875, 2.79638671875, 2.9952392578125, 3.194091796875, 3.3929443359375, 3.591796875, 3.7906494140625, 3.989501953125, 4.1883544921875, 4.38720703125, 4.5860595703125, 4.784912109375, 4.9837646484375, 5.1826171875, 5.3814697265625, 5.580322265625, 5.7791748046875, 5.97802734375, 6.1768798828125, 6.375732421875, 6.5745849609375, 6.7734375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 10.0, 6.0, 7.0, 11.0, 31.0, 31.0, 53.0, 73.0, 128.0, 187.0, 308.0, 481.0, 718.0, 1219.0, 1949.0, 3326.0, 5491.0, 8985.0, 15255.0, 25142.0, 42550.0, 71816.0, 120532.0, 192259.0, 215563.0, 137405.0, 83017.0, 49137.0, 29052.0, 17386.0, 10431.0, 6310.0, 3739.0, 2252.0, 1402.0, 861.0, 544.0, 289.0, 209.0, 128.0, 96.0, 49.0, 42.0, 35.0, 11.0, 17.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0], "bins": [-1.0087890625, -0.9808731079101562, -0.9529571533203125, -0.9250411987304688, -0.897125244140625, -0.8692092895507812, -0.8412933349609375, -0.8133773803710938, -0.78546142578125, -0.7575454711914062, -0.7296295166015625, -0.7017135620117188, -0.673797607421875, -0.6458816528320312, -0.6179656982421875, -0.5900497436523438, -0.5621337890625, -0.5342178344726562, -0.5063018798828125, -0.47838592529296875, -0.450469970703125, -0.42255401611328125, -0.3946380615234375, -0.36672210693359375, -0.33880615234375, -0.31089019775390625, -0.2829742431640625, -0.25505828857421875, -0.227142333984375, -0.19922637939453125, -0.1713104248046875, -0.14339447021484375, -0.115478515625, -0.08756256103515625, -0.0596466064453125, -0.03173065185546875, -0.003814697265625, 0.02410125732421875, 0.0520172119140625, 0.07993316650390625, 0.10784912109375, 0.13576507568359375, 0.1636810302734375, 0.19159698486328125, 0.219512939453125, 0.24742889404296875, 0.2753448486328125, 0.30326080322265625, 0.3311767578125, 0.35909271240234375, 0.3870086669921875, 0.41492462158203125, 0.442840576171875, 0.47075653076171875, 0.4986724853515625, 0.5265884399414062, 0.55450439453125, 0.5824203491210938, 0.6103363037109375, 0.6382522583007812, 0.666168212890625, 0.6940841674804688, 0.7220001220703125, 0.7499160766601562, 0.77783203125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 5.0, 7.0, 13.0, 14.0, 16.0, 22.0, 27.0, 18.0, 27.0, 29.0, 29.0, 33.0, 36.0, 46.0, 42.0, 53.0, 44.0, 45.0, 1068.0, 33.0, 40.0, 32.0, 32.0, 26.0, 31.0, 30.0, 28.0, 34.0, 29.0, 29.0, 20.0, 16.0, 14.0, 10.0, 10.0, 10.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.791839599609375, -3.67547607421875, -3.559112548828125, -3.4427490234375, -3.326385498046875, -3.21002197265625, -3.093658447265625, -2.977294921875, -2.860931396484375, -2.74456787109375, -2.628204345703125, -2.5118408203125, -2.395477294921875, -2.27911376953125, -2.162750244140625, -2.04638671875, -1.930023193359375, -1.81365966796875, -1.697296142578125, -1.5809326171875, -1.464569091796875, -1.34820556640625, -1.231842041015625, -1.115478515625, -0.999114990234375, -0.88275146484375, -0.766387939453125, -0.6500244140625, -0.533660888671875, -0.41729736328125, -0.300933837890625, -0.1845703125, -0.068206787109375, 0.04815673828125, 0.164520263671875, 0.2808837890625, 0.397247314453125, 0.51361083984375, 0.629974365234375, 0.746337890625, 0.862701416015625, 0.97906494140625, 1.095428466796875, 1.2117919921875, 1.328155517578125, 1.44451904296875, 1.560882568359375, 1.67724609375, 1.793609619140625, 1.90997314453125, 2.026336669921875, 2.1427001953125, 2.259063720703125, 2.37542724609375, 2.491790771484375, 2.608154296875, 2.724517822265625, 2.84088134765625, 2.957244873046875, 3.0736083984375, 3.189971923828125, 3.30633544921875, 3.422698974609375, 3.5390625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 13.0, 11.0, 8.0, 32.0, 35.0, 52.0, 101.0, 130.0, 201.0, 291.0, 437.0, 679.0, 1078.0, 1655.0, 2535.0, 4038.0, 6038.0, 9627.0, 14721.0, 22083.0, 34451.0, 54376.0, 85770.0, 136089.0, 1251012.0, 171601.0, 108281.0, 68698.0, 43321.0, 28185.0, 18023.0, 11866.0, 7501.0, 4983.0, 3203.0, 2126.0, 1313.0, 904.0, 571.0, 341.0, 255.0, 158.0, 108.0, 67.0, 71.0, 33.0, 26.0, 18.0, 6.0, 10.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7021484375, -0.6800384521484375, -0.657928466796875, -0.6358184814453125, -0.61370849609375, -0.5915985107421875, -0.569488525390625, -0.5473785400390625, -0.5252685546875, -0.5031585693359375, -0.481048583984375, -0.4589385986328125, -0.43682861328125, -0.4147186279296875, -0.392608642578125, -0.3704986572265625, -0.348388671875, -0.3262786865234375, -0.304168701171875, -0.2820587158203125, -0.25994873046875, -0.2378387451171875, -0.215728759765625, -0.1936187744140625, -0.1715087890625, -0.1493988037109375, -0.127288818359375, -0.1051788330078125, -0.08306884765625, -0.0609588623046875, -0.038848876953125, -0.0167388916015625, 0.00537109375, 0.0274810791015625, 0.049591064453125, 0.0717010498046875, 0.09381103515625, 0.1159210205078125, 0.138031005859375, 0.1601409912109375, 0.1822509765625, 0.2043609619140625, 0.226470947265625, 0.2485809326171875, 0.27069091796875, 0.2928009033203125, 0.314910888671875, 0.3370208740234375, 0.359130859375, 0.3812408447265625, 0.403350830078125, 0.4254608154296875, 0.44757080078125, 0.4696807861328125, 0.491790771484375, 0.5139007568359375, 0.5360107421875, 0.5581207275390625, 0.580230712890625, 0.6023406982421875, 0.62445068359375, 0.6465606689453125, 0.668670654296875, 0.6907806396484375, 0.712890625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 5.0, 4.0, 5.0, 9.0, 8.0, 14.0, 29.0, 24.0, 27.0, 56.0, 61.0, 80.0, 90.0, 79.0, 99.0, 83.0, 70.0, 58.0, 44.0, 33.0, 29.0, 21.0, 14.0, 13.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001674652099609375, -0.0016166865825653076, -0.0015587210655212402, -0.0015007555484771729, -0.0014427900314331055, -0.001384824514389038, -0.0013268589973449707, -0.0012688934803009033, -0.001210927963256836, -0.0011529624462127686, -0.0010949969291687012, -0.0010370314121246338, -0.0009790658950805664, -0.000921100378036499, -0.0008631348609924316, -0.0008051693439483643, -0.0007472038269042969, -0.0006892383098602295, -0.0006312727928161621, -0.0005733072757720947, -0.0005153417587280273, -0.00045737624168395996, -0.0003994107246398926, -0.0003414452075958252, -0.0002834796905517578, -0.00022551417350769043, -0.00016754865646362305, -0.00010958313941955566, -5.161762237548828e-05, 6.3478946685791016e-06, 6.431341171264648e-05, 0.00012227892875671387, 0.00018024444580078125, 0.00023820996284484863, 0.000296175479888916, 0.0003541409969329834, 0.0004121065139770508, 0.00047007203102111816, 0.0005280375480651855, 0.0005860030651092529, 0.0006439685821533203, 0.0007019340991973877, 0.0007598996162414551, 0.0008178651332855225, 0.0008758306503295898, 0.0009337961673736572, 0.0009917616844177246, 0.001049727201461792, 0.0011076927185058594, 0.0011656582355499268, 0.0012236237525939941, 0.0012815892696380615, 0.001339554786682129, 0.0013975203037261963, 0.0014554858207702637, 0.001513451337814331, 0.0015714168548583984, 0.0016293823719024658, 0.0016873478889465332, 0.0017453134059906006, 0.001803278923034668, 0.0018612444400787354, 0.0019192099571228027, 0.00197717547416687, 0.0020351409912109375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 0.0, 5.0, 6.0, 6.0, 10.0, 7.0, 13.0, 18.0, 20.0, 23.0, 57.0, 72.0, 106.0, 163.0, 295.0, 536.0, 15372.0, 1029790.0, 1100.0, 342.0, 212.0, 120.0, 78.0, 70.0, 36.0, 23.0, 20.0, 10.0, 7.0, 8.0, 8.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.044464111328125, -0.04320240020751953, -0.04194068908691406, -0.040678977966308594, -0.039417266845703125, -0.038155555725097656, -0.03689384460449219, -0.03563213348388672, -0.03437042236328125, -0.03310871124267578, -0.03184700012207031, -0.030585289001464844, -0.029323577880859375, -0.028061866760253906, -0.026800155639648438, -0.02553844451904297, -0.0242767333984375, -0.02301502227783203, -0.021753311157226562, -0.020491600036621094, -0.019229888916015625, -0.017968177795410156, -0.016706466674804688, -0.015444755554199219, -0.01418304443359375, -0.012921333312988281, -0.011659622192382812, -0.010397911071777344, -0.009136199951171875, -0.007874488830566406, -0.0066127777099609375, -0.005351066589355469, -0.00408935546875, -0.0028276443481445312, -0.0015659332275390625, -0.00030422210693359375, 0.000957489013671875, 0.0022192001342773438, 0.0034809112548828125, 0.004742622375488281, 0.00600433349609375, 0.007266044616699219, 0.008527755737304688, 0.009789466857910156, 0.011051177978515625, 0.012312889099121094, 0.013574600219726562, 0.014836311340332031, 0.0160980224609375, 0.01735973358154297, 0.018621444702148438, 0.019883155822753906, 0.021144866943359375, 0.022406578063964844, 0.023668289184570312, 0.02493000030517578, 0.02619171142578125, 0.02745342254638672, 0.028715133666992188, 0.029976844787597656, 0.031238555908203125, 0.032500267028808594, 0.03376197814941406, 0.03502368927001953, 0.036285400390625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 20.0, 409.0, 543.0, 44.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004643936641514301, -0.004494477994740009, -0.004345019347965717, -0.004195560701191425, -0.004046102054417133, -0.0038966434076428413, -0.0037471847608685493, -0.0035977261140942574, -0.0034482674673199654, -0.0032988088205456734, -0.0031493501737713814, -0.0029998915269970894, -0.0028504328802227974, -0.0027009742334485054, -0.0025515155866742134, -0.0024020569398999214, -0.0022525980602949858, -0.0021031394135206938, -0.001953680766746402, -0.0018042221199721098, -0.0016547634731978178, -0.0015053048264235258, -0.001355846063233912, -0.00120638741645962, -0.001056928769685328, -0.000907470122911036, -0.000758011476136744, -0.0006085527711547911, -0.0004590941243804991, -0.00030963547760620713, -0.00016017677262425423, -1.0718125849962234e-05, 0.00013874052092432976, 0.00028819916769862175, 0.0004376578435767442, 0.0005871165194548666, 0.0007365751662291586, 0.0008860338130034506, 0.0010354925179854035, 0.0011849511647596955, 0.0013344098115339875, 0.0014838684583082795, 0.0016333271050825715, 0.0017827858682721853, 0.0019322445150464773, 0.0020817031618207693, 0.0022311618085950613, 0.0023806204553693533, 0.0025300791021436453, 0.0026795377489179373, 0.0028289963956922293, 0.0029784550424665213, 0.0031279136892408133, 0.0032773723360151052, 0.003426831215620041, 0.003576289862394333, 0.003725748509168625, 0.003875207155942917, 0.004024665802717209, 0.004174124449491501, 0.004323583096265793, 0.004473041743040085, 0.004622500389814377, 0.004771959036588669, 0.004921417683362961]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 8.0, 4.0, 5.0, 8.0, 9.0, 3.0, 12.0, 16.0, 15.0, 19.0, 28.0, 24.0, 28.0, 33.0, 22.0, 37.0, 29.0, 41.0, 48.0, 36.0, 47.0, 37.0, 52.0, 42.0, 36.0, 31.0, 38.0, 33.0, 36.0, 34.0, 31.0, 21.0, 17.0, 29.0, 10.0, 10.0, 11.0, 12.0, 12.0, 8.0, 2.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0007987618446350098, -0.000775020569562912, -0.0007512792944908142, -0.0007275380194187164, -0.0007037967443466187, -0.0006800554692745209, -0.0006563141942024231, -0.0006325729191303253, -0.0006088316440582275, -0.0005850903689861298, -0.000561349093914032, -0.0005376078188419342, -0.0005138665437698364, -0.0004901252686977386, -0.00046638399362564087, -0.0004426427185535431, -0.0004189014434814453, -0.00039516016840934753, -0.00037141889333724976, -0.000347677618265152, -0.0003239363431930542, -0.0003001950681209564, -0.00027645379304885864, -0.00025271251797676086, -0.00022897124290466309, -0.0002052299678325653, -0.00018148869276046753, -0.00015774741768836975, -0.00013400614261627197, -0.0001102648675441742, -8.652359247207642e-05, -6.278231739997864e-05, -3.904104232788086e-05, -1.529976725578308e-05, 8.441507816314697e-06, 3.2182782888412476e-05, 5.5924057960510254e-05, 7.966533303260803e-05, 0.00010340660810470581, 0.0001271478831768036, 0.00015088915824890137, 0.00017463043332099915, 0.00019837170839309692, 0.0002221129834651947, 0.0002458542585372925, 0.00026959553360939026, 0.00029333680868148804, 0.0003170780837535858, 0.0003408193588256836, 0.00036456063389778137, 0.00038830190896987915, 0.00041204318404197693, 0.0004357844591140747, 0.0004595257341861725, 0.00048326700925827026, 0.000507008284330368, 0.0005307495594024658, 0.0005544908344745636, 0.0005782321095466614, 0.0006019733846187592, 0.0006257146596908569, 0.0006494559347629547, 0.0006731972098350525, 0.0006969384849071503, 0.000720679759979248]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 14.0, 10.0, 9.0, 17.0, 10.0, 25.0, 24.0, 27.0, 27.0, 30.0, 32.0, 32.0, 44.0, 43.0, 46.0, 49.0, 45.0, 44.0, 46.0, 57.0, 42.0, 37.0, 49.0, 37.0, 32.0, 34.0, 23.0, 20.0, 23.0, 14.0, 14.0, 8.0, 9.0, 11.0, 6.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.7542724609375, -5.555419921875, -5.3565673828125, -5.15771484375, -4.9588623046875, -4.760009765625, -4.5611572265625, -4.3623046875, -4.1634521484375, -3.964599609375, -3.7657470703125, -3.56689453125, -3.3680419921875, -3.169189453125, -2.9703369140625, -2.771484375, -2.5726318359375, -2.373779296875, -2.1749267578125, -1.97607421875, -1.7772216796875, -1.578369140625, -1.3795166015625, -1.1806640625, -0.9818115234375, -0.782958984375, -0.5841064453125, -0.38525390625, -0.1864013671875, 0.012451171875, 0.2113037109375, 0.41015625, 0.6090087890625, 0.807861328125, 1.0067138671875, 1.20556640625, 1.4044189453125, 1.603271484375, 1.8021240234375, 2.0009765625, 2.1998291015625, 2.398681640625, 2.5975341796875, 2.79638671875, 2.9952392578125, 3.194091796875, 3.3929443359375, 3.591796875, 3.7906494140625, 3.989501953125, 4.1883544921875, 4.38720703125, 4.5860595703125, 4.784912109375, 4.9837646484375, 5.1826171875, 5.3814697265625, 5.580322265625, 5.7791748046875, 5.97802734375, 6.1768798828125, 6.375732421875, 6.5745849609375, 6.7734375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 17.0, 43.0, 31.0, 49.0, 97.0, 129.0, 282.0, 395.0, 728.0, 1294.0, 2335.0, 4368.0, 8990.0, 20549.0, 55672.0, 215835.0, 530116.0, 136491.0, 40039.0, 15741.0, 7175.0, 3595.0, 1880.0, 1143.0, 617.0, 342.0, 231.0, 156.0, 72.0, 51.0, 28.0, 19.0, 14.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9140625, -4.77099609375, -4.6279296875, -4.48486328125, -4.341796875, -4.19873046875, -4.0556640625, -3.91259765625, -3.76953125, -3.62646484375, -3.4833984375, -3.34033203125, -3.197265625, -3.05419921875, -2.9111328125, -2.76806640625, -2.625, -2.48193359375, -2.3388671875, -2.19580078125, -2.052734375, -1.90966796875, -1.7666015625, -1.62353515625, -1.48046875, -1.33740234375, -1.1943359375, -1.05126953125, -0.908203125, -0.76513671875, -0.6220703125, -0.47900390625, -0.3359375, -0.19287109375, -0.0498046875, 0.09326171875, 0.236328125, 0.37939453125, 0.5224609375, 0.66552734375, 0.80859375, 0.95166015625, 1.0947265625, 1.23779296875, 1.380859375, 1.52392578125, 1.6669921875, 1.81005859375, 1.953125, 2.09619140625, 2.2392578125, 2.38232421875, 2.525390625, 2.66845703125, 2.8115234375, 2.95458984375, 3.09765625, 3.24072265625, 3.3837890625, 3.52685546875, 3.669921875, 3.81298828125, 3.9560546875, 4.09912109375, 4.2421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 8.0, 6.0, 7.0, 16.0, 16.0, 10.0, 18.0, 20.0, 24.0, 27.0, 26.0, 34.0, 38.0, 37.0, 39.0, 63.0, 85.0, 1715.0, 336.0, 77.0, 51.0, 45.0, 38.0, 48.0, 37.0, 24.0, 25.0, 26.0, 28.0, 21.0, 20.0, 21.0, 18.0, 11.0, 3.0, 6.0, 5.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.435791015625, -16.76220703125, -16.088623046875, -15.4150390625, -14.741455078125, -14.06787109375, -13.394287109375, -12.720703125, -12.047119140625, -11.37353515625, -10.699951171875, -10.0263671875, -9.352783203125, -8.67919921875, -8.005615234375, -7.33203125, -6.658447265625, -5.98486328125, -5.311279296875, -4.6376953125, -3.964111328125, -3.29052734375, -2.616943359375, -1.943359375, -1.269775390625, -0.59619140625, 0.077392578125, 0.7509765625, 1.424560546875, 2.09814453125, 2.771728515625, 3.4453125, 4.118896484375, 4.79248046875, 5.466064453125, 6.1396484375, 6.813232421875, 7.48681640625, 8.160400390625, 8.833984375, 9.507568359375, 10.18115234375, 10.854736328125, 11.5283203125, 12.201904296875, 12.87548828125, 13.549072265625, 14.22265625, 14.896240234375, 15.56982421875, 16.243408203125, 16.9169921875, 17.590576171875, 18.26416015625, 18.937744140625, 19.611328125, 20.284912109375, 20.95849609375, 21.632080078125, 22.3056640625, 22.979248046875, 23.65283203125, 24.326416015625, 25.0]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 3.0, 6.0, 14.0, 19.0, 20.0, 14.0, 28.0, 28.0, 34.0, 37.0, 43.0, 72.0, 92.0, 156.0, 260.0, 556.0, 2719.0, 140098.0, 2990659.0, 8915.0, 1032.0, 323.0, 151.0, 107.0, 78.0, 43.0, 25.0, 34.0, 26.0, 17.0, 16.0, 10.0, 16.0, 15.0, 3.0, 8.0, 7.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-41.75, -40.628173828125, -39.50634765625, -38.384521484375, -37.2626953125, -36.140869140625, -35.01904296875, -33.897216796875, -32.775390625, -31.653564453125, -30.53173828125, -29.409912109375, -28.2880859375, -27.166259765625, -26.04443359375, -24.922607421875, -23.80078125, -22.678955078125, -21.55712890625, -20.435302734375, -19.3134765625, -18.191650390625, -17.06982421875, -15.947998046875, -14.826171875, -13.704345703125, -12.58251953125, -11.460693359375, -10.3388671875, -9.217041015625, -8.09521484375, -6.973388671875, -5.8515625, -4.729736328125, -3.60791015625, -2.486083984375, -1.3642578125, -0.242431640625, 0.87939453125, 2.001220703125, 3.123046875, 4.244873046875, 5.36669921875, 6.488525390625, 7.6103515625, 8.732177734375, 9.85400390625, 10.975830078125, 12.09765625, 13.219482421875, 14.34130859375, 15.463134765625, 16.5849609375, 17.706787109375, 18.82861328125, 19.950439453125, 21.072265625, 22.194091796875, 23.31591796875, 24.437744140625, 25.5595703125, 26.681396484375, 27.80322265625, 28.925048828125, 30.046875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [19.0, 846.0, 152.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.61663818359375, -4.067175388336182, 1.4822874069213867, 7.031749725341797, 12.581212997436523, 18.13067626953125, 23.680137634277344, 29.229602813720703, 34.7790641784668, 40.32852554321289, 45.87799072265625, 51.427452087402344, 56.97691345214844, 62.5263786315918, 68.07583618164062, 73.62530517578125, 79.17476654052734, 84.72422790527344, 90.27368927001953, 95.82315063476562, 101.37261962890625, 106.92208099365234, 112.47154235839844, 118.02101135253906, 123.57046508789062, 129.11993408203125, 134.6693878173828, 140.21885681152344, 145.768310546875, 151.31777954101562, 156.86724853515625, 162.4167022705078, 167.96617126464844, 173.51564025878906, 179.06509399414062, 184.61456298828125, 190.1640167236328, 195.71348571777344, 201.262939453125, 206.81240844726562, 212.36187744140625, 217.91134643554688, 223.46080017089844, 229.01026916503906, 234.55972290039062, 240.10919189453125, 245.65866088867188, 251.20811462402344, 256.757568359375, 262.3070373535156, 267.85650634765625, 273.40594482421875, 278.9554138183594, 284.5048828125, 290.0543518066406, 295.60382080078125, 301.1532897949219, 306.7027587890625, 312.2522277832031, 317.8016662597656, 323.35113525390625, 328.9006042480469, 334.4500732421875, 339.9995422363281, 345.5489807128906]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 8.0, 4.0, 7.0, 9.0, 8.0, 9.0, 11.0, 16.0, 23.0, 15.0, 18.0, 13.0, 32.0, 19.0, 31.0, 47.0, 40.0, 35.0, 37.0, 44.0, 40.0, 39.0, 44.0, 33.0, 49.0, 37.0, 37.0, 51.0, 26.0, 34.0, 28.0, 27.0, 24.0, 18.0, 17.0, 23.0, 20.0, 6.0, 4.0, 10.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.71792602539062, -74.57952880859375, -72.44113159179688, -70.30274200439453, -68.16434478759766, -66.02594757080078, -63.88755416870117, -61.74916076660156, -59.61076354980469, -57.47236633300781, -55.3339729309082, -53.195579528808594, -51.05718231201172, -48.918785095214844, -46.780391693115234, -44.641998291015625, -42.50360107421875, -40.365203857421875, -38.226810455322266, -36.088417053222656, -33.95001983642578, -31.81162452697754, -29.673229217529297, -27.534833908081055, -25.396438598632812, -23.25804328918457, -21.119647979736328, -18.981252670288086, -16.842857360839844, -14.704462051391602, -12.56606674194336, -10.427671432495117, -8.289268493652344, -6.150873184204102, -4.012477874755859, -1.8740825653076172, 0.264312744140625, 2.402708053588867, 4.541103363037109, 6.679498672485352, 8.817893981933594, 10.956289291381836, 13.094684600830078, 15.23307991027832, 17.371475219726562, 19.509870529174805, 21.648265838623047, 23.78666114807129, 25.92505645751953, 28.063451766967773, 30.201847076416016, 32.340240478515625, 34.4786376953125, 36.617034912109375, 38.755428314208984, 40.893821716308594, 43.03221893310547, 45.170616149902344, 47.30900955200195, 49.44740295410156, 51.58580017089844, 53.72419738769531, 55.86259078979492, 58.00098419189453, 60.139381408691406]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 10.0, 11.0, 9.0, 16.0, 13.0, 15.0, 34.0, 17.0, 28.0, 32.0, 29.0, 43.0, 36.0, 45.0, 39.0, 45.0, 42.0, 49.0, 58.0, 52.0, 46.0, 39.0, 33.0, 46.0, 33.0, 27.0, 29.0, 26.0, 17.0, 20.0, 13.0, 8.0, 8.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.171875, -5.96710205078125, -5.7623291015625, -5.55755615234375, -5.352783203125, -5.14801025390625, -4.9432373046875, -4.73846435546875, -4.53369140625, -4.32891845703125, -4.1241455078125, -3.91937255859375, -3.714599609375, -3.50982666015625, -3.3050537109375, -3.10028076171875, -2.8955078125, -2.69073486328125, -2.4859619140625, -2.28118896484375, -2.076416015625, -1.87164306640625, -1.6668701171875, -1.46209716796875, -1.25732421875, -1.05255126953125, -0.8477783203125, -0.64300537109375, -0.438232421875, -0.23345947265625, -0.0286865234375, 0.17608642578125, 0.380859375, 0.58563232421875, 0.7904052734375, 0.99517822265625, 1.199951171875, 1.40472412109375, 1.6094970703125, 1.81427001953125, 2.01904296875, 2.22381591796875, 2.4285888671875, 2.63336181640625, 2.838134765625, 3.04290771484375, 3.2476806640625, 3.45245361328125, 3.6572265625, 3.86199951171875, 4.0667724609375, 4.27154541015625, 4.476318359375, 4.68109130859375, 4.8858642578125, 5.09063720703125, 5.29541015625, 5.50018310546875, 5.7049560546875, 5.90972900390625, 6.114501953125, 6.31927490234375, 6.5240478515625, 6.72882080078125, 6.93359375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 8.0, 14.0, 18.0, 17.0, 18.0, 28.0, 19.0, 26.0, 33.0, 29.0, 49.0, 44.0, 128.0, 695.0, 17168.0, 3430917.0, 740289.0, 4115.0, 262.0, 80.0, 42.0, 28.0, 42.0, 32.0, 41.0, 25.0, 22.0, 20.0, 15.0, 7.0, 10.0, 8.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.28125, -38.0068359375, -36.732421875, -35.4580078125, -34.18359375, -32.9091796875, -31.634765625, -30.3603515625, -29.0859375, -27.8115234375, -26.537109375, -25.2626953125, -23.98828125, -22.7138671875, -21.439453125, -20.1650390625, -18.890625, -17.6162109375, -16.341796875, -15.0673828125, -13.79296875, -12.5185546875, -11.244140625, -9.9697265625, -8.6953125, -7.4208984375, -6.146484375, -4.8720703125, -3.59765625, -2.3232421875, -1.048828125, 0.2255859375, 1.5, 2.7744140625, 4.048828125, 5.3232421875, 6.59765625, 7.8720703125, 9.146484375, 10.4208984375, 11.6953125, 12.9697265625, 14.244140625, 15.5185546875, 16.79296875, 18.0673828125, 19.341796875, 20.6162109375, 21.890625, 23.1650390625, 24.439453125, 25.7138671875, 26.98828125, 28.2626953125, 29.537109375, 30.8115234375, 32.0859375, 33.3603515625, 34.634765625, 35.9091796875, 37.18359375, 38.4580078125, 39.732421875, 41.0068359375, 42.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 11.0, 16.0, 24.0, 38.0, 51.0, 72.0, 134.0, 222.0, 334.0, 511.0, 763.0, 662.0, 463.0, 308.0, 182.0, 111.0, 56.0, 42.0, 34.0, 23.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-38.75, -37.92236328125, -37.0947265625, -36.26708984375, -35.439453125, -34.61181640625, -33.7841796875, -32.95654296875, -32.12890625, -31.30126953125, -30.4736328125, -29.64599609375, -28.818359375, -27.99072265625, -27.1630859375, -26.33544921875, -25.5078125, -24.68017578125, -23.8525390625, -23.02490234375, -22.197265625, -21.36962890625, -20.5419921875, -19.71435546875, -18.88671875, -18.05908203125, -17.2314453125, -16.40380859375, -15.576171875, -14.74853515625, -13.9208984375, -13.09326171875, -12.265625, -11.43798828125, -10.6103515625, -9.78271484375, -8.955078125, -8.12744140625, -7.2998046875, -6.47216796875, -5.64453125, -4.81689453125, -3.9892578125, -3.16162109375, -2.333984375, -1.50634765625, -0.6787109375, 0.14892578125, 0.9765625, 1.80419921875, 2.6318359375, 3.45947265625, 4.287109375, 5.11474609375, 5.9423828125, 6.77001953125, 7.59765625, 8.42529296875, 9.2529296875, 10.08056640625, 10.908203125, 11.73583984375, 12.5634765625, 13.39111328125, 14.21875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 10.0, 8.0, 21.0, 35.0, 53.0, 106.0, 189.0, 256.0, 576.0, 4542.0, 3904237.0, 281852.0, 1420.0, 394.0, 211.0, 141.0, 86.0, 44.0, 36.0, 33.0, 20.0, 6.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.0, -41.744140625, -38.48828125, -35.232421875, -31.9765625, -28.720703125, -25.46484375, -22.208984375, -18.953125, -15.697265625, -12.44140625, -9.185546875, -5.9296875, -2.673828125, 0.58203125, 3.837890625, 7.09375, 10.349609375, 13.60546875, 16.861328125, 20.1171875, 23.373046875, 26.62890625, 29.884765625, 33.140625, 36.396484375, 39.65234375, 42.908203125, 46.1640625, 49.419921875, 52.67578125, 55.931640625, 59.1875, 62.443359375, 65.69921875, 68.955078125, 72.2109375, 75.466796875, 78.72265625, 81.978515625, 85.234375, 88.490234375, 91.74609375, 95.001953125, 98.2578125, 101.513671875, 104.76953125, 108.025390625, 111.28125, 114.537109375, 117.79296875, 121.048828125, 124.3046875, 127.560546875, 130.81640625, 134.072265625, 137.328125, 140.583984375, 143.83984375, 147.095703125, 150.3515625, 153.607421875, 156.86328125, 160.119140625, 163.375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 12.0, 52.0, 155.0, 306.0, 292.0, 130.0, 50.0, 13.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-261.0731201171875, -256.14556884765625, -251.21800231933594, -246.2904510498047, -241.36289978027344, -236.4353485107422, -231.50778198242188, -226.58023071289062, -221.65267944335938, -216.72512817382812, -211.7975616455078, -206.87001037597656, -201.9424591064453, -197.01490783691406, -192.08734130859375, -187.1597900390625, -182.23223876953125, -177.3046875, -172.3771209716797, -167.44956970214844, -162.5220184326172, -157.59446716308594, -152.66690063476562, -147.73934936523438, -142.81178283691406, -137.8842315673828, -132.9566650390625, -128.02911376953125, -123.1015625, -118.17400360107422, -113.24644470214844, -108.31889343261719, -103.39134216308594, -98.46378326416016, -93.5362319946289, -88.60867309570312, -83.68112182617188, -78.7535629272461, -73.82600402832031, -68.89845275878906, -63.97089767456055, -59.04334259033203, -54.115787506103516, -49.188232421875, -44.26067352294922, -39.33312225341797, -34.40556335449219, -29.478008270263672, -24.550453186035156, -19.62289810180664, -14.695342063903809, -9.767786026000977, -4.840230941772461, 0.08732414245605469, 5.014881134033203, 9.942436218261719, 14.869991302490234, 19.79754638671875, 24.725101470947266, 29.652658462524414, 34.58021545410156, 39.50776672363281, 44.435325622558594, 49.36288070678711, 54.290435791015625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 7.0, 6.0, 7.0, 9.0, 10.0, 20.0, 15.0, 17.0, 27.0, 25.0, 29.0, 34.0, 31.0, 36.0, 38.0, 45.0, 46.0, 45.0, 40.0, 40.0, 47.0, 33.0, 42.0, 43.0, 35.0, 39.0, 35.0, 30.0, 20.0, 12.0, 31.0, 16.0, 20.0, 16.0, 9.0, 10.0, 10.0, 5.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.0679931640625, -53.16908645629883, -51.27018356323242, -49.37127685546875, -47.472373962402344, -45.57346725463867, -43.674560546875, -41.775657653808594, -39.87675476074219, -37.977848052978516, -36.07894515991211, -34.18003845214844, -32.28113555908203, -30.38222885131836, -28.48332405090332, -26.58441925048828, -24.68551254272461, -22.78660774230957, -20.88770294189453, -18.98879623413086, -17.089893341064453, -15.190987586975098, -13.292081832885742, -11.393177032470703, -9.494272232055664, -7.595367431640625, -5.696462154388428, -3.7975568771362305, -1.8986520767211914, 0.00025272369384765625, 1.8991584777832031, 3.798063278198242, 5.696968078613281, 7.59587287902832, 9.49477767944336, 11.393683433532715, 13.292588233947754, 15.191493034362793, 17.09039878845215, 18.989303588867188, 20.888208389282227, 22.787113189697266, 24.686017990112305, 26.584922790527344, 28.483829498291016, 30.382732391357422, 32.281639099121094, 34.1805419921875, 36.07944869995117, 37.978355407714844, 39.87725830078125, 41.77616500854492, 43.67506790161133, 45.573974609375, 47.472877502441406, 49.37178421020508, 51.27069091796875, 53.16959762573242, 55.06850051879883, 56.9674072265625, 58.866310119628906, 60.76521682739258, 62.66412353515625, 64.56302642822266, 66.46192932128906]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 12.0, 15.0, 14.0, 14.0, 11.0, 20.0, 33.0, 24.0, 22.0, 26.0, 37.0, 33.0, 41.0, 39.0, 39.0, 43.0, 34.0, 45.0, 46.0, 55.0, 46.0, 43.0, 41.0, 33.0, 30.0, 26.0, 23.0, 26.0, 23.0, 16.0, 19.0, 19.0, 8.0, 6.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.64495849609375, -5.4500732421875, -5.25518798828125, -5.060302734375, -4.86541748046875, -4.6705322265625, -4.47564697265625, -4.28076171875, -4.08587646484375, -3.8909912109375, -3.69610595703125, -3.501220703125, -3.30633544921875, -3.1114501953125, -2.91656494140625, -2.7216796875, -2.52679443359375, -2.3319091796875, -2.13702392578125, -1.942138671875, -1.74725341796875, -1.5523681640625, -1.35748291015625, -1.16259765625, -0.96771240234375, -0.7728271484375, -0.57794189453125, -0.383056640625, -0.18817138671875, 0.0067138671875, 0.20159912109375, 0.396484375, 0.59136962890625, 0.7862548828125, 0.98114013671875, 1.176025390625, 1.37091064453125, 1.5657958984375, 1.76068115234375, 1.95556640625, 2.15045166015625, 2.3453369140625, 2.54022216796875, 2.735107421875, 2.92999267578125, 3.1248779296875, 3.31976318359375, 3.5146484375, 3.70953369140625, 3.9044189453125, 4.09930419921875, 4.294189453125, 4.48907470703125, 4.6839599609375, 4.87884521484375, 5.07373046875, 5.26861572265625, 5.4635009765625, 5.65838623046875, 5.853271484375, 6.04815673828125, 6.2430419921875, 6.43792724609375, 6.6328125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 8.0, 10.0, 18.0, 24.0, 59.0, 93.0, 157.0, 210.0, 310.0, 542.0, 892.0, 1488.0, 2488.0, 4343.0, 7467.0, 12771.0, 23088.0, 41299.0, 74690.0, 137901.0, 242062.0, 223268.0, 122775.0, 66783.0, 36434.0, 21030.0, 11919.0, 6722.0, 3880.0, 2323.0, 1384.0, 814.0, 515.0, 286.0, 188.0, 111.0, 60.0, 49.0, 29.0, 21.0, 18.0, 12.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1183853149414062, -1.0854034423828125, -1.0524215698242188, -1.019439697265625, -0.9864578247070312, -0.9534759521484375, -0.9204940795898438, -0.88751220703125, -0.8545303344726562, -0.8215484619140625, -0.7885665893554688, -0.755584716796875, -0.7226028442382812, -0.6896209716796875, -0.6566390991210938, -0.6236572265625, -0.5906753540039062, -0.5576934814453125, -0.5247116088867188, -0.491729736328125, -0.45874786376953125, -0.4257659912109375, -0.39278411865234375, -0.35980224609375, -0.32682037353515625, -0.2938385009765625, -0.26085662841796875, -0.227874755859375, -0.19489288330078125, -0.1619110107421875, -0.12892913818359375, -0.095947265625, -0.06296539306640625, -0.0299835205078125, 0.00299835205078125, 0.035980224609375, 0.06896209716796875, 0.1019439697265625, 0.13492584228515625, 0.16790771484375, 0.20088958740234375, 0.2338714599609375, 0.26685333251953125, 0.299835205078125, 0.33281707763671875, 0.3657989501953125, 0.39878082275390625, 0.4317626953125, 0.46474456787109375, 0.4977264404296875, 0.5307083129882812, 0.563690185546875, 0.5966720581054688, 0.6296539306640625, 0.6626358032226562, 0.69561767578125, 0.7285995483398438, 0.7615814208984375, 0.7945632934570312, 0.827545166015625, 0.8605270385742188, 0.8935089111328125, 0.9264907836914062, 0.95947265625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 10.0, 12.0, 12.0, 11.0, 18.0, 23.0, 22.0, 35.0, 25.0, 27.0, 28.0, 34.0, 35.0, 39.0, 43.0, 41.0, 42.0, 1066.0, 37.0, 42.0, 46.0, 47.0, 34.0, 45.0, 29.0, 28.0, 24.0, 24.0, 20.0, 8.0, 15.0, 12.0, 13.0, 9.0, 11.0, 10.0, 10.0, 6.0, 2.0, 5.0, 2.0, 7.0, 4.0, 1.0], "bins": [-4.39453125, -4.27777099609375, -4.1610107421875, -4.04425048828125, -3.927490234375, -3.81072998046875, -3.6939697265625, -3.57720947265625, -3.46044921875, -3.34368896484375, -3.2269287109375, -3.11016845703125, -2.993408203125, -2.87664794921875, -2.7598876953125, -2.64312744140625, -2.5263671875, -2.40960693359375, -2.2928466796875, -2.17608642578125, -2.059326171875, -1.94256591796875, -1.8258056640625, -1.70904541015625, -1.59228515625, -1.47552490234375, -1.3587646484375, -1.24200439453125, -1.125244140625, -1.00848388671875, -0.8917236328125, -0.77496337890625, -0.658203125, -0.54144287109375, -0.4246826171875, -0.30792236328125, -0.191162109375, -0.07440185546875, 0.0423583984375, 0.15911865234375, 0.27587890625, 0.39263916015625, 0.5093994140625, 0.62615966796875, 0.742919921875, 0.85968017578125, 0.9764404296875, 1.09320068359375, 1.2099609375, 1.32672119140625, 1.4434814453125, 1.56024169921875, 1.677001953125, 1.79376220703125, 1.9105224609375, 2.02728271484375, 2.14404296875, 2.26080322265625, 2.3775634765625, 2.49432373046875, 2.611083984375, 2.72784423828125, 2.8446044921875, 2.96136474609375, 3.078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 13.0, 9.0, 9.0, 26.0, 34.0, 45.0, 87.0, 133.0, 196.0, 328.0, 517.0, 799.0, 1169.0, 1949.0, 3048.0, 4881.0, 7780.0, 12343.0, 20200.0, 33590.0, 55066.0, 92722.0, 158816.0, 1281879.0, 170331.0, 99590.0, 58753.0, 35364.0, 21679.0, 13362.0, 8288.0, 5202.0, 3226.0, 1993.0, 1375.0, 850.0, 520.0, 339.0, 224.0, 129.0, 110.0, 52.0, 44.0, 26.0, 9.0, 16.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.89453125, -0.86865234375, -0.8427734375, -0.81689453125, -0.791015625, -0.76513671875, -0.7392578125, -0.71337890625, -0.6875, -0.66162109375, -0.6357421875, -0.60986328125, -0.583984375, -0.55810546875, -0.5322265625, -0.50634765625, -0.48046875, -0.45458984375, -0.4287109375, -0.40283203125, -0.376953125, -0.35107421875, -0.3251953125, -0.29931640625, -0.2734375, -0.24755859375, -0.2216796875, -0.19580078125, -0.169921875, -0.14404296875, -0.1181640625, -0.09228515625, -0.06640625, -0.04052734375, -0.0146484375, 0.01123046875, 0.037109375, 0.06298828125, 0.0888671875, 0.11474609375, 0.140625, 0.16650390625, 0.1923828125, 0.21826171875, 0.244140625, 0.27001953125, 0.2958984375, 0.32177734375, 0.34765625, 0.37353515625, 0.3994140625, 0.42529296875, 0.451171875, 0.47705078125, 0.5029296875, 0.52880859375, 0.5546875, 0.58056640625, 0.6064453125, 0.63232421875, 0.658203125, 0.68408203125, 0.7099609375, 0.73583984375, 0.76171875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 10.0, 20.0, 23.0, 26.0, 28.0, 22.0, 29.0, 36.0, 38.0, 37.0, 50.0, 46.0, 67.0, 56.0, 50.0, 46.0, 47.0, 39.0, 40.0, 55.0, 30.0, 35.0, 23.0, 27.0, 21.0, 13.0, 12.0, 11.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0009469985961914062, -0.0009155869483947754, -0.0008841753005981445, -0.0008527636528015137, -0.0008213520050048828, -0.000789940357208252, -0.0007585287094116211, -0.0007271170616149902, -0.0006957054138183594, -0.0006642937660217285, -0.0006328821182250977, -0.0006014704704284668, -0.0005700588226318359, -0.0005386471748352051, -0.0005072355270385742, -0.00047582387924194336, -0.0004444122314453125, -0.00041300058364868164, -0.0003815889358520508, -0.0003501772880554199, -0.00031876564025878906, -0.0002873539924621582, -0.00025594234466552734, -0.00022453069686889648, -0.00019311904907226562, -0.00016170740127563477, -0.0001302957534790039, -9.888410568237305e-05, -6.747245788574219e-05, -3.606081008911133e-05, -4.649162292480469e-06, 2.676248550415039e-05, 5.817413330078125e-05, 8.958578109741211e-05, 0.00012099742889404297, 0.00015240907669067383, 0.0001838207244873047, 0.00021523237228393555, 0.0002466440200805664, 0.00027805566787719727, 0.0003094673156738281, 0.000340878963470459, 0.00037229061126708984, 0.0004037022590637207, 0.00043511390686035156, 0.0004665255546569824, 0.0004979372024536133, 0.0005293488502502441, 0.000560760498046875, 0.0005921721458435059, 0.0006235837936401367, 0.0006549954414367676, 0.0006864070892333984, 0.0007178187370300293, 0.0007492303848266602, 0.000780642032623291, 0.0008120536804199219, 0.0008434653282165527, 0.0008748769760131836, 0.0009062886238098145, 0.0009377002716064453, 0.0009691119194030762, 0.001000523567199707, 0.0010319352149963379, 0.0010633468627929688]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0, 10.0, 7.0, 7.0, 14.0, 12.0, 39.0, 46.0, 57.0, 73.0, 126.0, 194.0, 331.0, 587.0, 6652.0, 1035684.0, 3267.0, 566.0, 301.0, 178.0, 94.0, 58.0, 56.0, 48.0, 22.0, 25.0, 29.0, 15.0, 13.0, 8.0, 7.0, 6.0, 1.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02850341796875, -0.027624845504760742, -0.026746273040771484, -0.025867700576782227, -0.02498912811279297, -0.02411055564880371, -0.023231983184814453, -0.022353410720825195, -0.021474838256835938, -0.02059626579284668, -0.019717693328857422, -0.018839120864868164, -0.017960548400878906, -0.01708197593688965, -0.01620340347290039, -0.015324831008911133, -0.014446258544921875, -0.013567686080932617, -0.01268911361694336, -0.011810541152954102, -0.010931968688964844, -0.010053396224975586, -0.009174823760986328, -0.00829625129699707, -0.0074176788330078125, -0.006539106369018555, -0.005660533905029297, -0.004781961441040039, -0.0039033889770507812, -0.0030248165130615234, -0.0021462440490722656, -0.0012676715850830078, -0.00038909912109375, 0.0004894733428955078, 0.0013680458068847656, 0.0022466182708740234, 0.0031251907348632812, 0.004003763198852539, 0.004882335662841797, 0.005760908126831055, 0.0066394805908203125, 0.00751805305480957, 0.008396625518798828, 0.009275197982788086, 0.010153770446777344, 0.011032342910766602, 0.01191091537475586, 0.012789487838745117, 0.013668060302734375, 0.014546632766723633, 0.01542520523071289, 0.01630377769470215, 0.017182350158691406, 0.018060922622680664, 0.018939495086669922, 0.01981806755065918, 0.020696640014648438, 0.021575212478637695, 0.022453784942626953, 0.02333235740661621, 0.02421092987060547, 0.025089502334594727, 0.025968074798583984, 0.026846647262573242, 0.0277252197265625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 48.0, 252.0, 519.0, 172.0, 14.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001175920944660902, -0.0010878217872232199, -0.000999722513370216, -0.0009116233559325337, -0.0008235241402871907, -0.0007354249246418476, -0.0006473257672041655, -0.0005592265515588224, -0.00047112733591347933, -0.00038302812026813626, -0.00029492893372662365, -0.00020682974718511105, -0.00011873053153976798, -3.0631315894424915e-05, 5.7467841543257236e-05, 0.0001455670571886003, 0.00023366627283394337, 0.00032176548847928643, 0.00040986467502079904, 0.0004979638615623116, 0.0005860630772076547, 0.0006741622928529978, 0.0007622614502906799, 0.000850360665936023, 0.0009384598815813661, 0.0010265590390190482, 0.0011146583128720522, 0.0012027574703097343, 0.0012908566277474165, 0.0013789559016004205, 0.0014670550590381026, 0.0015551543328911066, 0.0016432534903287888, 0.001731352647766471, 0.0018194519216194749, 0.001907551079057157, 0.001995650352910161, 0.002083749510347843, 0.0021718486677855253, 0.0022599478252232075, 0.0023480472154915333, 0.0024361463729292154, 0.0025242455303668976, 0.0026123449206352234, 0.0027004440780729055, 0.0027885432355105877, 0.00287664239294827, 0.002964741550385952, 0.003052840707823634, 0.0031409398652613163, 0.0032290390226989985, 0.0033171381801366806, 0.0034052375704050064, 0.0034933367278426886, 0.0035814358852803707, 0.003669535042718053, 0.003757634200155735, 0.003845733357593417, 0.003933832515031099, 0.004021931905299425, 0.004110030829906464, 0.004198130220174789, 0.004286229610443115, 0.004374328535050154, 0.0044624279253184795]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 3.0, 4.0, 12.0, 13.0, 11.0, 14.0, 12.0, 18.0, 16.0, 26.0, 19.0, 31.0, 23.0, 34.0, 30.0, 29.0, 34.0, 27.0, 48.0, 34.0, 33.0, 38.0, 31.0, 46.0, 41.0, 46.0, 30.0, 32.0, 30.0, 29.0, 24.0, 27.0, 28.0, 22.0, 17.0, 11.0, 16.0, 8.0, 9.0, 10.0, 7.0, 4.0, 11.0, 1.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0005563497543334961, -0.0005402639508247375, -0.000524178147315979, -0.0005080923438072205, -0.0004920065402984619, -0.00047592073678970337, -0.0004598349332809448, -0.0004437491297721863, -0.00042766332626342773, -0.0004115775227546692, -0.00039549171924591064, -0.0003794059157371521, -0.00036332011222839355, -0.000347234308719635, -0.00033114850521087646, -0.0003150627017021179, -0.0002989768981933594, -0.00028289109468460083, -0.0002668052911758423, -0.00025071948766708374, -0.0002346336841583252, -0.00021854788064956665, -0.0002024620771408081, -0.00018637627363204956, -0.00017029047012329102, -0.00015420466661453247, -0.00013811886310577393, -0.00012203305959701538, -0.00010594725608825684, -8.986145257949829e-05, -7.377564907073975e-05, -5.76898455619812e-05, -4.1604042053222656e-05, -2.551823854446411e-05, -9.432435035705566e-06, 6.6533684730529785e-06, 2.2739171981811523e-05, 3.882497549057007e-05, 5.491077899932861e-05, 7.099658250808716e-05, 8.70823860168457e-05, 0.00010316818952560425, 0.00011925399303436279, 0.00013533979654312134, 0.00015142560005187988, 0.00016751140356063843, 0.00018359720706939697, 0.00019968301057815552, 0.00021576881408691406, 0.0002318546175956726, 0.00024794042110443115, 0.0002640262246131897, 0.00028011202812194824, 0.0002961978316307068, 0.00031228363513946533, 0.0003283694386482239, 0.0003444552421569824, 0.00036054104566574097, 0.0003766268491744995, 0.00039271265268325806, 0.0004087984561920166, 0.00042488425970077515, 0.0004409700632095337, 0.00045705586671829224, 0.0004731416702270508]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 12.0, 15.0, 14.0, 14.0, 11.0, 20.0, 33.0, 24.0, 22.0, 26.0, 37.0, 33.0, 41.0, 39.0, 39.0, 43.0, 34.0, 45.0, 46.0, 55.0, 46.0, 43.0, 41.0, 33.0, 30.0, 26.0, 23.0, 26.0, 23.0, 16.0, 19.0, 19.0, 8.0, 6.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.64495849609375, -5.4500732421875, -5.25518798828125, -5.060302734375, -4.86541748046875, -4.6705322265625, -4.47564697265625, -4.28076171875, -4.08587646484375, -3.8909912109375, -3.69610595703125, -3.501220703125, -3.30633544921875, -3.1114501953125, -2.91656494140625, -2.7216796875, -2.52679443359375, -2.3319091796875, -2.13702392578125, -1.942138671875, -1.74725341796875, -1.5523681640625, -1.35748291015625, -1.16259765625, -0.96771240234375, -0.7728271484375, -0.57794189453125, -0.383056640625, -0.18817138671875, 0.0067138671875, 0.20159912109375, 0.396484375, 0.59136962890625, 0.7862548828125, 0.98114013671875, 1.176025390625, 1.37091064453125, 1.5657958984375, 1.76068115234375, 1.95556640625, 2.15045166015625, 2.3453369140625, 2.54022216796875, 2.735107421875, 2.92999267578125, 3.1248779296875, 3.31976318359375, 3.5146484375, 3.70953369140625, 3.9044189453125, 4.09930419921875, 4.294189453125, 4.48907470703125, 4.6839599609375, 4.87884521484375, 5.07373046875, 5.26861572265625, 5.4635009765625, 5.65838623046875, 5.853271484375, 6.04815673828125, 6.2430419921875, 6.43792724609375, 6.6328125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 6.0, 11.0, 9.0, 22.0, 29.0, 45.0, 51.0, 81.0, 106.0, 166.0, 228.0, 348.0, 548.0, 910.0, 1476.0, 2709.0, 5431.0, 12255.0, 30655.0, 104704.0, 471814.0, 307115.0, 67895.0, 22397.0, 9278.0, 4458.0, 2206.0, 1284.0, 737.0, 517.0, 293.0, 205.0, 172.0, 114.0, 66.0, 56.0, 40.0, 28.0, 21.0, 18.0, 12.0, 13.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.21868896484375, -4.0819091796875, -3.94512939453125, -3.808349609375, -3.67156982421875, -3.5347900390625, -3.39801025390625, -3.26123046875, -3.12445068359375, -2.9876708984375, -2.85089111328125, -2.714111328125, -2.57733154296875, -2.4405517578125, -2.30377197265625, -2.1669921875, -2.03021240234375, -1.8934326171875, -1.75665283203125, -1.619873046875, -1.48309326171875, -1.3463134765625, -1.20953369140625, -1.07275390625, -0.93597412109375, -0.7991943359375, -0.66241455078125, -0.525634765625, -0.38885498046875, -0.2520751953125, -0.11529541015625, 0.021484375, 0.15826416015625, 0.2950439453125, 0.43182373046875, 0.568603515625, 0.70538330078125, 0.8421630859375, 0.97894287109375, 1.11572265625, 1.25250244140625, 1.3892822265625, 1.52606201171875, 1.662841796875, 1.79962158203125, 1.9364013671875, 2.07318115234375, 2.2099609375, 2.34674072265625, 2.4835205078125, 2.62030029296875, 2.757080078125, 2.89385986328125, 3.0306396484375, 3.16741943359375, 3.30419921875, 3.44097900390625, 3.5777587890625, 3.71453857421875, 3.851318359375, 3.98809814453125, 4.1248779296875, 4.26165771484375, 4.3984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 8.0, 3.0, 5.0, 10.0, 8.0, 9.0, 20.0, 22.0, 20.0, 22.0, 26.0, 36.0, 36.0, 45.0, 32.0, 55.0, 60.0, 67.0, 162.0, 1857.0, 119.0, 55.0, 43.0, 37.0, 45.0, 40.0, 34.0, 37.0, 23.0, 23.0, 21.0, 12.0, 11.0, 14.0, 9.0, 10.0, 4.0, 4.0, 6.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -24.251953125, -23.56640625, -22.880859375, -22.1953125, -21.509765625, -20.82421875, -20.138671875, -19.453125, -18.767578125, -18.08203125, -17.396484375, -16.7109375, -16.025390625, -15.33984375, -14.654296875, -13.96875, -13.283203125, -12.59765625, -11.912109375, -11.2265625, -10.541015625, -9.85546875, -9.169921875, -8.484375, -7.798828125, -7.11328125, -6.427734375, -5.7421875, -5.056640625, -4.37109375, -3.685546875, -3.0, -2.314453125, -1.62890625, -0.943359375, -0.2578125, 0.427734375, 1.11328125, 1.798828125, 2.484375, 3.169921875, 3.85546875, 4.541015625, 5.2265625, 5.912109375, 6.59765625, 7.283203125, 7.96875, 8.654296875, 9.33984375, 10.025390625, 10.7109375, 11.396484375, 12.08203125, 12.767578125, 13.453125, 14.138671875, 14.82421875, 15.509765625, 16.1953125, 16.880859375, 17.56640625, 18.251953125, 18.9375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 7.0, 9.0, 13.0, 10.0, 10.0, 20.0, 18.0, 22.0, 38.0, 42.0, 58.0, 88.0, 111.0, 149.0, 274.0, 659.0, 3229.0, 267982.0, 2865153.0, 5869.0, 880.0, 370.0, 209.0, 114.0, 72.0, 56.0, 41.0, 29.0, 29.0, 26.0, 20.0, 19.0, 19.0, 9.0, 10.0, 7.0, 4.0, 2.0, 8.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.65625, -28.6376953125, -27.619140625, -26.6005859375, -25.58203125, -24.5634765625, -23.544921875, -22.5263671875, -21.5078125, -20.4892578125, -19.470703125, -18.4521484375, -17.43359375, -16.4150390625, -15.396484375, -14.3779296875, -13.359375, -12.3408203125, -11.322265625, -10.3037109375, -9.28515625, -8.2666015625, -7.248046875, -6.2294921875, -5.2109375, -4.1923828125, -3.173828125, -2.1552734375, -1.13671875, -0.1181640625, 0.900390625, 1.9189453125, 2.9375, 3.9560546875, 4.974609375, 5.9931640625, 7.01171875, 8.0302734375, 9.048828125, 10.0673828125, 11.0859375, 12.1044921875, 13.123046875, 14.1416015625, 15.16015625, 16.1787109375, 17.197265625, 18.2158203125, 19.234375, 20.2529296875, 21.271484375, 22.2900390625, 23.30859375, 24.3271484375, 25.345703125, 26.3642578125, 27.3828125, 28.4013671875, 29.419921875, 30.4384765625, 31.45703125, 32.4755859375, 33.494140625, 34.5126953125, 35.53125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 39.0, 641.0, 324.0, 10.0], "bins": [-212.79217529296875, -209.34825134277344, -205.90432739257812, -202.46038818359375, -199.01646423339844, -195.57254028320312, -192.1286163330078, -188.6846923828125, -185.24075317382812, -181.7968292236328, -178.3529052734375, -174.90896606445312, -171.4650421142578, -168.0211181640625, -164.5771942138672, -161.13327026367188, -157.6893310546875, -154.2454071044922, -150.80148315429688, -147.3575439453125, -143.9136199951172, -140.46969604492188, -137.02577209472656, -133.58184814453125, -130.13792419433594, -126.69400024414062, -123.25006866455078, -119.80614471435547, -116.36221313476562, -112.91828918457031, -109.474365234375, -106.03043365478516, -102.58650207519531, -99.142578125, -95.69864654541016, -92.25472259521484, -88.810791015625, -85.36686706542969, -81.92294311523438, -78.47901153564453, -75.03507995605469, -71.59115600585938, -68.14722442626953, -64.70330047607422, -61.259368896484375, -57.81544494628906, -54.371517181396484, -50.927589416503906, -47.48366165161133, -44.03973388671875, -40.59580612182617, -37.151878356933594, -33.70795440673828, -30.26402473449707, -26.820098876953125, -23.376171112060547, -19.93224334716797, -16.48831558227539, -13.044388771057129, -9.600461959838867, -6.156534194946289, -2.712606430053711, 0.7313194274902344, 4.1752471923828125, 7.619174003601074]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 3.0, 6.0, 7.0, 12.0, 7.0, 11.0, 16.0, 25.0, 17.0, 15.0, 21.0, 21.0, 27.0, 28.0, 27.0, 28.0, 42.0, 42.0, 45.0, 37.0, 43.0, 26.0, 31.0, 30.0, 30.0, 34.0, 32.0, 34.0, 30.0, 20.0, 31.0, 26.0, 26.0, 23.0, 20.0, 19.0, 21.0, 17.0, 10.0, 14.0, 8.0, 6.0, 5.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0], "bins": [-63.172271728515625, -61.31330871582031, -59.454345703125, -57.59538269042969, -55.736419677734375, -53.87745666503906, -52.01849365234375, -50.15953063964844, -48.300567626953125, -46.44160461425781, -44.5826416015625, -42.72367858886719, -40.864715576171875, -39.00575256347656, -37.14678955078125, -35.28782653808594, -33.42886734008789, -31.569904327392578, -29.710941314697266, -27.851978302001953, -25.99301528930664, -24.134052276611328, -22.27509117126465, -20.416128158569336, -18.557165145874023, -16.69820213317871, -14.839239120483398, -12.980277061462402, -11.12131404876709, -9.262351036071777, -7.403388977050781, -5.544425964355469, -3.685466766357422, -1.8265039920806885, 0.03245878219604492, 1.8914213180541992, 3.7503843307495117, 5.609347343444824, 7.46830940246582, 9.327272415161133, 11.186235427856445, 13.045198440551758, 14.90416145324707, 16.76312255859375, 18.622085571289062, 20.481048583984375, 22.340011596679688, 24.198974609375, 26.057937622070312, 27.916900634765625, 29.775863647460938, 31.63482666015625, 33.49378967285156, 35.352752685546875, 37.21171569824219, 39.0706787109375, 40.92964172363281, 42.788604736328125, 44.64756774902344, 46.50653076171875, 48.36549377441406, 50.224456787109375, 52.08341979980469, 53.9423828125, 55.80134201049805]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 15.0, 13.0, 13.0, 15.0, 20.0, 20.0, 31.0, 22.0, 27.0, 38.0, 40.0, 34.0, 43.0, 39.0, 37.0, 36.0, 45.0, 58.0, 45.0, 49.0, 47.0, 38.0, 34.0, 34.0, 22.0, 26.0, 17.0, 22.0, 21.0, 15.0, 18.0, 15.0, 4.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.8382568359375, -5.637451171875, -5.4366455078125, -5.23583984375, -5.0350341796875, -4.834228515625, -4.6334228515625, -4.4326171875, -4.2318115234375, -4.031005859375, -3.8302001953125, -3.62939453125, -3.4285888671875, -3.227783203125, -3.0269775390625, -2.826171875, -2.6253662109375, -2.424560546875, -2.2237548828125, -2.02294921875, -1.8221435546875, -1.621337890625, -1.4205322265625, -1.2197265625, -1.0189208984375, -0.818115234375, -0.6173095703125, -0.41650390625, -0.2156982421875, -0.014892578125, 0.1859130859375, 0.38671875, 0.5875244140625, 0.788330078125, 0.9891357421875, 1.18994140625, 1.3907470703125, 1.591552734375, 1.7923583984375, 1.9931640625, 2.1939697265625, 2.394775390625, 2.5955810546875, 2.79638671875, 2.9971923828125, 3.197998046875, 3.3988037109375, 3.599609375, 3.8004150390625, 4.001220703125, 4.2020263671875, 4.40283203125, 4.6036376953125, 4.804443359375, 5.0052490234375, 5.2060546875, 5.4068603515625, 5.607666015625, 5.8084716796875, 6.00927734375, 6.2100830078125, 6.410888671875, 6.6116943359375, 6.8125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 5.0, 14.0, 11.0, 16.0, 20.0, 21.0, 26.0, 56.0, 80.0, 164.0, 309.0, 621.0, 1497.0, 4457.0, 16046.0, 82897.0, 729731.0, 2446273.0, 794242.0, 94145.0, 16699.0, 4306.0, 1391.0, 536.0, 283.0, 133.0, 80.0, 54.0, 32.0, 22.0, 25.0, 20.0, 16.0, 12.0, 6.0, 7.0, 2.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.899169921875, -11.50927734375, -11.119384765625, -10.7294921875, -10.339599609375, -9.94970703125, -9.559814453125, -9.169921875, -8.780029296875, -8.39013671875, -8.000244140625, -7.6103515625, -7.220458984375, -6.83056640625, -6.440673828125, -6.05078125, -5.660888671875, -5.27099609375, -4.881103515625, -4.4912109375, -4.101318359375, -3.71142578125, -3.321533203125, -2.931640625, -2.541748046875, -2.15185546875, -1.761962890625, -1.3720703125, -0.982177734375, -0.59228515625, -0.202392578125, 0.1875, 0.577392578125, 0.96728515625, 1.357177734375, 1.7470703125, 2.136962890625, 2.52685546875, 2.916748046875, 3.306640625, 3.696533203125, 4.08642578125, 4.476318359375, 4.8662109375, 5.256103515625, 5.64599609375, 6.035888671875, 6.42578125, 6.815673828125, 7.20556640625, 7.595458984375, 7.9853515625, 8.375244140625, 8.76513671875, 9.155029296875, 9.544921875, 9.934814453125, 10.32470703125, 10.714599609375, 11.1044921875, 11.494384765625, 11.88427734375, 12.274169921875, 12.6640625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 10.0, 14.0, 21.0, 21.0, 39.0, 50.0, 81.0, 107.0, 139.0, 189.0, 258.0, 420.0, 577.0, 554.0, 478.0, 339.0, 235.0, 143.0, 107.0, 84.0, 63.0, 37.0, 29.0, 22.0, 17.0, 11.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.515625, -18.890380859375, -18.26513671875, -17.639892578125, -17.0146484375, -16.389404296875, -15.76416015625, -15.138916015625, -14.513671875, -13.888427734375, -13.26318359375, -12.637939453125, -12.0126953125, -11.387451171875, -10.76220703125, -10.136962890625, -9.51171875, -8.886474609375, -8.26123046875, -7.635986328125, -7.0107421875, -6.385498046875, -5.76025390625, -5.135009765625, -4.509765625, -3.884521484375, -3.25927734375, -2.634033203125, -2.0087890625, -1.383544921875, -0.75830078125, -0.133056640625, 0.4921875, 1.117431640625, 1.74267578125, 2.367919921875, 2.9931640625, 3.618408203125, 4.24365234375, 4.868896484375, 5.494140625, 6.119384765625, 6.74462890625, 7.369873046875, 7.9951171875, 8.620361328125, 9.24560546875, 9.870849609375, 10.49609375, 11.121337890625, 11.74658203125, 12.371826171875, 12.9970703125, 13.622314453125, 14.24755859375, 14.872802734375, 15.498046875, 16.123291015625, 16.74853515625, 17.373779296875, 17.9990234375, 18.624267578125, 19.24951171875, 19.874755859375, 20.5]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 2.0, 7.0, 6.0, 9.0, 11.0, 14.0, 11.0, 17.0, 38.0, 26.0, 40.0, 49.0, 61.0, 73.0, 112.0, 178.0, 250.0, 484.0, 1149.0, 7787.0, 304715.0, 3818826.0, 55206.0, 3285.0, 723.0, 373.0, 216.0, 147.0, 90.0, 78.0, 75.0, 40.0, 36.0, 24.0, 22.0, 28.0, 15.0, 11.0, 9.0, 9.0, 5.0, 5.0, 6.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.66015625, -45.9765625, -44.29296875, -42.609375, -40.92578125, -39.2421875, -37.55859375, -35.875, -34.19140625, -32.5078125, -30.82421875, -29.140625, -27.45703125, -25.7734375, -24.08984375, -22.40625, -20.72265625, -19.0390625, -17.35546875, -15.671875, -13.98828125, -12.3046875, -10.62109375, -8.9375, -7.25390625, -5.5703125, -3.88671875, -2.203125, -0.51953125, 1.1640625, 2.84765625, 4.53125, 6.21484375, 7.8984375, 9.58203125, 11.265625, 12.94921875, 14.6328125, 16.31640625, 18.0, 19.68359375, 21.3671875, 23.05078125, 24.734375, 26.41796875, 28.1015625, 29.78515625, 31.46875, 33.15234375, 34.8359375, 36.51953125, 38.203125, 39.88671875, 41.5703125, 43.25390625, 44.9375, 46.62109375, 48.3046875, 49.98828125, 51.671875, 53.35546875, 55.0390625, 56.72265625, 58.40625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 11.0, 21.0, 55.0, 127.0, 174.0, 221.0, 201.0, 108.0, 51.0, 27.0, 11.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.68533325195312, -105.13290405273438, -101.58047485351562, -98.02804565429688, -94.47562408447266, -90.9231948852539, -87.37076568603516, -83.8183364868164, -80.26591491699219, -76.71348571777344, -73.16105651855469, -69.60862731933594, -66.05620574951172, -62.50377655029297, -58.95134735107422, -55.39891815185547, -51.84648895263672, -48.29405975341797, -44.741634368896484, -41.189205169677734, -37.63677978515625, -34.0843505859375, -30.53192138671875, -26.979494094848633, -23.427066802978516, -19.8746395111084, -16.32221221923828, -12.769783020019531, -9.217355728149414, -5.664928436279297, -2.112499237060547, 1.4399280548095703, 4.992362976074219, 8.544790267944336, 12.09721851348877, 15.649646759033203, 19.20207405090332, 22.754501342773438, 26.306930541992188, 29.859357833862305, 33.41178512573242, 36.96421432495117, 40.516639709472656, 44.069068908691406, 47.621498107910156, 51.17392349243164, 54.72635269165039, 58.278778076171875, 61.831207275390625, 65.38363647460938, 68.93606567382812, 72.48849487304688, 76.0409164428711, 79.59334564208984, 83.1457748413086, 86.69820404052734, 90.25062561035156, 93.80305480957031, 97.35548400878906, 100.90791320800781, 104.46033477783203, 108.01276397705078, 111.56519317626953, 115.11762237548828, 118.67005157470703]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 1.0, 0.0, 4.0, 7.0, 8.0, 16.0, 16.0, 11.0, 17.0, 12.0, 17.0, 30.0, 24.0, 39.0, 38.0, 38.0, 48.0, 32.0, 49.0, 43.0, 35.0, 43.0, 46.0, 40.0, 42.0, 57.0, 39.0, 32.0, 30.0, 41.0, 19.0, 21.0, 19.0, 21.0, 18.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.154117584228516, -58.234718322753906, -56.31531524658203, -54.39591598510742, -52.47651290893555, -50.55711364746094, -48.63771057128906, -46.71831130981445, -44.798912048339844, -42.879512786865234, -40.96010971069336, -39.04071044921875, -37.121307373046875, -35.201908111572266, -33.282508850097656, -31.36310577392578, -29.443702697753906, -27.524301528930664, -25.604900360107422, -23.685501098632812, -21.766098022460938, -19.846698760986328, -17.927297592163086, -16.007896423339844, -14.088495254516602, -12.16909408569336, -10.249692916870117, -8.330292701721191, -6.410891532897949, -4.491490364074707, -2.5720901489257812, -0.6526889801025391, 1.2667160034179688, 3.186116933822632, 5.105517864227295, 7.024918556213379, 8.944319725036621, 10.863720893859863, 12.783121109008789, 14.702522277832031, 16.621923446655273, 18.541324615478516, 20.460725784301758, 22.380126953125, 24.29952621459961, 26.218929290771484, 28.138328552246094, 30.057729721069336, 31.977130889892578, 33.89653015136719, 35.81593322753906, 37.73533248901367, 39.65473556518555, 41.574134826660156, 43.49353790283203, 45.41293716430664, 47.33233642578125, 49.25173568725586, 51.171138763427734, 53.090538024902344, 55.00994110107422, 56.92934036254883, 58.84873962402344, 60.76814270019531, 62.68754577636719]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 10.0, 4.0, 9.0, 11.0, 13.0, 12.0, 15.0, 16.0, 29.0, 22.0, 27.0, 21.0, 35.0, 41.0, 33.0, 40.0, 46.0, 39.0, 45.0, 51.0, 31.0, 44.0, 52.0, 47.0, 44.0, 34.0, 27.0, 29.0, 35.0, 29.0, 18.0, 20.0, 15.0, 11.0, 10.0, 10.0, 11.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.48150634765625, -6.2755126953125, -6.06951904296875, -5.863525390625, -5.65753173828125, -5.4515380859375, -5.24554443359375, -5.03955078125, -4.83355712890625, -4.6275634765625, -4.42156982421875, -4.215576171875, -4.00958251953125, -3.8035888671875, -3.59759521484375, -3.3916015625, -3.18560791015625, -2.9796142578125, -2.77362060546875, -2.567626953125, -2.36163330078125, -2.1556396484375, -1.94964599609375, -1.74365234375, -1.53765869140625, -1.3316650390625, -1.12567138671875, -0.919677734375, -0.71368408203125, -0.5076904296875, -0.30169677734375, -0.095703125, 0.11029052734375, 0.3162841796875, 0.52227783203125, 0.728271484375, 0.93426513671875, 1.1402587890625, 1.34625244140625, 1.55224609375, 1.75823974609375, 1.9642333984375, 2.17022705078125, 2.376220703125, 2.58221435546875, 2.7882080078125, 2.99420166015625, 3.2001953125, 3.40618896484375, 3.6121826171875, 3.81817626953125, 4.024169921875, 4.23016357421875, 4.4361572265625, 4.64215087890625, 4.84814453125, 5.05413818359375, 5.2601318359375, 5.46612548828125, 5.672119140625, 5.87811279296875, 6.0841064453125, 6.29010009765625, 6.49609375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 8.0, 14.0, 16.0, 28.0, 39.0, 47.0, 87.0, 115.0, 150.0, 229.0, 298.0, 493.0, 730.0, 1093.0, 1545.0, 2266.0, 3231.0, 4886.0, 6998.0, 10406.0, 15536.0, 23018.0, 34757.0, 53455.0, 83133.0, 129901.0, 194971.0, 168794.0, 108059.0, 69322.0, 44760.0, 29310.0, 19771.0, 13135.0, 8878.0, 6074.0, 4118.0, 2789.0, 1916.0, 1361.0, 858.0, 622.0, 387.0, 316.0, 184.0, 147.0, 81.0, 74.0, 42.0, 34.0, 24.0, 17.0, 15.0, 4.0, 2.0, 4.0, 4.0], "bins": [-0.85888671875, -0.8334732055664062, -0.8080596923828125, -0.7826461791992188, -0.757232666015625, -0.7318191528320312, -0.7064056396484375, -0.6809921264648438, -0.65557861328125, -0.6301651000976562, -0.6047515869140625, -0.5793380737304688, -0.553924560546875, -0.5285110473632812, -0.5030975341796875, -0.47768402099609375, -0.4522705078125, -0.42685699462890625, -0.4014434814453125, -0.37602996826171875, -0.350616455078125, -0.32520294189453125, -0.2997894287109375, -0.27437591552734375, -0.24896240234375, -0.22354888916015625, -0.1981353759765625, -0.17272186279296875, -0.147308349609375, -0.12189483642578125, -0.0964813232421875, -0.07106781005859375, -0.045654296875, -0.02024078369140625, 0.0051727294921875, 0.03058624267578125, 0.055999755859375, 0.08141326904296875, 0.1068267822265625, 0.13224029541015625, 0.15765380859375, 0.18306732177734375, 0.2084808349609375, 0.23389434814453125, 0.259307861328125, 0.28472137451171875, 0.3101348876953125, 0.33554840087890625, 0.3609619140625, 0.38637542724609375, 0.4117889404296875, 0.43720245361328125, 0.462615966796875, 0.48802947998046875, 0.5134429931640625, 0.5388565063476562, 0.56427001953125, 0.5896835327148438, 0.6150970458984375, 0.6405105590820312, 0.665924072265625, 0.6913375854492188, 0.7167510986328125, 0.7421646118164062, 0.767578125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 0.0, 6.0, 3.0, 4.0, 6.0, 5.0, 8.0, 10.0, 13.0, 9.0, 13.0, 15.0, 29.0, 15.0, 27.0, 26.0, 34.0, 41.0, 42.0, 35.0, 38.0, 42.0, 29.0, 45.0, 32.0, 1072.0, 43.0, 35.0, 42.0, 31.0, 25.0, 31.0, 29.0, 23.0, 25.0, 32.0, 17.0, 17.0, 12.0, 16.0, 13.0, 8.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.578125, -3.45892333984375, -3.3397216796875, -3.22052001953125, -3.101318359375, -2.98211669921875, -2.8629150390625, -2.74371337890625, -2.62451171875, -2.50531005859375, -2.3861083984375, -2.26690673828125, -2.147705078125, -2.02850341796875, -1.9093017578125, -1.79010009765625, -1.6708984375, -1.55169677734375, -1.4324951171875, -1.31329345703125, -1.194091796875, -1.07489013671875, -0.9556884765625, -0.83648681640625, -0.71728515625, -0.59808349609375, -0.4788818359375, -0.35968017578125, -0.240478515625, -0.12127685546875, -0.0020751953125, 0.11712646484375, 0.236328125, 0.35552978515625, 0.4747314453125, 0.59393310546875, 0.713134765625, 0.83233642578125, 0.9515380859375, 1.07073974609375, 1.18994140625, 1.30914306640625, 1.4283447265625, 1.54754638671875, 1.666748046875, 1.78594970703125, 1.9051513671875, 2.02435302734375, 2.1435546875, 2.26275634765625, 2.3819580078125, 2.50115966796875, 2.620361328125, 2.73956298828125, 2.8587646484375, 2.97796630859375, 3.09716796875, 3.21636962890625, 3.3355712890625, 3.45477294921875, 3.573974609375, 3.69317626953125, 3.8123779296875, 3.93157958984375, 4.05078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 14.0, 20.0, 25.0, 37.0, 59.0, 91.0, 168.0, 208.0, 324.0, 524.0, 803.0, 1189.0, 1887.0, 2908.0, 4392.0, 6967.0, 10612.0, 16581.0, 25456.0, 40176.0, 63115.0, 100232.0, 156474.0, 1251585.0, 150536.0, 95168.0, 60107.0, 38257.0, 24304.0, 15801.0, 10185.0, 6650.0, 4226.0, 2780.0, 1878.0, 1214.0, 757.0, 547.0, 315.0, 180.0, 132.0, 97.0, 49.0, 35.0, 31.0, 16.0, 6.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.728515625, -0.70458984375, -0.6806640625, -0.65673828125, -0.6328125, -0.60888671875, -0.5849609375, -0.56103515625, -0.537109375, -0.51318359375, -0.4892578125, -0.46533203125, -0.44140625, -0.41748046875, -0.3935546875, -0.36962890625, -0.345703125, -0.32177734375, -0.2978515625, -0.27392578125, -0.25, -0.22607421875, -0.2021484375, -0.17822265625, -0.154296875, -0.13037109375, -0.1064453125, -0.08251953125, -0.05859375, -0.03466796875, -0.0107421875, 0.01318359375, 0.037109375, 0.06103515625, 0.0849609375, 0.10888671875, 0.1328125, 0.15673828125, 0.1806640625, 0.20458984375, 0.228515625, 0.25244140625, 0.2763671875, 0.30029296875, 0.32421875, 0.34814453125, 0.3720703125, 0.39599609375, 0.419921875, 0.44384765625, 0.4677734375, 0.49169921875, 0.515625, 0.53955078125, 0.5634765625, 0.58740234375, 0.611328125, 0.63525390625, 0.6591796875, 0.68310546875, 0.70703125, 0.73095703125, 0.7548828125, 0.77880859375, 0.802734375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 8.0, 5.0, 8.0, 14.0, 14.0, 11.0, 27.0, 20.0, 30.0, 32.0, 53.0, 42.0, 48.0, 78.0, 76.0, 60.0, 55.0, 65.0, 60.0, 56.0, 37.0, 35.0, 38.0, 27.0, 22.0, 14.0, 11.0, 10.0, 13.0, 10.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014467239379882812, -0.001399114727973938, -0.0013515055179595947, -0.0013038963079452515, -0.0012562870979309082, -0.001208677887916565, -0.0011610686779022217, -0.0011134594678878784, -0.0010658502578735352, -0.001018241047859192, -0.0009706318378448486, -0.0009230226278305054, -0.0008754134178161621, -0.0008278042078018188, -0.0007801949977874756, -0.0007325857877731323, -0.0006849765777587891, -0.0006373673677444458, -0.0005897581577301025, -0.0005421489477157593, -0.000494539737701416, -0.00044693052768707275, -0.0003993213176727295, -0.00035171210765838623, -0.00030410289764404297, -0.0002564936876296997, -0.00020888447761535645, -0.00016127526760101318, -0.00011366605758666992, -6.605684757232666e-05, -1.84476375579834e-05, 2.9161572456359863e-05, 7.677078247070312e-05, 0.0001243799924850464, 0.00017198920249938965, 0.0002195984125137329, 0.00026720762252807617, 0.00031481683254241943, 0.0003624260425567627, 0.00041003525257110596, 0.0004576444625854492, 0.0005052536725997925, 0.0005528628826141357, 0.000600472092628479, 0.0006480813026428223, 0.0006956905126571655, 0.0007432997226715088, 0.000790908932685852, 0.0008385181427001953, 0.0008861273527145386, 0.0009337365627288818, 0.000981345772743225, 0.0010289549827575684, 0.0010765641927719116, 0.0011241734027862549, 0.0011717826128005981, 0.0012193918228149414, 0.0012670010328292847, 0.001314610242843628, 0.0013622194528579712, 0.0014098286628723145, 0.0014574378728866577, 0.001505047082901001, 0.0015526562929153442, 0.0016002655029296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 8.0, 9.0, 8.0, 16.0, 28.0, 37.0, 53.0, 85.0, 105.0, 148.0, 227.0, 380.0, 1016.0, 243418.0, 800426.0, 1392.0, 428.0, 220.0, 177.0, 114.0, 59.0, 50.0, 37.0, 29.0, 19.0, 19.0, 12.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.039879560470581055, -0.03877401351928711, -0.037668466567993164, -0.03656291961669922, -0.03545737266540527, -0.03435182571411133, -0.03324627876281738, -0.03214073181152344, -0.031035184860229492, -0.029929637908935547, -0.0288240909576416, -0.027718544006347656, -0.02661299705505371, -0.025507450103759766, -0.02440190315246582, -0.023296356201171875, -0.02219080924987793, -0.021085262298583984, -0.01997971534729004, -0.018874168395996094, -0.01776862144470215, -0.016663074493408203, -0.015557527542114258, -0.014451980590820312, -0.013346433639526367, -0.012240886688232422, -0.011135339736938477, -0.010029792785644531, -0.008924245834350586, -0.00781869888305664, -0.006713151931762695, -0.00560760498046875, -0.004502058029174805, -0.0033965110778808594, -0.002290964126586914, -0.0011854171752929688, -7.987022399902344e-05, 0.0010256767272949219, 0.002131223678588867, 0.0032367706298828125, 0.004342317581176758, 0.005447864532470703, 0.0065534114837646484, 0.007658958435058594, 0.008764505386352539, 0.009870052337646484, 0.01097559928894043, 0.012081146240234375, 0.01318669319152832, 0.014292240142822266, 0.015397787094116211, 0.016503334045410156, 0.0176088809967041, 0.018714427947998047, 0.019819974899291992, 0.020925521850585938, 0.022031068801879883, 0.023136615753173828, 0.024242162704467773, 0.02534770965576172, 0.026453256607055664, 0.02755880355834961, 0.028664350509643555, 0.0297698974609375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 11.0, 44.0, 94.0, 236.0, 290.0, 207.0, 87.0, 29.0, 11.0, 2.0, 2.0], "bins": [-0.0037928707897663116, -0.0037267417646944523, -0.003660612739622593, -0.00359448348172009, -0.0035283544566482306, -0.003462225431576371, -0.003396096173673868, -0.003329967148602009, -0.0032638381235301495, -0.00319770909845829, -0.0031315800733864307, -0.0030654508154839277, -0.0029993217904120684, -0.002933192765340209, -0.002867063507437706, -0.0028009344823658466, -0.0027348054572939873, -0.002668676432222128, -0.0026025474071502686, -0.0025364181492477655, -0.002470289124175906, -0.002404160099104047, -0.002338030841201544, -0.0022719018161296844, -0.002205772791057825, -0.0021396437659859657, -0.0020735147409141064, -0.0020073854830116034, -0.001941256457939744, -0.0018751274328678846, -0.0018089982913807034, -0.0017428691498935223, -0.001676740124821663, -0.0016106110997498035, -0.0015444819582626224, -0.0014783528167754412, -0.0014122237917035818, -0.0013460947666317225, -0.0012799656251445413, -0.00121383648365736, -0.0011477074585855007, -0.0010815784335136414, -0.0010154492920264602, -0.0009493202087469399, -0.0008831911254674196, -0.0008170620421878994, -0.0007509329589083791, -0.0006848038756288588, -0.0006186748505569994, -0.0005525457672774792, -0.0004864166839979589, -0.0004202876007184386, -0.00035415851743891835, -0.0002880294341593981, -0.0002219003508798778, -0.00015577126760035753, -8.964218432083726e-05, -2.3513101041316986e-05, 4.261598223820329e-05, 0.00010874506551772356, 0.00017487414879724383, 0.0002410032320767641, 0.0003071323153562844, 0.00037326139863580465, 0.0004393904819153249]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 6.0, 7.0, 14.0, 11.0, 5.0, 11.0, 16.0, 19.0, 17.0, 26.0, 29.0, 25.0, 23.0, 24.0, 21.0, 34.0, 34.0, 27.0, 30.0, 33.0, 28.0, 42.0, 32.0, 34.0, 31.0, 38.0, 31.0, 40.0, 20.0, 39.0, 33.0, 22.0, 22.0, 13.0, 15.0, 25.0, 15.0, 13.0, 11.0, 16.0, 13.0, 11.0, 7.0, 6.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.000608980655670166, -0.000590234063565731, -0.0005714874714612961, -0.0005527408793568611, -0.0005339942872524261, -0.0005152476951479912, -0.0004965011030435562, -0.00047775451093912125, -0.0004590079188346863, -0.0004402613267302513, -0.00042151473462581635, -0.0004027681425213814, -0.0003840215504169464, -0.00036527495831251144, -0.0003465283662080765, -0.0003277817741036415, -0.00030903518199920654, -0.0002902885898947716, -0.0002715419977903366, -0.00025279540568590164, -0.00023404881358146667, -0.0002153022214770317, -0.00019655562937259674, -0.00017780903726816177, -0.0001590624451637268, -0.00014031585305929184, -0.00012156926095485687, -0.0001028226688504219, -8.407607674598694e-05, -6.532948464155197e-05, -4.6582892537117004e-05, -2.7836300432682037e-05, -9.08970832824707e-06, 9.656883776187897e-06, 2.8403475880622864e-05, 4.715006798505783e-05, 6.58966600894928e-05, 8.464325219392776e-05, 0.00010338984429836273, 0.0001221364364027977, 0.00014088302850723267, 0.00015962962061166763, 0.0001783762127161026, 0.00019712280482053757, 0.00021586939692497253, 0.0002346159890294075, 0.00025336258113384247, 0.00027210917323827744, 0.0002908557653427124, 0.00030960235744714737, 0.00032834894955158234, 0.0003470955416560173, 0.00036584213376045227, 0.00038458872586488724, 0.0004033353179693222, 0.00042208191007375717, 0.00044082850217819214, 0.0004595750942826271, 0.00047832168638706207, 0.000497068278491497, 0.000515814870595932, 0.000534561462700367, 0.0005533080548048019, 0.0005720546469092369, 0.0005908012390136719]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 10.0, 4.0, 9.0, 11.0, 13.0, 12.0, 15.0, 16.0, 29.0, 22.0, 27.0, 21.0, 35.0, 41.0, 33.0, 40.0, 46.0, 39.0, 45.0, 51.0, 31.0, 44.0, 52.0, 46.0, 45.0, 34.0, 27.0, 29.0, 35.0, 29.0, 18.0, 20.0, 15.0, 11.0, 10.0, 10.0, 11.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.48150634765625, -6.2755126953125, -6.06951904296875, -5.863525390625, -5.65753173828125, -5.4515380859375, -5.24554443359375, -5.03955078125, -4.83355712890625, -4.6275634765625, -4.42156982421875, -4.215576171875, -4.00958251953125, -3.8035888671875, -3.59759521484375, -3.3916015625, -3.18560791015625, -2.9796142578125, -2.77362060546875, -2.567626953125, -2.36163330078125, -2.1556396484375, -1.94964599609375, -1.74365234375, -1.53765869140625, -1.3316650390625, -1.12567138671875, -0.919677734375, -0.71368408203125, -0.5076904296875, -0.30169677734375, -0.095703125, 0.11029052734375, 0.3162841796875, 0.52227783203125, 0.728271484375, 0.93426513671875, 1.1402587890625, 1.34625244140625, 1.55224609375, 1.75823974609375, 1.9642333984375, 2.17022705078125, 2.376220703125, 2.58221435546875, 2.7882080078125, 2.99420166015625, 3.2001953125, 3.40618896484375, 3.6121826171875, 3.81817626953125, 4.024169921875, 4.23016357421875, 4.4361572265625, 4.64215087890625, 4.84814453125, 5.05413818359375, 5.2601318359375, 5.46612548828125, 5.672119140625, 5.87811279296875, 6.0841064453125, 6.29010009765625, 6.49609375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 9.0, 6.0, 9.0, 22.0, 14.0, 31.0, 40.0, 52.0, 74.0, 122.0, 145.0, 224.0, 353.0, 512.0, 817.0, 1328.0, 2160.0, 3745.0, 7003.0, 14664.0, 37347.0, 118126.0, 416637.0, 307477.0, 83308.0, 28204.0, 11842.0, 5972.0, 3203.0, 1832.0, 1119.0, 700.0, 482.0, 311.0, 208.0, 135.0, 110.0, 46.0, 42.0, 42.0, 29.0, 15.0, 11.0, 4.0, 7.0, 7.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0078125, -3.88201904296875, -3.7562255859375, -3.63043212890625, -3.504638671875, -3.37884521484375, -3.2530517578125, -3.12725830078125, -3.00146484375, -2.87567138671875, -2.7498779296875, -2.62408447265625, -2.498291015625, -2.37249755859375, -2.2467041015625, -2.12091064453125, -1.9951171875, -1.86932373046875, -1.7435302734375, -1.61773681640625, -1.491943359375, -1.36614990234375, -1.2403564453125, -1.11456298828125, -0.98876953125, -0.86297607421875, -0.7371826171875, -0.61138916015625, -0.485595703125, -0.35980224609375, -0.2340087890625, -0.10821533203125, 0.017578125, 0.14337158203125, 0.2691650390625, 0.39495849609375, 0.520751953125, 0.64654541015625, 0.7723388671875, 0.89813232421875, 1.02392578125, 1.14971923828125, 1.2755126953125, 1.40130615234375, 1.527099609375, 1.65289306640625, 1.7786865234375, 1.90447998046875, 2.0302734375, 2.15606689453125, 2.2818603515625, 2.40765380859375, 2.533447265625, 2.65924072265625, 2.7850341796875, 2.91082763671875, 3.03662109375, 3.16241455078125, 3.2882080078125, 3.41400146484375, 3.539794921875, 3.66558837890625, 3.7913818359375, 3.91717529296875, 4.04296875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 6.0, 11.0, 10.0, 9.0, 15.0, 14.0, 15.0, 19.0, 22.0, 27.0, 34.0, 38.0, 51.0, 39.0, 41.0, 55.0, 80.0, 1584.0, 491.0, 76.0, 47.0, 42.0, 33.0, 32.0, 43.0, 30.0, 33.0, 20.0, 26.0, 23.0, 19.0, 12.0, 14.0, 7.0, 5.0, 8.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.9375, -22.17236328125, -21.4072265625, -20.64208984375, -19.876953125, -19.11181640625, -18.3466796875, -17.58154296875, -16.81640625, -16.05126953125, -15.2861328125, -14.52099609375, -13.755859375, -12.99072265625, -12.2255859375, -11.46044921875, -10.6953125, -9.93017578125, -9.1650390625, -8.39990234375, -7.634765625, -6.86962890625, -6.1044921875, -5.33935546875, -4.57421875, -3.80908203125, -3.0439453125, -2.27880859375, -1.513671875, -0.74853515625, 0.0166015625, 0.78173828125, 1.546875, 2.31201171875, 3.0771484375, 3.84228515625, 4.607421875, 5.37255859375, 6.1376953125, 6.90283203125, 7.66796875, 8.43310546875, 9.1982421875, 9.96337890625, 10.728515625, 11.49365234375, 12.2587890625, 13.02392578125, 13.7890625, 14.55419921875, 15.3193359375, 16.08447265625, 16.849609375, 17.61474609375, 18.3798828125, 19.14501953125, 19.91015625, 20.67529296875, 21.4404296875, 22.20556640625, 22.970703125, 23.73583984375, 24.5009765625, 25.26611328125, 26.03125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 6.0, 10.0, 18.0, 22.0, 22.0, 30.0, 36.0, 36.0, 58.0, 71.0, 92.0, 152.0, 285.0, 554.0, 2765.0, 573221.0, 2563095.0, 3719.0, 618.0, 288.0, 139.0, 100.0, 81.0, 63.0, 49.0, 29.0, 20.0, 24.0, 10.0, 11.0, 13.0, 8.0, 10.0, 10.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-42.21875, -40.97900390625, -39.7392578125, -38.49951171875, -37.259765625, -36.02001953125, -34.7802734375, -33.54052734375, -32.30078125, -31.06103515625, -29.8212890625, -28.58154296875, -27.341796875, -26.10205078125, -24.8623046875, -23.62255859375, -22.3828125, -21.14306640625, -19.9033203125, -18.66357421875, -17.423828125, -16.18408203125, -14.9443359375, -13.70458984375, -12.46484375, -11.22509765625, -9.9853515625, -8.74560546875, -7.505859375, -6.26611328125, -5.0263671875, -3.78662109375, -2.546875, -1.30712890625, -0.0673828125, 1.17236328125, 2.412109375, 3.65185546875, 4.8916015625, 6.13134765625, 7.37109375, 8.61083984375, 9.8505859375, 11.09033203125, 12.330078125, 13.56982421875, 14.8095703125, 16.04931640625, 17.2890625, 18.52880859375, 19.7685546875, 21.00830078125, 22.248046875, 23.48779296875, 24.7275390625, 25.96728515625, 27.20703125, 28.44677734375, 29.6865234375, 30.92626953125, 32.166015625, 33.40576171875, 34.6455078125, 35.88525390625, 37.125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [5.0, 167.0, 768.0, 78.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.039982795715332, -5.830307483673096, -1.6206321716308594, 2.589043617248535, 6.798718452453613, 11.008393287658691, 15.218070030212402, 19.427745819091797, 23.637420654296875, 27.847095489501953, 32.05677032470703, 36.266448974609375, 40.47611999511719, 44.68579864501953, 48.89547348022461, 53.10514831542969, 57.314823150634766, 61.524497985839844, 65.73417663574219, 69.94384765625, 74.15352630615234, 78.36319732666016, 82.5728759765625, 86.78254699707031, 90.99222564697266, 95.201904296875, 99.41157531738281, 103.62125396728516, 107.83092498779297, 112.04060363769531, 116.25027465820312, 120.45995330810547, 124.66963195800781, 128.87930297851562, 133.0889892578125, 137.2986602783203, 141.50833129882812, 145.71800231933594, 149.9276885986328, 154.13735961914062, 158.34703063964844, 162.55670166015625, 166.76638793945312, 170.97605895996094, 175.18572998046875, 179.39540100097656, 183.60508728027344, 187.81475830078125, 192.02444458007812, 196.23411560058594, 200.4438018798828, 204.65347290039062, 208.86314392089844, 213.07281494140625, 217.28250122070312, 221.49217224121094, 225.70184326171875, 229.91151428222656, 234.12120056152344, 238.33087158203125, 242.54054260253906, 246.75021362304688, 250.95989990234375, 255.16957092285156, 259.3792419433594]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 8.0, 7.0, 2.0, 7.0, 3.0, 13.0, 7.0, 11.0, 13.0, 19.0, 21.0, 17.0, 16.0, 25.0, 21.0, 24.0, 31.0, 30.0, 24.0, 37.0, 37.0, 41.0, 39.0, 48.0, 35.0, 40.0, 45.0, 43.0, 25.0, 41.0, 44.0, 28.0, 22.0, 20.0, 27.0, 13.0, 15.0, 9.0, 14.0, 17.0, 18.0, 14.0, 7.0, 3.0, 5.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-72.71269226074219, -70.53578186035156, -68.35887145996094, -66.18196105957031, -64.00505065917969, -61.82814025878906, -59.6512336730957, -57.47432327270508, -55.29741287231445, -53.12050247192383, -50.9435920715332, -48.76668167114258, -46.58977508544922, -44.412864685058594, -42.23595428466797, -40.059043884277344, -37.88213348388672, -35.705223083496094, -33.52831268310547, -31.351404190063477, -29.17449378967285, -26.997583389282227, -24.820674896240234, -22.64376449584961, -20.466854095458984, -18.28994369506836, -16.113033294677734, -13.936124801635742, -11.759214401245117, -9.582304000854492, -7.405394554138184, -5.228485107421875, -3.0515823364257812, -0.8746724128723145, 1.3022375106811523, 3.479147434234619, 5.656057357788086, 7.832967758178711, 10.00987720489502, 12.186786651611328, 14.363697052001953, 16.540607452392578, 18.717517852783203, 20.894426345825195, 23.07133674621582, 25.248247146606445, 27.425155639648438, 29.602066040039062, 31.778976440429688, 33.95588684082031, 36.13279724121094, 38.30970764160156, 40.48661804199219, 42.66352844238281, 44.84043502807617, 47.0173454284668, 49.19425582885742, 51.37116622924805, 53.54807662963867, 55.7249870300293, 57.901893615722656, 60.07880401611328, 62.255714416503906, 64.43262481689453, 66.60953521728516]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 5.0, 10.0, 10.0, 13.0, 16.0, 10.0, 19.0, 24.0, 19.0, 34.0, 26.0, 31.0, 33.0, 39.0, 36.0, 43.0, 52.0, 32.0, 43.0, 45.0, 47.0, 48.0, 36.0, 47.0, 40.0, 20.0, 33.0, 31.0, 28.0, 24.0, 21.0, 15.0, 9.0, 10.0, 11.0, 12.0, 5.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71875, -6.51177978515625, -6.3048095703125, -6.09783935546875, -5.890869140625, -5.68389892578125, -5.4769287109375, -5.26995849609375, -5.06298828125, -4.85601806640625, -4.6490478515625, -4.44207763671875, -4.235107421875, -4.02813720703125, -3.8211669921875, -3.61419677734375, -3.4072265625, -3.20025634765625, -2.9932861328125, -2.78631591796875, -2.579345703125, -2.37237548828125, -2.1654052734375, -1.95843505859375, -1.75146484375, -1.54449462890625, -1.3375244140625, -1.13055419921875, -0.923583984375, -0.71661376953125, -0.5096435546875, -0.30267333984375, -0.095703125, 0.11126708984375, 0.3182373046875, 0.52520751953125, 0.732177734375, 0.93914794921875, 1.1461181640625, 1.35308837890625, 1.56005859375, 1.76702880859375, 1.9739990234375, 2.18096923828125, 2.387939453125, 2.59490966796875, 2.8018798828125, 3.00885009765625, 3.2158203125, 3.42279052734375, 3.6297607421875, 3.83673095703125, 4.043701171875, 4.25067138671875, 4.4576416015625, 4.66461181640625, 4.87158203125, 5.07855224609375, 5.2855224609375, 5.49249267578125, 5.699462890625, 5.90643310546875, 6.1134033203125, 6.32037353515625, 6.52734375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 12.0, 13.0, 17.0, 16.0, 17.0, 15.0, 26.0, 28.0, 45.0, 76.0, 111.0, 193.0, 390.0, 1623.0, 8971.0, 108092.0, 2442870.0, 1564272.0, 59460.0, 6003.0, 1107.0, 376.0, 171.0, 94.0, 65.0, 37.0, 29.0, 37.0, 14.0, 16.0, 7.0, 15.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.140625, -20.498046875, -19.85546875, -19.212890625, -18.5703125, -17.927734375, -17.28515625, -16.642578125, -16.0, -15.357421875, -14.71484375, -14.072265625, -13.4296875, -12.787109375, -12.14453125, -11.501953125, -10.859375, -10.216796875, -9.57421875, -8.931640625, -8.2890625, -7.646484375, -7.00390625, -6.361328125, -5.71875, -5.076171875, -4.43359375, -3.791015625, -3.1484375, -2.505859375, -1.86328125, -1.220703125, -0.578125, 0.064453125, 0.70703125, 1.349609375, 1.9921875, 2.634765625, 3.27734375, 3.919921875, 4.5625, 5.205078125, 5.84765625, 6.490234375, 7.1328125, 7.775390625, 8.41796875, 9.060546875, 9.703125, 10.345703125, 10.98828125, 11.630859375, 12.2734375, 12.916015625, 13.55859375, 14.201171875, 14.84375, 15.486328125, 16.12890625, 16.771484375, 17.4140625, 18.056640625, 18.69921875, 19.341796875, 19.984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 12.0, 21.0, 22.0, 33.0, 63.0, 101.0, 127.0, 196.0, 268.0, 441.0, 569.0, 624.0, 524.0, 380.0, 231.0, 148.0, 99.0, 74.0, 42.0, 32.0, 26.0, 11.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.546875, -23.848876953125, -23.15087890625, -22.452880859375, -21.7548828125, -21.056884765625, -20.35888671875, -19.660888671875, -18.962890625, -18.264892578125, -17.56689453125, -16.868896484375, -16.1708984375, -15.472900390625, -14.77490234375, -14.076904296875, -13.37890625, -12.680908203125, -11.98291015625, -11.284912109375, -10.5869140625, -9.888916015625, -9.19091796875, -8.492919921875, -7.794921875, -7.096923828125, -6.39892578125, -5.700927734375, -5.0029296875, -4.304931640625, -3.60693359375, -2.908935546875, -2.2109375, -1.512939453125, -0.81494140625, -0.116943359375, 0.5810546875, 1.279052734375, 1.97705078125, 2.675048828125, 3.373046875, 4.071044921875, 4.76904296875, 5.467041015625, 6.1650390625, 6.863037109375, 7.56103515625, 8.259033203125, 8.95703125, 9.655029296875, 10.35302734375, 11.051025390625, 11.7490234375, 12.447021484375, 13.14501953125, 13.843017578125, 14.541015625, 15.239013671875, 15.93701171875, 16.635009765625, 17.3330078125, 18.031005859375, 18.72900390625, 19.427001953125, 20.125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 3.0, 5.0, 8.0, 18.0, 18.0, 24.0, 36.0, 52.0, 70.0, 97.0, 136.0, 193.0, 345.0, 944.0, 6419.0, 1688217.0, 2487962.0, 7783.0, 932.0, 327.0, 207.0, 134.0, 94.0, 71.0, 52.0, 37.0, 25.0, 24.0, 19.0, 5.0, 5.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.78125, -50.58447265625, -48.3876953125, -46.19091796875, -43.994140625, -41.79736328125, -39.6005859375, -37.40380859375, -35.20703125, -33.01025390625, -30.8134765625, -28.61669921875, -26.419921875, -24.22314453125, -22.0263671875, -19.82958984375, -17.6328125, -15.43603515625, -13.2392578125, -11.04248046875, -8.845703125, -6.64892578125, -4.4521484375, -2.25537109375, -0.05859375, 2.13818359375, 4.3349609375, 6.53173828125, 8.728515625, 10.92529296875, 13.1220703125, 15.31884765625, 17.515625, 19.71240234375, 21.9091796875, 24.10595703125, 26.302734375, 28.49951171875, 30.6962890625, 32.89306640625, 35.08984375, 37.28662109375, 39.4833984375, 41.68017578125, 43.876953125, 46.07373046875, 48.2705078125, 50.46728515625, 52.6640625, 54.86083984375, 57.0576171875, 59.25439453125, 61.451171875, 63.64794921875, 65.8447265625, 68.04150390625, 70.23828125, 72.43505859375, 74.6318359375, 76.82861328125, 79.025390625, 81.22216796875, 83.4189453125, 85.61572265625, 87.8125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 12.0, 46.0, 105.0, 197.0, 272.0, 196.0, 111.0, 52.0, 13.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.05514526367188, -158.57041931152344, -154.08570861816406, -149.60098266601562, -145.11627197265625, -140.6315460205078, -136.14682006835938, -131.662109375, -127.17738342285156, -122.69266510009766, -118.20794677734375, -113.72322082519531, -109.2385025024414, -104.7537841796875, -100.26905822753906, -95.78433990478516, -91.29962158203125, -86.81490325927734, -82.33018493652344, -77.845458984375, -73.3607406616211, -68.87602233886719, -64.39129638671875, -59.906578063964844, -55.42185974121094, -50.93714141845703, -46.45241928100586, -41.96769714355469, -37.48297882080078, -32.998260498046875, -28.513538360595703, -24.028818130493164, -19.544097900390625, -15.059377670288086, -10.574657440185547, -6.089937210083008, -1.6052169799804688, 2.8795032501220703, 7.364223480224609, 11.848943710327148, 16.333663940429688, 20.818384170532227, 25.303104400634766, 29.787824630737305, 34.272544860839844, 38.75726318359375, 43.24198532104492, 47.726707458496094, 52.21142578125, 56.696144104003906, 61.18086624145508, 65.66558837890625, 70.15030670166016, 74.63502502441406, 79.1197509765625, 83.6044692993164, 88.08918762207031, 92.57390594482422, 97.05862426757812, 101.54335021972656, 106.02806854248047, 110.51278686523438, 114.99751281738281, 119.48223114013672, 123.96694946289062]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 7.0, 11.0, 8.0, 13.0, 11.0, 21.0, 20.0, 22.0, 22.0, 20.0, 25.0, 30.0, 26.0, 26.0, 28.0, 37.0, 36.0, 43.0, 37.0, 32.0, 31.0, 41.0, 44.0, 44.0, 41.0, 35.0, 23.0, 30.0, 24.0, 22.0, 22.0, 21.0, 26.0, 20.0, 20.0, 16.0, 10.0, 10.0, 10.0, 5.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.805999755859375, -49.17817687988281, -47.550350189208984, -45.922523498535156, -44.294700622558594, -42.66687774658203, -41.0390510559082, -39.411224365234375, -37.78340148925781, -36.15557861328125, -34.52775192260742, -32.899925231933594, -31.27210235595703, -29.644277572631836, -28.01645278930664, -26.388628005981445, -24.76080322265625, -23.132978439331055, -21.50515365600586, -19.877328872680664, -18.24950408935547, -16.621679306030273, -14.993854522705078, -13.366029739379883, -11.738204956054688, -10.110380172729492, -8.482555389404297, -6.854730606079102, -5.226905822753906, -3.599081039428711, -1.9712562561035156, -0.3434314727783203, 1.284393310546875, 2.9122180938720703, 4.540042877197266, 6.167867660522461, 7.795692443847656, 9.423517227172852, 11.051342010498047, 12.679166793823242, 14.306991577148438, 15.934816360473633, 17.562641143798828, 19.190465927124023, 20.81829071044922, 22.446115493774414, 24.07394027709961, 25.701765060424805, 27.32958984375, 28.957414627075195, 30.58523941040039, 32.21306610107422, 33.84088897705078, 35.468711853027344, 37.09653854370117, 38.724365234375, 40.35218811035156, 41.980010986328125, 43.60783767700195, 45.23566436767578, 46.863487243652344, 48.491310119628906, 50.119136810302734, 51.74696350097656, 53.374786376953125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 10.0, 7.0, 17.0, 20.0, 16.0, 21.0, 19.0, 30.0, 25.0, 34.0, 29.0, 31.0, 39.0, 41.0, 36.0, 35.0, 46.0, 43.0, 48.0, 39.0, 37.0, 40.0, 32.0, 29.0, 37.0, 29.0, 35.0, 21.0, 23.0, 11.0, 15.0, 21.0, 9.0, 9.0, 12.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.68359375, -6.48138427734375, -6.2791748046875, -6.07696533203125, -5.874755859375, -5.67254638671875, -5.4703369140625, -5.26812744140625, -5.06591796875, -4.86370849609375, -4.6614990234375, -4.45928955078125, -4.257080078125, -4.05487060546875, -3.8526611328125, -3.65045166015625, -3.4482421875, -3.24603271484375, -3.0438232421875, -2.84161376953125, -2.639404296875, -2.43719482421875, -2.2349853515625, -2.03277587890625, -1.83056640625, -1.62835693359375, -1.4261474609375, -1.22393798828125, -1.021728515625, -0.81951904296875, -0.6173095703125, -0.41510009765625, -0.212890625, -0.01068115234375, 0.1915283203125, 0.39373779296875, 0.595947265625, 0.79815673828125, 1.0003662109375, 1.20257568359375, 1.40478515625, 1.60699462890625, 1.8092041015625, 2.01141357421875, 2.213623046875, 2.41583251953125, 2.6180419921875, 2.82025146484375, 3.0224609375, 3.22467041015625, 3.4268798828125, 3.62908935546875, 3.831298828125, 4.03350830078125, 4.2357177734375, 4.43792724609375, 4.64013671875, 4.84234619140625, 5.0445556640625, 5.24676513671875, 5.448974609375, 5.65118408203125, 5.8533935546875, 6.05560302734375, 6.2578125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 6.0, 5.0, 12.0, 20.0, 25.0, 26.0, 43.0, 66.0, 100.0, 154.0, 188.0, 256.0, 410.0, 610.0, 863.0, 1221.0, 1764.0, 2702.0, 3810.0, 5770.0, 8495.0, 12696.0, 19409.0, 29798.0, 46139.0, 72337.0, 113949.0, 180878.0, 196869.0, 125031.0, 78774.0, 50229.0, 32163.0, 21011.0, 13904.0, 9401.0, 6178.0, 4119.0, 2787.0, 1977.0, 1382.0, 888.0, 647.0, 432.0, 324.0, 198.0, 159.0, 113.0, 78.0, 52.0, 32.0, 26.0, 11.0, 12.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0], "bins": [-0.86572265625, -0.8387527465820312, -0.8117828369140625, -0.7848129272460938, -0.757843017578125, -0.7308731079101562, -0.7039031982421875, -0.6769332885742188, -0.64996337890625, -0.6229934692382812, -0.5960235595703125, -0.5690536499023438, -0.542083740234375, -0.5151138305664062, -0.4881439208984375, -0.46117401123046875, -0.4342041015625, -0.40723419189453125, -0.3802642822265625, -0.35329437255859375, -0.326324462890625, -0.29935455322265625, -0.2723846435546875, -0.24541473388671875, -0.21844482421875, -0.19147491455078125, -0.1645050048828125, -0.13753509521484375, -0.110565185546875, -0.08359527587890625, -0.0566253662109375, -0.02965545654296875, -0.002685546875, 0.02428436279296875, 0.0512542724609375, 0.07822418212890625, 0.105194091796875, 0.13216400146484375, 0.1591339111328125, 0.18610382080078125, 0.21307373046875, 0.24004364013671875, 0.2670135498046875, 0.29398345947265625, 0.320953369140625, 0.34792327880859375, 0.3748931884765625, 0.40186309814453125, 0.4288330078125, 0.45580291748046875, 0.4827728271484375, 0.5097427368164062, 0.536712646484375, 0.5636825561523438, 0.5906524658203125, 0.6176223754882812, 0.64459228515625, 0.6715621948242188, 0.6985321044921875, 0.7255020141601562, 0.752471923828125, 0.7794418334960938, 0.8064117431640625, 0.8333816528320312, 0.8603515625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 4.0, 5.0, 6.0, 12.0, 5.0, 7.0, 13.0, 20.0, 18.0, 29.0, 24.0, 31.0, 15.0, 33.0, 31.0, 42.0, 35.0, 33.0, 36.0, 49.0, 36.0, 1065.0, 45.0, 43.0, 43.0, 36.0, 29.0, 31.0, 20.0, 32.0, 28.0, 26.0, 19.0, 17.0, 16.0, 17.0, 14.0, 9.0, 13.0, 10.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.140625, -4.021087646484375, -3.90155029296875, -3.782012939453125, -3.6624755859375, -3.542938232421875, -3.42340087890625, -3.303863525390625, -3.184326171875, -3.064788818359375, -2.94525146484375, -2.825714111328125, -2.7061767578125, -2.586639404296875, -2.46710205078125, -2.347564697265625, -2.22802734375, -2.108489990234375, -1.98895263671875, -1.869415283203125, -1.7498779296875, -1.630340576171875, -1.51080322265625, -1.391265869140625, -1.271728515625, -1.152191162109375, -1.03265380859375, -0.913116455078125, -0.7935791015625, -0.674041748046875, -0.55450439453125, -0.434967041015625, -0.3154296875, -0.195892333984375, -0.07635498046875, 0.043182373046875, 0.1627197265625, 0.282257080078125, 0.40179443359375, 0.521331787109375, 0.640869140625, 0.760406494140625, 0.87994384765625, 0.999481201171875, 1.1190185546875, 1.238555908203125, 1.35809326171875, 1.477630615234375, 1.59716796875, 1.716705322265625, 1.83624267578125, 1.955780029296875, 2.0753173828125, 2.194854736328125, 2.31439208984375, 2.433929443359375, 2.553466796875, 2.673004150390625, 2.79254150390625, 2.912078857421875, 3.0316162109375, 3.151153564453125, 3.27069091796875, 3.390228271484375, 3.509765625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 13.0, 11.0, 11.0, 24.0, 42.0, 55.0, 91.0, 147.0, 190.0, 298.0, 419.0, 592.0, 951.0, 1467.0, 2134.0, 3223.0, 4615.0, 6981.0, 10335.0, 15839.0, 24434.0, 37499.0, 57957.0, 89813.0, 139460.0, 1247682.0, 159945.0, 102280.0, 66171.0, 43212.0, 27602.0, 17958.0, 11736.0, 7930.0, 5350.0, 3445.0, 2356.0, 1576.0, 1069.0, 741.0, 485.0, 319.0, 216.0, 173.0, 99.0, 70.0, 34.0, 31.0, 23.0, 13.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.77490234375, -0.7504196166992188, -0.7259368896484375, -0.7014541625976562, -0.676971435546875, -0.6524887084960938, -0.6280059814453125, -0.6035232543945312, -0.57904052734375, -0.5545578002929688, -0.5300750732421875, -0.5055923461914062, -0.481109619140625, -0.45662689208984375, -0.4321441650390625, -0.40766143798828125, -0.3831787109375, -0.35869598388671875, -0.3342132568359375, -0.30973052978515625, -0.285247802734375, -0.26076507568359375, -0.2362823486328125, -0.21179962158203125, -0.18731689453125, -0.16283416748046875, -0.1383514404296875, -0.11386871337890625, -0.089385986328125, -0.06490325927734375, -0.0404205322265625, -0.01593780517578125, 0.008544921875, 0.03302764892578125, 0.0575103759765625, 0.08199310302734375, 0.106475830078125, 0.13095855712890625, 0.1554412841796875, 0.17992401123046875, 0.20440673828125, 0.22888946533203125, 0.2533721923828125, 0.27785491943359375, 0.302337646484375, 0.32682037353515625, 0.3513031005859375, 0.37578582763671875, 0.4002685546875, 0.42475128173828125, 0.4492340087890625, 0.47371673583984375, 0.498199462890625, 0.5226821899414062, 0.5471649169921875, 0.5716476440429688, 0.59613037109375, 0.6206130981445312, 0.6450958251953125, 0.6695785522460938, 0.694061279296875, 0.7185440063476562, 0.7430267333984375, 0.7675094604492188, 0.7919921875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 7.0, 9.0, 7.0, 8.0, 12.0, 12.0, 11.0, 15.0, 20.0, 20.0, 27.0, 34.0, 42.0, 47.0, 61.0, 63.0, 68.0, 93.0, 74.0, 62.0, 59.0, 42.0, 27.0, 36.0, 24.0, 28.0, 25.0, 17.0, 14.0, 6.0, 8.0, 9.0, 3.0, 0.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0018682479858398438, -0.0018110424280166626, -0.0017538368701934814, -0.0016966313123703003, -0.0016394257545471191, -0.001582220196723938, -0.0015250146389007568, -0.0014678090810775757, -0.0014106035232543945, -0.0013533979654312134, -0.0012961924076080322, -0.001238986849784851, -0.00118178129196167, -0.0011245757341384888, -0.0010673701763153076, -0.0010101646184921265, -0.0009529590606689453, -0.0008957535028457642, -0.000838547945022583, -0.0007813423871994019, -0.0007241368293762207, -0.0006669312715530396, -0.0006097257137298584, -0.0005525201559066772, -0.0004953145980834961, -0.00043810904026031494, -0.0003809034824371338, -0.00032369792461395264, -0.0002664923667907715, -0.00020928680896759033, -0.00015208125114440918, -9.487569332122803e-05, -3.7670135498046875e-05, 1.9535422325134277e-05, 7.674098014831543e-05, 0.00013394653797149658, 0.00019115209579467773, 0.0002483576536178589, 0.00030556321144104004, 0.0003627687692642212, 0.00041997432708740234, 0.0004771798849105835, 0.0005343854427337646, 0.0005915910005569458, 0.000648796558380127, 0.0007060021162033081, 0.0007632076740264893, 0.0008204132318496704, 0.0008776187896728516, 0.0009348243474960327, 0.0009920299053192139, 0.001049235463142395, 0.0011064410209655762, 0.0011636465787887573, 0.0012208521366119385, 0.0012780576944351196, 0.0013352632522583008, 0.001392468810081482, 0.001449674367904663, 0.0015068799257278442, 0.0015640854835510254, 0.0016212910413742065, 0.0016784965991973877, 0.0017357021570205688, 0.00179290771484375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 11.0, 4.0, 13.0, 9.0, 23.0, 18.0, 32.0, 45.0, 60.0, 95.0, 160.0, 281.0, 647.0, 28193.0, 1016093.0, 1786.0, 430.0, 205.0, 125.0, 74.0, 43.0, 32.0, 30.0, 23.0, 21.0, 19.0, 12.0, 9.0, 8.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0372314453125, -0.035913944244384766, -0.03459644317626953, -0.0332789421081543, -0.03196144104003906, -0.030643939971923828, -0.029326438903808594, -0.02800893783569336, -0.026691436767578125, -0.02537393569946289, -0.024056434631347656, -0.022738933563232422, -0.021421432495117188, -0.020103931427001953, -0.01878643035888672, -0.017468929290771484, -0.01615142822265625, -0.014833927154541016, -0.013516426086425781, -0.012198925018310547, -0.010881423950195312, -0.009563922882080078, -0.008246421813964844, -0.006928920745849609, -0.005611419677734375, -0.004293918609619141, -0.0029764175415039062, -0.0016589164733886719, -0.0003414154052734375, 0.0009760856628417969, 0.0022935867309570312, 0.0036110877990722656, 0.0049285888671875, 0.006246089935302734, 0.007563591003417969, 0.008881092071533203, 0.010198593139648438, 0.011516094207763672, 0.012833595275878906, 0.01415109634399414, 0.015468597412109375, 0.01678609848022461, 0.018103599548339844, 0.019421100616455078, 0.020738601684570312, 0.022056102752685547, 0.02337360382080078, 0.024691104888916016, 0.02600860595703125, 0.027326107025146484, 0.02864360809326172, 0.029961109161376953, 0.03127861022949219, 0.03259611129760742, 0.033913612365722656, 0.03523111343383789, 0.036548614501953125, 0.03786611557006836, 0.039183616638183594, 0.04050111770629883, 0.04181861877441406, 0.0431361198425293, 0.04445362091064453, 0.045771121978759766, 0.047088623046875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 53.0, 427.0, 449.0, 75.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0084548844024539, -0.008292448706924915, -0.008130013011395931, -0.007967577315866947, -0.00780514208599925, -0.007642706390470266, -0.007480270694941282, -0.0073178354650735855, -0.0071553997695446014, -0.006992964074015617, -0.006830528378486633, -0.0066680931486189365, -0.0065056574530899525, -0.006343221757560968, -0.006180786062031984, -0.006018350832164288, -0.0058559151366353035, -0.005693479441106319, -0.005531043745577335, -0.005368608515709639, -0.0052061728201806545, -0.0050437371246516705, -0.004881301429122686, -0.00471886619925499, -0.004556430038064718, -0.004393994342535734, -0.00423155864700675, -0.004069123417139053, -0.003906687721610069, -0.003744252026081085, -0.003581816330552101, -0.0034193808678537607, -0.003256945637986064, -0.00309450994245708, -0.0029320744797587395, -0.0027696387842297554, -0.002607203321531415, -0.002444767626002431, -0.0022823321633040905, -0.0021198964677751064, -0.0019574607722461224, -0.0017950251931324601, -0.0016325896140187979, -0.0014701539184898138, -0.0013077184557914734, -0.0011452827602624893, -0.000982847181148827, -0.0008204116020351648, -0.0006579761393368244, -0.0004955405602231622, -0.0003331049520056695, -0.00017066934378817677, -8.233764674514532e-06, 0.0001542018144391477, 0.00031663745176047087, 0.0004790730308741331, 0.0006415086099877954, 0.0008039441891014576, 0.0009663797682151198, 0.001128815347328782, 0.0012912510428577662, 0.0014536865055561066, 0.0016161222010850906, 0.0017785577801987529, 0.0019409933593124151]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 9.0, 6.0, 1.0, 5.0, 9.0, 5.0, 10.0, 22.0, 19.0, 24.0, 21.0, 25.0, 32.0, 31.0, 30.0, 30.0, 34.0, 30.0, 41.0, 36.0, 45.0, 43.0, 47.0, 28.0, 29.0, 46.0, 47.0, 35.0, 33.0, 31.0, 20.0, 23.0, 29.0, 21.0, 28.0, 17.0, 14.0, 11.0, 8.0, 11.0, 7.0, 1.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009077787399291992, -0.0008791247382760048, -0.0008504707366228104, -0.0008218167349696159, -0.0007931627333164215, -0.0007645087316632271, -0.0007358547300100327, -0.0007072007283568382, -0.0006785467267036438, -0.0006498927250504494, -0.0006212387233972549, -0.0005925847217440605, -0.0005639307200908661, -0.0005352767184376717, -0.0005066227167844772, -0.0004779687151312828, -0.0004493147134780884, -0.00042066071182489395, -0.0003920067101716995, -0.0003633527085185051, -0.00033469870686531067, -0.00030604470521211624, -0.0002773907035589218, -0.0002487367019057274, -0.00022008270025253296, -0.00019142869859933853, -0.0001627746969461441, -0.00013412069529294968, -0.00010546669363975525, -7.681269198656082e-05, -4.8158690333366394e-05, -1.9504688680171967e-05, 9.149312973022461e-06, 3.780331462621689e-05, 6.645731627941132e-05, 9.511131793260574e-05, 0.00012376531958580017, 0.0001524193212389946, 0.00018107332289218903, 0.00020972732454538345, 0.00023838132619857788, 0.0002670353278517723, 0.00029568932950496674, 0.00032434333115816116, 0.0003529973328113556, 0.00038165133446455, 0.00041030533611774445, 0.0004389593377709389, 0.0004676133394241333, 0.0004962673410773277, 0.0005249213427305222, 0.0005535753443837166, 0.000582229346036911, 0.0006108833476901054, 0.0006395373493432999, 0.0006681913509964943, 0.0006968453526496887, 0.0007254993543028831, 0.0007541533559560776, 0.000782807357609272, 0.0008114613592624664, 0.0008401153609156609, 0.0008687693625688553, 0.0008974233642220497, 0.0009260773658752441]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 10.0, 7.0, 17.0, 20.0, 16.0, 21.0, 19.0, 30.0, 25.0, 34.0, 29.0, 31.0, 39.0, 41.0, 36.0, 35.0, 46.0, 43.0, 48.0, 39.0, 37.0, 40.0, 32.0, 29.0, 37.0, 29.0, 35.0, 21.0, 23.0, 11.0, 15.0, 21.0, 9.0, 9.0, 13.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.68359375, -6.48138427734375, -6.2791748046875, -6.07696533203125, -5.874755859375, -5.67254638671875, -5.4703369140625, -5.26812744140625, -5.06591796875, -4.86370849609375, -4.6614990234375, -4.45928955078125, -4.257080078125, -4.05487060546875, -3.8526611328125, -3.65045166015625, -3.4482421875, -3.24603271484375, -3.0438232421875, -2.84161376953125, -2.639404296875, -2.43719482421875, -2.2349853515625, -2.03277587890625, -1.83056640625, -1.62835693359375, -1.4261474609375, -1.22393798828125, -1.021728515625, -0.81951904296875, -0.6173095703125, -0.41510009765625, -0.212890625, -0.01068115234375, 0.1915283203125, 0.39373779296875, 0.595947265625, 0.79815673828125, 1.0003662109375, 1.20257568359375, 1.40478515625, 1.60699462890625, 1.8092041015625, 2.01141357421875, 2.213623046875, 2.41583251953125, 2.6180419921875, 2.82025146484375, 3.0224609375, 3.22467041015625, 3.4268798828125, 3.62908935546875, 3.831298828125, 4.03350830078125, 4.2357177734375, 4.43792724609375, 4.64013671875, 4.84234619140625, 5.0445556640625, 5.24676513671875, 5.448974609375, 5.65118408203125, 5.8533935546875, 6.05560302734375, 6.2578125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 9.0, 11.0, 17.0, 33.0, 39.0, 67.0, 84.0, 111.0, 182.0, 260.0, 384.0, 609.0, 851.0, 1277.0, 1856.0, 2898.0, 4496.0, 7324.0, 12885.0, 26989.0, 73030.0, 301512.0, 442315.0, 99486.0, 33646.0, 15385.0, 8154.0, 5000.0, 3213.0, 2102.0, 1374.0, 934.0, 647.0, 424.0, 313.0, 183.0, 137.0, 92.0, 77.0, 42.0, 35.0, 18.0, 18.0, 10.0, 3.0, 10.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.23046875, -5.07257080078125, -4.9146728515625, -4.75677490234375, -4.598876953125, -4.44097900390625, -4.2830810546875, -4.12518310546875, -3.96728515625, -3.80938720703125, -3.6514892578125, -3.49359130859375, -3.335693359375, -3.17779541015625, -3.0198974609375, -2.86199951171875, -2.7041015625, -2.54620361328125, -2.3883056640625, -2.23040771484375, -2.072509765625, -1.91461181640625, -1.7567138671875, -1.59881591796875, -1.44091796875, -1.28302001953125, -1.1251220703125, -0.96722412109375, -0.809326171875, -0.65142822265625, -0.4935302734375, -0.33563232421875, -0.177734375, -0.01983642578125, 0.1380615234375, 0.29595947265625, 0.453857421875, 0.61175537109375, 0.7696533203125, 0.92755126953125, 1.08544921875, 1.24334716796875, 1.4012451171875, 1.55914306640625, 1.717041015625, 1.87493896484375, 2.0328369140625, 2.19073486328125, 2.3486328125, 2.50653076171875, 2.6644287109375, 2.82232666015625, 2.980224609375, 3.13812255859375, 3.2960205078125, 3.45391845703125, 3.61181640625, 3.76971435546875, 3.9276123046875, 4.08551025390625, 4.243408203125, 4.40130615234375, 4.5592041015625, 4.71710205078125, 4.875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 11.0, 3.0, 5.0, 6.0, 13.0, 10.0, 20.0, 15.0, 17.0, 22.0, 25.0, 38.0, 30.0, 38.0, 33.0, 35.0, 47.0, 52.0, 76.0, 222.0, 1708.0, 160.0, 65.0, 38.0, 37.0, 47.0, 36.0, 34.0, 34.0, 24.0, 28.0, 26.0, 20.0, 15.0, 13.0, 20.0, 4.0, 7.0, 4.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-27.734375, -26.991455078125, -26.24853515625, -25.505615234375, -24.7626953125, -24.019775390625, -23.27685546875, -22.533935546875, -21.791015625, -21.048095703125, -20.30517578125, -19.562255859375, -18.8193359375, -18.076416015625, -17.33349609375, -16.590576171875, -15.84765625, -15.104736328125, -14.36181640625, -13.618896484375, -12.8759765625, -12.133056640625, -11.39013671875, -10.647216796875, -9.904296875, -9.161376953125, -8.41845703125, -7.675537109375, -6.9326171875, -6.189697265625, -5.44677734375, -4.703857421875, -3.9609375, -3.218017578125, -2.47509765625, -1.732177734375, -0.9892578125, -0.246337890625, 0.49658203125, 1.239501953125, 1.982421875, 2.725341796875, 3.46826171875, 4.211181640625, 4.9541015625, 5.697021484375, 6.43994140625, 7.182861328125, 7.92578125, 8.668701171875, 9.41162109375, 10.154541015625, 10.8974609375, 11.640380859375, 12.38330078125, 13.126220703125, 13.869140625, 14.612060546875, 15.35498046875, 16.097900390625, 16.8408203125, 17.583740234375, 18.32666015625, 19.069580078125, 19.8125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 9.0, 6.0, 8.0, 14.0, 19.0, 21.0, 39.0, 35.0, 37.0, 54.0, 90.0, 136.0, 211.0, 309.0, 880.0, 7277.0, 2919289.0, 212619.0, 3169.0, 592.0, 271.0, 181.0, 115.0, 71.0, 66.0, 46.0, 25.0, 29.0, 21.0, 17.0, 13.0, 7.0, 4.0, 10.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.375, -45.7880859375, -44.201171875, -42.6142578125, -41.02734375, -39.4404296875, -37.853515625, -36.2666015625, -34.6796875, -33.0927734375, -31.505859375, -29.9189453125, -28.33203125, -26.7451171875, -25.158203125, -23.5712890625, -21.984375, -20.3974609375, -18.810546875, -17.2236328125, -15.63671875, -14.0498046875, -12.462890625, -10.8759765625, -9.2890625, -7.7021484375, -6.115234375, -4.5283203125, -2.94140625, -1.3544921875, 0.232421875, 1.8193359375, 3.40625, 4.9931640625, 6.580078125, 8.1669921875, 9.75390625, 11.3408203125, 12.927734375, 14.5146484375, 16.1015625, 17.6884765625, 19.275390625, 20.8623046875, 22.44921875, 24.0361328125, 25.623046875, 27.2099609375, 28.796875, 30.3837890625, 31.970703125, 33.5576171875, 35.14453125, 36.7314453125, 38.318359375, 39.9052734375, 41.4921875, 43.0791015625, 44.666015625, 46.2529296875, 47.83984375, 49.4267578125, 51.013671875, 52.6005859375, 54.1875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 111.0, 324.0, 400.0, 127.0, 30.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.56564712524414, -19.198305130004883, -16.830963134765625, -14.463619232177734, -12.096277236938477, -9.728935241699219, -7.3615922927856445, -4.99424934387207, -2.6269073486328125, -0.2595648765563965, 2.1077775955200195, 4.4751200675964355, 6.842462539672852, 9.20980453491211, 11.577147483825684, 13.944490432739258, 16.311832427978516, 18.679174423217773, 21.04651641845703, 23.413860321044922, 25.78120231628418, 28.148544311523438, 30.515888214111328, 32.88323211669922, 35.250572204589844, 37.617916107177734, 39.98525619506836, 42.35260009765625, 44.719940185546875, 47.087284088134766, 49.454627990722656, 51.82196807861328, 54.18931579589844, 56.55665969848633, 58.92399978637695, 61.291343688964844, 63.65868377685547, 66.02603149414062, 68.39337158203125, 70.76071166992188, 73.1280517578125, 75.49539184570312, 77.86273956298828, 80.2300796508789, 82.59741973876953, 84.96476745605469, 87.33210754394531, 89.69944763183594, 92.0667953491211, 94.43413543701172, 96.80148315429688, 99.1688232421875, 101.53616333007812, 103.90350341796875, 106.2708511352539, 108.63819122314453, 111.00553894042969, 113.37287902832031, 115.74022674560547, 118.1075668334961, 120.47490692138672, 122.84225463867188, 125.2095947265625, 127.57693481445312, 129.94427490234375]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 3.0, 5.0, 5.0, 6.0, 7.0, 17.0, 21.0, 20.0, 19.0, 28.0, 18.0, 34.0, 25.0, 27.0, 35.0, 35.0, 28.0, 37.0, 49.0, 44.0, 41.0, 32.0, 34.0, 39.0, 34.0, 36.0, 31.0, 32.0, 35.0, 31.0, 28.0, 25.0, 19.0, 11.0, 24.0, 14.0, 8.0, 9.0, 8.0, 11.0, 11.0, 7.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-73.367431640625, -71.26718139648438, -69.16693115234375, -67.06668090820312, -64.9664306640625, -62.866180419921875, -60.765933990478516, -58.66568374633789, -56.565433502197266, -54.46518325805664, -52.364933013916016, -50.26468276977539, -48.16443634033203, -46.064186096191406, -43.96393585205078, -41.863685607910156, -39.76343536376953, -37.663185119628906, -35.56293487548828, -33.462684631347656, -31.362436294555664, -29.26218605041504, -27.161937713623047, -25.061687469482422, -22.961437225341797, -20.861186981201172, -18.760936737060547, -16.660688400268555, -14.56043815612793, -12.460187911987305, -10.359938621520996, -8.259689331054688, -6.159431457519531, -4.0591816902160645, -1.9589319229125977, 0.14131784439086914, 2.241567611694336, 4.341817855834961, 6.4420671463012695, 8.542316436767578, 10.642566680908203, 12.742816925048828, 14.843066215515137, 16.943315505981445, 19.04356575012207, 21.143815994262695, 23.244064331054688, 25.344314575195312, 27.444564819335938, 29.544815063476562, 31.645065307617188, 33.74531555175781, 35.84556579589844, 37.94581604003906, 40.04606246948242, 42.14631271362305, 44.24656295776367, 46.3468132019043, 48.44706344604492, 50.54731369018555, 52.647560119628906, 54.74781036376953, 56.848060607910156, 58.94831085205078, 61.048561096191406]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 8.0, 14.0, 9.0, 20.0, 13.0, 10.0, 20.0, 12.0, 28.0, 28.0, 33.0, 30.0, 31.0, 32.0, 38.0, 33.0, 41.0, 32.0, 41.0, 54.0, 37.0, 34.0, 41.0, 36.0, 32.0, 29.0, 30.0, 28.0, 35.0, 21.0, 17.0, 23.0, 16.0, 14.0, 16.0, 9.0, 10.0, 8.0, 9.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.7421875, -6.54388427734375, -6.3455810546875, -6.14727783203125, -5.948974609375, -5.75067138671875, -5.5523681640625, -5.35406494140625, -5.15576171875, -4.95745849609375, -4.7591552734375, -4.56085205078125, -4.362548828125, -4.16424560546875, -3.9659423828125, -3.76763916015625, -3.5693359375, -3.37103271484375, -3.1727294921875, -2.97442626953125, -2.776123046875, -2.57781982421875, -2.3795166015625, -2.18121337890625, -1.98291015625, -1.78460693359375, -1.5863037109375, -1.38800048828125, -1.189697265625, -0.99139404296875, -0.7930908203125, -0.59478759765625, -0.396484375, -0.19818115234375, 0.0001220703125, 0.19842529296875, 0.396728515625, 0.59503173828125, 0.7933349609375, 0.99163818359375, 1.18994140625, 1.38824462890625, 1.5865478515625, 1.78485107421875, 1.983154296875, 2.18145751953125, 2.3797607421875, 2.57806396484375, 2.7763671875, 2.97467041015625, 3.1729736328125, 3.37127685546875, 3.569580078125, 3.76788330078125, 3.9661865234375, 4.16448974609375, 4.36279296875, 4.56109619140625, 4.7593994140625, 4.95770263671875, 5.156005859375, 5.35430908203125, 5.5526123046875, 5.75091552734375, 5.94921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 12.0, 17.0, 18.0, 22.0, 39.0, 55.0, 72.0, 100.0, 145.0, 258.0, 425.0, 739.0, 1381.0, 2491.0, 5022.0, 10919.0, 27431.0, 81999.0, 297956.0, 943012.0, 1503351.0, 904241.0, 289908.0, 77680.0, 26095.0, 10496.0, 4789.0, 2444.0, 1284.0, 709.0, 446.0, 245.0, 144.0, 90.0, 64.0, 38.0, 46.0, 30.0, 21.0, 13.0, 12.0, 6.0, 4.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.83526611328125, -7.6080322265625, -7.38079833984375, -7.153564453125, -6.92633056640625, -6.6990966796875, -6.47186279296875, -6.24462890625, -6.01739501953125, -5.7901611328125, -5.56292724609375, -5.335693359375, -5.10845947265625, -4.8812255859375, -4.65399169921875, -4.4267578125, -4.19952392578125, -3.9722900390625, -3.74505615234375, -3.517822265625, -3.29058837890625, -3.0633544921875, -2.83612060546875, -2.60888671875, -2.38165283203125, -2.1544189453125, -1.92718505859375, -1.699951171875, -1.47271728515625, -1.2454833984375, -1.01824951171875, -0.791015625, -0.56378173828125, -0.3365478515625, -0.10931396484375, 0.117919921875, 0.34515380859375, 0.5723876953125, 0.79962158203125, 1.02685546875, 1.25408935546875, 1.4813232421875, 1.70855712890625, 1.935791015625, 2.16302490234375, 2.3902587890625, 2.61749267578125, 2.8447265625, 3.07196044921875, 3.2991943359375, 3.52642822265625, 3.753662109375, 3.98089599609375, 4.2081298828125, 4.43536376953125, 4.66259765625, 4.88983154296875, 5.1170654296875, 5.34429931640625, 5.571533203125, 5.79876708984375, 6.0260009765625, 6.25323486328125, 6.48046875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 17.0, 17.0, 25.0, 41.0, 43.0, 50.0, 54.0, 82.0, 78.0, 122.0, 146.0, 209.0, 253.0, 281.0, 379.0, 396.0, 364.0, 312.0, 267.0, 202.0, 160.0, 118.0, 87.0, 75.0, 41.0, 61.0, 39.0, 31.0, 26.0, 21.0, 14.0, 6.0, 6.0, 12.0, 3.0, 2.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.015625, -14.5924072265625, -14.169189453125, -13.7459716796875, -13.32275390625, -12.8995361328125, -12.476318359375, -12.0531005859375, -11.6298828125, -11.2066650390625, -10.783447265625, -10.3602294921875, -9.93701171875, -9.5137939453125, -9.090576171875, -8.6673583984375, -8.244140625, -7.8209228515625, -7.397705078125, -6.9744873046875, -6.55126953125, -6.1280517578125, -5.704833984375, -5.2816162109375, -4.8583984375, -4.4351806640625, -4.011962890625, -3.5887451171875, -3.16552734375, -2.7423095703125, -2.319091796875, -1.8958740234375, -1.47265625, -1.0494384765625, -0.626220703125, -0.2030029296875, 0.22021484375, 0.6434326171875, 1.066650390625, 1.4898681640625, 1.9130859375, 2.3363037109375, 2.759521484375, 3.1827392578125, 3.60595703125, 4.0291748046875, 4.452392578125, 4.8756103515625, 5.298828125, 5.7220458984375, 6.145263671875, 6.5684814453125, 6.99169921875, 7.4149169921875, 7.838134765625, 8.2613525390625, 8.6845703125, 9.1077880859375, 9.531005859375, 9.9542236328125, 10.37744140625, 10.8006591796875, 11.223876953125, 11.6470947265625, 12.0703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 9.0, 13.0, 11.0, 29.0, 29.0, 32.0, 49.0, 66.0, 101.0, 138.0, 211.0, 388.0, 1128.0, 23521.0, 4022601.0, 142538.0, 2150.0, 490.0, 262.0, 154.0, 101.0, 52.0, 49.0, 46.0, 33.0, 20.0, 16.0, 13.0, 9.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.34375, -56.06982421875, -53.7958984375, -51.52197265625, -49.248046875, -46.97412109375, -44.7001953125, -42.42626953125, -40.15234375, -37.87841796875, -35.6044921875, -33.33056640625, -31.056640625, -28.78271484375, -26.5087890625, -24.23486328125, -21.9609375, -19.68701171875, -17.4130859375, -15.13916015625, -12.865234375, -10.59130859375, -8.3173828125, -6.04345703125, -3.76953125, -1.49560546875, 0.7783203125, 3.05224609375, 5.326171875, 7.60009765625, 9.8740234375, 12.14794921875, 14.421875, 16.69580078125, 18.9697265625, 21.24365234375, 23.517578125, 25.79150390625, 28.0654296875, 30.33935546875, 32.61328125, 34.88720703125, 37.1611328125, 39.43505859375, 41.708984375, 43.98291015625, 46.2568359375, 48.53076171875, 50.8046875, 53.07861328125, 55.3525390625, 57.62646484375, 59.900390625, 62.17431640625, 64.4482421875, 66.72216796875, 68.99609375, 71.27001953125, 73.5439453125, 75.81787109375, 78.091796875, 80.36572265625, 82.6396484375, 84.91357421875, 87.1875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 19.0, 30.0, 66.0, 103.0, 140.0, 195.0, 163.0, 125.0, 83.0, 47.0, 17.0, 11.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-136.95057678222656, -133.8875274658203, -130.824462890625, -127.76141357421875, -124.69835662841797, -121.63529968261719, -118.5722427368164, -115.50918579101562, -112.44612884521484, -109.38307189941406, -106.32001495361328, -103.2569580078125, -100.19390869140625, -97.13085174560547, -94.06779479980469, -91.0047378540039, -87.94168090820312, -84.87862396240234, -81.81556701660156, -78.75251770019531, -75.68946075439453, -72.62640380859375, -69.56334686279297, -66.50028991699219, -63.43724060058594, -60.374183654785156, -57.31113052368164, -54.24807357788086, -51.18501663208008, -48.12196350097656, -45.05890655517578, -41.995849609375, -38.932796478271484, -35.8697395324707, -32.80668640136719, -29.743629455566406, -26.680572509765625, -23.617517471313477, -20.554462432861328, -17.491405487060547, -14.428350448608398, -11.365294456481934, -8.302238464355469, -5.23918342590332, -2.1761274337768555, 0.8869285583496094, 3.949983596801758, 7.013040542602539, 10.076095581054688, 13.139151573181152, 16.202207565307617, 19.265262603759766, 22.328319549560547, 25.391374588012695, 28.454429626464844, 31.517486572265625, 34.580543518066406, 37.64360046386719, 40.7066535949707, 43.769710540771484, 46.832767486572266, 49.89582061767578, 52.95887756347656, 56.021934509277344, 59.08498764038086]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 12.0, 8.0, 12.0, 17.0, 17.0, 14.0, 14.0, 19.0, 32.0, 25.0, 27.0, 21.0, 29.0, 30.0, 30.0, 32.0, 42.0, 40.0, 33.0, 38.0, 35.0, 42.0, 42.0, 37.0, 29.0, 32.0, 29.0, 31.0, 25.0, 16.0, 21.0, 15.0, 18.0, 19.0, 14.0, 15.0, 5.0, 11.0, 12.0, 14.0, 2.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0], "bins": [-51.87261962890625, -50.37895202636719, -48.88528823852539, -47.391624450683594, -45.89795684814453, -44.40428924560547, -42.91062545776367, -41.416961669921875, -39.92329406738281, -38.42962646484375, -36.93596267700195, -35.442298889160156, -33.948631286621094, -32.45496368408203, -30.961299896240234, -29.467634201049805, -27.973968505859375, -26.480302810668945, -24.986637115478516, -23.492971420288086, -21.999305725097656, -20.505640029907227, -19.011974334716797, -17.518308639526367, -16.024642944335938, -14.530977249145508, -13.037311553955078, -11.543645858764648, -10.049980163574219, -8.556314468383789, -7.062648773193359, -5.56898307800293, -4.0753173828125, -2.5816516876220703, -1.0879859924316406, 0.40567970275878906, 1.8993453979492188, 3.3930110931396484, 4.886676788330078, 6.380342483520508, 7.8740081787109375, 9.367673873901367, 10.861339569091797, 12.355005264282227, 13.848670959472656, 15.342336654663086, 16.836002349853516, 18.329668045043945, 19.823333740234375, 21.316999435424805, 22.810665130615234, 24.304330825805664, 25.797996520996094, 27.291662216186523, 28.785327911376953, 30.278993606567383, 31.772659301757812, 33.266326904296875, 34.75999069213867, 36.25365447998047, 37.74732208251953, 39.240989685058594, 40.73465347290039, 42.22831726074219, 43.72198486328125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 15.0, 12.0, 13.0, 11.0, 11.0, 16.0, 19.0, 27.0, 33.0, 30.0, 39.0, 29.0, 32.0, 37.0, 49.0, 36.0, 32.0, 28.0, 39.0, 47.0, 37.0, 36.0, 35.0, 40.0, 33.0, 35.0, 29.0, 22.0, 19.0, 27.0, 18.0, 17.0, 14.0, 9.0, 12.0, 12.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.70703125, -6.5042724609375, -6.301513671875, -6.0987548828125, -5.89599609375, -5.6932373046875, -5.490478515625, -5.2877197265625, -5.0849609375, -4.8822021484375, -4.679443359375, -4.4766845703125, -4.27392578125, -4.0711669921875, -3.868408203125, -3.6656494140625, -3.462890625, -3.2601318359375, -3.057373046875, -2.8546142578125, -2.65185546875, -2.4490966796875, -2.246337890625, -2.0435791015625, -1.8408203125, -1.6380615234375, -1.435302734375, -1.2325439453125, -1.02978515625, -0.8270263671875, -0.624267578125, -0.4215087890625, -0.21875, -0.0159912109375, 0.186767578125, 0.3895263671875, 0.59228515625, 0.7950439453125, 0.997802734375, 1.2005615234375, 1.4033203125, 1.6060791015625, 1.808837890625, 2.0115966796875, 2.21435546875, 2.4171142578125, 2.619873046875, 2.8226318359375, 3.025390625, 3.2281494140625, 3.430908203125, 3.6336669921875, 3.83642578125, 4.0391845703125, 4.241943359375, 4.4447021484375, 4.6474609375, 4.8502197265625, 5.052978515625, 5.2557373046875, 5.45849609375, 5.6612548828125, 5.864013671875, 6.0667724609375, 6.26953125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 11.0, 4.0, 20.0, 40.0, 37.0, 48.0, 77.0, 101.0, 153.0, 233.0, 341.0, 466.0, 654.0, 1014.0, 1497.0, 2048.0, 3012.0, 4218.0, 6172.0, 8682.0, 12628.0, 17771.0, 26541.0, 38487.0, 56806.0, 83962.0, 124107.0, 173788.0, 155264.0, 104948.0, 71257.0, 47931.0, 33047.0, 22203.0, 15215.0, 10780.0, 7659.0, 5198.0, 3748.0, 2582.0, 1738.0, 1191.0, 855.0, 616.0, 447.0, 328.0, 188.0, 148.0, 110.0, 75.0, 39.0, 29.0, 20.0, 7.0, 8.0, 8.0, 5.0, 3.0, 4.0], "bins": [-0.80078125, -0.7763595581054688, -0.7519378662109375, -0.7275161743164062, -0.703094482421875, -0.6786727905273438, -0.6542510986328125, -0.6298294067382812, -0.60540771484375, -0.5809860229492188, -0.5565643310546875, -0.5321426391601562, -0.507720947265625, -0.48329925537109375, -0.4588775634765625, -0.43445587158203125, -0.4100341796875, -0.38561248779296875, -0.3611907958984375, -0.33676910400390625, -0.312347412109375, -0.28792572021484375, -0.2635040283203125, -0.23908233642578125, -0.21466064453125, -0.19023895263671875, -0.1658172607421875, -0.14139556884765625, -0.116973876953125, -0.09255218505859375, -0.0681304931640625, -0.04370880126953125, -0.019287109375, 0.00513458251953125, 0.0295562744140625, 0.05397796630859375, 0.078399658203125, 0.10282135009765625, 0.1272430419921875, 0.15166473388671875, 0.17608642578125, 0.20050811767578125, 0.2249298095703125, 0.24935150146484375, 0.273773193359375, 0.29819488525390625, 0.3226165771484375, 0.34703826904296875, 0.3714599609375, 0.39588165283203125, 0.4203033447265625, 0.44472503662109375, 0.469146728515625, 0.49356842041015625, 0.5179901123046875, 0.5424118041992188, 0.56683349609375, 0.5912551879882812, 0.6156768798828125, 0.6400985717773438, 0.664520263671875, 0.6889419555664062, 0.7133636474609375, 0.7377853393554688, 0.76220703125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 5.0, 6.0, 8.0, 5.0, 9.0, 14.0, 11.0, 13.0, 16.0, 15.0, 18.0, 20.0, 33.0, 32.0, 30.0, 33.0, 44.0, 35.0, 31.0, 39.0, 30.0, 1067.0, 44.0, 43.0, 40.0, 42.0, 32.0, 28.0, 29.0, 29.0, 29.0, 29.0, 22.0, 27.0, 24.0, 18.0, 11.0, 12.0, 10.0, 10.0, 11.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.21875, -4.09466552734375, -3.9705810546875, -3.84649658203125, -3.722412109375, -3.59832763671875, -3.4742431640625, -3.35015869140625, -3.22607421875, -3.10198974609375, -2.9779052734375, -2.85382080078125, -2.729736328125, -2.60565185546875, -2.4815673828125, -2.35748291015625, -2.2333984375, -2.10931396484375, -1.9852294921875, -1.86114501953125, -1.737060546875, -1.61297607421875, -1.4888916015625, -1.36480712890625, -1.24072265625, -1.11663818359375, -0.9925537109375, -0.86846923828125, -0.744384765625, -0.62030029296875, -0.4962158203125, -0.37213134765625, -0.248046875, -0.12396240234375, 0.0001220703125, 0.12420654296875, 0.248291015625, 0.37237548828125, 0.4964599609375, 0.62054443359375, 0.74462890625, 0.86871337890625, 0.9927978515625, 1.11688232421875, 1.240966796875, 1.36505126953125, 1.4891357421875, 1.61322021484375, 1.7373046875, 1.86138916015625, 1.9854736328125, 2.10955810546875, 2.233642578125, 2.35772705078125, 2.4818115234375, 2.60589599609375, 2.72998046875, 2.85406494140625, 2.9781494140625, 3.10223388671875, 3.226318359375, 3.35040283203125, 3.4744873046875, 3.59857177734375, 3.72265625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 2.0, 11.0, 13.0, 18.0, 31.0, 29.0, 43.0, 67.0, 120.0, 159.0, 289.0, 413.0, 707.0, 987.0, 1595.0, 2362.0, 3672.0, 6031.0, 9601.0, 15319.0, 24954.0, 40471.0, 66298.0, 107691.0, 173559.0, 1263729.0, 144575.0, 89822.0, 55249.0, 34149.0, 20543.0, 12711.0, 7922.0, 5064.0, 3121.0, 2055.0, 1247.0, 884.0, 574.0, 372.0, 204.0, 156.0, 114.0, 71.0, 52.0, 25.0, 20.0, 14.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.8642578125, -0.8375091552734375, -0.810760498046875, -0.7840118408203125, -0.75726318359375, -0.7305145263671875, -0.703765869140625, -0.6770172119140625, -0.6502685546875, -0.6235198974609375, -0.596771240234375, -0.5700225830078125, -0.54327392578125, -0.5165252685546875, -0.489776611328125, -0.4630279541015625, -0.436279296875, -0.4095306396484375, -0.382781982421875, -0.3560333251953125, -0.32928466796875, -0.3025360107421875, -0.275787353515625, -0.2490386962890625, -0.2222900390625, -0.1955413818359375, -0.168792724609375, -0.1420440673828125, -0.11529541015625, -0.0885467529296875, -0.061798095703125, -0.0350494384765625, -0.00830078125, 0.0184478759765625, 0.045196533203125, 0.0719451904296875, 0.09869384765625, 0.1254425048828125, 0.152191162109375, 0.1789398193359375, 0.2056884765625, 0.2324371337890625, 0.259185791015625, 0.2859344482421875, 0.31268310546875, 0.3394317626953125, 0.366180419921875, 0.3929290771484375, 0.419677734375, 0.4464263916015625, 0.473175048828125, 0.4999237060546875, 0.52667236328125, 0.5534210205078125, 0.580169677734375, 0.6069183349609375, 0.6336669921875, 0.6604156494140625, 0.687164306640625, 0.7139129638671875, 0.74066162109375, 0.7674102783203125, 0.794158935546875, 0.8209075927734375, 0.84765625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 8.0, 11.0, 14.0, 7.0, 10.0, 16.0, 18.0, 19.0, 30.0, 34.0, 41.0, 38.0, 49.0, 50.0, 45.0, 58.0, 53.0, 55.0, 41.0, 32.0, 50.0, 51.0, 33.0, 32.0, 33.0, 27.0, 16.0, 30.0, 20.0, 14.0, 15.0, 12.0, 5.0, 3.0, 3.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015764236450195312, -0.0015301108360290527, -0.0014837980270385742, -0.0014374852180480957, -0.0013911724090576172, -0.0013448596000671387, -0.0012985467910766602, -0.0012522339820861816, -0.0012059211730957031, -0.0011596083641052246, -0.001113295555114746, -0.0010669827461242676, -0.001020669937133789, -0.0009743571281433105, -0.000928044319152832, -0.0008817315101623535, -0.000835418701171875, -0.0007891058921813965, -0.000742793083190918, -0.0006964802742004395, -0.0006501674652099609, -0.0006038546562194824, -0.0005575418472290039, -0.0005112290382385254, -0.0004649162292480469, -0.00041860342025756836, -0.00037229061126708984, -0.00032597780227661133, -0.0002796649932861328, -0.0002333521842956543, -0.00018703937530517578, -0.00014072656631469727, -9.441375732421875e-05, -4.8100948333740234e-05, -1.7881393432617188e-06, 4.45246696472168e-05, 9.083747863769531e-05, 0.00013715028762817383, 0.00018346309661865234, 0.00022977590560913086, 0.0002760887145996094, 0.0003224015235900879, 0.0003687143325805664, 0.0004150271415710449, 0.00046133995056152344, 0.000507652759552002, 0.0005539655685424805, 0.000600278377532959, 0.0006465911865234375, 0.000692903995513916, 0.0007392168045043945, 0.000785529613494873, 0.0008318424224853516, 0.0008781552314758301, 0.0009244680404663086, 0.0009707808494567871, 0.0010170936584472656, 0.0010634064674377441, 0.0011097192764282227, 0.0011560320854187012, 0.0012023448944091797, 0.0012486577033996582, 0.0012949705123901367, 0.0013412833213806152, 0.0013875961303710938]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 2.0, 8.0, 2.0, 11.0, 6.0, 5.0, 12.0, 20.0, 25.0, 18.0, 22.0, 24.0, 46.0, 55.0, 74.0, 139.0, 258.0, 485.0, 1601.0, 974583.0, 69334.0, 835.0, 370.0, 201.0, 121.0, 71.0, 45.0, 39.0, 23.0, 23.0, 23.0, 11.0, 11.0, 9.0, 9.0, 9.0, 4.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033905029296875, -0.03272819519042969, -0.031551361083984375, -0.030374526977539062, -0.02919769287109375, -0.028020858764648438, -0.026844024658203125, -0.025667190551757812, -0.0244903564453125, -0.023313522338867188, -0.022136688232421875, -0.020959854125976562, -0.01978302001953125, -0.018606185913085938, -0.017429351806640625, -0.016252517700195312, -0.01507568359375, -0.013898849487304688, -0.012722015380859375, -0.011545181274414062, -0.01036834716796875, -0.009191513061523438, -0.008014678955078125, -0.0068378448486328125, -0.0056610107421875, -0.0044841766357421875, -0.003307342529296875, -0.0021305084228515625, -0.00095367431640625, 0.0002231597900390625, 0.001399993896484375, 0.0025768280029296875, 0.003753662109375, 0.0049304962158203125, 0.006107330322265625, 0.0072841644287109375, 0.00846099853515625, 0.009637832641601562, 0.010814666748046875, 0.011991500854492188, 0.0131683349609375, 0.014345169067382812, 0.015522003173828125, 0.016698837280273438, 0.01787567138671875, 0.019052505493164062, 0.020229339599609375, 0.021406173706054688, 0.0225830078125, 0.023759841918945312, 0.024936676025390625, 0.026113510131835938, 0.02729034423828125, 0.028467178344726562, 0.029644012451171875, 0.030820846557617188, 0.0319976806640625, 0.03317451477050781, 0.034351348876953125, 0.03552818298339844, 0.03670501708984375, 0.03788185119628906, 0.039058685302734375, 0.04023551940917969, 0.041412353515625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 21.0, 145.0, 488.0, 298.0, 55.0, 8.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024785022251307964, -0.0023590559139847755, -0.0022396096028387547, -0.0021201632916927338, -0.002000716980546713, -0.001881270669400692, -0.001761824358254671, -0.0016423780471086502, -0.0015229317359626293, -0.0014034854248166084, -0.0012840391136705875, -0.0011645928025245667, -0.0010451464913785458, -0.0009257001802325249, -0.000806253869086504, -0.0006868075579404831, -0.0005673612467944622, -0.0004479149356484413, -0.0003284686245024204, -0.00020902231335639954, -8.957600221037865e-05, 2.9870308935642242e-05, 0.00014931662008166313, 0.000268762931227684, 0.0003882092423737049, 0.0005076555535197258, 0.0006271018646657467, 0.0007465481758117676, 0.0008659944869577885, 0.0009854407981038094, 0.0011048871092498302, 0.0012243334203958511, 0.001343779731541872, 0.001463226042687893, 0.0015826723538339138, 0.0017021186649799347, 0.0018215649761259556, 0.0019410112872719765, 0.0020604575984179974, 0.0021799039095640182, 0.002299350220710039, 0.00241879653185606, 0.002538242843002081, 0.002657689154148102, 0.0027771354652941227, 0.0028965817764401436, 0.0030160280875861645, 0.0031354743987321854, 0.0032549207098782063, 0.003374367021024227, 0.003493813332170248, 0.003613259643316269, 0.00373270595446229, 0.0038521522656083107, 0.003971598576754332, 0.0040910448879003525, 0.004210491199046373, 0.004329937510192394, 0.004449383821338415, 0.004568830132484436, 0.004688276443630457, 0.004807722754776478, 0.004927169065922499, 0.00504661537706852, 0.0051660616882145405]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 8.0, 5.0, 13.0, 11.0, 14.0, 19.0, 18.0, 16.0, 23.0, 26.0, 18.0, 25.0, 33.0, 30.0, 27.0, 39.0, 26.0, 34.0, 34.0, 32.0, 45.0, 36.0, 46.0, 33.0, 35.0, 33.0, 26.0, 32.0, 23.0, 25.0, 26.0, 26.0, 21.0, 20.0, 14.0, 10.0, 14.0, 9.0, 12.0, 6.0, 9.0, 3.0, 10.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.0006586909294128418, -0.0006370516493916512, -0.0006154123693704605, -0.0005937730893492699, -0.0005721338093280792, -0.0005504945293068886, -0.0005288552492856979, -0.0005072159692645073, -0.00048557668924331665, -0.000463937409222126, -0.00044229812920093536, -0.0004206588491797447, -0.0003990195691585541, -0.00037738028913736343, -0.0003557410091161728, -0.00033410172909498215, -0.0003124624490737915, -0.00029082316905260086, -0.0002691838890314102, -0.0002475446090102196, -0.00022590532898902893, -0.0002042660489678383, -0.00018262676894664764, -0.000160987488925457, -0.00013934820890426636, -0.00011770892888307571, -9.606964886188507e-05, -7.443036884069443e-05, -5.2791088819503784e-05, -3.115180879831314e-05, -9.512528777122498e-06, 1.2126751244068146e-05, 3.376603126525879e-05, 5.540531128644943e-05, 7.704459130764008e-05, 9.868387132883072e-05, 0.00012032315135002136, 0.000141962431371212, 0.00016360171139240265, 0.0001852409914135933, 0.00020688027143478394, 0.00022851955145597458, 0.0002501588314771652, 0.00027179811149835587, 0.0002934373915195465, 0.00031507667154073715, 0.0003367159515619278, 0.00035835523158311844, 0.0003799945116043091, 0.0004016337916254997, 0.00042327307164669037, 0.000444912351667881, 0.00046655163168907166, 0.0004881909117102623, 0.0005098301917314529, 0.0005314694717526436, 0.0005531087517738342, 0.0005747480317950249, 0.0005963873118162155, 0.0006180265918374062, 0.0006396658718585968, 0.0006613051518797874, 0.0006829444319009781, 0.0007045837119221687, 0.0007262229919433594]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 15.0, 12.0, 13.0, 11.0, 11.0, 16.0, 19.0, 27.0, 33.0, 30.0, 39.0, 29.0, 32.0, 37.0, 49.0, 36.0, 32.0, 28.0, 39.0, 47.0, 37.0, 36.0, 35.0, 40.0, 33.0, 35.0, 29.0, 22.0, 19.0, 27.0, 18.0, 17.0, 14.0, 9.0, 12.0, 12.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.70703125, -6.5042724609375, -6.301513671875, -6.0987548828125, -5.89599609375, -5.6932373046875, -5.490478515625, -5.2877197265625, -5.0849609375, -4.8822021484375, -4.679443359375, -4.4766845703125, -4.27392578125, -4.0711669921875, -3.868408203125, -3.6656494140625, -3.462890625, -3.2601318359375, -3.057373046875, -2.8546142578125, -2.65185546875, -2.4490966796875, -2.246337890625, -2.0435791015625, -1.8408203125, -1.6380615234375, -1.435302734375, -1.2325439453125, -1.02978515625, -0.8270263671875, -0.624267578125, -0.4215087890625, -0.21875, -0.0159912109375, 0.186767578125, 0.3895263671875, 0.59228515625, 0.7950439453125, 0.997802734375, 1.2005615234375, 1.4033203125, 1.6060791015625, 1.808837890625, 2.0115966796875, 2.21435546875, 2.4171142578125, 2.619873046875, 2.8226318359375, 3.025390625, 3.2281494140625, 3.430908203125, 3.6336669921875, 3.83642578125, 4.0391845703125, 4.241943359375, 4.4447021484375, 4.6474609375, 4.8502197265625, 5.052978515625, 5.2557373046875, 5.45849609375, 5.6612548828125, 5.864013671875, 6.0667724609375, 6.26953125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 2.0, 15.0, 8.0, 28.0, 27.0, 36.0, 47.0, 62.0, 105.0, 158.0, 262.0, 386.0, 556.0, 848.0, 1326.0, 2264.0, 4325.0, 8776.0, 20464.0, 54509.0, 180705.0, 461629.0, 207498.0, 61177.0, 22498.0, 9685.0, 4663.0, 2459.0, 1408.0, 871.0, 571.0, 388.0, 229.0, 180.0, 104.0, 83.0, 52.0, 36.0, 28.0, 23.0, 11.0, 10.0, 9.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.66015625, -4.50762939453125, -4.3551025390625, -4.20257568359375, -4.050048828125, -3.89752197265625, -3.7449951171875, -3.59246826171875, -3.43994140625, -3.28741455078125, -3.1348876953125, -2.98236083984375, -2.829833984375, -2.67730712890625, -2.5247802734375, -2.37225341796875, -2.2197265625, -2.06719970703125, -1.9146728515625, -1.76214599609375, -1.609619140625, -1.45709228515625, -1.3045654296875, -1.15203857421875, -0.99951171875, -0.84698486328125, -0.6944580078125, -0.54193115234375, -0.389404296875, -0.23687744140625, -0.0843505859375, 0.06817626953125, 0.220703125, 0.37322998046875, 0.5257568359375, 0.67828369140625, 0.830810546875, 0.98333740234375, 1.1358642578125, 1.28839111328125, 1.44091796875, 1.59344482421875, 1.7459716796875, 1.89849853515625, 2.051025390625, 2.20355224609375, 2.3560791015625, 2.50860595703125, 2.6611328125, 2.81365966796875, 2.9661865234375, 3.11871337890625, 3.271240234375, 3.42376708984375, 3.5762939453125, 3.72882080078125, 3.88134765625, 4.03387451171875, 4.1864013671875, 4.33892822265625, 4.491455078125, 4.64398193359375, 4.7965087890625, 4.94903564453125, 5.1015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 5.0, 5.0, 9.0, 20.0, 22.0, 20.0, 18.0, 23.0, 34.0, 31.0, 47.0, 42.0, 43.0, 57.0, 69.0, 175.0, 1774.0, 157.0, 70.0, 65.0, 48.0, 45.0, 31.0, 40.0, 22.0, 32.0, 21.0, 20.0, 16.0, 14.0, 11.0, 11.0, 11.0, 5.0, 5.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.375, -25.562744140625, -24.75048828125, -23.938232421875, -23.1259765625, -22.313720703125, -21.50146484375, -20.689208984375, -19.876953125, -19.064697265625, -18.25244140625, -17.440185546875, -16.6279296875, -15.815673828125, -15.00341796875, -14.191162109375, -13.37890625, -12.566650390625, -11.75439453125, -10.942138671875, -10.1298828125, -9.317626953125, -8.50537109375, -7.693115234375, -6.880859375, -6.068603515625, -5.25634765625, -4.444091796875, -3.6318359375, -2.819580078125, -2.00732421875, -1.195068359375, -0.3828125, 0.429443359375, 1.24169921875, 2.053955078125, 2.8662109375, 3.678466796875, 4.49072265625, 5.302978515625, 6.115234375, 6.927490234375, 7.73974609375, 8.552001953125, 9.3642578125, 10.176513671875, 10.98876953125, 11.801025390625, 12.61328125, 13.425537109375, 14.23779296875, 15.050048828125, 15.8623046875, 16.674560546875, 17.48681640625, 18.299072265625, 19.111328125, 19.923583984375, 20.73583984375, 21.548095703125, 22.3603515625, 23.172607421875, 23.98486328125, 24.797119140625, 25.609375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 12.0, 9.0, 14.0, 16.0, 16.0, 33.0, 23.0, 49.0, 47.0, 77.0, 92.0, 151.0, 173.0, 278.0, 569.0, 3793.0, 2950023.0, 187259.0, 1693.0, 448.0, 249.0, 190.0, 110.0, 73.0, 79.0, 40.0, 36.0, 31.0, 29.0, 20.0, 13.0, 9.0, 5.0, 10.0, 5.0, 7.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.15625, -49.49853515625, -47.8408203125, -46.18310546875, -44.525390625, -42.86767578125, -41.2099609375, -39.55224609375, -37.89453125, -36.23681640625, -34.5791015625, -32.92138671875, -31.263671875, -29.60595703125, -27.9482421875, -26.29052734375, -24.6328125, -22.97509765625, -21.3173828125, -19.65966796875, -18.001953125, -16.34423828125, -14.6865234375, -13.02880859375, -11.37109375, -9.71337890625, -8.0556640625, -6.39794921875, -4.740234375, -3.08251953125, -1.4248046875, 0.23291015625, 1.890625, 3.54833984375, 5.2060546875, 6.86376953125, 8.521484375, 10.17919921875, 11.8369140625, 13.49462890625, 15.15234375, 16.81005859375, 18.4677734375, 20.12548828125, 21.783203125, 23.44091796875, 25.0986328125, 26.75634765625, 28.4140625, 30.07177734375, 31.7294921875, 33.38720703125, 35.044921875, 36.70263671875, 38.3603515625, 40.01806640625, 41.67578125, 43.33349609375, 44.9912109375, 46.64892578125, 48.306640625, 49.96435546875, 51.6220703125, 53.27978515625, 54.9375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [344.0, 666.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9185028076171875, -0.8384151458740234, 5.241672515869141, 11.321760177612305, 17.40184783935547, 23.481935501098633, 29.562023162841797, 35.642112731933594, 41.722198486328125, 47.802284240722656, 53.88237380981445, 59.96246337890625, 66.04254913330078, 72.12263488769531, 78.20272827148438, 84.2828140258789, 90.36289978027344, 96.44298553466797, 102.5230712890625, 108.60316467285156, 114.6832504272461, 120.76333618164062, 126.84342956542969, 132.92352294921875, 139.00360107421875, 145.0836944580078, 151.1637725830078, 157.24386596679688, 163.32394409179688, 169.40403747558594, 175.484130859375, 181.564208984375, 187.64431762695312, 193.7244110107422, 199.8044891357422, 205.88458251953125, 211.96466064453125, 218.0447540283203, 224.12484741210938, 230.20492553710938, 236.28501892089844, 242.3651123046875, 248.4451904296875, 254.52528381347656, 260.6053771972656, 266.6854553222656, 272.7655334472656, 278.84564208984375, 284.92572021484375, 291.00579833984375, 297.0859069824219, 303.1659851074219, 309.2460632324219, 315.326171875, 321.40625, 327.486328125, 333.56640625, 339.646484375, 345.7265930175781, 351.8066711425781, 357.8867492675781, 363.96685791015625, 370.04693603515625, 376.12701416015625, 382.2071228027344]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 14.0, 5.0, 10.0, 11.0, 8.0, 8.0, 12.0, 13.0, 16.0, 21.0, 32.0, 35.0, 20.0, 27.0, 35.0, 24.0, 34.0, 24.0, 39.0, 39.0, 40.0, 33.0, 33.0, 36.0, 34.0, 38.0, 35.0, 30.0, 34.0, 31.0, 39.0, 19.0, 22.0, 19.0, 18.0, 17.0, 20.0, 9.0, 13.0, 9.0, 8.0, 6.0, 1.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-59.544830322265625, -57.8148307800293, -56.08483123779297, -54.35483169555664, -52.62483215332031, -50.894832611083984, -49.164833068847656, -47.43482971191406, -45.704833984375, -43.97483444213867, -42.244834899902344, -40.514835357666016, -38.78483581542969, -37.05483627319336, -35.32483673095703, -33.59483337402344, -31.86483383178711, -30.13483428955078, -28.404834747314453, -26.674835205078125, -24.944835662841797, -23.21483612060547, -21.484834671020508, -19.75483512878418, -18.02483558654785, -16.294836044311523, -14.564836502075195, -12.83483600616455, -11.104836463928223, -9.374836921691895, -7.64483642578125, -5.914836883544922, -4.184833526611328, -2.454833745956421, -0.7248339653015137, 1.0051660537719727, 2.735165596008301, 4.465165138244629, 6.195165634155273, 7.925165176391602, 9.65516471862793, 11.385164260864258, 13.115163803100586, 14.84516429901123, 16.575164794921875, 18.305164337158203, 20.03516387939453, 21.76516342163086, 23.495162963867188, 25.225162506103516, 26.955162048339844, 28.685161590576172, 30.4151611328125, 32.14516067504883, 33.875160217285156, 35.60516357421875, 37.33515930175781, 39.06515884399414, 40.79515838623047, 42.5251579284668, 44.255157470703125, 45.98515701293945, 47.71515655517578, 49.445159912109375, 51.1751594543457]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 3.0, 14.0, 9.0, 10.0, 14.0, 15.0, 12.0, 19.0, 19.0, 22.0, 37.0, 34.0, 26.0, 23.0, 58.0, 37.0, 38.0, 36.0, 36.0, 42.0, 28.0, 43.0, 44.0, 32.0, 41.0, 30.0, 36.0, 27.0, 29.0, 24.0, 21.0, 28.0, 15.0, 19.0, 13.0, 9.0, 13.0, 6.0, 8.0, 11.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.0390625, -6.831298828125, -6.62353515625, -6.415771484375, -6.2080078125, -6.000244140625, -5.79248046875, -5.584716796875, -5.376953125, -5.169189453125, -4.96142578125, -4.753662109375, -4.5458984375, -4.338134765625, -4.13037109375, -3.922607421875, -3.71484375, -3.507080078125, -3.29931640625, -3.091552734375, -2.8837890625, -2.676025390625, -2.46826171875, -2.260498046875, -2.052734375, -1.844970703125, -1.63720703125, -1.429443359375, -1.2216796875, -1.013916015625, -0.80615234375, -0.598388671875, -0.390625, -0.182861328125, 0.02490234375, 0.232666015625, 0.4404296875, 0.648193359375, 0.85595703125, 1.063720703125, 1.271484375, 1.479248046875, 1.68701171875, 1.894775390625, 2.1025390625, 2.310302734375, 2.51806640625, 2.725830078125, 2.93359375, 3.141357421875, 3.34912109375, 3.556884765625, 3.7646484375, 3.972412109375, 4.18017578125, 4.387939453125, 4.595703125, 4.803466796875, 5.01123046875, 5.218994140625, 5.4267578125, 5.634521484375, 5.84228515625, 6.050048828125, 6.2578125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 4.0, 8.0, 14.0, 13.0, 15.0, 23.0, 8.0, 14.0, 29.0, 36.0, 20.0, 41.0, 56.0, 61.0, 102.0, 139.0, 493.0, 4409.0, 328102.0, 3801132.0, 56746.0, 1938.0, 327.0, 124.0, 70.0, 58.0, 57.0, 37.0, 25.0, 26.0, 31.0, 20.0, 12.0, 15.0, 13.0, 13.0, 8.0, 11.0, 3.0, 7.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-40.4375, -39.29345703125, -38.1494140625, -37.00537109375, -35.861328125, -34.71728515625, -33.5732421875, -32.42919921875, -31.28515625, -30.14111328125, -28.9970703125, -27.85302734375, -26.708984375, -25.56494140625, -24.4208984375, -23.27685546875, -22.1328125, -20.98876953125, -19.8447265625, -18.70068359375, -17.556640625, -16.41259765625, -15.2685546875, -14.12451171875, -12.98046875, -11.83642578125, -10.6923828125, -9.54833984375, -8.404296875, -7.26025390625, -6.1162109375, -4.97216796875, -3.828125, -2.68408203125, -1.5400390625, -0.39599609375, 0.748046875, 1.89208984375, 3.0361328125, 4.18017578125, 5.32421875, 6.46826171875, 7.6123046875, 8.75634765625, 9.900390625, 11.04443359375, 12.1884765625, 13.33251953125, 14.4765625, 15.62060546875, 16.7646484375, 17.90869140625, 19.052734375, 20.19677734375, 21.3408203125, 22.48486328125, 23.62890625, 24.77294921875, 25.9169921875, 27.06103515625, 28.205078125, 29.34912109375, 30.4931640625, 31.63720703125, 32.78125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 7.0, 12.0, 14.0, 12.0, 20.0, 30.0, 48.0, 49.0, 60.0, 88.0, 113.0, 179.0, 225.0, 290.0, 397.0, 413.0, 427.0, 390.0, 331.0, 245.0, 214.0, 131.0, 99.0, 78.0, 46.0, 29.0, 31.0, 21.0, 17.0, 15.0, 12.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.59375, -11.13134765625, -10.6689453125, -10.20654296875, -9.744140625, -9.28173828125, -8.8193359375, -8.35693359375, -7.89453125, -7.43212890625, -6.9697265625, -6.50732421875, -6.044921875, -5.58251953125, -5.1201171875, -4.65771484375, -4.1953125, -3.73291015625, -3.2705078125, -2.80810546875, -2.345703125, -1.88330078125, -1.4208984375, -0.95849609375, -0.49609375, -0.03369140625, 0.4287109375, 0.89111328125, 1.353515625, 1.81591796875, 2.2783203125, 2.74072265625, 3.203125, 3.66552734375, 4.1279296875, 4.59033203125, 5.052734375, 5.51513671875, 5.9775390625, 6.43994140625, 6.90234375, 7.36474609375, 7.8271484375, 8.28955078125, 8.751953125, 9.21435546875, 9.6767578125, 10.13916015625, 10.6015625, 11.06396484375, 11.5263671875, 11.98876953125, 12.451171875, 12.91357421875, 13.3759765625, 13.83837890625, 14.30078125, 14.76318359375, 15.2255859375, 15.68798828125, 16.150390625, 16.61279296875, 17.0751953125, 17.53759765625, 18.0]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 5.0, 11.0, 6.0, 18.0, 22.0, 26.0, 32.0, 43.0, 68.0, 80.0, 87.0, 151.0, 203.0, 304.0, 528.0, 1497.0, 43787.0, 4030168.0, 113346.0, 2149.0, 614.0, 340.0, 206.0, 134.0, 105.0, 75.0, 75.0, 42.0, 28.0, 29.0, 25.0, 13.0, 15.0, 11.0, 4.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.78125, -53.75927734375, -51.7373046875, -49.71533203125, -47.693359375, -45.67138671875, -43.6494140625, -41.62744140625, -39.60546875, -37.58349609375, -35.5615234375, -33.53955078125, -31.517578125, -29.49560546875, -27.4736328125, -25.45166015625, -23.4296875, -21.40771484375, -19.3857421875, -17.36376953125, -15.341796875, -13.31982421875, -11.2978515625, -9.27587890625, -7.25390625, -5.23193359375, -3.2099609375, -1.18798828125, 0.833984375, 2.85595703125, 4.8779296875, 6.89990234375, 8.921875, 10.94384765625, 12.9658203125, 14.98779296875, 17.009765625, 19.03173828125, 21.0537109375, 23.07568359375, 25.09765625, 27.11962890625, 29.1416015625, 31.16357421875, 33.185546875, 35.20751953125, 37.2294921875, 39.25146484375, 41.2734375, 43.29541015625, 45.3173828125, 47.33935546875, 49.361328125, 51.38330078125, 53.4052734375, 55.42724609375, 57.44921875, 59.47119140625, 61.4931640625, 63.51513671875, 65.537109375, 67.55908203125, 69.5810546875, 71.60302734375, 73.625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 50.0, 146.0, 259.0, 297.0, 161.0, 70.0, 18.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-262.4325866699219, -257.2919006347656, -252.15122985839844, -247.01055908203125, -241.869873046875, -236.72918701171875, -231.58851623535156, -226.44784545898438, -221.30715942382812, -216.16647338867188, -211.0258026123047, -205.8851318359375, -200.74444580078125, -195.603759765625, -190.4630889892578, -185.32241821289062, -180.18173217773438, -175.04104614257812, -169.90037536621094, -164.75970458984375, -159.6190185546875, -154.47833251953125, -149.33766174316406, -144.19699096679688, -139.05630493164062, -133.91561889648438, -128.7749481201172, -123.63426971435547, -118.49359130859375, -113.35291290283203, -108.21223449707031, -103.0715560913086, -97.9308853149414, -92.79020690917969, -87.64952850341797, -82.50885009765625, -77.36817169189453, -72.22749328613281, -67.0868148803711, -61.946136474609375, -56.805458068847656, -51.66477966308594, -46.52410125732422, -41.3834228515625, -36.24274444580078, -31.102066040039062, -25.961387634277344, -20.820709228515625, -15.680030822753906, -10.539352416992188, -5.398674011230469, -0.25799560546875, 4.882682800292969, 10.023361206054688, 15.164039611816406, 20.304718017578125, 25.445396423339844, 30.586074829101562, 35.72675323486328, 40.867431640625, 46.00811004638672, 51.14878845214844, 56.289466857910156, 61.430145263671875, 66.5708236694336]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 6.0, 9.0, 11.0, 12.0, 15.0, 11.0, 18.0, 15.0, 26.0, 17.0, 18.0, 23.0, 23.0, 29.0, 40.0, 41.0, 29.0, 49.0, 34.0, 36.0, 35.0, 39.0, 34.0, 26.0, 41.0, 39.0, 35.0, 32.0, 24.0, 26.0, 25.0, 25.0, 21.0, 16.0, 23.0, 19.0, 12.0, 16.0, 5.0, 7.0, 12.0, 5.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-43.546993255615234, -42.135963439941406, -40.724937438964844, -39.313907623291016, -37.90287780761719, -36.49184799194336, -35.08081817626953, -33.66979217529297, -32.25876235961914, -30.847732543945312, -29.436704635620117, -28.025676727294922, -26.614646911621094, -25.203617095947266, -23.79258918762207, -22.381561279296875, -20.970531463623047, -19.55950164794922, -18.148473739624023, -16.737445831298828, -15.326416015625, -13.915387153625488, -12.504358291625977, -11.093329429626465, -9.682300567626953, -8.271271705627441, -6.86024284362793, -5.449213981628418, -4.038185119628906, -2.6271562576293945, -1.2161273956298828, 0.1949014663696289, 1.605926513671875, 3.0169553756713867, 4.427984237670898, 5.83901309967041, 7.250041961669922, 8.661070823669434, 10.072099685668945, 11.483128547668457, 12.894157409667969, 14.30518627166748, 15.716215133666992, 17.127243041992188, 18.538272857666016, 19.949302673339844, 21.36033058166504, 22.771358489990234, 24.182388305664062, 25.59341812133789, 27.004446029663086, 28.41547393798828, 29.82650375366211, 31.237533569335938, 32.6485595703125, 34.05958938598633, 35.470619201660156, 36.881649017333984, 38.29267883300781, 39.703704833984375, 41.1147346496582, 42.52576446533203, 43.936790466308594, 45.34782028198242, 46.75885009765625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 11.0, 7.0, 7.0, 13.0, 9.0, 9.0, 16.0, 17.0, 21.0, 25.0, 21.0, 28.0, 33.0, 27.0, 33.0, 38.0, 39.0, 35.0, 44.0, 28.0, 33.0, 35.0, 40.0, 34.0, 31.0, 33.0, 34.0, 30.0, 29.0, 18.0, 28.0, 24.0, 25.0, 21.0, 16.0, 19.0, 15.0, 14.0, 16.0, 3.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.26171875, -6.06634521484375, -5.8709716796875, -5.67559814453125, -5.480224609375, -5.28485107421875, -5.0894775390625, -4.89410400390625, -4.69873046875, -4.50335693359375, -4.3079833984375, -4.11260986328125, -3.917236328125, -3.72186279296875, -3.5264892578125, -3.33111572265625, -3.1357421875, -2.94036865234375, -2.7449951171875, -2.54962158203125, -2.354248046875, -2.15887451171875, -1.9635009765625, -1.76812744140625, -1.57275390625, -1.37738037109375, -1.1820068359375, -0.98663330078125, -0.791259765625, -0.59588623046875, -0.4005126953125, -0.20513916015625, -0.009765625, 0.18560791015625, 0.3809814453125, 0.57635498046875, 0.771728515625, 0.96710205078125, 1.1624755859375, 1.35784912109375, 1.55322265625, 1.74859619140625, 1.9439697265625, 2.13934326171875, 2.334716796875, 2.53009033203125, 2.7254638671875, 2.92083740234375, 3.1162109375, 3.31158447265625, 3.5069580078125, 3.70233154296875, 3.897705078125, 4.09307861328125, 4.2884521484375, 4.48382568359375, 4.67919921875, 4.87457275390625, 5.0699462890625, 5.26531982421875, 5.460693359375, 5.65606689453125, 5.8514404296875, 6.04681396484375, 6.2421875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 16.0, 21.0, 25.0, 34.0, 71.0, 86.0, 158.0, 234.0, 265.0, 438.0, 621.0, 952.0, 1322.0, 2068.0, 2981.0, 4435.0, 6624.0, 9956.0, 14815.0, 22238.0, 34247.0, 52210.0, 80934.0, 125483.0, 186072.0, 173130.0, 114869.0, 73524.0, 47701.0, 31196.0, 20445.0, 13579.0, 8929.0, 6116.0, 4165.0, 2720.0, 1880.0, 1231.0, 883.0, 612.0, 419.0, 275.0, 187.0, 134.0, 84.0, 68.0, 32.0, 30.0, 14.0, 11.0, 5.0, 3.0, 6.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.87939453125, -0.8509292602539062, -0.8224639892578125, -0.7939987182617188, -0.765533447265625, -0.7370681762695312, -0.7086029052734375, -0.6801376342773438, -0.65167236328125, -0.6232070922851562, -0.5947418212890625, -0.5662765502929688, -0.537811279296875, -0.5093460083007812, -0.4808807373046875, -0.45241546630859375, -0.4239501953125, -0.39548492431640625, -0.3670196533203125, -0.33855438232421875, -0.310089111328125, -0.28162384033203125, -0.2531585693359375, -0.22469329833984375, -0.19622802734375, -0.16776275634765625, -0.1392974853515625, -0.11083221435546875, -0.082366943359375, -0.05390167236328125, -0.0254364013671875, 0.00302886962890625, 0.031494140625, 0.05995941162109375, 0.0884246826171875, 0.11688995361328125, 0.145355224609375, 0.17382049560546875, 0.2022857666015625, 0.23075103759765625, 0.25921630859375, 0.28768157958984375, 0.3161468505859375, 0.34461212158203125, 0.373077392578125, 0.40154266357421875, 0.4300079345703125, 0.45847320556640625, 0.4869384765625, 0.5154037475585938, 0.5438690185546875, 0.5723342895507812, 0.600799560546875, 0.6292648315429688, 0.6577301025390625, 0.6861953735351562, 0.71466064453125, 0.7431259155273438, 0.7715911865234375, 0.8000564575195312, 0.828521728515625, 0.8569869995117188, 0.8854522705078125, 0.9139175415039062, 0.9423828125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 10.0, 8.0, 13.0, 12.0, 12.0, 14.0, 22.0, 21.0, 28.0, 29.0, 30.0, 21.0, 34.0, 32.0, 39.0, 46.0, 44.0, 45.0, 1055.0, 49.0, 51.0, 39.0, 45.0, 36.0, 36.0, 36.0, 32.0, 31.0, 20.0, 19.0, 19.0, 16.0, 15.0, 10.0, 10.0, 9.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.5625, -4.41912841796875, -4.2757568359375, -4.13238525390625, -3.989013671875, -3.84564208984375, -3.7022705078125, -3.55889892578125, -3.41552734375, -3.27215576171875, -3.1287841796875, -2.98541259765625, -2.842041015625, -2.69866943359375, -2.5552978515625, -2.41192626953125, -2.2685546875, -2.12518310546875, -1.9818115234375, -1.83843994140625, -1.695068359375, -1.55169677734375, -1.4083251953125, -1.26495361328125, -1.12158203125, -0.97821044921875, -0.8348388671875, -0.69146728515625, -0.548095703125, -0.40472412109375, -0.2613525390625, -0.11798095703125, 0.025390625, 0.16876220703125, 0.3121337890625, 0.45550537109375, 0.598876953125, 0.74224853515625, 0.8856201171875, 1.02899169921875, 1.17236328125, 1.31573486328125, 1.4591064453125, 1.60247802734375, 1.745849609375, 1.88922119140625, 2.0325927734375, 2.17596435546875, 2.3193359375, 2.46270751953125, 2.6060791015625, 2.74945068359375, 2.892822265625, 3.03619384765625, 3.1795654296875, 3.32293701171875, 3.46630859375, 3.60968017578125, 3.7530517578125, 3.89642333984375, 4.039794921875, 4.18316650390625, 4.3265380859375, 4.46990966796875, 4.61328125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 16.0, 17.0, 22.0, 41.0, 44.0, 73.0, 112.0, 197.0, 272.0, 383.0, 587.0, 954.0, 1421.0, 2154.0, 3202.0, 5005.0, 7637.0, 11823.0, 18295.0, 28566.0, 45317.0, 71421.0, 113664.0, 182420.0, 1248983.0, 130481.0, 81607.0, 51209.0, 32301.0, 20482.0, 13379.0, 8519.0, 5644.0, 3660.0, 2477.0, 1594.0, 1040.0, 727.0, 480.0, 286.0, 233.0, 110.0, 94.0, 68.0, 39.0, 29.0, 19.0, 11.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.8896484375, -0.861968994140625, -0.83428955078125, -0.806610107421875, -0.7789306640625, -0.751251220703125, -0.72357177734375, -0.695892333984375, -0.668212890625, -0.640533447265625, -0.61285400390625, -0.585174560546875, -0.5574951171875, -0.529815673828125, -0.50213623046875, -0.474456787109375, -0.44677734375, -0.419097900390625, -0.39141845703125, -0.363739013671875, -0.3360595703125, -0.308380126953125, -0.28070068359375, -0.253021240234375, -0.225341796875, -0.197662353515625, -0.16998291015625, -0.142303466796875, -0.1146240234375, -0.086944580078125, -0.05926513671875, -0.031585693359375, -0.00390625, 0.023773193359375, 0.05145263671875, 0.079132080078125, 0.1068115234375, 0.134490966796875, 0.16217041015625, 0.189849853515625, 0.217529296875, 0.245208740234375, 0.27288818359375, 0.300567626953125, 0.3282470703125, 0.355926513671875, 0.38360595703125, 0.411285400390625, 0.43896484375, 0.466644287109375, 0.49432373046875, 0.522003173828125, 0.5496826171875, 0.577362060546875, 0.60504150390625, 0.632720947265625, 0.660400390625, 0.688079833984375, 0.71575927734375, 0.743438720703125, 0.7711181640625, 0.798797607421875, 0.82647705078125, 0.854156494140625, 0.8818359375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 16.0, 10.0, 10.0, 23.0, 24.0, 24.0, 30.0, 39.0, 38.0, 41.0, 54.0, 56.0, 68.0, 70.0, 67.0, 42.0, 59.0, 55.0, 41.0, 45.0, 32.0, 29.0, 18.0, 17.0, 24.0, 11.0, 8.0, 8.0, 12.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00154876708984375, -0.0014983564615249634, -0.0014479458332061768, -0.0013975352048873901, -0.0013471245765686035, -0.001296713948249817, -0.0012463033199310303, -0.0011958926916122437, -0.001145482063293457, -0.0010950714349746704, -0.0010446608066558838, -0.0009942501783370972, -0.0009438395500183105, -0.0008934289216995239, -0.0008430182933807373, -0.0007926076650619507, -0.0007421970367431641, -0.0006917864084243774, -0.0006413757801055908, -0.0005909651517868042, -0.0005405545234680176, -0.000490143895149231, -0.00043973326683044434, -0.0003893226385116577, -0.0003389120101928711, -0.00028850138187408447, -0.00023809075355529785, -0.00018768012523651123, -0.0001372694969177246, -8.685886859893799e-05, -3.644824028015137e-05, 1.3962388038635254e-05, 6.437301635742188e-05, 0.0001147836446762085, 0.00016519427299499512, 0.00021560490131378174, 0.00026601552963256836, 0.000316426157951355, 0.0003668367862701416, 0.0004172474145889282, 0.00046765804290771484, 0.0005180686712265015, 0.0005684792995452881, 0.0006188899278640747, 0.0006693005561828613, 0.000719711184501648, 0.0007701218128204346, 0.0008205324411392212, 0.0008709430694580078, 0.0009213536977767944, 0.0009717643260955811, 0.0010221749544143677, 0.0010725855827331543, 0.001122996211051941, 0.0011734068393707275, 0.0012238174676895142, 0.0012742280960083008, 0.0013246387243270874, 0.001375049352645874, 0.0014254599809646606, 0.0014758706092834473, 0.0015262812376022339, 0.0015766918659210205, 0.0016271024942398071, 0.0016775131225585938]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 11.0, 8.0, 14.0, 20.0, 15.0, 22.0, 37.0, 44.0, 59.0, 87.0, 126.0, 208.0, 517.0, 2968.0, 1025286.0, 17589.0, 743.0, 291.0, 153.0, 95.0, 60.0, 47.0, 33.0, 28.0, 23.0, 15.0, 11.0, 6.0, 6.0, 1.0, 8.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039093017578125, -0.03789567947387695, -0.036698341369628906, -0.03550100326538086, -0.03430366516113281, -0.033106327056884766, -0.03190898895263672, -0.030711650848388672, -0.029514312744140625, -0.028316974639892578, -0.02711963653564453, -0.025922298431396484, -0.024724960327148438, -0.02352762222290039, -0.022330284118652344, -0.021132946014404297, -0.01993560791015625, -0.018738269805908203, -0.017540931701660156, -0.01634359359741211, -0.015146255493164062, -0.013948917388916016, -0.012751579284667969, -0.011554241180419922, -0.010356903076171875, -0.009159564971923828, -0.007962226867675781, -0.006764888763427734, -0.0055675506591796875, -0.004370212554931641, -0.0031728744506835938, -0.001975536346435547, -0.0007781982421875, 0.0004191398620605469, 0.0016164779663085938, 0.0028138160705566406, 0.0040111541748046875, 0.005208492279052734, 0.006405830383300781, 0.007603168487548828, 0.008800506591796875, 0.009997844696044922, 0.011195182800292969, 0.012392520904541016, 0.013589859008789062, 0.01478719711303711, 0.015984535217285156, 0.017181873321533203, 0.01837921142578125, 0.019576549530029297, 0.020773887634277344, 0.02197122573852539, 0.023168563842773438, 0.024365901947021484, 0.02556324005126953, 0.026760578155517578, 0.027957916259765625, 0.029155254364013672, 0.03035259246826172, 0.031549930572509766, 0.03274726867675781, 0.03394460678100586, 0.035141944885253906, 0.03633928298950195, 0.03753662109375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 16.0, 42.0, 106.0, 184.0, 210.0, 199.0, 127.0, 69.0, 29.0, 17.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0020032308530062437, -0.0019485864322632551, -0.0018939421279355884, -0.0018392977071925998, -0.0017846532864496112, -0.0017300089821219444, -0.0016753645613789558, -0.0016207201406359673, -0.0015660757198929787, -0.00151143129914999, -0.0014567869948223233, -0.0014021425740793347, -0.0013474981533363461, -0.0012928538490086794, -0.0012382094282656908, -0.0011835650075227022, -0.0011289207031950355, -0.0010742762824520469, -0.0010196319781243801, -0.0009649875573813915, -0.0009103431366384029, -0.0008556987741030753, -0.0008010544115677476, -0.000746409990824759, -0.0006917656282894313, -0.0006371212657541037, -0.0005824768450111151, -0.0005278324824757874, -0.00047318809083662927, -0.00041854369919747114, -0.00036389933666214347, -0.00030925494502298534, -0.0002546104369685054, -0.00019996604532934725, -0.00014532166824210435, -9.067729115486145e-05, -3.603289951570332e-05, 1.861149212345481e-05, 7.325585465878248e-05, 0.0001279002462979406, 0.00018254463793709874, 0.00023718902957625687, 0.000291833421215415, 0.0003464777837507427, 0.0004011221753899008, 0.00045576656702905893, 0.0005104109295643866, 0.0005650552920997143, 0.0006196997128427029, 0.0006743440753780305, 0.0007289884961210191, 0.0007836328586563468, 0.0008382772793993354, 0.0008929216419346631, 0.0009475660044699907, 0.0010022104252129793, 0.001056854845955968, 0.0011114992666989565, 0.0011661435710266232, 0.0012207879917696118, 0.0012754324125126004, 0.0013300767168402672, 0.0013847211375832558, 0.0014393655583262444, 0.0014940098626539111]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 3.0, 9.0, 4.0, 6.0, 13.0, 14.0, 22.0, 11.0, 18.0, 26.0, 23.0, 32.0, 28.0, 29.0, 29.0, 42.0, 32.0, 34.0, 37.0, 41.0, 41.0, 43.0, 40.0, 40.0, 35.0, 32.0, 28.0, 32.0, 29.0, 28.0, 26.0, 31.0, 19.0, 14.0, 13.0, 19.0, 18.0, 11.0, 13.0, 9.0, 7.0, 4.0, 1.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0007635951042175293, -0.0007400056347250938, -0.0007164161652326584, -0.0006928266957402229, -0.0006692372262477875, -0.000645647756755352, -0.0006220582872629166, -0.0005984688177704811, -0.0005748793482780457, -0.0005512898787856102, -0.0005277004092931747, -0.0005041109398007393, -0.00048052147030830383, -0.0004569320008158684, -0.0004333425313234329, -0.00040975306183099747, -0.000386163592338562, -0.00036257412284612656, -0.0003389846533536911, -0.00031539518386125565, -0.0002918057143688202, -0.00026821624487638474, -0.0002446267753839493, -0.00022103730589151382, -0.00019744783639907837, -0.00017385836690664291, -0.00015026889741420746, -0.000126679427921772, -0.00010308995842933655, -7.950048893690109e-05, -5.591101944446564e-05, -3.232154995203018e-05, -8.732080459594727e-06, 1.4857389032840729e-05, 3.8446858525276184e-05, 6.203632801771164e-05, 8.56257975101471e-05, 0.00010921526700258255, 0.000132804736495018, 0.00015639420598745346, 0.00017998367547988892, 0.00020357314497232437, 0.00022716261446475983, 0.0002507520839571953, 0.00027434155344963074, 0.0002979310229420662, 0.00032152049243450165, 0.0003451099619269371, 0.00036869943141937256, 0.000392288900911808, 0.00041587837040424347, 0.0004394678398966789, 0.0004630573093891144, 0.00048664677888154984, 0.0005102362483739853, 0.0005338257178664207, 0.0005574151873588562, 0.0005810046568512917, 0.0006045941263437271, 0.0006281835958361626, 0.000651773065328598, 0.0006753625348210335, 0.0006989520043134689, 0.0007225414738059044, 0.0007461309432983398]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 11.0, 7.0, 7.0, 13.0, 9.0, 9.0, 15.0, 18.0, 21.0, 25.0, 21.0, 28.0, 32.0, 28.0, 33.0, 37.0, 39.0, 34.0, 46.0, 28.0, 32.0, 36.0, 39.0, 34.0, 32.0, 32.0, 34.0, 31.0, 29.0, 17.0, 29.0, 24.0, 23.0, 23.0, 16.0, 18.0, 16.0, 13.0, 17.0, 3.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.26171875, -6.06640625, -5.87109375, -5.67578125, -5.48046875, -5.28515625, -5.08984375, -4.89453125, -4.69921875, -4.50390625, -4.30859375, -4.11328125, -3.91796875, -3.72265625, -3.52734375, -3.33203125, -3.13671875, -2.94140625, -2.74609375, -2.55078125, -2.35546875, -2.16015625, -1.96484375, -1.76953125, -1.57421875, -1.37890625, -1.18359375, -0.98828125, -0.79296875, -0.59765625, -0.40234375, -0.20703125, -0.01171875, 0.18359375, 0.37890625, 0.57421875, 0.76953125, 0.96484375, 1.16015625, 1.35546875, 1.55078125, 1.74609375, 1.94140625, 2.13671875, 2.33203125, 2.52734375, 2.72265625, 2.91796875, 3.11328125, 3.30859375, 3.50390625, 3.69921875, 3.89453125, 4.08984375, 4.28515625, 4.48046875, 4.67578125, 4.87109375, 5.06640625, 5.26171875, 5.45703125, 5.65234375, 5.84765625, 6.04296875, 6.23828125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 2.0, 7.0, 11.0, 17.0, 25.0, 35.0, 52.0, 80.0, 113.0, 178.0, 248.0, 381.0, 577.0, 864.0, 1256.0, 1840.0, 2951.0, 4765.0, 7662.0, 12692.0, 22361.0, 43130.0, 93370.0, 236044.0, 347861.0, 139205.0, 60609.0, 29932.0, 16184.0, 9658.0, 5766.0, 3681.0, 2399.0, 1565.0, 1006.0, 654.0, 417.0, 297.0, 191.0, 145.0, 95.0, 65.0, 46.0, 37.0, 23.0, 20.0, 10.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.3828125, -3.281005859375, -3.17919921875, -3.077392578125, -2.9755859375, -2.873779296875, -2.77197265625, -2.670166015625, -2.568359375, -2.466552734375, -2.36474609375, -2.262939453125, -2.1611328125, -2.059326171875, -1.95751953125, -1.855712890625, -1.75390625, -1.652099609375, -1.55029296875, -1.448486328125, -1.3466796875, -1.244873046875, -1.14306640625, -1.041259765625, -0.939453125, -0.837646484375, -0.73583984375, -0.634033203125, -0.5322265625, -0.430419921875, -0.32861328125, -0.226806640625, -0.125, -0.023193359375, 0.07861328125, 0.180419921875, 0.2822265625, 0.384033203125, 0.48583984375, 0.587646484375, 0.689453125, 0.791259765625, 0.89306640625, 0.994873046875, 1.0966796875, 1.198486328125, 1.30029296875, 1.402099609375, 1.50390625, 1.605712890625, 1.70751953125, 1.809326171875, 1.9111328125, 2.012939453125, 2.11474609375, 2.216552734375, 2.318359375, 2.420166015625, 2.52197265625, 2.623779296875, 2.7255859375, 2.827392578125, 2.92919921875, 3.031005859375, 3.1328125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 6.0, 7.0, 15.0, 14.0, 10.0, 8.0, 20.0, 15.0, 23.0, 27.0, 39.0, 53.0, 46.0, 33.0, 44.0, 62.0, 149.0, 1739.0, 219.0, 72.0, 53.0, 52.0, 42.0, 43.0, 24.0, 34.0, 30.0, 21.0, 28.0, 27.0, 13.0, 13.0, 9.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.51904296875, -20.7099609375, -19.90087890625, -19.091796875, -18.28271484375, -17.4736328125, -16.66455078125, -15.85546875, -15.04638671875, -14.2373046875, -13.42822265625, -12.619140625, -11.81005859375, -11.0009765625, -10.19189453125, -9.3828125, -8.57373046875, -7.7646484375, -6.95556640625, -6.146484375, -5.33740234375, -4.5283203125, -3.71923828125, -2.91015625, -2.10107421875, -1.2919921875, -0.48291015625, 0.326171875, 1.13525390625, 1.9443359375, 2.75341796875, 3.5625, 4.37158203125, 5.1806640625, 5.98974609375, 6.798828125, 7.60791015625, 8.4169921875, 9.22607421875, 10.03515625, 10.84423828125, 11.6533203125, 12.46240234375, 13.271484375, 14.08056640625, 14.8896484375, 15.69873046875, 16.5078125, 17.31689453125, 18.1259765625, 18.93505859375, 19.744140625, 20.55322265625, 21.3623046875, 22.17138671875, 22.98046875, 23.78955078125, 24.5986328125, 25.40771484375, 26.216796875, 27.02587890625, 27.8349609375, 28.64404296875, 29.453125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 6.0, 9.0, 16.0, 35.0, 23.0, 34.0, 58.0, 55.0, 88.0, 116.0, 182.0, 354.0, 681.0, 4077.0, 3034288.0, 102925.0, 1499.0, 464.0, 260.0, 180.0, 109.0, 60.0, 39.0, 20.0, 29.0, 25.0, 17.0, 11.0, 12.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.5625, -76.484375, -74.40625, -72.328125, -70.25, -68.171875, -66.09375, -64.015625, -61.9375, -59.859375, -57.78125, -55.703125, -53.625, -51.546875, -49.46875, -47.390625, -45.3125, -43.234375, -41.15625, -39.078125, -37.0, -34.921875, -32.84375, -30.765625, -28.6875, -26.609375, -24.53125, -22.453125, -20.375, -18.296875, -16.21875, -14.140625, -12.0625, -9.984375, -7.90625, -5.828125, -3.75, -1.671875, 0.40625, 2.484375, 4.5625, 6.640625, 8.71875, 10.796875, 12.875, 14.953125, 17.03125, 19.109375, 21.1875, 23.265625, 25.34375, 27.421875, 29.5, 31.578125, 33.65625, 35.734375, 37.8125, 39.890625, 41.96875, 44.046875, 46.125, 48.203125, 50.28125, 52.359375, 54.4375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 8.0, 13.0, 33.0, 93.0, 176.0, 213.0, 219.0, 140.0, 76.0, 27.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-77.00790405273438, -75.60250854492188, -74.1971206665039, -72.79173278808594, -71.38633728027344, -69.98094177246094, -68.57555389404297, -67.170166015625, -65.7647705078125, -64.359375, -62.95398712158203, -61.5485954284668, -60.14320373535156, -58.73781204223633, -57.332420349121094, -55.92702865600586, -54.521636962890625, -53.11624526977539, -51.710853576660156, -50.30546188354492, -48.90007019042969, -47.49467849731445, -46.08928680419922, -44.683895111083984, -43.27850341796875, -41.873111724853516, -40.46772003173828, -39.06232833862305, -37.65693664550781, -36.25154495239258, -34.846153259277344, -33.44076156616211, -32.035369873046875, -30.62997817993164, -29.224586486816406, -27.819194793701172, -26.413803100585938, -25.008411407470703, -23.60301971435547, -22.197628021240234, -20.792236328125, -19.386844635009766, -17.98145294189453, -16.576061248779297, -15.170669555664062, -13.765277862548828, -12.359886169433594, -10.95449447631836, -9.549103736877441, -8.143712043762207, -6.738320350646973, -5.332928657531738, -3.927536964416504, -2.5221452713012695, -1.1167535781860352, 0.2886381149291992, 1.6940298080444336, 3.099421501159668, 4.504813194274902, 5.910204887390137, 7.315596580505371, 8.720988273620605, 10.12637996673584, 11.531771659851074, 12.937163352966309]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 4.0, 2.0, 7.0, 7.0, 9.0, 7.0, 13.0, 10.0, 22.0, 29.0, 24.0, 29.0, 20.0, 33.0, 29.0, 39.0, 26.0, 32.0, 51.0, 52.0, 35.0, 43.0, 43.0, 38.0, 39.0, 41.0, 32.0, 31.0, 31.0, 34.0, 24.0, 24.0, 26.0, 22.0, 8.0, 18.0, 21.0, 8.0, 6.0, 12.0, 2.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.31575012207031, -61.22175598144531, -59.12776184082031, -57.03377151489258, -54.93977737426758, -52.84578323364258, -50.751792907714844, -48.657798767089844, -46.563804626464844, -44.469810485839844, -42.375816345214844, -40.28182601928711, -38.18783187866211, -36.09383773803711, -33.999847412109375, -31.905853271484375, -29.811859130859375, -27.717864990234375, -25.623872756958008, -23.52988052368164, -21.43588638305664, -19.34189224243164, -17.247900009155273, -15.15390682220459, -13.059913635253906, -10.965920448303223, -8.871927261352539, -6.7779340744018555, -4.683940887451172, -2.5899477005004883, -0.4959545135498047, 1.598038673400879, 3.6920394897460938, 5.786032676696777, 7.880025863647461, 9.974019050598145, 12.068012237548828, 14.162005424499512, 16.255998611450195, 18.349990844726562, 20.443984985351562, 22.537979125976562, 24.63197135925293, 26.725963592529297, 28.819957733154297, 30.913951873779297, 33.00794219970703, 35.10193634033203, 37.19593048095703, 39.28992462158203, 41.38391876220703, 43.477909088134766, 45.571903228759766, 47.665897369384766, 49.7598876953125, 51.8538818359375, 53.9478759765625, 56.0418701171875, 58.1358642578125, 60.229854583740234, 62.323848724365234, 64.41783905029297, 66.51183319091797, 68.60582733154297, 70.69982147216797]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 9.0, 5.0, 10.0, 12.0, 5.0, 16.0, 9.0, 22.0, 13.0, 22.0, 19.0, 30.0, 32.0, 27.0, 25.0, 23.0, 44.0, 33.0, 34.0, 34.0, 30.0, 35.0, 32.0, 33.0, 33.0, 33.0, 36.0, 32.0, 35.0, 21.0, 23.0, 28.0, 18.0, 22.0, 20.0, 16.0, 19.0, 16.0, 21.0, 9.0, 13.0, 6.0, 7.0, 6.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0], "bins": [-5.97265625, -5.781494140625, -5.59033203125, -5.399169921875, -5.2080078125, -5.016845703125, -4.82568359375, -4.634521484375, -4.443359375, -4.252197265625, -4.06103515625, -3.869873046875, -3.6787109375, -3.487548828125, -3.29638671875, -3.105224609375, -2.9140625, -2.722900390625, -2.53173828125, -2.340576171875, -2.1494140625, -1.958251953125, -1.76708984375, -1.575927734375, -1.384765625, -1.193603515625, -1.00244140625, -0.811279296875, -0.6201171875, -0.428955078125, -0.23779296875, -0.046630859375, 0.14453125, 0.335693359375, 0.52685546875, 0.718017578125, 0.9091796875, 1.100341796875, 1.29150390625, 1.482666015625, 1.673828125, 1.864990234375, 2.05615234375, 2.247314453125, 2.4384765625, 2.629638671875, 2.82080078125, 3.011962890625, 3.203125, 3.394287109375, 3.58544921875, 3.776611328125, 3.9677734375, 4.158935546875, 4.35009765625, 4.541259765625, 4.732421875, 4.923583984375, 5.11474609375, 5.305908203125, 5.4970703125, 5.688232421875, 5.87939453125, 6.070556640625, 6.26171875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 13.0, 15.0, 18.0, 28.0, 43.0, 53.0, 73.0, 104.0, 136.0, 231.0, 347.0, 610.0, 1163.0, 2351.0, 5673.0, 16109.0, 66709.0, 369911.0, 1421316.0, 1677084.0, 513443.0, 86435.0, 19875.0, 6569.0, 2761.0, 1344.0, 662.0, 398.0, 234.0, 165.0, 96.0, 74.0, 64.0, 49.0, 40.0, 26.0, 16.0, 12.0, 13.0, 10.0, 4.0, 2.0, 2.0, 3.0], "bins": [-12.4375, -12.119384765625, -11.80126953125, -11.483154296875, -11.1650390625, -10.846923828125, -10.52880859375, -10.210693359375, -9.892578125, -9.574462890625, -9.25634765625, -8.938232421875, -8.6201171875, -8.302001953125, -7.98388671875, -7.665771484375, -7.34765625, -7.029541015625, -6.71142578125, -6.393310546875, -6.0751953125, -5.757080078125, -5.43896484375, -5.120849609375, -4.802734375, -4.484619140625, -4.16650390625, -3.848388671875, -3.5302734375, -3.212158203125, -2.89404296875, -2.575927734375, -2.2578125, -1.939697265625, -1.62158203125, -1.303466796875, -0.9853515625, -0.667236328125, -0.34912109375, -0.031005859375, 0.287109375, 0.605224609375, 0.92333984375, 1.241455078125, 1.5595703125, 1.877685546875, 2.19580078125, 2.513916015625, 2.83203125, 3.150146484375, 3.46826171875, 3.786376953125, 4.1044921875, 4.422607421875, 4.74072265625, 5.058837890625, 5.376953125, 5.695068359375, 6.01318359375, 6.331298828125, 6.6494140625, 6.967529296875, 7.28564453125, 7.603759765625, 7.921875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 1.0, 9.0, 9.0, 8.0, 9.0, 10.0, 12.0, 13.0, 18.0, 20.0, 29.0, 42.0, 57.0, 69.0, 85.0, 102.0, 161.0, 176.0, 241.0, 291.0, 335.0, 366.0, 383.0, 319.0, 281.0, 227.0, 176.0, 123.0, 113.0, 78.0, 76.0, 58.0, 39.0, 37.0, 22.0, 23.0, 19.0, 19.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.4375, -10.0361328125, -9.634765625, -9.2333984375, -8.83203125, -8.4306640625, -8.029296875, -7.6279296875, -7.2265625, -6.8251953125, -6.423828125, -6.0224609375, -5.62109375, -5.2197265625, -4.818359375, -4.4169921875, -4.015625, -3.6142578125, -3.212890625, -2.8115234375, -2.41015625, -2.0087890625, -1.607421875, -1.2060546875, -0.8046875, -0.4033203125, -0.001953125, 0.3994140625, 0.80078125, 1.2021484375, 1.603515625, 2.0048828125, 2.40625, 2.8076171875, 3.208984375, 3.6103515625, 4.01171875, 4.4130859375, 4.814453125, 5.2158203125, 5.6171875, 6.0185546875, 6.419921875, 6.8212890625, 7.22265625, 7.6240234375, 8.025390625, 8.4267578125, 8.828125, 9.2294921875, 9.630859375, 10.0322265625, 10.43359375, 10.8349609375, 11.236328125, 11.6376953125, 12.0390625, 12.4404296875, 12.841796875, 13.2431640625, 13.64453125, 14.0458984375, 14.447265625, 14.8486328125, 15.25]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 0.0, 4.0, 5.0, 10.0, 14.0, 12.0, 23.0, 20.0, 15.0, 40.0, 27.0, 54.0, 73.0, 80.0, 108.0, 152.0, 245.0, 389.0, 1067.0, 14258.0, 3378750.0, 791433.0, 5569.0, 775.0, 321.0, 221.0, 149.0, 100.0, 70.0, 59.0, 46.0, 50.0, 29.0, 24.0, 17.0, 20.0, 8.0, 6.0, 13.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-65.9375, -64.04638671875, -62.1552734375, -60.26416015625, -58.373046875, -56.48193359375, -54.5908203125, -52.69970703125, -50.80859375, -48.91748046875, -47.0263671875, -45.13525390625, -43.244140625, -41.35302734375, -39.4619140625, -37.57080078125, -35.6796875, -33.78857421875, -31.8974609375, -30.00634765625, -28.115234375, -26.22412109375, -24.3330078125, -22.44189453125, -20.55078125, -18.65966796875, -16.7685546875, -14.87744140625, -12.986328125, -11.09521484375, -9.2041015625, -7.31298828125, -5.421875, -3.53076171875, -1.6396484375, 0.25146484375, 2.142578125, 4.03369140625, 5.9248046875, 7.81591796875, 9.70703125, 11.59814453125, 13.4892578125, 15.38037109375, 17.271484375, 19.16259765625, 21.0537109375, 22.94482421875, 24.8359375, 26.72705078125, 28.6181640625, 30.50927734375, 32.400390625, 34.29150390625, 36.1826171875, 38.07373046875, 39.96484375, 41.85595703125, 43.7470703125, 45.63818359375, 47.529296875, 49.42041015625, 51.3115234375, 53.20263671875, 55.09375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 7.0, 11.0, 10.0, 14.0, 16.0, 19.0, 26.0, 50.0, 42.0, 58.0, 63.0, 74.0, 82.0, 82.0, 89.0, 91.0, 58.0, 59.0, 38.0, 33.0, 28.0, 19.0, 14.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.831884384155273, -21.42334747314453, -20.014812469482422, -18.60627555847168, -17.19774055480957, -15.789203643798828, -14.380667686462402, -12.972131729125977, -11.56359577178955, -10.155059814453125, -8.7465238571167, -7.337987422943115, -5.9294514656066895, -4.520915508270264, -3.1123790740966797, -1.703843116760254, -0.2953071594238281, 1.1132289171218872, 2.5217649936676025, 3.9303011894226074, 5.338837146759033, 6.747373104095459, 8.155909538269043, 9.564445495605469, 10.972981452941895, 12.38151741027832, 13.790053367614746, 15.198589324951172, 16.607126235961914, 18.015661239624023, 19.424198150634766, 20.832733154296875, 22.241268157958984, 23.649805068969727, 25.058340072631836, 26.466876983642578, 27.875411987304688, 29.28394889831543, 30.692485809326172, 32.10102081298828, 33.50955581665039, 34.9180908203125, 36.326629638671875, 37.735164642333984, 39.143699645996094, 40.5522346496582, 41.96077346801758, 43.36930847167969, 44.77784729003906, 46.18638229370117, 47.59492111206055, 49.003456115722656, 50.411991119384766, 51.820526123046875, 53.22906494140625, 54.63759994506836, 56.04613494873047, 57.45466995239258, 58.86320877075195, 60.27174377441406, 61.68027877807617, 63.08881378173828, 64.49735260009766, 65.9058837890625, 67.31442260742188]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 12.0, 7.0, 7.0, 6.0, 12.0, 16.0, 19.0, 27.0, 22.0, 27.0, 31.0, 35.0, 39.0, 44.0, 39.0, 30.0, 36.0, 49.0, 46.0, 37.0, 39.0, 33.0, 43.0, 35.0, 31.0, 30.0, 29.0, 26.0, 24.0, 29.0, 27.0, 20.0, 15.0, 13.0, 9.0, 15.0, 11.0, 6.0, 8.0, 2.0, 8.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0], "bins": [-53.66212463378906, -52.12750244140625, -50.59288024902344, -49.058258056640625, -47.52363204956055, -45.989009857177734, -44.45438766479492, -42.91976547241211, -41.3851432800293, -39.850521087646484, -38.31589889526367, -36.781272888183594, -35.24665069580078, -33.71202850341797, -32.177406311035156, -30.642784118652344, -29.1081600189209, -27.573537826538086, -26.03891372680664, -24.504291534423828, -22.969669342041016, -21.435047149658203, -19.900423049926758, -18.365800857543945, -16.8311767578125, -15.296553611755371, -13.761931419372559, -12.22730827331543, -10.692686080932617, -9.158062934875488, -7.623439788818359, -6.088817596435547, -4.554195404052734, -3.0195727348327637, -1.4849498271942139, 0.04967308044433594, 1.5842957496643066, 3.1189184188842773, 4.653541564941406, 6.188163757324219, 7.722786903381348, 9.257410049438477, 10.792032241821289, 12.326655387878418, 13.861278533935547, 15.39590072631836, 16.930522918701172, 18.465145111083984, 19.99976921081543, 21.534391403198242, 23.069015502929688, 24.6036376953125, 26.138259887695312, 27.672882080078125, 29.20750617980957, 30.742128372192383, 32.27675247192383, 33.81137466430664, 35.34599685668945, 36.88062286376953, 38.415245056152344, 39.949867248535156, 41.48448944091797, 43.01911163330078, 44.553733825683594]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 13.0, 10.0, 11.0, 19.0, 12.0, 18.0, 16.0, 20.0, 18.0, 21.0, 14.0, 39.0, 41.0, 32.0, 40.0, 40.0, 21.0, 29.0, 44.0, 41.0, 34.0, 33.0, 38.0, 34.0, 27.0, 29.0, 30.0, 32.0, 28.0, 23.0, 23.0, 21.0, 21.0, 20.0, 24.0, 6.0, 8.0, 15.0, 7.0, 8.0, 1.0, 6.0, 8.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0], "bins": [-6.0703125, -5.87359619140625, -5.6768798828125, -5.48016357421875, -5.283447265625, -5.08673095703125, -4.8900146484375, -4.69329833984375, -4.49658203125, -4.29986572265625, -4.1031494140625, -3.90643310546875, -3.709716796875, -3.51300048828125, -3.3162841796875, -3.11956787109375, -2.9228515625, -2.72613525390625, -2.5294189453125, -2.33270263671875, -2.135986328125, -1.93927001953125, -1.7425537109375, -1.54583740234375, -1.34912109375, -1.15240478515625, -0.9556884765625, -0.75897216796875, -0.562255859375, -0.36553955078125, -0.1688232421875, 0.02789306640625, 0.224609375, 0.42132568359375, 0.6180419921875, 0.81475830078125, 1.011474609375, 1.20819091796875, 1.4049072265625, 1.60162353515625, 1.79833984375, 1.99505615234375, 2.1917724609375, 2.38848876953125, 2.585205078125, 2.78192138671875, 2.9786376953125, 3.17535400390625, 3.3720703125, 3.56878662109375, 3.7655029296875, 3.96221923828125, 4.158935546875, 4.35565185546875, 4.5523681640625, 4.74908447265625, 4.94580078125, 5.14251708984375, 5.3392333984375, 5.53594970703125, 5.732666015625, 5.92938232421875, 6.1260986328125, 6.32281494140625, 6.51953125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 7.0, 8.0, 10.0, 30.0, 32.0, 39.0, 70.0, 98.0, 123.0, 213.0, 329.0, 491.0, 771.0, 1147.0, 1708.0, 2510.0, 3928.0, 5996.0, 8971.0, 13847.0, 20933.0, 32373.0, 50135.0, 77998.0, 125635.0, 199954.0, 184197.0, 113842.0, 71252.0, 45859.0, 29566.0, 19456.0, 12794.0, 8237.0, 5389.0, 3506.0, 2369.0, 1569.0, 982.0, 745.0, 490.0, 296.0, 227.0, 156.0, 96.0, 52.0, 47.0, 27.0, 12.0, 10.0, 11.0, 10.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.0263671875, -0.9951705932617188, -0.9639739990234375, -0.9327774047851562, -0.901580810546875, -0.8703842163085938, -0.8391876220703125, -0.8079910278320312, -0.77679443359375, -0.7455978393554688, -0.7144012451171875, -0.6832046508789062, -0.652008056640625, -0.6208114624023438, -0.5896148681640625, -0.5584182739257812, -0.5272216796875, -0.49602508544921875, -0.4648284912109375, -0.43363189697265625, -0.402435302734375, -0.37123870849609375, -0.3400421142578125, -0.30884552001953125, -0.27764892578125, -0.24645233154296875, -0.2152557373046875, -0.18405914306640625, -0.152862548828125, -0.12166595458984375, -0.0904693603515625, -0.05927276611328125, -0.028076171875, 0.00312042236328125, 0.0343170166015625, 0.06551361083984375, 0.096710205078125, 0.12790679931640625, 0.1591033935546875, 0.19029998779296875, 0.22149658203125, 0.25269317626953125, 0.2838897705078125, 0.31508636474609375, 0.346282958984375, 0.37747955322265625, 0.4086761474609375, 0.43987274169921875, 0.4710693359375, 0.5022659301757812, 0.5334625244140625, 0.5646591186523438, 0.595855712890625, 0.6270523071289062, 0.6582489013671875, 0.6894454956054688, 0.72064208984375, 0.7518386840820312, 0.7830352783203125, 0.8142318725585938, 0.845428466796875, 0.8766250610351562, 0.9078216552734375, 0.9390182495117188, 0.97021484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 4.0, 6.0, 10.0, 8.0, 15.0, 8.0, 13.0, 17.0, 20.0, 20.0, 20.0, 32.0, 31.0, 33.0, 29.0, 39.0, 47.0, 52.0, 45.0, 1064.0, 42.0, 35.0, 40.0, 41.0, 37.0, 39.0, 33.0, 39.0, 28.0, 25.0, 23.0, 26.0, 21.0, 16.0, 10.0, 10.0, 10.0, 9.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.860107421875, -3.71630859375, -3.572509765625, -3.4287109375, -3.284912109375, -3.14111328125, -2.997314453125, -2.853515625, -2.709716796875, -2.56591796875, -2.422119140625, -2.2783203125, -2.134521484375, -1.99072265625, -1.846923828125, -1.703125, -1.559326171875, -1.41552734375, -1.271728515625, -1.1279296875, -0.984130859375, -0.84033203125, -0.696533203125, -0.552734375, -0.408935546875, -0.26513671875, -0.121337890625, 0.0224609375, 0.166259765625, 0.31005859375, 0.453857421875, 0.59765625, 0.741455078125, 0.88525390625, 1.029052734375, 1.1728515625, 1.316650390625, 1.46044921875, 1.604248046875, 1.748046875, 1.891845703125, 2.03564453125, 2.179443359375, 2.3232421875, 2.467041015625, 2.61083984375, 2.754638671875, 2.8984375, 3.042236328125, 3.18603515625, 3.329833984375, 3.4736328125, 3.617431640625, 3.76123046875, 3.905029296875, 4.048828125, 4.192626953125, 4.33642578125, 4.480224609375, 4.6240234375, 4.767822265625, 4.91162109375, 5.055419921875, 5.19921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 3.0, 12.0, 16.0, 17.0, 26.0, 45.0, 61.0, 94.0, 116.0, 184.0, 288.0, 442.0, 630.0, 995.0, 1431.0, 2174.0, 3116.0, 4750.0, 7234.0, 10626.0, 15837.0, 24025.0, 35958.0, 54169.0, 81564.0, 124827.0, 1231444.0, 167791.0, 111383.0, 72680.0, 48415.0, 32446.0, 21393.0, 14114.0, 9551.0, 6264.0, 4183.0, 2925.0, 1925.0, 1298.0, 848.0, 635.0, 383.0, 273.0, 189.0, 122.0, 86.0, 58.0, 36.0, 27.0, 10.0, 7.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.78857421875, -0.7630233764648438, -0.7374725341796875, -0.7119216918945312, -0.686370849609375, -0.6608200073242188, -0.6352691650390625, -0.6097183227539062, -0.58416748046875, -0.5586166381835938, -0.5330657958984375, -0.5075149536132812, -0.481964111328125, -0.45641326904296875, -0.4308624267578125, -0.40531158447265625, -0.3797607421875, -0.35420989990234375, -0.3286590576171875, -0.30310821533203125, -0.277557373046875, -0.25200653076171875, -0.2264556884765625, -0.20090484619140625, -0.17535400390625, -0.14980316162109375, -0.1242523193359375, -0.09870147705078125, -0.073150634765625, -0.04759979248046875, -0.0220489501953125, 0.00350189208984375, 0.029052734375, 0.05460357666015625, 0.0801544189453125, 0.10570526123046875, 0.131256103515625, 0.15680694580078125, 0.1823577880859375, 0.20790863037109375, 0.23345947265625, 0.25901031494140625, 0.2845611572265625, 0.31011199951171875, 0.335662841796875, 0.36121368408203125, 0.3867645263671875, 0.41231536865234375, 0.4378662109375, 0.46341705322265625, 0.4889678955078125, 0.5145187377929688, 0.540069580078125, 0.5656204223632812, 0.5911712646484375, 0.6167221069335938, 0.64227294921875, 0.6678237915039062, 0.6933746337890625, 0.7189254760742188, 0.744476318359375, 0.7700271606445312, 0.7955780029296875, 0.8211288452148438, 0.8466796875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 7.0, 10.0, 7.0, 16.0, 20.0, 31.0, 41.0, 36.0, 42.0, 67.0, 98.0, 82.0, 72.0, 59.0, 52.0, 71.0, 53.0, 39.0, 30.0, 31.0, 32.0, 20.0, 15.0, 4.0, 7.0, 9.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019407272338867188, -0.0018734186887741089, -0.001806110143661499, -0.0017388015985488892, -0.0016714930534362793, -0.0016041845083236694, -0.0015368759632110596, -0.0014695674180984497, -0.0014022588729858398, -0.00133495032787323, -0.0012676417827606201, -0.0012003332376480103, -0.0011330246925354004, -0.0010657161474227905, -0.0009984076023101807, -0.0009310990571975708, -0.0008637905120849609, -0.0007964819669723511, -0.0007291734218597412, -0.0006618648767471313, -0.0005945563316345215, -0.0005272477865219116, -0.00045993924140930176, -0.0003926306962966919, -0.00032532215118408203, -0.00025801360607147217, -0.0001907050609588623, -0.00012339651584625244, -5.608797073364258e-05, 1.1220574378967285e-05, 7.852911949157715e-05, 0.000145837664604187, 0.00021314620971679688, 0.00028045475482940674, 0.0003477632999420166, 0.00041507184505462646, 0.00048238039016723633, 0.0005496889352798462, 0.0006169974803924561, 0.0006843060255050659, 0.0007516145706176758, 0.0008189231157302856, 0.0008862316608428955, 0.0009535402059555054, 0.0010208487510681152, 0.001088157296180725, 0.001155465841293335, 0.0012227743864059448, 0.0012900829315185547, 0.0013573914766311646, 0.0014247000217437744, 0.0014920085668563843, 0.0015593171119689941, 0.001626625657081604, 0.0016939342021942139, 0.0017612427473068237, 0.0018285512924194336, 0.0018958598375320435, 0.0019631683826446533, 0.002030476927757263, 0.002097785472869873, 0.002165094017982483, 0.0022324025630950928, 0.0022997111082077026, 0.0023670196533203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 8.0, 12.0, 9.0, 15.0, 23.0, 30.0, 41.0, 51.0, 70.0, 91.0, 201.0, 578.0, 3636.0, 1034777.0, 7668.0, 626.0, 253.0, 136.0, 81.0, 53.0, 37.0, 25.0, 36.0, 13.0, 8.0, 8.0, 11.0, 10.0, 5.0, 3.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05267333984375, -0.051192283630371094, -0.04971122741699219, -0.04823017120361328, -0.046749114990234375, -0.04526805877685547, -0.04378700256347656, -0.042305946350097656, -0.04082489013671875, -0.039343833923339844, -0.03786277770996094, -0.03638172149658203, -0.034900665283203125, -0.03341960906982422, -0.03193855285644531, -0.030457496643066406, -0.0289764404296875, -0.027495384216308594, -0.026014328002929688, -0.02453327178955078, -0.023052215576171875, -0.02157115936279297, -0.020090103149414062, -0.018609046936035156, -0.01712799072265625, -0.015646934509277344, -0.014165878295898438, -0.012684822082519531, -0.011203765869140625, -0.009722709655761719, -0.008241653442382812, -0.006760597229003906, -0.005279541015625, -0.0037984848022460938, -0.0023174285888671875, -0.0008363723754882812, 0.000644683837890625, 0.0021257400512695312, 0.0036067962646484375, 0.005087852478027344, 0.00656890869140625, 0.008049964904785156, 0.009531021118164062, 0.011012077331542969, 0.012493133544921875, 0.013974189758300781, 0.015455245971679688, 0.016936302185058594, 0.0184173583984375, 0.019898414611816406, 0.021379470825195312, 0.02286052703857422, 0.024341583251953125, 0.02582263946533203, 0.027303695678710938, 0.028784751892089844, 0.03026580810546875, 0.031746864318847656, 0.03322792053222656, 0.03470897674560547, 0.036190032958984375, 0.03767108917236328, 0.03915214538574219, 0.040633201599121094, 0.0421142578125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 94.0, 419.0, 408.0, 77.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002539523644372821, -0.002380147809162736, -0.0022207722067832947, -0.0020613963715732098, -0.0019020205363631248, -0.00174264470115304, -0.0015832689823582768, -0.0014238932635635138, -0.0012645174283534288, -0.001105141593143344, -0.0009457658743485808, -0.0007863900973461568, -0.0006270143203437328, -0.00046763854334130883, -0.00030826276633888483, -0.00014888704754412174, 1.0488787665963173e-05, 0.00016986456466838717, 0.0003292403416708112, 0.0004886161186732352, 0.0006479918956756592, 0.0008073676726780832, 0.0009667434496805072, 0.0011261191684752703, 0.0012854950036853552, 0.00144487083889544, 0.0016042465576902032, 0.0017636222764849663, 0.0019229981116950512, 0.002082373946905136, 0.002241749782115221, 0.0024011253844946623, 0.002560501452535391, 0.0027198772877454758, 0.0028792531229555607, 0.003038628725335002, 0.003198004560545087, 0.0033573803957551718, 0.003516755998134613, 0.003676131833344698, 0.003835507668554783, 0.003994883503764868, 0.004154259338974953, 0.004313635174185038, 0.0044730110093951225, 0.00463238637894392, 0.004791762214154005, 0.00495113804936409, 0.005110513884574175, 0.00526988971978426, 0.005429265554994345, 0.00558864139020443, 0.005748016759753227, 0.005907392594963312, 0.006066768430173397, 0.006226144265383482, 0.006385520100593567, 0.006544895935803652, 0.006704271771013737, 0.006863647606223822, 0.0070230234414339066, 0.007182398810982704, 0.007341774646192789, 0.007501150481402874, 0.007660526316612959]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 3.0, 1.0, 7.0, 5.0, 6.0, 11.0, 13.0, 16.0, 15.0, 16.0, 25.0, 20.0, 22.0, 36.0, 25.0, 25.0, 39.0, 29.0, 26.0, 33.0, 30.0, 37.0, 33.0, 44.0, 46.0, 32.0, 36.0, 34.0, 38.0, 29.0, 26.0, 18.0, 27.0, 23.0, 26.0, 26.0, 18.0, 13.0, 19.0, 17.0, 9.0, 10.0, 6.0, 6.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009249448776245117, -0.0008970508351922035, -0.0008691567927598953, -0.0008412627503275871, -0.0008133687078952789, -0.0007854746654629707, -0.0007575806230306625, -0.0007296865805983543, -0.0007017925381660461, -0.0006738984957337379, -0.0006460044533014297, -0.0006181104108691216, -0.0005902163684368134, -0.0005623223260045052, -0.000534428283572197, -0.0005065342411398888, -0.00047864019870758057, -0.00045074615627527237, -0.00042285211384296417, -0.000394958071410656, -0.0003670640289783478, -0.0003391699865460396, -0.0003112759441137314, -0.0002833819016814232, -0.000255487859249115, -0.0002275938168168068, -0.0001996997743844986, -0.0001718057319521904, -0.0001439116895198822, -0.000116017647087574, -8.812360465526581e-05, -6.022956222295761e-05, -3.2335519790649414e-05, -4.441477358341217e-06, 2.345256507396698e-05, 5.134660750627518e-05, 7.924064993858337e-05, 0.00010713469237089157, 0.00013502873480319977, 0.00016292277723550797, 0.00019081681966781616, 0.00021871086210012436, 0.00024660490453243256, 0.00027449894696474075, 0.00030239298939704895, 0.00033028703182935715, 0.00035818107426166534, 0.00038607511669397354, 0.00041396915912628174, 0.00044186320155858994, 0.00046975724399089813, 0.0004976512864232063, 0.0005255453288555145, 0.0005534393712878227, 0.0005813334137201309, 0.0006092274561524391, 0.0006371214985847473, 0.0006650155410170555, 0.0006929095834493637, 0.0007208036258816719, 0.0007486976683139801, 0.0007765917107462883, 0.0008044857531785965, 0.0008323797956109047, 0.0008602738380432129]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 13.0, 10.0, 11.0, 19.0, 12.0, 18.0, 16.0, 20.0, 18.0, 21.0, 14.0, 39.0, 41.0, 32.0, 40.0, 40.0, 21.0, 29.0, 44.0, 41.0, 34.0, 33.0, 38.0, 34.0, 27.0, 29.0, 30.0, 32.0, 28.0, 23.0, 23.0, 21.0, 21.0, 20.0, 24.0, 6.0, 8.0, 15.0, 7.0, 8.0, 1.0, 6.0, 8.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0], "bins": [-6.0703125, -5.87359619140625, -5.6768798828125, -5.48016357421875, -5.283447265625, -5.08673095703125, -4.8900146484375, -4.69329833984375, -4.49658203125, -4.29986572265625, -4.1031494140625, -3.90643310546875, -3.709716796875, -3.51300048828125, -3.3162841796875, -3.11956787109375, -2.9228515625, -2.72613525390625, -2.5294189453125, -2.33270263671875, -2.135986328125, -1.93927001953125, -1.7425537109375, -1.54583740234375, -1.34912109375, -1.15240478515625, -0.9556884765625, -0.75897216796875, -0.562255859375, -0.36553955078125, -0.1688232421875, 0.02789306640625, 0.224609375, 0.42132568359375, 0.6180419921875, 0.81475830078125, 1.011474609375, 1.20819091796875, 1.4049072265625, 1.60162353515625, 1.79833984375, 1.99505615234375, 2.1917724609375, 2.38848876953125, 2.585205078125, 2.78192138671875, 2.9786376953125, 3.17535400390625, 3.3720703125, 3.56878662109375, 3.7655029296875, 3.96221923828125, 4.158935546875, 4.35565185546875, 4.5523681640625, 4.74908447265625, 4.94580078125, 5.14251708984375, 5.3392333984375, 5.53594970703125, 5.732666015625, 5.92938232421875, 6.1260986328125, 6.32281494140625, 6.51953125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 3.0, 5.0, 5.0, 23.0, 18.0, 27.0, 48.0, 79.0, 91.0, 148.0, 187.0, 300.0, 422.0, 739.0, 1142.0, 2050.0, 3930.0, 7369.0, 15137.0, 31468.0, 68924.0, 164716.0, 380561.0, 211066.0, 84144.0, 38463.0, 17927.0, 8831.0, 4436.0, 2449.0, 1406.0, 859.0, 499.0, 334.0, 223.0, 152.0, 105.0, 92.0, 48.0, 30.0, 24.0, 19.0, 16.0, 8.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.25103759765625, -4.1075439453125, -3.96405029296875, -3.820556640625, -3.67706298828125, -3.5335693359375, -3.39007568359375, -3.24658203125, -3.10308837890625, -2.9595947265625, -2.81610107421875, -2.672607421875, -2.52911376953125, -2.3856201171875, -2.24212646484375, -2.0986328125, -1.95513916015625, -1.8116455078125, -1.66815185546875, -1.524658203125, -1.38116455078125, -1.2376708984375, -1.09417724609375, -0.95068359375, -0.80718994140625, -0.6636962890625, -0.52020263671875, -0.376708984375, -0.23321533203125, -0.0897216796875, 0.05377197265625, 0.197265625, 0.34075927734375, 0.4842529296875, 0.62774658203125, 0.771240234375, 0.91473388671875, 1.0582275390625, 1.20172119140625, 1.34521484375, 1.48870849609375, 1.6322021484375, 1.77569580078125, 1.919189453125, 2.06268310546875, 2.2061767578125, 2.34967041015625, 2.4931640625, 2.63665771484375, 2.7801513671875, 2.92364501953125, 3.067138671875, 3.21063232421875, 3.3541259765625, 3.49761962890625, 3.64111328125, 3.78460693359375, 3.9281005859375, 4.07159423828125, 4.215087890625, 4.35858154296875, 4.5020751953125, 4.64556884765625, 4.7890625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 3.0, 7.0, 14.0, 16.0, 17.0, 23.0, 27.0, 26.0, 35.0, 39.0, 32.0, 59.0, 57.0, 80.0, 151.0, 1691.0, 277.0, 82.0, 59.0, 55.0, 44.0, 38.0, 28.0, 22.0, 25.0, 24.0, 29.0, 16.0, 15.0, 11.0, 7.0, 9.0, 9.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-34.4375, -33.50048828125, -32.5634765625, -31.62646484375, -30.689453125, -29.75244140625, -28.8154296875, -27.87841796875, -26.94140625, -26.00439453125, -25.0673828125, -24.13037109375, -23.193359375, -22.25634765625, -21.3193359375, -20.38232421875, -19.4453125, -18.50830078125, -17.5712890625, -16.63427734375, -15.697265625, -14.76025390625, -13.8232421875, -12.88623046875, -11.94921875, -11.01220703125, -10.0751953125, -9.13818359375, -8.201171875, -7.26416015625, -6.3271484375, -5.39013671875, -4.453125, -3.51611328125, -2.5791015625, -1.64208984375, -0.705078125, 0.23193359375, 1.1689453125, 2.10595703125, 3.04296875, 3.97998046875, 4.9169921875, 5.85400390625, 6.791015625, 7.72802734375, 8.6650390625, 9.60205078125, 10.5390625, 11.47607421875, 12.4130859375, 13.35009765625, 14.287109375, 15.22412109375, 16.1611328125, 17.09814453125, 18.03515625, 18.97216796875, 19.9091796875, 20.84619140625, 21.783203125, 22.72021484375, 23.6572265625, 24.59423828125, 25.53125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 12.0, 4.0, 13.0, 22.0, 19.0, 20.0, 38.0, 40.0, 55.0, 63.0, 105.0, 126.0, 175.0, 247.0, 450.0, 1498.0, 171382.0, 2966596.0, 3136.0, 596.0, 332.0, 233.0, 138.0, 97.0, 74.0, 50.0, 51.0, 31.0, 30.0, 16.0, 14.0, 8.0, 5.0, 12.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.46875, -55.35205078125, -53.2353515625, -51.11865234375, -49.001953125, -46.88525390625, -44.7685546875, -42.65185546875, -40.53515625, -38.41845703125, -36.3017578125, -34.18505859375, -32.068359375, -29.95166015625, -27.8349609375, -25.71826171875, -23.6015625, -21.48486328125, -19.3681640625, -17.25146484375, -15.134765625, -13.01806640625, -10.9013671875, -8.78466796875, -6.66796875, -4.55126953125, -2.4345703125, -0.31787109375, 1.798828125, 3.91552734375, 6.0322265625, 8.14892578125, 10.265625, 12.38232421875, 14.4990234375, 16.61572265625, 18.732421875, 20.84912109375, 22.9658203125, 25.08251953125, 27.19921875, 29.31591796875, 31.4326171875, 33.54931640625, 35.666015625, 37.78271484375, 39.8994140625, 42.01611328125, 44.1328125, 46.24951171875, 48.3662109375, 50.48291015625, 52.599609375, 54.71630859375, 56.8330078125, 58.94970703125, 61.06640625, 63.18310546875, 65.2998046875, 67.41650390625, 69.533203125, 71.64990234375, 73.7666015625, 75.88330078125, 78.0]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 15.0, 166.0, 460.0, 319.0, 48.0, 3.0, 4.0, 2.0], "bins": [-185.8696746826172, -182.70724487304688, -179.5447998046875, -176.3823699951172, -173.21994018554688, -170.0574951171875, -166.8950653076172, -163.73263549804688, -160.5701904296875, -157.4077606201172, -154.2453155517578, -151.0828857421875, -147.9204559326172, -144.7580108642578, -141.5955810546875, -138.43313598632812, -135.2707061767578, -132.1082763671875, -128.94583129882812, -125.78340148925781, -122.62096405029297, -119.45852661132812, -116.29609680175781, -113.13365936279297, -109.97122955322266, -106.80879211425781, -103.6463623046875, -100.48392486572266, -97.32148742675781, -94.15904998779297, -90.99662017822266, -87.83418273925781, -84.67174530029297, -81.50930786132812, -78.34687805175781, -75.18444061279297, -72.02200317382812, -68.85956573486328, -65.69713592529297, -62.534698486328125, -59.37226104736328, -56.2098274230957, -53.04738998413086, -49.88495635986328, -46.72251892089844, -43.56008529663086, -40.39765167236328, -37.23521423339844, -34.07278060913086, -30.91034507751465, -27.747909545898438, -24.58547592163086, -21.423038482666016, -18.260604858398438, -15.098169326782227, -11.935733795166016, -8.773298263549805, -5.610862731933594, -2.448427677154541, 0.7140073776245117, 3.8764429092407227, 7.038878440856934, 10.201313018798828, 13.363748550415039, 16.52618408203125]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 7.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 17.0, 8.0, 11.0, 19.0, 17.0, 24.0, 17.0, 33.0, 31.0, 26.0, 35.0, 37.0, 38.0, 41.0, 37.0, 34.0, 36.0, 34.0, 49.0, 41.0, 35.0, 47.0, 39.0, 33.0, 23.0, 30.0, 27.0, 34.0, 17.0, 18.0, 16.0, 9.0, 12.0, 17.0, 2.0, 6.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.16265869140625, -52.25460433959961, -50.34654998779297, -48.43849563598633, -46.53044128417969, -44.62238693237305, -42.714332580566406, -40.806278228759766, -38.898223876953125, -36.990169525146484, -35.082115173339844, -33.1740608215332, -31.266006469726562, -29.357952117919922, -27.44989776611328, -25.54184341430664, -23.6337890625, -21.72573471069336, -19.81768035888672, -17.909626007080078, -16.001571655273438, -14.093517303466797, -12.185462951660156, -10.277408599853516, -8.369354248046875, -6.461299896240234, -4.553245544433594, -2.645191192626953, -0.7371368408203125, 1.1709175109863281, 3.0789718627929688, 4.987026214599609, 6.89508056640625, 8.80313491821289, 10.711189270019531, 12.619243621826172, 14.527297973632812, 16.435352325439453, 18.343406677246094, 20.251461029052734, 22.159515380859375, 24.067569732666016, 25.975624084472656, 27.883678436279297, 29.791732788085938, 31.699787139892578, 33.60784149169922, 35.51589584350586, 37.4239501953125, 39.33200454711914, 41.24005889892578, 43.14811325073242, 45.05616760253906, 46.9642219543457, 48.872276306152344, 50.780330657958984, 52.688385009765625, 54.596439361572266, 56.504493713378906, 58.41254806518555, 60.32060241699219, 62.22865676879883, 64.13671112060547, 66.04476928710938, 67.95281982421875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 7.0, 8.0, 9.0, 11.0, 18.0, 12.0, 13.0, 15.0, 18.0, 19.0, 22.0, 14.0, 31.0, 30.0, 35.0, 53.0, 34.0, 33.0, 23.0, 37.0, 44.0, 33.0, 36.0, 31.0, 31.0, 35.0, 41.0, 33.0, 25.0, 26.0, 25.0, 16.0, 25.0, 19.0, 26.0, 14.0, 18.0, 12.0, 12.0, 6.0, 11.0, 6.0, 4.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0], "bins": [-6.3984375, -6.19512939453125, -5.9918212890625, -5.78851318359375, -5.585205078125, -5.38189697265625, -5.1785888671875, -4.97528076171875, -4.77197265625, -4.56866455078125, -4.3653564453125, -4.16204833984375, -3.958740234375, -3.75543212890625, -3.5521240234375, -3.34881591796875, -3.1455078125, -2.94219970703125, -2.7388916015625, -2.53558349609375, -2.332275390625, -2.12896728515625, -1.9256591796875, -1.72235107421875, -1.51904296875, -1.31573486328125, -1.1124267578125, -0.90911865234375, -0.705810546875, -0.50250244140625, -0.2991943359375, -0.09588623046875, 0.107421875, 0.31072998046875, 0.5140380859375, 0.71734619140625, 0.920654296875, 1.12396240234375, 1.3272705078125, 1.53057861328125, 1.73388671875, 1.93719482421875, 2.1405029296875, 2.34381103515625, 2.547119140625, 2.75042724609375, 2.9537353515625, 3.15704345703125, 3.3603515625, 3.56365966796875, 3.7669677734375, 3.97027587890625, 4.173583984375, 4.37689208984375, 4.5802001953125, 4.78350830078125, 4.98681640625, 5.19012451171875, 5.3934326171875, 5.59674072265625, 5.800048828125, 6.00335693359375, 6.2066650390625, 6.40997314453125, 6.61328125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 13.0, 10.0, 17.0, 9.0, 17.0, 20.0, 18.0, 15.0, 19.0, 24.0, 22.0, 44.0, 36.0, 73.0, 162.0, 548.0, 2917.0, 31630.0, 1675492.0, 2428421.0, 49747.0, 3740.0, 677.0, 201.0, 76.0, 47.0, 39.0, 25.0, 24.0, 24.0, 13.0, 16.0, 25.0, 20.0, 15.0, 14.0, 9.0, 6.0, 3.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-26.140625, -25.29931640625, -24.4580078125, -23.61669921875, -22.775390625, -21.93408203125, -21.0927734375, -20.25146484375, -19.41015625, -18.56884765625, -17.7275390625, -16.88623046875, -16.044921875, -15.20361328125, -14.3623046875, -13.52099609375, -12.6796875, -11.83837890625, -10.9970703125, -10.15576171875, -9.314453125, -8.47314453125, -7.6318359375, -6.79052734375, -5.94921875, -5.10791015625, -4.2666015625, -3.42529296875, -2.583984375, -1.74267578125, -0.9013671875, -0.06005859375, 0.78125, 1.62255859375, 2.4638671875, 3.30517578125, 4.146484375, 4.98779296875, 5.8291015625, 6.67041015625, 7.51171875, 8.35302734375, 9.1943359375, 10.03564453125, 10.876953125, 11.71826171875, 12.5595703125, 13.40087890625, 14.2421875, 15.08349609375, 15.9248046875, 16.76611328125, 17.607421875, 18.44873046875, 19.2900390625, 20.13134765625, 20.97265625, 21.81396484375, 22.6552734375, 23.49658203125, 24.337890625, 25.17919921875, 26.0205078125, 26.86181640625, 27.703125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 14.0, 17.0, 34.0, 25.0, 25.0, 49.0, 67.0, 60.0, 85.0, 120.0, 148.0, 194.0, 244.0, 338.0, 379.0, 388.0, 384.0, 315.0, 269.0, 209.0, 162.0, 128.0, 86.0, 81.0, 57.0, 40.0, 27.0, 25.0, 17.0, 14.0, 12.0, 11.0, 4.0, 10.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-15.65625, -15.2490234375, -14.841796875, -14.4345703125, -14.02734375, -13.6201171875, -13.212890625, -12.8056640625, -12.3984375, -11.9912109375, -11.583984375, -11.1767578125, -10.76953125, -10.3623046875, -9.955078125, -9.5478515625, -9.140625, -8.7333984375, -8.326171875, -7.9189453125, -7.51171875, -7.1044921875, -6.697265625, -6.2900390625, -5.8828125, -5.4755859375, -5.068359375, -4.6611328125, -4.25390625, -3.8466796875, -3.439453125, -3.0322265625, -2.625, -2.2177734375, -1.810546875, -1.4033203125, -0.99609375, -0.5888671875, -0.181640625, 0.2255859375, 0.6328125, 1.0400390625, 1.447265625, 1.8544921875, 2.26171875, 2.6689453125, 3.076171875, 3.4833984375, 3.890625, 4.2978515625, 4.705078125, 5.1123046875, 5.51953125, 5.9267578125, 6.333984375, 6.7412109375, 7.1484375, 7.5556640625, 7.962890625, 8.3701171875, 8.77734375, 9.1845703125, 9.591796875, 9.9990234375, 10.40625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 16.0, 16.0, 29.0, 33.0, 35.0, 49.0, 97.0, 99.0, 169.0, 256.0, 461.0, 1560.0, 175870.0, 4002877.0, 10867.0, 777.0, 347.0, 202.0, 141.0, 82.0, 69.0, 54.0, 25.0, 30.0, 19.0, 19.0, 13.0, 11.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.25, -63.8212890625, -61.392578125, -58.9638671875, -56.53515625, -54.1064453125, -51.677734375, -49.2490234375, -46.8203125, -44.3916015625, -41.962890625, -39.5341796875, -37.10546875, -34.6767578125, -32.248046875, -29.8193359375, -27.390625, -24.9619140625, -22.533203125, -20.1044921875, -17.67578125, -15.2470703125, -12.818359375, -10.3896484375, -7.9609375, -5.5322265625, -3.103515625, -0.6748046875, 1.75390625, 4.1826171875, 6.611328125, 9.0400390625, 11.46875, 13.8974609375, 16.326171875, 18.7548828125, 21.18359375, 23.6123046875, 26.041015625, 28.4697265625, 30.8984375, 33.3271484375, 35.755859375, 38.1845703125, 40.61328125, 43.0419921875, 45.470703125, 47.8994140625, 50.328125, 52.7568359375, 55.185546875, 57.6142578125, 60.04296875, 62.4716796875, 64.900390625, 67.3291015625, 69.7578125, 72.1865234375, 74.615234375, 77.0439453125, 79.47265625, 81.9013671875, 84.330078125, 86.7587890625, 89.1875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 96.0, 292.0, 409.0, 176.0, 29.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.19850158691406, -240.38058471679688, -233.56268310546875, -226.74476623535156, -219.92684936523438, -213.1089324951172, -206.291015625, -199.47311401367188, -192.6551971435547, -185.8372802734375, -179.01937866210938, -172.2014617919922, -165.383544921875, -158.5656280517578, -151.74771118164062, -144.9298095703125, -138.1118927001953, -131.29397583007812, -124.47606658935547, -117.65815734863281, -110.84024047851562, -104.02232360839844, -97.20441436767578, -90.38650512695312, -83.56858825683594, -76.75067138671875, -69.9327621459961, -63.11484909057617, -56.29693603515625, -49.47902297973633, -42.661109924316406, -35.843196868896484, -29.025299072265625, -22.207386016845703, -15.389472961425781, -8.57155990600586, -1.7536468505859375, 5.064266204833984, 11.882179260253906, 18.700092315673828, 25.51800537109375, 32.33591842651367, 39.153831481933594, 45.971744537353516, 52.78965759277344, 59.60757064819336, 66.42548370361328, 73.24339294433594, 80.06130981445312, 86.87922668457031, 93.69713592529297, 100.51504516601562, 107.33296203613281, 114.15087890625, 120.96878814697266, 127.78669738769531, 134.6046142578125, 141.4225311279297, 148.24044799804688, 155.058349609375, 161.8762664794922, 168.69418334960938, 175.5120849609375, 182.3300018310547, 189.14791870117188]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 8.0, 6.0, 8.0, 14.0, 20.0, 17.0, 19.0, 19.0, 25.0, 32.0, 30.0, 36.0, 35.0, 39.0, 44.0, 49.0, 48.0, 40.0, 34.0, 31.0, 49.0, 39.0, 39.0, 35.0, 21.0, 36.0, 29.0, 28.0, 24.0, 27.0, 20.0, 18.0, 11.0, 19.0, 9.0, 6.0, 9.0, 4.0, 3.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.380706787109375, -49.83909606933594, -48.297489166259766, -46.75587844848633, -45.21426773071289, -43.67266082763672, -42.13105010986328, -40.589439392089844, -39.047828674316406, -37.50621795654297, -35.9646110534668, -34.42300033569336, -32.88138961791992, -31.339780807495117, -29.798171997070312, -28.256561279296875, -26.714954376220703, -25.1733455657959, -23.63173484802246, -22.090126037597656, -20.54851531982422, -19.006906509399414, -17.46529769897461, -15.923687934875488, -14.382078170776367, -12.840468406677246, -11.298858642578125, -9.75724983215332, -8.2156400680542, -6.674030303955078, -5.132421493530273, -3.5908117294311523, -2.0492019653320312, -0.5075924396514893, 1.0340170860290527, 2.5756263732910156, 4.117236137390137, 5.658845901489258, 7.2004547119140625, 8.742064476013184, 10.283674240112305, 11.825284004211426, 13.366893768310547, 14.908502578735352, 16.450111389160156, 17.991722106933594, 19.5333309173584, 21.074939727783203, 22.61655044555664, 24.158159255981445, 25.699769973754883, 27.241378784179688, 28.782989501953125, 30.32459831237793, 31.866207122802734, 33.40781784057617, 34.949424743652344, 36.49103546142578, 38.03264236450195, 39.57425308227539, 41.11586380004883, 42.657470703125, 44.19908142089844, 45.740692138671875, 47.28230285644531]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 10.0, 14.0, 16.0, 16.0, 17.0, 23.0, 13.0, 21.0, 25.0, 23.0, 42.0, 29.0, 38.0, 38.0, 43.0, 37.0, 36.0, 39.0, 44.0, 30.0, 47.0, 40.0, 25.0, 41.0, 34.0, 30.0, 24.0, 26.0, 20.0, 22.0, 22.0, 22.0, 12.0, 11.0, 7.0, 16.0, 7.0, 5.0, 4.0, 1.0, 2.0, 5.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.30364990234375, -6.0799560546875, -5.85626220703125, -5.632568359375, -5.40887451171875, -5.1851806640625, -4.96148681640625, -4.73779296875, -4.51409912109375, -4.2904052734375, -4.06671142578125, -3.843017578125, -3.61932373046875, -3.3956298828125, -3.17193603515625, -2.9482421875, -2.72454833984375, -2.5008544921875, -2.27716064453125, -2.053466796875, -1.82977294921875, -1.6060791015625, -1.38238525390625, -1.15869140625, -0.93499755859375, -0.7113037109375, -0.48760986328125, -0.263916015625, -0.04022216796875, 0.1834716796875, 0.40716552734375, 0.630859375, 0.85455322265625, 1.0782470703125, 1.30194091796875, 1.525634765625, 1.74932861328125, 1.9730224609375, 2.19671630859375, 2.42041015625, 2.64410400390625, 2.8677978515625, 3.09149169921875, 3.315185546875, 3.53887939453125, 3.7625732421875, 3.98626708984375, 4.2099609375, 4.43365478515625, 4.6573486328125, 4.88104248046875, 5.104736328125, 5.32843017578125, 5.5521240234375, 5.77581787109375, 5.99951171875, 6.22320556640625, 6.4468994140625, 6.67059326171875, 6.894287109375, 7.11798095703125, 7.3416748046875, 7.56536865234375, 7.7890625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 20.0, 23.0, 38.0, 62.0, 82.0, 114.0, 199.0, 249.0, 375.0, 547.0, 771.0, 1169.0, 1695.0, 2435.0, 3682.0, 5495.0, 8040.0, 12034.0, 18359.0, 26891.0, 40721.0, 61028.0, 94501.0, 148852.0, 200418.0, 146404.0, 92568.0, 60323.0, 39958.0, 26946.0, 17963.0, 11907.0, 7997.0, 5404.0, 3589.0, 2480.0, 1681.0, 1089.0, 799.0, 508.0, 360.0, 247.0, 187.0, 117.0, 71.0, 51.0, 39.0, 18.0, 22.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.94140625, -0.9105224609375, -0.879638671875, -0.8487548828125, -0.81787109375, -0.7869873046875, -0.756103515625, -0.7252197265625, -0.6943359375, -0.6634521484375, -0.632568359375, -0.6016845703125, -0.57080078125, -0.5399169921875, -0.509033203125, -0.4781494140625, -0.447265625, -0.4163818359375, -0.385498046875, -0.3546142578125, -0.32373046875, -0.2928466796875, -0.261962890625, -0.2310791015625, -0.2001953125, -0.1693115234375, -0.138427734375, -0.1075439453125, -0.07666015625, -0.0457763671875, -0.014892578125, 0.0159912109375, 0.046875, 0.0777587890625, 0.108642578125, 0.1395263671875, 0.17041015625, 0.2012939453125, 0.232177734375, 0.2630615234375, 0.2939453125, 0.3248291015625, 0.355712890625, 0.3865966796875, 0.41748046875, 0.4483642578125, 0.479248046875, 0.5101318359375, 0.541015625, 0.5718994140625, 0.602783203125, 0.6336669921875, 0.66455078125, 0.6954345703125, 0.726318359375, 0.7572021484375, 0.7880859375, 0.8189697265625, 0.849853515625, 0.8807373046875, 0.91162109375, 0.9425048828125, 0.973388671875, 1.0042724609375, 1.03515625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 11.0, 10.0, 9.0, 10.0, 12.0, 11.0, 15.0, 17.0, 17.0, 23.0, 19.0, 18.0, 25.0, 38.0, 40.0, 40.0, 49.0, 47.0, 40.0, 1070.0, 42.0, 38.0, 38.0, 41.0, 32.0, 52.0, 38.0, 31.0, 21.0, 21.0, 28.0, 20.0, 17.0, 19.0, 17.0, 6.0, 7.0, 5.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.078125, -4.9241943359375, -4.770263671875, -4.6163330078125, -4.46240234375, -4.3084716796875, -4.154541015625, -4.0006103515625, -3.8466796875, -3.6927490234375, -3.538818359375, -3.3848876953125, -3.23095703125, -3.0770263671875, -2.923095703125, -2.7691650390625, -2.615234375, -2.4613037109375, -2.307373046875, -2.1534423828125, -1.99951171875, -1.8455810546875, -1.691650390625, -1.5377197265625, -1.3837890625, -1.2298583984375, -1.075927734375, -0.9219970703125, -0.76806640625, -0.6141357421875, -0.460205078125, -0.3062744140625, -0.15234375, 0.0015869140625, 0.155517578125, 0.3094482421875, 0.46337890625, 0.6173095703125, 0.771240234375, 0.9251708984375, 1.0791015625, 1.2330322265625, 1.386962890625, 1.5408935546875, 1.69482421875, 1.8487548828125, 2.002685546875, 2.1566162109375, 2.310546875, 2.4644775390625, 2.618408203125, 2.7723388671875, 2.92626953125, 3.0802001953125, 3.234130859375, 3.3880615234375, 3.5419921875, 3.6959228515625, 3.849853515625, 4.0037841796875, 4.15771484375, 4.3116455078125, 4.465576171875, 4.6195068359375, 4.7734375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 9.0, 9.0, 19.0, 22.0, 35.0, 59.0, 82.0, 142.0, 253.0, 379.0, 538.0, 954.0, 1358.0, 2200.0, 3480.0, 5607.0, 8729.0, 13539.0, 21325.0, 33152.0, 53236.0, 88243.0, 149082.0, 1271338.0, 174569.0, 102753.0, 61545.0, 37790.0, 24353.0, 15070.0, 9953.0, 6226.0, 4059.0, 2515.0, 1637.0, 1091.0, 650.0, 426.0, 239.0, 156.0, 113.0, 68.0, 55.0, 26.0, 25.0, 10.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96630859375, -0.9347763061523438, -0.9032440185546875, -0.8717117309570312, -0.840179443359375, -0.8086471557617188, -0.7771148681640625, -0.7455825805664062, -0.71405029296875, -0.6825180053710938, -0.6509857177734375, -0.6194534301757812, -0.587921142578125, -0.5563888549804688, -0.5248565673828125, -0.49332427978515625, -0.4617919921875, -0.43025970458984375, -0.3987274169921875, -0.36719512939453125, -0.335662841796875, -0.30413055419921875, -0.2725982666015625, -0.24106597900390625, -0.20953369140625, -0.17800140380859375, -0.1464691162109375, -0.11493682861328125, -0.083404541015625, -0.05187225341796875, -0.0203399658203125, 0.01119232177734375, 0.042724609375, 0.07425689697265625, 0.1057891845703125, 0.13732147216796875, 0.168853759765625, 0.20038604736328125, 0.2319183349609375, 0.26345062255859375, 0.29498291015625, 0.32651519775390625, 0.3580474853515625, 0.38957977294921875, 0.421112060546875, 0.45264434814453125, 0.4841766357421875, 0.5157089233398438, 0.5472412109375, 0.5787734985351562, 0.6103057861328125, 0.6418380737304688, 0.673370361328125, 0.7049026489257812, 0.7364349365234375, 0.7679672241210938, 0.79949951171875, 0.8310317993164062, 0.8625640869140625, 0.8940963745117188, 0.925628662109375, 0.9571609497070312, 0.9886932373046875, 1.0202255249023438, 1.0517578125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 9.0, 10.0, 7.0, 11.0, 19.0, 19.0, 32.0, 56.0, 53.0, 73.0, 77.0, 88.0, 116.0, 93.0, 60.0, 51.0, 50.0, 39.0, 28.0, 27.0, 22.0, 14.0, 15.0, 4.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0025882720947265625, -0.002512216567993164, -0.0024361610412597656, -0.002360105514526367, -0.0022840499877929688, -0.0022079944610595703, -0.002131938934326172, -0.0020558834075927734, -0.001979827880859375, -0.0019037723541259766, -0.0018277168273925781, -0.0017516613006591797, -0.0016756057739257812, -0.0015995502471923828, -0.0015234947204589844, -0.001447439193725586, -0.0013713836669921875, -0.001295328140258789, -0.0012192726135253906, -0.0011432170867919922, -0.0010671615600585938, -0.0009911060333251953, -0.0009150505065917969, -0.0008389949798583984, -0.000762939453125, -0.0006868839263916016, -0.0006108283996582031, -0.0005347728729248047, -0.00045871734619140625, -0.0003826618194580078, -0.0003066062927246094, -0.00023055076599121094, -0.0001544952392578125, -7.843971252441406e-05, -2.384185791015625e-06, 7.367134094238281e-05, 0.00014972686767578125, 0.0002257823944091797, 0.0003018379211425781, 0.00037789344787597656, 0.000453948974609375, 0.0005300045013427734, 0.0006060600280761719, 0.0006821155548095703, 0.0007581710815429688, 0.0008342266082763672, 0.0009102821350097656, 0.000986337661743164, 0.0010623931884765625, 0.001138448715209961, 0.0012145042419433594, 0.0012905597686767578, 0.0013666152954101562, 0.0014426708221435547, 0.0015187263488769531, 0.0015947818756103516, 0.00167083740234375, 0.0017468929290771484, 0.0018229484558105469, 0.0018990039825439453, 0.0019750595092773438, 0.002051115036010742, 0.0021271705627441406, 0.002203226089477539, 0.0022792816162109375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 14.0, 16.0, 11.0, 33.0, 37.0, 42.0, 55.0, 104.0, 225.0, 611.0, 28148.0, 1017358.0, 1222.0, 285.0, 144.0, 74.0, 44.0, 29.0, 23.0, 14.0, 7.0, 6.0, 9.0, 7.0, 11.0, 0.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.054473876953125, -0.05267000198364258, -0.050866127014160156, -0.049062252044677734, -0.04725837707519531, -0.04545450210571289, -0.04365062713623047, -0.04184675216674805, -0.040042877197265625, -0.0382390022277832, -0.03643512725830078, -0.03463125228881836, -0.03282737731933594, -0.031023502349853516, -0.029219627380371094, -0.027415752410888672, -0.02561187744140625, -0.023808002471923828, -0.022004127502441406, -0.020200252532958984, -0.018396377563476562, -0.01659250259399414, -0.014788627624511719, -0.012984752655029297, -0.011180877685546875, -0.009377002716064453, -0.007573127746582031, -0.005769252777099609, -0.0039653778076171875, -0.0021615028381347656, -0.00035762786865234375, 0.0014462471008300781, 0.0032501220703125, 0.005053997039794922, 0.006857872009277344, 0.008661746978759766, 0.010465621948242188, 0.01226949691772461, 0.014073371887207031, 0.015877246856689453, 0.017681121826171875, 0.019484996795654297, 0.02128887176513672, 0.02309274673461914, 0.024896621704101562, 0.026700496673583984, 0.028504371643066406, 0.030308246612548828, 0.03211212158203125, 0.03391599655151367, 0.035719871520996094, 0.037523746490478516, 0.03932762145996094, 0.04113149642944336, 0.04293537139892578, 0.0447392463684082, 0.046543121337890625, 0.04834699630737305, 0.05015087127685547, 0.05195474624633789, 0.05375862121582031, 0.055562496185302734, 0.057366371154785156, 0.05917024612426758, 0.06097412109375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 14.0, 161.0, 499.0, 291.0, 41.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025693662464618683, -0.0024316562339663506, -0.002293946221470833, -0.0021562364418059587, -0.002018526429310441, -0.0018808164168149233, -0.0017431065207347274, -0.0016053966246545315, -0.0014676866121590137, -0.001329976599663496, -0.0011922667035833001, -0.0010545568075031042, -0.0009168467950075865, -0.0007791368407197297, -0.0006414268864318728, -0.000503716932144016, -0.0003660069778561592, -0.0002282970235683024, -9.058706928044558e-05, 4.712288500741124e-05, 0.00018483283929526806, 0.0003225427935831249, 0.0004602527478709817, 0.0005979627021588385, 0.0007356726564466953, 0.0008733826107345521, 0.001011092565022409, 0.0011488024611026049, 0.0012865124735981226, 0.0014242224860936403, 0.0015619323821738362, 0.0016996422782540321, 0.0018373527564108372, 0.001975062768906355, 0.0021127727814018726, 0.0022504825610667467, 0.0023881925735622644, 0.002525902586057782, 0.0026636123657226562, 0.002801322378218174, 0.0029390323907136917, 0.0030767424032092094, 0.003214452415704727, 0.0033521621953696012, 0.003489872207865119, 0.0036275822203606367, 0.003765292000025511, 0.0039030020125210285, 0.004040712025016546, 0.004178422037512064, 0.004316132050007582, 0.0044538420625030994, 0.00459155160933733, 0.004729261621832848, 0.004866971634328365, 0.005004681646823883, 0.005142391659319401, 0.0052801016718149185, 0.005417811684310436, 0.005555521696805954, 0.005693231709301472, 0.005830941256135702, 0.00596865126863122, 0.006106361281126738, 0.006244071293622255]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 7.0, 11.0, 10.0, 15.0, 24.0, 16.0, 28.0, 19.0, 18.0, 23.0, 27.0, 32.0, 26.0, 39.0, 32.0, 41.0, 30.0, 36.0, 40.0, 46.0, 30.0, 47.0, 38.0, 39.0, 34.0, 25.0, 26.0, 18.0, 29.0, 27.0, 29.0, 19.0, 19.0, 19.0, 14.0, 12.0, 7.0, 13.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008105039596557617, -0.000783972442150116, -0.0007574409246444702, -0.0007309094071388245, -0.0007043778896331787, -0.000677846372127533, -0.0006513148546218872, -0.0006247833371162415, -0.0005982518196105957, -0.00057172030210495, -0.0005451887845993042, -0.0005186572670936584, -0.0004921257495880127, -0.00046559423208236694, -0.0004390627145767212, -0.00041253119707107544, -0.0003859996795654297, -0.00035946816205978394, -0.0003329366445541382, -0.00030640512704849243, -0.0002798736095428467, -0.00025334209203720093, -0.00022681057453155518, -0.00020027905702590942, -0.00017374753952026367, -0.00014721602201461792, -0.00012068450450897217, -9.415298700332642e-05, -6.762146949768066e-05, -4.108995199203491e-05, -1.455843448638916e-05, 1.1973083019256592e-05, 3.8504600524902344e-05, 6.50361180305481e-05, 9.156763553619385e-05, 0.0001180991530418396, 0.00014463067054748535, 0.0001711621880531311, 0.00019769370555877686, 0.0002242252230644226, 0.00025075674057006836, 0.0002772882580757141, 0.00030381977558135986, 0.0003303512930870056, 0.00035688281059265137, 0.0003834143280982971, 0.00040994584560394287, 0.0004364773631095886, 0.0004630088806152344, 0.0004895403981208801, 0.0005160719156265259, 0.0005426034331321716, 0.0005691349506378174, 0.0005956664681434631, 0.0006221979856491089, 0.0006487295031547546, 0.0006752610206604004, 0.0007017925381660461, 0.0007283240556716919, 0.0007548555731773376, 0.0007813870906829834, 0.0008079186081886292, 0.0008344501256942749, 0.0008609816431999207, 0.0008875131607055664]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 10.0, 14.0, 16.0, 16.0, 17.0, 23.0, 13.0, 21.0, 25.0, 23.0, 42.0, 29.0, 38.0, 38.0, 43.0, 37.0, 36.0, 39.0, 44.0, 30.0, 47.0, 40.0, 25.0, 41.0, 34.0, 30.0, 24.0, 26.0, 20.0, 22.0, 22.0, 22.0, 12.0, 11.0, 7.0, 16.0, 7.0, 5.0, 4.0, 1.0, 2.0, 5.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.30364990234375, -6.0799560546875, -5.85626220703125, -5.632568359375, -5.40887451171875, -5.1851806640625, -4.96148681640625, -4.73779296875, -4.51409912109375, -4.2904052734375, -4.06671142578125, -3.843017578125, -3.61932373046875, -3.3956298828125, -3.17193603515625, -2.9482421875, -2.72454833984375, -2.5008544921875, -2.27716064453125, -2.053466796875, -1.82977294921875, -1.6060791015625, -1.38238525390625, -1.15869140625, -0.93499755859375, -0.7113037109375, -0.48760986328125, -0.263916015625, -0.04022216796875, 0.1834716796875, 0.40716552734375, 0.630859375, 0.85455322265625, 1.0782470703125, 1.30194091796875, 1.525634765625, 1.74932861328125, 1.9730224609375, 2.19671630859375, 2.42041015625, 2.64410400390625, 2.8677978515625, 3.09149169921875, 3.315185546875, 3.53887939453125, 3.7625732421875, 3.98626708984375, 4.2099609375, 4.43365478515625, 4.6573486328125, 4.88104248046875, 5.104736328125, 5.32843017578125, 5.5521240234375, 5.77581787109375, 5.99951171875, 6.22320556640625, 6.4468994140625, 6.67059326171875, 6.894287109375, 7.11798095703125, 7.3416748046875, 7.56536865234375, 7.7890625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 8.0, 29.0, 20.0, 38.0, 51.0, 78.0, 112.0, 149.0, 202.0, 328.0, 466.0, 885.0, 1562.0, 2837.0, 5641.0, 12122.0, 29697.0, 81469.0, 252799.0, 439947.0, 137187.0, 47649.0, 18381.0, 8036.0, 3850.0, 2084.0, 1100.0, 654.0, 386.0, 242.0, 144.0, 112.0, 76.0, 57.0, 51.0, 22.0, 21.0, 23.0, 11.0, 8.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59375, -4.4117431640625, -4.229736328125, -4.0477294921875, -3.86572265625, -3.6837158203125, -3.501708984375, -3.3197021484375, -3.1376953125, -2.9556884765625, -2.773681640625, -2.5916748046875, -2.40966796875, -2.2276611328125, -2.045654296875, -1.8636474609375, -1.681640625, -1.4996337890625, -1.317626953125, -1.1356201171875, -0.95361328125, -0.7716064453125, -0.589599609375, -0.4075927734375, -0.2255859375, -0.0435791015625, 0.138427734375, 0.3204345703125, 0.50244140625, 0.6844482421875, 0.866455078125, 1.0484619140625, 1.23046875, 1.4124755859375, 1.594482421875, 1.7764892578125, 1.95849609375, 2.1405029296875, 2.322509765625, 2.5045166015625, 2.6865234375, 2.8685302734375, 3.050537109375, 3.2325439453125, 3.41455078125, 3.5965576171875, 3.778564453125, 3.9605712890625, 4.142578125, 4.3245849609375, 4.506591796875, 4.6885986328125, 4.87060546875, 5.0526123046875, 5.234619140625, 5.4166259765625, 5.5986328125, 5.7806396484375, 5.962646484375, 6.1446533203125, 6.32666015625, 6.5086669921875, 6.690673828125, 6.8726806640625, 7.0546875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 2.0, 6.0, 8.0, 4.0, 9.0, 23.0, 11.0, 20.0, 32.0, 15.0, 30.0, 28.0, 39.0, 39.0, 42.0, 59.0, 59.0, 66.0, 121.0, 1463.0, 404.0, 129.0, 63.0, 50.0, 45.0, 40.0, 30.0, 35.0, 33.0, 20.0, 23.0, 26.0, 23.0, 11.0, 9.0, 6.0, 5.0, 8.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.171875, -22.34375, -21.515625, -20.6875, -19.859375, -19.03125, -18.203125, -17.375, -16.546875, -15.71875, -14.890625, -14.0625, -13.234375, -12.40625, -11.578125, -10.75, -9.921875, -9.09375, -8.265625, -7.4375, -6.609375, -5.78125, -4.953125, -4.125, -3.296875, -2.46875, -1.640625, -0.8125, 0.015625, 0.84375, 1.671875, 2.5, 3.328125, 4.15625, 4.984375, 5.8125, 6.640625, 7.46875, 8.296875, 9.125, 9.953125, 10.78125, 11.609375, 12.4375, 13.265625, 14.09375, 14.921875, 15.75, 16.578125, 17.40625, 18.234375, 19.0625, 19.890625, 20.71875, 21.546875, 22.375, 23.203125, 24.03125, 24.859375, 25.6875, 26.515625, 27.34375, 28.171875, 29.0, 29.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 15.0, 23.0, 38.0, 50.0, 68.0, 108.0, 161.0, 310.0, 581.0, 3460.0, 3129814.0, 9328.0, 791.0, 376.0, 191.0, 129.0, 76.0, 66.0, 41.0, 26.0, 16.0, 9.0, 7.0, 8.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.625, -115.3837890625, -112.142578125, -108.9013671875, -105.66015625, -102.4189453125, -99.177734375, -95.9365234375, -92.6953125, -89.4541015625, -86.212890625, -82.9716796875, -79.73046875, -76.4892578125, -73.248046875, -70.0068359375, -66.765625, -63.5244140625, -60.283203125, -57.0419921875, -53.80078125, -50.5595703125, -47.318359375, -44.0771484375, -40.8359375, -37.5947265625, -34.353515625, -31.1123046875, -27.87109375, -24.6298828125, -21.388671875, -18.1474609375, -14.90625, -11.6650390625, -8.423828125, -5.1826171875, -1.94140625, 1.2998046875, 4.541015625, 7.7822265625, 11.0234375, 14.2646484375, 17.505859375, 20.7470703125, 23.98828125, 27.2294921875, 30.470703125, 33.7119140625, 36.953125, 40.1943359375, 43.435546875, 46.6767578125, 49.91796875, 53.1591796875, 56.400390625, 59.6416015625, 62.8828125, 66.1240234375, 69.365234375, 72.6064453125, 75.84765625, 79.0888671875, 82.330078125, 85.5712890625, 88.8125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 608.0, 400.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-446.26690673828125, -437.6774597167969, -429.0880126953125, -420.49859619140625, -411.9091491699219, -403.3197021484375, -394.7302551269531, -386.14080810546875, -377.5513916015625, -368.9619445800781, -360.37249755859375, -351.7830810546875, -343.1936340332031, -334.60418701171875, -326.0147399902344, -317.42529296875, -308.83587646484375, -300.2464294433594, -291.656982421875, -283.06756591796875, -274.4781188964844, -265.888671875, -257.2992248535156, -248.7097930908203, -240.12033081054688, -231.5308837890625, -222.9414520263672, -214.3520050048828, -205.7625732421875, -197.17312622070312, -188.58367919921875, -179.99424743652344, -171.40481567382812, -162.81536865234375, -154.22593688964844, -145.63648986816406, -137.04705810546875, -128.45761108398438, -119.86817169189453, -111.27873229980469, -102.68930053710938, -94.09986114501953, -85.51042175292969, -76.92097473144531, -68.33154296875, -59.74209976196289, -51.15265655517578, -42.56321716308594, -33.973777770996094, -25.38433837890625, -16.794897079467773, -8.205455780029297, 0.3839836120605469, 8.97342300415039, 17.5628662109375, 26.152305603027344, 34.74174499511719, 43.33118438720703, 51.920623779296875, 60.510066986083984, 69.09950256347656, 77.68894958496094, 86.27838897705078, 94.86782836914062, 103.45726776123047]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 6.0, 7.0, 10.0, 16.0, 17.0, 13.0, 21.0, 29.0, 25.0, 35.0, 37.0, 29.0, 36.0, 43.0, 33.0, 30.0, 51.0, 53.0, 45.0, 47.0, 41.0, 45.0, 33.0, 30.0, 39.0, 26.0, 31.0, 20.0, 29.0, 23.0, 14.0, 14.0, 6.0, 17.0, 8.0, 12.0, 5.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.63656616210938, -71.29840087890625, -68.96024322509766, -66.62207794189453, -64.2839126586914, -61.94575500488281, -59.60758972167969, -57.26942825317383, -54.93126678466797, -52.59310531616211, -50.254940032958984, -47.916778564453125, -45.578617095947266, -43.240455627441406, -40.90229034423828, -38.56412887573242, -36.2259635925293, -33.88780212402344, -31.549638748168945, -29.211475372314453, -26.873313903808594, -24.5351505279541, -22.19698715209961, -19.85882568359375, -17.520662307739258, -15.182499885559082, -12.844337463378906, -10.506174087524414, -8.168011665344238, -5.8298492431640625, -3.4916858673095703, -1.153524398803711, 1.1846389770507812, 3.522801637649536, 5.860964298248291, 8.199127197265625, 10.5372896194458, 12.875452041625977, 15.213615417480469, 17.551776885986328, 19.88994026184082, 22.228103637695312, 24.566265106201172, 26.904428482055664, 29.242591857910156, 31.580753326416016, 33.918914794921875, 36.257080078125, 38.59524154663086, 40.93340301513672, 43.271568298339844, 45.6097297668457, 47.94789123535156, 50.28605651855469, 52.62421798706055, 54.962379455566406, 57.30054473876953, 59.63870620727539, 61.976871490478516, 64.31503295898438, 66.6531982421875, 68.9913558959961, 71.32952117919922, 73.66767883300781, 76.00584411621094]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 8.0, 9.0, 13.0, 17.0, 18.0, 17.0, 19.0, 16.0, 24.0, 33.0, 39.0, 24.0, 45.0, 38.0, 32.0, 30.0, 42.0, 43.0, 41.0, 26.0, 39.0, 32.0, 27.0, 44.0, 31.0, 27.0, 34.0, 25.0, 21.0, 27.0, 16.0, 30.0, 14.0, 15.0, 15.0, 14.0, 12.0, 4.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91796875, -6.6854248046875, -6.452880859375, -6.2203369140625, -5.98779296875, -5.7552490234375, -5.522705078125, -5.2901611328125, -5.0576171875, -4.8250732421875, -4.592529296875, -4.3599853515625, -4.12744140625, -3.8948974609375, -3.662353515625, -3.4298095703125, -3.197265625, -2.9647216796875, -2.732177734375, -2.4996337890625, -2.26708984375, -2.0345458984375, -1.802001953125, -1.5694580078125, -1.3369140625, -1.1043701171875, -0.871826171875, -0.6392822265625, -0.40673828125, -0.1741943359375, 0.058349609375, 0.2908935546875, 0.5234375, 0.7559814453125, 0.988525390625, 1.2210693359375, 1.45361328125, 1.6861572265625, 1.918701171875, 2.1512451171875, 2.3837890625, 2.6163330078125, 2.848876953125, 3.0814208984375, 3.31396484375, 3.5465087890625, 3.779052734375, 4.0115966796875, 4.244140625, 4.4766845703125, 4.709228515625, 4.9417724609375, 5.17431640625, 5.4068603515625, 5.639404296875, 5.8719482421875, 6.1044921875, 6.3370361328125, 6.569580078125, 6.8021240234375, 7.03466796875, 7.2672119140625, 7.499755859375, 7.7322998046875, 7.96484375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 12.0, 5.0, 7.0, 8.0, 13.0, 15.0, 17.0, 25.0, 11.0, 27.0, 31.0, 38.0, 25.0, 33.0, 57.0, 91.0, 301.0, 1151.0, 6002.0, 100222.0, 2837205.0, 1218902.0, 25788.0, 2915.0, 740.0, 223.0, 87.0, 51.0, 33.0, 34.0, 20.0, 33.0, 16.0, 19.0, 23.0, 14.0, 21.0, 9.0, 12.0, 10.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-25.734375, -24.899169921875, -24.06396484375, -23.228759765625, -22.3935546875, -21.558349609375, -20.72314453125, -19.887939453125, -19.052734375, -18.217529296875, -17.38232421875, -16.547119140625, -15.7119140625, -14.876708984375, -14.04150390625, -13.206298828125, -12.37109375, -11.535888671875, -10.70068359375, -9.865478515625, -9.0302734375, -8.195068359375, -7.35986328125, -6.524658203125, -5.689453125, -4.854248046875, -4.01904296875, -3.183837890625, -2.3486328125, -1.513427734375, -0.67822265625, 0.156982421875, 0.9921875, 1.827392578125, 2.66259765625, 3.497802734375, 4.3330078125, 5.168212890625, 6.00341796875, 6.838623046875, 7.673828125, 8.509033203125, 9.34423828125, 10.179443359375, 11.0146484375, 11.849853515625, 12.68505859375, 13.520263671875, 14.35546875, 15.190673828125, 16.02587890625, 16.861083984375, 17.6962890625, 18.531494140625, 19.36669921875, 20.201904296875, 21.037109375, 21.872314453125, 22.70751953125, 23.542724609375, 24.3779296875, 25.213134765625, 26.04833984375, 26.883544921875, 27.71875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 14.0, 11.0, 15.0, 9.0, 28.0, 34.0, 43.0, 46.0, 68.0, 94.0, 107.0, 182.0, 228.0, 336.0, 396.0, 493.0, 483.0, 384.0, 298.0, 217.0, 150.0, 105.0, 85.0, 83.0, 53.0, 38.0, 16.0, 18.0, 14.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.53125, -12.026123046875, -11.52099609375, -11.015869140625, -10.5107421875, -10.005615234375, -9.50048828125, -8.995361328125, -8.490234375, -7.985107421875, -7.47998046875, -6.974853515625, -6.4697265625, -5.964599609375, -5.45947265625, -4.954345703125, -4.44921875, -3.944091796875, -3.43896484375, -2.933837890625, -2.4287109375, -1.923583984375, -1.41845703125, -0.913330078125, -0.408203125, 0.096923828125, 0.60205078125, 1.107177734375, 1.6123046875, 2.117431640625, 2.62255859375, 3.127685546875, 3.6328125, 4.137939453125, 4.64306640625, 5.148193359375, 5.6533203125, 6.158447265625, 6.66357421875, 7.168701171875, 7.673828125, 8.178955078125, 8.68408203125, 9.189208984375, 9.6943359375, 10.199462890625, 10.70458984375, 11.209716796875, 11.71484375, 12.219970703125, 12.72509765625, 13.230224609375, 13.7353515625, 14.240478515625, 14.74560546875, 15.250732421875, 15.755859375, 16.260986328125, 16.76611328125, 17.271240234375, 17.7763671875, 18.281494140625, 18.78662109375, 19.291748046875, 19.796875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 8.0, 3.0, 7.0, 7.0, 13.0, 18.0, 21.0, 31.0, 46.0, 64.0, 70.0, 105.0, 134.0, 175.0, 233.0, 334.0, 614.0, 2358.0, 482984.0, 3697316.0, 7537.0, 829.0, 377.0, 249.0, 166.0, 131.0, 89.0, 86.0, 57.0, 53.0, 37.0, 26.0, 25.0, 32.0, 9.0, 9.0, 15.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -66.591796875, -64.30859375, -62.025390625, -59.7421875, -57.458984375, -55.17578125, -52.892578125, -50.609375, -48.326171875, -46.04296875, -43.759765625, -41.4765625, -39.193359375, -36.91015625, -34.626953125, -32.34375, -30.060546875, -27.77734375, -25.494140625, -23.2109375, -20.927734375, -18.64453125, -16.361328125, -14.078125, -11.794921875, -9.51171875, -7.228515625, -4.9453125, -2.662109375, -0.37890625, 1.904296875, 4.1875, 6.470703125, 8.75390625, 11.037109375, 13.3203125, 15.603515625, 17.88671875, 20.169921875, 22.453125, 24.736328125, 27.01953125, 29.302734375, 31.5859375, 33.869140625, 36.15234375, 38.435546875, 40.71875, 43.001953125, 45.28515625, 47.568359375, 49.8515625, 52.134765625, 54.41796875, 56.701171875, 58.984375, 61.267578125, 63.55078125, 65.833984375, 68.1171875, 70.400390625, 72.68359375, 74.966796875, 77.25]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 10.0, 47.0, 84.0, 179.0, 228.0, 195.0, 146.0, 70.0, 24.0, 12.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.67079162597656, -94.01847076416016, -90.36614990234375, -86.71383666992188, -83.06151580810547, -79.40919494628906, -75.75687408447266, -72.10455322265625, -68.45223236083984, -64.79991149902344, -61.1475944519043, -57.49527359008789, -53.842952728271484, -50.190635681152344, -46.53831481933594, -42.88599395751953, -39.23367691040039, -35.581356048583984, -31.92903709411621, -28.276718139648438, -24.62439727783203, -20.972078323364258, -17.319759368896484, -13.667438507080078, -10.015119552612305, -6.362799644470215, -2.710480213165283, 0.9418392181396484, 4.594159126281738, 8.246479034423828, 11.898797988891602, 15.551118850708008, 19.20343780517578, 22.855756759643555, 26.50807762145996, 30.160396575927734, 33.81271743774414, 37.46503448486328, 41.11735534667969, 44.769676208496094, 48.4219970703125, 52.074317932128906, 55.72663497924805, 59.37895584106445, 63.03127670288086, 66.68359375, 70.3359146118164, 73.98823547363281, 77.64054870605469, 81.2928695678711, 84.9451904296875, 88.59750366210938, 92.24982452392578, 95.90214538574219, 99.5544662475586, 103.206787109375, 106.8591079711914, 110.51142883300781, 114.16374969482422, 117.81607055664062, 121.4683837890625, 125.1207046508789, 128.7730255126953, 132.42535400390625, 136.07766723632812]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 2.0, 7.0, 8.0, 6.0, 9.0, 8.0, 14.0, 14.0, 19.0, 25.0, 18.0, 22.0, 19.0, 27.0, 21.0, 30.0, 25.0, 32.0, 21.0, 41.0, 40.0, 38.0, 46.0, 34.0, 39.0, 35.0, 37.0, 30.0, 28.0, 31.0, 29.0, 25.0, 27.0, 26.0, 23.0, 16.0, 27.0, 15.0, 10.0, 11.0, 11.0, 14.0, 6.0, 5.0, 6.0, 5.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-44.66520309448242, -43.26557159423828, -41.865936279296875, -40.466304779052734, -39.066673278808594, -37.66703796386719, -36.26740646362305, -34.867774963378906, -33.4681396484375, -32.06850814819336, -30.668874740600586, -29.269241333007812, -27.869609832763672, -26.4699764251709, -25.070343017578125, -23.670711517333984, -22.271080017089844, -20.87144660949707, -19.47181510925293, -18.072181701660156, -16.672550201416016, -15.272916793823242, -13.873283386230469, -12.473650932312012, -11.074018478393555, -9.674386024475098, -8.27475357055664, -6.875120162963867, -5.47548770904541, -4.075855255126953, -2.6762218475341797, -1.2765893936157227, 0.12303924560546875, 1.5226719379425049, 2.922304630279541, 4.321937561035156, 5.721570014953613, 7.12120246887207, 8.520835876464844, 9.9204683303833, 11.320100784301758, 12.719733238220215, 14.119365692138672, 15.518999099731445, 16.91863250732422, 18.31826400756836, 19.717897415161133, 21.117530822753906, 22.517162322998047, 23.91679573059082, 25.31642723083496, 26.716060638427734, 28.115692138671875, 29.51532554626465, 30.914958953857422, 32.31459045410156, 33.71422576904297, 35.11385726928711, 36.513492584228516, 37.913124084472656, 39.3127555847168, 40.71238708496094, 42.112022399902344, 43.511653900146484, 44.911285400390625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 6.0, 5.0, 8.0, 9.0, 11.0, 12.0, 17.0, 12.0, 13.0, 14.0, 30.0, 21.0, 34.0, 40.0, 17.0, 37.0, 39.0, 43.0, 36.0, 42.0, 37.0, 35.0, 44.0, 33.0, 31.0, 30.0, 29.0, 31.0, 37.0, 29.0, 22.0, 22.0, 26.0, 21.0, 16.0, 17.0, 19.0, 17.0, 15.0, 8.0, 8.0, 7.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.73046875, -6.5057373046875, -6.281005859375, -6.0562744140625, -5.83154296875, -5.6068115234375, -5.382080078125, -5.1573486328125, -4.9326171875, -4.7078857421875, -4.483154296875, -4.2584228515625, -4.03369140625, -3.8089599609375, -3.584228515625, -3.3594970703125, -3.134765625, -2.9100341796875, -2.685302734375, -2.4605712890625, -2.23583984375, -2.0111083984375, -1.786376953125, -1.5616455078125, -1.3369140625, -1.1121826171875, -0.887451171875, -0.6627197265625, -0.43798828125, -0.2132568359375, 0.011474609375, 0.2362060546875, 0.4609375, 0.6856689453125, 0.910400390625, 1.1351318359375, 1.35986328125, 1.5845947265625, 1.809326171875, 2.0340576171875, 2.2587890625, 2.4835205078125, 2.708251953125, 2.9329833984375, 3.15771484375, 3.3824462890625, 3.607177734375, 3.8319091796875, 4.056640625, 4.2813720703125, 4.506103515625, 4.7308349609375, 4.95556640625, 5.1802978515625, 5.405029296875, 5.6297607421875, 5.8544921875, 6.0792236328125, 6.303955078125, 6.5286865234375, 6.75341796875, 6.9781494140625, 7.202880859375, 7.4276123046875, 7.65234375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 6.0, 13.0, 13.0, 31.0, 63.0, 80.0, 135.0, 196.0, 282.0, 530.0, 719.0, 1143.0, 1699.0, 2689.0, 3944.0, 5913.0, 8764.0, 13254.0, 20579.0, 31210.0, 47709.0, 72824.0, 111570.0, 180168.0, 194906.0, 121791.0, 78296.0, 51532.0, 33485.0, 21991.0, 14623.0, 9597.0, 6306.0, 4238.0, 2816.0, 1886.0, 1227.0, 822.0, 505.0, 352.0, 235.0, 160.0, 84.0, 56.0, 49.0, 24.0, 14.0, 12.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0028076171875, -0.969482421875, -0.9361572265625, -0.90283203125, -0.8695068359375, -0.836181640625, -0.8028564453125, -0.76953125, -0.7362060546875, -0.702880859375, -0.6695556640625, -0.63623046875, -0.6029052734375, -0.569580078125, -0.5362548828125, -0.5029296875, -0.4696044921875, -0.436279296875, -0.4029541015625, -0.36962890625, -0.3363037109375, -0.302978515625, -0.2696533203125, -0.236328125, -0.2030029296875, -0.169677734375, -0.1363525390625, -0.10302734375, -0.0697021484375, -0.036376953125, -0.0030517578125, 0.0302734375, 0.0635986328125, 0.096923828125, 0.1302490234375, 0.16357421875, 0.1968994140625, 0.230224609375, 0.2635498046875, 0.296875, 0.3302001953125, 0.363525390625, 0.3968505859375, 0.43017578125, 0.4635009765625, 0.496826171875, 0.5301513671875, 0.5634765625, 0.5968017578125, 0.630126953125, 0.6634521484375, 0.69677734375, 0.7301025390625, 0.763427734375, 0.7967529296875, 0.830078125, 0.8634033203125, 0.896728515625, 0.9300537109375, 0.96337890625, 0.9967041015625, 1.030029296875, 1.0633544921875, 1.0966796875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 1.0, 7.0, 9.0, 13.0, 7.0, 7.0, 15.0, 15.0, 17.0, 22.0, 23.0, 34.0, 31.0, 28.0, 31.0, 34.0, 41.0, 39.0, 40.0, 40.0, 45.0, 1068.0, 39.0, 49.0, 32.0, 42.0, 39.0, 34.0, 27.0, 33.0, 21.0, 19.0, 15.0, 18.0, 23.0, 16.0, 13.0, 11.0, 8.0, 11.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.98284912109375, -4.8172607421875, -4.65167236328125, -4.486083984375, -4.32049560546875, -4.1549072265625, -3.98931884765625, -3.82373046875, -3.65814208984375, -3.4925537109375, -3.32696533203125, -3.161376953125, -2.99578857421875, -2.8302001953125, -2.66461181640625, -2.4990234375, -2.33343505859375, -2.1678466796875, -2.00225830078125, -1.836669921875, -1.67108154296875, -1.5054931640625, -1.33990478515625, -1.17431640625, -1.00872802734375, -0.8431396484375, -0.67755126953125, -0.511962890625, -0.34637451171875, -0.1807861328125, -0.01519775390625, 0.150390625, 0.31597900390625, 0.4815673828125, 0.64715576171875, 0.812744140625, 0.97833251953125, 1.1439208984375, 1.30950927734375, 1.47509765625, 1.64068603515625, 1.8062744140625, 1.97186279296875, 2.137451171875, 2.30303955078125, 2.4686279296875, 2.63421630859375, 2.7998046875, 2.96539306640625, 3.1309814453125, 3.29656982421875, 3.462158203125, 3.62774658203125, 3.7933349609375, 3.95892333984375, 4.12451171875, 4.29010009765625, 4.4556884765625, 4.62127685546875, 4.786865234375, 4.95245361328125, 5.1180419921875, 5.28363037109375, 5.44921875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 14.0, 31.0, 38.0, 58.0, 74.0, 125.0, 173.0, 250.0, 349.0, 576.0, 900.0, 1331.0, 2092.0, 3159.0, 4913.0, 7306.0, 11623.0, 17846.0, 27776.0, 44486.0, 70525.0, 111512.0, 176367.0, 1251410.0, 133307.0, 84631.0, 52667.0, 33453.0, 21090.0, 13559.0, 8772.0, 5691.0, 3759.0, 2401.0, 1646.0, 1064.0, 725.0, 463.0, 335.0, 207.0, 138.0, 94.0, 49.0, 45.0, 28.0, 26.0, 9.0, 15.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.048828125, -1.0162506103515625, -0.983673095703125, -0.9510955810546875, -0.91851806640625, -0.8859405517578125, -0.853363037109375, -0.8207855224609375, -0.7882080078125, -0.7556304931640625, -0.723052978515625, -0.6904754638671875, -0.65789794921875, -0.6253204345703125, -0.592742919921875, -0.5601654052734375, -0.527587890625, -0.4950103759765625, -0.462432861328125, -0.4298553466796875, -0.39727783203125, -0.3647003173828125, -0.332122802734375, -0.2995452880859375, -0.2669677734375, -0.2343902587890625, -0.201812744140625, -0.1692352294921875, -0.13665771484375, -0.1040802001953125, -0.071502685546875, -0.0389251708984375, -0.00634765625, 0.0262298583984375, 0.058807373046875, 0.0913848876953125, 0.12396240234375, 0.1565399169921875, 0.189117431640625, 0.2216949462890625, 0.2542724609375, 0.2868499755859375, 0.319427490234375, 0.3520050048828125, 0.38458251953125, 0.4171600341796875, 0.449737548828125, 0.4823150634765625, 0.514892578125, 0.5474700927734375, 0.580047607421875, 0.6126251220703125, 0.64520263671875, 0.6777801513671875, 0.710357666015625, 0.7429351806640625, 0.7755126953125, 0.8080902099609375, 0.840667724609375, 0.8732452392578125, 0.90582275390625, 0.9384002685546875, 0.970977783203125, 1.0035552978515625, 1.0361328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 7.0, 2.0, 5.0, 7.0, 12.0, 12.0, 18.0, 26.0, 23.0, 25.0, 30.0, 50.0, 39.0, 41.0, 59.0, 70.0, 67.0, 80.0, 70.0, 58.0, 58.0, 46.0, 40.0, 34.0, 28.0, 12.0, 15.0, 16.0, 16.0, 13.0, 3.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002178192138671875, -0.0021116137504577637, -0.0020450353622436523, -0.001978456974029541, -0.0019118785858154297, -0.0018453001976013184, -0.001778721809387207, -0.0017121434211730957, -0.0016455650329589844, -0.001578986644744873, -0.0015124082565307617, -0.0014458298683166504, -0.001379251480102539, -0.0013126730918884277, -0.0012460947036743164, -0.001179516315460205, -0.0011129379272460938, -0.0010463595390319824, -0.000979781150817871, -0.0009132027626037598, -0.0008466243743896484, -0.0007800459861755371, -0.0007134675979614258, -0.0006468892097473145, -0.0005803108215332031, -0.0005137324333190918, -0.00044715404510498047, -0.00038057565689086914, -0.0003139972686767578, -0.0002474188804626465, -0.00018084049224853516, -0.00011426210403442383, -4.76837158203125e-05, 1.8894672393798828e-05, 8.547306060791016e-05, 0.00015205144882202148, 0.0002186298370361328, 0.00028520822525024414, 0.00035178661346435547, 0.0004183650016784668, 0.0004849433898925781, 0.0005515217781066895, 0.0006181001663208008, 0.0006846785545349121, 0.0007512569427490234, 0.0008178353309631348, 0.0008844137191772461, 0.0009509921073913574, 0.0010175704956054688, 0.00108414888381958, 0.0011507272720336914, 0.0012173056602478027, 0.001283884048461914, 0.0013504624366760254, 0.0014170408248901367, 0.001483619213104248, 0.0015501976013183594, 0.0016167759895324707, 0.001683354377746582, 0.0017499327659606934, 0.0018165111541748047, 0.001883089542388916, 0.0019496679306030273, 0.0020162463188171387, 0.00208282470703125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 8.0, 10.0, 7.0, 14.0, 14.0, 12.0, 22.0, 30.0, 36.0, 45.0, 66.0, 99.0, 184.0, 419.0, 3466.0, 1039629.0, 3568.0, 390.0, 169.0, 88.0, 66.0, 43.0, 34.0, 35.0, 28.0, 17.0, 14.0, 10.0, 6.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045257568359375, -0.043612003326416016, -0.04196643829345703, -0.04032087326049805, -0.03867530822753906, -0.03702974319458008, -0.035384178161621094, -0.03373861312866211, -0.032093048095703125, -0.03044748306274414, -0.028801918029785156, -0.027156352996826172, -0.025510787963867188, -0.023865222930908203, -0.02221965789794922, -0.020574092864990234, -0.01892852783203125, -0.017282962799072266, -0.01563739776611328, -0.013991832733154297, -0.012346267700195312, -0.010700702667236328, -0.009055137634277344, -0.007409572601318359, -0.005764007568359375, -0.004118442535400391, -0.0024728775024414062, -0.0008273124694824219, 0.0008182525634765625, 0.002463817596435547, 0.004109382629394531, 0.005754947662353516, 0.0074005126953125, 0.009046077728271484, 0.010691642761230469, 0.012337207794189453, 0.013982772827148438, 0.015628337860107422, 0.017273902893066406, 0.01891946792602539, 0.020565032958984375, 0.02221059799194336, 0.023856163024902344, 0.025501728057861328, 0.027147293090820312, 0.028792858123779297, 0.03043842315673828, 0.032083988189697266, 0.03372955322265625, 0.035375118255615234, 0.03702068328857422, 0.0386662483215332, 0.04031181335449219, 0.04195737838745117, 0.043602943420410156, 0.04524850845336914, 0.046894073486328125, 0.04853963851928711, 0.050185203552246094, 0.05183076858520508, 0.05347633361816406, 0.05512189865112305, 0.05676746368408203, 0.058413028717041016, 0.06005859375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 14.0, 35.0, 103.0, 228.0, 309.0, 198.0, 84.0, 33.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004105939995497465, -0.004026070237159729, -0.003946200478821993, -0.0038663307204842567, -0.0037864609621465206, -0.0037065912038087845, -0.0036267214454710484, -0.0035468516871333122, -0.003466981928795576, -0.00338711217045784, -0.003307242412120104, -0.0032273726537823677, -0.0031475028954446316, -0.0030676331371068954, -0.0029877633787691593, -0.002907893620431423, -0.0028280240949243307, -0.0027481543365865946, -0.0026682845782488585, -0.0025884148199111223, -0.002508545061573386, -0.00242867530323565, -0.002348805544897914, -0.0022689360193908215, -0.0021890662610530853, -0.002109196502715349, -0.002029326744377613, -0.001949456986039877, -0.0018695872277021408, -0.0017897174693644047, -0.0017098478274419904, -0.0016299780691042542, -0.0015501080779358745, -0.0014702383195981383, -0.0013903685612604022, -0.001310498802922666, -0.0012306291610002518, -0.0011507594026625156, -0.0010708896443247795, -0.0009910198859870434, -0.0009111501276493073, -0.0008312803693115711, -0.000751410610973835, -0.0006715409108437598, -0.0005916711525060236, -0.0005118013941682875, -0.00043193166493438184, -0.00035206193570047617, -0.00027219217736274004, -0.00019232243357691914, -0.00011245268979109824, -3.2582946005277336e-05, 4.7286797780543566e-05, 0.0001271565561182797, 0.00020702628535218537, 0.00028689601458609104, 0.00036676577292382717, 0.0004466355312615633, 0.0005265052895992994, 0.0006063749897293746, 0.0006862447480671108, 0.0007661145064048469, 0.0008459842065349221, 0.0009258539648726583, 0.0010057237232103944]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 6.0, 7.0, 4.0, 8.0, 7.0, 16.0, 9.0, 15.0, 17.0, 11.0, 25.0, 20.0, 21.0, 37.0, 32.0, 26.0, 46.0, 32.0, 33.0, 38.0, 49.0, 37.0, 31.0, 36.0, 36.0, 34.0, 35.0, 41.0, 37.0, 29.0, 31.0, 24.0, 27.0, 19.0, 20.0, 16.0, 12.0, 11.0, 12.0, 11.0, 13.0, 6.0, 9.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008845329284667969, -0.0008559860289096832, -0.0008274391293525696, -0.0007988922297954559, -0.0007703453302383423, -0.0007417984306812286, -0.000713251531124115, -0.0006847046315670013, -0.0006561577320098877, -0.000627610832452774, -0.0005990639328956604, -0.0005705170333385468, -0.0005419701337814331, -0.0005134232342243195, -0.0004848763346672058, -0.00045632943511009216, -0.0004277825355529785, -0.00039923563599586487, -0.0003706887364387512, -0.0003421418368816376, -0.0003135949373245239, -0.0002850480377674103, -0.00025650113821029663, -0.00022795423865318298, -0.00019940733909606934, -0.0001708604395389557, -0.00014231353998184204, -0.0001137666404247284, -8.521974086761475e-05, -5.66728413105011e-05, -2.812594175338745e-05, 4.209578037261963e-07, 2.8967857360839844e-05, 5.751475691795349e-05, 8.606165647506714e-05, 0.00011460855603218079, 0.00014315545558929443, 0.00017170235514640808, 0.00020024925470352173, 0.00022879615426063538, 0.000257343053817749, 0.00028588995337486267, 0.0003144368529319763, 0.00034298375248908997, 0.0003715306520462036, 0.00040007755160331726, 0.0004286244511604309, 0.00045717135071754456, 0.0004857182502746582, 0.0005142651498317719, 0.0005428120493888855, 0.0005713589489459991, 0.0005999058485031128, 0.0006284527480602264, 0.0006569996476173401, 0.0006855465471744537, 0.0007140934467315674, 0.000742640346288681, 0.0007711872458457947, 0.0007997341454029083, 0.000828281044960022, 0.0008568279445171356, 0.0008853748440742493, 0.0009139217436313629, 0.0009424686431884766]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 6.0, 5.0, 8.0, 9.0, 11.0, 12.0, 17.0, 12.0, 13.0, 14.0, 30.0, 21.0, 34.0, 40.0, 17.0, 37.0, 39.0, 43.0, 36.0, 42.0, 37.0, 35.0, 44.0, 33.0, 31.0, 30.0, 29.0, 31.0, 37.0, 29.0, 22.0, 22.0, 26.0, 21.0, 17.0, 16.0, 19.0, 17.0, 15.0, 8.0, 7.0, 8.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.73046875, -6.5057373046875, -6.281005859375, -6.0562744140625, -5.83154296875, -5.6068115234375, -5.382080078125, -5.1573486328125, -4.9326171875, -4.7078857421875, -4.483154296875, -4.2584228515625, -4.03369140625, -3.8089599609375, -3.584228515625, -3.3594970703125, -3.134765625, -2.9100341796875, -2.685302734375, -2.4605712890625, -2.23583984375, -2.0111083984375, -1.786376953125, -1.5616455078125, -1.3369140625, -1.1121826171875, -0.887451171875, -0.6627197265625, -0.43798828125, -0.2132568359375, 0.011474609375, 0.2362060546875, 0.4609375, 0.6856689453125, 0.910400390625, 1.1351318359375, 1.35986328125, 1.5845947265625, 1.809326171875, 2.0340576171875, 2.2587890625, 2.4835205078125, 2.708251953125, 2.9329833984375, 3.15771484375, 3.3824462890625, 3.607177734375, 3.8319091796875, 4.056640625, 4.2813720703125, 4.506103515625, 4.7308349609375, 4.95556640625, 5.1802978515625, 5.405029296875, 5.6297607421875, 5.8544921875, 6.0792236328125, 6.303955078125, 6.5286865234375, 6.75341796875, 6.9781494140625, 7.202880859375, 7.4276123046875, 7.65234375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 16.0, 15.0, 17.0, 40.0, 45.0, 61.0, 81.0, 109.0, 135.0, 193.0, 284.0, 427.0, 632.0, 997.0, 1807.0, 3298.0, 6005.0, 12248.0, 26092.0, 61734.0, 165667.0, 399695.0, 223175.0, 80697.0, 33321.0, 14836.0, 7340.0, 3862.0, 2121.0, 1256.0, 732.0, 469.0, 347.0, 208.0, 163.0, 104.0, 80.0, 68.0, 38.0, 32.0, 24.0, 22.0, 13.0, 14.0, 12.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.45599365234375, -4.2947998046875, -4.13360595703125, -3.972412109375, -3.81121826171875, -3.6500244140625, -3.48883056640625, -3.32763671875, -3.16644287109375, -3.0052490234375, -2.84405517578125, -2.682861328125, -2.52166748046875, -2.3604736328125, -2.19927978515625, -2.0380859375, -1.87689208984375, -1.7156982421875, -1.55450439453125, -1.393310546875, -1.23211669921875, -1.0709228515625, -0.90972900390625, -0.74853515625, -0.58734130859375, -0.4261474609375, -0.26495361328125, -0.103759765625, 0.05743408203125, 0.2186279296875, 0.37982177734375, 0.541015625, 0.70220947265625, 0.8634033203125, 1.02459716796875, 1.185791015625, 1.34698486328125, 1.5081787109375, 1.66937255859375, 1.83056640625, 1.99176025390625, 2.1529541015625, 2.31414794921875, 2.475341796875, 2.63653564453125, 2.7977294921875, 2.95892333984375, 3.1201171875, 3.28131103515625, 3.4425048828125, 3.60369873046875, 3.764892578125, 3.92608642578125, 4.0872802734375, 4.24847412109375, 4.40966796875, 4.57086181640625, 4.7320556640625, 4.89324951171875, 5.054443359375, 5.21563720703125, 5.3768310546875, 5.53802490234375, 5.69921875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 6.0, 6.0, 11.0, 9.0, 15.0, 13.0, 18.0, 16.0, 19.0, 21.0, 16.0, 25.0, 30.0, 28.0, 35.0, 37.0, 49.0, 67.0, 75.0, 242.0, 1632.0, 147.0, 70.0, 60.0, 42.0, 37.0, 38.0, 29.0, 40.0, 29.0, 30.0, 19.0, 12.0, 18.0, 23.0, 13.0, 9.0, 7.0, 9.0, 13.0, 6.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.84375, -21.146484375, -20.44921875, -19.751953125, -19.0546875, -18.357421875, -17.66015625, -16.962890625, -16.265625, -15.568359375, -14.87109375, -14.173828125, -13.4765625, -12.779296875, -12.08203125, -11.384765625, -10.6875, -9.990234375, -9.29296875, -8.595703125, -7.8984375, -7.201171875, -6.50390625, -5.806640625, -5.109375, -4.412109375, -3.71484375, -3.017578125, -2.3203125, -1.623046875, -0.92578125, -0.228515625, 0.46875, 1.166015625, 1.86328125, 2.560546875, 3.2578125, 3.955078125, 4.65234375, 5.349609375, 6.046875, 6.744140625, 7.44140625, 8.138671875, 8.8359375, 9.533203125, 10.23046875, 10.927734375, 11.625, 12.322265625, 13.01953125, 13.716796875, 14.4140625, 15.111328125, 15.80859375, 16.505859375, 17.203125, 17.900390625, 18.59765625, 19.294921875, 19.9921875, 20.689453125, 21.38671875, 22.083984375, 22.78125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 9.0, 3.0, 0.0, 10.0, 15.0, 7.0, 17.0, 30.0, 39.0, 45.0, 70.0, 70.0, 136.0, 173.0, 236.0, 366.0, 676.0, 7416.0, 3113837.0, 20469.0, 821.0, 376.0, 246.0, 164.0, 108.0, 89.0, 78.0, 48.0, 39.0, 26.0, 19.0, 16.0, 14.0, 8.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.5361328125, -62.197265625, -59.8583984375, -57.51953125, -55.1806640625, -52.841796875, -50.5029296875, -48.1640625, -45.8251953125, -43.486328125, -41.1474609375, -38.80859375, -36.4697265625, -34.130859375, -31.7919921875, -29.453125, -27.1142578125, -24.775390625, -22.4365234375, -20.09765625, -17.7587890625, -15.419921875, -13.0810546875, -10.7421875, -8.4033203125, -6.064453125, -3.7255859375, -1.38671875, 0.9521484375, 3.291015625, 5.6298828125, 7.96875, 10.3076171875, 12.646484375, 14.9853515625, 17.32421875, 19.6630859375, 22.001953125, 24.3408203125, 26.6796875, 29.0185546875, 31.357421875, 33.6962890625, 36.03515625, 38.3740234375, 40.712890625, 43.0517578125, 45.390625, 47.7294921875, 50.068359375, 52.4072265625, 54.74609375, 57.0849609375, 59.423828125, 61.7626953125, 64.1015625, 66.4404296875, 68.779296875, 71.1181640625, 73.45703125, 75.7958984375, 78.134765625, 80.4736328125, 82.8125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 29.0, 815.0, 172.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.58217430114746, -12.40479850769043, -5.227422714233398, 1.9499530792236328, 9.127328872680664, 16.304704666137695, 23.482080459594727, 30.659456253051758, 37.836830139160156, 45.01420593261719, 52.19158172607422, 59.36895751953125, 66.54633331298828, 73.72370910644531, 80.90108489990234, 88.07846069335938, 95.2558364868164, 102.43321228027344, 109.61058807373047, 116.7879638671875, 123.96533966064453, 131.14271545410156, 138.32009887695312, 145.49746704101562, 152.6748504638672, 159.85223388671875, 167.02960205078125, 174.20697021484375, 181.3843536376953, 188.56173706054688, 195.73910522460938, 202.91647338867188, 210.09384155273438, 217.27120971679688, 224.44859313964844, 231.6259765625, 238.8033447265625, 245.980712890625, 253.15809631347656, 260.3354797363281, 267.5128479003906, 274.6902160644531, 281.86761474609375, 289.04498291015625, 296.22235107421875, 303.39971923828125, 310.57708740234375, 317.7544860839844, 324.9318542480469, 332.1092224121094, 339.28662109375, 346.4639892578125, 353.641357421875, 360.8187255859375, 367.99609375, 375.1734924316406, 382.3508605957031, 389.5282287597656, 396.70562744140625, 403.88299560546875, 411.06036376953125, 418.23773193359375, 425.41510009765625, 432.5924987792969, 439.7698669433594]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 9.0, 7.0, 9.0, 8.0, 13.0, 13.0, 14.0, 21.0, 16.0, 25.0, 25.0, 35.0, 35.0, 43.0, 39.0, 55.0, 44.0, 42.0, 51.0, 57.0, 36.0, 47.0, 34.0, 40.0, 37.0, 34.0, 42.0, 29.0, 31.0, 17.0, 19.0, 13.0, 20.0, 10.0, 5.0, 4.0, 10.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-76.5431900024414, -74.22920989990234, -71.91523742675781, -69.60125732421875, -67.28728485107422, -64.97330474853516, -62.659332275390625, -60.34535217285156, -58.03137969970703, -55.717403411865234, -53.40342712402344, -51.08945083618164, -48.775474548339844, -46.46149826049805, -44.14752197265625, -41.83354187011719, -39.51956558227539, -37.205589294433594, -34.8916130065918, -32.57763671875, -30.263660430908203, -27.949684143066406, -25.635705947875977, -23.32172966003418, -21.007753372192383, -18.693777084350586, -16.37980079650879, -14.065823554992676, -11.751847267150879, -9.437870979309082, -7.123893737792969, -4.809917449951172, -2.495941162109375, -0.18196463584899902, 2.132011890411377, 4.445988655090332, 6.759964942932129, 9.073941230773926, 11.387918472290039, 13.701894760131836, 16.015871047973633, 18.32984733581543, 20.643823623657227, 22.957801818847656, 25.271778106689453, 27.58575439453125, 29.899730682373047, 32.213706970214844, 34.52768325805664, 36.84165954589844, 39.155635833740234, 41.46961212158203, 43.78358840942383, 46.097564697265625, 48.41154479980469, 50.72551727294922, 53.03949737548828, 55.35347366333008, 57.667449951171875, 59.98142623901367, 62.29540252685547, 64.60938262939453, 66.92335510253906, 69.23733520507812, 71.55130767822266]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 11.0, 8.0, 9.0, 11.0, 13.0, 8.0, 15.0, 16.0, 13.0, 20.0, 20.0, 37.0, 25.0, 39.0, 32.0, 29.0, 41.0, 35.0, 51.0, 29.0, 43.0, 38.0, 34.0, 35.0, 33.0, 29.0, 30.0, 26.0, 27.0, 35.0, 23.0, 23.0, 16.0, 15.0, 18.0, 21.0, 14.0, 11.0, 11.0, 16.0, 6.0, 5.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.92578125, -6.697021484375, -6.46826171875, -6.239501953125, -6.0107421875, -5.781982421875, -5.55322265625, -5.324462890625, -5.095703125, -4.866943359375, -4.63818359375, -4.409423828125, -4.1806640625, -3.951904296875, -3.72314453125, -3.494384765625, -3.265625, -3.036865234375, -2.80810546875, -2.579345703125, -2.3505859375, -2.121826171875, -1.89306640625, -1.664306640625, -1.435546875, -1.206787109375, -0.97802734375, -0.749267578125, -0.5205078125, -0.291748046875, -0.06298828125, 0.165771484375, 0.39453125, 0.623291015625, 0.85205078125, 1.080810546875, 1.3095703125, 1.538330078125, 1.76708984375, 1.995849609375, 2.224609375, 2.453369140625, 2.68212890625, 2.910888671875, 3.1396484375, 3.368408203125, 3.59716796875, 3.825927734375, 4.0546875, 4.283447265625, 4.51220703125, 4.740966796875, 4.9697265625, 5.198486328125, 5.42724609375, 5.656005859375, 5.884765625, 6.113525390625, 6.34228515625, 6.571044921875, 6.7998046875, 7.028564453125, 7.25732421875, 7.486083984375, 7.71484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 9.0, 9.0, 16.0, 7.0, 11.0, 12.0, 17.0, 13.0, 22.0, 23.0, 32.0, 46.0, 67.0, 115.0, 186.0, 369.0, 882.0, 2690.0, 11395.0, 134189.0, 2009562.0, 1911760.0, 108268.0, 10255.0, 2486.0, 841.0, 355.0, 197.0, 115.0, 65.0, 40.0, 36.0, 31.0, 23.0, 17.0, 17.0, 10.0, 16.0, 17.0, 9.0, 9.0, 12.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.75, -18.12451171875, -17.4990234375, -16.87353515625, -16.248046875, -15.62255859375, -14.9970703125, -14.37158203125, -13.74609375, -13.12060546875, -12.4951171875, -11.86962890625, -11.244140625, -10.61865234375, -9.9931640625, -9.36767578125, -8.7421875, -8.11669921875, -7.4912109375, -6.86572265625, -6.240234375, -5.61474609375, -4.9892578125, -4.36376953125, -3.73828125, -3.11279296875, -2.4873046875, -1.86181640625, -1.236328125, -0.61083984375, 0.0146484375, 0.64013671875, 1.265625, 1.89111328125, 2.5166015625, 3.14208984375, 3.767578125, 4.39306640625, 5.0185546875, 5.64404296875, 6.26953125, 6.89501953125, 7.5205078125, 8.14599609375, 8.771484375, 9.39697265625, 10.0224609375, 10.64794921875, 11.2734375, 11.89892578125, 12.5244140625, 13.14990234375, 13.775390625, 14.40087890625, 15.0263671875, 15.65185546875, 16.27734375, 16.90283203125, 17.5283203125, 18.15380859375, 18.779296875, 19.40478515625, 20.0302734375, 20.65576171875, 21.28125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 7.0, 16.0, 5.0, 17.0, 24.0, 23.0, 35.0, 37.0, 44.0, 68.0, 80.0, 115.0, 133.0, 176.0, 215.0, 257.0, 344.0, 402.0, 358.0, 372.0, 304.0, 226.0, 187.0, 137.0, 92.0, 81.0, 62.0, 50.0, 54.0, 32.0, 28.0, 22.0, 17.0, 16.0, 8.0, 7.0, 9.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.2791748046875, -9.870849609375, -9.4625244140625, -9.05419921875, -8.6458740234375, -8.237548828125, -7.8292236328125, -7.4208984375, -7.0125732421875, -6.604248046875, -6.1959228515625, -5.78759765625, -5.3792724609375, -4.970947265625, -4.5626220703125, -4.154296875, -3.7459716796875, -3.337646484375, -2.9293212890625, -2.52099609375, -2.1126708984375, -1.704345703125, -1.2960205078125, -0.8876953125, -0.4793701171875, -0.071044921875, 0.3372802734375, 0.74560546875, 1.1539306640625, 1.562255859375, 1.9705810546875, 2.37890625, 2.7872314453125, 3.195556640625, 3.6038818359375, 4.01220703125, 4.4205322265625, 4.828857421875, 5.2371826171875, 5.6455078125, 6.0538330078125, 6.462158203125, 6.8704833984375, 7.27880859375, 7.6871337890625, 8.095458984375, 8.5037841796875, 8.912109375, 9.3204345703125, 9.728759765625, 10.1370849609375, 10.54541015625, 10.9537353515625, 11.362060546875, 11.7703857421875, 12.1787109375, 12.5870361328125, 12.995361328125, 13.4036865234375, 13.81201171875, 14.2203369140625, 14.628662109375, 15.0369873046875, 15.4453125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 11.0, 10.0, 9.0, 10.0, 28.0, 27.0, 34.0, 41.0, 52.0, 70.0, 80.0, 128.0, 121.0, 190.0, 260.0, 416.0, 923.0, 46247.0, 4109348.0, 33803.0, 820.0, 475.0, 288.0, 218.0, 155.0, 115.0, 83.0, 61.0, 62.0, 50.0, 20.0, 34.0, 28.0, 9.0, 15.0, 7.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-74.625, -72.3271484375, -70.029296875, -67.7314453125, -65.43359375, -63.1357421875, -60.837890625, -58.5400390625, -56.2421875, -53.9443359375, -51.646484375, -49.3486328125, -47.05078125, -44.7529296875, -42.455078125, -40.1572265625, -37.859375, -35.5615234375, -33.263671875, -30.9658203125, -28.66796875, -26.3701171875, -24.072265625, -21.7744140625, -19.4765625, -17.1787109375, -14.880859375, -12.5830078125, -10.28515625, -7.9873046875, -5.689453125, -3.3916015625, -1.09375, 1.2041015625, 3.501953125, 5.7998046875, 8.09765625, 10.3955078125, 12.693359375, 14.9912109375, 17.2890625, 19.5869140625, 21.884765625, 24.1826171875, 26.48046875, 28.7783203125, 31.076171875, 33.3740234375, 35.671875, 37.9697265625, 40.267578125, 42.5654296875, 44.86328125, 47.1611328125, 49.458984375, 51.7568359375, 54.0546875, 56.3525390625, 58.650390625, 60.9482421875, 63.24609375, 65.5439453125, 67.841796875, 70.1396484375, 72.4375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 31.0, 89.0, 213.0, 249.0, 214.0, 121.0, 64.0, 12.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.55559539794922, -95.68846893310547, -91.82134246826172, -87.95421600341797, -84.08708190917969, -80.21995544433594, -76.35282897949219, -72.48570251464844, -68.61857604980469, -64.75144958496094, -60.88432312011719, -57.01719284057617, -53.15006637573242, -49.28293991088867, -45.415809631347656, -41.548683166503906, -37.681556701660156, -33.814430236816406, -29.947301864624023, -26.08017349243164, -22.21304702758789, -18.34592056274414, -14.478792190551758, -10.611663818359375, -6.744537353515625, -2.8774099349975586, 0.9897174835205078, 4.856844902038574, 8.72397232055664, 12.59109878540039, 16.458227157592773, 20.325355529785156, 24.192489624023438, 28.059616088867188, 31.92674446105957, 35.79387283325195, 39.6609992980957, 43.52812576293945, 47.39525604248047, 51.26238250732422, 55.12950897216797, 58.99663543701172, 62.86376190185547, 66.73088836669922, 70.5980224609375, 74.46514892578125, 78.332275390625, 82.19940185546875, 86.0665283203125, 89.93365478515625, 93.80078125, 97.66790771484375, 101.5350341796875, 105.40216064453125, 109.26929473876953, 113.13642120361328, 117.00354766845703, 120.87067413330078, 124.73780059814453, 128.6049346923828, 132.47206115722656, 136.3391876220703, 140.20631408691406, 144.0734405517578, 147.94056701660156]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 6.0, 11.0, 11.0, 11.0, 22.0, 28.0, 20.0, 24.0, 25.0, 33.0, 42.0, 46.0, 45.0, 39.0, 49.0, 49.0, 47.0, 49.0, 46.0, 35.0, 64.0, 41.0, 45.0, 31.0, 34.0, 23.0, 20.0, 15.0, 17.0, 16.0, 13.0, 11.0, 9.0, 9.0, 5.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.331787109375, -60.52672576904297, -58.7216682434082, -56.91661071777344, -55.111549377441406, -53.306488037109375, -51.50143051147461, -49.696372985839844, -47.89131164550781, -46.08625030517578, -44.281192779541016, -42.47613525390625, -40.67107391357422, -38.86601257324219, -37.06095504760742, -35.255897521972656, -33.450836181640625, -31.645776748657227, -29.840717315673828, -28.03565788269043, -26.23059844970703, -24.425539016723633, -22.620479583740234, -20.815420150756836, -19.010360717773438, -17.20530128479004, -15.40024185180664, -13.595182418823242, -11.790122985839844, -9.985063552856445, -8.180004119873047, -6.374944686889648, -4.56988525390625, -2.7648258209228516, -0.9597663879394531, 0.8452930450439453, 2.6503524780273438, 4.455411911010742, 6.260471343994141, 8.065530776977539, 9.870590209960938, 11.675649642944336, 13.480709075927734, 15.285768508911133, 17.09082794189453, 18.89588737487793, 20.700946807861328, 22.506006240844727, 24.311065673828125, 26.116125106811523, 27.921184539794922, 29.72624397277832, 31.53130340576172, 33.33636474609375, 35.141422271728516, 36.94647979736328, 38.75154113769531, 40.556602478027344, 42.36166000366211, 44.166717529296875, 45.971778869628906, 47.77684020996094, 49.5818977355957, 51.38695526123047, 53.1920166015625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 9.0, 6.0, 17.0, 6.0, 13.0, 18.0, 19.0, 22.0, 19.0, 29.0, 29.0, 22.0, 37.0, 32.0, 36.0, 50.0, 37.0, 40.0, 33.0, 55.0, 32.0, 39.0, 31.0, 24.0, 38.0, 33.0, 20.0, 32.0, 19.0, 29.0, 18.0, 16.0, 19.0, 16.0, 15.0, 14.0, 6.0, 8.0, 13.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.70703125, -6.47802734375, -6.2490234375, -6.02001953125, -5.791015625, -5.56201171875, -5.3330078125, -5.10400390625, -4.875, -4.64599609375, -4.4169921875, -4.18798828125, -3.958984375, -3.72998046875, -3.5009765625, -3.27197265625, -3.04296875, -2.81396484375, -2.5849609375, -2.35595703125, -2.126953125, -1.89794921875, -1.6689453125, -1.43994140625, -1.2109375, -0.98193359375, -0.7529296875, -0.52392578125, -0.294921875, -0.06591796875, 0.1630859375, 0.39208984375, 0.62109375, 0.85009765625, 1.0791015625, 1.30810546875, 1.537109375, 1.76611328125, 1.9951171875, 2.22412109375, 2.453125, 2.68212890625, 2.9111328125, 3.14013671875, 3.369140625, 3.59814453125, 3.8271484375, 4.05615234375, 4.28515625, 4.51416015625, 4.7431640625, 4.97216796875, 5.201171875, 5.43017578125, 5.6591796875, 5.88818359375, 6.1171875, 6.34619140625, 6.5751953125, 6.80419921875, 7.033203125, 7.26220703125, 7.4912109375, 7.72021484375, 7.94921875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 6.0, 7.0, 14.0, 9.0, 14.0, 21.0, 41.0, 68.0, 90.0, 145.0, 238.0, 353.0, 475.0, 775.0, 1168.0, 1686.0, 2556.0, 3947.0, 5795.0, 8764.0, 12952.0, 19375.0, 29528.0, 44489.0, 67979.0, 104105.0, 161181.0, 195636.0, 133743.0, 86192.0, 56937.0, 37061.0, 24332.0, 16238.0, 11006.0, 7146.0, 4808.0, 3272.0, 2169.0, 1418.0, 917.0, 665.0, 462.0, 245.0, 165.0, 123.0, 87.0, 49.0, 34.0, 29.0, 22.0, 10.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.98486328125, -0.9523391723632812, -0.9198150634765625, -0.8872909545898438, -0.854766845703125, -0.8222427368164062, -0.7897186279296875, -0.7571945190429688, -0.72467041015625, -0.6921463012695312, -0.6596221923828125, -0.6270980834960938, -0.594573974609375, -0.5620498657226562, -0.5295257568359375, -0.49700164794921875, -0.4644775390625, -0.43195343017578125, -0.3994293212890625, -0.36690521240234375, -0.334381103515625, -0.30185699462890625, -0.2693328857421875, -0.23680877685546875, -0.20428466796875, -0.17176055908203125, -0.1392364501953125, -0.10671234130859375, -0.074188232421875, -0.04166412353515625, -0.0091400146484375, 0.02338409423828125, 0.055908203125, 0.08843231201171875, 0.1209564208984375, 0.15348052978515625, 0.186004638671875, 0.21852874755859375, 0.2510528564453125, 0.28357696533203125, 0.31610107421875, 0.34862518310546875, 0.3811492919921875, 0.41367340087890625, 0.446197509765625, 0.47872161865234375, 0.5112457275390625, 0.5437698364257812, 0.5762939453125, 0.6088180541992188, 0.6413421630859375, 0.6738662719726562, 0.706390380859375, 0.7389144897460938, 0.7714385986328125, 0.8039627075195312, 0.83648681640625, 0.8690109252929688, 0.9015350341796875, 0.9340591430664062, 0.966583251953125, 0.9991073608398438, 1.0316314697265625, 1.0641555786132812, 1.0966796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 8.0, 7.0, 15.0, 3.0, 14.0, 8.0, 9.0, 11.0, 16.0, 12.0, 13.0, 27.0, 22.0, 27.0, 25.0, 30.0, 22.0, 29.0, 33.0, 43.0, 40.0, 40.0, 36.0, 1050.0, 41.0, 39.0, 43.0, 45.0, 22.0, 37.0, 30.0, 27.0, 24.0, 25.0, 20.0, 18.0, 12.0, 24.0, 10.0, 17.0, 8.0, 6.0, 9.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.08984375, -3.95098876953125, -3.8121337890625, -3.67327880859375, -3.534423828125, -3.39556884765625, -3.2567138671875, -3.11785888671875, -2.97900390625, -2.84014892578125, -2.7012939453125, -2.56243896484375, -2.423583984375, -2.28472900390625, -2.1458740234375, -2.00701904296875, -1.8681640625, -1.72930908203125, -1.5904541015625, -1.45159912109375, -1.312744140625, -1.17388916015625, -1.0350341796875, -0.89617919921875, -0.75732421875, -0.61846923828125, -0.4796142578125, -0.34075927734375, -0.201904296875, -0.06304931640625, 0.0758056640625, 0.21466064453125, 0.353515625, 0.49237060546875, 0.6312255859375, 0.77008056640625, 0.908935546875, 1.04779052734375, 1.1866455078125, 1.32550048828125, 1.46435546875, 1.60321044921875, 1.7420654296875, 1.88092041015625, 2.019775390625, 2.15863037109375, 2.2974853515625, 2.43634033203125, 2.5751953125, 2.71405029296875, 2.8529052734375, 2.99176025390625, 3.130615234375, 3.26947021484375, 3.4083251953125, 3.54718017578125, 3.68603515625, 3.82489013671875, 3.9637451171875, 4.10260009765625, 4.241455078125, 4.38031005859375, 4.5191650390625, 4.65802001953125, 4.796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 10.0, 14.0, 25.0, 35.0, 52.0, 77.0, 110.0, 187.0, 281.0, 436.0, 680.0, 1050.0, 1578.0, 2398.0, 3724.0, 5751.0, 8921.0, 13597.0, 20887.0, 32869.0, 51438.0, 81986.0, 130514.0, 1245213.0, 180424.0, 115427.0, 72368.0, 45296.0, 28742.0, 18470.0, 12003.0, 7745.0, 5146.0, 3389.0, 2179.0, 1432.0, 929.0, 638.0, 387.0, 277.0, 162.0, 109.0, 63.0, 37.0, 23.0, 19.0, 17.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.041015625, -1.00933837890625, -0.9776611328125, -0.94598388671875, -0.914306640625, -0.88262939453125, -0.8509521484375, -0.81927490234375, -0.78759765625, -0.75592041015625, -0.7242431640625, -0.69256591796875, -0.660888671875, -0.62921142578125, -0.5975341796875, -0.56585693359375, -0.5341796875, -0.50250244140625, -0.4708251953125, -0.43914794921875, -0.407470703125, -0.37579345703125, -0.3441162109375, -0.31243896484375, -0.28076171875, -0.24908447265625, -0.2174072265625, -0.18572998046875, -0.154052734375, -0.12237548828125, -0.0906982421875, -0.05902099609375, -0.02734375, 0.00433349609375, 0.0360107421875, 0.06768798828125, 0.099365234375, 0.13104248046875, 0.1627197265625, 0.19439697265625, 0.22607421875, 0.25775146484375, 0.2894287109375, 0.32110595703125, 0.352783203125, 0.38446044921875, 0.4161376953125, 0.44781494140625, 0.4794921875, 0.51116943359375, 0.5428466796875, 0.57452392578125, 0.606201171875, 0.63787841796875, 0.6695556640625, 0.70123291015625, 0.73291015625, 0.76458740234375, 0.7962646484375, 0.82794189453125, 0.859619140625, 0.89129638671875, 0.9229736328125, 0.95465087890625, 0.986328125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 11.0, 2.0, 5.0, 4.0, 12.0, 8.0, 15.0, 8.0, 16.0, 21.0, 23.0, 27.0, 34.0, 42.0, 44.0, 40.0, 61.0, 43.0, 54.0, 48.0, 54.0, 43.0, 37.0, 49.0, 48.0, 36.0, 41.0, 34.0, 28.0, 25.0, 17.0, 16.0, 14.0, 7.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0017833709716796875, -0.0017272084951400757, -0.0016710460186004639, -0.001614883542060852, -0.0015587210655212402, -0.0015025585889816284, -0.0014463961124420166, -0.0013902336359024048, -0.001334071159362793, -0.0012779086828231812, -0.0012217462062835693, -0.0011655837297439575, -0.0011094212532043457, -0.0010532587766647339, -0.000997096300125122, -0.0009409338235855103, -0.0008847713470458984, -0.0008286088705062866, -0.0007724463939666748, -0.000716283917427063, -0.0006601214408874512, -0.0006039589643478394, -0.0005477964878082275, -0.0004916340112686157, -0.0004354715347290039, -0.0003793090581893921, -0.0003231465816497803, -0.00026698410511016846, -0.00021082162857055664, -0.00015465915203094482, -9.849667549133301e-05, -4.233419895172119e-05, 1.3828277587890625e-05, 6.999075412750244e-05, 0.00012615323066711426, 0.00018231570720672607, 0.0002384781837463379, 0.0002946406602859497, 0.0003508031368255615, 0.00040696561336517334, 0.00046312808990478516, 0.000519290566444397, 0.0005754530429840088, 0.0006316155195236206, 0.0006877779960632324, 0.0007439404726028442, 0.0008001029491424561, 0.0008562654256820679, 0.0009124279022216797, 0.0009685903787612915, 0.0010247528553009033, 0.0010809153318405151, 0.001137077808380127, 0.0011932402849197388, 0.0012494027614593506, 0.0013055652379989624, 0.0013617277145385742, 0.001417890191078186, 0.0014740526676177979, 0.0015302151441574097, 0.0015863776206970215, 0.0016425400972366333, 0.0016987025737762451, 0.001754865050315857, 0.0018110275268554688]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 2.0, 5.0, 7.0, 5.0, 6.0, 12.0, 17.0, 26.0, 13.0, 27.0, 47.0, 49.0, 54.0, 64.0, 74.0, 119.0, 278.0, 696.0, 7042.0, 1034554.0, 4049.0, 626.0, 239.0, 119.0, 71.0, 72.0, 50.0, 44.0, 33.0, 17.0, 28.0, 17.0, 15.0, 18.0, 7.0, 6.0, 11.0, 6.0, 2.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04229736328125, -0.040993690490722656, -0.03969001770019531, -0.03838634490966797, -0.037082672119140625, -0.03577899932861328, -0.03447532653808594, -0.033171653747558594, -0.03186798095703125, -0.030564308166503906, -0.029260635375976562, -0.02795696258544922, -0.026653289794921875, -0.02534961700439453, -0.024045944213867188, -0.022742271423339844, -0.0214385986328125, -0.020134925842285156, -0.018831253051757812, -0.01752758026123047, -0.016223907470703125, -0.014920234680175781, -0.013616561889648438, -0.012312889099121094, -0.01100921630859375, -0.009705543518066406, -0.008401870727539062, -0.007098197937011719, -0.005794525146484375, -0.004490852355957031, -0.0031871795654296875, -0.0018835067749023438, -0.000579833984375, 0.0007238388061523438, 0.0020275115966796875, 0.0033311843872070312, 0.004634857177734375, 0.005938529968261719, 0.0072422027587890625, 0.008545875549316406, 0.00984954833984375, 0.011153221130371094, 0.012456893920898438, 0.013760566711425781, 0.015064239501953125, 0.01636791229248047, 0.017671585083007812, 0.018975257873535156, 0.0202789306640625, 0.021582603454589844, 0.022886276245117188, 0.02418994903564453, 0.025493621826171875, 0.02679729461669922, 0.028100967407226562, 0.029404640197753906, 0.03070831298828125, 0.032011985778808594, 0.03331565856933594, 0.03461933135986328, 0.035923004150390625, 0.03722667694091797, 0.03853034973144531, 0.039834022521972656, 0.0411376953125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 82.0, 609.0, 306.0, 14.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010601067915558815, -0.010411077179014683, -0.010221085511147976, -0.010031094774603844, -0.009841103106737137, -0.009651112370193005, -0.009461120702326298, -0.009271129965782166, -0.009081138297915459, -0.008891147561371326, -0.00870115589350462, -0.008511165156960487, -0.00832117348909378, -0.008131182752549648, -0.007941191084682941, -0.007751200348138809, -0.00756120914593339, -0.00737121794372797, -0.007181226741522551, -0.006991235539317131, -0.0068012443371117115, -0.006611253134906292, -0.00642126239836216, -0.006231270730495453, -0.006041279993951321, -0.005851288791745901, -0.005661297589540482, -0.005471306387335062, -0.0052813151851296425, -0.005091323982924223, -0.004901332780718803, -0.004711342044174671, -0.004521349910646677, -0.0043313587084412575, -0.004141367506235838, -0.003951376304030418, -0.003761385101824999, -0.0035713938996195793, -0.0033814029302448034, -0.003191411728039384, -0.003001420758664608, -0.0028114295564591885, -0.002621438354253769, -0.0024314471520483494, -0.00224145594984293, -0.0020514647476375103, -0.0018614737782627344, -0.0016714825760573149, -0.0014814912574365735, -0.001291500055231154, -0.0011015089694410563, -0.0009115177672356367, -0.0007215265650302172, -0.0005315353628247976, -0.0003415442770346999, -0.00015155307482928038, 3.8438127376139164e-05, 0.00022842930047772825, 0.00041842047357931733, 0.000608411617577076, 0.0007984028197824955, 0.000988394021987915, 0.0011783851077780128, 0.0013683763099834323, 0.0015583675121888518]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 11.0, 11.0, 11.0, 15.0, 20.0, 26.0, 28.0, 21.0, 17.0, 30.0, 29.0, 41.0, 37.0, 41.0, 32.0, 43.0, 37.0, 30.0, 56.0, 39.0, 44.0, 30.0, 49.0, 41.0, 33.0, 29.0, 32.0, 26.0, 20.0, 19.0, 17.0, 16.0, 13.0, 7.0, 13.0, 9.0, 2.0, 3.0, 1.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010439157485961914, -0.0010119974613189697, -0.000980079174041748, -0.0009481608867645264, -0.0009162425994873047, -0.000884324312210083, -0.0008524060249328613, -0.0008204877376556396, -0.000788569450378418, -0.0007566511631011963, -0.0007247328758239746, -0.0006928145885467529, -0.0006608963012695312, -0.0006289780139923096, -0.0005970597267150879, -0.0005651414394378662, -0.0005332231521606445, -0.0005013048648834229, -0.00046938657760620117, -0.0004374682903289795, -0.0004055500030517578, -0.00037363171577453613, -0.00034171342849731445, -0.0003097951412200928, -0.0002778768539428711, -0.0002459585666656494, -0.00021404027938842773, -0.00018212199211120605, -0.00015020370483398438, -0.0001182854175567627, -8.636713027954102e-05, -5.4448843002319336e-05, -2.2530555725097656e-05, 9.387731552124023e-06, 4.13060188293457e-05, 7.322430610656738e-05, 0.00010514259338378906, 0.00013706088066101074, 0.00016897916793823242, 0.0002008974552154541, 0.00023281574249267578, 0.00026473402976989746, 0.00029665231704711914, 0.0003285706043243408, 0.0003604888916015625, 0.0003924071788787842, 0.00042432546615600586, 0.00045624375343322754, 0.0004881620407104492, 0.0005200803279876709, 0.0005519986152648926, 0.0005839169025421143, 0.0006158351898193359, 0.0006477534770965576, 0.0006796717643737793, 0.000711590051651001, 0.0007435083389282227, 0.0007754266262054443, 0.000807344913482666, 0.0008392632007598877, 0.0008711814880371094, 0.0009030997753143311, 0.0009350180625915527, 0.0009669363498687744, 0.000998854637145996]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 9.0, 6.0, 17.0, 6.0, 13.0, 18.0, 19.0, 22.0, 19.0, 29.0, 29.0, 22.0, 37.0, 32.0, 36.0, 50.0, 37.0, 40.0, 34.0, 54.0, 32.0, 39.0, 31.0, 24.0, 38.0, 33.0, 20.0, 32.0, 19.0, 29.0, 18.0, 16.0, 19.0, 16.0, 15.0, 14.0, 6.0, 8.0, 13.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.70703125, -6.47802734375, -6.2490234375, -6.02001953125, -5.791015625, -5.56201171875, -5.3330078125, -5.10400390625, -4.875, -4.64599609375, -4.4169921875, -4.18798828125, -3.958984375, -3.72998046875, -3.5009765625, -3.27197265625, -3.04296875, -2.81396484375, -2.5849609375, -2.35595703125, -2.126953125, -1.89794921875, -1.6689453125, -1.43994140625, -1.2109375, -0.98193359375, -0.7529296875, -0.52392578125, -0.294921875, -0.06591796875, 0.1630859375, 0.39208984375, 0.62109375, 0.85009765625, 1.0791015625, 1.30810546875, 1.537109375, 1.76611328125, 1.9951171875, 2.22412109375, 2.453125, 2.68212890625, 2.9111328125, 3.14013671875, 3.369140625, 3.59814453125, 3.8271484375, 4.05615234375, 4.28515625, 4.51416015625, 4.7431640625, 4.97216796875, 5.201171875, 5.43017578125, 5.6591796875, 5.88818359375, 6.1171875, 6.34619140625, 6.5751953125, 6.80419921875, 7.033203125, 7.26220703125, 7.4912109375, 7.72021484375, 7.94921875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 11.0, 10.0, 14.0, 11.0, 22.0, 15.0, 29.0, 42.0, 51.0, 71.0, 97.0, 129.0, 199.0, 352.0, 583.0, 1165.0, 2466.0, 6013.0, 16936.0, 58012.0, 246051.0, 526306.0, 136032.0, 34655.0, 11072.0, 4110.0, 1844.0, 875.0, 475.0, 280.0, 165.0, 127.0, 85.0, 62.0, 37.0, 26.0, 29.0, 20.0, 11.0, 14.0, 14.0, 6.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.51171875, -6.28948974609375, -6.0672607421875, -5.84503173828125, -5.622802734375, -5.40057373046875, -5.1783447265625, -4.95611572265625, -4.73388671875, -4.51165771484375, -4.2894287109375, -4.06719970703125, -3.844970703125, -3.62274169921875, -3.4005126953125, -3.17828369140625, -2.9560546875, -2.73382568359375, -2.5115966796875, -2.28936767578125, -2.067138671875, -1.84490966796875, -1.6226806640625, -1.40045166015625, -1.17822265625, -0.95599365234375, -0.7337646484375, -0.51153564453125, -0.289306640625, -0.06707763671875, 0.1551513671875, 0.37738037109375, 0.599609375, 0.82183837890625, 1.0440673828125, 1.26629638671875, 1.488525390625, 1.71075439453125, 1.9329833984375, 2.15521240234375, 2.37744140625, 2.59967041015625, 2.8218994140625, 3.04412841796875, 3.266357421875, 3.48858642578125, 3.7108154296875, 3.93304443359375, 4.1552734375, 4.37750244140625, 4.5997314453125, 4.82196044921875, 5.044189453125, 5.26641845703125, 5.4886474609375, 5.71087646484375, 5.93310546875, 6.15533447265625, 6.3775634765625, 6.59979248046875, 6.822021484375, 7.04425048828125, 7.2664794921875, 7.48870849609375, 7.7109375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 9.0, 11.0, 13.0, 9.0, 10.0, 17.0, 12.0, 28.0, 21.0, 20.0, 33.0, 31.0, 39.0, 33.0, 34.0, 41.0, 45.0, 89.0, 223.0, 1712.0, 145.0, 63.0, 40.0, 48.0, 30.0, 34.0, 37.0, 28.0, 20.0, 35.0, 19.0, 21.0, 21.0, 14.0, 10.0, 10.0, 8.0, 4.0, 5.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.59375, -23.78271484375, -22.9716796875, -22.16064453125, -21.349609375, -20.53857421875, -19.7275390625, -18.91650390625, -18.10546875, -17.29443359375, -16.4833984375, -15.67236328125, -14.861328125, -14.05029296875, -13.2392578125, -12.42822265625, -11.6171875, -10.80615234375, -9.9951171875, -9.18408203125, -8.373046875, -7.56201171875, -6.7509765625, -5.93994140625, -5.12890625, -4.31787109375, -3.5068359375, -2.69580078125, -1.884765625, -1.07373046875, -0.2626953125, 0.54833984375, 1.359375, 2.17041015625, 2.9814453125, 3.79248046875, 4.603515625, 5.41455078125, 6.2255859375, 7.03662109375, 7.84765625, 8.65869140625, 9.4697265625, 10.28076171875, 11.091796875, 11.90283203125, 12.7138671875, 13.52490234375, 14.3359375, 15.14697265625, 15.9580078125, 16.76904296875, 17.580078125, 18.39111328125, 19.2021484375, 20.01318359375, 20.82421875, 21.63525390625, 22.4462890625, 23.25732421875, 24.068359375, 24.87939453125, 25.6904296875, 26.50146484375, 27.3125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 14.0, 21.0, 35.0, 55.0, 114.0, 217.0, 408.0, 1358.0, 3123436.0, 18615.0, 721.0, 340.0, 156.0, 87.0, 46.0, 33.0, 18.0, 9.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.0, -133.37109375, -128.7421875, -124.11328125, -119.484375, -114.85546875, -110.2265625, -105.59765625, -100.96875, -96.33984375, -91.7109375, -87.08203125, -82.453125, -77.82421875, -73.1953125, -68.56640625, -63.9375, -59.30859375, -54.6796875, -50.05078125, -45.421875, -40.79296875, -36.1640625, -31.53515625, -26.90625, -22.27734375, -17.6484375, -13.01953125, -8.390625, -3.76171875, 0.8671875, 5.49609375, 10.125, 14.75390625, 19.3828125, 24.01171875, 28.640625, 33.26953125, 37.8984375, 42.52734375, 47.15625, 51.78515625, 56.4140625, 61.04296875, 65.671875, 70.30078125, 74.9296875, 79.55859375, 84.1875, 88.81640625, 93.4453125, 98.07421875, 102.703125, 107.33203125, 111.9609375, 116.58984375, 121.21875, 125.84765625, 130.4765625, 135.10546875, 139.734375, 144.36328125, 148.9921875, 153.62109375, 158.25]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 11.0, 429.0, 560.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.37947845458984, -62.586734771728516, -57.79398727416992, -53.001243591308594, -48.20849609375, -43.41575241088867, -38.623008728027344, -33.83026123046875, -29.037517547607422, -24.24477195739746, -19.4520263671875, -14.659282684326172, -9.866537094116211, -5.07379150390625, -0.2810478210449219, 4.511699676513672, 9.304443359375, 14.097188949584961, 18.889934539794922, 23.68267822265625, 28.47542381286621, 33.26816940307617, 38.0609130859375, 42.853660583496094, 47.64640426635742, 52.43914794921875, 57.231895446777344, 62.02463912963867, 66.8173828125, 71.6101303100586, 76.40287780761719, 81.19561767578125, 85.98835754394531, 90.7811050415039, 95.57384490966797, 100.36659240722656, 105.15933990478516, 109.95208740234375, 114.74482727050781, 119.5375747680664, 124.330322265625, 129.12306213378906, 133.9158172607422, 138.70855712890625, 143.5012969970703, 148.29405212402344, 153.0867919921875, 157.87954711914062, 162.67227172851562, 167.4650115966797, 172.2577667236328, 177.05050659179688, 181.84324645996094, 186.63600158691406, 191.42874145507812, 196.22149658203125, 201.0142364501953, 205.80697631835938, 210.5997314453125, 215.39247131347656, 220.18521118164062, 224.97796630859375, 229.7707061767578, 234.56344604492188, 239.356201171875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 10.0, 9.0, 15.0, 19.0, 23.0, 29.0, 23.0, 25.0, 30.0, 29.0, 41.0, 41.0, 45.0, 36.0, 47.0, 41.0, 46.0, 46.0, 54.0, 53.0, 34.0, 45.0, 30.0, 21.0, 26.0, 22.0, 22.0, 26.0, 17.0, 15.0, 15.0, 12.0, 13.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.66453552246094, -73.23259735107422, -70.80065155029297, -68.36871337890625, -65.936767578125, -63.504825592041016, -61.07288360595703, -58.64094543457031, -56.20899963378906, -53.77705764770508, -51.345115661621094, -48.91317367553711, -46.481231689453125, -44.04928970336914, -41.617347717285156, -39.18540954589844, -36.75346755981445, -34.32152557373047, -31.889583587646484, -29.4576416015625, -27.025699615478516, -24.59375762939453, -22.16181755065918, -19.729875564575195, -17.29793357849121, -14.865991592407227, -12.434049606323242, -10.002108573913574, -7.57016658782959, -5.1382246017456055, -2.7062835693359375, -0.2743415832519531, 2.1576004028320312, 4.589542388916016, 7.021483898162842, 9.453425407409668, 11.885367393493652, 14.317309379577637, 16.749250411987305, 19.18119239807129, 21.613134384155273, 24.045076370239258, 26.477018356323242, 28.908958435058594, 31.340900421142578, 33.77284240722656, 36.20478439331055, 38.63672637939453, 41.068668365478516, 43.5006103515625, 45.932552337646484, 48.36449432373047, 50.79643630981445, 53.22837829589844, 55.660316467285156, 58.092262268066406, 60.524200439453125, 62.95614242553711, 65.3880844116211, 67.82002258300781, 70.25196838378906, 72.68390655517578, 75.11585235595703, 77.54779052734375, 79.979736328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 11.0, 6.0, 11.0, 10.0, 12.0, 11.0, 14.0, 19.0, 20.0, 23.0, 24.0, 18.0, 34.0, 42.0, 35.0, 34.0, 44.0, 52.0, 29.0, 45.0, 37.0, 37.0, 36.0, 37.0, 38.0, 36.0, 23.0, 26.0, 37.0, 24.0, 16.0, 21.0, 22.0, 19.0, 11.0, 11.0, 14.0, 11.0, 11.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.05859375, -6.81732177734375, -6.5760498046875, -6.33477783203125, -6.093505859375, -5.85223388671875, -5.6109619140625, -5.36968994140625, -5.12841796875, -4.88714599609375, -4.6458740234375, -4.40460205078125, -4.163330078125, -3.92205810546875, -3.6807861328125, -3.43951416015625, -3.1982421875, -2.95697021484375, -2.7156982421875, -2.47442626953125, -2.233154296875, -1.99188232421875, -1.7506103515625, -1.50933837890625, -1.26806640625, -1.02679443359375, -0.7855224609375, -0.54425048828125, -0.302978515625, -0.06170654296875, 0.1795654296875, 0.42083740234375, 0.662109375, 0.90338134765625, 1.1446533203125, 1.38592529296875, 1.627197265625, 1.86846923828125, 2.1097412109375, 2.35101318359375, 2.59228515625, 2.83355712890625, 3.0748291015625, 3.31610107421875, 3.557373046875, 3.79864501953125, 4.0399169921875, 4.28118896484375, 4.5224609375, 4.76373291015625, 5.0050048828125, 5.24627685546875, 5.487548828125, 5.72882080078125, 5.9700927734375, 6.21136474609375, 6.45263671875, 6.69390869140625, 6.9351806640625, 7.17645263671875, 7.417724609375, 7.65899658203125, 7.9002685546875, 8.14154052734375, 8.3828125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 10.0, 5.0, 15.0, 13.0, 12.0, 10.0, 18.0, 25.0, 26.0, 28.0, 34.0, 30.0, 42.0, 54.0, 63.0, 76.0, 110.0, 127.0, 240.0, 545.0, 1398.0, 5784.0, 50551.0, 897838.0, 2761164.0, 444690.0, 25146.0, 3832.0, 1080.0, 410.0, 201.0, 162.0, 115.0, 67.0, 62.0, 41.0, 39.0, 45.0, 28.0, 35.0, 21.0, 20.0, 19.0, 15.0, 6.0, 7.0, 8.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-18.0625, -17.4677734375, -16.873046875, -16.2783203125, -15.68359375, -15.0888671875, -14.494140625, -13.8994140625, -13.3046875, -12.7099609375, -12.115234375, -11.5205078125, -10.92578125, -10.3310546875, -9.736328125, -9.1416015625, -8.546875, -7.9521484375, -7.357421875, -6.7626953125, -6.16796875, -5.5732421875, -4.978515625, -4.3837890625, -3.7890625, -3.1943359375, -2.599609375, -2.0048828125, -1.41015625, -0.8154296875, -0.220703125, 0.3740234375, 0.96875, 1.5634765625, 2.158203125, 2.7529296875, 3.34765625, 3.9423828125, 4.537109375, 5.1318359375, 5.7265625, 6.3212890625, 6.916015625, 7.5107421875, 8.10546875, 8.7001953125, 9.294921875, 9.8896484375, 10.484375, 11.0791015625, 11.673828125, 12.2685546875, 12.86328125, 13.4580078125, 14.052734375, 14.6474609375, 15.2421875, 15.8369140625, 16.431640625, 17.0263671875, 17.62109375, 18.2158203125, 18.810546875, 19.4052734375, 20.0]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 7.0, 8.0, 14.0, 18.0, 17.0, 27.0, 34.0, 36.0, 57.0, 84.0, 75.0, 89.0, 132.0, 150.0, 195.0, 264.0, 315.0, 387.0, 425.0, 397.0, 315.0, 236.0, 156.0, 145.0, 107.0, 81.0, 76.0, 40.0, 43.0, 39.0, 17.0, 22.0, 16.0, 17.0, 9.0, 4.0, 5.0, 5.0, 2.0, 0.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.375, -12.97314453125, -12.5712890625, -12.16943359375, -11.767578125, -11.36572265625, -10.9638671875, -10.56201171875, -10.16015625, -9.75830078125, -9.3564453125, -8.95458984375, -8.552734375, -8.15087890625, -7.7490234375, -7.34716796875, -6.9453125, -6.54345703125, -6.1416015625, -5.73974609375, -5.337890625, -4.93603515625, -4.5341796875, -4.13232421875, -3.73046875, -3.32861328125, -2.9267578125, -2.52490234375, -2.123046875, -1.72119140625, -1.3193359375, -0.91748046875, -0.515625, -0.11376953125, 0.2880859375, 0.68994140625, 1.091796875, 1.49365234375, 1.8955078125, 2.29736328125, 2.69921875, 3.10107421875, 3.5029296875, 3.90478515625, 4.306640625, 4.70849609375, 5.1103515625, 5.51220703125, 5.9140625, 6.31591796875, 6.7177734375, 7.11962890625, 7.521484375, 7.92333984375, 8.3251953125, 8.72705078125, 9.12890625, 9.53076171875, 9.9326171875, 10.33447265625, 10.736328125, 11.13818359375, 11.5400390625, 11.94189453125, 12.34375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 3.0, 7.0, 12.0, 16.0, 16.0, 10.0, 25.0, 25.0, 38.0, 38.0, 52.0, 67.0, 89.0, 119.0, 137.0, 158.0, 180.0, 227.0, 375.0, 702.0, 6966.0, 3331977.0, 847734.0, 3061.0, 581.0, 372.0, 225.0, 195.0, 160.0, 135.0, 109.0, 97.0, 75.0, 69.0, 41.0, 35.0, 37.0, 25.0, 23.0, 13.0, 10.0, 6.0, 6.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-64.6875, -62.6591796875, -60.630859375, -58.6025390625, -56.57421875, -54.5458984375, -52.517578125, -50.4892578125, -48.4609375, -46.4326171875, -44.404296875, -42.3759765625, -40.34765625, -38.3193359375, -36.291015625, -34.2626953125, -32.234375, -30.2060546875, -28.177734375, -26.1494140625, -24.12109375, -22.0927734375, -20.064453125, -18.0361328125, -16.0078125, -13.9794921875, -11.951171875, -9.9228515625, -7.89453125, -5.8662109375, -3.837890625, -1.8095703125, 0.21875, 2.2470703125, 4.275390625, 6.3037109375, 8.33203125, 10.3603515625, 12.388671875, 14.4169921875, 16.4453125, 18.4736328125, 20.501953125, 22.5302734375, 24.55859375, 26.5869140625, 28.615234375, 30.6435546875, 32.671875, 34.7001953125, 36.728515625, 38.7568359375, 40.78515625, 42.8134765625, 44.841796875, 46.8701171875, 48.8984375, 50.9267578125, 52.955078125, 54.9833984375, 57.01171875, 59.0400390625, 61.068359375, 63.0966796875, 65.125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 21.0, 126.0, 411.0, 346.0, 92.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.4569854736328, -141.6826171875, -134.90823364257812, -128.13385009765625, -121.35948181152344, -114.5851058959961, -107.81072998046875, -101.0363540649414, -94.26197814941406, -87.48760223388672, -80.71322631835938, -73.93885040283203, -67.16447448730469, -60.390098571777344, -53.61572265625, -46.841346740722656, -40.06697082519531, -33.29259490966797, -26.518218994140625, -19.74384307861328, -12.969467163085938, -6.195091247558594, 0.57928466796875, 7.353660583496094, 14.128036499023438, 20.90241241455078, 27.676788330078125, 34.45116424560547, 41.22554016113281, 47.999916076660156, 54.7742919921875, 61.548667907714844, 68.32302856445312, 75.09740447998047, 81.87178039550781, 88.64615631103516, 95.4205322265625, 102.19490814208984, 108.96928405761719, 115.74365997314453, 122.51803588867188, 129.29241943359375, 136.06678771972656, 142.84115600585938, 149.61553955078125, 156.38992309570312, 163.16429138183594, 169.93865966796875, 176.71304321289062, 183.4874267578125, 190.2617950439453, 197.03616333007812, 203.810546875, 210.58493041992188, 217.3592987060547, 224.1336669921875, 230.90805053710938, 237.68243408203125, 244.45680236816406, 251.23117065429688, 258.00555419921875, 264.7799377441406, 271.5543212890625, 278.32867431640625, 285.1030578613281]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 8.0, 7.0, 9.0, 15.0, 17.0, 15.0, 22.0, 9.0, 17.0, 28.0, 26.0, 28.0, 40.0, 50.0, 40.0, 43.0, 59.0, 47.0, 33.0, 58.0, 34.0, 39.0, 53.0, 39.0, 35.0, 32.0, 35.0, 21.0, 26.0, 21.0, 27.0, 14.0, 13.0, 3.0, 11.0, 3.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.80086135864258, -54.11524963378906, -52.42964172363281, -50.7440299987793, -49.05842208862305, -47.37281036376953, -45.68720245361328, -44.001590728759766, -42.31597900390625, -40.630367279052734, -38.944759368896484, -37.25914764404297, -35.57353973388672, -33.8879280090332, -32.20231628417969, -30.516708374023438, -28.831100463867188, -27.145490646362305, -25.459880828857422, -23.774269104003906, -22.088661193847656, -20.40304946899414, -18.717439651489258, -17.031829833984375, -15.346220016479492, -13.66061019897461, -11.975000381469727, -10.289389610290527, -8.603779792785645, -6.918169975280762, -5.2325592041015625, -3.5469493865966797, -1.8613357543945312, -0.17572569847106934, 1.5098843574523926, 3.1954946517944336, 4.881104469299316, 6.566714286804199, 8.252325057983398, 9.937934875488281, 11.623544692993164, 13.309154510498047, 14.99476432800293, 16.680374145507812, 18.365985870361328, 20.051593780517578, 21.737205505371094, 23.422815322875977, 25.10842514038086, 26.794034957885742, 28.479644775390625, 30.16525650024414, 31.85086441040039, 33.536476135253906, 35.222084045410156, 36.90769577026367, 38.59330749511719, 40.2789192199707, 41.96452713012695, 43.65013885498047, 45.33574676513672, 47.021358489990234, 48.70697021484375, 50.392578125, 52.07818603515625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 4.0, 8.0, 14.0, 9.0, 8.0, 9.0, 20.0, 16.0, 14.0, 23.0, 30.0, 14.0, 23.0, 44.0, 30.0, 30.0, 43.0, 28.0, 40.0, 46.0, 48.0, 38.0, 33.0, 39.0, 31.0, 37.0, 32.0, 26.0, 26.0, 29.0, 31.0, 16.0, 17.0, 21.0, 12.0, 11.0, 21.0, 14.0, 8.0, 13.0, 16.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.4453125, -7.21331787109375, -6.9813232421875, -6.74932861328125, -6.517333984375, -6.28533935546875, -6.0533447265625, -5.82135009765625, -5.58935546875, -5.35736083984375, -5.1253662109375, -4.89337158203125, -4.661376953125, -4.42938232421875, -4.1973876953125, -3.96539306640625, -3.7333984375, -3.50140380859375, -3.2694091796875, -3.03741455078125, -2.805419921875, -2.57342529296875, -2.3414306640625, -2.10943603515625, -1.87744140625, -1.64544677734375, -1.4134521484375, -1.18145751953125, -0.949462890625, -0.71746826171875, -0.4854736328125, -0.25347900390625, -0.021484375, 0.21051025390625, 0.4425048828125, 0.67449951171875, 0.906494140625, 1.13848876953125, 1.3704833984375, 1.60247802734375, 1.83447265625, 2.06646728515625, 2.2984619140625, 2.53045654296875, 2.762451171875, 2.99444580078125, 3.2264404296875, 3.45843505859375, 3.6904296875, 3.92242431640625, 4.1544189453125, 4.38641357421875, 4.618408203125, 4.85040283203125, 5.0823974609375, 5.31439208984375, 5.54638671875, 5.77838134765625, 6.0103759765625, 6.24237060546875, 6.474365234375, 6.70635986328125, 6.9383544921875, 7.17034912109375, 7.40234375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 9.0, 8.0, 12.0, 19.0, 24.0, 40.0, 62.0, 86.0, 130.0, 192.0, 234.0, 381.0, 444.0, 710.0, 1041.0, 1468.0, 2302.0, 3366.0, 4906.0, 7489.0, 11277.0, 16981.0, 25510.0, 39470.0, 60386.0, 92045.0, 139230.0, 195465.0, 151911.0, 100225.0, 66293.0, 42503.0, 28327.0, 18428.0, 12328.0, 8161.0, 5554.0, 3648.0, 2480.0, 1691.0, 1111.0, 797.0, 571.0, 386.0, 262.0, 188.0, 118.0, 83.0, 63.0, 46.0, 43.0, 19.0, 18.0, 9.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.0634765625, -1.0298309326171875, -0.996185302734375, -0.9625396728515625, -0.92889404296875, -0.8952484130859375, -0.861602783203125, -0.8279571533203125, -0.7943115234375, -0.7606658935546875, -0.727020263671875, -0.6933746337890625, -0.65972900390625, -0.6260833740234375, -0.592437744140625, -0.5587921142578125, -0.525146484375, -0.4915008544921875, -0.457855224609375, -0.4242095947265625, -0.39056396484375, -0.3569183349609375, -0.323272705078125, -0.2896270751953125, -0.2559814453125, -0.2223358154296875, -0.188690185546875, -0.1550445556640625, -0.12139892578125, -0.0877532958984375, -0.054107666015625, -0.0204620361328125, 0.01318359375, 0.0468292236328125, 0.080474853515625, 0.1141204833984375, 0.14776611328125, 0.1814117431640625, 0.215057373046875, 0.2487030029296875, 0.2823486328125, 0.3159942626953125, 0.349639892578125, 0.3832855224609375, 0.41693115234375, 0.4505767822265625, 0.484222412109375, 0.5178680419921875, 0.551513671875, 0.5851593017578125, 0.618804931640625, 0.6524505615234375, 0.68609619140625, 0.7197418212890625, 0.753387451171875, 0.7870330810546875, 0.8206787109375, 0.8543243408203125, 0.887969970703125, 0.9216156005859375, 0.95526123046875, 0.9889068603515625, 1.022552490234375, 1.0561981201171875, 1.08984375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 12.0, 2.0, 8.0, 11.0, 14.0, 13.0, 16.0, 20.0, 20.0, 30.0, 36.0, 33.0, 37.0, 33.0, 31.0, 33.0, 45.0, 34.0, 39.0, 1064.0, 35.0, 48.0, 37.0, 45.0, 44.0, 32.0, 35.0, 40.0, 25.0, 22.0, 25.0, 14.0, 16.0, 17.0, 15.0, 8.0, 7.0, 5.0, 8.0, 1.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.26171875, -5.09674072265625, -4.9317626953125, -4.76678466796875, -4.601806640625, -4.43682861328125, -4.2718505859375, -4.10687255859375, -3.94189453125, -3.77691650390625, -3.6119384765625, -3.44696044921875, -3.281982421875, -3.11700439453125, -2.9520263671875, -2.78704833984375, -2.6220703125, -2.45709228515625, -2.2921142578125, -2.12713623046875, -1.962158203125, -1.79718017578125, -1.6322021484375, -1.46722412109375, -1.30224609375, -1.13726806640625, -0.9722900390625, -0.80731201171875, -0.642333984375, -0.47735595703125, -0.3123779296875, -0.14739990234375, 0.017578125, 0.18255615234375, 0.3475341796875, 0.51251220703125, 0.677490234375, 0.84246826171875, 1.0074462890625, 1.17242431640625, 1.33740234375, 1.50238037109375, 1.6673583984375, 1.83233642578125, 1.997314453125, 2.16229248046875, 2.3272705078125, 2.49224853515625, 2.6572265625, 2.82220458984375, 2.9871826171875, 3.15216064453125, 3.317138671875, 3.48211669921875, 3.6470947265625, 3.81207275390625, 3.97705078125, 4.14202880859375, 4.3070068359375, 4.47198486328125, 4.636962890625, 4.80194091796875, 4.9669189453125, 5.13189697265625, 5.296875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 12.0, 17.0, 11.0, 25.0, 22.0, 46.0, 67.0, 96.0, 118.0, 172.0, 281.0, 386.0, 549.0, 876.0, 1228.0, 1842.0, 2721.0, 3916.0, 5924.0, 8790.0, 13717.0, 20413.0, 31658.0, 48940.0, 76555.0, 118493.0, 184608.0, 1225779.0, 123189.0, 79653.0, 50835.0, 32636.0, 21406.0, 13997.0, 9264.0, 5967.0, 4159.0, 2756.0, 1897.0, 1333.0, 830.0, 622.0, 424.0, 272.0, 211.0, 137.0, 99.0, 61.0, 48.0, 29.0, 17.0, 15.0, 10.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.9521484375, -0.921478271484375, -0.89080810546875, -0.860137939453125, -0.8294677734375, -0.798797607421875, -0.76812744140625, -0.737457275390625, -0.706787109375, -0.676116943359375, -0.64544677734375, -0.614776611328125, -0.5841064453125, -0.553436279296875, -0.52276611328125, -0.492095947265625, -0.46142578125, -0.430755615234375, -0.40008544921875, -0.369415283203125, -0.3387451171875, -0.308074951171875, -0.27740478515625, -0.246734619140625, -0.216064453125, -0.185394287109375, -0.15472412109375, -0.124053955078125, -0.0933837890625, -0.062713623046875, -0.03204345703125, -0.001373291015625, 0.029296875, 0.059967041015625, 0.09063720703125, 0.121307373046875, 0.1519775390625, 0.182647705078125, 0.21331787109375, 0.243988037109375, 0.274658203125, 0.305328369140625, 0.33599853515625, 0.366668701171875, 0.3973388671875, 0.428009033203125, 0.45867919921875, 0.489349365234375, 0.52001953125, 0.550689697265625, 0.58135986328125, 0.612030029296875, 0.6427001953125, 0.673370361328125, 0.70404052734375, 0.734710693359375, 0.765380859375, 0.796051025390625, 0.82672119140625, 0.857391357421875, 0.8880615234375, 0.918731689453125, 0.94940185546875, 0.980072021484375, 1.0107421875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 5.0, 6.0, 7.0, 9.0, 10.0, 16.0, 25.0, 25.0, 32.0, 27.0, 49.0, 49.0, 48.0, 48.0, 49.0, 63.0, 60.0, 63.0, 40.0, 56.0, 44.0, 48.0, 27.0, 38.0, 35.0, 19.0, 26.0, 12.0, 9.0, 12.0, 9.0, 3.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0017633438110351562, -0.0017117857933044434, -0.0016602277755737305, -0.0016086697578430176, -0.0015571117401123047, -0.0015055537223815918, -0.001453995704650879, -0.001402437686920166, -0.0013508796691894531, -0.0012993216514587402, -0.0012477636337280273, -0.0011962056159973145, -0.0011446475982666016, -0.0010930895805358887, -0.0010415315628051758, -0.0009899735450744629, -0.00093841552734375, -0.0008868575096130371, -0.0008352994918823242, -0.0007837414741516113, -0.0007321834564208984, -0.0006806254386901855, -0.0006290674209594727, -0.0005775094032287598, -0.0005259513854980469, -0.000474393367767334, -0.0004228353500366211, -0.0003712773323059082, -0.0003197193145751953, -0.0002681612968444824, -0.00021660327911376953, -0.00016504526138305664, -0.00011348724365234375, -6.192922592163086e-05, -1.0371208190917969e-05, 4.118680953979492e-05, 9.274482727050781e-05, 0.0001443028450012207, 0.0001958608627319336, 0.0002474188804626465, 0.0002989768981933594, 0.00035053491592407227, 0.00040209293365478516, 0.00045365095138549805, 0.0005052089691162109, 0.0005567669868469238, 0.0006083250045776367, 0.0006598830223083496, 0.0007114410400390625, 0.0007629990577697754, 0.0008145570755004883, 0.0008661150932312012, 0.0009176731109619141, 0.000969231128692627, 0.0010207891464233398, 0.0010723471641540527, 0.0011239051818847656, 0.0011754631996154785, 0.0012270212173461914, 0.0012785792350769043, 0.0013301372528076172, 0.00138169527053833, 0.001433253288269043, 0.0014848113059997559, 0.0015363693237304688]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 8.0, 0.0, 6.0, 3.0, 8.0, 5.0, 7.0, 8.0, 24.0, 24.0, 21.0, 31.0, 42.0, 39.0, 73.0, 82.0, 115.0, 178.0, 455.0, 2586.0, 1013602.0, 29722.0, 714.0, 263.0, 152.0, 87.0, 65.0, 51.0, 31.0, 28.0, 21.0, 23.0, 23.0, 10.0, 10.0, 9.0, 6.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.036411285400390625, -0.03522491455078125, -0.034038543701171875, -0.0328521728515625, -0.031665802001953125, -0.03047943115234375, -0.029293060302734375, -0.028106689453125, -0.026920318603515625, -0.02573394775390625, -0.024547576904296875, -0.0233612060546875, -0.022174835205078125, -0.02098846435546875, -0.019802093505859375, -0.01861572265625, -0.017429351806640625, -0.01624298095703125, -0.015056610107421875, -0.0138702392578125, -0.012683868408203125, -0.01149749755859375, -0.010311126708984375, -0.009124755859375, -0.007938385009765625, -0.00675201416015625, -0.005565643310546875, -0.0043792724609375, -0.003192901611328125, -0.00200653076171875, -0.000820159912109375, 0.0003662109375, 0.001552581787109375, 0.00273895263671875, 0.003925323486328125, 0.0051116943359375, 0.006298065185546875, 0.00748443603515625, 0.008670806884765625, 0.009857177734375, 0.011043548583984375, 0.01222991943359375, 0.013416290283203125, 0.0146026611328125, 0.015789031982421875, 0.01697540283203125, 0.018161773681640625, 0.01934814453125, 0.020534515380859375, 0.02172088623046875, 0.022907257080078125, 0.0240936279296875, 0.025279998779296875, 0.02646636962890625, 0.027652740478515625, 0.028839111328125, 0.030025482177734375, 0.03121185302734375, 0.032398223876953125, 0.0335845947265625, 0.034770965576171875, 0.03595733642578125, 0.037143707275390625, 0.038330078125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 12.0, 22.0, 29.0, 52.0, 92.0, 110.0, 144.0, 153.0, 156.0, 86.0, 69.0, 37.0, 24.0, 9.0, 6.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.002105479361489415, -0.002065099310129881, -0.0020247192587703466, -0.0019843392074108124, -0.0019439592724666, -0.0019035792211070657, -0.0018631991697475314, -0.0018228191183879972, -0.0017824391834437847, -0.0017420591320842505, -0.0017016790807247162, -0.0016612991457805037, -0.0016209190944209695, -0.0015805390430614352, -0.001540158991701901, -0.0014997789403423667, -0.0014593988889828324, -0.0014190188376232982, -0.001378638786263764, -0.0013382588513195515, -0.0012978787999600172, -0.001257498748600483, -0.0012171186972409487, -0.0011767386458814144, -0.0011363585945218801, -0.0010959785431623459, -0.0010555984918028116, -0.0010152185568585992, -0.0009748385054990649, -0.0009344584541395307, -0.0008940784027799964, -0.0008536983514204621, -0.0008133184164762497, -0.0007729383651167154, -0.0007325583719648421, -0.0006921783206053078, -0.0006517983274534345, -0.0006114182760939002, -0.0005710382247343659, -0.0005306581733748317, -0.0004902781220152974, -0.0004498980997595936, -0.0004095180775038898, -0.00036913802614435554, -0.00032875800388865173, -0.0002883779816329479, -0.00024799793027341366, -0.00020761790801770985, -0.0001672379148658365, -0.0001268578926101327, -8.647785580251366e-05, -4.609782627085224e-05, -5.717796739190817e-06, 3.466222551651299e-05, 7.504226232413203e-05, 0.00011542229913175106, 0.00015580232138745487, 0.00019618234364315867, 0.0002365623804507777, 0.00027694241725839674, 0.00031732243951410055, 0.00035770246176980436, 0.00039808248402550817, 0.00043846253538504243, 0.00047884255764074624]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 4.0, 15.0, 15.0, 8.0, 14.0, 17.0, 25.0, 20.0, 30.0, 21.0, 32.0, 25.0, 32.0, 39.0, 28.0, 36.0, 43.0, 36.0, 33.0, 34.0, 42.0, 39.0, 37.0, 37.0, 38.0, 31.0, 32.0, 30.0, 26.0, 24.0, 19.0, 20.0, 14.0, 10.0, 15.0, 10.0, 13.0, 8.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007726550102233887, -0.0007470259442925453, -0.000721396878361702, -0.0006957678124308586, -0.0006701387465000153, -0.0006445096805691719, -0.0006188806146383286, -0.0005932515487074852, -0.0005676224827766418, -0.0005419934168457985, -0.0005163643509149551, -0.0004907352849841118, -0.00046510621905326843, -0.0004394771531224251, -0.0004138480871915817, -0.00038821902126073837, -0.000362589955329895, -0.00033696088939905167, -0.0003113318234682083, -0.00028570275753736496, -0.0002600736916065216, -0.00023444462567567825, -0.0002088155597448349, -0.00018318649381399155, -0.0001575574278831482, -0.00013192836195230484, -0.00010629929602146149, -8.067023009061813e-05, -5.504116415977478e-05, -2.9412098228931427e-05, -3.7830322980880737e-06, 2.184603363275528e-05, 4.747509956359863e-05, 7.310416549444199e-05, 9.873323142528534e-05, 0.0001243622973561287, 0.00014999136328697205, 0.0001756204292178154, 0.00020124949514865875, 0.0002268785610795021, 0.00025250762701034546, 0.0002781366929411888, 0.00030376575887203217, 0.0003293948248028755, 0.00035502389073371887, 0.0003806529566645622, 0.0004062820225954056, 0.00043191108852624893, 0.0004575401544570923, 0.00048316922038793564, 0.000508798286318779, 0.0005344273522496223, 0.0005600564181804657, 0.000585685484111309, 0.0006113145500421524, 0.0006369436159729958, 0.0006625726819038391, 0.0006882017478346825, 0.0007138308137655258, 0.0007394598796963692, 0.0007650889456272125, 0.0007907180115580559, 0.0008163470774888992, 0.0008419761434197426, 0.0008676052093505859]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 4.0, 8.0, 14.0, 9.0, 8.0, 9.0, 20.0, 16.0, 14.0, 23.0, 30.0, 14.0, 23.0, 44.0, 30.0, 30.0, 43.0, 28.0, 40.0, 46.0, 48.0, 38.0, 33.0, 39.0, 31.0, 37.0, 32.0, 26.0, 26.0, 29.0, 31.0, 16.0, 17.0, 21.0, 12.0, 11.0, 21.0, 14.0, 8.0, 13.0, 16.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.4453125, -7.21331787109375, -6.9813232421875, -6.74932861328125, -6.517333984375, -6.28533935546875, -6.0533447265625, -5.82135009765625, -5.58935546875, -5.35736083984375, -5.1253662109375, -4.89337158203125, -4.661376953125, -4.42938232421875, -4.1973876953125, -3.96539306640625, -3.7333984375, -3.50140380859375, -3.2694091796875, -3.03741455078125, -2.805419921875, -2.57342529296875, -2.3414306640625, -2.10943603515625, -1.87744140625, -1.64544677734375, -1.4134521484375, -1.18145751953125, -0.949462890625, -0.71746826171875, -0.4854736328125, -0.25347900390625, -0.021484375, 0.21051025390625, 0.4425048828125, 0.67449951171875, 0.906494140625, 1.13848876953125, 1.3704833984375, 1.60247802734375, 1.83447265625, 2.06646728515625, 2.2984619140625, 2.53045654296875, 2.762451171875, 2.99444580078125, 3.2264404296875, 3.45843505859375, 3.6904296875, 3.92242431640625, 4.1544189453125, 4.38641357421875, 4.618408203125, 4.85040283203125, 5.0823974609375, 5.31439208984375, 5.54638671875, 5.77838134765625, 6.0103759765625, 6.24237060546875, 6.474365234375, 6.70635986328125, 6.9383544921875, 7.17034912109375, 7.40234375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 7.0, 11.0, 5.0, 8.0, 16.0, 24.0, 25.0, 49.0, 61.0, 107.0, 175.0, 296.0, 493.0, 905.0, 1616.0, 2939.0, 5550.0, 10590.0, 22013.0, 53815.0, 155357.0, 431130.0, 229212.0, 76272.0, 29136.0, 13569.0, 6691.0, 3751.0, 2046.0, 1085.0, 611.0, 377.0, 237.0, 128.0, 73.0, 46.0, 30.0, 23.0, 23.0, 15.0, 9.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.28472900390625, -5.1124267578125, -4.94012451171875, -4.767822265625, -4.59552001953125, -4.4232177734375, -4.25091552734375, -4.07861328125, -3.90631103515625, -3.7340087890625, -3.56170654296875, -3.389404296875, -3.21710205078125, -3.0447998046875, -2.87249755859375, -2.7001953125, -2.52789306640625, -2.3555908203125, -2.18328857421875, -2.010986328125, -1.83868408203125, -1.6663818359375, -1.49407958984375, -1.32177734375, -1.14947509765625, -0.9771728515625, -0.80487060546875, -0.632568359375, -0.46026611328125, -0.2879638671875, -0.11566162109375, 0.056640625, 0.22894287109375, 0.4012451171875, 0.57354736328125, 0.745849609375, 0.91815185546875, 1.0904541015625, 1.26275634765625, 1.43505859375, 1.60736083984375, 1.7796630859375, 1.95196533203125, 2.124267578125, 2.29656982421875, 2.4688720703125, 2.64117431640625, 2.8134765625, 2.98577880859375, 3.1580810546875, 3.33038330078125, 3.502685546875, 3.67498779296875, 3.8472900390625, 4.01959228515625, 4.19189453125, 4.36419677734375, 4.5364990234375, 4.70880126953125, 4.881103515625, 5.05340576171875, 5.2257080078125, 5.39801025390625, 5.5703125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 14.0, 11.0, 7.0, 30.0, 19.0, 24.0, 26.0, 29.0, 34.0, 42.0, 41.0, 63.0, 63.0, 89.0, 337.0, 1687.0, 102.0, 50.0, 56.0, 50.0, 30.0, 28.0, 43.0, 34.0, 29.0, 14.0, 19.0, 12.0, 11.0, 9.0, 13.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.4375, -25.462890625, -24.48828125, -23.513671875, -22.5390625, -21.564453125, -20.58984375, -19.615234375, -18.640625, -17.666015625, -16.69140625, -15.716796875, -14.7421875, -13.767578125, -12.79296875, -11.818359375, -10.84375, -9.869140625, -8.89453125, -7.919921875, -6.9453125, -5.970703125, -4.99609375, -4.021484375, -3.046875, -2.072265625, -1.09765625, -0.123046875, 0.8515625, 1.826171875, 2.80078125, 3.775390625, 4.75, 5.724609375, 6.69921875, 7.673828125, 8.6484375, 9.623046875, 10.59765625, 11.572265625, 12.546875, 13.521484375, 14.49609375, 15.470703125, 16.4453125, 17.419921875, 18.39453125, 19.369140625, 20.34375, 21.318359375, 22.29296875, 23.267578125, 24.2421875, 25.216796875, 26.19140625, 27.166015625, 28.140625, 29.115234375, 30.08984375, 31.064453125, 32.0390625, 33.013671875, 33.98828125, 34.962890625, 35.9375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 5.0, 8.0, 13.0, 14.0, 21.0, 13.0, 22.0, 30.0, 55.0, 46.0, 87.0, 110.0, 156.0, 215.0, 336.0, 724.0, 10956.0, 3119198.0, 11748.0, 698.0, 362.0, 227.0, 179.0, 114.0, 72.0, 65.0, 45.0, 42.0, 37.0, 26.0, 11.0, 22.0, 12.0, 8.0, 5.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-85.0625, -82.732421875, -80.40234375, -78.072265625, -75.7421875, -73.412109375, -71.08203125, -68.751953125, -66.421875, -64.091796875, -61.76171875, -59.431640625, -57.1015625, -54.771484375, -52.44140625, -50.111328125, -47.78125, -45.451171875, -43.12109375, -40.791015625, -38.4609375, -36.130859375, -33.80078125, -31.470703125, -29.140625, -26.810546875, -24.48046875, -22.150390625, -19.8203125, -17.490234375, -15.16015625, -12.830078125, -10.5, -8.169921875, -5.83984375, -3.509765625, -1.1796875, 1.150390625, 3.48046875, 5.810546875, 8.140625, 10.470703125, 12.80078125, 15.130859375, 17.4609375, 19.791015625, 22.12109375, 24.451171875, 26.78125, 29.111328125, 31.44140625, 33.771484375, 36.1015625, 38.431640625, 40.76171875, 43.091796875, 45.421875, 47.751953125, 50.08203125, 52.412109375, 54.7421875, 57.072265625, 59.40234375, 61.732421875, 64.0625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [3.0, 80.0, 740.0, 190.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.543399810791016, -7.847620487213135, -3.151841163635254, 1.5439376831054688, 6.239717483520508, 10.935497283935547, 15.631275177001953, 20.327056884765625, 25.02283477783203, 29.71861457824707, 34.41439437866211, 39.110172271728516, 43.80595397949219, 48.501731872558594, 53.197509765625, 57.89329147338867, 62.58906936645508, 67.28485107421875, 71.98062896728516, 76.67640686035156, 81.37218475341797, 86.06796264648438, 90.76374816894531, 95.45952606201172, 100.15530395507812, 104.85108184814453, 109.54685974121094, 114.24264526367188, 118.93842315673828, 123.63420104980469, 128.32998657226562, 133.0257568359375, 137.72154235839844, 142.41732788085938, 147.11309814453125, 151.8088836669922, 156.50465393066406, 161.200439453125, 165.89620971679688, 170.5919952392578, 175.28778076171875, 179.9835662841797, 184.67933654785156, 189.3751220703125, 194.07089233398438, 198.7666778564453, 203.46246337890625, 208.15823364257812, 212.85400390625, 217.54978942871094, 222.2455596923828, 226.94134521484375, 231.63711547851562, 236.33290100097656, 241.0286865234375, 245.72445678710938, 250.4202423095703, 255.11602783203125, 259.8117980957031, 264.507568359375, 269.203369140625, 273.8991394042969, 278.59490966796875, 283.29071044921875, 287.9864807128906]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 7.0, 2.0, 4.0, 3.0, 7.0, 7.0, 6.0, 7.0, 11.0, 13.0, 14.0, 11.0, 20.0, 27.0, 22.0, 28.0, 25.0, 37.0, 21.0, 45.0, 52.0, 44.0, 40.0, 36.0, 41.0, 44.0, 42.0, 44.0, 32.0, 45.0, 38.0, 26.0, 23.0, 20.0, 26.0, 15.0, 19.0, 9.0, 17.0, 4.0, 16.0, 5.0, 14.0, 6.0, 7.0, 6.0, 6.0, 3.0, 6.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.086910247802734, -57.02975082397461, -54.97259521484375, -52.915435791015625, -50.8582763671875, -48.801116943359375, -46.74395751953125, -44.68680191040039, -42.629642486572266, -40.57248306274414, -38.51532745361328, -36.458168029785156, -34.40100860595703, -32.343849182128906, -30.286691665649414, -28.229534149169922, -26.172374725341797, -24.115215301513672, -22.05805778503418, -20.000900268554688, -17.943740844726562, -15.886582374572754, -13.829423904418945, -11.772265434265137, -9.715106964111328, -7.6579484939575195, -5.600790023803711, -3.5436315536499023, -1.4864730834960938, 0.5706853866577148, 2.6278438568115234, 4.685002326965332, 6.742156982421875, 8.799315452575684, 10.856473922729492, 12.9136323928833, 14.97079086303711, 17.027950286865234, 19.085107803344727, 21.14226531982422, 23.199424743652344, 25.25658416748047, 27.31374168395996, 29.370899200439453, 31.428058624267578, 33.4852180480957, 35.54237365722656, 37.59953308105469, 39.65669250488281, 41.71385192871094, 43.77101135253906, 45.82816696166992, 47.88532638549805, 49.94248580932617, 51.99964141845703, 54.056800842285156, 56.11396026611328, 58.171119689941406, 60.22827911376953, 62.28543472290039, 64.34259033203125, 66.39974975585938, 68.4569091796875, 70.51406860351562, 72.57122802734375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 6.0, 6.0, 7.0, 11.0, 13.0, 11.0, 17.0, 19.0, 11.0, 17.0, 20.0, 23.0, 33.0, 33.0, 30.0, 34.0, 34.0, 36.0, 34.0, 38.0, 45.0, 35.0, 38.0, 38.0, 44.0, 37.0, 21.0, 31.0, 29.0, 26.0, 22.0, 22.0, 13.0, 25.0, 17.0, 15.0, 16.0, 17.0, 10.0, 14.0, 12.0, 4.0, 12.0, 3.0, 5.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.1875, -6.9527587890625, -6.718017578125, -6.4832763671875, -6.24853515625, -6.0137939453125, -5.779052734375, -5.5443115234375, -5.3095703125, -5.0748291015625, -4.840087890625, -4.6053466796875, -4.37060546875, -4.1358642578125, -3.901123046875, -3.6663818359375, -3.431640625, -3.1968994140625, -2.962158203125, -2.7274169921875, -2.49267578125, -2.2579345703125, -2.023193359375, -1.7884521484375, -1.5537109375, -1.3189697265625, -1.084228515625, -0.8494873046875, -0.61474609375, -0.3800048828125, -0.145263671875, 0.0894775390625, 0.32421875, 0.5589599609375, 0.793701171875, 1.0284423828125, 1.26318359375, 1.4979248046875, 1.732666015625, 1.9674072265625, 2.2021484375, 2.4368896484375, 2.671630859375, 2.9063720703125, 3.14111328125, 3.3758544921875, 3.610595703125, 3.8453369140625, 4.080078125, 4.3148193359375, 4.549560546875, 4.7843017578125, 5.01904296875, 5.2537841796875, 5.488525390625, 5.7232666015625, 5.9580078125, 6.1927490234375, 6.427490234375, 6.6622314453125, 6.89697265625, 7.1317138671875, 7.366455078125, 7.6011962890625, 7.8359375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 4.0, 8.0, 9.0, 18.0, 11.0, 15.0, 13.0, 13.0, 22.0, 23.0, 33.0, 35.0, 49.0, 89.0, 125.0, 225.0, 493.0, 1116.0, 3793.0, 23033.0, 526528.0, 3106704.0, 503074.0, 22602.0, 3756.0, 1207.0, 507.0, 254.0, 133.0, 67.0, 59.0, 39.0, 24.0, 26.0, 21.0, 12.0, 13.0, 15.0, 15.0, 17.0, 13.0, 11.0, 11.0, 9.0, 2.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0], "bins": [-20.328125, -19.638916015625, -18.94970703125, -18.260498046875, -17.5712890625, -16.882080078125, -16.19287109375, -15.503662109375, -14.814453125, -14.125244140625, -13.43603515625, -12.746826171875, -12.0576171875, -11.368408203125, -10.67919921875, -9.989990234375, -9.30078125, -8.611572265625, -7.92236328125, -7.233154296875, -6.5439453125, -5.854736328125, -5.16552734375, -4.476318359375, -3.787109375, -3.097900390625, -2.40869140625, -1.719482421875, -1.0302734375, -0.341064453125, 0.34814453125, 1.037353515625, 1.7265625, 2.415771484375, 3.10498046875, 3.794189453125, 4.4833984375, 5.172607421875, 5.86181640625, 6.551025390625, 7.240234375, 7.929443359375, 8.61865234375, 9.307861328125, 9.9970703125, 10.686279296875, 11.37548828125, 12.064697265625, 12.75390625, 13.443115234375, 14.13232421875, 14.821533203125, 15.5107421875, 16.199951171875, 16.88916015625, 17.578369140625, 18.267578125, 18.956787109375, 19.64599609375, 20.335205078125, 21.0244140625, 21.713623046875, 22.40283203125, 23.092041015625, 23.78125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 8.0, 12.0, 22.0, 17.0, 11.0, 16.0, 22.0, 27.0, 36.0, 41.0, 70.0, 75.0, 66.0, 77.0, 112.0, 136.0, 172.0, 233.0, 243.0, 313.0, 346.0, 361.0, 318.0, 256.0, 195.0, 157.0, 129.0, 120.0, 88.0, 74.0, 57.0, 49.0, 35.0, 32.0, 28.0, 18.0, 9.0, 15.0, 19.0, 7.0, 10.0, 6.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 4.0], "bins": [-11.515625, -11.175537109375, -10.83544921875, -10.495361328125, -10.1552734375, -9.815185546875, -9.47509765625, -9.135009765625, -8.794921875, -8.454833984375, -8.11474609375, -7.774658203125, -7.4345703125, -7.094482421875, -6.75439453125, -6.414306640625, -6.07421875, -5.734130859375, -5.39404296875, -5.053955078125, -4.7138671875, -4.373779296875, -4.03369140625, -3.693603515625, -3.353515625, -3.013427734375, -2.67333984375, -2.333251953125, -1.9931640625, -1.653076171875, -1.31298828125, -0.972900390625, -0.6328125, -0.292724609375, 0.04736328125, 0.387451171875, 0.7275390625, 1.067626953125, 1.40771484375, 1.747802734375, 2.087890625, 2.427978515625, 2.76806640625, 3.108154296875, 3.4482421875, 3.788330078125, 4.12841796875, 4.468505859375, 4.80859375, 5.148681640625, 5.48876953125, 5.828857421875, 6.1689453125, 6.509033203125, 6.84912109375, 7.189208984375, 7.529296875, 7.869384765625, 8.20947265625, 8.549560546875, 8.8896484375, 9.229736328125, 9.56982421875, 9.909912109375, 10.25]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 6.0, 6.0, 16.0, 19.0, 19.0, 24.0, 25.0, 22.0, 42.0, 51.0, 49.0, 51.0, 86.0, 98.0, 134.0, 161.0, 157.0, 217.0, 304.0, 466.0, 2008.0, 217158.0, 3949513.0, 21029.0, 800.0, 377.0, 273.0, 202.0, 142.0, 148.0, 124.0, 87.0, 79.0, 75.0, 50.0, 46.0, 43.0, 35.0, 35.0, 27.0, 22.0, 8.0, 12.0, 10.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.84375, -58.83544921875, -56.8271484375, -54.81884765625, -52.810546875, -50.80224609375, -48.7939453125, -46.78564453125, -44.77734375, -42.76904296875, -40.7607421875, -38.75244140625, -36.744140625, -34.73583984375, -32.7275390625, -30.71923828125, -28.7109375, -26.70263671875, -24.6943359375, -22.68603515625, -20.677734375, -18.66943359375, -16.6611328125, -14.65283203125, -12.64453125, -10.63623046875, -8.6279296875, -6.61962890625, -4.611328125, -2.60302734375, -0.5947265625, 1.41357421875, 3.421875, 5.43017578125, 7.4384765625, 9.44677734375, 11.455078125, 13.46337890625, 15.4716796875, 17.47998046875, 19.48828125, 21.49658203125, 23.5048828125, 25.51318359375, 27.521484375, 29.52978515625, 31.5380859375, 33.54638671875, 35.5546875, 37.56298828125, 39.5712890625, 41.57958984375, 43.587890625, 45.59619140625, 47.6044921875, 49.61279296875, 51.62109375, 53.62939453125, 55.6376953125, 57.64599609375, 59.654296875, 61.66259765625, 63.6708984375, 65.67919921875, 67.6875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 7.0, 13.0, 29.0, 41.0, 64.0, 95.0, 113.0, 134.0, 123.0, 112.0, 78.0, 85.0, 51.0, 32.0, 13.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.03321838378906, -68.19615936279297, -66.35910034179688, -64.52204132080078, -62.68497848510742, -60.84791946411133, -59.010860443115234, -57.17380142211914, -55.33673858642578, -53.49967956542969, -51.662620544433594, -49.8255615234375, -47.98849868774414, -46.15143966674805, -44.31438064575195, -42.47732162475586, -40.640262603759766, -38.80320358276367, -36.96614456176758, -35.12908172607422, -33.292022705078125, -31.45496368408203, -29.617904663085938, -27.780845642089844, -25.943784713745117, -24.106725692749023, -22.269664764404297, -20.432605743408203, -18.59554672241211, -16.758485794067383, -14.921426773071289, -13.084366798400879, -11.247306823730469, -9.410246849060059, -7.573187351226807, -5.736127853393555, -3.8990678787231445, -2.0620079040527344, -0.22494888305664062, 1.6121110916137695, 3.4491710662841797, 5.28623104095459, 7.123290538787842, 8.960350036621094, 10.797410011291504, 12.634469985961914, 14.471529006958008, 16.308589935302734, 18.145648956298828, 19.982707977294922, 21.81976890563965, 23.656827926635742, 25.49388885498047, 27.330947875976562, 29.168006896972656, 31.00506591796875, 32.842124938964844, 34.67918395996094, 36.51624298095703, 38.353302001953125, 40.190364837646484, 42.02742385864258, 43.86448287963867, 45.701541900634766, 47.538604736328125]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 7.0, 4.0, 10.0, 14.0, 3.0, 20.0, 16.0, 14.0, 21.0, 27.0, 25.0, 35.0, 37.0, 38.0, 33.0, 38.0, 46.0, 39.0, 43.0, 36.0, 49.0, 32.0, 32.0, 34.0, 38.0, 38.0, 31.0, 32.0, 26.0, 30.0, 24.0, 18.0, 22.0, 24.0, 17.0, 14.0, 7.0, 6.0, 11.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.86654281616211, -48.255897521972656, -46.6452522277832, -45.03460693359375, -43.42396545410156, -41.81332015991211, -40.202674865722656, -38.5920295715332, -36.98138427734375, -35.3707389831543, -33.760093688964844, -32.149452209472656, -30.538806915283203, -28.92816162109375, -27.317516326904297, -25.706871032714844, -24.096229553222656, -22.485584259033203, -20.874940872192383, -19.26429557800293, -17.65365219116211, -16.043006896972656, -14.432361602783203, -12.821717262268066, -11.21107292175293, -9.600428581237793, -7.989783763885498, -6.379138946533203, -4.768494606018066, -3.1578502655029297, -1.5472049713134766, 0.06343936920166016, 1.6740798950195312, 3.284724473953247, 4.895369052886963, 6.506013870239258, 8.116658210754395, 9.727302551269531, 11.337947845458984, 12.948592185974121, 14.559236526489258, 16.16988182067871, 17.78052520751953, 19.391170501708984, 21.001815795898438, 22.612459182739258, 24.22310447692871, 25.83374786376953, 27.444393157958984, 29.055038452148438, 30.665681838989258, 32.276329040527344, 33.88697052001953, 35.497615814208984, 37.10826110839844, 38.71890640258789, 40.329551696777344, 41.9401969909668, 43.55084228515625, 45.16148376464844, 46.77212905883789, 48.382774353027344, 49.9934196472168, 51.60406494140625, 53.21470642089844]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 10.0, 7.0, 11.0, 8.0, 14.0, 13.0, 16.0, 12.0, 15.0, 21.0, 20.0, 31.0, 14.0, 22.0, 25.0, 31.0, 26.0, 27.0, 49.0, 36.0, 44.0, 35.0, 34.0, 38.0, 36.0, 37.0, 53.0, 33.0, 24.0, 26.0, 22.0, 26.0, 25.0, 31.0, 16.0, 21.0, 10.0, 15.0, 16.0, 8.0, 9.0, 5.0, 7.0, 7.0, 2.0, 3.0, 2.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.1328125, -6.90472412109375, -6.6766357421875, -6.44854736328125, -6.220458984375, -5.99237060546875, -5.7642822265625, -5.53619384765625, -5.30810546875, -5.08001708984375, -4.8519287109375, -4.62384033203125, -4.395751953125, -4.16766357421875, -3.9395751953125, -3.71148681640625, -3.4833984375, -3.25531005859375, -3.0272216796875, -2.79913330078125, -2.571044921875, -2.34295654296875, -2.1148681640625, -1.88677978515625, -1.65869140625, -1.43060302734375, -1.2025146484375, -0.97442626953125, -0.746337890625, -0.51824951171875, -0.2901611328125, -0.06207275390625, 0.166015625, 0.39410400390625, 0.6221923828125, 0.85028076171875, 1.078369140625, 1.30645751953125, 1.5345458984375, 1.76263427734375, 1.99072265625, 2.21881103515625, 2.4468994140625, 2.67498779296875, 2.903076171875, 3.13116455078125, 3.3592529296875, 3.58734130859375, 3.8154296875, 4.04351806640625, 4.2716064453125, 4.49969482421875, 4.727783203125, 4.95587158203125, 5.1839599609375, 5.41204833984375, 5.64013671875, 5.86822509765625, 6.0963134765625, 6.32440185546875, 6.552490234375, 6.78057861328125, 7.0086669921875, 7.23675537109375, 7.46484375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 13.0, 23.0, 32.0, 42.0, 86.0, 137.0, 189.0, 354.0, 583.0, 912.0, 1400.0, 2046.0, 3268.0, 4979.0, 7319.0, 11651.0, 18109.0, 28930.0, 46520.0, 76119.0, 128777.0, 216045.0, 198711.0, 116524.0, 69437.0, 42427.0, 26546.0, 16667.0, 10708.0, 7053.0, 4737.0, 2914.0, 1954.0, 1221.0, 780.0, 499.0, 291.0, 202.0, 127.0, 79.0, 52.0, 35.0, 16.0, 17.0, 7.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.2578125, -1.2207183837890625, -1.183624267578125, -1.1465301513671875, -1.10943603515625, -1.0723419189453125, -1.035247802734375, -0.9981536865234375, -0.9610595703125, -0.9239654541015625, -0.886871337890625, -0.8497772216796875, -0.81268310546875, -0.7755889892578125, -0.738494873046875, -0.7014007568359375, -0.664306640625, -0.6272125244140625, -0.590118408203125, -0.5530242919921875, -0.51593017578125, -0.4788360595703125, -0.441741943359375, -0.4046478271484375, -0.3675537109375, -0.3304595947265625, -0.293365478515625, -0.2562713623046875, -0.21917724609375, -0.1820831298828125, -0.144989013671875, -0.1078948974609375, -0.07080078125, -0.0337066650390625, 0.003387451171875, 0.0404815673828125, 0.07757568359375, 0.1146697998046875, 0.151763916015625, 0.1888580322265625, 0.2259521484375, 0.2630462646484375, 0.300140380859375, 0.3372344970703125, 0.37432861328125, 0.4114227294921875, 0.448516845703125, 0.4856109619140625, 0.522705078125, 0.5597991943359375, 0.596893310546875, 0.6339874267578125, 0.67108154296875, 0.7081756591796875, 0.745269775390625, 0.7823638916015625, 0.8194580078125, 0.8565521240234375, 0.893646240234375, 0.9307403564453125, 0.96783447265625, 1.0049285888671875, 1.042022705078125, 1.0791168212890625, 1.1162109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 13.0, 17.0, 15.0, 20.0, 21.0, 23.0, 20.0, 33.0, 34.0, 38.0, 46.0, 48.0, 40.0, 42.0, 43.0, 40.0, 1066.0, 56.0, 45.0, 42.0, 34.0, 30.0, 42.0, 29.0, 32.0, 23.0, 24.0, 20.0, 10.0, 21.0, 5.0, 11.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.640625, -5.46484375, -5.2890625, -5.11328125, -4.9375, -4.76171875, -4.5859375, -4.41015625, -4.234375, -4.05859375, -3.8828125, -3.70703125, -3.53125, -3.35546875, -3.1796875, -3.00390625, -2.828125, -2.65234375, -2.4765625, -2.30078125, -2.125, -1.94921875, -1.7734375, -1.59765625, -1.421875, -1.24609375, -1.0703125, -0.89453125, -0.71875, -0.54296875, -0.3671875, -0.19140625, -0.015625, 0.16015625, 0.3359375, 0.51171875, 0.6875, 0.86328125, 1.0390625, 1.21484375, 1.390625, 1.56640625, 1.7421875, 1.91796875, 2.09375, 2.26953125, 2.4453125, 2.62109375, 2.796875, 2.97265625, 3.1484375, 3.32421875, 3.5, 3.67578125, 3.8515625, 4.02734375, 4.203125, 4.37890625, 4.5546875, 4.73046875, 4.90625, 5.08203125, 5.2578125, 5.43359375, 5.609375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 10.0, 12.0, 8.0, 20.0, 39.0, 39.0, 76.0, 111.0, 153.0, 216.0, 326.0, 516.0, 819.0, 1269.0, 2003.0, 3180.0, 4893.0, 7964.0, 12811.0, 20387.0, 32579.0, 53967.0, 89005.0, 146293.0, 1264745.0, 176899.0, 107427.0, 65455.0, 39849.0, 24527.0, 15296.0, 9637.0, 6050.0, 3790.0, 2446.0, 1513.0, 963.0, 616.0, 450.0, 271.0, 171.0, 129.0, 71.0, 50.0, 28.0, 23.0, 15.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1279296875, -1.09234619140625, -1.0567626953125, -1.02117919921875, -0.985595703125, -0.95001220703125, -0.9144287109375, -0.87884521484375, -0.84326171875, -0.80767822265625, -0.7720947265625, -0.73651123046875, -0.700927734375, -0.66534423828125, -0.6297607421875, -0.59417724609375, -0.55859375, -0.52301025390625, -0.4874267578125, -0.45184326171875, -0.416259765625, -0.38067626953125, -0.3450927734375, -0.30950927734375, -0.27392578125, -0.23834228515625, -0.2027587890625, -0.16717529296875, -0.131591796875, -0.09600830078125, -0.0604248046875, -0.02484130859375, 0.0107421875, 0.04632568359375, 0.0819091796875, 0.11749267578125, 0.153076171875, 0.18865966796875, 0.2242431640625, 0.25982666015625, 0.29541015625, 0.33099365234375, 0.3665771484375, 0.40216064453125, 0.437744140625, 0.47332763671875, 0.5089111328125, 0.54449462890625, 0.580078125, 0.61566162109375, 0.6512451171875, 0.68682861328125, 0.722412109375, 0.75799560546875, 0.7935791015625, 0.82916259765625, 0.86474609375, 0.90032958984375, 0.9359130859375, 0.97149658203125, 1.007080078125, 1.04266357421875, 1.0782470703125, 1.11383056640625, 1.1494140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 9.0, 15.0, 15.0, 14.0, 30.0, 30.0, 33.0, 52.0, 43.0, 37.0, 50.0, 49.0, 63.0, 51.0, 52.0, 56.0, 44.0, 52.0, 31.0, 41.0, 31.0, 21.0, 26.0, 20.0, 29.0, 15.0, 14.0, 7.0, 12.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0], "bins": [-0.001979827880859375, -0.0019268542528152466, -0.0018738806247711182, -0.0018209069967269897, -0.0017679333686828613, -0.001714959740638733, -0.0016619861125946045, -0.001609012484550476, -0.0015560388565063477, -0.0015030652284622192, -0.0014500916004180908, -0.0013971179723739624, -0.001344144344329834, -0.0012911707162857056, -0.0012381970882415771, -0.0011852234601974487, -0.0011322498321533203, -0.001079276204109192, -0.0010263025760650635, -0.0009733289480209351, -0.0009203553199768066, -0.0008673816919326782, -0.0008144080638885498, -0.0007614344358444214, -0.000708460807800293, -0.0006554871797561646, -0.0006025135517120361, -0.0005495399236679077, -0.0004965662956237793, -0.0004435926675796509, -0.00039061903953552246, -0.00033764541149139404, -0.0002846717834472656, -0.0002316981554031372, -0.0001787245273590088, -0.00012575089931488037, -7.277727127075195e-05, -1.9803643226623535e-05, 3.316998481750488e-05, 8.61436128616333e-05, 0.00013911724090576172, 0.00019209086894989014, 0.00024506449699401855, 0.00029803812503814697, 0.0003510117530822754, 0.0004039853811264038, 0.0004569590091705322, 0.0005099326372146606, 0.0005629062652587891, 0.0006158798933029175, 0.0006688535213470459, 0.0007218271493911743, 0.0007748007774353027, 0.0008277744054794312, 0.0008807480335235596, 0.000933721661567688, 0.0009866952896118164, 0.0010396689176559448, 0.0010926425457000732, 0.0011456161737442017, 0.00119858980178833, 0.0012515634298324585, 0.001304537057876587, 0.0013575106859207153, 0.0014104843139648438]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 8.0, 8.0, 12.0, 10.0, 14.0, 23.0, 27.0, 25.0, 32.0, 39.0, 49.0, 82.0, 113.0, 153.0, 411.0, 1812.0, 1029906.0, 14499.0, 617.0, 211.0, 126.0, 90.0, 61.0, 47.0, 29.0, 34.0, 19.0, 18.0, 15.0, 8.0, 8.0, 9.0, 5.0, 1.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.03765869140625, -0.03629875183105469, -0.034938812255859375, -0.03357887268066406, -0.03221893310546875, -0.030858993530273438, -0.029499053955078125, -0.028139114379882812, -0.0267791748046875, -0.025419235229492188, -0.024059295654296875, -0.022699356079101562, -0.02133941650390625, -0.019979476928710938, -0.018619537353515625, -0.017259597778320312, -0.015899658203125, -0.014539718627929688, -0.013179779052734375, -0.011819839477539062, -0.01045989990234375, -0.009099960327148438, -0.007740020751953125, -0.0063800811767578125, -0.0050201416015625, -0.0036602020263671875, -0.002300262451171875, -0.0009403228759765625, 0.00041961669921875, 0.0017795562744140625, 0.003139495849609375, 0.0044994354248046875, 0.005859375, 0.0072193145751953125, 0.008579254150390625, 0.009939193725585938, 0.01129913330078125, 0.012659072875976562, 0.014019012451171875, 0.015378952026367188, 0.0167388916015625, 0.018098831176757812, 0.019458770751953125, 0.020818710327148438, 0.02217864990234375, 0.023538589477539062, 0.024898529052734375, 0.026258468627929688, 0.027618408203125, 0.028978347778320312, 0.030338287353515625, 0.03169822692871094, 0.03305816650390625, 0.03441810607910156, 0.035778045654296875, 0.03713798522949219, 0.0384979248046875, 0.03985786437988281, 0.041217803955078125, 0.04257774353027344, 0.04393768310546875, 0.04529762268066406, 0.046657562255859375, 0.04801750183105469, 0.04937744140625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 62.0, 463.0, 423.0, 62.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006158868200145662, -0.00046125007793307304, -0.00030661336495541036, -0.00015197665197774768, 2.6600901037454605e-06, 0.0001572968321852386, 0.0003119335160590708, 0.0004665703163482249, 0.0006212070002220571, 0.0007758437423035502, 0.0009304804261773825, 0.0010851172264665365, 0.0012397539103403687, 0.001394390594214201, 0.001549027394503355, 0.001703664194792509, 0.0018583007622510195, 0.0020129375625401735, 0.002167574129998684, 0.002322210930287838, 0.002476847730576992, 0.002631484530866146, 0.0027861210983246565, 0.0029407578986138105, 0.0030953946989029646, 0.0032500314991921186, 0.003404668066650629, 0.003559304866939783, 0.003713941667228937, 0.003868578467518091, 0.004023214802145958, 0.004177851602435112, 0.004332488868385553, 0.004487125668674707, 0.0046417624689638615, 0.004796398803591728, 0.004951035603880882, 0.005105672404170036, 0.00526030920445919, 0.005414946004748344, 0.0055695828050374985, 0.0057242196053266525, 0.005878856405615807, 0.006033493205904961, 0.006188129540532827, 0.006342766340821981, 0.0064974031411111355, 0.0066520399414002895, 0.006806676276028156, 0.00696131307631731, 0.007115949876606464, 0.0072705866768956184, 0.007425223011523485, 0.007579859811812639, 0.007734496612101793, 0.00788913294672966, 0.008043770678341389, 0.008198407478630543, 0.008353044278919697, 0.00850768107920885, 0.008662317879498005, 0.008816954679787159, 0.008971590548753738, 0.009126227349042892, 0.009280864149332047]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 11.0, 10.0, 8.0, 8.0, 13.0, 13.0, 12.0, 21.0, 19.0, 25.0, 23.0, 34.0, 27.0, 35.0, 37.0, 39.0, 45.0, 44.0, 50.0, 41.0, 38.0, 32.0, 39.0, 32.0, 32.0, 36.0, 27.0, 32.0, 33.0, 36.0, 21.0, 31.0, 17.0, 16.0, 12.0, 14.0, 12.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00106126070022583, -0.0010304655879735947, -0.0009996704757213593, -0.0009688753634691238, -0.0009380802512168884, -0.000907285138964653, -0.0008764900267124176, -0.0008456949144601822, -0.0008148998022079468, -0.0007841046899557114, -0.000753309577703476, -0.0007225144654512405, -0.0006917193531990051, -0.0006609242409467697, -0.0006301291286945343, -0.0005993340164422989, -0.0005685389041900635, -0.0005377437919378281, -0.0005069486796855927, -0.00047615356743335724, -0.0004453584551811218, -0.0004145633429288864, -0.000383768230676651, -0.0003529731184244156, -0.0003221780061721802, -0.00029138289391994476, -0.00026058778166770935, -0.00022979266941547394, -0.00019899755716323853, -0.0001682024449110031, -0.0001374073326587677, -0.00010661222040653229, -7.581710815429688e-05, -4.502199590206146e-05, -1.422688364982605e-05, 1.6568228602409363e-05, 4.7363340854644775e-05, 7.815845310688019e-05, 0.0001089535653591156, 0.000139748677611351, 0.00017054378986358643, 0.00020133890211582184, 0.00023213401436805725, 0.00026292912662029266, 0.0002937242388725281, 0.0003245193511247635, 0.0003553144633769989, 0.0003861095756292343, 0.0004169046878814697, 0.00044769980013370514, 0.00047849491238594055, 0.000509290024638176, 0.0005400851368904114, 0.0005708802491426468, 0.0006016753613948822, 0.0006324704736471176, 0.000663265585899353, 0.0006940606981515884, 0.0007248558104038239, 0.0007556509226560593, 0.0007864460349082947, 0.0008172411471605301, 0.0008480362594127655, 0.0008788313716650009, 0.0009096264839172363]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 10.0, 7.0, 11.0, 8.0, 14.0, 13.0, 16.0, 12.0, 15.0, 21.0, 20.0, 31.0, 14.0, 23.0, 24.0, 31.0, 26.0, 27.0, 49.0, 36.0, 44.0, 35.0, 34.0, 38.0, 36.0, 37.0, 53.0, 33.0, 24.0, 26.0, 22.0, 26.0, 25.0, 31.0, 16.0, 21.0, 10.0, 15.0, 16.0, 8.0, 9.0, 5.0, 7.0, 7.0, 2.0, 3.0, 2.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.1328125, -6.90472412109375, -6.6766357421875, -6.44854736328125, -6.220458984375, -5.99237060546875, -5.7642822265625, -5.53619384765625, -5.30810546875, -5.08001708984375, -4.8519287109375, -4.62384033203125, -4.395751953125, -4.16766357421875, -3.9395751953125, -3.71148681640625, -3.4833984375, -3.25531005859375, -3.0272216796875, -2.79913330078125, -2.571044921875, -2.34295654296875, -2.1148681640625, -1.88677978515625, -1.65869140625, -1.43060302734375, -1.2025146484375, -0.97442626953125, -0.746337890625, -0.51824951171875, -0.2901611328125, -0.06207275390625, 0.166015625, 0.39410400390625, 0.6221923828125, 0.85028076171875, 1.078369140625, 1.30645751953125, 1.5345458984375, 1.76263427734375, 1.99072265625, 2.21881103515625, 2.4468994140625, 2.67498779296875, 2.903076171875, 3.13116455078125, 3.3592529296875, 3.58734130859375, 3.8154296875, 4.04351806640625, 4.2716064453125, 4.49969482421875, 4.727783203125, 4.95587158203125, 5.1839599609375, 5.41204833984375, 5.64013671875, 5.86822509765625, 6.0963134765625, 6.32440185546875, 6.552490234375, 6.78057861328125, 7.0086669921875, 7.23675537109375, 7.46484375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 9.0, 11.0, 9.0, 22.0, 25.0, 39.0, 46.0, 69.0, 74.0, 91.0, 109.0, 172.0, 248.0, 421.0, 791.0, 1592.0, 3644.0, 8697.0, 23064.0, 61624.0, 180445.0, 477799.0, 186153.0, 63537.0, 23431.0, 8879.0, 3679.0, 1649.0, 831.0, 435.0, 290.0, 151.0, 133.0, 90.0, 50.0, 53.0, 35.0, 28.0, 19.0, 22.0, 17.0, 12.0, 16.0, 10.0, 8.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.953125, -6.717529296875, -6.48193359375, -6.246337890625, -6.0107421875, -5.775146484375, -5.53955078125, -5.303955078125, -5.068359375, -4.832763671875, -4.59716796875, -4.361572265625, -4.1259765625, -3.890380859375, -3.65478515625, -3.419189453125, -3.18359375, -2.947998046875, -2.71240234375, -2.476806640625, -2.2412109375, -2.005615234375, -1.77001953125, -1.534423828125, -1.298828125, -1.063232421875, -0.82763671875, -0.592041015625, -0.3564453125, -0.120849609375, 0.11474609375, 0.350341796875, 0.5859375, 0.821533203125, 1.05712890625, 1.292724609375, 1.5283203125, 1.763916015625, 1.99951171875, 2.235107421875, 2.470703125, 2.706298828125, 2.94189453125, 3.177490234375, 3.4130859375, 3.648681640625, 3.88427734375, 4.119873046875, 4.35546875, 4.591064453125, 4.82666015625, 5.062255859375, 5.2978515625, 5.533447265625, 5.76904296875, 6.004638671875, 6.240234375, 6.475830078125, 6.71142578125, 6.947021484375, 7.1826171875, 7.418212890625, 7.65380859375, 7.889404296875, 8.125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 2.0, 7.0, 9.0, 13.0, 9.0, 11.0, 20.0, 18.0, 23.0, 23.0, 36.0, 27.0, 30.0, 42.0, 52.0, 53.0, 54.0, 136.0, 1710.0, 260.0, 79.0, 61.0, 50.0, 33.0, 44.0, 38.0, 26.0, 27.0, 22.0, 19.0, 17.0, 16.0, 12.0, 15.0, 10.0, 12.0, 6.0, 8.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-27.390625, -26.57861328125, -25.7666015625, -24.95458984375, -24.142578125, -23.33056640625, -22.5185546875, -21.70654296875, -20.89453125, -20.08251953125, -19.2705078125, -18.45849609375, -17.646484375, -16.83447265625, -16.0224609375, -15.21044921875, -14.3984375, -13.58642578125, -12.7744140625, -11.96240234375, -11.150390625, -10.33837890625, -9.5263671875, -8.71435546875, -7.90234375, -7.09033203125, -6.2783203125, -5.46630859375, -4.654296875, -3.84228515625, -3.0302734375, -2.21826171875, -1.40625, -0.59423828125, 0.2177734375, 1.02978515625, 1.841796875, 2.65380859375, 3.4658203125, 4.27783203125, 5.08984375, 5.90185546875, 6.7138671875, 7.52587890625, 8.337890625, 9.14990234375, 9.9619140625, 10.77392578125, 11.5859375, 12.39794921875, 13.2099609375, 14.02197265625, 14.833984375, 15.64599609375, 16.4580078125, 17.27001953125, 18.08203125, 18.89404296875, 19.7060546875, 20.51806640625, 21.330078125, 22.14208984375, 22.9541015625, 23.76611328125, 24.578125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 8.0, 12.0, 12.0, 25.0, 25.0, 35.0, 37.0, 31.0, 46.0, 57.0, 107.0, 94.0, 183.0, 251.0, 472.0, 801.0, 2646.0, 459542.0, 2674891.0, 3939.0, 1030.0, 488.0, 254.0, 167.0, 108.0, 89.0, 58.0, 57.0, 42.0, 38.0, 19.0, 33.0, 13.0, 11.0, 10.0, 11.0, 8.0, 9.0, 8.0, 4.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-61.40625, -59.5498046875, -57.693359375, -55.8369140625, -53.98046875, -52.1240234375, -50.267578125, -48.4111328125, -46.5546875, -44.6982421875, -42.841796875, -40.9853515625, -39.12890625, -37.2724609375, -35.416015625, -33.5595703125, -31.703125, -29.8466796875, -27.990234375, -26.1337890625, -24.27734375, -22.4208984375, -20.564453125, -18.7080078125, -16.8515625, -14.9951171875, -13.138671875, -11.2822265625, -9.42578125, -7.5693359375, -5.712890625, -3.8564453125, -2.0, -0.1435546875, 1.712890625, 3.5693359375, 5.42578125, 7.2822265625, 9.138671875, 10.9951171875, 12.8515625, 14.7080078125, 16.564453125, 18.4208984375, 20.27734375, 22.1337890625, 23.990234375, 25.8466796875, 27.703125, 29.5595703125, 31.416015625, 33.2724609375, 35.12890625, 36.9853515625, 38.841796875, 40.6982421875, 42.5546875, 44.4111328125, 46.267578125, 48.1240234375, 49.98046875, 51.8369140625, 53.693359375, 55.5498046875, 57.40625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 68.0, 672.0, 260.0, 13.0, 1.0, 2.0], "bins": [-266.497802734375, -262.031005859375, -257.5642395019531, -253.09744262695312, -248.6306610107422, -244.16387939453125, -239.69708251953125, -235.2303009033203, -230.76351928710938, -226.29673767089844, -221.8299560546875, -217.3631591796875, -212.89637756347656, -208.42959594726562, -203.96279907226562, -199.4960174560547, -195.02923583984375, -190.5624542236328, -186.09567260742188, -181.62887573242188, -177.16209411621094, -172.6953125, -168.228515625, -163.76173400878906, -159.29495239257812, -154.8281707763672, -150.36138916015625, -145.89459228515625, -141.4278106689453, -136.96102905273438, -132.49423217773438, -128.02745056152344, -123.56065368652344, -119.0938720703125, -114.62708282470703, -110.16029357910156, -105.69351196289062, -101.22673034667969, -96.75994110107422, -92.29315185546875, -87.82637023925781, -83.35958862304688, -78.8927993774414, -74.42601013183594, -69.959228515625, -65.49244689941406, -61.025657653808594, -56.55887222290039, -52.09208679199219, -47.625301361083984, -43.15851593017578, -38.69173049926758, -34.224945068359375, -29.758159637451172, -25.29137420654297, -20.824588775634766, -16.357803344726562, -11.89101791381836, -7.424232482910156, -2.957447052001953, 1.50933837890625, 5.976123809814453, 10.442909240722656, 14.90969467163086, 19.376480102539062]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 7.0, 8.0, 12.0, 8.0, 13.0, 16.0, 17.0, 12.0, 13.0, 22.0, 23.0, 34.0, 32.0, 34.0, 42.0, 28.0, 44.0, 39.0, 35.0, 38.0, 27.0, 41.0, 36.0, 40.0, 38.0, 36.0, 32.0, 37.0, 28.0, 29.0, 23.0, 16.0, 15.0, 22.0, 16.0, 14.0, 15.0, 13.0, 7.0, 10.0, 8.0, 8.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-67.62173461914062, -65.60232543945312, -63.582908630371094, -61.56349563598633, -59.54408264160156, -57.5246696472168, -55.50525665283203, -53.485843658447266, -51.4664306640625, -49.447017669677734, -47.42760467529297, -45.4081916809082, -43.38877868652344, -41.36936569213867, -39.349952697753906, -37.33053970336914, -35.311126708984375, -33.29171371459961, -31.272300720214844, -29.252887725830078, -27.233474731445312, -25.214061737060547, -23.19464874267578, -21.175235748291016, -19.15582275390625, -17.136409759521484, -15.116996765136719, -13.097583770751953, -11.078170776367188, -9.058757781982422, -7.039344787597656, -5.019931793212891, -3.0005264282226562, -0.9811134338378906, 1.038299560546875, 3.0577125549316406, 5.077125549316406, 7.096538543701172, 9.115951538085938, 11.135364532470703, 13.154777526855469, 15.174190521240234, 17.193603515625, 19.213016510009766, 21.23242950439453, 23.251842498779297, 25.271255493164062, 27.290668487548828, 29.310081481933594, 31.32949447631836, 33.348907470703125, 35.36832046508789, 37.387733459472656, 39.40714645385742, 41.42655944824219, 43.44597244262695, 45.46538543701172, 47.484798431396484, 49.50421142578125, 51.523624420166016, 53.54303741455078, 55.56245040893555, 57.58186340332031, 59.60127639770508, 61.620689392089844]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 11.0, 7.0, 10.0, 16.0, 15.0, 15.0, 20.0, 26.0, 20.0, 28.0, 19.0, 30.0, 28.0, 31.0, 32.0, 38.0, 57.0, 49.0, 40.0, 37.0, 36.0, 37.0, 27.0, 41.0, 38.0, 29.0, 23.0, 28.0, 25.0, 29.0, 17.0, 18.0, 18.0, 14.0, 12.0, 9.0, 12.0, 9.0, 6.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-8.015625, -7.764892578125, -7.51416015625, -7.263427734375, -7.0126953125, -6.761962890625, -6.51123046875, -6.260498046875, -6.009765625, -5.759033203125, -5.50830078125, -5.257568359375, -5.0068359375, -4.756103515625, -4.50537109375, -4.254638671875, -4.00390625, -3.753173828125, -3.50244140625, -3.251708984375, -3.0009765625, -2.750244140625, -2.49951171875, -2.248779296875, -1.998046875, -1.747314453125, -1.49658203125, -1.245849609375, -0.9951171875, -0.744384765625, -0.49365234375, -0.242919921875, 0.0078125, 0.258544921875, 0.50927734375, 0.760009765625, 1.0107421875, 1.261474609375, 1.51220703125, 1.762939453125, 2.013671875, 2.264404296875, 2.51513671875, 2.765869140625, 3.0166015625, 3.267333984375, 3.51806640625, 3.768798828125, 4.01953125, 4.270263671875, 4.52099609375, 4.771728515625, 5.0224609375, 5.273193359375, 5.52392578125, 5.774658203125, 6.025390625, 6.276123046875, 6.52685546875, 6.777587890625, 7.0283203125, 7.279052734375, 7.52978515625, 7.780517578125, 8.03125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 3.0, 2.0, 7.0, 4.0, 10.0, 9.0, 12.0, 10.0, 21.0, 18.0, 31.0, 24.0, 44.0, 49.0, 68.0, 58.0, 120.0, 180.0, 311.0, 768.0, 2952.0, 25932.0, 1128912.0, 2921941.0, 103854.0, 6368.0, 1316.0, 465.0, 227.0, 136.0, 92.0, 59.0, 57.0, 38.0, 32.0, 33.0, 20.0, 21.0, 13.0, 14.0, 9.0, 7.0, 10.0, 6.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-26.0, -25.166748046875, -24.33349609375, -23.500244140625, -22.6669921875, -21.833740234375, -21.00048828125, -20.167236328125, -19.333984375, -18.500732421875, -17.66748046875, -16.834228515625, -16.0009765625, -15.167724609375, -14.33447265625, -13.501220703125, -12.66796875, -11.834716796875, -11.00146484375, -10.168212890625, -9.3349609375, -8.501708984375, -7.66845703125, -6.835205078125, -6.001953125, -5.168701171875, -4.33544921875, -3.502197265625, -2.6689453125, -1.835693359375, -1.00244140625, -0.169189453125, 0.6640625, 1.497314453125, 2.33056640625, 3.163818359375, 3.9970703125, 4.830322265625, 5.66357421875, 6.496826171875, 7.330078125, 8.163330078125, 8.99658203125, 9.829833984375, 10.6630859375, 11.496337890625, 12.32958984375, 13.162841796875, 13.99609375, 14.829345703125, 15.66259765625, 16.495849609375, 17.3291015625, 18.162353515625, 18.99560546875, 19.828857421875, 20.662109375, 21.495361328125, 22.32861328125, 23.161865234375, 23.9951171875, 24.828369140625, 25.66162109375, 26.494873046875, 27.328125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 10.0, 9.0, 5.0, 15.0, 23.0, 26.0, 45.0, 62.0, 98.0, 146.0, 172.0, 280.0, 433.0, 586.0, 653.0, 511.0, 344.0, 230.0, 137.0, 95.0, 58.0, 48.0, 34.0, 19.0, 12.0, 6.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.34375, -18.72314453125, -18.1025390625, -17.48193359375, -16.861328125, -16.24072265625, -15.6201171875, -14.99951171875, -14.37890625, -13.75830078125, -13.1376953125, -12.51708984375, -11.896484375, -11.27587890625, -10.6552734375, -10.03466796875, -9.4140625, -8.79345703125, -8.1728515625, -7.55224609375, -6.931640625, -6.31103515625, -5.6904296875, -5.06982421875, -4.44921875, -3.82861328125, -3.2080078125, -2.58740234375, -1.966796875, -1.34619140625, -0.7255859375, -0.10498046875, 0.515625, 1.13623046875, 1.7568359375, 2.37744140625, 2.998046875, 3.61865234375, 4.2392578125, 4.85986328125, 5.48046875, 6.10107421875, 6.7216796875, 7.34228515625, 7.962890625, 8.58349609375, 9.2041015625, 9.82470703125, 10.4453125, 11.06591796875, 11.6865234375, 12.30712890625, 12.927734375, 13.54833984375, 14.1689453125, 14.78955078125, 15.41015625, 16.03076171875, 16.6513671875, 17.27197265625, 17.892578125, 18.51318359375, 19.1337890625, 19.75439453125, 20.375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 6.0, 14.0, 4.0, 19.0, 40.0, 43.0, 68.0, 91.0, 125.0, 201.0, 224.0, 370.0, 638.0, 5900.0, 4141783.0, 42478.0, 881.0, 359.0, 241.0, 190.0, 140.0, 122.0, 114.0, 64.0, 50.0, 42.0, 22.0, 8.0, 9.0, 17.0, 5.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-111.6875, -108.2666015625, -104.845703125, -101.4248046875, -98.00390625, -94.5830078125, -91.162109375, -87.7412109375, -84.3203125, -80.8994140625, -77.478515625, -74.0576171875, -70.63671875, -67.2158203125, -63.794921875, -60.3740234375, -56.953125, -53.5322265625, -50.111328125, -46.6904296875, -43.26953125, -39.8486328125, -36.427734375, -33.0068359375, -29.5859375, -26.1650390625, -22.744140625, -19.3232421875, -15.90234375, -12.4814453125, -9.060546875, -5.6396484375, -2.21875, 1.2021484375, 4.623046875, 8.0439453125, 11.46484375, 14.8857421875, 18.306640625, 21.7275390625, 25.1484375, 28.5693359375, 31.990234375, 35.4111328125, 38.83203125, 42.2529296875, 45.673828125, 49.0947265625, 52.515625, 55.9365234375, 59.357421875, 62.7783203125, 66.19921875, 69.6201171875, 73.041015625, 76.4619140625, 79.8828125, 83.3037109375, 86.724609375, 90.1455078125, 93.56640625, 96.9873046875, 100.408203125, 103.8291015625, 107.25]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 27.0, 186.0, 464.0, 275.0, 48.0, 11.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-360.4863586425781, -353.8907470703125, -347.2951354980469, -340.69952392578125, -334.1039123535156, -327.50830078125, -320.9126892089844, -314.31707763671875, -307.72149658203125, -301.1258850097656, -294.5302734375, -287.9346618652344, -281.33905029296875, -274.7434387207031, -268.1478271484375, -261.55224609375, -254.95660400390625, -248.36099243164062, -241.765380859375, -235.16976928710938, -228.57415771484375, -221.97854614257812, -215.38294982910156, -208.78733825683594, -202.1917266845703, -195.5961151123047, -189.00050354003906, -182.40489196777344, -175.80929565429688, -169.21368408203125, -162.61807250976562, -156.0224609375, -149.42684936523438, -142.83123779296875, -136.23562622070312, -129.6400146484375, -123.0444107055664, -116.44879913330078, -109.85319519042969, -103.25758361816406, -96.66197204589844, -90.06636047363281, -83.47074890136719, -76.8751449584961, -70.27953338623047, -63.683921813964844, -57.088314056396484, -50.492706298828125, -43.897090911865234, -37.301483154296875, -30.70587158203125, -24.110261917114258, -17.514652252197266, -10.91904067993164, -4.323432922363281, 2.272174835205078, 8.867786407470703, 15.463396072387695, 22.059005737304688, 28.65461540222168, 35.25022506713867, 41.8458366394043, 48.441444396972656, 55.037052154541016, 61.63266372680664]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 6.0, 8.0, 11.0, 8.0, 10.0, 12.0, 13.0, 16.0, 26.0, 25.0, 33.0, 28.0, 28.0, 32.0, 37.0, 50.0, 35.0, 39.0, 36.0, 40.0, 53.0, 36.0, 54.0, 36.0, 30.0, 33.0, 34.0, 26.0, 34.0, 25.0, 16.0, 18.0, 16.0, 21.0, 12.0, 15.0, 5.0, 15.0, 7.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.81153106689453, -48.25680923461914, -46.70208740234375, -45.147361755371094, -43.5926399230957, -42.03791809082031, -40.48319625854492, -38.92847442626953, -37.37375259399414, -35.81903076171875, -34.26430892944336, -32.70958709716797, -31.154863357543945, -29.600139617919922, -28.04541778564453, -26.49069595336914, -24.935972213745117, -23.381250381469727, -21.826526641845703, -20.271804809570312, -18.717082977294922, -17.16236114501953, -15.607637405395508, -14.052915573120117, -12.49819278717041, -10.943470001220703, -9.388748168945312, -7.8340253829956055, -6.279303073883057, -4.724580764770508, -3.169857978820801, -1.6151361465454102, -0.060413360595703125, 1.4943090677261353, 3.0490314960479736, 4.603754043579102, 6.15847635269165, 7.713198661804199, 9.267921447753906, 10.822643280029297, 12.377366065979004, 13.932088851928711, 15.486810684204102, 17.041534423828125, 18.596256256103516, 20.150978088378906, 21.705699920654297, 23.260421752929688, 24.81514549255371, 26.3698673248291, 27.924591064453125, 29.479312896728516, 31.034034729003906, 32.5887565612793, 34.14347839355469, 35.698204040527344, 37.252925872802734, 38.807647705078125, 40.362369537353516, 41.917091369628906, 43.47181701660156, 45.02653884887695, 46.581260681152344, 48.135982513427734, 49.690704345703125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 8.0, 17.0, 5.0, 11.0, 11.0, 14.0, 19.0, 22.0, 22.0, 23.0, 20.0, 16.0, 28.0, 27.0, 44.0, 30.0, 51.0, 40.0, 39.0, 49.0, 38.0, 37.0, 51.0, 41.0, 23.0, 33.0, 37.0, 28.0, 27.0, 22.0, 19.0, 25.0, 15.0, 20.0, 15.0, 14.0, 13.0, 5.0, 3.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.55859375, -7.30609130859375, -7.0535888671875, -6.80108642578125, -6.548583984375, -6.29608154296875, -6.0435791015625, -5.79107666015625, -5.53857421875, -5.28607177734375, -5.0335693359375, -4.78106689453125, -4.528564453125, -4.27606201171875, -4.0235595703125, -3.77105712890625, -3.5185546875, -3.26605224609375, -3.0135498046875, -2.76104736328125, -2.508544921875, -2.25604248046875, -2.0035400390625, -1.75103759765625, -1.49853515625, -1.24603271484375, -0.9935302734375, -0.74102783203125, -0.488525390625, -0.23602294921875, 0.0164794921875, 0.26898193359375, 0.521484375, 0.77398681640625, 1.0264892578125, 1.27899169921875, 1.531494140625, 1.78399658203125, 2.0364990234375, 2.28900146484375, 2.54150390625, 2.79400634765625, 3.0465087890625, 3.29901123046875, 3.551513671875, 3.80401611328125, 4.0565185546875, 4.30902099609375, 4.5615234375, 4.81402587890625, 5.0665283203125, 5.31903076171875, 5.571533203125, 5.82403564453125, 6.0765380859375, 6.32904052734375, 6.58154296875, 6.83404541015625, 7.0865478515625, 7.33905029296875, 7.591552734375, 7.84405517578125, 8.0965576171875, 8.34906005859375, 8.6015625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 6.0, 10.0, 16.0, 39.0, 49.0, 71.0, 126.0, 187.0, 268.0, 437.0, 655.0, 1101.0, 1552.0, 2450.0, 3772.0, 5810.0, 9110.0, 14171.0, 22815.0, 35903.0, 59225.0, 97962.0, 166807.0, 228347.0, 156867.0, 91926.0, 55897.0, 33845.0, 21248.0, 13515.0, 8735.0, 5437.0, 3464.0, 2368.0, 1555.0, 1053.0, 609.0, 400.0, 281.0, 140.0, 115.0, 76.0, 51.0, 26.0, 23.0, 13.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.141876220703125, -1.10308837890625, -1.064300537109375, -1.0255126953125, -0.986724853515625, -0.94793701171875, -0.909149169921875, -0.870361328125, -0.831573486328125, -0.79278564453125, -0.753997802734375, -0.7152099609375, -0.676422119140625, -0.63763427734375, -0.598846435546875, -0.56005859375, -0.521270751953125, -0.48248291015625, -0.443695068359375, -0.4049072265625, -0.366119384765625, -0.32733154296875, -0.288543701171875, -0.249755859375, -0.210968017578125, -0.17218017578125, -0.133392333984375, -0.0946044921875, -0.055816650390625, -0.01702880859375, 0.021759033203125, 0.060546875, 0.099334716796875, 0.13812255859375, 0.176910400390625, 0.2156982421875, 0.254486083984375, 0.29327392578125, 0.332061767578125, 0.370849609375, 0.409637451171875, 0.44842529296875, 0.487213134765625, 0.5260009765625, 0.564788818359375, 0.60357666015625, 0.642364501953125, 0.68115234375, 0.719940185546875, 0.75872802734375, 0.797515869140625, 0.8363037109375, 0.875091552734375, 0.91387939453125, 0.952667236328125, 0.991455078125, 1.030242919921875, 1.06903076171875, 1.107818603515625, 1.1466064453125, 1.185394287109375, 1.22418212890625, 1.262969970703125, 1.3017578125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 2.0, 6.0, 5.0, 5.0, 15.0, 12.0, 11.0, 19.0, 25.0, 19.0, 30.0, 33.0, 31.0, 40.0, 34.0, 42.0, 49.0, 39.0, 34.0, 1058.0, 38.0, 51.0, 36.0, 39.0, 35.0, 41.0, 28.0, 34.0, 35.0, 28.0, 27.0, 13.0, 14.0, 19.0, 15.0, 11.0, 12.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-5.69921875, -5.528564453125, -5.35791015625, -5.187255859375, -5.0166015625, -4.845947265625, -4.67529296875, -4.504638671875, -4.333984375, -4.163330078125, -3.99267578125, -3.822021484375, -3.6513671875, -3.480712890625, -3.31005859375, -3.139404296875, -2.96875, -2.798095703125, -2.62744140625, -2.456787109375, -2.2861328125, -2.115478515625, -1.94482421875, -1.774169921875, -1.603515625, -1.432861328125, -1.26220703125, -1.091552734375, -0.9208984375, -0.750244140625, -0.57958984375, -0.408935546875, -0.23828125, -0.067626953125, 0.10302734375, 0.273681640625, 0.4443359375, 0.614990234375, 0.78564453125, 0.956298828125, 1.126953125, 1.297607421875, 1.46826171875, 1.638916015625, 1.8095703125, 1.980224609375, 2.15087890625, 2.321533203125, 2.4921875, 2.662841796875, 2.83349609375, 3.004150390625, 3.1748046875, 3.345458984375, 3.51611328125, 3.686767578125, 3.857421875, 4.028076171875, 4.19873046875, 4.369384765625, 4.5400390625, 4.710693359375, 4.88134765625, 5.052001953125, 5.22265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 4.0, 14.0, 22.0, 39.0, 58.0, 84.0, 130.0, 221.0, 334.0, 547.0, 824.0, 1359.0, 2305.0, 3755.0, 6182.0, 10427.0, 17941.0, 30189.0, 52425.0, 90520.0, 160765.0, 1297047.0, 179307.0, 101854.0, 58141.0, 33698.0, 19725.0, 11744.0, 6865.0, 4118.0, 2455.0, 1469.0, 933.0, 608.0, 348.0, 234.0, 162.0, 88.0, 65.0, 42.0, 26.0, 19.0, 14.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.267578125, -1.2261505126953125, -1.184722900390625, -1.1432952880859375, -1.10186767578125, -1.0604400634765625, -1.019012451171875, -0.9775848388671875, -0.9361572265625, -0.8947296142578125, -0.853302001953125, -0.8118743896484375, -0.77044677734375, -0.7290191650390625, -0.687591552734375, -0.6461639404296875, -0.604736328125, -0.5633087158203125, -0.521881103515625, -0.4804534912109375, -0.43902587890625, -0.3975982666015625, -0.356170654296875, -0.3147430419921875, -0.2733154296875, -0.2318878173828125, -0.190460205078125, -0.1490325927734375, -0.10760498046875, -0.0661773681640625, -0.024749755859375, 0.0166778564453125, 0.05810546875, 0.0995330810546875, 0.140960693359375, 0.1823883056640625, 0.22381591796875, 0.2652435302734375, 0.306671142578125, 0.3480987548828125, 0.3895263671875, 0.4309539794921875, 0.472381591796875, 0.5138092041015625, 0.55523681640625, 0.5966644287109375, 0.638092041015625, 0.6795196533203125, 0.720947265625, 0.7623748779296875, 0.803802490234375, 0.8452301025390625, 0.88665771484375, 0.9280853271484375, 0.969512939453125, 1.0109405517578125, 1.0523681640625, 1.0937957763671875, 1.135223388671875, 1.1766510009765625, 1.21807861328125, 1.2595062255859375, 1.300933837890625, 1.3423614501953125, 1.3837890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 5.0, 8.0, 15.0, 17.0, 17.0, 20.0, 25.0, 40.0, 35.0, 34.0, 43.0, 52.0, 50.0, 62.0, 51.0, 62.0, 54.0, 63.0, 41.0, 42.0, 36.0, 35.0, 19.0, 28.0, 17.0, 17.0, 12.0, 11.0, 21.0, 11.0, 9.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016422271728515625, -0.0015890896320343018, -0.001535952091217041, -0.0014828145503997803, -0.0014296770095825195, -0.0013765394687652588, -0.001323401927947998, -0.0012702643871307373, -0.0012171268463134766, -0.0011639893054962158, -0.001110851764678955, -0.0010577142238616943, -0.0010045766830444336, -0.0009514391422271729, -0.0008983016014099121, -0.0008451640605926514, -0.0007920265197753906, -0.0007388889789581299, -0.0006857514381408691, -0.0006326138973236084, -0.0005794763565063477, -0.0005263388156890869, -0.00047320127487182617, -0.00042006373405456543, -0.0003669261932373047, -0.00031378865242004395, -0.0002606511116027832, -0.00020751357078552246, -0.00015437602996826172, -0.00010123848915100098, -4.8100948333740234e-05, 5.036592483520508e-06, 5.817413330078125e-05, 0.00011131167411804199, 0.00016444921493530273, 0.00021758675575256348, 0.0002707242965698242, 0.00032386183738708496, 0.0003769993782043457, 0.00043013691902160645, 0.0004832744598388672, 0.0005364120006561279, 0.0005895495414733887, 0.0006426870822906494, 0.0006958246231079102, 0.0007489621639251709, 0.0008020997047424316, 0.0008552372455596924, 0.0009083747863769531, 0.0009615123271942139, 0.0010146498680114746, 0.0010677874088287354, 0.001120924949645996, 0.0011740624904632568, 0.0012272000312805176, 0.0012803375720977783, 0.001333475112915039, 0.0013866126537322998, 0.0014397501945495605, 0.0014928877353668213, 0.001546025276184082, 0.0015991628170013428, 0.0016523003578186035, 0.0017054378986358643, 0.001758575439453125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 9.0, 18.0, 17.0, 17.0, 15.0, 31.0, 44.0, 44.0, 50.0, 77.0, 115.0, 177.0, 452.0, 2042.0, 1024301.0, 19655.0, 685.0, 263.0, 136.0, 81.0, 55.0, 55.0, 32.0, 33.0, 30.0, 13.0, 19.0, 13.0, 10.0, 14.0, 3.0, 8.0, 3.0, 3.0, 0.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.045623779296875, -0.04427003860473633, -0.042916297912597656, -0.041562557220458984, -0.04020881652832031, -0.03885507583618164, -0.03750133514404297, -0.0361475944519043, -0.034793853759765625, -0.03344011306762695, -0.03208637237548828, -0.03073263168334961, -0.029378890991210938, -0.028025150299072266, -0.026671409606933594, -0.025317668914794922, -0.02396392822265625, -0.022610187530517578, -0.021256446838378906, -0.019902706146240234, -0.018548965454101562, -0.01719522476196289, -0.01584148406982422, -0.014487743377685547, -0.013134002685546875, -0.011780261993408203, -0.010426521301269531, -0.00907278060913086, -0.0077190399169921875, -0.006365299224853516, -0.005011558532714844, -0.003657817840576172, -0.0023040771484375, -0.0009503364562988281, 0.00040340423583984375, 0.0017571449279785156, 0.0031108856201171875, 0.004464626312255859, 0.005818367004394531, 0.007172107696533203, 0.008525848388671875, 0.009879589080810547, 0.011233329772949219, 0.01258707046508789, 0.013940811157226562, 0.015294551849365234, 0.016648292541503906, 0.018002033233642578, 0.01935577392578125, 0.020709514617919922, 0.022063255310058594, 0.023416996002197266, 0.024770736694335938, 0.02612447738647461, 0.02747821807861328, 0.028831958770751953, 0.030185699462890625, 0.0315394401550293, 0.03289318084716797, 0.03424692153930664, 0.03560066223144531, 0.036954402923583984, 0.038308143615722656, 0.03966188430786133, 0.041015625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 17.0, 32.0, 69.0, 126.0, 188.0, 196.0, 173.0, 98.0, 54.0, 34.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022862080950289965, -0.002235752996057272, -0.0021852978970855474, -0.002134842798113823, -0.0020843876991420984, -0.002033932600170374, -0.0019834775011986494, -0.001933022285811603, -0.0018825671868398786, -0.001832112087868154, -0.0017816569888964295, -0.001731201889924705, -0.0016807467909529805, -0.0016302915755659342, -0.0015798364765942097, -0.0015293813776224852, -0.0014789262786507607, -0.0014284711796790361, -0.0013780160807073116, -0.0013275609817355871, -0.0012771058827638626, -0.001226650783792138, -0.0011761956848204136, -0.0011257404694333673, -0.0010752854868769646, -0.00102483038790524, -0.0009743752889335155, -0.000923920189961791, -0.0008734650327824056, -0.0008230099338106811, -0.0007725548348389566, -0.0007220996776595712, -0.0006716445786878467, -0.0006211894797161222, -0.0005707343807443976, -0.0005202792817726731, -0.0004698241245932877, -0.0004193690256215632, -0.0003689139266498387, -0.0003184587985742837, -0.0002680036996025592, -0.00021754858607891947, -0.00016709347255527973, -0.00011663837358355522, -6.618326005991548e-05, -1.5728146536275744e-05, 3.4726952435448766e-05, 8.518208051100373e-05, 0.00013563717948272824, 0.00018609229300636798, 0.00023654740653000772, 0.00028700250550173223, 0.0003374576335772872, 0.0003879127325490117, 0.0004383678315207362, 0.0004888229304924607, 0.0005392780294641852, 0.0005897331284359097, 0.0006401882274076343, 0.0006906433263793588, 0.0007410984835587442, 0.0007915535825304687, 0.0008420086815021932, 0.0008924638386815786, 0.0009429189376533031]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 13.0, 7.0, 6.0, 10.0, 17.0, 5.0, 19.0, 21.0, 22.0, 28.0, 25.0, 28.0, 40.0, 29.0, 34.0, 30.0, 26.0, 45.0, 36.0, 40.0, 40.0, 42.0, 39.0, 35.0, 35.0, 36.0, 35.0, 26.0, 31.0, 23.0, 26.0, 22.0, 22.0, 23.0, 15.0, 11.0, 11.0, 7.0, 6.0, 10.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0009571313858032227, -0.0009287148714065552, -0.0009002983570098877, -0.0008718818426132202, -0.0008434653282165527, -0.0008150488138198853, -0.0007866322994232178, -0.0007582157850265503, -0.0007297992706298828, -0.0007013827562332153, -0.0006729662418365479, -0.0006445497274398804, -0.0006161332130432129, -0.0005877166986465454, -0.0005593001842498779, -0.0005308836698532104, -0.000502467155456543, -0.0004740506410598755, -0.000445634126663208, -0.00041721761226654053, -0.00038880109786987305, -0.00036038458347320557, -0.0003319680690765381, -0.0003035515546798706, -0.0002751350402832031, -0.00024671852588653564, -0.00021830201148986816, -0.00018988549709320068, -0.0001614689826965332, -0.00013305246829986572, -0.00010463595390319824, -7.621943950653076e-05, -4.780292510986328e-05, -1.93864107131958e-05, 9.03010368347168e-06, 3.744661808013916e-05, 6.586313247680664e-05, 9.427964687347412e-05, 0.0001226961612701416, 0.00015111267566680908, 0.00017952919006347656, 0.00020794570446014404, 0.00023636221885681152, 0.000264778733253479, 0.0002931952476501465, 0.00032161176204681396, 0.00035002827644348145, 0.0003784447908401489, 0.0004068613052368164, 0.0004352778196334839, 0.00046369433403015137, 0.0004921108484268188, 0.0005205273628234863, 0.0005489438772201538, 0.0005773603916168213, 0.0006057769060134888, 0.0006341934204101562, 0.0006626099348068237, 0.0006910264492034912, 0.0007194429636001587, 0.0007478594779968262, 0.0007762759923934937, 0.0008046925067901611, 0.0008331090211868286, 0.0008615255355834961]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 7.0, 18.0, 5.0, 11.0, 11.0, 14.0, 19.0, 22.0, 21.0, 24.0, 20.0, 16.0, 27.0, 28.0, 44.0, 30.0, 51.0, 40.0, 38.0, 50.0, 38.0, 37.0, 51.0, 40.0, 24.0, 33.0, 35.0, 29.0, 28.0, 22.0, 19.0, 25.0, 15.0, 20.0, 15.0, 14.0, 13.0, 5.0, 3.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.5625, -7.3099365234375, -7.057373046875, -6.8048095703125, -6.55224609375, -6.2996826171875, -6.047119140625, -5.7945556640625, -5.5419921875, -5.2894287109375, -5.036865234375, -4.7843017578125, -4.53173828125, -4.2791748046875, -4.026611328125, -3.7740478515625, -3.521484375, -3.2689208984375, -3.016357421875, -2.7637939453125, -2.51123046875, -2.2586669921875, -2.006103515625, -1.7535400390625, -1.5009765625, -1.2484130859375, -0.995849609375, -0.7432861328125, -0.49072265625, -0.2381591796875, 0.014404296875, 0.2669677734375, 0.51953125, 0.7720947265625, 1.024658203125, 1.2772216796875, 1.52978515625, 1.7823486328125, 2.034912109375, 2.2874755859375, 2.5400390625, 2.7926025390625, 3.045166015625, 3.2977294921875, 3.55029296875, 3.8028564453125, 4.055419921875, 4.3079833984375, 4.560546875, 4.8131103515625, 5.065673828125, 5.3182373046875, 5.57080078125, 5.8233642578125, 6.075927734375, 6.3284912109375, 6.5810546875, 6.8336181640625, 7.086181640625, 7.3387451171875, 7.59130859375, 7.8438720703125, 8.096435546875, 8.3489990234375, 8.6015625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 6.0, 2.0, 6.0, 3.0, 6.0, 25.0, 12.0, 17.0, 22.0, 23.0, 35.0, 59.0, 45.0, 69.0, 92.0, 148.0, 172.0, 287.0, 453.0, 918.0, 2205.0, 7583.0, 40485.0, 569883.0, 382884.0, 32543.0, 6457.0, 1848.0, 827.0, 413.0, 283.0, 214.0, 121.0, 92.0, 75.0, 56.0, 37.0, 25.0, 29.0, 27.0, 21.0, 10.0, 5.0, 6.0, 8.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.921875, -13.4569091796875, -12.991943359375, -12.5269775390625, -12.06201171875, -11.5970458984375, -11.132080078125, -10.6671142578125, -10.2021484375, -9.7371826171875, -9.272216796875, -8.8072509765625, -8.34228515625, -7.8773193359375, -7.412353515625, -6.9473876953125, -6.482421875, -6.0174560546875, -5.552490234375, -5.0875244140625, -4.62255859375, -4.1575927734375, -3.692626953125, -3.2276611328125, -2.7626953125, -2.2977294921875, -1.832763671875, -1.3677978515625, -0.90283203125, -0.4378662109375, 0.027099609375, 0.4920654296875, 0.95703125, 1.4219970703125, 1.886962890625, 2.3519287109375, 2.81689453125, 3.2818603515625, 3.746826171875, 4.2117919921875, 4.6767578125, 5.1417236328125, 5.606689453125, 6.0716552734375, 6.53662109375, 7.0015869140625, 7.466552734375, 7.9315185546875, 8.396484375, 8.8614501953125, 9.326416015625, 9.7913818359375, 10.25634765625, 10.7213134765625, 11.186279296875, 11.6512451171875, 12.1162109375, 12.5811767578125, 13.046142578125, 13.5111083984375, 13.97607421875, 14.4410400390625, 14.906005859375, 15.3709716796875, 15.8359375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 3.0, 5.0, 11.0, 9.0, 7.0, 11.0, 9.0, 14.0, 14.0, 11.0, 15.0, 20.0, 15.0, 24.0, 25.0, 26.0, 26.0, 44.0, 32.0, 36.0, 56.0, 83.0, 406.0, 1564.0, 87.0, 73.0, 46.0, 43.0, 44.0, 34.0, 34.0, 29.0, 32.0, 25.0, 26.0, 14.0, 12.0, 15.0, 12.0, 10.0, 3.0, 6.0, 7.0, 9.0, 7.0, 7.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-22.953125, -22.21337890625, -21.4736328125, -20.73388671875, -19.994140625, -19.25439453125, -18.5146484375, -17.77490234375, -17.03515625, -16.29541015625, -15.5556640625, -14.81591796875, -14.076171875, -13.33642578125, -12.5966796875, -11.85693359375, -11.1171875, -10.37744140625, -9.6376953125, -8.89794921875, -8.158203125, -7.41845703125, -6.6787109375, -5.93896484375, -5.19921875, -4.45947265625, -3.7197265625, -2.97998046875, -2.240234375, -1.50048828125, -0.7607421875, -0.02099609375, 0.71875, 1.45849609375, 2.1982421875, 2.93798828125, 3.677734375, 4.41748046875, 5.1572265625, 5.89697265625, 6.63671875, 7.37646484375, 8.1162109375, 8.85595703125, 9.595703125, 10.33544921875, 11.0751953125, 11.81494140625, 12.5546875, 13.29443359375, 14.0341796875, 14.77392578125, 15.513671875, 16.25341796875, 16.9931640625, 17.73291015625, 18.47265625, 19.21240234375, 19.9521484375, 20.69189453125, 21.431640625, 22.17138671875, 22.9111328125, 23.65087890625, 24.390625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 6.0, 7.0, 5.0, 9.0, 7.0, 7.0, 9.0, 20.0, 15.0, 20.0, 21.0, 24.0, 24.0, 46.0, 48.0, 60.0, 73.0, 101.0, 176.0, 251.0, 557.0, 2233.0, 2909123.0, 230236.0, 1357.0, 424.0, 242.0, 151.0, 100.0, 71.0, 50.0, 29.0, 30.0, 14.0, 23.0, 18.0, 15.0, 15.0, 12.0, 19.0, 6.0, 9.0, 7.0, 15.0, 7.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-72.9375, -70.720703125, -68.50390625, -66.287109375, -64.0703125, -61.853515625, -59.63671875, -57.419921875, -55.203125, -52.986328125, -50.76953125, -48.552734375, -46.3359375, -44.119140625, -41.90234375, -39.685546875, -37.46875, -35.251953125, -33.03515625, -30.818359375, -28.6015625, -26.384765625, -24.16796875, -21.951171875, -19.734375, -17.517578125, -15.30078125, -13.083984375, -10.8671875, -8.650390625, -6.43359375, -4.216796875, -2.0, 0.216796875, 2.43359375, 4.650390625, 6.8671875, 9.083984375, 11.30078125, 13.517578125, 15.734375, 17.951171875, 20.16796875, 22.384765625, 24.6015625, 26.818359375, 29.03515625, 31.251953125, 33.46875, 35.685546875, 37.90234375, 40.119140625, 42.3359375, 44.552734375, 46.76953125, 48.986328125, 51.203125, 53.419921875, 55.63671875, 57.853515625, 60.0703125, 62.287109375, 64.50390625, 66.720703125, 68.9375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 238.0, 708.0, 70.0], "bins": [-266.7608947753906, -262.4787902832031, -258.19671630859375, -253.91461181640625, -249.63250732421875, -245.35040283203125, -241.0683135986328, -236.78622436523438, -232.50411987304688, -228.22201538085938, -223.93992614746094, -219.6578369140625, -215.375732421875, -211.0936279296875, -206.81153869628906, -202.52944946289062, -198.24734497070312, -193.96524047851562, -189.6831512451172, -185.40106201171875, -181.11895751953125, -176.83685302734375, -172.5547637939453, -168.27267456054688, -163.99057006835938, -159.70846557617188, -155.42637634277344, -151.144287109375, -146.8621826171875, -142.580078125, -138.29798889160156, -134.01589965820312, -129.73377990722656, -125.4516830444336, -121.16958618164062, -116.88748931884766, -112.60539245605469, -108.32329559326172, -104.04119873046875, -99.75910186767578, -95.47700500488281, -91.19490814208984, -86.91281127929688, -82.6307144165039, -78.34861755371094, -74.06652069091797, -69.784423828125, -65.50232696533203, -61.22023391723633, -56.93813705444336, -52.65604019165039, -48.37394332885742, -44.09184646606445, -39.809749603271484, -35.527652740478516, -31.245555877685547, -26.963457107543945, -22.681360244750977, -18.399263381958008, -14.117166519165039, -9.83506965637207, -5.552972793579102, -1.2708759307861328, 3.011220932006836, 7.2933173179626465]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 7.0, 4.0, 10.0, 18.0, 10.0, 15.0, 11.0, 23.0, 22.0, 20.0, 20.0, 32.0, 28.0, 45.0, 28.0, 50.0, 47.0, 49.0, 29.0, 40.0, 34.0, 37.0, 46.0, 39.0, 36.0, 31.0, 37.0, 33.0, 24.0, 19.0, 21.0, 20.0, 23.0, 8.0, 16.0, 11.0, 11.0, 7.0, 6.0, 10.0, 2.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-80.03221130371094, -77.61380767822266, -75.19539642333984, -72.77699279785156, -70.35858154296875, -67.94017791748047, -65.52176666259766, -63.103363037109375, -60.68495559692383, -58.26654815673828, -55.848140716552734, -53.42973327636719, -51.011329650878906, -48.592918395996094, -46.17451477050781, -43.756107330322266, -41.33769989013672, -38.91929244995117, -36.500885009765625, -34.08247756958008, -31.664072036743164, -29.245664596557617, -26.827259063720703, -24.408851623535156, -21.99044418334961, -19.572036743164062, -17.153629302978516, -14.735223770141602, -12.316816329956055, -9.898408889770508, -7.480002403259277, -5.061595916748047, -2.6431808471679688, -0.22477388381958008, 2.1936330795288086, 4.612040042877197, 7.030447006225586, 9.448854446411133, 11.867260932922363, 14.285667419433594, 16.70407485961914, 19.122482299804688, 21.540889739990234, 23.95929527282715, 26.377702713012695, 28.796110153198242, 31.214515686035156, 33.6329231262207, 36.05133056640625, 38.4697380065918, 40.888145446777344, 43.30655288696289, 45.72496032714844, 48.14336395263672, 50.561771392822266, 52.98017883300781, 55.39858627319336, 57.816993713378906, 60.23540115356445, 62.65380859375, 65.07221221923828, 67.4906234741211, 69.90902709960938, 72.32743835449219, 74.74584197998047]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 9.0, 4.0, 7.0, 10.0, 11.0, 13.0, 16.0, 18.0, 18.0, 16.0, 17.0, 23.0, 28.0, 30.0, 28.0, 36.0, 38.0, 38.0, 41.0, 49.0, 44.0, 52.0, 53.0, 39.0, 35.0, 40.0, 38.0, 21.0, 36.0, 19.0, 32.0, 23.0, 17.0, 16.0, 15.0, 14.0, 16.0, 7.0, 4.0, 10.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.7835693359375, -7.504638671875, -7.2257080078125, -6.94677734375, -6.6678466796875, -6.388916015625, -6.1099853515625, -5.8310546875, -5.5521240234375, -5.273193359375, -4.9942626953125, -4.71533203125, -4.4364013671875, -4.157470703125, -3.8785400390625, -3.599609375, -3.3206787109375, -3.041748046875, -2.7628173828125, -2.48388671875, -2.2049560546875, -1.926025390625, -1.6470947265625, -1.3681640625, -1.0892333984375, -0.810302734375, -0.5313720703125, -0.25244140625, 0.0264892578125, 0.305419921875, 0.5843505859375, 0.86328125, 1.1422119140625, 1.421142578125, 1.7000732421875, 1.97900390625, 2.2579345703125, 2.536865234375, 2.8157958984375, 3.0947265625, 3.3736572265625, 3.652587890625, 3.9315185546875, 4.21044921875, 4.4893798828125, 4.768310546875, 5.0472412109375, 5.326171875, 5.6051025390625, 5.884033203125, 6.1629638671875, 6.44189453125, 6.7208251953125, 6.999755859375, 7.2786865234375, 7.5576171875, 7.8365478515625, 8.115478515625, 8.3944091796875, 8.67333984375, 8.9522705078125, 9.231201171875, 9.5101318359375, 9.7890625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 9.0, 5.0, 9.0, 6.0, 16.0, 20.0, 17.0, 24.0, 33.0, 39.0, 62.0, 90.0, 89.0, 194.0, 263.0, 440.0, 747.0, 1409.0, 2518.0, 5546.0, 13621.0, 41992.0, 168976.0, 641277.0, 1450368.0, 1243760.0, 455921.0, 115826.0, 30216.0, 10752.0, 4595.0, 2291.0, 1189.0, 699.0, 408.0, 248.0, 159.0, 113.0, 91.0, 60.0, 42.0, 34.0, 24.0, 19.0, 15.0, 11.0, 10.0, 3.0, 6.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.96875, -9.6558837890625, -9.343017578125, -9.0301513671875, -8.71728515625, -8.4044189453125, -8.091552734375, -7.7786865234375, -7.4658203125, -7.1529541015625, -6.840087890625, -6.5272216796875, -6.21435546875, -5.9014892578125, -5.588623046875, -5.2757568359375, -4.962890625, -4.6500244140625, -4.337158203125, -4.0242919921875, -3.71142578125, -3.3985595703125, -3.085693359375, -2.7728271484375, -2.4599609375, -2.1470947265625, -1.834228515625, -1.5213623046875, -1.20849609375, -0.8956298828125, -0.582763671875, -0.2698974609375, 0.04296875, 0.3558349609375, 0.668701171875, 0.9815673828125, 1.29443359375, 1.6072998046875, 1.920166015625, 2.2330322265625, 2.5458984375, 2.8587646484375, 3.171630859375, 3.4844970703125, 3.79736328125, 4.1102294921875, 4.423095703125, 4.7359619140625, 5.048828125, 5.3616943359375, 5.674560546875, 5.9874267578125, 6.30029296875, 6.6131591796875, 6.926025390625, 7.2388916015625, 7.5517578125, 7.8646240234375, 8.177490234375, 8.4903564453125, 8.80322265625, 9.1160888671875, 9.428955078125, 9.7418212890625, 10.0546875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 10.0, 9.0, 17.0, 23.0, 32.0, 61.0, 89.0, 128.0, 177.0, 263.0, 391.0, 543.0, 653.0, 524.0, 396.0, 269.0, 153.0, 119.0, 79.0, 58.0, 33.0, 18.0, 12.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.25, -32.519287109375, -31.78857421875, -31.057861328125, -30.3271484375, -29.596435546875, -28.86572265625, -28.135009765625, -27.404296875, -26.673583984375, -25.94287109375, -25.212158203125, -24.4814453125, -23.750732421875, -23.02001953125, -22.289306640625, -21.55859375, -20.827880859375, -20.09716796875, -19.366455078125, -18.6357421875, -17.905029296875, -17.17431640625, -16.443603515625, -15.712890625, -14.982177734375, -14.25146484375, -13.520751953125, -12.7900390625, -12.059326171875, -11.32861328125, -10.597900390625, -9.8671875, -9.136474609375, -8.40576171875, -7.675048828125, -6.9443359375, -6.213623046875, -5.48291015625, -4.752197265625, -4.021484375, -3.290771484375, -2.56005859375, -1.829345703125, -1.0986328125, -0.367919921875, 0.36279296875, 1.093505859375, 1.82421875, 2.554931640625, 3.28564453125, 4.016357421875, 4.7470703125, 5.477783203125, 6.20849609375, 6.939208984375, 7.669921875, 8.400634765625, 9.13134765625, 9.862060546875, 10.5927734375, 11.323486328125, 12.05419921875, 12.784912109375, 13.515625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 11.0, 16.0, 23.0, 46.0, 66.0, 101.0, 157.0, 223.0, 335.0, 570.0, 1504.0, 111574.0, 4073539.0, 4061.0, 773.0, 443.0, 276.0, 192.0, 148.0, 73.0, 62.0, 39.0, 25.0, 11.0, 10.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.6875, -104.1259765625, -100.564453125, -97.0029296875, -93.44140625, -89.8798828125, -86.318359375, -82.7568359375, -79.1953125, -75.6337890625, -72.072265625, -68.5107421875, -64.94921875, -61.3876953125, -57.826171875, -54.2646484375, -50.703125, -47.1416015625, -43.580078125, -40.0185546875, -36.45703125, -32.8955078125, -29.333984375, -25.7724609375, -22.2109375, -18.6494140625, -15.087890625, -11.5263671875, -7.96484375, -4.4033203125, -0.841796875, 2.7197265625, 6.28125, 9.8427734375, 13.404296875, 16.9658203125, 20.52734375, 24.0888671875, 27.650390625, 31.2119140625, 34.7734375, 38.3349609375, 41.896484375, 45.4580078125, 49.01953125, 52.5810546875, 56.142578125, 59.7041015625, 63.265625, 66.8271484375, 70.388671875, 73.9501953125, 77.51171875, 81.0732421875, 84.634765625, 88.1962890625, 91.7578125, 95.3193359375, 98.880859375, 102.4423828125, 106.00390625, 109.5654296875, 113.126953125, 116.6884765625, 120.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 582.0, 435.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1828.9698486328125, -1795.708251953125, -1762.4466552734375, -1729.1851806640625, -1695.923583984375, -1662.6619873046875, -1629.400390625, -1596.138916015625, -1562.8773193359375, -1529.61572265625, -1496.3541259765625, -1463.0926513671875, -1429.8310546875, -1396.5694580078125, -1363.307861328125, -1330.04638671875, -1296.78466796875, -1263.5230712890625, -1230.261474609375, -1197.0, -1163.7384033203125, -1130.476806640625, -1097.2152099609375, -1063.95361328125, -1030.692138671875, -997.4305419921875, -964.1690063476562, -930.9074096679688, -897.6458740234375, -864.38427734375, -831.1226806640625, -797.8611450195312, -764.599609375, -731.3380126953125, -698.0764770507812, -664.8148803710938, -631.5533447265625, -598.291748046875, -565.0301513671875, -531.7686157226562, -498.507080078125, -465.2455139160156, -431.98394775390625, -398.72235107421875, -365.4608154296875, -332.19921875, -298.9376525878906, -265.67608642578125, -232.41452026367188, -199.1529541015625, -165.89138793945312, -132.6298065185547, -99.36824035644531, -66.10667419433594, -32.8450927734375, 0.416473388671875, 33.67803955078125, 66.93960571289062, 100.20117950439453, 133.46275329589844, 166.7243194580078, 199.9858856201172, 233.24746704101562, 266.509033203125, 299.7705993652344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 8.0, 12.0, 17.0, 26.0, 33.0, 39.0, 33.0, 37.0, 45.0, 43.0, 52.0, 65.0, 52.0, 60.0, 68.0, 67.0, 52.0, 48.0, 50.0, 36.0, 42.0, 31.0, 17.0, 12.0, 10.0, 14.0, 11.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.33647155761719, -55.7484130859375, -53.16035079956055, -50.57229232788086, -47.984230041503906, -45.39617156982422, -42.80811309814453, -40.22005081176758, -37.631988525390625, -35.04393005371094, -32.455867767333984, -29.867809295654297, -27.279747009277344, -24.691688537597656, -22.103628158569336, -19.515567779541016, -16.927509307861328, -14.339448928833008, -11.751388549804688, -9.163329124450684, -6.575268745422363, -3.987208366394043, -1.399148941040039, 1.1889114379882812, 3.7769718170166016, 6.365032196044922, 8.953092575073242, 11.541152000427246, 14.129212379455566, 16.717273712158203, 19.30533218383789, 21.89339256286621, 24.48145294189453, 27.06951332092285, 29.657573699951172, 32.24563217163086, 34.83369445800781, 37.4217529296875, 40.00981140136719, 42.59787368774414, 45.185935974121094, 47.77399444580078, 50.362056732177734, 52.95011520385742, 55.538177490234375, 58.12623596191406, 60.71429443359375, 63.3023567199707, 65.89041137695312, 68.47846984863281, 71.0665283203125, 73.65459442138672, 76.2426528930664, 78.8307113647461, 81.41876983642578, 84.0068359375, 86.59489440917969, 89.18295288085938, 91.77101135253906, 94.35907745361328, 96.94713592529297, 99.53519439697266, 102.12325286865234, 104.71131896972656, 107.29937744140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 12.0, 15.0, 18.0, 21.0, 22.0, 17.0, 27.0, 32.0, 28.0, 44.0, 44.0, 36.0, 50.0, 43.0, 50.0, 45.0, 50.0, 46.0, 45.0, 40.0, 48.0, 34.0, 26.0, 20.0, 24.0, 18.0, 20.0, 20.0, 14.0, 14.0, 11.0, 4.0, 7.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.55126953125, -8.2666015625, -7.98193359375, -7.697265625, -7.41259765625, -7.1279296875, -6.84326171875, -6.55859375, -6.27392578125, -5.9892578125, -5.70458984375, -5.419921875, -5.13525390625, -4.8505859375, -4.56591796875, -4.28125, -3.99658203125, -3.7119140625, -3.42724609375, -3.142578125, -2.85791015625, -2.5732421875, -2.28857421875, -2.00390625, -1.71923828125, -1.4345703125, -1.14990234375, -0.865234375, -0.58056640625, -0.2958984375, -0.01123046875, 0.2734375, 0.55810546875, 0.8427734375, 1.12744140625, 1.412109375, 1.69677734375, 1.9814453125, 2.26611328125, 2.55078125, 2.83544921875, 3.1201171875, 3.40478515625, 3.689453125, 3.97412109375, 4.2587890625, 4.54345703125, 4.828125, 5.11279296875, 5.3974609375, 5.68212890625, 5.966796875, 6.25146484375, 6.5361328125, 6.82080078125, 7.10546875, 7.39013671875, 7.6748046875, 7.95947265625, 8.244140625, 8.52880859375, 8.8134765625, 9.09814453125, 9.3828125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 7.0, 2.0, 14.0, 24.0, 21.0, 36.0, 49.0, 80.0, 109.0, 163.0, 199.0, 354.0, 477.0, 679.0, 938.0, 1443.0, 2059.0, 3033.0, 4424.0, 6366.0, 9271.0, 13525.0, 19563.0, 28001.0, 41595.0, 62630.0, 99367.0, 160021.0, 202115.0, 136025.0, 84958.0, 54647.0, 36148.0, 24741.0, 17215.0, 11899.0, 8301.0, 5606.0, 3869.0, 2712.0, 1882.0, 1213.0, 864.0, 590.0, 420.0, 278.0, 199.0, 140.0, 79.0, 63.0, 57.0, 31.0, 22.0, 12.0, 12.0, 8.0, 5.0, 2.0, 1.0, 2.0], "bins": [-1.0927734375, -1.0589752197265625, -1.025177001953125, -0.9913787841796875, -0.95758056640625, -0.9237823486328125, -0.889984130859375, -0.8561859130859375, -0.8223876953125, -0.7885894775390625, -0.754791259765625, -0.7209930419921875, -0.68719482421875, -0.6533966064453125, -0.619598388671875, -0.5858001708984375, -0.552001953125, -0.5182037353515625, -0.484405517578125, -0.4506072998046875, -0.41680908203125, -0.3830108642578125, -0.349212646484375, -0.3154144287109375, -0.2816162109375, -0.2478179931640625, -0.214019775390625, -0.1802215576171875, -0.14642333984375, -0.1126251220703125, -0.078826904296875, -0.0450286865234375, -0.01123046875, 0.0225677490234375, 0.056365966796875, 0.0901641845703125, 0.12396240234375, 0.1577606201171875, 0.191558837890625, 0.2253570556640625, 0.2591552734375, 0.2929534912109375, 0.326751708984375, 0.3605499267578125, 0.39434814453125, 0.4281463623046875, 0.461944580078125, 0.4957427978515625, 0.529541015625, 0.5633392333984375, 0.597137451171875, 0.6309356689453125, 0.66473388671875, 0.6985321044921875, 0.732330322265625, 0.7661285400390625, 0.7999267578125, 0.8337249755859375, 0.867523193359375, 0.9013214111328125, 0.93511962890625, 0.9689178466796875, 1.002716064453125, 1.0365142822265625, 1.0703125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 5.0, 5.0, 6.0, 8.0, 6.0, 20.0, 10.0, 15.0, 14.0, 18.0, 14.0, 23.0, 18.0, 28.0, 28.0, 26.0, 33.0, 24.0, 26.0, 30.0, 43.0, 44.0, 36.0, 1060.0, 43.0, 35.0, 33.0, 30.0, 32.0, 20.0, 27.0, 29.0, 32.0, 23.0, 29.0, 21.0, 18.0, 14.0, 16.0, 11.0, 11.0, 12.0, 9.0, 4.0, 7.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.578125, -4.4312744140625, -4.284423828125, -4.1375732421875, -3.99072265625, -3.8438720703125, -3.697021484375, -3.5501708984375, -3.4033203125, -3.2564697265625, -3.109619140625, -2.9627685546875, -2.81591796875, -2.6690673828125, -2.522216796875, -2.3753662109375, -2.228515625, -2.0816650390625, -1.934814453125, -1.7879638671875, -1.64111328125, -1.4942626953125, -1.347412109375, -1.2005615234375, -1.0537109375, -0.9068603515625, -0.760009765625, -0.6131591796875, -0.46630859375, -0.3194580078125, -0.172607421875, -0.0257568359375, 0.12109375, 0.2679443359375, 0.414794921875, 0.5616455078125, 0.70849609375, 0.8553466796875, 1.002197265625, 1.1490478515625, 1.2958984375, 1.4427490234375, 1.589599609375, 1.7364501953125, 1.88330078125, 2.0301513671875, 2.177001953125, 2.3238525390625, 2.470703125, 2.6175537109375, 2.764404296875, 2.9112548828125, 3.05810546875, 3.2049560546875, 3.351806640625, 3.4986572265625, 3.6455078125, 3.7923583984375, 3.939208984375, 4.0860595703125, 4.23291015625, 4.3797607421875, 4.526611328125, 4.6734619140625, 4.8203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 10.0, 10.0, 10.0, 25.0, 50.0, 57.0, 66.0, 120.0, 197.0, 291.0, 432.0, 701.0, 1091.0, 1595.0, 2353.0, 3533.0, 5483.0, 8487.0, 12847.0, 20010.0, 31411.0, 48849.0, 77319.0, 120659.0, 486522.0, 937513.0, 121485.0, 77358.0, 49474.0, 31526.0, 20028.0, 12889.0, 8466.0, 5580.0, 3707.0, 2379.0, 1619.0, 973.0, 686.0, 455.0, 309.0, 204.0, 133.0, 84.0, 42.0, 41.0, 16.0, 8.0, 9.0, 15.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.138671875, -1.1041717529296875, -1.069671630859375, -1.0351715087890625, -1.00067138671875, -0.9661712646484375, -0.931671142578125, -0.8971710205078125, -0.8626708984375, -0.8281707763671875, -0.793670654296875, -0.7591705322265625, -0.72467041015625, -0.6901702880859375, -0.655670166015625, -0.6211700439453125, -0.586669921875, -0.5521697998046875, -0.517669677734375, -0.4831695556640625, -0.44866943359375, -0.4141693115234375, -0.379669189453125, -0.3451690673828125, -0.3106689453125, -0.2761688232421875, -0.241668701171875, -0.2071685791015625, -0.17266845703125, -0.1381683349609375, -0.103668212890625, -0.0691680908203125, -0.03466796875, -0.0001678466796875, 0.034332275390625, 0.0688323974609375, 0.10333251953125, 0.1378326416015625, 0.172332763671875, 0.2068328857421875, 0.2413330078125, 0.2758331298828125, 0.310333251953125, 0.3448333740234375, 0.37933349609375, 0.4138336181640625, 0.448333740234375, 0.4828338623046875, 0.517333984375, 0.5518341064453125, 0.586334228515625, 0.6208343505859375, 0.65533447265625, 0.6898345947265625, 0.724334716796875, 0.7588348388671875, 0.7933349609375, 0.8278350830078125, 0.862335205078125, 0.8968353271484375, 0.93133544921875, 0.9658355712890625, 1.000335693359375, 1.0348358154296875, 1.0693359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 10.0, 11.0, 13.0, 17.0, 17.0, 26.0, 32.0, 35.0, 30.0, 42.0, 40.0, 50.0, 52.0, 54.0, 52.0, 58.0, 58.0, 53.0, 56.0, 50.0, 41.0, 37.0, 32.0, 16.0, 25.0, 19.0, 14.0, 11.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0018224716186523438, -0.0017687678337097168, -0.0017150640487670898, -0.0016613602638244629, -0.001607656478881836, -0.001553952693939209, -0.001500248908996582, -0.001446545124053955, -0.0013928413391113281, -0.0013391375541687012, -0.0012854337692260742, -0.0012317299842834473, -0.0011780261993408203, -0.0011243224143981934, -0.0010706186294555664, -0.0010169148445129395, -0.0009632110595703125, -0.0009095072746276855, -0.0008558034896850586, -0.0008020997047424316, -0.0007483959197998047, -0.0006946921348571777, -0.0006409883499145508, -0.0005872845649719238, -0.0005335807800292969, -0.0004798769950866699, -0.00042617321014404297, -0.000372469425201416, -0.00031876564025878906, -0.0002650618553161621, -0.00021135807037353516, -0.0001576542854309082, -0.00010395050048828125, -5.02467155456543e-05, 3.4570693969726562e-06, 5.716085433959961e-05, 0.00011086463928222656, 0.00016456842422485352, 0.00021827220916748047, 0.0002719759941101074, 0.0003256797790527344, 0.00037938356399536133, 0.0004330873489379883, 0.00048679113388061523, 0.0005404949188232422, 0.0005941987037658691, 0.0006479024887084961, 0.000701606273651123, 0.00075531005859375, 0.000809013843536377, 0.0008627176284790039, 0.0009164214134216309, 0.0009701251983642578, 0.0010238289833068848, 0.0010775327682495117, 0.0011312365531921387, 0.0011849403381347656, 0.0012386441230773926, 0.0012923479080200195, 0.0013460516929626465, 0.0013997554779052734, 0.0014534592628479004, 0.0015071630477905273, 0.0015608668327331543, 0.0016145706176757812]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 10.0, 20.0, 25.0, 22.0, 27.0, 36.0, 67.0, 69.0, 96.0, 142.0, 224.0, 524.0, 2062.0, 1000731.0, 42458.0, 976.0, 369.0, 181.0, 102.0, 80.0, 80.0, 57.0, 45.0, 28.0, 27.0, 15.0, 9.0, 14.0, 9.0, 12.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.040313720703125, -0.03900289535522461, -0.03769207000732422, -0.03638124465942383, -0.03507041931152344, -0.03375959396362305, -0.032448768615722656, -0.031137943267822266, -0.029827117919921875, -0.028516292572021484, -0.027205467224121094, -0.025894641876220703, -0.024583816528320312, -0.023272991180419922, -0.02196216583251953, -0.02065134048461914, -0.01934051513671875, -0.01802968978881836, -0.01671886444091797, -0.015408039093017578, -0.014097213745117188, -0.012786388397216797, -0.011475563049316406, -0.010164737701416016, -0.008853912353515625, -0.007543087005615234, -0.006232261657714844, -0.004921436309814453, -0.0036106109619140625, -0.002299785614013672, -0.0009889602661132812, 0.0003218650817871094, 0.0016326904296875, 0.0029435157775878906, 0.004254341125488281, 0.005565166473388672, 0.0068759918212890625, 0.008186817169189453, 0.009497642517089844, 0.010808467864990234, 0.012119293212890625, 0.013430118560791016, 0.014740943908691406, 0.016051769256591797, 0.017362594604492188, 0.018673419952392578, 0.01998424530029297, 0.02129507064819336, 0.02260589599609375, 0.02391672134399414, 0.02522754669189453, 0.026538372039794922, 0.027849197387695312, 0.029160022735595703, 0.030470848083496094, 0.031781673431396484, 0.033092498779296875, 0.034403324127197266, 0.035714149475097656, 0.03702497482299805, 0.03833580017089844, 0.03964662551879883, 0.04095745086669922, 0.04226827621459961, 0.0435791015625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 19.0, 61.0, 151.0, 269.0, 270.0, 159.0, 59.0, 17.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0031445971690118313, -0.0030660019256174564, -0.0029874066822230816, -0.002908811205998063, -0.0028302159626036882, -0.0027516207192093134, -0.0026730254758149385, -0.00259442999958992, -0.002515834756195545, -0.0024372395128011703, -0.0023586442694067955, -0.002280048793181777, -0.002201453549787402, -0.0021228583063930273, -0.0020442630629986525, -0.001965667586773634, -0.001887072459794581, -0.001808477216400206, -0.0017298818565905094, -0.0016512866131961346, -0.001572691253386438, -0.001494096009992063, -0.0014155006501823664, -0.0013369054067879915, -0.0012583101633936167, -0.0011797149199992418, -0.0011011195601895452, -0.0010225243167951703, -0.0009439289569854736, -0.0008653337135910988, -0.000786738411989063, -0.0007081431103870273, -0.0006295477505773306, -0.0005509524489752948, -0.00047235714737325907, -0.00039376187487505376, -0.000315166573273018, -0.00023657127167098224, -0.00015797599917277694, -7.938069757074118e-05, -7.853959687054157e-07, 7.780989835737273e-05, 0.00015640519268345088, 0.0002350004797335714, 0.00031359578133560717, 0.00039219108293764293, 0.00047078635543584824, 0.000549381657037884, 0.0006279769586399198, 0.0007065722602419555, 0.0007851675618439913, 0.0008637628052383661, 0.0009423581650480628, 0.0010209534084424376, 0.0010995487682521343, 0.0011781440116465092, 0.001256739255040884, 0.0013353344984352589, 0.0014139298582449555, 0.0014925251016393304, 0.001571120461449027, 0.001649715704843402, 0.0017283109482377768, 0.0018069063080474734, 0.00188550166785717]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 10.0, 13.0, 14.0, 14.0, 15.0, 16.0, 30.0, 27.0, 24.0, 30.0, 36.0, 27.0, 24.0, 51.0, 49.0, 52.0, 52.0, 51.0, 37.0, 38.0, 44.0, 48.0, 34.0, 35.0, 34.0, 28.0, 26.0, 20.0, 14.0, 22.0, 16.0, 14.0, 6.0, 8.0, 6.0, 9.0, 5.0, 5.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009677410125732422, -0.000937717966735363, -0.0009076949208974838, -0.0008776718750596046, -0.0008476488292217255, -0.0008176257833838463, -0.0007876027375459671, -0.0007575796917080879, -0.0007275566458702087, -0.0006975336000323296, -0.0006675105541944504, -0.0006374875083565712, -0.000607464462518692, -0.0005774414166808128, -0.0005474183708429337, -0.0005173953250050545, -0.0004873722791671753, -0.0004573492333292961, -0.00042732618749141693, -0.00039730314165353775, -0.00036728009581565857, -0.0003372570499777794, -0.0003072340041399002, -0.000277210958302021, -0.00024718791246414185, -0.00021716486662626266, -0.00018714182078838348, -0.0001571187749505043, -0.00012709572911262512, -9.707268327474594e-05, -6.704963743686676e-05, -3.702659159898758e-05, -7.0035457611083984e-06, 2.3019500076770782e-05, 5.304254591464996e-05, 8.306559175252914e-05, 0.00011308863759040833, 0.0001431116834282875, 0.0001731347292661667, 0.00020315777510404587, 0.00023318082094192505, 0.00026320386677980423, 0.0002932269126176834, 0.0003232499584555626, 0.00035327300429344177, 0.00038329605013132095, 0.00041331909596920013, 0.0004433421418070793, 0.0004733651876449585, 0.0005033882334828377, 0.0005334112793207169, 0.000563434325158596, 0.0005934573709964752, 0.0006234804168343544, 0.0006535034626722336, 0.0006835265085101128, 0.0007135495543479919, 0.0007435726001858711, 0.0007735956460237503, 0.0008036186918616295, 0.0008336417376995087, 0.0008636647835373878, 0.000893687829375267, 0.0009237108752131462, 0.0009537339210510254]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 12.0, 15.0, 18.0, 21.0, 22.0, 17.0, 27.0, 32.0, 28.0, 44.0, 44.0, 36.0, 50.0, 43.0, 50.0, 45.0, 50.0, 46.0, 45.0, 40.0, 48.0, 34.0, 26.0, 20.0, 24.0, 18.0, 20.0, 20.0, 14.0, 14.0, 11.0, 4.0, 7.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.55126953125, -8.2666015625, -7.98193359375, -7.697265625, -7.41259765625, -7.1279296875, -6.84326171875, -6.55859375, -6.27392578125, -5.9892578125, -5.70458984375, -5.419921875, -5.13525390625, -4.8505859375, -4.56591796875, -4.28125, -3.99658203125, -3.7119140625, -3.42724609375, -3.142578125, -2.85791015625, -2.5732421875, -2.28857421875, -2.00390625, -1.71923828125, -1.4345703125, -1.14990234375, -0.865234375, -0.58056640625, -0.2958984375, -0.01123046875, 0.2734375, 0.55810546875, 0.8427734375, 1.12744140625, 1.412109375, 1.69677734375, 1.9814453125, 2.26611328125, 2.55078125, 2.83544921875, 3.1201171875, 3.40478515625, 3.689453125, 3.97412109375, 4.2587890625, 4.54345703125, 4.828125, 5.11279296875, 5.3974609375, 5.68212890625, 5.966796875, 6.25146484375, 6.5361328125, 6.82080078125, 7.10546875, 7.39013671875, 7.6748046875, 7.95947265625, 8.244140625, 8.52880859375, 8.8134765625, 9.09814453125, 9.3828125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 11.0, 23.0, 17.0, 32.0, 36.0, 48.0, 84.0, 108.0, 170.0, 395.0, 743.0, 1650.0, 3526.0, 8626.0, 21335.0, 54551.0, 156613.0, 439405.0, 234982.0, 76305.0, 29234.0, 11636.0, 4835.0, 2097.0, 940.0, 434.0, 246.0, 138.0, 90.0, 61.0, 41.0, 30.0, 23.0, 15.0, 11.0, 11.0, 5.0, 6.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8359375, -7.5885009765625, -7.341064453125, -7.0936279296875, -6.84619140625, -6.5987548828125, -6.351318359375, -6.1038818359375, -5.8564453125, -5.6090087890625, -5.361572265625, -5.1141357421875, -4.86669921875, -4.6192626953125, -4.371826171875, -4.1243896484375, -3.876953125, -3.6295166015625, -3.382080078125, -3.1346435546875, -2.88720703125, -2.6397705078125, -2.392333984375, -2.1448974609375, -1.8974609375, -1.6500244140625, -1.402587890625, -1.1551513671875, -0.90771484375, -0.6602783203125, -0.412841796875, -0.1654052734375, 0.08203125, 0.3294677734375, 0.576904296875, 0.8243408203125, 1.07177734375, 1.3192138671875, 1.566650390625, 1.8140869140625, 2.0615234375, 2.3089599609375, 2.556396484375, 2.8038330078125, 3.05126953125, 3.2987060546875, 3.546142578125, 3.7935791015625, 4.041015625, 4.2884521484375, 4.535888671875, 4.7833251953125, 5.03076171875, 5.2781982421875, 5.525634765625, 5.7730712890625, 6.0205078125, 6.2679443359375, 6.515380859375, 6.7628173828125, 7.01025390625, 7.2576904296875, 7.505126953125, 7.7525634765625, 8.0]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 5.0, 4.0, 5.0, 9.0, 12.0, 14.0, 12.0, 14.0, 18.0, 18.0, 26.0, 25.0, 25.0, 41.0, 39.0, 36.0, 55.0, 48.0, 76.0, 199.0, 1563.0, 279.0, 77.0, 55.0, 40.0, 46.0, 42.0, 40.0, 32.0, 28.0, 31.0, 19.0, 23.0, 16.0, 14.0, 17.0, 9.0, 4.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-26.421875, -25.5859375, -24.75, -23.9140625, -23.078125, -22.2421875, -21.40625, -20.5703125, -19.734375, -18.8984375, -18.0625, -17.2265625, -16.390625, -15.5546875, -14.71875, -13.8828125, -13.046875, -12.2109375, -11.375, -10.5390625, -9.703125, -8.8671875, -8.03125, -7.1953125, -6.359375, -5.5234375, -4.6875, -3.8515625, -3.015625, -2.1796875, -1.34375, -0.5078125, 0.328125, 1.1640625, 2.0, 2.8359375, 3.671875, 4.5078125, 5.34375, 6.1796875, 7.015625, 7.8515625, 8.6875, 9.5234375, 10.359375, 11.1953125, 12.03125, 12.8671875, 13.703125, 14.5390625, 15.375, 16.2109375, 17.046875, 17.8828125, 18.71875, 19.5546875, 20.390625, 21.2265625, 22.0625, 22.8984375, 23.734375, 24.5703125, 25.40625, 26.2421875, 27.078125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 3.0, 8.0, 7.0, 13.0, 13.0, 16.0, 32.0, 28.0, 28.0, 45.0, 62.0, 95.0, 115.0, 161.0, 187.0, 337.0, 609.0, 2074.0, 98432.0, 3023566.0, 17195.0, 1212.0, 479.0, 284.0, 213.0, 120.0, 77.0, 71.0, 36.0, 47.0, 33.0, 31.0, 18.0, 20.0, 7.0, 3.0, 3.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-54.4375, -52.8515625, -51.265625, -49.6796875, -48.09375, -46.5078125, -44.921875, -43.3359375, -41.75, -40.1640625, -38.578125, -36.9921875, -35.40625, -33.8203125, -32.234375, -30.6484375, -29.0625, -27.4765625, -25.890625, -24.3046875, -22.71875, -21.1328125, -19.546875, -17.9609375, -16.375, -14.7890625, -13.203125, -11.6171875, -10.03125, -8.4453125, -6.859375, -5.2734375, -3.6875, -2.1015625, -0.515625, 1.0703125, 2.65625, 4.2421875, 5.828125, 7.4140625, 9.0, 10.5859375, 12.171875, 13.7578125, 15.34375, 16.9296875, 18.515625, 20.1015625, 21.6875, 23.2734375, 24.859375, 26.4453125, 28.03125, 29.6171875, 31.203125, 32.7890625, 34.375, 35.9609375, 37.546875, 39.1328125, 40.71875, 42.3046875, 43.890625, 45.4765625, 47.0625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 141.0, 845.0, 28.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-445.35626220703125, -437.0059814453125, -428.6556701660156, -420.3053894042969, -411.9551086425781, -403.60479736328125, -395.2545166015625, -386.90423583984375, -378.5539245605469, -370.2036437988281, -361.85333251953125, -353.5030517578125, -345.15277099609375, -336.8024597167969, -328.4521789550781, -320.1018981933594, -311.7515869140625, -303.40130615234375, -295.0509948730469, -286.7007141113281, -278.3504333496094, -270.0001220703125, -261.64984130859375, -253.29954528808594, -244.94927978515625, -236.59898376464844, -228.2487030029297, -219.89840698242188, -211.54811096191406, -203.19781494140625, -194.8475341796875, -186.4972381591797, -178.14697265625, -169.7966766357422, -161.44639587402344, -153.09609985351562, -144.7458038330078, -136.3955078125, -128.04522705078125, -119.69493103027344, -111.34463500976562, -102.99434661865234, -94.64405059814453, -86.29376220703125, -77.94346618652344, -69.59317779541016, -61.242889404296875, -52.89259719848633, -44.54230499267578, -36.192012786865234, -27.84172248840332, -19.491432189941406, -11.14113998413086, -2.7908477783203125, 5.559440612792969, 13.909732818603516, 22.260025024414062, 30.61031723022461, 38.960609436035156, 47.31089782714844, 55.661190032958984, 64.01148223876953, 72.36177062988281, 80.71206665039062, 89.0623550415039]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 6.0, 9.0, 8.0, 14.0, 4.0, 16.0, 10.0, 26.0, 22.0, 27.0, 24.0, 23.0, 25.0, 38.0, 41.0, 31.0, 33.0, 38.0, 49.0, 43.0, 41.0, 45.0, 34.0, 34.0, 33.0, 34.0, 38.0, 26.0, 18.0, 33.0, 20.0, 25.0, 21.0, 14.0, 17.0, 9.0, 16.0, 11.0, 9.0, 9.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-63.102821350097656, -61.157371520996094, -59.211917877197266, -57.2664680480957, -55.321014404296875, -53.37556457519531, -51.430110931396484, -49.48466110229492, -47.539207458496094, -45.59375762939453, -43.6483039855957, -41.70285415649414, -39.75740051269531, -37.81195068359375, -35.86649703979492, -33.92104721069336, -31.975595474243164, -30.03014373779297, -28.084692001342773, -26.139240264892578, -24.193788528442383, -22.248336791992188, -20.302886962890625, -18.357433319091797, -16.411983489990234, -14.466531753540039, -12.521080017089844, -10.575628280639648, -8.630176544189453, -6.684725761413574, -4.739274024963379, -2.7938222885131836, -0.8483695983886719, 1.0970820188522339, 3.0425336360931396, 4.987985134124756, 6.933436870574951, 8.878888130187988, 10.824339866638184, 12.769791603088379, 14.715243339538574, 16.660694122314453, 18.60614585876465, 20.551597595214844, 22.49704933166504, 24.442501068115234, 26.38795280456543, 28.333404541015625, 30.27885627746582, 32.224308013916016, 34.16975784301758, 36.115211486816406, 38.06066131591797, 40.0061149597168, 41.95156478881836, 43.89701843261719, 45.84246826171875, 47.78791809082031, 49.73337173461914, 51.6788215637207, 53.62427520751953, 55.569725036621094, 57.51517868041992, 59.460628509521484, 61.40608215332031]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 15.0, 18.0, 15.0, 19.0, 21.0, 31.0, 36.0, 34.0, 30.0, 36.0, 50.0, 51.0, 43.0, 64.0, 37.0, 52.0, 66.0, 41.0, 44.0, 46.0, 28.0, 33.0, 22.0, 22.0, 19.0, 25.0, 19.0, 13.0, 11.0, 4.0, 9.0, 5.0, 2.0, 7.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8984375, -9.5826416015625, -9.266845703125, -8.9510498046875, -8.63525390625, -8.3194580078125, -8.003662109375, -7.6878662109375, -7.3720703125, -7.0562744140625, -6.740478515625, -6.4246826171875, -6.10888671875, -5.7930908203125, -5.477294921875, -5.1614990234375, -4.845703125, -4.5299072265625, -4.214111328125, -3.8983154296875, -3.58251953125, -3.2667236328125, -2.950927734375, -2.6351318359375, -2.3193359375, -2.0035400390625, -1.687744140625, -1.3719482421875, -1.05615234375, -0.7403564453125, -0.424560546875, -0.1087646484375, 0.20703125, 0.5228271484375, 0.838623046875, 1.1544189453125, 1.47021484375, 1.7860107421875, 2.101806640625, 2.4176025390625, 2.7333984375, 3.0491943359375, 3.364990234375, 3.6807861328125, 3.99658203125, 4.3123779296875, 4.628173828125, 4.9439697265625, 5.259765625, 5.5755615234375, 5.891357421875, 6.2071533203125, 6.52294921875, 6.8387451171875, 7.154541015625, 7.4703369140625, 7.7861328125, 8.1019287109375, 8.417724609375, 8.7335205078125, 9.04931640625, 9.3651123046875, 9.680908203125, 9.9967041015625, 10.3125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 3.0, 12.0, 4.0, 13.0, 13.0, 16.0, 21.0, 27.0, 22.0, 32.0, 44.0, 56.0, 79.0, 105.0, 201.0, 515.0, 1993.0, 14759.0, 415658.0, 3486065.0, 260233.0, 11623.0, 1709.0, 476.0, 171.0, 89.0, 70.0, 47.0, 43.0, 39.0, 32.0, 22.0, 16.0, 15.0, 13.0, 11.0, 8.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.203125, -28.2744140625, -27.345703125, -26.4169921875, -25.48828125, -24.5595703125, -23.630859375, -22.7021484375, -21.7734375, -20.8447265625, -19.916015625, -18.9873046875, -18.05859375, -17.1298828125, -16.201171875, -15.2724609375, -14.34375, -13.4150390625, -12.486328125, -11.5576171875, -10.62890625, -9.7001953125, -8.771484375, -7.8427734375, -6.9140625, -5.9853515625, -5.056640625, -4.1279296875, -3.19921875, -2.2705078125, -1.341796875, -0.4130859375, 0.515625, 1.4443359375, 2.373046875, 3.3017578125, 4.23046875, 5.1591796875, 6.087890625, 7.0166015625, 7.9453125, 8.8740234375, 9.802734375, 10.7314453125, 11.66015625, 12.5888671875, 13.517578125, 14.4462890625, 15.375, 16.3037109375, 17.232421875, 18.1611328125, 19.08984375, 20.0185546875, 20.947265625, 21.8759765625, 22.8046875, 23.7333984375, 24.662109375, 25.5908203125, 26.51953125, 27.4482421875, 28.376953125, 29.3056640625, 30.234375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 3.0, 4.0, 4.0, 8.0, 13.0, 8.0, 16.0, 21.0, 22.0, 30.0, 33.0, 39.0, 72.0, 80.0, 101.0, 131.0, 145.0, 210.0, 290.0, 323.0, 365.0, 402.0, 394.0, 299.0, 236.0, 169.0, 156.0, 97.0, 86.0, 60.0, 53.0, 44.0, 40.0, 24.0, 22.0, 23.0, 4.0, 15.0, 13.0, 4.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.613037109375, -12.21044921875, -11.807861328125, -11.4052734375, -11.002685546875, -10.60009765625, -10.197509765625, -9.794921875, -9.392333984375, -8.98974609375, -8.587158203125, -8.1845703125, -7.781982421875, -7.37939453125, -6.976806640625, -6.57421875, -6.171630859375, -5.76904296875, -5.366455078125, -4.9638671875, -4.561279296875, -4.15869140625, -3.756103515625, -3.353515625, -2.950927734375, -2.54833984375, -2.145751953125, -1.7431640625, -1.340576171875, -0.93798828125, -0.535400390625, -0.1328125, 0.269775390625, 0.67236328125, 1.074951171875, 1.4775390625, 1.880126953125, 2.28271484375, 2.685302734375, 3.087890625, 3.490478515625, 3.89306640625, 4.295654296875, 4.6982421875, 5.100830078125, 5.50341796875, 5.906005859375, 6.30859375, 6.711181640625, 7.11376953125, 7.516357421875, 7.9189453125, 8.321533203125, 8.72412109375, 9.126708984375, 9.529296875, 9.931884765625, 10.33447265625, 10.737060546875, 11.1396484375, 11.542236328125, 11.94482421875, 12.347412109375, 12.75]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 7.0, 11.0, 13.0, 18.0, 30.0, 28.0, 62.0, 82.0, 110.0, 122.0, 209.0, 308.0, 498.0, 1761.0, 679453.0, 3506693.0, 3191.0, 585.0, 330.0, 212.0, 149.0, 129.0, 73.0, 59.0, 54.0, 32.0, 16.0, 14.0, 13.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.4375, -111.2666015625, -108.095703125, -104.9248046875, -101.75390625, -98.5830078125, -95.412109375, -92.2412109375, -89.0703125, -85.8994140625, -82.728515625, -79.5576171875, -76.38671875, -73.2158203125, -70.044921875, -66.8740234375, -63.703125, -60.5322265625, -57.361328125, -54.1904296875, -51.01953125, -47.8486328125, -44.677734375, -41.5068359375, -38.3359375, -35.1650390625, -31.994140625, -28.8232421875, -25.65234375, -22.4814453125, -19.310546875, -16.1396484375, -12.96875, -9.7978515625, -6.626953125, -3.4560546875, -0.28515625, 2.8857421875, 6.056640625, 9.2275390625, 12.3984375, 15.5693359375, 18.740234375, 21.9111328125, 25.08203125, 28.2529296875, 31.423828125, 34.5947265625, 37.765625, 40.9365234375, 44.107421875, 47.2783203125, 50.44921875, 53.6201171875, 56.791015625, 59.9619140625, 63.1328125, 66.3037109375, 69.474609375, 72.6455078125, 75.81640625, 78.9873046875, 82.158203125, 85.3291015625, 88.5]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 59.0, 459.0, 438.0, 55.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-451.9886169433594, -442.93896484375, -433.8892822265625, -424.8396301269531, -415.78997802734375, -406.74029541015625, -397.6906433105469, -388.6409912109375, -379.59130859375, -370.5416564941406, -361.4919738769531, -352.44232177734375, -343.3926696777344, -334.343017578125, -325.2933349609375, -316.2436828613281, -307.19403076171875, -298.1443786621094, -289.0946960449219, -280.0450439453125, -270.9953918457031, -261.94573974609375, -252.89605712890625, -243.84640502929688, -234.79673767089844, -225.7470703125, -216.69741821289062, -207.6477508544922, -198.59808349609375, -189.54843139648438, -180.49876403808594, -171.4490966796875, -162.39944458007812, -153.3497772216797, -144.3001251220703, -135.25045776367188, -126.20079803466797, -117.15113830566406, -108.10147094726562, -99.05181121826172, -90.00215148925781, -80.9524917602539, -71.90283203125, -62.85316467285156, -53.803504943847656, -44.75384521484375, -35.70418167114258, -26.654518127441406, -17.6048583984375, -8.555196762084961, 0.4944648742675781, 9.544126510620117, 18.593788146972656, 27.643447875976562, 36.693111419677734, 45.742774963378906, 54.79243469238281, 63.84209442138672, 72.89175415039062, 81.94142150878906, 90.99108123779297, 100.04074096679688, 109.09040832519531, 118.14006805419922, 127.18972778320312]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 3.0, 4.0, 10.0, 9.0, 12.0, 12.0, 12.0, 14.0, 10.0, 23.0, 20.0, 31.0, 38.0, 33.0, 32.0, 35.0, 28.0, 40.0, 34.0, 35.0, 44.0, 32.0, 36.0, 50.0, 38.0, 31.0, 40.0, 45.0, 30.0, 33.0, 22.0, 28.0, 27.0, 20.0, 13.0, 19.0, 15.0, 12.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.2247314453125, -50.460514068603516, -48.69629669189453, -46.93207931518555, -45.16786193847656, -43.40364456176758, -41.639427185058594, -39.87520980834961, -38.110992431640625, -36.34677505493164, -34.582557678222656, -32.81834030151367, -31.054122924804688, -29.289905548095703, -27.52568817138672, -25.761470794677734, -23.99725341796875, -22.233036041259766, -20.46881866455078, -18.704601287841797, -16.940383911132812, -15.176166534423828, -13.411949157714844, -11.64773178100586, -9.883514404296875, -8.11929702758789, -6.355079650878906, -4.590862274169922, -2.8266448974609375, -1.0624275207519531, 0.7017898559570312, 2.4660072326660156, 4.230224609375, 5.994441986083984, 7.758659362792969, 9.522876739501953, 11.287094116210938, 13.051311492919922, 14.815528869628906, 16.57974624633789, 18.343963623046875, 20.10818099975586, 21.872398376464844, 23.636615753173828, 25.400833129882812, 27.165050506591797, 28.92926788330078, 30.693485260009766, 32.45770263671875, 34.221920013427734, 35.98613739013672, 37.7503547668457, 39.51457214355469, 41.27878952026367, 43.043006896972656, 44.80722427368164, 46.571441650390625, 48.33565902709961, 50.099876403808594, 51.86409378051758, 53.62831115722656, 55.39252853393555, 57.15674591064453, 58.920963287353516, 60.6851806640625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 8.0, 10.0, 11.0, 11.0, 15.0, 13.0, 27.0, 17.0, 25.0, 24.0, 34.0, 28.0, 34.0, 38.0, 38.0, 52.0, 44.0, 48.0, 51.0, 35.0, 35.0, 43.0, 32.0, 39.0, 41.0, 28.0, 34.0, 24.0, 24.0, 22.0, 13.0, 15.0, 18.0, 10.0, 5.0, 7.0, 4.0, 6.0, 8.0, 2.0, 3.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.680419921875, -8.39208984375, -8.103759765625, -7.8154296875, -7.527099609375, -7.23876953125, -6.950439453125, -6.662109375, -6.373779296875, -6.08544921875, -5.797119140625, -5.5087890625, -5.220458984375, -4.93212890625, -4.643798828125, -4.35546875, -4.067138671875, -3.77880859375, -3.490478515625, -3.2021484375, -2.913818359375, -2.62548828125, -2.337158203125, -2.048828125, -1.760498046875, -1.47216796875, -1.183837890625, -0.8955078125, -0.607177734375, -0.31884765625, -0.030517578125, 0.2578125, 0.546142578125, 0.83447265625, 1.122802734375, 1.4111328125, 1.699462890625, 1.98779296875, 2.276123046875, 2.564453125, 2.852783203125, 3.14111328125, 3.429443359375, 3.7177734375, 4.006103515625, 4.29443359375, 4.582763671875, 4.87109375, 5.159423828125, 5.44775390625, 5.736083984375, 6.0244140625, 6.312744140625, 6.60107421875, 6.889404296875, 7.177734375, 7.466064453125, 7.75439453125, 8.042724609375, 8.3310546875, 8.619384765625, 8.90771484375, 9.196044921875, 9.484375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 4.0, 10.0, 7.0, 12.0, 28.0, 51.0, 70.0, 95.0, 128.0, 176.0, 270.0, 406.0, 580.0, 811.0, 1172.0, 1700.0, 2486.0, 3588.0, 5080.0, 7388.0, 10870.0, 15664.0, 22916.0, 33509.0, 50646.0, 77827.0, 122904.0, 185820.0, 173623.0, 112405.0, 71793.0, 46814.0, 31608.0, 21249.0, 14335.0, 10050.0, 6839.0, 4801.0, 3344.0, 2232.0, 1660.0, 1135.0, 775.0, 534.0, 350.0, 249.0, 178.0, 110.0, 86.0, 64.0, 35.0, 32.0, 21.0, 9.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.1494140625, -1.1133880615234375, -1.077362060546875, -1.0413360595703125, -1.00531005859375, -0.9692840576171875, -0.933258056640625, -0.8972320556640625, -0.8612060546875, -0.8251800537109375, -0.789154052734375, -0.7531280517578125, -0.71710205078125, -0.6810760498046875, -0.645050048828125, -0.6090240478515625, -0.572998046875, -0.5369720458984375, -0.500946044921875, -0.4649200439453125, -0.42889404296875, -0.3928680419921875, -0.356842041015625, -0.3208160400390625, -0.2847900390625, -0.2487640380859375, -0.212738037109375, -0.1767120361328125, -0.14068603515625, -0.1046600341796875, -0.068634033203125, -0.0326080322265625, 0.00341796875, 0.0394439697265625, 0.075469970703125, 0.1114959716796875, 0.14752197265625, 0.1835479736328125, 0.219573974609375, 0.2555999755859375, 0.2916259765625, 0.3276519775390625, 0.363677978515625, 0.3997039794921875, 0.43572998046875, 0.4717559814453125, 0.507781982421875, 0.5438079833984375, 0.579833984375, 0.6158599853515625, 0.651885986328125, 0.6879119873046875, 0.72393798828125, 0.7599639892578125, 0.795989990234375, 0.8320159912109375, 0.8680419921875, 0.9040679931640625, 0.940093994140625, 0.9761199951171875, 1.01214599609375, 1.0481719970703125, 1.084197998046875, 1.1202239990234375, 1.15625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 10.0, 13.0, 10.0, 8.0, 17.0, 28.0, 24.0, 25.0, 15.0, 26.0, 42.0, 48.0, 36.0, 24.0, 39.0, 43.0, 1072.0, 47.0, 45.0, 44.0, 45.0, 47.0, 42.0, 36.0, 36.0, 26.0, 26.0, 19.0, 25.0, 16.0, 16.0, 20.0, 13.0, 8.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.040771484375, -5.83935546875, -5.637939453125, -5.4365234375, -5.235107421875, -5.03369140625, -4.832275390625, -4.630859375, -4.429443359375, -4.22802734375, -4.026611328125, -3.8251953125, -3.623779296875, -3.42236328125, -3.220947265625, -3.01953125, -2.818115234375, -2.61669921875, -2.415283203125, -2.2138671875, -2.012451171875, -1.81103515625, -1.609619140625, -1.408203125, -1.206787109375, -1.00537109375, -0.803955078125, -0.6025390625, -0.401123046875, -0.19970703125, 0.001708984375, 0.203125, 0.404541015625, 0.60595703125, 0.807373046875, 1.0087890625, 1.210205078125, 1.41162109375, 1.613037109375, 1.814453125, 2.015869140625, 2.21728515625, 2.418701171875, 2.6201171875, 2.821533203125, 3.02294921875, 3.224365234375, 3.42578125, 3.627197265625, 3.82861328125, 4.030029296875, 4.2314453125, 4.432861328125, 4.63427734375, 4.835693359375, 5.037109375, 5.238525390625, 5.43994140625, 5.641357421875, 5.8427734375, 6.044189453125, 6.24560546875, 6.447021484375, 6.6484375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 12.0, 6.0, 20.0, 16.0, 29.0, 36.0, 73.0, 126.0, 182.0, 288.0, 468.0, 734.0, 1217.0, 2053.0, 3413.0, 5709.0, 9746.0, 15985.0, 27145.0, 47282.0, 83181.0, 146196.0, 1293279.0, 196277.0, 111710.0, 63051.0, 36132.0, 21382.0, 12450.0, 7497.0, 4601.0, 2617.0, 1635.0, 967.0, 612.0, 396.0, 212.0, 152.0, 74.0, 63.0, 47.0, 23.0, 17.0, 14.0, 3.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.533203125, -1.4864044189453125, -1.439605712890625, -1.3928070068359375, -1.34600830078125, -1.2992095947265625, -1.252410888671875, -1.2056121826171875, -1.1588134765625, -1.1120147705078125, -1.065216064453125, -1.0184173583984375, -0.97161865234375, -0.9248199462890625, -0.878021240234375, -0.8312225341796875, -0.784423828125, -0.7376251220703125, -0.690826416015625, -0.6440277099609375, -0.59722900390625, -0.5504302978515625, -0.503631591796875, -0.4568328857421875, -0.4100341796875, -0.3632354736328125, -0.316436767578125, -0.2696380615234375, -0.22283935546875, -0.1760406494140625, -0.129241943359375, -0.0824432373046875, -0.03564453125, 0.0111541748046875, 0.057952880859375, 0.1047515869140625, 0.15155029296875, 0.1983489990234375, 0.245147705078125, 0.2919464111328125, 0.3387451171875, 0.3855438232421875, 0.432342529296875, 0.4791412353515625, 0.52593994140625, 0.5727386474609375, 0.619537353515625, 0.6663360595703125, 0.713134765625, 0.7599334716796875, 0.806732177734375, 0.8535308837890625, 0.90032958984375, 0.9471282958984375, 0.993927001953125, 1.0407257080078125, 1.0875244140625, 1.1343231201171875, 1.181121826171875, 1.2279205322265625, 1.27471923828125, 1.3215179443359375, 1.368316650390625, 1.4151153564453125, 1.4619140625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 8.0, 6.0, 10.0, 11.0, 22.0, 19.0, 21.0, 34.0, 47.0, 58.0, 57.0, 72.0, 69.0, 96.0, 77.0, 59.0, 69.0, 51.0, 44.0, 37.0, 25.0, 21.0, 16.0, 9.0, 13.0, 4.0, 4.0, 7.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002986907958984375, -0.002899855375289917, -0.002812802791595459, -0.002725750207901001, -0.002638697624206543, -0.002551645040512085, -0.002464592456817627, -0.002377539873123169, -0.002290487289428711, -0.002203434705734253, -0.002116382122039795, -0.002029329538345337, -0.001942276954650879, -0.001855224370956421, -0.0017681717872619629, -0.0016811192035675049, -0.0015940666198730469, -0.0015070140361785889, -0.0014199614524841309, -0.0013329088687896729, -0.0012458562850952148, -0.0011588037014007568, -0.0010717511177062988, -0.0009846985340118408, -0.0008976459503173828, -0.0008105933666229248, -0.0007235407829284668, -0.0006364881992340088, -0.0005494356155395508, -0.0004623830318450928, -0.00037533044815063477, -0.00028827786445617676, -0.00020122528076171875, -0.00011417269706726074, -2.7120113372802734e-05, 5.9932470321655273e-05, 0.00014698505401611328, 0.0002340376377105713, 0.0003210902214050293, 0.0004081428050994873, 0.0004951953887939453, 0.0005822479724884033, 0.0006693005561828613, 0.0007563531398773193, 0.0008434057235717773, 0.0009304583072662354, 0.0010175108909606934, 0.0011045634746551514, 0.0011916160583496094, 0.0012786686420440674, 0.0013657212257385254, 0.0014527738094329834, 0.0015398263931274414, 0.0016268789768218994, 0.0017139315605163574, 0.0018009841442108154, 0.0018880367279052734, 0.0019750893115997314, 0.0020621418952941895, 0.0021491944789886475, 0.0022362470626831055, 0.0023232996463775635, 0.0024103522300720215, 0.0024974048137664795, 0.0025844573974609375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 1.0, 5.0, 6.0, 12.0, 8.0, 11.0, 7.0, 20.0, 40.0, 21.0, 60.0, 92.0, 127.0, 158.0, 346.0, 911.0, 299970.0, 744794.0, 1038.0, 339.0, 176.0, 115.0, 76.0, 55.0, 35.0, 27.0, 22.0, 19.0, 8.0, 12.0, 5.0, 10.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056793212890625, -0.054837703704833984, -0.05288219451904297, -0.05092668533325195, -0.04897117614746094, -0.04701566696166992, -0.045060157775878906, -0.04310464859008789, -0.041149139404296875, -0.03919363021850586, -0.037238121032714844, -0.03528261184692383, -0.03332710266113281, -0.0313715934753418, -0.02941608428955078, -0.027460575103759766, -0.02550506591796875, -0.023549556732177734, -0.02159404754638672, -0.019638538360595703, -0.017683029174804688, -0.015727519989013672, -0.013772010803222656, -0.01181650161743164, -0.009860992431640625, -0.00790548324584961, -0.005949974060058594, -0.003994464874267578, -0.0020389556884765625, -8.344650268554688e-05, 0.0018720626831054688, 0.0038275718688964844, 0.0057830810546875, 0.007738590240478516, 0.009694099426269531, 0.011649608612060547, 0.013605117797851562, 0.015560626983642578, 0.017516136169433594, 0.01947164535522461, 0.021427154541015625, 0.02338266372680664, 0.025338172912597656, 0.027293682098388672, 0.029249191284179688, 0.031204700469970703, 0.03316020965576172, 0.035115718841552734, 0.03707122802734375, 0.039026737213134766, 0.04098224639892578, 0.0429377555847168, 0.04489326477050781, 0.04684877395629883, 0.048804283142089844, 0.05075979232788086, 0.052715301513671875, 0.05467081069946289, 0.056626319885253906, 0.05858182907104492, 0.06053733825683594, 0.06249284744262695, 0.06444835662841797, 0.06640386581420898, 0.068359375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 7.0, 23.0, 79.0, 169.0, 276.0, 230.0, 142.0, 59.0, 20.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006881483714096248, -0.0006108620436862111, -0.0005335757159627974, -0.0004562893882393837, -0.00037900306051597, -0.0003017167327925563, -0.00022443040506914258, -0.00014714407734572887, -6.985774962231517e-05, 7.4285781010985374e-06, 8.471490582451224e-05, 0.00016200123354792595, 0.00023928756127133965, 0.00031657388899475336, 0.00039386021671816707, 0.00047114654444158077, 0.0005484328721649945, 0.0006257191998884082, 0.0007030055276118219, 0.0007802918553352356, 0.0008575781830586493, 0.000934864510782063, 0.0010121508967131376, 0.0010894371662288904, 0.0011667234357446432, 0.001244009705260396, 0.0013212960911914706, 0.0013985824771225452, 0.001475868746638298, 0.0015531550161540508, 0.0016304414020851254, 0.0017077277880162, 0.0017850142903625965, 0.0018623005598783493, 0.001939586945809424, 0.0020168733317404985, 0.0020941596012562513, 0.002171445870772004, 0.0022487323731184006, 0.0023260186426341534, 0.002403304912149906, 0.002480591181665659, 0.0025578774511814117, 0.002635163953527808, 0.002712450223043561, 0.0027897364925593138, 0.0028670229949057102, 0.002944309264421463, 0.003021595533937216, 0.0030988818034529686, 0.0031761680729687214, 0.003253454575315118, 0.0033307408448308706, 0.0034080271143466234, 0.00348531361669302, 0.0035625998862087727, 0.0036398861557245255, 0.0037171724252402782, 0.003794458694756031, 0.0038717451971024275, 0.003949031233787537, 0.004026317968964577, 0.0041036042384803295, 0.004180890507996082, 0.004258176777511835]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 11.0, 8.0, 11.0, 10.0, 15.0, 9.0, 18.0, 21.0, 27.0, 27.0, 36.0, 39.0, 40.0, 37.0, 40.0, 46.0, 36.0, 44.0, 32.0, 42.0, 56.0, 29.0, 46.0, 36.0, 37.0, 28.0, 29.0, 36.0, 29.0, 28.0, 14.0, 14.0, 11.0, 14.0, 11.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001127481460571289, -0.0010868236422538757, -0.0010461658239364624, -0.001005508005619049, -0.0009648501873016357, -0.0009241923689842224, -0.0008835345506668091, -0.0008428767323493958, -0.0008022189140319824, -0.0007615610957145691, -0.0007209032773971558, -0.0006802454590797424, -0.0006395876407623291, -0.0005989298224449158, -0.0005582720041275024, -0.0005176141858100891, -0.0004769563674926758, -0.00043629854917526245, -0.0003956407308578491, -0.0003549829125404358, -0.00031432509422302246, -0.00027366727590560913, -0.0002330094575881958, -0.00019235163927078247, -0.00015169382095336914, -0.00011103600263595581, -7.037818431854248e-05, -2.972036600112915e-05, 1.093745231628418e-05, 5.159527063369751e-05, 9.225308895111084e-05, 0.00013291090726852417, 0.0001735687255859375, 0.00021422654390335083, 0.00025488436222076416, 0.0002955421805381775, 0.0003361999988555908, 0.00037685781717300415, 0.0004175156354904175, 0.0004581734538078308, 0.0004988312721252441, 0.0005394890904426575, 0.0005801469087600708, 0.0006208047270774841, 0.0006614625453948975, 0.0007021203637123108, 0.0007427781820297241, 0.0007834360003471375, 0.0008240938186645508, 0.0008647516369819641, 0.0009054094552993774, 0.0009460672736167908, 0.000986725091934204, 0.0010273829102516174, 0.0010680407285690308, 0.001108698546886444, 0.0011493563652038574, 0.0011900141835212708, 0.001230672001838684, 0.0012713298201560974, 0.0013119876384735107, 0.001352645456790924, 0.0013933032751083374, 0.0014339610934257507, 0.001474618911743164]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 8.0, 10.0, 11.0, 11.0, 15.0, 13.0, 27.0, 17.0, 25.0, 24.0, 34.0, 28.0, 34.0, 38.0, 38.0, 52.0, 44.0, 48.0, 51.0, 35.0, 35.0, 43.0, 32.0, 39.0, 41.0, 28.0, 34.0, 24.0, 24.0, 22.0, 13.0, 15.0, 18.0, 10.0, 5.0, 7.0, 4.0, 6.0, 8.0, 3.0, 2.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.680419921875, -8.39208984375, -8.103759765625, -7.8154296875, -7.527099609375, -7.23876953125, -6.950439453125, -6.662109375, -6.373779296875, -6.08544921875, -5.797119140625, -5.5087890625, -5.220458984375, -4.93212890625, -4.643798828125, -4.35546875, -4.067138671875, -3.77880859375, -3.490478515625, -3.2021484375, -2.913818359375, -2.62548828125, -2.337158203125, -2.048828125, -1.760498046875, -1.47216796875, -1.183837890625, -0.8955078125, -0.607177734375, -0.31884765625, -0.030517578125, 0.2578125, 0.546142578125, 0.83447265625, 1.122802734375, 1.4111328125, 1.699462890625, 1.98779296875, 2.276123046875, 2.564453125, 2.852783203125, 3.14111328125, 3.429443359375, 3.7177734375, 4.006103515625, 4.29443359375, 4.582763671875, 4.87109375, 5.159423828125, 5.44775390625, 5.736083984375, 6.0244140625, 6.312744140625, 6.60107421875, 6.889404296875, 7.177734375, 7.466064453125, 7.75439453125, 8.042724609375, 8.3310546875, 8.619384765625, 8.90771484375, 9.196044921875, 9.484375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 15.0, 11.0, 16.0, 10.0, 18.0, 22.0, 30.0, 31.0, 55.0, 62.0, 101.0, 138.0, 166.0, 314.0, 585.0, 1560.0, 5686.0, 31413.0, 314460.0, 630879.0, 50619.0, 8535.0, 1991.0, 704.0, 327.0, 228.0, 160.0, 98.0, 74.0, 52.0, 51.0, 29.0, 29.0, 19.0, 7.0, 13.0, 7.0, 7.0, 4.0, 9.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.1796875, -16.609375, -16.0390625, -15.46875, -14.8984375, -14.328125, -13.7578125, -13.1875, -12.6171875, -12.046875, -11.4765625, -10.90625, -10.3359375, -9.765625, -9.1953125, -8.625, -8.0546875, -7.484375, -6.9140625, -6.34375, -5.7734375, -5.203125, -4.6328125, -4.0625, -3.4921875, -2.921875, -2.3515625, -1.78125, -1.2109375, -0.640625, -0.0703125, 0.5, 1.0703125, 1.640625, 2.2109375, 2.78125, 3.3515625, 3.921875, 4.4921875, 5.0625, 5.6328125, 6.203125, 6.7734375, 7.34375, 7.9140625, 8.484375, 9.0546875, 9.625, 10.1953125, 10.765625, 11.3359375, 11.90625, 12.4765625, 13.046875, 13.6171875, 14.1875, 14.7578125, 15.328125, 15.8984375, 16.46875, 17.0390625, 17.609375, 18.1796875, 18.75]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 6.0, 5.0, 6.0, 10.0, 6.0, 10.0, 13.0, 17.0, 21.0, 21.0, 27.0, 18.0, 38.0, 25.0, 33.0, 35.0, 54.0, 51.0, 82.0, 145.0, 1569.0, 334.0, 89.0, 65.0, 37.0, 48.0, 44.0, 33.0, 28.0, 25.0, 19.0, 22.0, 25.0, 15.0, 16.0, 13.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.6875, -26.819580078125, -25.95166015625, -25.083740234375, -24.2158203125, -23.347900390625, -22.47998046875, -21.612060546875, -20.744140625, -19.876220703125, -19.00830078125, -18.140380859375, -17.2724609375, -16.404541015625, -15.53662109375, -14.668701171875, -13.80078125, -12.932861328125, -12.06494140625, -11.197021484375, -10.3291015625, -9.461181640625, -8.59326171875, -7.725341796875, -6.857421875, -5.989501953125, -5.12158203125, -4.253662109375, -3.3857421875, -2.517822265625, -1.64990234375, -0.781982421875, 0.0859375, 0.953857421875, 1.82177734375, 2.689697265625, 3.5576171875, 4.425537109375, 5.29345703125, 6.161376953125, 7.029296875, 7.897216796875, 8.76513671875, 9.633056640625, 10.5009765625, 11.368896484375, 12.23681640625, 13.104736328125, 13.97265625, 14.840576171875, 15.70849609375, 16.576416015625, 17.4443359375, 18.312255859375, 19.18017578125, 20.048095703125, 20.916015625, 21.783935546875, 22.65185546875, 23.519775390625, 24.3876953125, 25.255615234375, 26.12353515625, 26.991455078125, 27.859375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 3.0, 4.0, 9.0, 8.0, 8.0, 13.0, 18.0, 30.0, 32.0, 29.0, 41.0, 43.0, 48.0, 92.0, 108.0, 160.0, 329.0, 759.0, 5474.0, 2742113.0, 391317.0, 3439.0, 640.0, 316.0, 189.0, 97.0, 67.0, 64.0, 47.0, 29.0, 38.0, 28.0, 28.0, 15.0, 13.0, 11.0, 9.0, 5.0, 7.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-64.5625, -62.5390625, -60.515625, -58.4921875, -56.46875, -54.4453125, -52.421875, -50.3984375, -48.375, -46.3515625, -44.328125, -42.3046875, -40.28125, -38.2578125, -36.234375, -34.2109375, -32.1875, -30.1640625, -28.140625, -26.1171875, -24.09375, -22.0703125, -20.046875, -18.0234375, -16.0, -13.9765625, -11.953125, -9.9296875, -7.90625, -5.8828125, -3.859375, -1.8359375, 0.1875, 2.2109375, 4.234375, 6.2578125, 8.28125, 10.3046875, 12.328125, 14.3515625, 16.375, 18.3984375, 20.421875, 22.4453125, 24.46875, 26.4921875, 28.515625, 30.5390625, 32.5625, 34.5859375, 36.609375, 38.6328125, 40.65625, 42.6796875, 44.703125, 46.7265625, 48.75, 50.7734375, 52.796875, 54.8203125, 56.84375, 58.8671875, 60.890625, 62.9140625, 64.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 42.0, 471.0, 454.0, 44.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.8292999267578, -123.87491607666016, -118.9205322265625, -113.96614837646484, -109.01176452636719, -104.05738067626953, -99.10299682617188, -94.14860534667969, -89.19422912597656, -84.2398452758789, -79.28546142578125, -74.3310775756836, -69.37669372558594, -64.42230987548828, -59.46792221069336, -54.5135383605957, -49.55915069580078, -44.604766845703125, -39.65038299560547, -34.69599914550781, -29.741613388061523, -24.787229537963867, -19.832843780517578, -14.878459930419922, -9.924076080322266, -4.969691753387451, -0.015307426452636719, 4.939077377319336, 9.893461227416992, 14.847845077514648, 19.802230834960938, 24.756614685058594, 29.71099853515625, 34.665382385253906, 39.61976623535156, 44.57415008544922, 49.528533935546875, 54.48291778564453, 59.43730545043945, 64.39169311523438, 69.3460693359375, 74.30045318603516, 79.25483703613281, 84.20922088623047, 89.16360473632812, 94.11798858642578, 99.07237243652344, 104.02676391601562, 108.98114776611328, 113.93553161621094, 118.8899154663086, 123.84429931640625, 128.79869079589844, 133.75306701660156, 138.70745849609375, 143.66183471679688, 148.61622619628906, 153.57061767578125, 158.52499389648438, 163.47938537597656, 168.4337615966797, 173.38815307617188, 178.342529296875, 183.2969207763672, 188.2512969970703]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 1.0, 5.0, 8.0, 7.0, 8.0, 10.0, 11.0, 19.0, 10.0, 13.0, 13.0, 18.0, 21.0, 26.0, 27.0, 29.0, 22.0, 35.0, 28.0, 27.0, 31.0, 32.0, 38.0, 36.0, 29.0, 37.0, 32.0, 30.0, 46.0, 29.0, 37.0, 25.0, 21.0, 28.0, 21.0, 17.0, 25.0, 20.0, 12.0, 17.0, 20.0, 12.0, 14.0, 11.0, 7.0, 4.0, 7.0, 7.0, 4.0, 3.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-59.55815124511719, -57.63398742675781, -55.70982360839844, -53.78565979003906, -51.86149978637695, -49.93733596801758, -48.0131721496582, -46.08900833129883, -44.16484832763672, -42.240684509277344, -40.31652069091797, -38.392356872558594, -36.468196868896484, -34.54403305053711, -32.619869232177734, -30.69570541381836, -28.771541595458984, -26.84737777709961, -24.923215866088867, -22.999052047729492, -21.07489013671875, -19.150726318359375, -17.2265625, -15.302399635314941, -13.378236770629883, -11.454073905944824, -9.529911041259766, -7.605747222900391, -5.681584358215332, -3.7574214935302734, -1.8332576751708984, 0.09090518951416016, 2.0150680541992188, 3.9392311573028564, 5.863394260406494, 7.787557601928711, 9.71172046661377, 11.635883331298828, 13.560047149658203, 15.484210014343262, 17.40837287902832, 19.332536697387695, 21.256698608398438, 23.180862426757812, 25.105026245117188, 27.02918815612793, 28.953351974487305, 30.877513885498047, 32.80167770385742, 34.7258415222168, 36.65000534057617, 38.57416534423828, 40.498329162597656, 42.42249298095703, 44.346656799316406, 46.27082061767578, 48.194984436035156, 50.11914825439453, 52.043312072753906, 53.96747589111328, 55.89163589477539, 57.815799713134766, 59.73996353149414, 61.664127349853516, 63.588287353515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 9.0, 7.0, 4.0, 7.0, 6.0, 12.0, 9.0, 11.0, 18.0, 20.0, 27.0, 27.0, 26.0, 28.0, 35.0, 32.0, 36.0, 43.0, 43.0, 52.0, 39.0, 37.0, 37.0, 62.0, 34.0, 38.0, 31.0, 39.0, 34.0, 29.0, 33.0, 20.0, 20.0, 17.0, 18.0, 14.0, 9.0, 12.0, 6.0, 4.0, 5.0, 1.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.7479248046875, -8.448974609375, -8.1500244140625, -7.85107421875, -7.5521240234375, -7.253173828125, -6.9542236328125, -6.6552734375, -6.3563232421875, -6.057373046875, -5.7584228515625, -5.45947265625, -5.1605224609375, -4.861572265625, -4.5626220703125, -4.263671875, -3.9647216796875, -3.665771484375, -3.3668212890625, -3.06787109375, -2.7689208984375, -2.469970703125, -2.1710205078125, -1.8720703125, -1.5731201171875, -1.274169921875, -0.9752197265625, -0.67626953125, -0.3773193359375, -0.078369140625, 0.2205810546875, 0.51953125, 0.8184814453125, 1.117431640625, 1.4163818359375, 1.71533203125, 2.0142822265625, 2.313232421875, 2.6121826171875, 2.9111328125, 3.2100830078125, 3.509033203125, 3.8079833984375, 4.10693359375, 4.4058837890625, 4.704833984375, 5.0037841796875, 5.302734375, 5.6016845703125, 5.900634765625, 6.1995849609375, 6.49853515625, 6.7974853515625, 7.096435546875, 7.3953857421875, 7.6943359375, 7.9932861328125, 8.292236328125, 8.5911865234375, 8.89013671875, 9.1890869140625, 9.488037109375, 9.7869873046875, 10.0859375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 0.0, 1.0, 6.0, 11.0, 8.0, 10.0, 13.0, 11.0, 18.0, 20.0, 18.0, 25.0, 50.0, 46.0, 66.0, 162.0, 318.0, 685.0, 2039.0, 7001.0, 36784.0, 612072.0, 3101198.0, 395110.0, 29288.0, 6170.0, 1808.0, 657.0, 256.0, 106.0, 67.0, 51.0, 42.0, 30.0, 33.0, 17.0, 16.0, 11.0, 9.0, 9.0, 5.0, 6.0, 5.0, 10.0, 0.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-25.6875, -24.8955078125, -24.103515625, -23.3115234375, -22.51953125, -21.7275390625, -20.935546875, -20.1435546875, -19.3515625, -18.5595703125, -17.767578125, -16.9755859375, -16.18359375, -15.3916015625, -14.599609375, -13.8076171875, -13.015625, -12.2236328125, -11.431640625, -10.6396484375, -9.84765625, -9.0556640625, -8.263671875, -7.4716796875, -6.6796875, -5.8876953125, -5.095703125, -4.3037109375, -3.51171875, -2.7197265625, -1.927734375, -1.1357421875, -0.34375, 0.4482421875, 1.240234375, 2.0322265625, 2.82421875, 3.6162109375, 4.408203125, 5.2001953125, 5.9921875, 6.7841796875, 7.576171875, 8.3681640625, 9.16015625, 9.9521484375, 10.744140625, 11.5361328125, 12.328125, 13.1201171875, 13.912109375, 14.7041015625, 15.49609375, 16.2880859375, 17.080078125, 17.8720703125, 18.6640625, 19.4560546875, 20.248046875, 21.0400390625, 21.83203125, 22.6240234375, 23.416015625, 24.2080078125, 25.0]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 11.0, 18.0, 11.0, 17.0, 23.0, 40.0, 59.0, 95.0, 131.0, 168.0, 272.0, 395.0, 559.0, 620.0, 531.0, 362.0, 254.0, 153.0, 128.0, 78.0, 44.0, 37.0, 24.0, 12.0, 11.0, 10.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.65625, -21.02685546875, -20.3974609375, -19.76806640625, -19.138671875, -18.50927734375, -17.8798828125, -17.25048828125, -16.62109375, -15.99169921875, -15.3623046875, -14.73291015625, -14.103515625, -13.47412109375, -12.8447265625, -12.21533203125, -11.5859375, -10.95654296875, -10.3271484375, -9.69775390625, -9.068359375, -8.43896484375, -7.8095703125, -7.18017578125, -6.55078125, -5.92138671875, -5.2919921875, -4.66259765625, -4.033203125, -3.40380859375, -2.7744140625, -2.14501953125, -1.515625, -0.88623046875, -0.2568359375, 0.37255859375, 1.001953125, 1.63134765625, 2.2607421875, 2.89013671875, 3.51953125, 4.14892578125, 4.7783203125, 5.40771484375, 6.037109375, 6.66650390625, 7.2958984375, 7.92529296875, 8.5546875, 9.18408203125, 9.8134765625, 10.44287109375, 11.072265625, 11.70166015625, 12.3310546875, 12.96044921875, 13.58984375, 14.21923828125, 14.8486328125, 15.47802734375, 16.107421875, 16.73681640625, 17.3662109375, 17.99560546875, 18.625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 11.0, 9.0, 27.0, 36.0, 39.0, 66.0, 78.0, 102.0, 141.0, 240.0, 354.0, 942.0, 6287.0, 773787.0, 3397200.0, 12376.0, 1244.0, 471.0, 247.0, 170.0, 111.0, 85.0, 51.0, 48.0, 42.0, 23.0, 19.0, 14.0, 10.0, 9.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-90.5625, -88.18603515625, -85.8095703125, -83.43310546875, -81.056640625, -78.68017578125, -76.3037109375, -73.92724609375, -71.55078125, -69.17431640625, -66.7978515625, -64.42138671875, -62.044921875, -59.66845703125, -57.2919921875, -54.91552734375, -52.5390625, -50.16259765625, -47.7861328125, -45.40966796875, -43.033203125, -40.65673828125, -38.2802734375, -35.90380859375, -33.52734375, -31.15087890625, -28.7744140625, -26.39794921875, -24.021484375, -21.64501953125, -19.2685546875, -16.89208984375, -14.515625, -12.13916015625, -9.7626953125, -7.38623046875, -5.009765625, -2.63330078125, -0.2568359375, 2.11962890625, 4.49609375, 6.87255859375, 9.2490234375, 11.62548828125, 14.001953125, 16.37841796875, 18.7548828125, 21.13134765625, 23.5078125, 25.88427734375, 28.2607421875, 30.63720703125, 33.013671875, 35.39013671875, 37.7666015625, 40.14306640625, 42.51953125, 44.89599609375, 47.2724609375, 49.64892578125, 52.025390625, 54.40185546875, 56.7783203125, 59.15478515625, 61.53125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 11.0, 31.0, 74.0, 155.0, 248.0, 251.0, 146.0, 64.0, 16.0, 10.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.1055450439453, -158.2458953857422, -154.38623046875, -150.52658081054688, -146.6669158935547, -142.80726623535156, -138.94760131835938, -135.08795166015625, -131.22830200195312, -127.36864471435547, -123.50898742675781, -119.64933776855469, -115.78968048095703, -111.93002319335938, -108.07036590576172, -104.21070861816406, -100.3510513305664, -96.49139404296875, -92.6317367553711, -88.77207946777344, -84.91242980957031, -81.05277252197266, -77.193115234375, -73.33345794677734, -69.47380065917969, -65.61414337158203, -61.75448989868164, -57.894832611083984, -54.035179138183594, -50.17552185058594, -46.31586456298828, -42.456207275390625, -38.5965576171875, -34.736900329589844, -30.877246856689453, -27.017589569091797, -23.157934188842773, -19.29827880859375, -15.438621520996094, -11.57896614074707, -7.719310760498047, -3.8596549034118652, 9.5367431640625e-07, 3.8596572875976562, 7.71931266784668, 11.578968048095703, 15.43862533569336, 19.298280715942383, 23.157936096191406, 27.01759147644043, 30.877246856689453, 34.73690414428711, 38.5965576171875, 42.456214904785156, 46.31587219238281, 50.17552947998047, 54.03518295288086, 57.894840240478516, 61.754493713378906, 65.61415100097656, 69.47380828857422, 73.33346557617188, 77.193115234375, 81.05277252197266, 84.91242980957031]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 11.0, 4.0, 6.0, 9.0, 11.0, 9.0, 23.0, 16.0, 22.0, 25.0, 26.0, 37.0, 32.0, 27.0, 38.0, 39.0, 40.0, 43.0, 30.0, 43.0, 46.0, 47.0, 55.0, 47.0, 43.0, 37.0, 40.0, 31.0, 25.0, 23.0, 12.0, 17.0, 13.0, 11.0, 11.0, 18.0, 12.0, 4.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.865867614746094, -52.09005355834961, -50.31423568725586, -48.538421630859375, -46.76260757446289, -44.98678970336914, -43.210975646972656, -41.435157775878906, -39.65934371948242, -37.88352966308594, -36.10771179199219, -34.3318977355957, -32.55608367919922, -30.78026580810547, -29.004451751708984, -27.228635787963867, -25.452821731567383, -23.677005767822266, -21.90119171142578, -20.125375747680664, -18.349559783935547, -16.573745727539062, -14.797929763793945, -13.022113800048828, -11.246298789978027, -9.470483779907227, -7.694667816162109, -5.918852806091309, -4.14303731918335, -2.3672218322753906, -0.5914068222045898, 1.1844091415405273, 2.960224151611328, 4.736039638519287, 6.511855125427246, 8.287670135498047, 10.063486099243164, 11.839301109313965, 13.615116119384766, 15.390932083129883, 17.166748046875, 18.942564010620117, 20.7183780670166, 22.49419403076172, 24.270009994506836, 26.045825958251953, 27.821640014648438, 29.597455978393555, 31.37327003479004, 33.149085998535156, 34.92490005493164, 36.700714111328125, 38.476531982421875, 40.25234603881836, 42.028160095214844, 43.803977966308594, 45.57979202270508, 47.35560607910156, 49.13142395019531, 50.9072380065918, 52.68305206298828, 54.45886993408203, 56.234683990478516, 58.010498046875, 59.78631591796875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 6.0, 15.0, 10.0, 15.0, 9.0, 15.0, 20.0, 17.0, 24.0, 27.0, 19.0, 21.0, 30.0, 31.0, 35.0, 31.0, 33.0, 47.0, 40.0, 38.0, 35.0, 42.0, 41.0, 47.0, 33.0, 37.0, 40.0, 38.0, 23.0, 23.0, 29.0, 13.0, 13.0, 18.0, 13.0, 14.0, 9.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.921875, -9.634521484375, -9.34716796875, -9.059814453125, -8.7724609375, -8.485107421875, -8.19775390625, -7.910400390625, -7.623046875, -7.335693359375, -7.04833984375, -6.760986328125, -6.4736328125, -6.186279296875, -5.89892578125, -5.611572265625, -5.32421875, -5.036865234375, -4.74951171875, -4.462158203125, -4.1748046875, -3.887451171875, -3.60009765625, -3.312744140625, -3.025390625, -2.738037109375, -2.45068359375, -2.163330078125, -1.8759765625, -1.588623046875, -1.30126953125, -1.013916015625, -0.7265625, -0.439208984375, -0.15185546875, 0.135498046875, 0.4228515625, 0.710205078125, 0.99755859375, 1.284912109375, 1.572265625, 1.859619140625, 2.14697265625, 2.434326171875, 2.7216796875, 3.009033203125, 3.29638671875, 3.583740234375, 3.87109375, 4.158447265625, 4.44580078125, 4.733154296875, 5.0205078125, 5.307861328125, 5.59521484375, 5.882568359375, 6.169921875, 6.457275390625, 6.74462890625, 7.031982421875, 7.3193359375, 7.606689453125, 7.89404296875, 8.181396484375, 8.46875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 6.0, 9.0, 11.0, 12.0, 26.0, 33.0, 55.0, 80.0, 122.0, 198.0, 299.0, 437.0, 652.0, 980.0, 1390.0, 2107.0, 3334.0, 4769.0, 7394.0, 11065.0, 17093.0, 26534.0, 41011.0, 64601.0, 103356.0, 165459.0, 212187.0, 140626.0, 88323.0, 55046.0, 35440.0, 22600.0, 14491.0, 9617.0, 6478.0, 4192.0, 2797.0, 1917.0, 1267.0, 830.0, 544.0, 359.0, 279.0, 182.0, 122.0, 68.0, 54.0, 49.0, 23.0, 19.0, 10.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.234283447265625, -1.19219970703125, -1.150115966796875, -1.1080322265625, -1.065948486328125, -1.02386474609375, -0.981781005859375, -0.939697265625, -0.897613525390625, -0.85552978515625, -0.813446044921875, -0.7713623046875, -0.729278564453125, -0.68719482421875, -0.645111083984375, -0.60302734375, -0.560943603515625, -0.51885986328125, -0.476776123046875, -0.4346923828125, -0.392608642578125, -0.35052490234375, -0.308441162109375, -0.266357421875, -0.224273681640625, -0.18218994140625, -0.140106201171875, -0.0980224609375, -0.055938720703125, -0.01385498046875, 0.028228759765625, 0.0703125, 0.112396240234375, 0.15447998046875, 0.196563720703125, 0.2386474609375, 0.280731201171875, 0.32281494140625, 0.364898681640625, 0.406982421875, 0.449066162109375, 0.49114990234375, 0.533233642578125, 0.5753173828125, 0.617401123046875, 0.65948486328125, 0.701568603515625, 0.74365234375, 0.785736083984375, 0.82781982421875, 0.869903564453125, 0.9119873046875, 0.954071044921875, 0.99615478515625, 1.038238525390625, 1.080322265625, 1.122406005859375, 1.16448974609375, 1.206573486328125, 1.2486572265625, 1.290740966796875, 1.33282470703125, 1.374908447265625, 1.4169921875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 9.0, 4.0, 10.0, 14.0, 16.0, 22.0, 13.0, 20.0, 19.0, 26.0, 38.0, 31.0, 36.0, 48.0, 45.0, 42.0, 52.0, 40.0, 1079.0, 43.0, 41.0, 32.0, 35.0, 24.0, 36.0, 28.0, 27.0, 25.0, 31.0, 29.0, 17.0, 13.0, 14.0, 8.0, 10.0, 8.0, 11.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96484375, -5.765380859375, -5.56591796875, -5.366455078125, -5.1669921875, -4.967529296875, -4.76806640625, -4.568603515625, -4.369140625, -4.169677734375, -3.97021484375, -3.770751953125, -3.5712890625, -3.371826171875, -3.17236328125, -2.972900390625, -2.7734375, -2.573974609375, -2.37451171875, -2.175048828125, -1.9755859375, -1.776123046875, -1.57666015625, -1.377197265625, -1.177734375, -0.978271484375, -0.77880859375, -0.579345703125, -0.3798828125, -0.180419921875, 0.01904296875, 0.218505859375, 0.41796875, 0.617431640625, 0.81689453125, 1.016357421875, 1.2158203125, 1.415283203125, 1.61474609375, 1.814208984375, 2.013671875, 2.213134765625, 2.41259765625, 2.612060546875, 2.8115234375, 3.010986328125, 3.21044921875, 3.409912109375, 3.609375, 3.808837890625, 4.00830078125, 4.207763671875, 4.4072265625, 4.606689453125, 4.80615234375, 5.005615234375, 5.205078125, 5.404541015625, 5.60400390625, 5.803466796875, 6.0029296875, 6.202392578125, 6.40185546875, 6.601318359375, 6.80078125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 17.0, 23.0, 45.0, 55.0, 79.0, 108.0, 213.0, 284.0, 517.0, 747.0, 1124.0, 1723.0, 2702.0, 4272.0, 6803.0, 10780.0, 16974.0, 26766.0, 42282.0, 68353.0, 108503.0, 171609.0, 1256187.0, 139284.0, 88107.0, 55507.0, 34449.0, 21652.0, 13749.0, 8725.0, 5563.0, 3518.0, 2296.0, 1520.0, 886.0, 588.0, 365.0, 242.0, 196.0, 102.0, 69.0, 56.0, 27.0, 16.0, 15.0, 9.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2469024658203125, -1.205718994140625, -1.1645355224609375, -1.12335205078125, -1.0821685791015625, -1.040985107421875, -0.9998016357421875, -0.9586181640625, -0.9174346923828125, -0.876251220703125, -0.8350677490234375, -0.79388427734375, -0.7527008056640625, -0.711517333984375, -0.6703338623046875, -0.629150390625, -0.5879669189453125, -0.546783447265625, -0.5055999755859375, -0.46441650390625, -0.4232330322265625, -0.382049560546875, -0.3408660888671875, -0.2996826171875, -0.2584991455078125, -0.217315673828125, -0.1761322021484375, -0.13494873046875, -0.0937652587890625, -0.052581787109375, -0.0113983154296875, 0.02978515625, 0.0709686279296875, 0.112152099609375, 0.1533355712890625, 0.19451904296875, 0.2357025146484375, 0.276885986328125, 0.3180694580078125, 0.3592529296875, 0.4004364013671875, 0.441619873046875, 0.4828033447265625, 0.52398681640625, 0.5651702880859375, 0.606353759765625, 0.6475372314453125, 0.688720703125, 0.7299041748046875, 0.771087646484375, 0.8122711181640625, 0.85345458984375, 0.8946380615234375, 0.935821533203125, 0.9770050048828125, 1.0181884765625, 1.0593719482421875, 1.100555419921875, 1.1417388916015625, 1.18292236328125, 1.2241058349609375, 1.265289306640625, 1.3064727783203125, 1.34765625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 4.0, 9.0, 7.0, 8.0, 10.0, 15.0, 31.0, 29.0, 41.0, 65.0, 65.0, 73.0, 80.0, 85.0, 100.0, 70.0, 67.0, 52.0, 41.0, 38.0, 24.0, 18.0, 9.0, 14.0, 15.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036334991455078125, -0.003529101610183716, -0.003424704074859619, -0.0033203065395355225, -0.0032159090042114258, -0.003111511468887329, -0.0030071139335632324, -0.0029027163982391357, -0.002798318862915039, -0.0026939213275909424, -0.0025895237922668457, -0.002485126256942749, -0.0023807287216186523, -0.0022763311862945557, -0.002171933650970459, -0.0020675361156463623, -0.0019631385803222656, -0.001858741044998169, -0.0017543435096740723, -0.0016499459743499756, -0.001545548439025879, -0.0014411509037017822, -0.0013367533683776855, -0.0012323558330535889, -0.0011279582977294922, -0.0010235607624053955, -0.0009191632270812988, -0.0008147656917572021, -0.0007103681564331055, -0.0006059706211090088, -0.0005015730857849121, -0.00039717555046081543, -0.00029277801513671875, -0.00018838047981262207, -8.398294448852539e-05, 2.041459083557129e-05, 0.00012481212615966797, 0.00022920966148376465, 0.00033360719680786133, 0.000438004732131958, 0.0005424022674560547, 0.0006467998027801514, 0.000751197338104248, 0.0008555948734283447, 0.0009599924087524414, 0.001064389944076538, 0.0011687874794006348, 0.0012731850147247314, 0.0013775825500488281, 0.0014819800853729248, 0.0015863776206970215, 0.0016907751560211182, 0.0017951726913452148, 0.0018995702266693115, 0.002003967761993408, 0.002108365297317505, 0.0022127628326416016, 0.0023171603679656982, 0.002421557903289795, 0.0025259554386138916, 0.0026303529739379883, 0.002734750509262085, 0.0028391480445861816, 0.0029435455799102783, 0.003047943115234375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 8.0, 14.0, 20.0, 14.0, 23.0, 28.0, 43.0, 54.0, 96.0, 147.0, 252.0, 687.0, 48673.0, 996295.0, 1241.0, 337.0, 190.0, 122.0, 75.0, 56.0, 39.0, 29.0, 20.0, 22.0, 10.0, 4.0, 11.0, 6.0, 6.0, 9.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059783935546875, -0.057584285736083984, -0.05538463592529297, -0.05318498611450195, -0.05098533630371094, -0.04878568649291992, -0.046586036682128906, -0.04438638687133789, -0.042186737060546875, -0.03998708724975586, -0.037787437438964844, -0.03558778762817383, -0.03338813781738281, -0.031188488006591797, -0.02898883819580078, -0.026789188385009766, -0.02458953857421875, -0.022389888763427734, -0.02019023895263672, -0.017990589141845703, -0.015790939331054688, -0.013591289520263672, -0.011391639709472656, -0.00919198989868164, -0.006992340087890625, -0.004792690277099609, -0.0025930404663085938, -0.0003933906555175781, 0.0018062591552734375, 0.004005908966064453, 0.006205558776855469, 0.008405208587646484, 0.0106048583984375, 0.012804508209228516, 0.015004158020019531, 0.017203807830810547, 0.019403457641601562, 0.021603107452392578, 0.023802757263183594, 0.02600240707397461, 0.028202056884765625, 0.03040170669555664, 0.032601356506347656, 0.03480100631713867, 0.03700065612792969, 0.0392003059387207, 0.04139995574951172, 0.043599605560302734, 0.04579925537109375, 0.047998905181884766, 0.05019855499267578, 0.0523982048034668, 0.05459785461425781, 0.05679750442504883, 0.058997154235839844, 0.06119680404663086, 0.06339645385742188, 0.06559610366821289, 0.0677957534790039, 0.06999540328979492, 0.07219505310058594, 0.07439470291137695, 0.07659435272216797, 0.07879400253295898, 0.08099365234375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 13.0, 503.0, 488.0, 15.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011714515276253223, -0.0007818718440830708, -0.00039229216054081917, -2.712476998567581e-06, 0.000386867206543684, 0.0007764468900859356, 0.0011660265736281872, 0.0015556062571704388, 0.0019451859407126904, 0.002334765624254942, 0.0027243453077971935, 0.003113924991339445, 0.0035035046748816967, 0.0038930843584239483, 0.0042826640419662, 0.0046722437255084515, 0.005061823409050703, 0.005451403092592955, 0.005840982776135206, 0.006230562459677458, 0.006620142143219709, 0.007009721826761961, 0.007399301510304213, 0.007788881193846464, 0.008178461343050003, 0.008568041026592255, 0.008957620710134506, 0.009347200393676758, 0.00973678007721901, 0.010126359760761261, 0.010515939444303513, 0.010905519127845764, 0.011295098811388016, 0.011684678494930267, 0.012074258178472519, 0.01246383786201477, 0.012853417545557022, 0.013242997229099274, 0.013632576912641525, 0.014022156596183777, 0.014411736279726028, 0.01480131596326828, 0.015190895646810532, 0.015580475330352783, 0.015970055013895035, 0.016359634697437286, 0.016749214380979538, 0.01713879406452179, 0.01752837374806404, 0.017917953431606293, 0.018307533115148544, 0.018697112798690796, 0.019086692482233047, 0.0194762721657753, 0.01986585184931755, 0.020255431532859802, 0.020645011216402054, 0.021034590899944305, 0.021424170583486557, 0.02181375026702881, 0.02220332995057106, 0.022592909634113312, 0.022982489317655563, 0.023372069001197815, 0.023761648684740067]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 0.0, 3.0, 5.0, 4.0, 4.0, 6.0, 9.0, 10.0, 4.0, 8.0, 9.0, 9.0, 16.0, 17.0, 24.0, 19.0, 17.0, 30.0, 25.0, 30.0, 25.0, 30.0, 45.0, 45.0, 42.0, 40.0, 42.0, 40.0, 41.0, 38.0, 37.0, 32.0, 43.0, 31.0, 35.0, 28.0, 24.0, 18.0, 13.0, 22.0, 10.0, 13.0, 9.0, 9.0, 12.0, 11.0, 6.0, 5.0, 2.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012637972831726074, -0.001223200000822544, -0.0011826027184724808, -0.0011420054361224174, -0.0011014081537723541, -0.0010608108714222908, -0.0010202135890722275, -0.0009796163067221642, -0.0009390190243721008, -0.0008984217420220375, -0.0008578244596719742, -0.0008172271773219109, -0.0007766298949718475, -0.0007360326126217842, -0.0006954353302717209, -0.0006548380479216576, -0.0006142407655715942, -0.0005736434832215309, -0.0005330462008714676, -0.0004924489185214043, -0.00045185163617134094, -0.0004112543538212776, -0.0003706570714712143, -0.00033005978912115097, -0.00028946250677108765, -0.0002488652244210243, -0.000208267942070961, -0.00016767065972089767, -0.00012707337737083435, -8.647609502077103e-05, -4.58788126707077e-05, -5.281530320644379e-06, 3.5315752029418945e-05, 7.591303437948227e-05, 0.0001165103167295456, 0.00015710759907960892, 0.00019770488142967224, 0.00023830216377973557, 0.0002788994461297989, 0.0003194967284798622, 0.00036009401082992554, 0.00040069129317998886, 0.0004412885755300522, 0.0004818858578801155, 0.0005224831402301788, 0.0005630804225802422, 0.0006036777049303055, 0.0006442749872803688, 0.0006848722696304321, 0.0007254695519804955, 0.0007660668343305588, 0.0008066641166806221, 0.0008472613990306854, 0.0008878586813807487, 0.0009284559637308121, 0.0009690532460808754, 0.0010096505284309387, 0.001050247810781002, 0.0010908450931310654, 0.0011314423754811287, 0.001172039657831192, 0.0012126369401812553, 0.0012532342225313187, 0.001293831504881382, 0.0013344287872314453]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 6.0, 15.0, 10.0, 15.0, 9.0, 15.0, 20.0, 17.0, 24.0, 27.0, 19.0, 21.0, 30.0, 31.0, 35.0, 31.0, 33.0, 47.0, 40.0, 38.0, 35.0, 42.0, 41.0, 47.0, 33.0, 37.0, 40.0, 38.0, 23.0, 23.0, 29.0, 13.0, 13.0, 18.0, 13.0, 14.0, 9.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.921875, -9.634521484375, -9.34716796875, -9.059814453125, -8.7724609375, -8.485107421875, -8.19775390625, -7.910400390625, -7.623046875, -7.335693359375, -7.04833984375, -6.760986328125, -6.4736328125, -6.186279296875, -5.89892578125, -5.611572265625, -5.32421875, -5.036865234375, -4.74951171875, -4.462158203125, -4.1748046875, -3.887451171875, -3.60009765625, -3.312744140625, -3.025390625, -2.738037109375, -2.45068359375, -2.163330078125, -1.8759765625, -1.588623046875, -1.30126953125, -1.013916015625, -0.7265625, -0.439208984375, -0.15185546875, 0.135498046875, 0.4228515625, 0.710205078125, 0.99755859375, 1.284912109375, 1.572265625, 1.859619140625, 2.14697265625, 2.434326171875, 2.7216796875, 3.009033203125, 3.29638671875, 3.583740234375, 3.87109375, 4.158447265625, 4.44580078125, 4.733154296875, 5.0205078125, 5.307861328125, 5.59521484375, 5.882568359375, 6.169921875, 6.457275390625, 6.74462890625, 7.031982421875, 7.3193359375, 7.606689453125, 7.89404296875, 8.181396484375, 8.46875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 11.0, 8.0, 13.0, 30.0, 28.0, 31.0, 29.0, 48.0, 52.0, 72.0, 89.0, 142.0, 193.0, 249.0, 304.0, 434.0, 636.0, 1263.0, 3553.0, 14187.0, 80078.0, 832710.0, 91245.0, 15553.0, 3854.0, 1238.0, 667.0, 441.0, 350.0, 262.0, 178.0, 162.0, 104.0, 74.0, 52.0, 49.0, 38.0, 23.0, 27.0, 18.0, 10.0, 14.0, 10.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.078125, -24.351806640625, -23.62548828125, -22.899169921875, -22.1728515625, -21.446533203125, -20.72021484375, -19.993896484375, -19.267578125, -18.541259765625, -17.81494140625, -17.088623046875, -16.3623046875, -15.635986328125, -14.90966796875, -14.183349609375, -13.45703125, -12.730712890625, -12.00439453125, -11.278076171875, -10.5517578125, -9.825439453125, -9.09912109375, -8.372802734375, -7.646484375, -6.920166015625, -6.19384765625, -5.467529296875, -4.7412109375, -4.014892578125, -3.28857421875, -2.562255859375, -1.8359375, -1.109619140625, -0.38330078125, 0.343017578125, 1.0693359375, 1.795654296875, 2.52197265625, 3.248291015625, 3.974609375, 4.700927734375, 5.42724609375, 6.153564453125, 6.8798828125, 7.606201171875, 8.33251953125, 9.058837890625, 9.78515625, 10.511474609375, 11.23779296875, 11.964111328125, 12.6904296875, 13.416748046875, 14.14306640625, 14.869384765625, 15.595703125, 16.322021484375, 17.04833984375, 17.774658203125, 18.5009765625, 19.227294921875, 19.95361328125, 20.679931640625, 21.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 5.0, 8.0, 6.0, 11.0, 10.0, 20.0, 17.0, 20.0, 21.0, 22.0, 34.0, 41.0, 26.0, 41.0, 50.0, 54.0, 61.0, 180.0, 1741.0, 192.0, 71.0, 57.0, 50.0, 39.0, 37.0, 35.0, 32.0, 26.0, 22.0, 22.0, 10.0, 14.0, 20.0, 10.0, 9.0, 8.0, 5.0, 1.0, 5.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.875, -28.984375, -28.09375, -27.203125, -26.3125, -25.421875, -24.53125, -23.640625, -22.75, -21.859375, -20.96875, -20.078125, -19.1875, -18.296875, -17.40625, -16.515625, -15.625, -14.734375, -13.84375, -12.953125, -12.0625, -11.171875, -10.28125, -9.390625, -8.5, -7.609375, -6.71875, -5.828125, -4.9375, -4.046875, -3.15625, -2.265625, -1.375, -0.484375, 0.40625, 1.296875, 2.1875, 3.078125, 3.96875, 4.859375, 5.75, 6.640625, 7.53125, 8.421875, 9.3125, 10.203125, 11.09375, 11.984375, 12.875, 13.765625, 14.65625, 15.546875, 16.4375, 17.328125, 18.21875, 19.109375, 20.0, 20.890625, 21.78125, 22.671875, 23.5625, 24.453125, 25.34375, 26.234375, 27.125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 2.0, 9.0, 13.0, 14.0, 20.0, 16.0, 19.0, 20.0, 32.0, 43.0, 41.0, 46.0, 89.0, 102.0, 192.0, 356.0, 1327.0, 31649.0, 3090045.0, 19573.0, 1078.0, 345.0, 185.0, 116.0, 66.0, 57.0, 36.0, 32.0, 33.0, 30.0, 16.0, 25.0, 12.0, 10.0, 13.0, 4.0, 5.0, 10.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.1875, -72.7177734375, -70.248046875, -67.7783203125, -65.30859375, -62.8388671875, -60.369140625, -57.8994140625, -55.4296875, -52.9599609375, -50.490234375, -48.0205078125, -45.55078125, -43.0810546875, -40.611328125, -38.1416015625, -35.671875, -33.2021484375, -30.732421875, -28.2626953125, -25.79296875, -23.3232421875, -20.853515625, -18.3837890625, -15.9140625, -13.4443359375, -10.974609375, -8.5048828125, -6.03515625, -3.5654296875, -1.095703125, 1.3740234375, 3.84375, 6.3134765625, 8.783203125, 11.2529296875, 13.72265625, 16.1923828125, 18.662109375, 21.1318359375, 23.6015625, 26.0712890625, 28.541015625, 31.0107421875, 33.48046875, 35.9501953125, 38.419921875, 40.8896484375, 43.359375, 45.8291015625, 48.298828125, 50.7685546875, 53.23828125, 55.7080078125, 58.177734375, 60.6474609375, 63.1171875, 65.5869140625, 68.056640625, 70.5263671875, 72.99609375, 75.4658203125, 77.935546875, 80.4052734375, 82.875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 19.0, 121.0, 321.0, 377.0, 129.0, 32.0, 9.0, 4.0, 1.0, 1.0], "bins": [-157.57447814941406, -154.81683349609375, -152.05917358398438, -149.30152893066406, -146.54388427734375, -143.78622436523438, -141.02857971191406, -138.27093505859375, -135.51327514648438, -132.75563049316406, -129.9979705810547, -127.24032592773438, -124.48267364501953, -121.72502136230469, -118.96737670898438, -116.20972442626953, -113.45207977294922, -110.69442749023438, -107.93678283691406, -105.17913055419922, -102.42147827148438, -99.66383361816406, -96.90618133544922, -94.14852905273438, -91.39088439941406, -88.63323211669922, -85.8755874633789, -83.11793518066406, -80.36028289794922, -77.60263061523438, -74.84498596191406, -72.08733367919922, -69.3296890258789, -66.57203674316406, -63.814388275146484, -61.056739807128906, -58.29908752441406, -55.541439056396484, -52.783790588378906, -50.02613830566406, -47.268489837646484, -44.510841369628906, -41.75318908691406, -38.995540618896484, -36.237892150878906, -33.48023986816406, -30.722591400146484, -27.964941024780273, -25.207290649414062, -22.44964027404785, -19.69198989868164, -16.934341430664062, -14.176691055297852, -11.41904067993164, -8.661392211914062, -5.903741836547852, -3.1460914611816406, -0.3884415626525879, 2.369208335876465, 5.126857757568359, 7.88450813293457, 10.642158508300781, 13.39980697631836, 16.15745735168457, 18.91510772705078]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 5.0, 17.0, 20.0, 15.0, 14.0, 31.0, 34.0, 29.0, 36.0, 36.0, 46.0, 55.0, 36.0, 42.0, 48.0, 47.0, 58.0, 46.0, 34.0, 47.0, 33.0, 32.0, 34.0, 32.0, 24.0, 22.0, 28.0, 19.0, 14.0, 12.0, 12.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-83.14183807373047, -80.67510986328125, -78.2083740234375, -75.74164581298828, -73.27491760253906, -70.80818176269531, -68.3414535522461, -65.87472534179688, -63.407989501953125, -60.94125747680664, -58.47452926635742, -56.00779724121094, -53.54106521606445, -51.07433319091797, -48.60760498046875, -46.140872955322266, -43.67414474487305, -41.20741271972656, -38.740684509277344, -36.27395248413086, -33.807220458984375, -31.340490341186523, -28.873760223388672, -26.407028198242188, -23.940298080444336, -21.473567962646484, -19.0068359375, -16.54010581970215, -14.07337474822998, -11.606643676757812, -9.139913558959961, -6.673181533813477, -4.206451416015625, -1.7397205829620361, 0.7270102500915527, 3.1937408447265625, 5.6604719161987305, 8.127202987670898, 10.59393310546875, 13.060665130615234, 15.527395248413086, 17.994125366210938, 20.460857391357422, 22.927587509155273, 25.394317626953125, 27.86104965209961, 30.32777976989746, 32.79450988769531, 35.2612419128418, 37.72797393798828, 40.1947021484375, 42.661434173583984, 45.12816619873047, 47.59489440917969, 50.06162643432617, 52.528358459472656, 54.995086669921875, 57.46181869506836, 59.92854690551758, 62.39527893066406, 64.86200714111328, 67.32874298095703, 69.79547119140625, 72.26220703125, 74.72893524169922]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 9.0, 8.0, 14.0, 19.0, 14.0, 16.0, 17.0, 18.0, 23.0, 32.0, 25.0, 29.0, 27.0, 34.0, 29.0, 24.0, 51.0, 49.0, 47.0, 53.0, 60.0, 50.0, 41.0, 44.0, 37.0, 26.0, 29.0, 32.0, 20.0, 20.0, 15.0, 10.0, 20.0, 10.0, 10.0, 5.0, 10.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.015625, -10.695068359375, -10.37451171875, -10.053955078125, -9.7333984375, -9.412841796875, -9.09228515625, -8.771728515625, -8.451171875, -8.130615234375, -7.81005859375, -7.489501953125, -7.1689453125, -6.848388671875, -6.52783203125, -6.207275390625, -5.88671875, -5.566162109375, -5.24560546875, -4.925048828125, -4.6044921875, -4.283935546875, -3.96337890625, -3.642822265625, -3.322265625, -3.001708984375, -2.68115234375, -2.360595703125, -2.0400390625, -1.719482421875, -1.39892578125, -1.078369140625, -0.7578125, -0.437255859375, -0.11669921875, 0.203857421875, 0.5244140625, 0.844970703125, 1.16552734375, 1.486083984375, 1.806640625, 2.127197265625, 2.44775390625, 2.768310546875, 3.0888671875, 3.409423828125, 3.72998046875, 4.050537109375, 4.37109375, 4.691650390625, 5.01220703125, 5.332763671875, 5.6533203125, 5.973876953125, 6.29443359375, 6.614990234375, 6.935546875, 7.256103515625, 7.57666015625, 7.897216796875, 8.2177734375, 8.538330078125, 8.85888671875, 9.179443359375, 9.5]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 5.0, 11.0, 12.0, 7.0, 17.0, 22.0, 19.0, 40.0, 48.0, 75.0, 94.0, 130.0, 176.0, 301.0, 493.0, 1083.0, 2876.0, 9142.0, 44582.0, 702334.0, 2995714.0, 393973.0, 31358.0, 7145.0, 2367.0, 918.0, 470.0, 280.0, 164.0, 114.0, 87.0, 49.0, 51.0, 32.0, 19.0, 19.0, 11.0, 15.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.296875, -26.50341796875, -25.7099609375, -24.91650390625, -24.123046875, -23.32958984375, -22.5361328125, -21.74267578125, -20.94921875, -20.15576171875, -19.3623046875, -18.56884765625, -17.775390625, -16.98193359375, -16.1884765625, -15.39501953125, -14.6015625, -13.80810546875, -13.0146484375, -12.22119140625, -11.427734375, -10.63427734375, -9.8408203125, -9.04736328125, -8.25390625, -7.46044921875, -6.6669921875, -5.87353515625, -5.080078125, -4.28662109375, -3.4931640625, -2.69970703125, -1.90625, -1.11279296875, -0.3193359375, 0.47412109375, 1.267578125, 2.06103515625, 2.8544921875, 3.64794921875, 4.44140625, 5.23486328125, 6.0283203125, 6.82177734375, 7.615234375, 8.40869140625, 9.2021484375, 9.99560546875, 10.7890625, 11.58251953125, 12.3759765625, 13.16943359375, 13.962890625, 14.75634765625, 15.5498046875, 16.34326171875, 17.13671875, 17.93017578125, 18.7236328125, 19.51708984375, 20.310546875, 21.10400390625, 21.8974609375, 22.69091796875, 23.484375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 16.0, 17.0, 34.0, 64.0, 105.0, 204.0, 316.0, 551.0, 787.0, 767.0, 530.0, 259.0, 170.0, 92.0, 62.0, 33.0, 30.0, 19.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.015625, -23.154052734375, -22.29248046875, -21.430908203125, -20.5693359375, -19.707763671875, -18.84619140625, -17.984619140625, -17.123046875, -16.261474609375, -15.39990234375, -14.538330078125, -13.6767578125, -12.815185546875, -11.95361328125, -11.092041015625, -10.23046875, -9.368896484375, -8.50732421875, -7.645751953125, -6.7841796875, -5.922607421875, -5.06103515625, -4.199462890625, -3.337890625, -2.476318359375, -1.61474609375, -0.753173828125, 0.1083984375, 0.969970703125, 1.83154296875, 2.693115234375, 3.5546875, 4.416259765625, 5.27783203125, 6.139404296875, 7.0009765625, 7.862548828125, 8.72412109375, 9.585693359375, 10.447265625, 11.308837890625, 12.17041015625, 13.031982421875, 13.8935546875, 14.755126953125, 15.61669921875, 16.478271484375, 17.33984375, 18.201416015625, 19.06298828125, 19.924560546875, 20.7861328125, 21.647705078125, 22.50927734375, 23.370849609375, 24.232421875, 25.093994140625, 25.95556640625, 26.817138671875, 27.6787109375, 28.540283203125, 29.40185546875, 30.263427734375, 31.125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 14.0, 19.0, 19.0, 22.0, 38.0, 38.0, 79.0, 101.0, 133.0, 203.0, 339.0, 734.0, 2516.0, 28444.0, 3683215.0, 467066.0, 8506.0, 1403.0, 553.0, 282.0, 162.0, 114.0, 84.0, 45.0, 39.0, 31.0, 19.0, 20.0, 10.0, 7.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-73.75, -71.630859375, -69.51171875, -67.392578125, -65.2734375, -63.154296875, -61.03515625, -58.916015625, -56.796875, -54.677734375, -52.55859375, -50.439453125, -48.3203125, -46.201171875, -44.08203125, -41.962890625, -39.84375, -37.724609375, -35.60546875, -33.486328125, -31.3671875, -29.248046875, -27.12890625, -25.009765625, -22.890625, -20.771484375, -18.65234375, -16.533203125, -14.4140625, -12.294921875, -10.17578125, -8.056640625, -5.9375, -3.818359375, -1.69921875, 0.419921875, 2.5390625, 4.658203125, 6.77734375, 8.896484375, 11.015625, 13.134765625, 15.25390625, 17.373046875, 19.4921875, 21.611328125, 23.73046875, 25.849609375, 27.96875, 30.087890625, 32.20703125, 34.326171875, 36.4453125, 38.564453125, 40.68359375, 42.802734375, 44.921875, 47.041015625, 49.16015625, 51.279296875, 53.3984375, 55.517578125, 57.63671875, 59.755859375, 61.875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 10.0, 347.0, 639.0, 20.0, 0.0, 0.0, 1.0], "bins": [-955.713134765625, -939.5426025390625, -923.3720703125, -907.2015380859375, -891.031005859375, -874.8604736328125, -858.68994140625, -842.5194091796875, -826.348876953125, -810.1783447265625, -794.0078125, -777.8372802734375, -761.666748046875, -745.4962158203125, -729.32568359375, -713.1551513671875, -696.984619140625, -680.8140869140625, -664.6435546875, -648.4730224609375, -632.302490234375, -616.1319580078125, -599.96142578125, -583.7908935546875, -567.6203002929688, -551.4497680664062, -535.2792358398438, -519.1087036132812, -502.93817138671875, -486.76763916015625, -470.59710693359375, -454.42657470703125, -438.2560119628906, -422.0854797363281, -405.9149475097656, -389.7444152832031, -373.5738830566406, -357.4033508300781, -341.2327880859375, -325.062255859375, -308.8917236328125, -292.72119140625, -276.5506591796875, -260.380126953125, -244.2095947265625, -228.0390625, -211.86851501464844, -195.69798278808594, -179.5274658203125, -163.35693359375, -147.1864013671875, -131.015869140625, -114.84532928466797, -98.67479705810547, -82.50425720214844, -66.33372497558594, -50.163185119628906, -33.992652893066406, -17.82211685180664, -1.651580810546875, 14.518951416015625, 30.689483642578125, 46.860023498535156, 63.030555725097656, 79.20108795166016]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 8.0, 16.0, 17.0, 7.0, 13.0, 17.0, 29.0, 22.0, 21.0, 25.0, 31.0, 29.0, 30.0, 41.0, 45.0, 43.0, 40.0, 45.0, 34.0, 42.0, 41.0, 41.0, 34.0, 45.0, 31.0, 32.0, 19.0, 31.0, 19.0, 19.0, 21.0, 18.0, 16.0, 15.0, 12.0, 8.0, 6.0, 6.0, 4.0, 5.0, 5.0, 9.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.43505859375, -46.72454071044922, -45.0140266418457, -43.30350875854492, -41.59299087524414, -39.882476806640625, -38.171958923339844, -36.46144104003906, -34.75092315673828, -33.0404052734375, -31.32988929748535, -29.619373321533203, -27.908855438232422, -26.198339462280273, -24.487823486328125, -22.777305603027344, -21.066791534423828, -19.35627555847168, -17.6457576751709, -15.93524169921875, -14.224724769592285, -12.51420783996582, -10.803691864013672, -9.093174934387207, -7.382658004760742, -5.672141075134277, -3.9616246223449707, -2.251108169555664, -0.5405912399291992, 1.1699256896972656, 2.880441665649414, 4.590958595275879, 6.301475524902344, 8.011992454528809, 9.722509384155273, 11.433025360107422, 13.143542289733887, 14.854059219360352, 16.5645751953125, 18.27509307861328, 19.98560905456543, 21.696125030517578, 23.40664291381836, 25.117158889770508, 26.827674865722656, 28.538192749023438, 30.248708724975586, 31.959224700927734, 33.669742584228516, 35.3802604675293, 37.09077453613281, 38.801292419433594, 40.511810302734375, 42.222328186035156, 43.93284225463867, 45.64336013793945, 47.35387420654297, 49.06439208984375, 50.774906158447266, 52.48542404174805, 54.19594192504883, 55.906455993652344, 57.616973876953125, 59.327491760253906, 61.03800964355469]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 4.0, 7.0, 9.0, 17.0, 13.0, 16.0, 22.0, 17.0, 25.0, 38.0, 29.0, 36.0, 37.0, 38.0, 43.0, 58.0, 47.0, 44.0, 47.0, 55.0, 51.0, 50.0, 38.0, 38.0, 33.0, 27.0, 26.0, 24.0, 19.0, 27.0, 16.0, 12.0, 9.0, 5.0, 9.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.171875, -12.781982421875, -12.39208984375, -12.002197265625, -11.6123046875, -11.222412109375, -10.83251953125, -10.442626953125, -10.052734375, -9.662841796875, -9.27294921875, -8.883056640625, -8.4931640625, -8.103271484375, -7.71337890625, -7.323486328125, -6.93359375, -6.543701171875, -6.15380859375, -5.763916015625, -5.3740234375, -4.984130859375, -4.59423828125, -4.204345703125, -3.814453125, -3.424560546875, -3.03466796875, -2.644775390625, -2.2548828125, -1.864990234375, -1.47509765625, -1.085205078125, -0.6953125, -0.305419921875, 0.08447265625, 0.474365234375, 0.8642578125, 1.254150390625, 1.64404296875, 2.033935546875, 2.423828125, 2.813720703125, 3.20361328125, 3.593505859375, 3.9833984375, 4.373291015625, 4.76318359375, 5.153076171875, 5.54296875, 5.932861328125, 6.32275390625, 6.712646484375, 7.1025390625, 7.492431640625, 7.88232421875, 8.272216796875, 8.662109375, 9.052001953125, 9.44189453125, 9.831787109375, 10.2216796875, 10.611572265625, 11.00146484375, 11.391357421875, 11.78125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 12.0, 16.0, 16.0, 18.0, 34.0, 49.0, 74.0, 114.0, 161.0, 250.0, 294.0, 474.0, 667.0, 883.0, 1306.0, 1933.0, 2638.0, 4054.0, 6149.0, 9040.0, 13995.0, 20733.0, 32112.0, 49117.0, 76438.0, 122291.0, 194058.0, 185837.0, 115655.0, 72732.0, 46896.0, 30442.0, 19860.0, 13222.0, 8711.0, 5776.0, 3817.0, 2733.0, 1792.0, 1255.0, 894.0, 608.0, 397.0, 296.0, 237.0, 138.0, 112.0, 69.0, 50.0, 41.0, 37.0, 20.0, 10.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.501953125, -1.45635986328125, -1.4107666015625, -1.36517333984375, -1.319580078125, -1.27398681640625, -1.2283935546875, -1.18280029296875, -1.13720703125, -1.09161376953125, -1.0460205078125, -1.00042724609375, -0.954833984375, -0.90924072265625, -0.8636474609375, -0.81805419921875, -0.7724609375, -0.72686767578125, -0.6812744140625, -0.63568115234375, -0.590087890625, -0.54449462890625, -0.4989013671875, -0.45330810546875, -0.40771484375, -0.36212158203125, -0.3165283203125, -0.27093505859375, -0.225341796875, -0.17974853515625, -0.1341552734375, -0.08856201171875, -0.04296875, 0.00262451171875, 0.0482177734375, 0.09381103515625, 0.139404296875, 0.18499755859375, 0.2305908203125, 0.27618408203125, 0.32177734375, 0.36737060546875, 0.4129638671875, 0.45855712890625, 0.504150390625, 0.54974365234375, 0.5953369140625, 0.64093017578125, 0.6865234375, 0.73211669921875, 0.7777099609375, 0.82330322265625, 0.868896484375, 0.91448974609375, 0.9600830078125, 1.00567626953125, 1.05126953125, 1.09686279296875, 1.1424560546875, 1.18804931640625, 1.233642578125, 1.27923583984375, 1.3248291015625, 1.37042236328125, 1.416015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 8.0, 5.0, 10.0, 10.0, 11.0, 19.0, 13.0, 18.0, 21.0, 21.0, 26.0, 30.0, 30.0, 31.0, 35.0, 42.0, 36.0, 40.0, 33.0, 1065.0, 38.0, 40.0, 39.0, 41.0, 36.0, 50.0, 28.0, 37.0, 27.0, 24.0, 27.0, 10.0, 17.0, 15.0, 14.0, 10.0, 10.0, 14.0, 16.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.9140625, -5.71533203125, -5.5166015625, -5.31787109375, -5.119140625, -4.92041015625, -4.7216796875, -4.52294921875, -4.32421875, -4.12548828125, -3.9267578125, -3.72802734375, -3.529296875, -3.33056640625, -3.1318359375, -2.93310546875, -2.734375, -2.53564453125, -2.3369140625, -2.13818359375, -1.939453125, -1.74072265625, -1.5419921875, -1.34326171875, -1.14453125, -0.94580078125, -0.7470703125, -0.54833984375, -0.349609375, -0.15087890625, 0.0478515625, 0.24658203125, 0.4453125, 0.64404296875, 0.8427734375, 1.04150390625, 1.240234375, 1.43896484375, 1.6376953125, 1.83642578125, 2.03515625, 2.23388671875, 2.4326171875, 2.63134765625, 2.830078125, 3.02880859375, 3.2275390625, 3.42626953125, 3.625, 3.82373046875, 4.0224609375, 4.22119140625, 4.419921875, 4.61865234375, 4.8173828125, 5.01611328125, 5.21484375, 5.41357421875, 5.6123046875, 5.81103515625, 6.009765625, 6.20849609375, 6.4072265625, 6.60595703125, 6.8046875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 6.0, 3.0, 7.0, 8.0, 15.0, 23.0, 26.0, 51.0, 69.0, 99.0, 160.0, 233.0, 336.0, 477.0, 648.0, 1033.0, 1635.0, 2292.0, 3556.0, 5312.0, 8088.0, 12724.0, 19916.0, 31327.0, 49623.0, 79181.0, 123660.0, 1154455.0, 266695.0, 122198.0, 77339.0, 48870.0, 30911.0, 19822.0, 12677.0, 7944.0, 5230.0, 3567.0, 2269.0, 1517.0, 1024.0, 688.0, 446.0, 324.0, 203.0, 152.0, 86.0, 75.0, 52.0, 32.0, 25.0, 10.0, 14.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3095703125, -1.267303466796875, -1.22503662109375, -1.182769775390625, -1.1405029296875, -1.098236083984375, -1.05596923828125, -1.013702392578125, -0.971435546875, -0.929168701171875, -0.88690185546875, -0.844635009765625, -0.8023681640625, -0.760101318359375, -0.71783447265625, -0.675567626953125, -0.63330078125, -0.591033935546875, -0.54876708984375, -0.506500244140625, -0.4642333984375, -0.421966552734375, -0.37969970703125, -0.337432861328125, -0.295166015625, -0.252899169921875, -0.21063232421875, -0.168365478515625, -0.1260986328125, -0.083831787109375, -0.04156494140625, 0.000701904296875, 0.04296875, 0.085235595703125, 0.12750244140625, 0.169769287109375, 0.2120361328125, 0.254302978515625, 0.29656982421875, 0.338836669921875, 0.381103515625, 0.423370361328125, 0.46563720703125, 0.507904052734375, 0.5501708984375, 0.592437744140625, 0.63470458984375, 0.676971435546875, 0.71923828125, 0.761505126953125, 0.80377197265625, 0.846038818359375, 0.8883056640625, 0.930572509765625, 0.97283935546875, 1.015106201171875, 1.057373046875, 1.099639892578125, 1.14190673828125, 1.184173583984375, 1.2264404296875, 1.268707275390625, 1.31097412109375, 1.353240966796875, 1.3955078125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 6.0, 9.0, 9.0, 10.0, 30.0, 25.0, 27.0, 35.0, 27.0, 42.0, 38.0, 60.0, 63.0, 66.0, 72.0, 70.0, 57.0, 58.0, 53.0, 35.0, 33.0, 28.0, 29.0, 18.0, 24.0, 12.0, 14.0, 8.0, 9.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00247955322265625, -0.0024029910564422607, -0.0023264288902282715, -0.0022498667240142822, -0.002173304557800293, -0.0020967423915863037, -0.0020201802253723145, -0.0019436180591583252, -0.001867055892944336, -0.0017904937267303467, -0.0017139315605163574, -0.0016373693943023682, -0.001560807228088379, -0.0014842450618743896, -0.0014076828956604004, -0.0013311207294464111, -0.0012545585632324219, -0.0011779963970184326, -0.0011014342308044434, -0.001024872064590454, -0.0009483098983764648, -0.0008717477321624756, -0.0007951855659484863, -0.0007186233997344971, -0.0006420612335205078, -0.0005654990673065186, -0.0004889369010925293, -0.00041237473487854004, -0.0003358125686645508, -0.0002592504024505615, -0.00018268823623657227, -0.00010612607002258301, -2.956390380859375e-05, 4.699826240539551e-05, 0.00012356042861938477, 0.00020012259483337402, 0.0002766847610473633, 0.00035324692726135254, 0.0004298090934753418, 0.0005063712596893311, 0.0005829334259033203, 0.0006594955921173096, 0.0007360577583312988, 0.0008126199245452881, 0.0008891820907592773, 0.0009657442569732666, 0.0010423064231872559, 0.0011188685894012451, 0.0011954307556152344, 0.0012719929218292236, 0.0013485550880432129, 0.0014251172542572021, 0.0015016794204711914, 0.0015782415866851807, 0.00165480375289917, 0.0017313659191131592, 0.0018079280853271484, 0.0018844902515411377, 0.001961052417755127, 0.002037614583969116, 0.0021141767501831055, 0.0021907389163970947, 0.002267301082611084, 0.0023438632488250732, 0.0024204254150390625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 8.0, 10.0, 14.0, 14.0, 22.0, 21.0, 28.0, 42.0, 54.0, 71.0, 102.0, 158.0, 253.0, 531.0, 1812.0, 982875.0, 60642.0, 856.0, 380.0, 181.0, 128.0, 77.0, 63.0, 54.0, 32.0, 25.0, 27.0, 10.0, 10.0, 11.0, 10.0, 5.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.060272216796875, -0.05853986740112305, -0.056807518005371094, -0.05507516860961914, -0.05334281921386719, -0.051610469818115234, -0.04987812042236328, -0.04814577102661133, -0.046413421630859375, -0.04468107223510742, -0.04294872283935547, -0.041216373443603516, -0.03948402404785156, -0.03775167465209961, -0.036019325256347656, -0.0342869758605957, -0.03255462646484375, -0.030822277069091797, -0.029089927673339844, -0.02735757827758789, -0.025625228881835938, -0.023892879486083984, -0.02216053009033203, -0.020428180694580078, -0.018695831298828125, -0.016963481903076172, -0.015231132507324219, -0.013498783111572266, -0.011766433715820312, -0.01003408432006836, -0.008301734924316406, -0.006569385528564453, -0.0048370361328125, -0.003104686737060547, -0.0013723373413085938, 0.0003600120544433594, 0.0020923614501953125, 0.0038247108459472656, 0.005557060241699219, 0.007289409637451172, 0.009021759033203125, 0.010754108428955078, 0.012486457824707031, 0.014218807220458984, 0.015951156616210938, 0.01768350601196289, 0.019415855407714844, 0.021148204803466797, 0.02288055419921875, 0.024612903594970703, 0.026345252990722656, 0.02807760238647461, 0.029809951782226562, 0.031542301177978516, 0.03327465057373047, 0.03500699996948242, 0.036739349365234375, 0.03847169876098633, 0.04020404815673828, 0.041936397552490234, 0.04366874694824219, 0.04540109634399414, 0.047133445739746094, 0.04886579513549805, 0.05059814453125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 38.0, 244.0, 482.0, 209.0, 38.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028597526252269745, -0.002674409653991461, -0.002489066682755947, -0.0023037237115204334, -0.0021183807402849197, -0.0019330378854647279, -0.001747695030644536, -0.0015623520594090223, -0.0013770090881735086, -0.001191666116937995, -0.0010063231457024813, -0.0008209802908822894, -0.0006356373196467757, -0.00045029434841126204, -0.0002649514935910702, -7.960852235555649e-05, 0.0001057344488799572, 0.00029107739101164043, 0.00047642033314332366, 0.0006617632461711764, 0.0008471062174066901, 0.0010324491886422038, 0.0012177920434623957, 0.0014031350146979094, 0.001588477985933423, 0.0017738209571689367, 0.0019591639284044504, 0.0021445066668093204, 0.002329849638044834, 0.002515192609280348, 0.0027005355805158615, 0.002885878551751375, 0.003071221522986889, 0.0032565644942224026, 0.0034419074654579163, 0.00362725043669343, 0.0038125934079289436, 0.003997936379164457, 0.004183279350399971, 0.004368621855974197, 0.004553965292870998, 0.004739308264106512, 0.004924651235342026, 0.0051099942065775394, 0.005295337177813053, 0.005480680149048567, 0.0056660231202840805, 0.005851365625858307, 0.006036708597093821, 0.006222051568329334, 0.006407394539564848, 0.006592737510800362, 0.006778080482035875, 0.006963423453271389, 0.007148765958845615, 0.007334109395742416, 0.007519451901316643, 0.0077047948725521564, 0.00789013784378767, 0.008075480349361897, 0.008260823786258698, 0.008446166291832924, 0.008631509728729725, 0.008816852234303951, 0.009002195671200752]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 6.0, 8.0, 8.0, 13.0, 13.0, 7.0, 16.0, 17.0, 24.0, 24.0, 30.0, 32.0, 22.0, 35.0, 42.0, 33.0, 28.0, 34.0, 48.0, 38.0, 48.0, 41.0, 33.0, 39.0, 37.0, 37.0, 32.0, 32.0, 25.0, 24.0, 20.0, 22.0, 24.0, 11.0, 15.0, 16.0, 15.0, 8.0, 4.0, 5.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.0012595653533935547, -0.0012222090736031532, -0.0011848527938127518, -0.0011474965140223503, -0.0011101402342319489, -0.0010727839544415474, -0.001035427674651146, -0.0009980713948607445, -0.000960715115070343, -0.0009233588352799416, -0.0008860025554895401, -0.0008486462756991386, -0.0008112899959087372, -0.0007739337161183357, -0.0007365774363279343, -0.0006992211565375328, -0.0006618648767471313, -0.0006245085969567299, -0.0005871523171663284, -0.000549796037375927, -0.0005124397575855255, -0.00047508347779512405, -0.0004377271980047226, -0.00040037091821432114, -0.0003630146384239197, -0.0003256583586335182, -0.00028830207884311676, -0.0002509457990527153, -0.00021358951926231384, -0.00017623323947191238, -0.00013887695968151093, -0.00010152067989110947, -6.416440010070801e-05, -2.680812031030655e-05, 1.054815948009491e-05, 4.790443927049637e-05, 8.526071906089783e-05, 0.00012261699885129929, 0.00015997327864170074, 0.0001973295584321022, 0.00023468583822250366, 0.0002720421180129051, 0.0003093983978033066, 0.00034675467759370804, 0.0003841109573841095, 0.00042146723717451096, 0.0004588235169649124, 0.0004961797967553139, 0.0005335360765457153, 0.0005708923563361168, 0.0006082486361265182, 0.0006456049159169197, 0.0006829611957073212, 0.0007203174754977226, 0.0007576737552881241, 0.0007950300350785255, 0.000832386314868927, 0.0008697425946593285, 0.0009070988744497299, 0.0009444551542401314, 0.0009818114340305328, 0.0010191677138209343, 0.0010565239936113358, 0.0010938802734017372, 0.0011312365531921387]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 4.0, 7.0, 9.0, 17.0, 13.0, 16.0, 22.0, 17.0, 25.0, 38.0, 29.0, 36.0, 37.0, 38.0, 43.0, 58.0, 47.0, 44.0, 47.0, 55.0, 51.0, 50.0, 38.0, 38.0, 33.0, 27.0, 26.0, 24.0, 19.0, 27.0, 16.0, 12.0, 9.0, 5.0, 9.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.171875, -12.781982421875, -12.39208984375, -12.002197265625, -11.6123046875, -11.222412109375, -10.83251953125, -10.442626953125, -10.052734375, -9.662841796875, -9.27294921875, -8.883056640625, -8.4931640625, -8.103271484375, -7.71337890625, -7.323486328125, -6.93359375, -6.543701171875, -6.15380859375, -5.763916015625, -5.3740234375, -4.984130859375, -4.59423828125, -4.204345703125, -3.814453125, -3.424560546875, -3.03466796875, -2.644775390625, -2.2548828125, -1.864990234375, -1.47509765625, -1.085205078125, -0.6953125, -0.305419921875, 0.08447265625, 0.474365234375, 0.8642578125, 1.254150390625, 1.64404296875, 2.033935546875, 2.423828125, 2.813720703125, 3.20361328125, 3.593505859375, 3.9833984375, 4.373291015625, 4.76318359375, 5.153076171875, 5.54296875, 5.932861328125, 6.32275390625, 6.712646484375, 7.1025390625, 7.492431640625, 7.88232421875, 8.272216796875, 8.662109375, 9.052001953125, 9.44189453125, 9.831787109375, 10.2216796875, 10.611572265625, 11.00146484375, 11.391357421875, 11.78125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 10.0, 16.0, 18.0, 23.0, 29.0, 52.0, 61.0, 75.0, 123.0, 154.0, 324.0, 636.0, 1221.0, 3184.0, 8592.0, 25904.0, 86328.0, 400235.0, 395655.0, 85708.0, 25699.0, 8614.0, 3117.0, 1293.0, 583.0, 299.0, 173.0, 128.0, 78.0, 53.0, 41.0, 38.0, 17.0, 23.0, 6.0, 14.0, 6.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.09375, -16.5909423828125, -16.088134765625, -15.5853271484375, -15.08251953125, -14.5797119140625, -14.076904296875, -13.5740966796875, -13.0712890625, -12.5684814453125, -12.065673828125, -11.5628662109375, -11.06005859375, -10.5572509765625, -10.054443359375, -9.5516357421875, -9.048828125, -8.5460205078125, -8.043212890625, -7.5404052734375, -7.03759765625, -6.5347900390625, -6.031982421875, -5.5291748046875, -5.0263671875, -4.5235595703125, -4.020751953125, -3.5179443359375, -3.01513671875, -2.5123291015625, -2.009521484375, -1.5067138671875, -1.00390625, -0.5010986328125, 0.001708984375, 0.5045166015625, 1.00732421875, 1.5101318359375, 2.012939453125, 2.5157470703125, 3.0185546875, 3.5213623046875, 4.024169921875, 4.5269775390625, 5.02978515625, 5.5325927734375, 6.035400390625, 6.5382080078125, 7.041015625, 7.5438232421875, 8.046630859375, 8.5494384765625, 9.05224609375, 9.5550537109375, 10.057861328125, 10.5606689453125, 11.0634765625, 11.5662841796875, 12.069091796875, 12.5718994140625, 13.07470703125, 13.5775146484375, 14.080322265625, 14.5831298828125, 15.0859375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 10.0, 5.0, 2.0, 9.0, 10.0, 8.0, 8.0, 15.0, 18.0, 17.0, 19.0, 18.0, 22.0, 23.0, 33.0, 28.0, 32.0, 49.0, 47.0, 53.0, 92.0, 178.0, 1580.0, 244.0, 103.0, 69.0, 42.0, 36.0, 28.0, 20.0, 26.0, 24.0, 24.0, 28.0, 16.0, 22.0, 15.0, 18.0, 6.0, 7.0, 10.0, 13.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.7294921875, -23.865234375, -23.0009765625, -22.13671875, -21.2724609375, -20.408203125, -19.5439453125, -18.6796875, -17.8154296875, -16.951171875, -16.0869140625, -15.22265625, -14.3583984375, -13.494140625, -12.6298828125, -11.765625, -10.9013671875, -10.037109375, -9.1728515625, -8.30859375, -7.4443359375, -6.580078125, -5.7158203125, -4.8515625, -3.9873046875, -3.123046875, -2.2587890625, -1.39453125, -0.5302734375, 0.333984375, 1.1982421875, 2.0625, 2.9267578125, 3.791015625, 4.6552734375, 5.51953125, 6.3837890625, 7.248046875, 8.1123046875, 8.9765625, 9.8408203125, 10.705078125, 11.5693359375, 12.43359375, 13.2978515625, 14.162109375, 15.0263671875, 15.890625, 16.7548828125, 17.619140625, 18.4833984375, 19.34765625, 20.2119140625, 21.076171875, 21.9404296875, 22.8046875, 23.6689453125, 24.533203125, 25.3974609375, 26.26171875, 27.1259765625, 27.990234375, 28.8544921875, 29.71875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 9.0, 2.0, 11.0, 18.0, 30.0, 20.0, 36.0, 34.0, 73.0, 64.0, 112.0, 146.0, 198.0, 320.0, 628.0, 2268.0, 26725.0, 2303653.0, 790290.0, 17700.0, 1741.0, 544.0, 283.0, 197.0, 137.0, 107.0, 86.0, 54.0, 43.0, 30.0, 28.0, 19.0, 13.0, 22.0, 10.0, 9.0, 4.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0, -40.5966796875, -39.193359375, -37.7900390625, -36.38671875, -34.9833984375, -33.580078125, -32.1767578125, -30.7734375, -29.3701171875, -27.966796875, -26.5634765625, -25.16015625, -23.7568359375, -22.353515625, -20.9501953125, -19.546875, -18.1435546875, -16.740234375, -15.3369140625, -13.93359375, -12.5302734375, -11.126953125, -9.7236328125, -8.3203125, -6.9169921875, -5.513671875, -4.1103515625, -2.70703125, -1.3037109375, 0.099609375, 1.5029296875, 2.90625, 4.3095703125, 5.712890625, 7.1162109375, 8.51953125, 9.9228515625, 11.326171875, 12.7294921875, 14.1328125, 15.5361328125, 16.939453125, 18.3427734375, 19.74609375, 21.1494140625, 22.552734375, 23.9560546875, 25.359375, 26.7626953125, 28.166015625, 29.5693359375, 30.97265625, 32.3759765625, 33.779296875, 35.1826171875, 36.5859375, 37.9892578125, 39.392578125, 40.7958984375, 42.19921875, 43.6025390625, 45.005859375, 46.4091796875, 47.8125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 212.0, 785.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-571.7947387695312, -561.2528076171875, -550.7108154296875, -540.1688842773438, -529.6268920898438, -519.0849609375, -508.54296875, -498.00103759765625, -487.4590759277344, -476.9171142578125, -466.3751525878906, -455.83319091796875, -445.2912292480469, -434.749267578125, -424.20733642578125, -413.6653747558594, -403.1234130859375, -392.5814514160156, -382.03948974609375, -371.4975280761719, -360.95556640625, -350.41363525390625, -339.87164306640625, -329.3297119140625, -318.7877197265625, -308.2457580566406, -297.70379638671875, -287.1618347167969, -276.619873046875, -266.07794189453125, -255.5359649658203, -244.9940185546875, -234.45208740234375, -223.91012573242188, -213.3681640625, -202.82620239257812, -192.2842559814453, -181.74229431152344, -171.20033264160156, -160.65838623046875, -150.1164093017578, -139.57444763183594, -129.03248596191406, -118.49053192138672, -107.94857788085938, -97.4066162109375, -86.86465454101562, -76.32270050048828, -65.7807388305664, -55.2387809753418, -44.69682312011719, -34.15486145019531, -23.612903594970703, -13.070945739746094, -2.5289840698242188, 8.012969970703125, 18.554931640625, 29.09688949584961, 39.63884735107422, 50.180809020996094, 60.7227668762207, 71.26472473144531, 81.80668640136719, 92.34864044189453, 102.8906021118164]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 12.0, 7.0, 18.0, 10.0, 12.0, 14.0, 17.0, 19.0, 18.0, 29.0, 27.0, 21.0, 39.0, 29.0, 52.0, 28.0, 45.0, 49.0, 42.0, 41.0, 34.0, 36.0, 40.0, 43.0, 39.0, 26.0, 27.0, 31.0, 24.0, 31.0, 17.0, 15.0, 14.0, 14.0, 16.0, 12.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 8.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-67.27494812011719, -65.1795883178711, -63.084232330322266, -60.98887634277344, -58.89352035522461, -56.79816436767578, -54.70280456542969, -52.60744857788086, -50.51209259033203, -48.4167366027832, -46.32137680053711, -44.22602081298828, -42.13066482543945, -40.035308837890625, -37.93994903564453, -35.8445930480957, -33.74923324584961, -31.65387535095215, -29.55851936340332, -27.46316146850586, -25.36780548095703, -23.27244758605957, -21.17708969116211, -19.08173370361328, -16.98637580871582, -14.891018867492676, -12.795661926269531, -10.70030403137207, -8.604947090148926, -6.509590148925781, -4.41423225402832, -2.318875312805176, -0.22351837158203125, 1.8718388080596924, 3.967195987701416, 6.062553405761719, 8.157910346984863, 10.253267288208008, 12.348625183105469, 14.443982124328613, 16.539339065551758, 18.63469696044922, 20.730052947998047, 22.825410842895508, 24.92076873779297, 27.016124725341797, 29.111482620239258, 31.20684051513672, 33.30219650268555, 35.397552490234375, 37.49291229248047, 39.5882682800293, 41.683624267578125, 43.77898406982422, 45.87434005737305, 47.969696044921875, 50.06505584716797, 52.1604118347168, 54.25577163696289, 56.35112762451172, 58.44648361206055, 60.541839599609375, 62.63719940185547, 64.73255920410156, 66.82791137695312]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 4.0, 12.0, 12.0, 11.0, 21.0, 8.0, 34.0, 18.0, 20.0, 30.0, 41.0, 38.0, 35.0, 46.0, 48.0, 39.0, 36.0, 59.0, 50.0, 49.0, 54.0, 47.0, 34.0, 30.0, 34.0, 16.0, 28.0, 28.0, 24.0, 23.0, 9.0, 13.0, 13.0, 5.0, 10.0, 5.0, 4.0, 1.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.3046875, -12.91943359375, -12.5341796875, -12.14892578125, -11.763671875, -11.37841796875, -10.9931640625, -10.60791015625, -10.22265625, -9.83740234375, -9.4521484375, -9.06689453125, -8.681640625, -8.29638671875, -7.9111328125, -7.52587890625, -7.140625, -6.75537109375, -6.3701171875, -5.98486328125, -5.599609375, -5.21435546875, -4.8291015625, -4.44384765625, -4.05859375, -3.67333984375, -3.2880859375, -2.90283203125, -2.517578125, -2.13232421875, -1.7470703125, -1.36181640625, -0.9765625, -0.59130859375, -0.2060546875, 0.17919921875, 0.564453125, 0.94970703125, 1.3349609375, 1.72021484375, 2.10546875, 2.49072265625, 2.8759765625, 3.26123046875, 3.646484375, 4.03173828125, 4.4169921875, 4.80224609375, 5.1875, 5.57275390625, 5.9580078125, 6.34326171875, 6.728515625, 7.11376953125, 7.4990234375, 7.88427734375, 8.26953125, 8.65478515625, 9.0400390625, 9.42529296875, 9.810546875, 10.19580078125, 10.5810546875, 10.96630859375, 11.3515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 10.0, 9.0, 15.0, 12.0, 24.0, 17.0, 21.0, 33.0, 50.0, 72.0, 132.0, 350.0, 1223.0, 4552.0, 26972.0, 791875.0, 3219900.0, 134142.0, 11212.0, 2456.0, 612.0, 245.0, 108.0, 63.0, 37.0, 31.0, 20.0, 15.0, 9.0, 13.0, 13.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.96875, -33.81396484375, -32.6591796875, -31.50439453125, -30.349609375, -29.19482421875, -28.0400390625, -26.88525390625, -25.73046875, -24.57568359375, -23.4208984375, -22.26611328125, -21.111328125, -19.95654296875, -18.8017578125, -17.64697265625, -16.4921875, -15.33740234375, -14.1826171875, -13.02783203125, -11.873046875, -10.71826171875, -9.5634765625, -8.40869140625, -7.25390625, -6.09912109375, -4.9443359375, -3.78955078125, -2.634765625, -1.47998046875, -0.3251953125, 0.82958984375, 1.984375, 3.13916015625, 4.2939453125, 5.44873046875, 6.603515625, 7.75830078125, 8.9130859375, 10.06787109375, 11.22265625, 12.37744140625, 13.5322265625, 14.68701171875, 15.841796875, 16.99658203125, 18.1513671875, 19.30615234375, 20.4609375, 21.61572265625, 22.7705078125, 23.92529296875, 25.080078125, 26.23486328125, 27.3896484375, 28.54443359375, 29.69921875, 30.85400390625, 32.0087890625, 33.16357421875, 34.318359375, 35.47314453125, 36.6279296875, 37.78271484375, 38.9375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 8.0, 9.0, 18.0, 9.0, 15.0, 17.0, 26.0, 37.0, 45.0, 82.0, 101.0, 152.0, 233.0, 394.0, 591.0, 609.0, 611.0, 408.0, 253.0, 144.0, 97.0, 69.0, 42.0, 36.0, 21.0, 16.0, 10.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -24.09326171875, -23.4677734375, -22.84228515625, -22.216796875, -21.59130859375, -20.9658203125, -20.34033203125, -19.71484375, -19.08935546875, -18.4638671875, -17.83837890625, -17.212890625, -16.58740234375, -15.9619140625, -15.33642578125, -14.7109375, -14.08544921875, -13.4599609375, -12.83447265625, -12.208984375, -11.58349609375, -10.9580078125, -10.33251953125, -9.70703125, -9.08154296875, -8.4560546875, -7.83056640625, -7.205078125, -6.57958984375, -5.9541015625, -5.32861328125, -4.703125, -4.07763671875, -3.4521484375, -2.82666015625, -2.201171875, -1.57568359375, -0.9501953125, -0.32470703125, 0.30078125, 0.92626953125, 1.5517578125, 2.17724609375, 2.802734375, 3.42822265625, 4.0537109375, 4.67919921875, 5.3046875, 5.93017578125, 6.5556640625, 7.18115234375, 7.806640625, 8.43212890625, 9.0576171875, 9.68310546875, 10.30859375, 10.93408203125, 11.5595703125, 12.18505859375, 12.810546875, 13.43603515625, 14.0615234375, 14.68701171875, 15.3125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 11.0, 6.0, 9.0, 8.0, 14.0, 17.0, 23.0, 35.0, 54.0, 111.0, 151.0, 279.0, 588.0, 1420.0, 5363.0, 29450.0, 318200.0, 3553644.0, 252934.0, 24811.0, 4632.0, 1308.0, 481.0, 275.0, 153.0, 68.0, 66.0, 44.0, 33.0, 22.0, 16.0, 8.0, 11.0, 14.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.84375, -33.736328125, -32.62890625, -31.521484375, -30.4140625, -29.306640625, -28.19921875, -27.091796875, -25.984375, -24.876953125, -23.76953125, -22.662109375, -21.5546875, -20.447265625, -19.33984375, -18.232421875, -17.125, -16.017578125, -14.91015625, -13.802734375, -12.6953125, -11.587890625, -10.48046875, -9.373046875, -8.265625, -7.158203125, -6.05078125, -4.943359375, -3.8359375, -2.728515625, -1.62109375, -0.513671875, 0.59375, 1.701171875, 2.80859375, 3.916015625, 5.0234375, 6.130859375, 7.23828125, 8.345703125, 9.453125, 10.560546875, 11.66796875, 12.775390625, 13.8828125, 14.990234375, 16.09765625, 17.205078125, 18.3125, 19.419921875, 20.52734375, 21.634765625, 22.7421875, 23.849609375, 24.95703125, 26.064453125, 27.171875, 28.279296875, 29.38671875, 30.494140625, 31.6015625, 32.708984375, 33.81640625, 34.923828125, 36.03125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 22.0, 50.0, 130.0, 226.0, 231.0, 179.0, 103.0, 28.0, 19.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-173.52529907226562, -170.01736450195312, -166.50941467285156, -163.00148010253906, -159.4935302734375, -155.985595703125, -152.47764587402344, -148.96971130371094, -145.46176147460938, -141.95382690429688, -138.4458770751953, -134.9379425048828, -131.42999267578125, -127.92205047607422, -124.41410827636719, -120.90617370605469, -117.39823150634766, -113.89028930664062, -110.3823471069336, -106.87440490722656, -103.36646270751953, -99.8585205078125, -96.3505859375, -92.84263610839844, -89.33470153808594, -85.8267593383789, -82.31881713867188, -78.81087493896484, -75.30293273925781, -71.79499053955078, -68.28704833984375, -64.77911376953125, -61.27117156982422, -57.76322937011719, -54.255287170410156, -50.747344970703125, -47.239402770996094, -43.73146057128906, -40.2235221862793, -36.715579986572266, -33.207637786865234, -29.699695587158203, -26.191753387451172, -22.683813095092773, -19.175870895385742, -15.667928695678711, -12.159988403320312, -8.652046203613281, -5.14410400390625, -1.636162281036377, 1.871779441833496, 5.379720687866211, 8.887662887573242, 12.395605087280273, 15.903545379638672, 19.411487579345703, 22.919429779052734, 26.427371978759766, 29.935314178466797, 33.44325256347656, 36.951194763183594, 40.459136962890625, 43.967079162597656, 47.47502136230469, 50.98296356201172]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 8.0, 4.0, 7.0, 14.0, 12.0, 13.0, 27.0, 26.0, 22.0, 32.0, 30.0, 36.0, 35.0, 43.0, 50.0, 43.0, 47.0, 41.0, 39.0, 44.0, 56.0, 40.0, 40.0, 40.0, 28.0, 32.0, 32.0, 26.0, 21.0, 16.0, 15.0, 17.0, 14.0, 12.0, 10.0, 11.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.31184005737305, -55.43180847167969, -53.551780700683594, -51.671749114990234, -49.79172134399414, -47.91168975830078, -46.03166198730469, -44.15163040161133, -42.27159881591797, -40.39156723022461, -38.511539459228516, -36.631507873535156, -34.75148010253906, -32.8714485168457, -30.991418838500977, -29.11138916015625, -27.231361389160156, -25.35133171081543, -23.471302032470703, -21.591270446777344, -19.71124267578125, -17.83121109008789, -15.951181411743164, -14.071151733398438, -12.191122055053711, -10.311092376708984, -8.431062698364258, -6.551032066345215, -4.671002388000488, -2.7909727096557617, -0.9109420776367188, 0.9690876007080078, 2.8491134643554688, 4.729143142700195, 6.60917329788208, 8.489203453063965, 10.369233131408691, 12.249262809753418, 14.129293441772461, 16.009323120117188, 17.889352798461914, 19.76938247680664, 21.649412155151367, 23.529441833496094, 25.409473419189453, 27.289501190185547, 29.169532775878906, 31.049562454223633, 32.92959213256836, 34.80962371826172, 36.68965148925781, 38.56968307495117, 40.449710845947266, 42.329742431640625, 44.20977020263672, 46.08980178833008, 47.96983337402344, 49.8498649597168, 51.72989273071289, 53.60992431640625, 55.489952087402344, 57.3699836730957, 59.25001525878906, 61.130043029785156, 63.01007080078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 11.0, 4.0, 10.0, 15.0, 13.0, 12.0, 19.0, 28.0, 21.0, 21.0, 33.0, 22.0, 29.0, 32.0, 35.0, 48.0, 44.0, 41.0, 38.0, 48.0, 44.0, 41.0, 44.0, 39.0, 40.0, 28.0, 25.0, 22.0, 29.0, 24.0, 24.0, 19.0, 16.0, 16.0, 12.0, 4.0, 17.0, 6.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.2109375, -10.8543701171875, -10.497802734375, -10.1412353515625, -9.78466796875, -9.4281005859375, -9.071533203125, -8.7149658203125, -8.3583984375, -8.0018310546875, -7.645263671875, -7.2886962890625, -6.93212890625, -6.5755615234375, -6.218994140625, -5.8624267578125, -5.505859375, -5.1492919921875, -4.792724609375, -4.4361572265625, -4.07958984375, -3.7230224609375, -3.366455078125, -3.0098876953125, -2.6533203125, -2.2967529296875, -1.940185546875, -1.5836181640625, -1.22705078125, -0.8704833984375, -0.513916015625, -0.1573486328125, 0.19921875, 0.5557861328125, 0.912353515625, 1.2689208984375, 1.62548828125, 1.9820556640625, 2.338623046875, 2.6951904296875, 3.0517578125, 3.4083251953125, 3.764892578125, 4.1214599609375, 4.47802734375, 4.8345947265625, 5.191162109375, 5.5477294921875, 5.904296875, 6.2608642578125, 6.617431640625, 6.9739990234375, 7.33056640625, 7.6871337890625, 8.043701171875, 8.4002685546875, 8.7568359375, 9.1134033203125, 9.469970703125, 9.8265380859375, 10.18310546875, 10.5396728515625, 10.896240234375, 11.2528076171875, 11.609375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 11.0, 11.0, 17.0, 23.0, 35.0, 55.0, 69.0, 113.0, 153.0, 201.0, 298.0, 464.0, 645.0, 1004.0, 1456.0, 2164.0, 3401.0, 5241.0, 8283.0, 13221.0, 20938.0, 34417.0, 56590.0, 96935.0, 167362.0, 232381.0, 163245.0, 94146.0, 55419.0, 33699.0, 20545.0, 12833.0, 8004.0, 5205.0, 3329.0, 2176.0, 1456.0, 952.0, 658.0, 397.0, 314.0, 237.0, 133.0, 95.0, 75.0, 43.0, 33.0, 26.0, 10.0, 13.0, 10.0, 9.0, 3.0, 2.0, 1.0, 3.0], "bins": [-1.8154296875, -1.761199951171875, -1.70697021484375, -1.652740478515625, -1.5985107421875, -1.544281005859375, -1.49005126953125, -1.435821533203125, -1.381591796875, -1.327362060546875, -1.27313232421875, -1.218902587890625, -1.1646728515625, -1.110443115234375, -1.05621337890625, -1.001983642578125, -0.94775390625, -0.893524169921875, -0.83929443359375, -0.785064697265625, -0.7308349609375, -0.676605224609375, -0.62237548828125, -0.568145751953125, -0.513916015625, -0.459686279296875, -0.40545654296875, -0.351226806640625, -0.2969970703125, -0.242767333984375, -0.18853759765625, -0.134307861328125, -0.080078125, -0.025848388671875, 0.02838134765625, 0.082611083984375, 0.1368408203125, 0.191070556640625, 0.24530029296875, 0.299530029296875, 0.353759765625, 0.407989501953125, 0.46221923828125, 0.516448974609375, 0.5706787109375, 0.624908447265625, 0.67913818359375, 0.733367919921875, 0.78759765625, 0.841827392578125, 0.89605712890625, 0.950286865234375, 1.0045166015625, 1.058746337890625, 1.11297607421875, 1.167205810546875, 1.221435546875, 1.275665283203125, 1.32989501953125, 1.384124755859375, 1.4383544921875, 1.492584228515625, 1.54681396484375, 1.601043701171875, 1.6552734375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 8.0, 1.0, 7.0, 17.0, 5.0, 7.0, 7.0, 19.0, 26.0, 24.0, 35.0, 28.0, 34.0, 28.0, 25.0, 35.0, 38.0, 50.0, 43.0, 42.0, 1072.0, 33.0, 53.0, 60.0, 49.0, 33.0, 35.0, 24.0, 30.0, 29.0, 15.0, 23.0, 17.0, 13.0, 16.0, 10.0, 8.0, 11.0, 3.0, 3.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.578125, -8.3406982421875, -8.103271484375, -7.8658447265625, -7.62841796875, -7.3909912109375, -7.153564453125, -6.9161376953125, -6.6787109375, -6.4412841796875, -6.203857421875, -5.9664306640625, -5.72900390625, -5.4915771484375, -5.254150390625, -5.0167236328125, -4.779296875, -4.5418701171875, -4.304443359375, -4.0670166015625, -3.82958984375, -3.5921630859375, -3.354736328125, -3.1173095703125, -2.8798828125, -2.6424560546875, -2.405029296875, -2.1676025390625, -1.93017578125, -1.6927490234375, -1.455322265625, -1.2178955078125, -0.98046875, -0.7430419921875, -0.505615234375, -0.2681884765625, -0.03076171875, 0.2066650390625, 0.444091796875, 0.6815185546875, 0.9189453125, 1.1563720703125, 1.393798828125, 1.6312255859375, 1.86865234375, 2.1060791015625, 2.343505859375, 2.5809326171875, 2.818359375, 3.0557861328125, 3.293212890625, 3.5306396484375, 3.76806640625, 4.0054931640625, 4.242919921875, 4.4803466796875, 4.7177734375, 4.9552001953125, 5.192626953125, 5.4300537109375, 5.66748046875, 5.9049072265625, 6.142333984375, 6.3797607421875, 6.6171875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 2.0, 3.0, 8.0, 11.0, 12.0, 28.0, 37.0, 48.0, 63.0, 109.0, 160.0, 241.0, 343.0, 548.0, 782.0, 1261.0, 1837.0, 2833.0, 4263.0, 6344.0, 9724.0, 14726.0, 23056.0, 36298.0, 57566.0, 92299.0, 150842.0, 1258960.0, 162509.0, 99884.0, 62108.0, 38855.0, 24959.0, 15996.0, 10350.0, 6841.0, 4432.0, 2888.0, 1942.0, 1294.0, 926.0, 578.0, 361.0, 292.0, 171.0, 121.0, 79.0, 54.0, 35.0, 22.0, 15.0, 8.0, 15.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4296875, -1.3829345703125, -1.336181640625, -1.2894287109375, -1.24267578125, -1.1959228515625, -1.149169921875, -1.1024169921875, -1.0556640625, -1.0089111328125, -0.962158203125, -0.9154052734375, -0.86865234375, -0.8218994140625, -0.775146484375, -0.7283935546875, -0.681640625, -0.6348876953125, -0.588134765625, -0.5413818359375, -0.49462890625, -0.4478759765625, -0.401123046875, -0.3543701171875, -0.3076171875, -0.2608642578125, -0.214111328125, -0.1673583984375, -0.12060546875, -0.0738525390625, -0.027099609375, 0.0196533203125, 0.06640625, 0.1131591796875, 0.159912109375, 0.2066650390625, 0.25341796875, 0.3001708984375, 0.346923828125, 0.3936767578125, 0.4404296875, 0.4871826171875, 0.533935546875, 0.5806884765625, 0.62744140625, 0.6741943359375, 0.720947265625, 0.7677001953125, 0.814453125, 0.8612060546875, 0.907958984375, 0.9547119140625, 1.00146484375, 1.0482177734375, 1.094970703125, 1.1417236328125, 1.1884765625, 1.2352294921875, 1.281982421875, 1.3287353515625, 1.37548828125, 1.4222412109375, 1.468994140625, 1.5157470703125, 1.5625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 3.0, 9.0, 12.0, 9.0, 15.0, 19.0, 31.0, 39.0, 39.0, 60.0, 49.0, 65.0, 54.0, 59.0, 67.0, 63.0, 52.0, 44.0, 54.0, 51.0, 36.0, 27.0, 24.0, 24.0, 12.0, 19.0, 13.0, 6.0, 8.0, 5.0, 3.0, 5.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003002166748046875, -0.002920866012573242, -0.0028395652770996094, -0.0027582645416259766, -0.0026769638061523438, -0.002595663070678711, -0.002514362335205078, -0.0024330615997314453, -0.0023517608642578125, -0.0022704601287841797, -0.002189159393310547, -0.002107858657836914, -0.0020265579223632812, -0.0019452571868896484, -0.0018639564514160156, -0.0017826557159423828, -0.00170135498046875, -0.0016200542449951172, -0.0015387535095214844, -0.0014574527740478516, -0.0013761520385742188, -0.001294851303100586, -0.0012135505676269531, -0.0011322498321533203, -0.0010509490966796875, -0.0009696483612060547, -0.0008883476257324219, -0.0008070468902587891, -0.0007257461547851562, -0.0006444454193115234, -0.0005631446838378906, -0.0004818439483642578, -0.000400543212890625, -0.0003192424774169922, -0.00023794174194335938, -0.00015664100646972656, -7.534027099609375e-05, 5.9604644775390625e-06, 8.726119995117188e-05, 0.0001685619354248047, 0.0002498626708984375, 0.0003311634063720703, 0.0004124641418457031, 0.0004937648773193359, 0.0005750656127929688, 0.0006563663482666016, 0.0007376670837402344, 0.0008189678192138672, 0.0009002685546875, 0.0009815692901611328, 0.0010628700256347656, 0.0011441707611083984, 0.0012254714965820312, 0.001306772232055664, 0.0013880729675292969, 0.0014693737030029297, 0.0015506744384765625, 0.0016319751739501953, 0.0017132759094238281, 0.001794576644897461, 0.0018758773803710938, 0.0019571781158447266, 0.0020384788513183594, 0.002119779586791992, 0.002201080322265625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 8.0, 6.0, 7.0, 22.0, 14.0, 22.0, 23.0, 30.0, 40.0, 51.0, 74.0, 100.0, 119.0, 186.0, 286.0, 551.0, 2066.0, 929521.0, 113110.0, 1043.0, 450.0, 227.0, 152.0, 116.0, 78.0, 70.0, 38.0, 31.0, 15.0, 16.0, 13.0, 12.0, 10.0, 11.0, 5.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045013427734375, -0.0433964729309082, -0.041779518127441406, -0.04016256332397461, -0.03854560852050781, -0.036928653717041016, -0.03531169891357422, -0.03369474411010742, -0.032077789306640625, -0.030460834503173828, -0.02884387969970703, -0.027226924896240234, -0.025609970092773438, -0.02399301528930664, -0.022376060485839844, -0.020759105682373047, -0.01914215087890625, -0.017525196075439453, -0.015908241271972656, -0.01429128646850586, -0.012674331665039062, -0.011057376861572266, -0.009440422058105469, -0.007823467254638672, -0.006206512451171875, -0.004589557647705078, -0.0029726028442382812, -0.0013556480407714844, 0.0002613067626953125, 0.0018782615661621094, 0.0034952163696289062, 0.005112171173095703, 0.0067291259765625, 0.008346080780029297, 0.009963035583496094, 0.01157999038696289, 0.013196945190429688, 0.014813899993896484, 0.01643085479736328, 0.018047809600830078, 0.019664764404296875, 0.021281719207763672, 0.02289867401123047, 0.024515628814697266, 0.026132583618164062, 0.02774953842163086, 0.029366493225097656, 0.030983448028564453, 0.03260040283203125, 0.03421735763549805, 0.035834312438964844, 0.03745126724243164, 0.03906822204589844, 0.040685176849365234, 0.04230213165283203, 0.04391908645629883, 0.045536041259765625, 0.04715299606323242, 0.04876995086669922, 0.050386905670166016, 0.05200386047363281, 0.05362081527709961, 0.055237770080566406, 0.0568547248840332, 0.0584716796875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 23.0, 159.0, 567.0, 231.0, 31.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01107342541217804, -0.010858663357794285, -0.010643900372087955, -0.0104291383177042, -0.010214376263320446, -0.009999613277614117, -0.009784851223230362, -0.009570089168846607, -0.009355326183140278, -0.009140564128756523, -0.008925801143050194, -0.008711039088666439, -0.008496277034282684, -0.008281514048576355, -0.0080667519941926, -0.007851989939808846, -0.0076372274197638035, -0.0074224648997187614, -0.007207702845335007, -0.006992940325289965, -0.006778177805244923, -0.006563415750861168, -0.006348653230816126, -0.006133890710771084, -0.005919128656387329, -0.005704366136342287, -0.005489604081958532, -0.00527484156191349, -0.005060079041868448, -0.004845316521823406, -0.0046305544674396515, -0.0044157919473946095, -0.004201029427349567, -0.003986266907304525, -0.003771504620090127, -0.0035567423328757286, -0.0033419798128306866, -0.003127217525616288, -0.00291245523840189, -0.0026976927183568478, -0.002482930663973093, -0.0022681683767586946, -0.0020534058567136526, -0.0018386435694992542, -0.001623881165869534, -0.0014091187622398138, -0.0011943564750254154, -0.0009795940713956952, -0.000764831667765975, -0.0005500692641362548, -0.0003353069187141955, -0.00012054457329213619, 9.421783033758402e-05, 0.00030898023396730423, 0.0005237425211817026, 0.0007385049248114228, 0.000953267328441143, 0.0011680297320708632, 0.0013827921357005835, 0.0015975544229149818, 0.001812316826544702, 0.0020270792301744223, 0.0022418415173888206, 0.0024566040374338627, 0.002671366324648261]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 4.0, 12.0, 7.0, 10.0, 11.0, 10.0, 19.0, 20.0, 20.0, 19.0, 23.0, 30.0, 39.0, 32.0, 31.0, 38.0, 37.0, 33.0, 39.0, 44.0, 28.0, 29.0, 35.0, 43.0, 34.0, 36.0, 24.0, 34.0, 36.0, 26.0, 35.0, 15.0, 20.0, 18.0, 7.0, 17.0, 14.0, 20.0, 6.0, 5.0, 6.0, 11.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.00114518404006958, -0.0011092368513345718, -0.0010732896625995636, -0.0010373424738645554, -0.0010013952851295471, -0.0009654480963945389, -0.0009295009076595306, -0.0008935537189245224, -0.0008576065301895142, -0.0008216593414545059, -0.0007857121527194977, -0.0007497649639844894, -0.0007138177752494812, -0.000677870586514473, -0.0006419233977794647, -0.0006059762090444565, -0.0005700290203094482, -0.00053408183157444, -0.0004981346428394318, -0.0004621874541044235, -0.0004262402653694153, -0.00039029307663440704, -0.0003543458878993988, -0.00031839869916439056, -0.0002824515104293823, -0.0002465043216943741, -0.00021055713295936584, -0.0001746099442243576, -0.00013866275548934937, -0.00010271556675434113, -6.676837801933289e-05, -3.0821189284324646e-05, 5.125999450683594e-06, 4.1073188185691833e-05, 7.702037692070007e-05, 0.00011296756565570831, 0.00014891475439071655, 0.0001848619431257248, 0.00022080913186073303, 0.00025675632059574127, 0.0002927035093307495, 0.00032865069806575775, 0.000364597886800766, 0.00040054507553577423, 0.00043649226427078247, 0.0004724394530057907, 0.000508386641740799, 0.0005443338304758072, 0.0005802810192108154, 0.0006162282079458237, 0.0006521753966808319, 0.0006881225854158401, 0.0007240697741508484, 0.0007600169628858566, 0.0007959641516208649, 0.0008319113403558731, 0.0008678585290908813, 0.0009038057178258896, 0.0009397529065608978, 0.0009757000952959061, 0.0010116472840309143, 0.0010475944727659225, 0.0010835416615009308, 0.001119488850235939, 0.0011554360389709473]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 11.0, 4.0, 10.0, 15.0, 13.0, 12.0, 19.0, 28.0, 21.0, 21.0, 33.0, 22.0, 29.0, 32.0, 35.0, 48.0, 44.0, 41.0, 38.0, 48.0, 44.0, 41.0, 44.0, 39.0, 40.0, 28.0, 25.0, 22.0, 29.0, 24.0, 24.0, 19.0, 16.0, 16.0, 12.0, 4.0, 17.0, 6.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.2109375, -10.8543701171875, -10.497802734375, -10.1412353515625, -9.78466796875, -9.4281005859375, -9.071533203125, -8.7149658203125, -8.3583984375, -8.0018310546875, -7.645263671875, -7.2886962890625, -6.93212890625, -6.5755615234375, -6.218994140625, -5.8624267578125, -5.505859375, -5.1492919921875, -4.792724609375, -4.4361572265625, -4.07958984375, -3.7230224609375, -3.366455078125, -3.0098876953125, -2.6533203125, -2.2967529296875, -1.940185546875, -1.5836181640625, -1.22705078125, -0.8704833984375, -0.513916015625, -0.1573486328125, 0.19921875, 0.5557861328125, 0.912353515625, 1.2689208984375, 1.62548828125, 1.9820556640625, 2.338623046875, 2.6951904296875, 3.0517578125, 3.4083251953125, 3.764892578125, 4.1214599609375, 4.47802734375, 4.8345947265625, 5.191162109375, 5.5477294921875, 5.904296875, 6.2608642578125, 6.617431640625, 6.9739990234375, 7.33056640625, 7.6871337890625, 8.043701171875, 8.4002685546875, 8.7568359375, 9.1134033203125, 9.469970703125, 9.8265380859375, 10.18310546875, 10.5396728515625, 10.896240234375, 11.2528076171875, 11.609375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 3.0, 22.0, 10.0, 24.0, 23.0, 46.0, 54.0, 80.0, 98.0, 145.0, 241.0, 318.0, 429.0, 620.0, 989.0, 1715.0, 3290.0, 7053.0, 17460.0, 46330.0, 138051.0, 459733.0, 250180.0, 73824.0, 26794.0, 10538.0, 4539.0, 2288.0, 1174.0, 749.0, 487.0, 337.0, 266.0, 191.0, 143.0, 79.0, 70.0, 45.0, 46.0, 19.0, 18.0, 8.0, 4.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.6053466796875, -12.195068359375, -11.7847900390625, -11.37451171875, -10.9642333984375, -10.553955078125, -10.1436767578125, -9.7333984375, -9.3231201171875, -8.912841796875, -8.5025634765625, -8.09228515625, -7.6820068359375, -7.271728515625, -6.8614501953125, -6.451171875, -6.0408935546875, -5.630615234375, -5.2203369140625, -4.81005859375, -4.3997802734375, -3.989501953125, -3.5792236328125, -3.1689453125, -2.7586669921875, -2.348388671875, -1.9381103515625, -1.52783203125, -1.1175537109375, -0.707275390625, -0.2969970703125, 0.11328125, 0.5235595703125, 0.933837890625, 1.3441162109375, 1.75439453125, 2.1646728515625, 2.574951171875, 2.9852294921875, 3.3955078125, 3.8057861328125, 4.216064453125, 4.6263427734375, 5.03662109375, 5.4468994140625, 5.857177734375, 6.2674560546875, 6.677734375, 7.0880126953125, 7.498291015625, 7.9085693359375, 8.31884765625, 8.7291259765625, 9.139404296875, 9.5496826171875, 9.9599609375, 10.3702392578125, 10.780517578125, 11.1907958984375, 11.60107421875, 12.0113525390625, 12.421630859375, 12.8319091796875, 13.2421875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 6.0, 3.0, 5.0, 9.0, 11.0, 18.0, 13.0, 15.0, 15.0, 20.0, 24.0, 24.0, 35.0, 23.0, 27.0, 41.0, 36.0, 50.0, 65.0, 120.0, 310.0, 1564.0, 148.0, 73.0, 53.0, 45.0, 35.0, 29.0, 26.0, 20.0, 31.0, 22.0, 27.0, 20.0, 17.0, 14.0, 9.0, 7.0, 7.0, 9.0, 8.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-27.4375, -26.634765625, -25.83203125, -25.029296875, -24.2265625, -23.423828125, -22.62109375, -21.818359375, -21.015625, -20.212890625, -19.41015625, -18.607421875, -17.8046875, -17.001953125, -16.19921875, -15.396484375, -14.59375, -13.791015625, -12.98828125, -12.185546875, -11.3828125, -10.580078125, -9.77734375, -8.974609375, -8.171875, -7.369140625, -6.56640625, -5.763671875, -4.9609375, -4.158203125, -3.35546875, -2.552734375, -1.75, -0.947265625, -0.14453125, 0.658203125, 1.4609375, 2.263671875, 3.06640625, 3.869140625, 4.671875, 5.474609375, 6.27734375, 7.080078125, 7.8828125, 8.685546875, 9.48828125, 10.291015625, 11.09375, 11.896484375, 12.69921875, 13.501953125, 14.3046875, 15.107421875, 15.91015625, 16.712890625, 17.515625, 18.318359375, 19.12109375, 19.923828125, 20.7265625, 21.529296875, 22.33203125, 23.134765625, 23.9375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 14.0, 14.0, 20.0, 38.0, 27.0, 53.0, 73.0, 96.0, 163.0, 231.0, 369.0, 801.0, 5957.0, 326591.0, 2791882.0, 16797.0, 1247.0, 429.0, 271.0, 176.0, 115.0, 93.0, 60.0, 39.0, 31.0, 25.0, 15.0, 16.0, 9.0, 12.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-61.84375, -60.0849609375, -58.326171875, -56.5673828125, -54.80859375, -53.0498046875, -51.291015625, -49.5322265625, -47.7734375, -46.0146484375, -44.255859375, -42.4970703125, -40.73828125, -38.9794921875, -37.220703125, -35.4619140625, -33.703125, -31.9443359375, -30.185546875, -28.4267578125, -26.66796875, -24.9091796875, -23.150390625, -21.3916015625, -19.6328125, -17.8740234375, -16.115234375, -14.3564453125, -12.59765625, -10.8388671875, -9.080078125, -7.3212890625, -5.5625, -3.8037109375, -2.044921875, -0.2861328125, 1.47265625, 3.2314453125, 4.990234375, 6.7490234375, 8.5078125, 10.2666015625, 12.025390625, 13.7841796875, 15.54296875, 17.3017578125, 19.060546875, 20.8193359375, 22.578125, 24.3369140625, 26.095703125, 27.8544921875, 29.61328125, 31.3720703125, 33.130859375, 34.8896484375, 36.6484375, 38.4072265625, 40.166015625, 41.9248046875, 43.68359375, 45.4423828125, 47.201171875, 48.9599609375, 50.71875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 30.0, 221.0, 497.0, 244.0, 24.0, 1.0, 1.0], "bins": [-249.39454650878906, -245.20701599121094, -241.01947021484375, -236.83193969726562, -232.6444091796875, -228.4568634033203, -224.2693328857422, -220.08180236816406, -215.89425659179688, -211.70672607421875, -207.51918029785156, -203.33164978027344, -199.1441192626953, -194.95657348632812, -190.76904296875, -186.58151245117188, -182.39398193359375, -178.20645141601562, -174.01890563964844, -169.8313751220703, -165.6438446044922, -161.456298828125, -157.26876831054688, -153.08123779296875, -148.89369201660156, -144.70616149902344, -140.51861572265625, -136.33108520507812, -132.1435546875, -127.95600891113281, -123.76847839355469, -119.58094024658203, -115.39338684082031, -111.20584869384766, -107.01831817626953, -102.83078002929688, -98.64324188232422, -94.45570373535156, -90.26817321777344, -86.08063507080078, -81.89310455322266, -77.70556640625, -73.51803588867188, -69.33049774169922, -65.14295959472656, -60.95542526245117, -56.76789093017578, -52.580352783203125, -48.392818450927734, -44.205284118652344, -40.01774597167969, -35.8302116394043, -31.642675399780273, -27.45513916015625, -23.26760482788086, -19.080068588256836, -14.892532348632812, -10.704996109008789, -6.517460823059082, -2.329925537109375, 1.8576107025146484, 6.045146942138672, 10.232681274414062, 14.420217514038086, 18.60775375366211]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 6.0, 10.0, 9.0, 12.0, 15.0, 18.0, 19.0, 34.0, 32.0, 27.0, 36.0, 33.0, 30.0, 32.0, 33.0, 34.0, 33.0, 40.0, 45.0, 41.0, 41.0, 44.0, 34.0, 42.0, 40.0, 30.0, 26.0, 25.0, 20.0, 22.0, 14.0, 14.0, 18.0, 15.0, 12.0, 9.0, 9.0, 7.0, 5.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-62.89476013183594, -61.11080551147461, -59.32685089111328, -57.54289245605469, -55.75893783569336, -53.97498321533203, -52.1910285949707, -50.407073974609375, -48.62311935424805, -46.83916473388672, -45.05521011352539, -43.27125549316406, -41.48729705810547, -39.70334243774414, -37.91938781738281, -36.135433197021484, -34.351478576660156, -32.56752395629883, -30.783567428588867, -28.99961280822754, -27.21565818786621, -25.43170166015625, -23.647747039794922, -21.863792419433594, -20.079833984375, -18.295879364013672, -16.51192283630371, -14.727968215942383, -12.944013595581055, -11.16005802154541, -9.376102447509766, -7.5921478271484375, -5.808193206787109, -4.024238109588623, -2.2402827739715576, -0.4563274383544922, 1.3276276588439941, 3.1115827560424805, 4.895538330078125, 6.679492950439453, 8.463448524475098, 10.247404098510742, 12.03135871887207, 13.815314292907715, 15.59926986694336, 17.383224487304688, 19.167179107666016, 20.951133728027344, 22.735090255737305, 24.519044876098633, 26.303001403808594, 28.086956024169922, 29.87091064453125, 31.654865264892578, 33.438819885253906, 35.2227783203125, 37.00673294067383, 38.790687561035156, 40.574642181396484, 42.35859680175781, 44.142555236816406, 45.926509857177734, 47.71046447753906, 49.49441909790039, 51.27837371826172]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 7.0, 13.0, 14.0, 15.0, 21.0, 23.0, 17.0, 21.0, 29.0, 30.0, 32.0, 37.0, 34.0, 40.0, 35.0, 48.0, 58.0, 55.0, 37.0, 36.0, 46.0, 45.0, 34.0, 33.0, 23.0, 34.0, 30.0, 24.0, 18.0, 29.0, 13.0, 9.0, 11.0, 10.0, 7.0, 7.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.21875, -11.842529296875, -11.46630859375, -11.090087890625, -10.7138671875, -10.337646484375, -9.96142578125, -9.585205078125, -9.208984375, -8.832763671875, -8.45654296875, -8.080322265625, -7.7041015625, -7.327880859375, -6.95166015625, -6.575439453125, -6.19921875, -5.822998046875, -5.44677734375, -5.070556640625, -4.6943359375, -4.318115234375, -3.94189453125, -3.565673828125, -3.189453125, -2.813232421875, -2.43701171875, -2.060791015625, -1.6845703125, -1.308349609375, -0.93212890625, -0.555908203125, -0.1796875, 0.196533203125, 0.57275390625, 0.948974609375, 1.3251953125, 1.701416015625, 2.07763671875, 2.453857421875, 2.830078125, 3.206298828125, 3.58251953125, 3.958740234375, 4.3349609375, 4.711181640625, 5.08740234375, 5.463623046875, 5.83984375, 6.216064453125, 6.59228515625, 6.968505859375, 7.3447265625, 7.720947265625, 8.09716796875, 8.473388671875, 8.849609375, 9.225830078125, 9.60205078125, 9.978271484375, 10.3544921875, 10.730712890625, 11.10693359375, 11.483154296875, 11.859375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 4.0, 4.0, 13.0, 12.0, 13.0, 18.0, 28.0, 27.0, 36.0, 53.0, 62.0, 92.0, 124.0, 188.0, 273.0, 335.0, 461.0, 2908.0, 4186821.0, 1144.0, 477.0, 343.0, 223.0, 165.0, 121.0, 81.0, 62.0, 48.0, 34.0, 28.0, 12.0, 11.0, 22.0, 9.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.5, -279.96875, -270.4375, -260.90625, -251.375, -241.84375, -232.3125, -222.78125, -213.25, -203.71875, -194.1875, -184.65625, -175.125, -165.59375, -156.0625, -146.53125, -137.0, -127.46875, -117.9375, -108.40625, -98.875, -89.34375, -79.8125, -70.28125, -60.75, -51.21875, -41.6875, -32.15625, -22.625, -13.09375, -3.5625, 5.96875, 15.5, 25.03125, 34.5625, 44.09375, 53.625, 63.15625, 72.6875, 82.21875, 91.75, 101.28125, 110.8125, 120.34375, 129.875, 139.40625, 148.9375, 158.46875, 168.0, 177.53125, 187.0625, 196.59375, 206.125, 215.65625, 225.1875, 234.71875, 244.25, 253.78125, 263.3125, 272.84375, 282.375, 291.90625, 301.4375, 310.96875, 320.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 12.0, 16.0, 37.0, 46.0, 66.0, 144.0, 312.0, 771.0, 1212.0, 801.0, 306.0, 157.0, 82.0, 41.0, 35.0, 16.0, 15.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.0, -29.87353515625, -28.7470703125, -27.62060546875, -26.494140625, -25.36767578125, -24.2412109375, -23.11474609375, -21.98828125, -20.86181640625, -19.7353515625, -18.60888671875, -17.482421875, -16.35595703125, -15.2294921875, -14.10302734375, -12.9765625, -11.85009765625, -10.7236328125, -9.59716796875, -8.470703125, -7.34423828125, -6.2177734375, -5.09130859375, -3.96484375, -2.83837890625, -1.7119140625, -0.58544921875, 0.541015625, 1.66748046875, 2.7939453125, 3.92041015625, 5.046875, 6.17333984375, 7.2998046875, 8.42626953125, 9.552734375, 10.67919921875, 11.8056640625, 12.93212890625, 14.05859375, 15.18505859375, 16.3115234375, 17.43798828125, 18.564453125, 19.69091796875, 20.8173828125, 21.94384765625, 23.0703125, 24.19677734375, 25.3232421875, 26.44970703125, 27.576171875, 28.70263671875, 29.8291015625, 30.95556640625, 32.08203125, 33.20849609375, 34.3349609375, 35.46142578125, 36.587890625, 37.71435546875, 38.8408203125, 39.96728515625, 41.09375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 13.0, 12.0, 16.0, 20.0, 20.0, 22.0, 25.0, 34.0, 51.0, 60.0, 70.0, 137.0, 383.0, 5507.0, 4171130.0, 15705.0, 549.0, 156.0, 65.0, 62.0, 40.0, 33.0, 24.0, 22.0, 20.0, 28.0, 17.0, 9.0, 8.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-170.875, -166.072265625, -161.26953125, -156.466796875, -151.6640625, -146.861328125, -142.05859375, -137.255859375, -132.453125, -127.650390625, -122.84765625, -118.044921875, -113.2421875, -108.439453125, -103.63671875, -98.833984375, -94.03125, -89.228515625, -84.42578125, -79.623046875, -74.8203125, -70.017578125, -65.21484375, -60.412109375, -55.609375, -50.806640625, -46.00390625, -41.201171875, -36.3984375, -31.595703125, -26.79296875, -21.990234375, -17.1875, -12.384765625, -7.58203125, -2.779296875, 2.0234375, 6.826171875, 11.62890625, 16.431640625, 21.234375, 26.037109375, 30.83984375, 35.642578125, 40.4453125, 45.248046875, 50.05078125, 54.853515625, 59.65625, 64.458984375, 69.26171875, 74.064453125, 78.8671875, 83.669921875, 88.47265625, 93.275390625, 98.078125, 102.880859375, 107.68359375, 112.486328125, 117.2890625, 122.091796875, 126.89453125, 131.697265625, 136.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 17.0, 40.0, 180.0, 319.0, 301.0, 118.0, 32.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.09324645996094, -121.01203918457031, -115.93083190917969, -110.84961700439453, -105.7684097290039, -100.68720245361328, -95.60598754882812, -90.5247802734375, -85.44357299804688, -80.36236572265625, -75.28115844726562, -70.19994354248047, -65.11873626708984, -60.03752899169922, -54.95631790161133, -49.87510681152344, -44.79389953613281, -39.71269226074219, -34.6314811706543, -29.55027198791504, -24.46906280517578, -19.387853622436523, -14.306644439697266, -9.225433349609375, -4.14422607421875, 0.9369831085205078, 6.018192291259766, 11.099401473999023, 16.18061065673828, 21.26181983947754, 26.343029022216797, 31.424240112304688, 36.50544738769531, 41.58665466308594, 46.66786575317383, 51.74907684326172, 56.830284118652344, 61.91149139404297, 66.99270629882812, 72.07391357421875, 77.15512084960938, 82.236328125, 87.31753540039062, 92.39875030517578, 97.4799575805664, 102.56116485595703, 107.64237976074219, 112.72358703613281, 117.80479431152344, 122.88600158691406, 127.96720886230469, 133.0484161376953, 138.129638671875, 143.21084594726562, 148.29205322265625, 153.37326049804688, 158.4544677734375, 163.53567504882812, 168.61688232421875, 173.69808959960938, 178.779296875, 183.8605194091797, 188.9417266845703, 194.02293395996094, 199.10414123535156]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 10.0, 6.0, 7.0, 13.0, 9.0, 21.0, 24.0, 20.0, 15.0, 35.0, 30.0, 33.0, 44.0, 47.0, 46.0, 34.0, 41.0, 48.0, 51.0, 44.0, 36.0, 37.0, 26.0, 45.0, 39.0, 23.0, 26.0, 28.0, 24.0, 24.0, 24.0, 18.0, 17.0, 10.0, 8.0, 9.0, 8.0, 7.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.21525573730469, -58.28989028930664, -56.364524841308594, -54.43915939331055, -52.5137939453125, -50.58842468261719, -48.66305923461914, -46.737693786621094, -44.81232833862305, -42.886962890625, -40.96159744262695, -39.036231994628906, -37.110862731933594, -35.18550109863281, -33.2601318359375, -31.334766387939453, -29.409400939941406, -27.48403549194336, -25.558670043945312, -23.633302688598633, -21.707937240600586, -19.78257179260254, -17.85720443725586, -15.931838989257812, -14.006473541259766, -12.081108093261719, -10.155741691589355, -8.230375289916992, -6.305009841918945, -4.379644393920898, -2.454277992248535, -0.5289115905761719, 1.396453857421875, 3.32181978225708, 5.247185707092285, 7.17255163192749, 9.097917556762695, 11.023283004760742, 12.948649406433105, 14.874015808105469, 16.799381256103516, 18.724746704101562, 20.65011215209961, 22.57547950744629, 24.500844955444336, 26.426210403442383, 28.351577758789062, 30.27694320678711, 32.202308654785156, 34.1276741027832, 36.05303955078125, 37.9784049987793, 39.903770446777344, 41.829139709472656, 43.7545051574707, 45.67987060546875, 47.6052360534668, 49.530601501464844, 51.45596694946289, 53.38133239746094, 55.30670166015625, 57.23206329345703, 59.157432556152344, 61.08279800415039, 63.00816345214844]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 4.0, 10.0, 7.0, 15.0, 21.0, 15.0, 18.0, 16.0, 25.0, 18.0, 26.0, 20.0, 27.0, 36.0, 24.0, 42.0, 40.0, 53.0, 32.0, 49.0, 33.0, 49.0, 31.0, 31.0, 39.0, 28.0, 27.0, 34.0, 25.0, 28.0, 23.0, 14.0, 19.0, 11.0, 22.0, 15.0, 12.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-9.3046875, -8.9827880859375, -8.660888671875, -8.3389892578125, -8.01708984375, -7.6951904296875, -7.373291015625, -7.0513916015625, -6.7294921875, -6.4075927734375, -6.085693359375, -5.7637939453125, -5.44189453125, -5.1199951171875, -4.798095703125, -4.4761962890625, -4.154296875, -3.8323974609375, -3.510498046875, -3.1885986328125, -2.86669921875, -2.5447998046875, -2.222900390625, -1.9010009765625, -1.5791015625, -1.2572021484375, -0.935302734375, -0.6134033203125, -0.29150390625, 0.0303955078125, 0.352294921875, 0.6741943359375, 0.99609375, 1.3179931640625, 1.639892578125, 1.9617919921875, 2.28369140625, 2.6055908203125, 2.927490234375, 3.2493896484375, 3.5712890625, 3.8931884765625, 4.215087890625, 4.5369873046875, 4.85888671875, 5.1807861328125, 5.502685546875, 5.8245849609375, 6.146484375, 6.4683837890625, 6.790283203125, 7.1121826171875, 7.43408203125, 7.7559814453125, 8.077880859375, 8.3997802734375, 8.7216796875, 9.0435791015625, 9.365478515625, 9.6873779296875, 10.00927734375, 10.3311767578125, 10.653076171875, 10.9749755859375, 11.296875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 10.0, 14.0, 22.0, 30.0, 57.0, 65.0, 120.0, 184.0, 282.0, 457.0, 816.0, 1287.0, 2349.0, 4101.0, 7127.0, 13172.0, 24340.0, 46690.0, 91519.0, 181940.0, 295030.0, 183914.0, 92618.0, 47368.0, 24522.0, 13407.0, 7265.0, 4092.0, 2302.0, 1369.0, 784.0, 479.0, 311.0, 179.0, 104.0, 86.0, 53.0, 28.0, 21.0, 11.0, 7.0, 3.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.09765625, -2.028900146484375, -1.96014404296875, -1.891387939453125, -1.8226318359375, -1.753875732421875, -1.68511962890625, -1.616363525390625, -1.547607421875, -1.478851318359375, -1.41009521484375, -1.341339111328125, -1.2725830078125, -1.203826904296875, -1.13507080078125, -1.066314697265625, -0.99755859375, -0.928802490234375, -0.86004638671875, -0.791290283203125, -0.7225341796875, -0.653778076171875, -0.58502197265625, -0.516265869140625, -0.447509765625, -0.378753662109375, -0.30999755859375, -0.241241455078125, -0.1724853515625, -0.103729248046875, -0.03497314453125, 0.033782958984375, 0.1025390625, 0.171295166015625, 0.24005126953125, 0.308807373046875, 0.3775634765625, 0.446319580078125, 0.51507568359375, 0.583831787109375, 0.652587890625, 0.721343994140625, 0.79010009765625, 0.858856201171875, 0.9276123046875, 0.996368408203125, 1.06512451171875, 1.133880615234375, 1.20263671875, 1.271392822265625, 1.34014892578125, 1.408905029296875, 1.4776611328125, 1.546417236328125, 1.61517333984375, 1.683929443359375, 1.752685546875, 1.821441650390625, 1.89019775390625, 1.958953857421875, 2.0277099609375, 2.096466064453125, 2.16522216796875, 2.233978271484375, 2.302734375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 5.0, 6.0, 7.0, 10.0, 16.0, 11.0, 13.0, 15.0, 26.0, 31.0, 35.0, 41.0, 34.0, 33.0, 47.0, 37.0, 45.0, 50.0, 1078.0, 40.0, 48.0, 57.0, 45.0, 22.0, 42.0, 39.0, 38.0, 28.0, 28.0, 29.0, 14.0, 10.0, 10.0, 8.0, 10.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.641845703125, -7.37744140625, -7.113037109375, -6.8486328125, -6.584228515625, -6.31982421875, -6.055419921875, -5.791015625, -5.526611328125, -5.26220703125, -4.997802734375, -4.7333984375, -4.468994140625, -4.20458984375, -3.940185546875, -3.67578125, -3.411376953125, -3.14697265625, -2.882568359375, -2.6181640625, -2.353759765625, -2.08935546875, -1.824951171875, -1.560546875, -1.296142578125, -1.03173828125, -0.767333984375, -0.5029296875, -0.238525390625, 0.02587890625, 0.290283203125, 0.5546875, 0.819091796875, 1.08349609375, 1.347900390625, 1.6123046875, 1.876708984375, 2.14111328125, 2.405517578125, 2.669921875, 2.934326171875, 3.19873046875, 3.463134765625, 3.7275390625, 3.991943359375, 4.25634765625, 4.520751953125, 4.78515625, 5.049560546875, 5.31396484375, 5.578369140625, 5.8427734375, 6.107177734375, 6.37158203125, 6.635986328125, 6.900390625, 7.164794921875, 7.42919921875, 7.693603515625, 7.9580078125, 8.222412109375, 8.48681640625, 8.751220703125, 9.015625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 9.0, 16.0, 20.0, 34.0, 38.0, 68.0, 139.0, 184.0, 341.0, 539.0, 918.0, 1512.0, 2420.0, 4053.0, 6998.0, 11793.0, 19922.0, 34904.0, 60925.0, 109274.0, 197086.0, 1301775.0, 149166.0, 83046.0, 46597.0, 26851.0, 15618.0, 9292.0, 5538.0, 3249.0, 1912.0, 1125.0, 674.0, 443.0, 230.0, 166.0, 94.0, 52.0, 47.0, 29.0, 12.0, 10.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8974609375, -1.838653564453125, -1.77984619140625, -1.721038818359375, -1.6622314453125, -1.603424072265625, -1.54461669921875, -1.485809326171875, -1.427001953125, -1.368194580078125, -1.30938720703125, -1.250579833984375, -1.1917724609375, -1.132965087890625, -1.07415771484375, -1.015350341796875, -0.95654296875, -0.897735595703125, -0.83892822265625, -0.780120849609375, -0.7213134765625, -0.662506103515625, -0.60369873046875, -0.544891357421875, -0.486083984375, -0.427276611328125, -0.36846923828125, -0.309661865234375, -0.2508544921875, -0.192047119140625, -0.13323974609375, -0.074432373046875, -0.015625, 0.043182373046875, 0.10198974609375, 0.160797119140625, 0.2196044921875, 0.278411865234375, 0.33721923828125, 0.396026611328125, 0.454833984375, 0.513641357421875, 0.57244873046875, 0.631256103515625, 0.6900634765625, 0.748870849609375, 0.80767822265625, 0.866485595703125, 0.92529296875, 0.984100341796875, 1.04290771484375, 1.101715087890625, 1.1605224609375, 1.219329833984375, 1.27813720703125, 1.336944580078125, 1.395751953125, 1.454559326171875, 1.51336669921875, 1.572174072265625, 1.6309814453125, 1.689788818359375, 1.74859619140625, 1.807403564453125, 1.8662109375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 11.0, 13.0, 17.0, 13.0, 26.0, 18.0, 27.0, 43.0, 50.0, 66.0, 62.0, 78.0, 83.0, 65.0, 76.0, 74.0, 46.0, 40.0, 40.0, 27.0, 29.0, 12.0, 13.0, 10.0, 8.0, 12.0, 8.0, 4.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002712249755859375, -0.0026206672191619873, -0.0025290846824645996, -0.002437502145767212, -0.0023459196090698242, -0.0022543370723724365, -0.002162754535675049, -0.002071171998977661, -0.0019795894622802734, -0.0018880069255828857, -0.001796424388885498, -0.0017048418521881104, -0.0016132593154907227, -0.001521676778793335, -0.0014300942420959473, -0.0013385117053985596, -0.0012469291687011719, -0.0011553466320037842, -0.0010637640953063965, -0.0009721815586090088, -0.0008805990219116211, -0.0007890164852142334, -0.0006974339485168457, -0.000605851411819458, -0.0005142688751220703, -0.0004226863384246826, -0.0003311038017272949, -0.00023952126502990723, -0.00014793872833251953, -5.6356191635131836e-05, 3.522634506225586e-05, 0.00012680888175964355, 0.00021839141845703125, 0.00030997395515441895, 0.00040155649185180664, 0.0004931390285491943, 0.000584721565246582, 0.0006763041019439697, 0.0007678866386413574, 0.0008594691753387451, 0.0009510517120361328, 0.0010426342487335205, 0.0011342167854309082, 0.001225799322128296, 0.0013173818588256836, 0.0014089643955230713, 0.001500546932220459, 0.0015921294689178467, 0.0016837120056152344, 0.001775294542312622, 0.0018668770790100098, 0.0019584596157073975, 0.002050042152404785, 0.002141624689102173, 0.0022332072257995605, 0.0023247897624969482, 0.002416372299194336, 0.0025079548358917236, 0.0025995373725891113, 0.002691119909286499, 0.0027827024459838867, 0.0028742849826812744, 0.002965867519378662, 0.00305745005607605, 0.0031490325927734375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 4.0, 7.0, 8.0, 6.0, 5.0, 10.0, 24.0, 14.0, 26.0, 22.0, 41.0, 63.0, 82.0, 102.0, 152.0, 217.0, 376.0, 617.0, 1405.0, 584950.0, 457275.0, 1401.0, 610.0, 358.0, 208.0, 143.0, 98.0, 72.0, 73.0, 46.0, 31.0, 33.0, 15.0, 8.0, 7.0, 5.0, 3.0, 3.0, 5.0, 4.0, 4.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.053497314453125, -0.05196809768676758, -0.050438880920410156, -0.048909664154052734, -0.04738044738769531, -0.04585123062133789, -0.04432201385498047, -0.04279279708862305, -0.041263580322265625, -0.0397343635559082, -0.03820514678955078, -0.03667593002319336, -0.03514671325683594, -0.033617496490478516, -0.032088279724121094, -0.030559062957763672, -0.02902984619140625, -0.027500629425048828, -0.025971412658691406, -0.024442195892333984, -0.022912979125976562, -0.02138376235961914, -0.01985454559326172, -0.018325328826904297, -0.016796112060546875, -0.015266895294189453, -0.013737678527832031, -0.01220846176147461, -0.010679244995117188, -0.009150028228759766, -0.007620811462402344, -0.006091594696044922, -0.0045623779296875, -0.003033161163330078, -0.0015039443969726562, 2.5272369384765625e-05, 0.0015544891357421875, 0.0030837059020996094, 0.004612922668457031, 0.006142139434814453, 0.007671356201171875, 0.009200572967529297, 0.010729789733886719, 0.01225900650024414, 0.013788223266601562, 0.015317440032958984, 0.016846656799316406, 0.018375873565673828, 0.01990509033203125, 0.021434307098388672, 0.022963523864746094, 0.024492740631103516, 0.026021957397460938, 0.02755117416381836, 0.02908039093017578, 0.030609607696533203, 0.032138824462890625, 0.03366804122924805, 0.03519725799560547, 0.03672647476196289, 0.03825569152832031, 0.039784908294677734, 0.041314125061035156, 0.04284334182739258, 0.04437255859375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 100.0, 471.0, 371.0, 58.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008021735586225986, -0.007834665477275848, -0.007647596299648285, -0.007460526656359434, -0.007273457013070583, -0.007086386904120445, -0.0068993172608315945, -0.006712247617542744, -0.006525177974253893, -0.006338108330965042, -0.006151038687676191, -0.0059639690443873405, -0.0057768989354372025, -0.005589829292148352, -0.005402759648859501, -0.00521569000557065, -0.005028620362281799, -0.0048415507189929485, -0.004654481075704098, -0.004467411432415247, -0.004280341789126396, -0.004093271680176258, -0.0039062020368874073, -0.0037191323935985565, -0.0035320627503097057, -0.003344993107020855, -0.003157923463732004, -0.0029708535876125097, -0.002783783944323659, -0.002596714301034808, -0.0024096444249153137, -0.002222574781626463, -0.002035504672676325, -0.001848435029387474, -0.0016613652696833014, -0.0014742955099791288, -0.001287225866690278, -0.0011001562234014273, -0.0009130864636972547, -0.000726016703993082, -0.0005389470607042313, -0.00035187735920771956, -0.00016480765771120787, 2.226204378530383e-05, 0.00020933174528181553, 0.0003964014467783272, 0.0005834711482748389, 0.0007705409079790115, 0.0009576105512678623, 0.001144680194556713, 0.0013317499542608857, 0.0015188197139650583, 0.0017058893572539091, 0.00189295900054276, 0.0020800288766622543, 0.002267098519951105, 0.002454168163239956, 0.0026412378065288067, 0.0028283074498176575, 0.003015377325937152, 0.0032024469692260027, 0.0033895166125148535, 0.003576586488634348, 0.0037636561319231987, 0.0039507257752120495]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 6.0, 8.0, 6.0, 10.0, 14.0, 15.0, 8.0, 18.0, 24.0, 19.0, 28.0, 31.0, 36.0, 40.0, 50.0, 36.0, 48.0, 54.0, 52.0, 61.0, 47.0, 42.0, 44.0, 35.0, 35.0, 35.0, 36.0, 26.0, 25.0, 13.0, 22.0, 10.0, 15.0, 14.0, 7.0, 10.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00129777193069458, -0.0012513287365436554, -0.0012048855423927307, -0.001158442348241806, -0.0011119991540908813, -0.0010655559599399567, -0.001019112765789032, -0.0009726695716381073, -0.0009262263774871826, -0.0008797831833362579, -0.0008333399891853333, -0.0007868967950344086, -0.0007404536008834839, -0.0006940104067325592, -0.0006475672125816345, -0.0006011240184307098, -0.0005546808242797852, -0.0005082376301288605, -0.0004617944359779358, -0.0004153512418270111, -0.0003689080476760864, -0.00032246485352516174, -0.00027602165937423706, -0.00022957846522331238, -0.0001831352710723877, -0.000136692076921463, -9.024888277053833e-05, -4.380568861961365e-05, 2.637505531311035e-06, 4.908069968223572e-05, 9.55238938331604e-05, 0.00014196708798408508, 0.00018841028213500977, 0.00023485347628593445, 0.00028129667043685913, 0.0003277398645877838, 0.0003741830587387085, 0.0004206262528896332, 0.00046706944704055786, 0.0005135126411914825, 0.0005599558353424072, 0.0006063990294933319, 0.0006528422236442566, 0.0006992854177951813, 0.000745728611946106, 0.0007921718060970306, 0.0008386150002479553, 0.00088505819439888, 0.0009315013885498047, 0.0009779445827007294, 0.001024387776851654, 0.0010708309710025787, 0.0011172741651535034, 0.001163717359304428, 0.0012101605534553528, 0.0012566037476062775, 0.0013030469417572021, 0.0013494901359081268, 0.0013959333300590515, 0.0014423765242099762, 0.0014888197183609009, 0.0015352629125118256, 0.0015817061066627502, 0.001628149300813675, 0.0016745924949645996]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 4.0, 10.0, 7.0, 15.0, 21.0, 15.0, 18.0, 16.0, 25.0, 18.0, 26.0, 20.0, 27.0, 36.0, 24.0, 42.0, 40.0, 53.0, 32.0, 49.0, 33.0, 49.0, 31.0, 31.0, 39.0, 28.0, 27.0, 34.0, 25.0, 28.0, 23.0, 14.0, 19.0, 11.0, 22.0, 15.0, 12.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-9.3046875, -8.9827880859375, -8.660888671875, -8.3389892578125, -8.01708984375, -7.6951904296875, -7.373291015625, -7.0513916015625, -6.7294921875, -6.4075927734375, -6.085693359375, -5.7637939453125, -5.44189453125, -5.1199951171875, -4.798095703125, -4.4761962890625, -4.154296875, -3.8323974609375, -3.510498046875, -3.1885986328125, -2.86669921875, -2.5447998046875, -2.222900390625, -1.9010009765625, -1.5791015625, -1.2572021484375, -0.935302734375, -0.6134033203125, -0.29150390625, 0.0303955078125, 0.352294921875, 0.6741943359375, 0.99609375, 1.3179931640625, 1.639892578125, 1.9617919921875, 2.28369140625, 2.6055908203125, 2.927490234375, 3.2493896484375, 3.5712890625, 3.8931884765625, 4.215087890625, 4.5369873046875, 4.85888671875, 5.1807861328125, 5.502685546875, 5.8245849609375, 6.146484375, 6.4683837890625, 6.790283203125, 7.1121826171875, 7.43408203125, 7.7559814453125, 8.077880859375, 8.3997802734375, 8.7216796875, 9.0435791015625, 9.365478515625, 9.6873779296875, 10.00927734375, 10.3311767578125, 10.653076171875, 10.9749755859375, 11.296875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 8.0, 7.0, 12.0, 12.0, 19.0, 23.0, 40.0, 44.0, 56.0, 99.0, 94.0, 150.0, 196.0, 298.0, 377.0, 443.0, 612.0, 819.0, 1154.0, 1891.0, 4145.0, 14035.0, 71630.0, 419636.0, 433038.0, 74598.0, 14326.0, 4291.0, 2002.0, 1165.0, 851.0, 598.0, 466.0, 388.0, 266.0, 179.0, 157.0, 106.0, 83.0, 71.0, 46.0, 29.0, 22.0, 17.0, 19.0, 10.0, 10.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-18.609375, -18.00927734375, -17.4091796875, -16.80908203125, -16.208984375, -15.60888671875, -15.0087890625, -14.40869140625, -13.80859375, -13.20849609375, -12.6083984375, -12.00830078125, -11.408203125, -10.80810546875, -10.2080078125, -9.60791015625, -9.0078125, -8.40771484375, -7.8076171875, -7.20751953125, -6.607421875, -6.00732421875, -5.4072265625, -4.80712890625, -4.20703125, -3.60693359375, -3.0068359375, -2.40673828125, -1.806640625, -1.20654296875, -0.6064453125, -0.00634765625, 0.59375, 1.19384765625, 1.7939453125, 2.39404296875, 2.994140625, 3.59423828125, 4.1943359375, 4.79443359375, 5.39453125, 5.99462890625, 6.5947265625, 7.19482421875, 7.794921875, 8.39501953125, 8.9951171875, 9.59521484375, 10.1953125, 10.79541015625, 11.3955078125, 11.99560546875, 12.595703125, 13.19580078125, 13.7958984375, 14.39599609375, 14.99609375, 15.59619140625, 16.1962890625, 16.79638671875, 17.396484375, 17.99658203125, 18.5966796875, 19.19677734375, 19.796875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 4.0, 6.0, 2.0, 7.0, 11.0, 11.0, 17.0, 19.0, 16.0, 21.0, 26.0, 26.0, 31.0, 38.0, 43.0, 54.0, 80.0, 107.0, 404.0, 1504.0, 126.0, 73.0, 55.0, 58.0, 42.0, 40.0, 32.0, 23.0, 25.0, 35.0, 17.0, 23.0, 11.0, 14.0, 6.0, 10.0, 5.0, 2.0, 7.0, 4.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-31.046875, -30.1611328125, -29.275390625, -28.3896484375, -27.50390625, -26.6181640625, -25.732421875, -24.8466796875, -23.9609375, -23.0751953125, -22.189453125, -21.3037109375, -20.41796875, -19.5322265625, -18.646484375, -17.7607421875, -16.875, -15.9892578125, -15.103515625, -14.2177734375, -13.33203125, -12.4462890625, -11.560546875, -10.6748046875, -9.7890625, -8.9033203125, -8.017578125, -7.1318359375, -6.24609375, -5.3603515625, -4.474609375, -3.5888671875, -2.703125, -1.8173828125, -0.931640625, -0.0458984375, 0.83984375, 1.7255859375, 2.611328125, 3.4970703125, 4.3828125, 5.2685546875, 6.154296875, 7.0400390625, 7.92578125, 8.8115234375, 9.697265625, 10.5830078125, 11.46875, 12.3544921875, 13.240234375, 14.1259765625, 15.01171875, 15.8974609375, 16.783203125, 17.6689453125, 18.5546875, 19.4404296875, 20.326171875, 21.2119140625, 22.09765625, 22.9833984375, 23.869140625, 24.7548828125, 25.640625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 7.0, 9.0, 7.0, 9.0, 14.0, 13.0, 9.0, 17.0, 23.0, 25.0, 36.0, 42.0, 53.0, 87.0, 140.0, 194.0, 356.0, 585.0, 1367.0, 52055.0, 3085553.0, 3103.0, 830.0, 412.0, 226.0, 151.0, 107.0, 58.0, 43.0, 45.0, 32.0, 15.0, 10.0, 9.0, 10.0, 6.0, 10.0, 6.0, 6.0, 3.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-115.875, -112.7646484375, -109.654296875, -106.5439453125, -103.43359375, -100.3232421875, -97.212890625, -94.1025390625, -90.9921875, -87.8818359375, -84.771484375, -81.6611328125, -78.55078125, -75.4404296875, -72.330078125, -69.2197265625, -66.109375, -62.9990234375, -59.888671875, -56.7783203125, -53.66796875, -50.5576171875, -47.447265625, -44.3369140625, -41.2265625, -38.1162109375, -35.005859375, -31.8955078125, -28.78515625, -25.6748046875, -22.564453125, -19.4541015625, -16.34375, -13.2333984375, -10.123046875, -7.0126953125, -3.90234375, -0.7919921875, 2.318359375, 5.4287109375, 8.5390625, 11.6494140625, 14.759765625, 17.8701171875, 20.98046875, 24.0908203125, 27.201171875, 30.3115234375, 33.421875, 36.5322265625, 39.642578125, 42.7529296875, 45.86328125, 48.9736328125, 52.083984375, 55.1943359375, 58.3046875, 61.4150390625, 64.525390625, 67.6357421875, 70.74609375, 73.8564453125, 76.966796875, 80.0771484375, 83.1875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 50.0, 329.0, 527.0, 104.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.00137329101562, -148.02281188964844, -141.0442352294922, -134.065673828125, -127.08710479736328, -120.10853576660156, -113.12997436523438, -106.15140533447266, -99.17283630371094, -92.19426727294922, -85.21570587158203, -78.23713684082031, -71.2585678100586, -64.27999877929688, -57.30143737792969, -50.32286834716797, -43.34430694580078, -36.36574172973633, -29.38717269897461, -22.408607482910156, -15.43004035949707, -8.451473236083984, -1.4729080200195312, 5.5056610107421875, 12.48422622680664, 19.462793350219727, 26.441360473632812, 33.419925689697266, 40.39849090576172, 47.37705993652344, 54.35562515258789, 61.33419418334961, 68.31275939941406, 75.29132843017578, 82.26988983154297, 89.24845886230469, 96.2270278930664, 103.20559692382812, 110.18415832519531, 117.16272735595703, 124.14129638671875, 131.11985778808594, 138.0984344482422, 145.07699584960938, 152.05555725097656, 159.0341339111328, 166.0126953125, 172.99127197265625, 179.96981811523438, 186.94837951660156, 193.9269561767578, 200.905517578125, 207.8840789794922, 214.86265563964844, 221.84121704101562, 228.81979370117188, 235.79835510253906, 242.77691650390625, 249.7554931640625, 256.73406982421875, 263.7126159667969, 270.6911926269531, 277.66973876953125, 284.6483154296875, 291.62689208984375]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 16.0, 8.0, 18.0, 9.0, 20.0, 28.0, 16.0, 25.0, 21.0, 28.0, 38.0, 26.0, 30.0, 42.0, 48.0, 43.0, 47.0, 36.0, 43.0, 40.0, 34.0, 37.0, 29.0, 40.0, 34.0, 31.0, 29.0, 30.0, 14.0, 18.0, 10.0, 20.0, 15.0, 6.0, 4.0, 4.0, 6.0, 7.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-77.30536651611328, -75.1236343383789, -72.94190979003906, -70.76017761230469, -68.57844543457031, -66.39671325683594, -64.2149887084961, -62.03325653076172, -59.851524353027344, -57.669795989990234, -55.48806381225586, -53.30633544921875, -51.124603271484375, -48.942874908447266, -46.761146545410156, -44.57941436767578, -42.39768600463867, -40.21595764160156, -38.03422546386719, -35.85249710083008, -33.6707649230957, -31.489036560058594, -29.30730628967285, -27.12557601928711, -24.943845748901367, -22.762115478515625, -20.580385208129883, -18.39865493774414, -16.21692657470703, -14.035195350646973, -11.853466033935547, -9.671735763549805, -7.4900054931640625, -5.30827522277832, -3.1265454292297363, -0.9448156356811523, 1.2369146347045898, 3.418644905090332, 5.600374221801758, 7.7821044921875, 9.963834762573242, 12.145565032958984, 14.327295303344727, 16.50902557373047, 18.690753936767578, 20.872486114501953, 23.054214477539062, 25.235944747924805, 27.417675018310547, 29.59940528869629, 31.78113555908203, 33.96286392211914, 36.144596099853516, 38.326324462890625, 40.508056640625, 42.68978500366211, 44.87151336669922, 47.05324172973633, 49.2349739074707, 51.41670227050781, 53.59843444824219, 55.7801628112793, 57.961891174316406, 60.14362335205078, 62.325355529785156]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 6.0, 5.0, 3.0, 8.0, 13.0, 17.0, 17.0, 17.0, 20.0, 19.0, 28.0, 25.0, 42.0, 27.0, 34.0, 40.0, 37.0, 35.0, 47.0, 54.0, 38.0, 36.0, 49.0, 41.0, 34.0, 27.0, 33.0, 33.0, 40.0, 24.0, 20.0, 18.0, 17.0, 15.0, 15.0, 12.0, 12.0, 8.0, 10.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.53125, -9.181396484375, -8.83154296875, -8.481689453125, -8.1318359375, -7.781982421875, -7.43212890625, -7.082275390625, -6.732421875, -6.382568359375, -6.03271484375, -5.682861328125, -5.3330078125, -4.983154296875, -4.63330078125, -4.283447265625, -3.93359375, -3.583740234375, -3.23388671875, -2.884033203125, -2.5341796875, -2.184326171875, -1.83447265625, -1.484619140625, -1.134765625, -0.784912109375, -0.43505859375, -0.085205078125, 0.2646484375, 0.614501953125, 0.96435546875, 1.314208984375, 1.6640625, 2.013916015625, 2.36376953125, 2.713623046875, 3.0634765625, 3.413330078125, 3.76318359375, 4.113037109375, 4.462890625, 4.812744140625, 5.16259765625, 5.512451171875, 5.8623046875, 6.212158203125, 6.56201171875, 6.911865234375, 7.26171875, 7.611572265625, 7.96142578125, 8.311279296875, 8.6611328125, 9.010986328125, 9.36083984375, 9.710693359375, 10.060546875, 10.410400390625, 10.76025390625, 11.110107421875, 11.4599609375, 11.809814453125, 12.15966796875, 12.509521484375, 12.859375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 8.0, 10.0, 10.0, 17.0, 19.0, 18.0, 36.0, 39.0, 43.0, 68.0, 83.0, 105.0, 172.0, 266.0, 453.0, 1136.0, 3186.0, 15300.0, 227280.0, 2921422.0, 975070.0, 39895.0, 6127.0, 1786.0, 663.0, 333.0, 204.0, 131.0, 93.0, 61.0, 59.0, 43.0, 34.0, 25.0, 18.0, 12.0, 16.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-32.53125, -31.566650390625, -30.60205078125, -29.637451171875, -28.6728515625, -27.708251953125, -26.74365234375, -25.779052734375, -24.814453125, -23.849853515625, -22.88525390625, -21.920654296875, -20.9560546875, -19.991455078125, -19.02685546875, -18.062255859375, -17.09765625, -16.133056640625, -15.16845703125, -14.203857421875, -13.2392578125, -12.274658203125, -11.31005859375, -10.345458984375, -9.380859375, -8.416259765625, -7.45166015625, -6.487060546875, -5.5224609375, -4.557861328125, -3.59326171875, -2.628662109375, -1.6640625, -0.699462890625, 0.26513671875, 1.229736328125, 2.1943359375, 3.158935546875, 4.12353515625, 5.088134765625, 6.052734375, 7.017333984375, 7.98193359375, 8.946533203125, 9.9111328125, 10.875732421875, 11.84033203125, 12.804931640625, 13.76953125, 14.734130859375, 15.69873046875, 16.663330078125, 17.6279296875, 18.592529296875, 19.55712890625, 20.521728515625, 21.486328125, 22.450927734375, 23.41552734375, 24.380126953125, 25.3447265625, 26.309326171875, 27.27392578125, 28.238525390625, 29.203125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 12.0, 19.0, 21.0, 45.0, 66.0, 73.0, 60.0, 113.0, 145.0, 214.0, 289.0, 481.0, 653.0, 559.0, 401.0, 271.0, 170.0, 118.0, 92.0, 57.0, 55.0, 42.0, 32.0, 16.0, 10.0, 18.0, 9.0, 10.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-25.953125, -25.283203125, -24.61328125, -23.943359375, -23.2734375, -22.603515625, -21.93359375, -21.263671875, -20.59375, -19.923828125, -19.25390625, -18.583984375, -17.9140625, -17.244140625, -16.57421875, -15.904296875, -15.234375, -14.564453125, -13.89453125, -13.224609375, -12.5546875, -11.884765625, -11.21484375, -10.544921875, -9.875, -9.205078125, -8.53515625, -7.865234375, -7.1953125, -6.525390625, -5.85546875, -5.185546875, -4.515625, -3.845703125, -3.17578125, -2.505859375, -1.8359375, -1.166015625, -0.49609375, 0.173828125, 0.84375, 1.513671875, 2.18359375, 2.853515625, 3.5234375, 4.193359375, 4.86328125, 5.533203125, 6.203125, 6.873046875, 7.54296875, 8.212890625, 8.8828125, 9.552734375, 10.22265625, 10.892578125, 11.5625, 12.232421875, 12.90234375, 13.572265625, 14.2421875, 14.912109375, 15.58203125, 16.251953125, 16.921875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 11.0, 23.0, 42.0, 71.0, 114.0, 257.0, 652.0, 2369.0, 32903.0, 4035404.0, 117573.0, 3360.0, 865.0, 293.0, 152.0, 74.0, 48.0, 23.0, 16.0, 10.0, 9.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-89.8125, -87.4248046875, -85.037109375, -82.6494140625, -80.26171875, -77.8740234375, -75.486328125, -73.0986328125, -70.7109375, -68.3232421875, -65.935546875, -63.5478515625, -61.16015625, -58.7724609375, -56.384765625, -53.9970703125, -51.609375, -49.2216796875, -46.833984375, -44.4462890625, -42.05859375, -39.6708984375, -37.283203125, -34.8955078125, -32.5078125, -30.1201171875, -27.732421875, -25.3447265625, -22.95703125, -20.5693359375, -18.181640625, -15.7939453125, -13.40625, -11.0185546875, -8.630859375, -6.2431640625, -3.85546875, -1.4677734375, 0.919921875, 3.3076171875, 5.6953125, 8.0830078125, 10.470703125, 12.8583984375, 15.24609375, 17.6337890625, 20.021484375, 22.4091796875, 24.796875, 27.1845703125, 29.572265625, 31.9599609375, 34.34765625, 36.7353515625, 39.123046875, 41.5107421875, 43.8984375, 46.2861328125, 48.673828125, 51.0615234375, 53.44921875, 55.8369140625, 58.224609375, 60.6123046875, 63.0]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 37.0, 868.0, 110.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1249.329345703125, -1227.6512451171875, -1205.97314453125, -1184.295166015625, -1162.6170654296875, -1140.93896484375, -1119.260986328125, -1097.5828857421875, -1075.90478515625, -1054.2266845703125, -1032.548583984375, -1010.87060546875, -989.1925048828125, -967.514404296875, -945.8363647460938, -924.1583251953125, -902.480224609375, -880.8021240234375, -859.1240844726562, -837.446044921875, -815.7679443359375, -794.08984375, -772.4118041992188, -750.7337646484375, -729.0556640625, -707.3775634765625, -685.6995239257812, -664.021484375, -642.3433837890625, -620.665283203125, -598.9872436523438, -577.3092041015625, -555.631103515625, -533.9530029296875, -512.2749633789062, -490.5968933105469, -468.9188232421875, -447.2407531738281, -425.56268310546875, -403.8846130371094, -382.20654296875, -360.5284729003906, -338.85040283203125, -317.1723327636719, -295.4942626953125, -273.8161926269531, -252.13812255859375, -230.46005249023438, -208.78199768066406, -187.1039276123047, -165.4258575439453, -143.74778747558594, -122.06971740722656, -100.39164733886719, -78.71357727050781, -57.03550720214844, -35.35743713378906, -13.679367065429688, 7.9987030029296875, 29.676773071289062, 51.35484313964844, 73.03291320800781, 94.71098327636719, 116.38905334472656, 138.06712341308594]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 7.0, 7.0, 3.0, 8.0, 12.0, 6.0, 15.0, 13.0, 26.0, 28.0, 19.0, 32.0, 34.0, 24.0, 31.0, 35.0, 43.0, 49.0, 39.0, 41.0, 62.0, 53.0, 48.0, 35.0, 35.0, 40.0, 30.0, 22.0, 35.0, 27.0, 19.0, 21.0, 12.0, 20.0, 15.0, 13.0, 8.0, 2.0, 8.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-80.67355346679688, -78.47052764892578, -76.26750946044922, -74.06448364257812, -71.86146545410156, -69.65843963623047, -67.45541381835938, -65.25239562988281, -63.04936981201172, -60.84634780883789, -58.64332580566406, -56.44029998779297, -54.23727798461914, -52.03425598144531, -49.831233978271484, -47.628211975097656, -45.42518997192383, -43.22216796875, -41.01914596557617, -38.816123962402344, -36.61309814453125, -34.41007614135742, -32.207054138183594, -30.004032135009766, -27.801008224487305, -25.597986221313477, -23.394962310791016, -21.191940307617188, -18.98891830444336, -16.7858943939209, -14.58287239074707, -12.379849433898926, -10.176826477050781, -7.973803520202637, -5.77078104019165, -3.567758560180664, -1.3647356033325195, 0.838287353515625, 3.041309356689453, 5.244332313537598, 7.447355270385742, 9.650378227233887, 11.853401184082031, 14.05642318725586, 16.259445190429688, 18.46246910095215, 20.665491104125977, 22.868515014648438, 25.071537017822266, 27.274559020996094, 29.477582931518555, 31.680604934692383, 33.883628845214844, 36.08665084838867, 38.2896728515625, 40.49269485473633, 42.695716857910156, 44.898738861083984, 47.10176086425781, 49.304786682128906, 51.507808685302734, 53.71083068847656, 55.91385269165039, 58.11687469482422, 60.31990051269531]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 6.0, 5.0, 10.0, 12.0, 16.0, 13.0, 13.0, 23.0, 24.0, 29.0, 38.0, 33.0, 43.0, 47.0, 44.0, 48.0, 44.0, 43.0, 34.0, 41.0, 39.0, 46.0, 44.0, 34.0, 39.0, 29.0, 41.0, 26.0, 21.0, 28.0, 15.0, 13.0, 13.0, 10.0, 10.0, 10.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.43310546875, -7.1396484375, -6.84619140625, -6.552734375, -6.25927734375, -5.9658203125, -5.67236328125, -5.37890625, -5.08544921875, -4.7919921875, -4.49853515625, -4.205078125, -3.91162109375, -3.6181640625, -3.32470703125, -3.03125, -2.73779296875, -2.4443359375, -2.15087890625, -1.857421875, -1.56396484375, -1.2705078125, -0.97705078125, -0.68359375, -0.39013671875, -0.0966796875, 0.19677734375, 0.490234375, 0.78369140625, 1.0771484375, 1.37060546875, 1.6640625, 1.95751953125, 2.2509765625, 2.54443359375, 2.837890625, 3.13134765625, 3.4248046875, 3.71826171875, 4.01171875, 4.30517578125, 4.5986328125, 4.89208984375, 5.185546875, 5.47900390625, 5.7724609375, 6.06591796875, 6.359375, 6.65283203125, 6.9462890625, 7.23974609375, 7.533203125, 7.82666015625, 8.1201171875, 8.41357421875, 8.70703125, 9.00048828125, 9.2939453125, 9.58740234375, 9.880859375, 10.17431640625, 10.4677734375, 10.76123046875, 11.0546875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 4.0, 9.0, 14.0, 18.0, 24.0, 38.0, 52.0, 76.0, 150.0, 231.0, 384.0, 655.0, 1076.0, 1929.0, 3248.0, 5529.0, 9897.0, 17208.0, 30398.0, 54229.0, 97185.0, 177252.0, 263811.0, 171365.0, 93386.0, 52025.0, 29023.0, 16836.0, 9469.0, 5412.0, 3115.0, 1815.0, 1087.0, 635.0, 367.0, 220.0, 145.0, 81.0, 51.0, 29.0, 19.0, 13.0, 14.0, 6.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5927734375, -1.5437164306640625, -1.494659423828125, -1.4456024169921875, -1.39654541015625, -1.3474884033203125, -1.298431396484375, -1.2493743896484375, -1.2003173828125, -1.1512603759765625, -1.102203369140625, -1.0531463623046875, -1.00408935546875, -0.9550323486328125, -0.905975341796875, -0.8569183349609375, -0.807861328125, -0.7588043212890625, -0.709747314453125, -0.6606903076171875, -0.61163330078125, -0.5625762939453125, -0.513519287109375, -0.4644622802734375, -0.4154052734375, -0.3663482666015625, -0.317291259765625, -0.2682342529296875, -0.21917724609375, -0.1701202392578125, -0.121063232421875, -0.0720062255859375, -0.02294921875, 0.0261077880859375, 0.075164794921875, 0.1242218017578125, 0.17327880859375, 0.2223358154296875, 0.271392822265625, 0.3204498291015625, 0.3695068359375, 0.4185638427734375, 0.467620849609375, 0.5166778564453125, 0.56573486328125, 0.6147918701171875, 0.663848876953125, 0.7129058837890625, 0.761962890625, 0.8110198974609375, 0.860076904296875, 0.9091339111328125, 0.95819091796875, 1.0072479248046875, 1.056304931640625, 1.1053619384765625, 1.1544189453125, 1.2034759521484375, 1.252532958984375, 1.3015899658203125, 1.35064697265625, 1.3997039794921875, 1.448760986328125, 1.4978179931640625, 1.546875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 9.0, 4.0, 12.0, 9.0, 18.0, 22.0, 24.0, 23.0, 17.0, 28.0, 26.0, 37.0, 30.0, 27.0, 32.0, 47.0, 28.0, 41.0, 1064.0, 34.0, 41.0, 47.0, 38.0, 36.0, 43.0, 33.0, 28.0, 30.0, 22.0, 34.0, 25.0, 15.0, 15.0, 13.0, 16.0, 10.0, 10.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.44537353515625, -4.2735595703125, -4.10174560546875, -3.929931640625, -3.75811767578125, -3.5863037109375, -3.41448974609375, -3.24267578125, -3.07086181640625, -2.8990478515625, -2.72723388671875, -2.555419921875, -2.38360595703125, -2.2117919921875, -2.03997802734375, -1.8681640625, -1.69635009765625, -1.5245361328125, -1.35272216796875, -1.180908203125, -1.00909423828125, -0.8372802734375, -0.66546630859375, -0.49365234375, -0.32183837890625, -0.1500244140625, 0.02178955078125, 0.193603515625, 0.36541748046875, 0.5372314453125, 0.70904541015625, 0.880859375, 1.05267333984375, 1.2244873046875, 1.39630126953125, 1.568115234375, 1.73992919921875, 1.9117431640625, 2.08355712890625, 2.25537109375, 2.42718505859375, 2.5989990234375, 2.77081298828125, 2.942626953125, 3.11444091796875, 3.2862548828125, 3.45806884765625, 3.6298828125, 3.80169677734375, 3.9735107421875, 4.14532470703125, 4.317138671875, 4.48895263671875, 4.6607666015625, 4.83258056640625, 5.00439453125, 5.17620849609375, 5.3480224609375, 5.51983642578125, 5.691650390625, 5.86346435546875, 6.0352783203125, 6.20709228515625, 6.37890625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 7.0, 14.0, 20.0, 38.0, 48.0, 73.0, 100.0, 148.0, 216.0, 323.0, 461.0, 684.0, 1037.0, 1492.0, 2314.0, 3425.0, 5283.0, 8004.0, 11987.0, 18794.0, 28827.0, 45585.0, 71928.0, 113044.0, 175366.0, 1243680.0, 131286.0, 83446.0, 52886.0, 33833.0, 21450.0, 14190.0, 9228.0, 6067.0, 3902.0, 2569.0, 1726.0, 1222.0, 797.0, 542.0, 354.0, 235.0, 155.0, 110.0, 63.0, 61.0, 37.0, 15.0, 23.0, 7.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0], "bins": [-1.1328125, -1.09759521484375, -1.0623779296875, -1.02716064453125, -0.991943359375, -0.95672607421875, -0.9215087890625, -0.88629150390625, -0.85107421875, -0.81585693359375, -0.7806396484375, -0.74542236328125, -0.710205078125, -0.67498779296875, -0.6397705078125, -0.60455322265625, -0.5693359375, -0.53411865234375, -0.4989013671875, -0.46368408203125, -0.428466796875, -0.39324951171875, -0.3580322265625, -0.32281494140625, -0.28759765625, -0.25238037109375, -0.2171630859375, -0.18194580078125, -0.146728515625, -0.11151123046875, -0.0762939453125, -0.04107666015625, -0.005859375, 0.02935791015625, 0.0645751953125, 0.09979248046875, 0.135009765625, 0.17022705078125, 0.2054443359375, 0.24066162109375, 0.27587890625, 0.31109619140625, 0.3463134765625, 0.38153076171875, 0.416748046875, 0.45196533203125, 0.4871826171875, 0.52239990234375, 0.5576171875, 0.59283447265625, 0.6280517578125, 0.66326904296875, 0.698486328125, 0.73370361328125, 0.7689208984375, 0.80413818359375, 0.83935546875, 0.87457275390625, 0.9097900390625, 0.94500732421875, 0.980224609375, 1.01544189453125, 1.0506591796875, 1.08587646484375, 1.12109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 5.0, 4.0, 11.0, 17.0, 11.0, 14.0, 21.0, 25.0, 19.0, 33.0, 42.0, 40.0, 61.0, 47.0, 55.0, 55.0, 65.0, 61.0, 51.0, 52.0, 52.0, 39.0, 28.0, 35.0, 33.0, 26.0, 16.0, 17.0, 10.0, 10.0, 15.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002025604248046875, -0.0019669532775878906, -0.0019083023071289062, -0.0018496513366699219, -0.0017910003662109375, -0.0017323493957519531, -0.0016736984252929688, -0.0016150474548339844, -0.001556396484375, -0.0014977455139160156, -0.0014390945434570312, -0.0013804435729980469, -0.0013217926025390625, -0.0012631416320800781, -0.0012044906616210938, -0.0011458396911621094, -0.001087188720703125, -0.0010285377502441406, -0.0009698867797851562, -0.0009112358093261719, -0.0008525848388671875, -0.0007939338684082031, -0.0007352828979492188, -0.0006766319274902344, -0.00061798095703125, -0.0005593299865722656, -0.0005006790161132812, -0.0004420280456542969, -0.0003833770751953125, -0.0003247261047363281, -0.00026607513427734375, -0.00020742416381835938, -0.000148773193359375, -9.012222290039062e-05, -3.147125244140625e-05, 2.7179718017578125e-05, 8.58306884765625e-05, 0.00014448165893554688, 0.00020313262939453125, 0.0002617835998535156, 0.0003204345703125, 0.0003790855407714844, 0.00043773651123046875, 0.0004963874816894531, 0.0005550384521484375, 0.0006136894226074219, 0.0006723403930664062, 0.0007309913635253906, 0.000789642333984375, 0.0008482933044433594, 0.0009069442749023438, 0.0009655952453613281, 0.0010242462158203125, 0.0010828971862792969, 0.0011415481567382812, 0.0012001991271972656, 0.00125885009765625, 0.0013175010681152344, 0.0013761520385742188, 0.0014348030090332031, 0.0014934539794921875, 0.0015521049499511719, 0.0016107559204101562, 0.0016694068908691406, 0.001728057861328125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 6.0, 12.0, 14.0, 12.0, 25.0, 24.0, 33.0, 46.0, 72.0, 104.0, 131.0, 174.0, 263.0, 441.0, 773.0, 4489.0, 1029541.0, 10002.0, 913.0, 456.0, 297.0, 202.0, 132.0, 87.0, 67.0, 69.0, 31.0, 42.0, 17.0, 19.0, 10.0, 9.0, 10.0, 7.0, 2.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.038787841796875, -0.03755903244018555, -0.036330223083496094, -0.03510141372680664, -0.03387260437011719, -0.032643795013427734, -0.03141498565673828, -0.030186176300048828, -0.028957366943359375, -0.027728557586669922, -0.02649974822998047, -0.025270938873291016, -0.024042129516601562, -0.02281332015991211, -0.021584510803222656, -0.020355701446533203, -0.01912689208984375, -0.017898082733154297, -0.016669273376464844, -0.01544046401977539, -0.014211654663085938, -0.012982845306396484, -0.011754035949707031, -0.010525226593017578, -0.009296417236328125, -0.008067607879638672, -0.006838798522949219, -0.005609989166259766, -0.0043811798095703125, -0.0031523704528808594, -0.0019235610961914062, -0.0006947517395019531, 0.0005340576171875, 0.0017628669738769531, 0.0029916763305664062, 0.004220485687255859, 0.0054492950439453125, 0.006678104400634766, 0.007906913757324219, 0.009135723114013672, 0.010364532470703125, 0.011593341827392578, 0.012822151184082031, 0.014050960540771484, 0.015279769897460938, 0.01650857925415039, 0.017737388610839844, 0.018966197967529297, 0.02019500732421875, 0.021423816680908203, 0.022652626037597656, 0.02388143539428711, 0.025110244750976562, 0.026339054107666016, 0.02756786346435547, 0.028796672821044922, 0.030025482177734375, 0.03125429153442383, 0.03248310089111328, 0.033711910247802734, 0.03494071960449219, 0.03616952896118164, 0.037398338317871094, 0.03862714767456055, 0.03985595703125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 65.0, 662.0, 278.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074579487554728985, -0.007230037357658148, -0.007002125959843397, -0.0067742145620286465, -0.006546303164213896, -0.006318391766399145, -0.006090480834245682, -0.005862569436430931, -0.00563465803861618, -0.00540674664080143, -0.005178835242986679, -0.004950923845171928, -0.004723012447357178, -0.004495101049542427, -0.004267189651727676, -0.004039278253912926, -0.003811366856098175, -0.0035834554582834244, -0.0033555440604686737, -0.003127632662653923, -0.0028997212648391724, -0.0026718098670244217, -0.0024438987020403147, -0.002215987304225564, -0.0019880759064108133, -0.0017601645085960627, -0.001532253110781312, -0.0013043418293818831, -0.0010764304315671325, -0.0008485190337523818, -0.000620607752352953, -0.0003926963545382023, -0.00016478542238473892, 6.312594632618129e-05, 0.0002910373150371015, 0.0005189486546441913, 0.0007468600524589419, 0.0009747714502736926, 0.0012026827316731215, 0.0014305941294878721, 0.0016585055273026228, 0.0018864169251173735, 0.002114328322932124, 0.002342239487916231, 0.002570150885730982, 0.0027980622835457325, 0.003025973681360483, 0.003253885079175234, 0.0034817964769899845, 0.003709707874804735, 0.003937619272619486, 0.0041655306704342365, 0.004393442068248987, 0.004621353466063738, 0.004849264398217201, 0.005077175796031952, 0.005305087193846703, 0.005532998591661453, 0.005760909989476204, 0.005988821387290955, 0.006216732785105705, 0.006444644182920456, 0.006672555580735207, 0.006900466978549957, 0.007128378376364708]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 2.0, 10.0, 5.0, 16.0, 12.0, 16.0, 20.0, 24.0, 24.0, 29.0, 34.0, 34.0, 48.0, 45.0, 46.0, 53.0, 45.0, 43.0, 40.0, 47.0, 44.0, 45.0, 48.0, 34.0, 37.0, 34.0, 36.0, 23.0, 14.0, 23.0, 17.0, 13.0, 8.0, 7.0, 5.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012417435646057129, -0.001206129789352417, -0.001170516014099121, -0.0011349022388458252, -0.0010992884635925293, -0.0010636746883392334, -0.0010280609130859375, -0.0009924471378326416, -0.0009568333625793457, -0.0009212195873260498, -0.0008856058120727539, -0.000849992036819458, -0.0008143782615661621, -0.0007787644863128662, -0.0007431507110595703, -0.0007075369358062744, -0.0006719231605529785, -0.0006363093852996826, -0.0006006956100463867, -0.0005650818347930908, -0.0005294680595397949, -0.000493854284286499, -0.0004582405090332031, -0.0004226267337799072, -0.00038701295852661133, -0.00035139918327331543, -0.00031578540802001953, -0.00028017163276672363, -0.00024455785751342773, -0.00020894408226013184, -0.00017333030700683594, -0.00013771653175354004, -0.00010210275650024414, -6.648898124694824e-05, -3.0875205993652344e-05, 4.738569259643555e-06, 4.035234451293945e-05, 7.596611976623535e-05, 0.00011157989501953125, 0.00014719367027282715, 0.00018280744552612305, 0.00021842122077941895, 0.00025403499603271484, 0.00028964877128601074, 0.00032526254653930664, 0.00036087632179260254, 0.00039649009704589844, 0.00043210387229919434, 0.00046771764755249023, 0.0005033314228057861, 0.000538945198059082, 0.0005745589733123779, 0.0006101727485656738, 0.0006457865238189697, 0.0006814002990722656, 0.0007170140743255615, 0.0007526278495788574, 0.0007882416248321533, 0.0008238554000854492, 0.0008594691753387451, 0.000895082950592041, 0.0009306967258453369, 0.0009663105010986328, 0.0010019242763519287, 0.0010375380516052246]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 6.0, 5.0, 10.0, 12.0, 17.0, 12.0, 13.0, 23.0, 24.0, 29.0, 38.0, 33.0, 43.0, 47.0, 44.0, 48.0, 44.0, 43.0, 34.0, 41.0, 39.0, 46.0, 44.0, 34.0, 39.0, 29.0, 41.0, 26.0, 21.0, 28.0, 15.0, 13.0, 13.0, 10.0, 10.0, 10.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.43310546875, -7.1396484375, -6.84619140625, -6.552734375, -6.25927734375, -5.9658203125, -5.67236328125, -5.37890625, -5.08544921875, -4.7919921875, -4.49853515625, -4.205078125, -3.91162109375, -3.6181640625, -3.32470703125, -3.03125, -2.73779296875, -2.4443359375, -2.15087890625, -1.857421875, -1.56396484375, -1.2705078125, -0.97705078125, -0.68359375, -0.39013671875, -0.0966796875, 0.19677734375, 0.490234375, 0.78369140625, 1.0771484375, 1.37060546875, 1.6640625, 1.95751953125, 2.2509765625, 2.54443359375, 2.837890625, 3.13134765625, 3.4248046875, 3.71826171875, 4.01171875, 4.30517578125, 4.5986328125, 4.89208984375, 5.185546875, 5.47900390625, 5.7724609375, 6.06591796875, 6.359375, 6.65283203125, 6.9462890625, 7.23974609375, 7.533203125, 7.82666015625, 8.1201171875, 8.41357421875, 8.70703125, 9.00048828125, 9.2939453125, 9.58740234375, 9.880859375, 10.17431640625, 10.4677734375, 10.76123046875, 11.0546875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 6.0, 13.0, 17.0, 34.0, 36.0, 67.0, 78.0, 101.0, 188.0, 270.0, 467.0, 664.0, 1045.0, 1604.0, 2959.0, 6359.0, 23034.0, 272233.0, 668350.0, 52175.0, 9500.0, 3847.0, 2021.0, 1236.0, 743.0, 532.0, 307.0, 211.0, 139.0, 110.0, 67.0, 39.0, 38.0, 24.0, 5.0, 4.0, 7.0, 10.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.5, -27.690185546875, -26.88037109375, -26.070556640625, -25.2607421875, -24.450927734375, -23.64111328125, -22.831298828125, -22.021484375, -21.211669921875, -20.40185546875, -19.592041015625, -18.7822265625, -17.972412109375, -17.16259765625, -16.352783203125, -15.54296875, -14.733154296875, -13.92333984375, -13.113525390625, -12.3037109375, -11.493896484375, -10.68408203125, -9.874267578125, -9.064453125, -8.254638671875, -7.44482421875, -6.635009765625, -5.8251953125, -5.015380859375, -4.20556640625, -3.395751953125, -2.5859375, -1.776123046875, -0.96630859375, -0.156494140625, 0.6533203125, 1.463134765625, 2.27294921875, 3.082763671875, 3.892578125, 4.702392578125, 5.51220703125, 6.322021484375, 7.1318359375, 7.941650390625, 8.75146484375, 9.561279296875, 10.37109375, 11.180908203125, 11.99072265625, 12.800537109375, 13.6103515625, 14.420166015625, 15.22998046875, 16.039794921875, 16.849609375, 17.659423828125, 18.46923828125, 19.279052734375, 20.0888671875, 20.898681640625, 21.70849609375, 22.518310546875, 23.328125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 11.0, 10.0, 7.0, 10.0, 13.0, 10.0, 13.0, 18.0, 28.0, 26.0, 23.0, 40.0, 60.0, 42.0, 61.0, 87.0, 182.0, 1649.0, 286.0, 94.0, 66.0, 47.0, 50.0, 38.0, 28.0, 37.0, 19.0, 25.0, 14.0, 15.0, 7.0, 5.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.109375, -24.26318359375, -23.4169921875, -22.57080078125, -21.724609375, -20.87841796875, -20.0322265625, -19.18603515625, -18.33984375, -17.49365234375, -16.6474609375, -15.80126953125, -14.955078125, -14.10888671875, -13.2626953125, -12.41650390625, -11.5703125, -10.72412109375, -9.8779296875, -9.03173828125, -8.185546875, -7.33935546875, -6.4931640625, -5.64697265625, -4.80078125, -3.95458984375, -3.1083984375, -2.26220703125, -1.416015625, -0.56982421875, 0.2763671875, 1.12255859375, 1.96875, 2.81494140625, 3.6611328125, 4.50732421875, 5.353515625, 6.19970703125, 7.0458984375, 7.89208984375, 8.73828125, 9.58447265625, 10.4306640625, 11.27685546875, 12.123046875, 12.96923828125, 13.8154296875, 14.66162109375, 15.5078125, 16.35400390625, 17.2001953125, 18.04638671875, 18.892578125, 19.73876953125, 20.5849609375, 21.43115234375, 22.27734375, 23.12353515625, 23.9697265625, 24.81591796875, 25.662109375, 26.50830078125, 27.3544921875, 28.20068359375, 29.046875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 11.0, 18.0, 26.0, 30.0, 46.0, 74.0, 93.0, 124.0, 231.0, 359.0, 737.0, 3243.0, 3096460.0, 41438.0, 1393.0, 505.0, 266.0, 191.0, 102.0, 83.0, 75.0, 49.0, 21.0, 32.0, 14.0, 23.0, 9.0, 4.0, 10.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.4375, -94.6337890625, -91.830078125, -89.0263671875, -86.22265625, -83.4189453125, -80.615234375, -77.8115234375, -75.0078125, -72.2041015625, -69.400390625, -66.5966796875, -63.79296875, -60.9892578125, -58.185546875, -55.3818359375, -52.578125, -49.7744140625, -46.970703125, -44.1669921875, -41.36328125, -38.5595703125, -35.755859375, -32.9521484375, -30.1484375, -27.3447265625, -24.541015625, -21.7373046875, -18.93359375, -16.1298828125, -13.326171875, -10.5224609375, -7.71875, -4.9150390625, -2.111328125, 0.6923828125, 3.49609375, 6.2998046875, 9.103515625, 11.9072265625, 14.7109375, 17.5146484375, 20.318359375, 23.1220703125, 25.92578125, 28.7294921875, 31.533203125, 34.3369140625, 37.140625, 39.9443359375, 42.748046875, 45.5517578125, 48.35546875, 51.1591796875, 53.962890625, 56.7666015625, 59.5703125, 62.3740234375, 65.177734375, 67.9814453125, 70.78515625, 73.5888671875, 76.392578125, 79.1962890625, 82.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 12.0, 121.0, 427.0, 351.0, 87.0, 10.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.39105224609375, -230.99803161621094, -225.60501098632812, -220.21197509765625, -214.81895446777344, -209.42593383789062, -204.0329132080078, -198.639892578125, -193.24685668945312, -187.8538360595703, -182.4608154296875, -177.06777954101562, -171.6747589111328, -166.28173828125, -160.8887176513672, -155.49569702148438, -150.1026611328125, -144.7096405029297, -139.31661987304688, -133.923583984375, -128.5305633544922, -123.13754272460938, -117.74452209472656, -112.35149383544922, -106.95848083496094, -101.56546020507812, -96.17243194580078, -90.77941131591797, -85.38638305664062, -79.99336242675781, -74.600341796875, -69.20731353759766, -63.814292907714844, -58.421268463134766, -53.02824401855469, -47.635223388671875, -42.24219512939453, -36.84917449951172, -31.45615005493164, -26.063125610351562, -20.670101165771484, -15.277076721191406, -9.884053230285645, -4.491029739379883, 0.9019947052001953, 6.295019149780273, 11.688041687011719, 17.081066131591797, 22.474090576171875, 27.867115020751953, 33.26013946533203, 38.653160095214844, 44.04618835449219, 49.439208984375, 54.83223342895508, 60.225257873535156, 65.6182861328125, 71.01130676269531, 76.40433502197266, 81.79735565185547, 87.19038391113281, 92.58340454101562, 97.97642517089844, 103.36945343017578, 108.7624740600586]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 4.0, 7.0, 12.0, 14.0, 20.0, 19.0, 17.0, 34.0, 33.0, 30.0, 37.0, 35.0, 47.0, 43.0, 48.0, 33.0, 38.0, 52.0, 30.0, 41.0, 31.0, 37.0, 32.0, 39.0, 33.0, 20.0, 33.0, 25.0, 17.0, 17.0, 29.0, 21.0, 12.0, 14.0, 10.0, 4.0, 7.0, 3.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-67.76932525634766, -65.67735290527344, -63.58538055419922, -61.493412017822266, -59.40143966674805, -57.30946731567383, -55.217498779296875, -53.125526428222656, -51.03355407714844, -48.94158172607422, -46.849609375, -44.75764083862305, -42.66566848754883, -40.57369613647461, -38.481727600097656, -36.38975524902344, -34.29778289794922, -32.205810546875, -30.113840103149414, -28.021869659423828, -25.92989730834961, -23.83792495727539, -21.745954513549805, -19.65398406982422, -17.56201171875, -15.470040321350098, -13.378068923950195, -11.286097526550293, -9.19412612915039, -7.102154731750488, -5.010183334350586, -2.9182119369506836, -0.8262481689453125, 1.2657232284545898, 3.357694625854492, 5.4496660232543945, 7.541637420654297, 9.6336088180542, 11.725580215454102, 13.817551612854004, 15.909523010253906, 18.001495361328125, 20.09346580505371, 22.185436248779297, 24.277408599853516, 26.369380950927734, 28.46135139465332, 30.553321838378906, 32.645294189453125, 34.737266540527344, 36.82923889160156, 38.921207427978516, 41.013179779052734, 43.10515213012695, 45.197120666503906, 47.289093017578125, 49.381065368652344, 51.47303771972656, 53.56501007080078, 55.656978607177734, 57.74895095825195, 59.84092330932617, 61.932891845703125, 64.02486419677734, 66.11683654785156]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 9.0, 4.0, 7.0, 8.0, 11.0, 7.0, 8.0, 11.0, 20.0, 29.0, 22.0, 25.0, 35.0, 31.0, 36.0, 55.0, 40.0, 42.0, 52.0, 40.0, 40.0, 34.0, 41.0, 43.0, 43.0, 32.0, 25.0, 41.0, 27.0, 28.0, 30.0, 24.0, 13.0, 17.0, 17.0, 10.0, 10.0, 3.0, 8.0, 5.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.823486328125, -7.53759765625, -7.251708984375, -6.9658203125, -6.679931640625, -6.39404296875, -6.108154296875, -5.822265625, -5.536376953125, -5.25048828125, -4.964599609375, -4.6787109375, -4.392822265625, -4.10693359375, -3.821044921875, -3.53515625, -3.249267578125, -2.96337890625, -2.677490234375, -2.3916015625, -2.105712890625, -1.81982421875, -1.533935546875, -1.248046875, -0.962158203125, -0.67626953125, -0.390380859375, -0.1044921875, 0.181396484375, 0.46728515625, 0.753173828125, 1.0390625, 1.324951171875, 1.61083984375, 1.896728515625, 2.1826171875, 2.468505859375, 2.75439453125, 3.040283203125, 3.326171875, 3.612060546875, 3.89794921875, 4.183837890625, 4.4697265625, 4.755615234375, 5.04150390625, 5.327392578125, 5.61328125, 5.899169921875, 6.18505859375, 6.470947265625, 6.7568359375, 7.042724609375, 7.32861328125, 7.614501953125, 7.900390625, 8.186279296875, 8.47216796875, 8.758056640625, 9.0439453125, 9.329833984375, 9.61572265625, 9.901611328125, 10.1875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 8.0, 14.0, 15.0, 21.0, 31.0, 43.0, 62.0, 74.0, 115.0, 152.0, 240.0, 373.0, 604.0, 1120.0, 2107.0, 4673.0, 15259.0, 117386.0, 1514459.0, 2284952.0, 220308.0, 20818.0, 5599.0, 2583.0, 1252.0, 752.0, 441.0, 276.0, 158.0, 104.0, 86.0, 61.0, 31.0, 28.0, 20.0, 15.0, 12.0, 14.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8984375, -15.2655029296875, -14.632568359375, -13.9996337890625, -13.36669921875, -12.7337646484375, -12.100830078125, -11.4678955078125, -10.8349609375, -10.2020263671875, -9.569091796875, -8.9361572265625, -8.30322265625, -7.6702880859375, -7.037353515625, -6.4044189453125, -5.771484375, -5.1385498046875, -4.505615234375, -3.8726806640625, -3.23974609375, -2.6068115234375, -1.973876953125, -1.3409423828125, -0.7080078125, -0.0750732421875, 0.557861328125, 1.1907958984375, 1.82373046875, 2.4566650390625, 3.089599609375, 3.7225341796875, 4.35546875, 4.9884033203125, 5.621337890625, 6.2542724609375, 6.88720703125, 7.5201416015625, 8.153076171875, 8.7860107421875, 9.4189453125, 10.0518798828125, 10.684814453125, 11.3177490234375, 11.95068359375, 12.5836181640625, 13.216552734375, 13.8494873046875, 14.482421875, 15.1153564453125, 15.748291015625, 16.3812255859375, 17.01416015625, 17.6470947265625, 18.280029296875, 18.9129638671875, 19.5458984375, 20.1788330078125, 20.811767578125, 21.4447021484375, 22.07763671875, 22.7105712890625, 23.343505859375, 23.9764404296875, 24.609375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 2.0, 6.0, 21.0, 31.0, 44.0, 85.0, 196.0, 322.0, 631.0, 1025.0, 785.0, 406.0, 253.0, 125.0, 68.0, 27.0, 24.0, 11.0, 6.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.251220703125, -22.26806640625, -21.284912109375, -20.3017578125, -19.318603515625, -18.33544921875, -17.352294921875, -16.369140625, -15.385986328125, -14.40283203125, -13.419677734375, -12.4365234375, -11.453369140625, -10.47021484375, -9.487060546875, -8.50390625, -7.520751953125, -6.53759765625, -5.554443359375, -4.5712890625, -3.588134765625, -2.60498046875, -1.621826171875, -0.638671875, 0.344482421875, 1.32763671875, 2.310791015625, 3.2939453125, 4.277099609375, 5.26025390625, 6.243408203125, 7.2265625, 8.209716796875, 9.19287109375, 10.176025390625, 11.1591796875, 12.142333984375, 13.12548828125, 14.108642578125, 15.091796875, 16.074951171875, 17.05810546875, 18.041259765625, 19.0244140625, 20.007568359375, 20.99072265625, 21.973876953125, 22.95703125, 23.940185546875, 24.92333984375, 25.906494140625, 26.8896484375, 27.872802734375, 28.85595703125, 29.839111328125, 30.822265625, 31.805419921875, 32.78857421875, 33.771728515625, 34.7548828125, 35.738037109375, 36.72119140625, 37.704345703125, 38.6875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 5.0, 11.0, 24.0, 23.0, 36.0, 85.0, 127.0, 262.0, 542.0, 1339.0, 5606.0, 3060638.0, 1118962.0, 4474.0, 1164.0, 477.0, 214.0, 114.0, 69.0, 39.0, 21.0, 8.0, 14.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-73.5625, -71.5712890625, -69.580078125, -67.5888671875, -65.59765625, -63.6064453125, -61.615234375, -59.6240234375, -57.6328125, -55.6416015625, -53.650390625, -51.6591796875, -49.66796875, -47.6767578125, -45.685546875, -43.6943359375, -41.703125, -39.7119140625, -37.720703125, -35.7294921875, -33.73828125, -31.7470703125, -29.755859375, -27.7646484375, -25.7734375, -23.7822265625, -21.791015625, -19.7998046875, -17.80859375, -15.8173828125, -13.826171875, -11.8349609375, -9.84375, -7.8525390625, -5.861328125, -3.8701171875, -1.87890625, 0.1123046875, 2.103515625, 4.0947265625, 6.0859375, 8.0771484375, 10.068359375, 12.0595703125, 14.05078125, 16.0419921875, 18.033203125, 20.0244140625, 22.015625, 24.0068359375, 25.998046875, 27.9892578125, 29.98046875, 31.9716796875, 33.962890625, 35.9541015625, 37.9453125, 39.9365234375, 41.927734375, 43.9189453125, 45.91015625, 47.9013671875, 49.892578125, 51.8837890625, 53.875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 36.0, 297.0, 503.0, 163.0, 14.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-347.0843505859375, -339.4287109375, -331.7730407714844, -324.1174011230469, -316.4617614746094, -308.80609130859375, -301.15045166015625, -293.49481201171875, -285.83917236328125, -278.18353271484375, -270.5278625488281, -262.8722229003906, -255.21658325195312, -247.56092834472656, -239.9052734375, -232.2496337890625, -224.59396362304688, -216.9383087158203, -209.2826690673828, -201.62701416015625, -193.97137451171875, -186.3157196044922, -178.66006469726562, -171.00442504882812, -163.34878540039062, -155.69313049316406, -148.03749084472656, -140.3818359375, -132.7261962890625, -125.07054138183594, -117.4148941040039, -109.75924682617188, -102.10359191894531, -94.44794464111328, -86.79229736328125, -79.13664245605469, -71.48099517822266, -63.825347900390625, -56.169700622558594, -48.5140495300293, -40.858402252197266, -33.202754974365234, -25.547103881835938, -17.891456604003906, -10.235807418823242, -2.580158233642578, 5.075489044189453, 12.73114013671875, 20.38678741455078, 28.042436599731445, 35.69808578491211, 43.35373306274414, 51.00938415527344, 58.66503143310547, 66.3206787109375, 73.97633361816406, 81.63197326660156, 89.2876205444336, 96.94326782226562, 104.59892272949219, 112.25457000732422, 119.91021728515625, 127.56586456298828, 135.2215118408203, 142.87716674804688]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 13.0, 11.0, 16.0, 24.0, 32.0, 36.0, 42.0, 42.0, 54.0, 59.0, 55.0, 55.0, 45.0, 62.0, 58.0, 54.0, 43.0, 33.0, 48.0, 36.0, 43.0, 26.0, 30.0, 17.0, 13.0, 17.0, 4.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.59625244140625, -82.1253890991211, -79.6545181274414, -77.18365478515625, -74.7127914428711, -72.24192810058594, -69.77105712890625, -67.3001937866211, -64.82933044433594, -62.358463287353516, -59.88759994506836, -57.41673278808594, -54.94586944580078, -52.47500228881836, -50.00413513183594, -47.53327178955078, -45.062400817871094, -42.59153366088867, -40.120670318603516, -37.649803161621094, -35.17893981933594, -32.708072662353516, -30.237205505371094, -27.766340255737305, -25.295475006103516, -22.824609756469727, -20.353744506835938, -17.882877349853516, -15.412012100219727, -12.941146850585938, -10.470280647277832, -7.999414443969727, -5.5285491943359375, -3.0576834678649902, -0.586817741394043, 1.8840479850769043, 4.354913711547852, 6.825778961181641, 9.296645164489746, 11.767511367797852, 14.23837661743164, 16.70924186706543, 19.18010711669922, 21.65097427368164, 24.12183952331543, 26.59270477294922, 29.06357192993164, 31.53443717956543, 34.00530242919922, 36.47616958618164, 38.9470329284668, 41.41790008544922, 43.888763427734375, 46.3596305847168, 48.83049774169922, 51.301361083984375, 53.7722282409668, 56.24309539794922, 58.713958740234375, 61.1848258972168, 63.65569305419922, 66.12655639648438, 68.59741973876953, 71.06829071044922, 73.53915405273438]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 10.0, 11.0, 13.0, 12.0, 13.0, 18.0, 23.0, 31.0, 26.0, 27.0, 29.0, 39.0, 41.0, 46.0, 45.0, 42.0, 54.0, 39.0, 33.0, 45.0, 41.0, 33.0, 38.0, 32.0, 41.0, 30.0, 36.0, 17.0, 27.0, 24.0, 9.0, 15.0, 13.0, 10.0, 8.0, 8.0, 3.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.90966796875, -5.6787109375, -5.44775390625, -5.216796875, -4.98583984375, -4.7548828125, -4.52392578125, -4.29296875, -4.06201171875, -3.8310546875, -3.60009765625, -3.369140625, -3.13818359375, -2.9072265625, -2.67626953125, -2.4453125, -2.21435546875, -1.9833984375, -1.75244140625, -1.521484375, -1.29052734375, -1.0595703125, -0.82861328125, -0.59765625, -0.36669921875, -0.1357421875, 0.09521484375, 0.326171875, 0.55712890625, 0.7880859375, 1.01904296875, 1.25, 1.48095703125, 1.7119140625, 1.94287109375, 2.173828125, 2.40478515625, 2.6357421875, 2.86669921875, 3.09765625, 3.32861328125, 3.5595703125, 3.79052734375, 4.021484375, 4.25244140625, 4.4833984375, 4.71435546875, 4.9453125, 5.17626953125, 5.4072265625, 5.63818359375, 5.869140625, 6.10009765625, 6.3310546875, 6.56201171875, 6.79296875, 7.02392578125, 7.2548828125, 7.48583984375, 7.716796875, 7.94775390625, 8.1787109375, 8.40966796875, 8.640625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 17.0, 18.0, 13.0, 35.0, 44.0, 72.0, 115.0, 168.0, 277.0, 413.0, 562.0, 780.0, 1273.0, 1906.0, 2814.0, 4227.0, 6276.0, 9613.0, 14867.0, 22425.0, 35802.0, 57045.0, 93449.0, 151441.0, 215842.0, 160862.0, 98987.0, 61219.0, 38206.0, 24180.0, 15395.0, 10103.0, 6633.0, 4345.0, 2951.0, 2085.0, 1302.0, 923.0, 647.0, 398.0, 258.0, 205.0, 120.0, 84.0, 62.0, 34.0, 20.0, 22.0, 10.0, 1.0, 3.0, 0.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.98291015625, -0.952728271484375, -0.92254638671875, -0.892364501953125, -0.8621826171875, -0.832000732421875, -0.80181884765625, -0.771636962890625, -0.741455078125, -0.711273193359375, -0.68109130859375, -0.650909423828125, -0.6207275390625, -0.590545654296875, -0.56036376953125, -0.530181884765625, -0.5, -0.469818115234375, -0.43963623046875, -0.409454345703125, -0.3792724609375, -0.349090576171875, -0.31890869140625, -0.288726806640625, -0.258544921875, -0.228363037109375, -0.19818115234375, -0.167999267578125, -0.1378173828125, -0.107635498046875, -0.07745361328125, -0.047271728515625, -0.01708984375, 0.013092041015625, 0.04327392578125, 0.073455810546875, 0.1036376953125, 0.133819580078125, 0.16400146484375, 0.194183349609375, 0.224365234375, 0.254547119140625, 0.28472900390625, 0.314910888671875, 0.3450927734375, 0.375274658203125, 0.40545654296875, 0.435638427734375, 0.4658203125, 0.496002197265625, 0.52618408203125, 0.556365966796875, 0.5865478515625, 0.616729736328125, 0.64691162109375, 0.677093505859375, 0.707275390625, 0.737457275390625, 0.76763916015625, 0.797821044921875, 0.8280029296875, 0.858184814453125, 0.88836669921875, 0.918548583984375, 0.94873046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 6.0, 8.0, 7.0, 9.0, 10.0, 12.0, 20.0, 21.0, 19.0, 28.0, 28.0, 27.0, 23.0, 43.0, 25.0, 28.0, 36.0, 39.0, 35.0, 41.0, 1057.0, 33.0, 40.0, 38.0, 40.0, 31.0, 29.0, 38.0, 35.0, 32.0, 24.0, 18.0, 16.0, 17.0, 20.0, 11.0, 12.0, 7.0, 9.0, 6.0, 9.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.20703125, -4.0836181640625, -3.960205078125, -3.8367919921875, -3.71337890625, -3.5899658203125, -3.466552734375, -3.3431396484375, -3.2197265625, -3.0963134765625, -2.972900390625, -2.8494873046875, -2.72607421875, -2.6026611328125, -2.479248046875, -2.3558349609375, -2.232421875, -2.1090087890625, -1.985595703125, -1.8621826171875, -1.73876953125, -1.6153564453125, -1.491943359375, -1.3685302734375, -1.2451171875, -1.1217041015625, -0.998291015625, -0.8748779296875, -0.75146484375, -0.6280517578125, -0.504638671875, -0.3812255859375, -0.2578125, -0.1343994140625, -0.010986328125, 0.1124267578125, 0.23583984375, 0.3592529296875, 0.482666015625, 0.6060791015625, 0.7294921875, 0.8529052734375, 0.976318359375, 1.0997314453125, 1.22314453125, 1.3465576171875, 1.469970703125, 1.5933837890625, 1.716796875, 1.8402099609375, 1.963623046875, 2.0870361328125, 2.21044921875, 2.3338623046875, 2.457275390625, 2.5806884765625, 2.7041015625, 2.8275146484375, 2.950927734375, 3.0743408203125, 3.19775390625, 3.3211669921875, 3.444580078125, 3.5679931640625, 3.69140625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 21.0, 24.0, 43.0, 56.0, 96.0, 141.0, 204.0, 300.0, 426.0, 650.0, 871.0, 1375.0, 2031.0, 2990.0, 4499.0, 6493.0, 10018.0, 15036.0, 23051.0, 35432.0, 54516.0, 82779.0, 124564.0, 1224610.0, 168380.0, 115294.0, 76776.0, 50091.0, 32862.0, 21541.0, 14002.0, 9062.0, 6181.0, 4099.0, 2843.0, 1850.0, 1275.0, 858.0, 617.0, 352.0, 267.0, 177.0, 114.0, 81.0, 47.0, 41.0, 35.0, 19.0, 12.0, 6.0, 6.0, 3.0, 4.0, 1.0], "bins": [-0.88134765625, -0.8553543090820312, -0.8293609619140625, -0.8033676147460938, -0.777374267578125, -0.7513809204101562, -0.7253875732421875, -0.6993942260742188, -0.67340087890625, -0.6474075317382812, -0.6214141845703125, -0.5954208374023438, -0.569427490234375, -0.5434341430664062, -0.5174407958984375, -0.49144744873046875, -0.4654541015625, -0.43946075439453125, -0.4134674072265625, -0.38747406005859375, -0.361480712890625, -0.33548736572265625, -0.3094940185546875, -0.28350067138671875, -0.25750732421875, -0.23151397705078125, -0.2055206298828125, -0.17952728271484375, -0.153533935546875, -0.12754058837890625, -0.1015472412109375, -0.07555389404296875, -0.049560546875, -0.02356719970703125, 0.0024261474609375, 0.02841949462890625, 0.054412841796875, 0.08040618896484375, 0.1063995361328125, 0.13239288330078125, 0.15838623046875, 0.18437957763671875, 0.2103729248046875, 0.23636627197265625, 0.262359619140625, 0.28835296630859375, 0.3143463134765625, 0.34033966064453125, 0.3663330078125, 0.39232635498046875, 0.4183197021484375, 0.44431304931640625, 0.470306396484375, 0.49629974365234375, 0.5222930908203125, 0.5482864379882812, 0.57427978515625, 0.6002731323242188, 0.6262664794921875, 0.6522598266601562, 0.678253173828125, 0.7042465209960938, 0.7302398681640625, 0.7562332153320312, 0.7822265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 6.0, 6.0, 11.0, 13.0, 24.0, 35.0, 42.0, 33.0, 49.0, 59.0, 56.0, 62.0, 78.0, 73.0, 68.0, 57.0, 54.0, 52.0, 38.0, 31.0, 26.0, 25.0, 16.0, 16.0, 10.0, 16.0, 4.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017948150634765625, -0.0017390847206115723, -0.001683354377746582, -0.0016276240348815918, -0.0015718936920166016, -0.0015161633491516113, -0.001460433006286621, -0.0014047026634216309, -0.0013489723205566406, -0.0012932419776916504, -0.0012375116348266602, -0.00118178129196167, -0.0011260509490966797, -0.0010703206062316895, -0.0010145902633666992, -0.000958859920501709, -0.0009031295776367188, -0.0008473992347717285, -0.0007916688919067383, -0.000735938549041748, -0.0006802082061767578, -0.0006244778633117676, -0.0005687475204467773, -0.0005130171775817871, -0.0004572868347167969, -0.00040155649185180664, -0.0003458261489868164, -0.00029009580612182617, -0.00023436546325683594, -0.0001786351203918457, -0.00012290477752685547, -6.717443466186523e-05, -1.1444091796875e-05, 4.4286251068115234e-05, 0.00010001659393310547, 0.0001557469367980957, 0.00021147727966308594, 0.00026720762252807617, 0.0003229379653930664, 0.00037866830825805664, 0.0004343986511230469, 0.0004901289939880371, 0.0005458593368530273, 0.0006015896797180176, 0.0006573200225830078, 0.000713050365447998, 0.0007687807083129883, 0.0008245110511779785, 0.0008802413940429688, 0.000935971736907959, 0.0009917020797729492, 0.0010474324226379395, 0.0011031627655029297, 0.00115889310836792, 0.0012146234512329102, 0.0012703537940979004, 0.0013260841369628906, 0.0013818144798278809, 0.001437544822692871, 0.0014932751655578613, 0.0015490055084228516, 0.0016047358512878418, 0.001660466194152832, 0.0017161965370178223, 0.0017719268798828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 7.0, 16.0, 18.0, 16.0, 26.0, 43.0, 62.0, 74.0, 72.0, 118.0, 148.0, 245.0, 343.0, 541.0, 1128.0, 151675.0, 890415.0, 1530.0, 667.0, 400.0, 266.0, 164.0, 118.0, 116.0, 65.0, 68.0, 36.0, 35.0, 15.0, 20.0, 17.0, 11.0, 8.0, 10.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0292510986328125, -0.028340578079223633, -0.027430057525634766, -0.0265195369720459, -0.02560901641845703, -0.024698495864868164, -0.023787975311279297, -0.02287745475769043, -0.021966934204101562, -0.021056413650512695, -0.020145893096923828, -0.01923537254333496, -0.018324851989746094, -0.017414331436157227, -0.01650381088256836, -0.015593290328979492, -0.014682769775390625, -0.013772249221801758, -0.01286172866821289, -0.011951208114624023, -0.011040687561035156, -0.010130167007446289, -0.009219646453857422, -0.008309125900268555, -0.0073986053466796875, -0.00648808479309082, -0.005577564239501953, -0.004667043685913086, -0.0037565231323242188, -0.0028460025787353516, -0.0019354820251464844, -0.0010249614715576172, -0.00011444091796875, 0.0007960796356201172, 0.0017066001892089844, 0.0026171207427978516, 0.0035276412963867188, 0.004438161849975586, 0.005348682403564453, 0.00625920295715332, 0.0071697235107421875, 0.008080244064331055, 0.008990764617919922, 0.009901285171508789, 0.010811805725097656, 0.011722326278686523, 0.01263284683227539, 0.013543367385864258, 0.014453887939453125, 0.015364408493041992, 0.01627492904663086, 0.017185449600219727, 0.018095970153808594, 0.01900649070739746, 0.019917011260986328, 0.020827531814575195, 0.021738052368164062, 0.02264857292175293, 0.023559093475341797, 0.024469614028930664, 0.02538013458251953, 0.0262906551361084, 0.027201175689697266, 0.028111696243286133, 0.029022216796875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 310.0, 585.0, 92.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00799393281340599, -0.007854266092181206, -0.0077146003022789955, -0.007574933581054211, -0.007435267325490713, -0.007295601069927216, -0.007155934814363718, -0.0070162685588002205, -0.006876601837575436, -0.006736935582011938, -0.0065972693264484406, -0.006457602605223656, -0.006317936349660158, -0.006178270094096661, -0.006038603838533163, -0.0058989375829696655, -0.005759270861744881, -0.005619604606181383, -0.005479938350617886, -0.005340271629393101, -0.005200605373829603, -0.005060939118266106, -0.004921272862702608, -0.0047816066071391106, -0.004641940351575613, -0.0045022740960121155, -0.004362607840448618, -0.004222941119223833, -0.0040832748636603355, -0.003943608608096838, -0.0038039423525333405, -0.0036642758641391993, -0.003524609375745058, -0.0033849431201815605, -0.0032452766317874193, -0.0031056103762239218, -0.0029659438878297806, -0.002826277632266283, -0.0026866113767027855, -0.0025469448883086443, -0.002407278399914503, -0.0022676121443510056, -0.0021279456559568644, -0.001988279400393367, -0.0018486129119992256, -0.001708946656435728, -0.0015692802844569087, -0.0014296139124780893, -0.0012899476569145918, -0.0011502812849357724, -0.001010614912956953, -0.0008709485991857946, -0.0007312822272069752, -0.0005916158552281559, -0.0004519495414569974, -0.000312283169478178, -0.00017261679749935865, -3.295044007245451e-05, 0.00010671591735444963, 0.00024638226022943854, 0.0003860486322082579, 0.0005257150041870773, 0.0006653813179582357, 0.0008050476899370551, 0.0009447140619158745]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 3.0, 4.0, 11.0, 9.0, 10.0, 19.0, 19.0, 17.0, 18.0, 35.0, 39.0, 36.0, 36.0, 35.0, 38.0, 45.0, 51.0, 47.0, 49.0, 50.0, 41.0, 45.0, 47.0, 44.0, 37.0, 30.0, 21.0, 32.0, 25.0, 16.0, 12.0, 8.0, 15.0, 15.0, 9.0, 5.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008946657180786133, -0.0008666180074214935, -0.0008385702967643738, -0.000810522586107254, -0.0007824748754501343, -0.0007544271647930145, -0.0007263794541358948, -0.000698331743478775, -0.0006702840328216553, -0.0006422363221645355, -0.0006141886115074158, -0.000586140900850296, -0.0005580931901931763, -0.0005300454795360565, -0.0005019977688789368, -0.000473950058221817, -0.00044590234756469727, -0.0004178546369075775, -0.00038980692625045776, -0.000361759215593338, -0.00033371150493621826, -0.0003056637942790985, -0.00027761608362197876, -0.000249568372964859, -0.00022152066230773926, -0.0001934729516506195, -0.00016542524099349976, -0.00013737753033638, -0.00010932981967926025, -8.12821090221405e-05, -5.323439836502075e-05, -2.5186687707901e-05, 2.86102294921875e-06, 3.09087336063385e-05, 5.895644426345825e-05, 8.7004154920578e-05, 0.00011505186557769775, 0.0001430995762348175, 0.00017114728689193726, 0.000199194997549057, 0.00022724270820617676, 0.0002552904188632965, 0.00028333812952041626, 0.000311385840177536, 0.00033943355083465576, 0.0003674812614917755, 0.00039552897214889526, 0.000423576682806015, 0.00045162439346313477, 0.0004796721041202545, 0.0005077198147773743, 0.000535767525434494, 0.0005638152360916138, 0.0005918629467487335, 0.0006199106574058533, 0.000647958368062973, 0.0006760060787200928, 0.0007040537893772125, 0.0007321015000343323, 0.000760149210691452, 0.0007881969213485718, 0.0008162446320056915, 0.0008442923426628113, 0.000872340053319931, 0.0009003877639770508]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 10.0, 11.0, 13.0, 12.0, 13.0, 18.0, 23.0, 31.0, 26.0, 27.0, 29.0, 39.0, 41.0, 46.0, 45.0, 42.0, 54.0, 39.0, 33.0, 45.0, 41.0, 33.0, 38.0, 32.0, 41.0, 30.0, 37.0, 16.0, 27.0, 24.0, 9.0, 15.0, 13.0, 10.0, 8.0, 8.0, 3.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.90966796875, -5.6787109375, -5.44775390625, -5.216796875, -4.98583984375, -4.7548828125, -4.52392578125, -4.29296875, -4.06201171875, -3.8310546875, -3.60009765625, -3.369140625, -3.13818359375, -2.9072265625, -2.67626953125, -2.4453125, -2.21435546875, -1.9833984375, -1.75244140625, -1.521484375, -1.29052734375, -1.0595703125, -0.82861328125, -0.59765625, -0.36669921875, -0.1357421875, 0.09521484375, 0.326171875, 0.55712890625, 0.7880859375, 1.01904296875, 1.25, 1.48095703125, 1.7119140625, 1.94287109375, 2.173828125, 2.40478515625, 2.6357421875, 2.86669921875, 3.09765625, 3.32861328125, 3.5595703125, 3.79052734375, 4.021484375, 4.25244140625, 4.4833984375, 4.71435546875, 4.9453125, 5.17626953125, 5.4072265625, 5.63818359375, 5.869140625, 6.10009765625, 6.3310546875, 6.56201171875, 6.79296875, 7.02392578125, 7.2548828125, 7.48583984375, 7.716796875, 7.94775390625, 8.1787109375, 8.40966796875, 8.640625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 5.0, 8.0, 7.0, 4.0, 10.0, 17.0, 15.0, 23.0, 33.0, 44.0, 59.0, 94.0, 116.0, 180.0, 241.0, 381.0, 553.0, 946.0, 1644.0, 3580.0, 8637.0, 28345.0, 134399.0, 628501.0, 185726.0, 35539.0, 10532.0, 4121.0, 1875.0, 1057.0, 601.0, 388.0, 256.0, 165.0, 130.0, 86.0, 64.0, 52.0, 27.0, 33.0, 14.0, 9.0, 8.0, 13.0, 5.0, 2.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.5185546875, -10.107421875, -9.6962890625, -9.28515625, -8.8740234375, -8.462890625, -8.0517578125, -7.640625, -7.2294921875, -6.818359375, -6.4072265625, -5.99609375, -5.5849609375, -5.173828125, -4.7626953125, -4.3515625, -3.9404296875, -3.529296875, -3.1181640625, -2.70703125, -2.2958984375, -1.884765625, -1.4736328125, -1.0625, -0.6513671875, -0.240234375, 0.1708984375, 0.58203125, 0.9931640625, 1.404296875, 1.8154296875, 2.2265625, 2.6376953125, 3.048828125, 3.4599609375, 3.87109375, 4.2822265625, 4.693359375, 5.1044921875, 5.515625, 5.9267578125, 6.337890625, 6.7490234375, 7.16015625, 7.5712890625, 7.982421875, 8.3935546875, 8.8046875, 9.2158203125, 9.626953125, 10.0380859375, 10.44921875, 10.8603515625, 11.271484375, 11.6826171875, 12.09375, 12.5048828125, 12.916015625, 13.3271484375, 13.73828125, 14.1494140625, 14.560546875, 14.9716796875, 15.3828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 9.0, 10.0, 8.0, 11.0, 20.0, 14.0, 21.0, 34.0, 39.0, 29.0, 56.0, 52.0, 46.0, 78.0, 184.0, 1732.0, 251.0, 81.0, 33.0, 52.0, 44.0, 43.0, 30.0, 31.0, 20.0, 21.0, 20.0, 17.0, 10.0, 7.0, 10.0, 4.0, 6.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.6875, -21.060302734375, -20.43310546875, -19.805908203125, -19.1787109375, -18.551513671875, -17.92431640625, -17.297119140625, -16.669921875, -16.042724609375, -15.41552734375, -14.788330078125, -14.1611328125, -13.533935546875, -12.90673828125, -12.279541015625, -11.65234375, -11.025146484375, -10.39794921875, -9.770751953125, -9.1435546875, -8.516357421875, -7.88916015625, -7.261962890625, -6.634765625, -6.007568359375, -5.38037109375, -4.753173828125, -4.1259765625, -3.498779296875, -2.87158203125, -2.244384765625, -1.6171875, -0.989990234375, -0.36279296875, 0.264404296875, 0.8916015625, 1.518798828125, 2.14599609375, 2.773193359375, 3.400390625, 4.027587890625, 4.65478515625, 5.281982421875, 5.9091796875, 6.536376953125, 7.16357421875, 7.790771484375, 8.41796875, 9.045166015625, 9.67236328125, 10.299560546875, 10.9267578125, 11.553955078125, 12.18115234375, 12.808349609375, 13.435546875, 14.062744140625, 14.68994140625, 15.317138671875, 15.9443359375, 16.571533203125, 17.19873046875, 17.825927734375, 18.453125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 0.0, 6.0, 9.0, 10.0, 6.0, 14.0, 17.0, 19.0, 22.0, 38.0, 54.0, 84.0, 102.0, 193.0, 376.0, 796.0, 5138.0, 3129949.0, 6973.0, 870.0, 402.0, 221.0, 123.0, 68.0, 55.0, 31.0, 33.0, 22.0, 8.0, 16.0, 16.0, 6.0, 5.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.3125, -54.46826171875, -52.6240234375, -50.77978515625, -48.935546875, -47.09130859375, -45.2470703125, -43.40283203125, -41.55859375, -39.71435546875, -37.8701171875, -36.02587890625, -34.181640625, -32.33740234375, -30.4931640625, -28.64892578125, -26.8046875, -24.96044921875, -23.1162109375, -21.27197265625, -19.427734375, -17.58349609375, -15.7392578125, -13.89501953125, -12.05078125, -10.20654296875, -8.3623046875, -6.51806640625, -4.673828125, -2.82958984375, -0.9853515625, 0.85888671875, 2.703125, 4.54736328125, 6.3916015625, 8.23583984375, 10.080078125, 11.92431640625, 13.7685546875, 15.61279296875, 17.45703125, 19.30126953125, 21.1455078125, 22.98974609375, 24.833984375, 26.67822265625, 28.5224609375, 30.36669921875, 32.2109375, 34.05517578125, 35.8994140625, 37.74365234375, 39.587890625, 41.43212890625, 43.2763671875, 45.12060546875, 46.96484375, 48.80908203125, 50.6533203125, 52.49755859375, 54.341796875, 56.18603515625, 58.0302734375, 59.87451171875, 61.71875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 30.0, 190.0, 546.0, 213.0, 27.0, 4.0, 2.0, 2.0], "bins": [-139.81094360351562, -137.4203338623047, -135.0297393798828, -132.63912963867188, -130.24853515625, -127.85792541503906, -125.46732330322266, -123.07672119140625, -120.68611907958984, -118.29551696777344, -115.90491485595703, -113.51431274414062, -111.12370300292969, -108.73310089111328, -106.34249877929688, -103.95189666748047, -101.56129455566406, -99.17069244384766, -96.78009033203125, -94.38948822021484, -91.99888610839844, -89.6082763671875, -87.2176742553711, -84.82707214355469, -82.43647003173828, -80.04586791992188, -77.65526580810547, -75.26466369628906, -72.87405395507812, -70.48345184326172, -68.09284973144531, -65.7022476196289, -63.311649322509766, -60.92104721069336, -58.53044128417969, -56.13983917236328, -53.749237060546875, -51.35863494873047, -48.96803283691406, -46.57742691040039, -44.186824798583984, -41.79622268676758, -39.405616760253906, -37.0150146484375, -34.624412536621094, -32.23381042480469, -29.84320640563965, -27.45260238647461, -25.062000274658203, -22.671398162841797, -20.280794143676758, -17.89019012451172, -15.499588012695312, -13.10898494720459, -10.718381881713867, -8.327777862548828, -5.937176704406738, -3.5465736389160156, -1.155970573425293, 1.2346324920654297, 3.6252355575561523, 6.015838623046875, 8.406441688537598, 10.797045707702637, 13.187647819519043]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 5.0, 6.0, 15.0, 10.0, 13.0, 16.0, 23.0, 23.0, 23.0, 23.0, 42.0, 24.0, 33.0, 41.0, 33.0, 38.0, 62.0, 45.0, 50.0, 51.0, 38.0, 34.0, 46.0, 28.0, 34.0, 35.0, 27.0, 23.0, 22.0, 23.0, 22.0, 13.0, 15.0, 11.0, 12.0, 11.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.942039489746094, -38.56901168823242, -37.19598388671875, -35.822959899902344, -34.44993209838867, -33.076904296875, -31.70387840270996, -30.330852508544922, -28.95782470703125, -27.584796905517578, -26.21177101135254, -24.8387451171875, -23.465717315673828, -22.092689514160156, -20.719663619995117, -19.346637725830078, -17.973609924316406, -16.600582122802734, -15.227556228637695, -13.85452938079834, -12.481502532958984, -11.108475685119629, -9.735448837280273, -8.362421989440918, -6.9893951416015625, -5.616368293762207, -4.243341445922852, -2.870314598083496, -1.4972877502441406, -0.12426090240478516, 1.2487659454345703, 2.621792793273926, 3.9948158264160156, 5.367842674255371, 6.740869522094727, 8.113896369934082, 9.486923217773438, 10.859950065612793, 12.232976913452148, 13.606003761291504, 14.97903060913086, 16.35205841064453, 17.72508430480957, 19.09811019897461, 20.47113800048828, 21.844165802001953, 23.217191696166992, 24.59021759033203, 25.963245391845703, 27.336273193359375, 28.709299087524414, 30.082324981689453, 31.455352783203125, 32.8283805847168, 34.20140838623047, 35.574432373046875, 36.94746017456055, 38.32048797607422, 39.693511962890625, 41.0665397644043, 42.43956756591797, 43.81259536743164, 45.18562316894531, 46.55864715576172, 47.93167495727539]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 3.0, 15.0, 15.0, 8.0, 16.0, 19.0, 24.0, 19.0, 27.0, 19.0, 29.0, 39.0, 42.0, 34.0, 38.0, 44.0, 41.0, 43.0, 45.0, 46.0, 41.0, 41.0, 48.0, 32.0, 30.0, 34.0, 31.0, 28.0, 19.0, 21.0, 20.0, 14.0, 15.0, 12.0, 2.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.734375, -7.46875, -7.203125, -6.9375, -6.671875, -6.40625, -6.140625, -5.875, -5.609375, -5.34375, -5.078125, -4.8125, -4.546875, -4.28125, -4.015625, -3.75, -3.484375, -3.21875, -2.953125, -2.6875, -2.421875, -2.15625, -1.890625, -1.625, -1.359375, -1.09375, -0.828125, -0.5625, -0.296875, -0.03125, 0.234375, 0.5, 0.765625, 1.03125, 1.296875, 1.5625, 1.828125, 2.09375, 2.359375, 2.625, 2.890625, 3.15625, 3.421875, 3.6875, 3.953125, 4.21875, 4.484375, 4.75, 5.015625, 5.28125, 5.546875, 5.8125, 6.078125, 6.34375, 6.609375, 6.875, 7.140625, 7.40625, 7.671875, 7.9375, 8.203125, 8.46875, 8.734375, 9.0]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 6.0, 11.0, 14.0, 14.0, 21.0, 31.0, 22.0, 41.0, 45.0, 61.0, 58.0, 96.0, 107.0, 146.0, 185.0, 235.0, 351.0, 530.0, 919.0, 2252.0, 14219.0, 2560446.0, 1599058.0, 10708.0, 1919.0, 849.0, 537.0, 338.0, 272.0, 169.0, 120.0, 96.0, 82.0, 57.0, 55.0, 43.0, 37.0, 22.0, 27.0, 21.0, 16.0, 16.0, 11.0, 6.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.3125, -44.765625, -43.21875, -41.671875, -40.125, -38.578125, -37.03125, -35.484375, -33.9375, -32.390625, -30.84375, -29.296875, -27.75, -26.203125, -24.65625, -23.109375, -21.5625, -20.015625, -18.46875, -16.921875, -15.375, -13.828125, -12.28125, -10.734375, -9.1875, -7.640625, -6.09375, -4.546875, -3.0, -1.453125, 0.09375, 1.640625, 3.1875, 4.734375, 6.28125, 7.828125, 9.375, 10.921875, 12.46875, 14.015625, 15.5625, 17.109375, 18.65625, 20.203125, 21.75, 23.296875, 24.84375, 26.390625, 27.9375, 29.484375, 31.03125, 32.578125, 34.125, 35.671875, 37.21875, 38.765625, 40.3125, 41.859375, 43.40625, 44.953125, 46.5, 48.046875, 49.59375, 51.140625, 52.6875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 7.0, 1.0, 10.0, 9.0, 23.0, 60.0, 82.0, 177.0, 335.0, 665.0, 1044.0, 776.0, 447.0, 196.0, 106.0, 67.0, 25.0, 22.0, 7.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.71875, -31.9862060546875, -31.253662109375, -30.5211181640625, -29.78857421875, -29.0560302734375, -28.323486328125, -27.5909423828125, -26.8583984375, -26.1258544921875, -25.393310546875, -24.6607666015625, -23.92822265625, -23.1956787109375, -22.463134765625, -21.7305908203125, -20.998046875, -20.2655029296875, -19.532958984375, -18.8004150390625, -18.06787109375, -17.3353271484375, -16.602783203125, -15.8702392578125, -15.1376953125, -14.4051513671875, -13.672607421875, -12.9400634765625, -12.20751953125, -11.4749755859375, -10.742431640625, -10.0098876953125, -9.27734375, -8.5447998046875, -7.812255859375, -7.0797119140625, -6.34716796875, -5.6146240234375, -4.882080078125, -4.1495361328125, -3.4169921875, -2.6844482421875, -1.951904296875, -1.2193603515625, -0.48681640625, 0.2457275390625, 0.978271484375, 1.7108154296875, 2.443359375, 3.1759033203125, 3.908447265625, 4.6409912109375, 5.37353515625, 6.1060791015625, 6.838623046875, 7.5711669921875, 8.3037109375, 9.0362548828125, 9.768798828125, 10.5013427734375, 11.23388671875, 11.9664306640625, 12.698974609375, 13.4315185546875, 14.1640625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 10.0, 17.0, 39.0, 88.0, 166.0, 498.0, 2369.0, 40642.0, 3957252.0, 187404.0, 4612.0, 752.0, 219.0, 101.0, 46.0, 25.0, 12.0, 7.0, 8.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.34375, -43.10009765625, -41.8564453125, -40.61279296875, -39.369140625, -38.12548828125, -36.8818359375, -35.63818359375, -34.39453125, -33.15087890625, -31.9072265625, -30.66357421875, -29.419921875, -28.17626953125, -26.9326171875, -25.68896484375, -24.4453125, -23.20166015625, -21.9580078125, -20.71435546875, -19.470703125, -18.22705078125, -16.9833984375, -15.73974609375, -14.49609375, -13.25244140625, -12.0087890625, -10.76513671875, -9.521484375, -8.27783203125, -7.0341796875, -5.79052734375, -4.546875, -3.30322265625, -2.0595703125, -0.81591796875, 0.427734375, 1.67138671875, 2.9150390625, 4.15869140625, 5.40234375, 6.64599609375, 7.8896484375, 9.13330078125, 10.376953125, 11.62060546875, 12.8642578125, 14.10791015625, 15.3515625, 16.59521484375, 17.8388671875, 19.08251953125, 20.326171875, 21.56982421875, 22.8134765625, 24.05712890625, 25.30078125, 26.54443359375, 27.7880859375, 29.03173828125, 30.275390625, 31.51904296875, 32.7626953125, 34.00634765625, 35.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 11.0, 20.0, 53.0, 61.0, 106.0, 147.0, 176.0, 153.0, 100.0, 67.0, 46.0, 15.0, 14.0, 9.0, 10.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.93859100341797, -87.90706634521484, -83.87554931640625, -79.84402465820312, -75.8125, -71.78097534179688, -67.74945068359375, -63.717933654785156, -59.68640899658203, -55.654884338378906, -51.62336349487305, -47.59184265136719, -43.56031799316406, -39.52879333496094, -35.49727249145508, -31.465749740600586, -27.434226989746094, -23.4027042388916, -19.37118148803711, -15.339658737182617, -11.308135986328125, -7.276613235473633, -3.2450904846191406, 0.7864322662353516, 4.817955017089844, 8.849477767944336, 12.881000518798828, 16.91252326965332, 20.944046020507812, 24.975568771362305, 29.007091522216797, 33.038612365722656, 37.07014465332031, 41.10166931152344, 45.1331901550293, 49.164710998535156, 53.19623565673828, 57.227760314941406, 61.259281158447266, 65.29080200195312, 69.32232666015625, 73.35385131835938, 77.3853759765625, 81.4168930053711, 85.44841766357422, 89.47994232177734, 93.51145935058594, 97.54298400878906, 101.57450866699219, 105.60603332519531, 109.63755798339844, 113.66907501220703, 117.70059967041016, 121.73212432861328, 125.76364135742188, 129.795166015625, 133.82669067382812, 137.85821533203125, 141.88973999023438, 145.9212646484375, 149.95278930664062, 153.9842987060547, 158.0158233642578, 162.04734802246094, 166.07887268066406]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 10.0, 15.0, 13.0, 13.0, 12.0, 21.0, 21.0, 20.0, 24.0, 27.0, 27.0, 31.0, 40.0, 34.0, 37.0, 45.0, 38.0, 30.0, 40.0, 43.0, 45.0, 36.0, 34.0, 39.0, 37.0, 42.0, 22.0, 25.0, 22.0, 24.0, 13.0, 16.0, 18.0, 17.0, 10.0, 6.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-47.35752487182617, -45.88702392578125, -44.416526794433594, -42.94602584838867, -41.47552490234375, -40.005027770996094, -38.53452682495117, -37.06402587890625, -35.593528747558594, -34.12302780151367, -32.652530670166016, -31.182029724121094, -29.711528778076172, -28.241029739379883, -26.770530700683594, -25.300029754638672, -23.82952880859375, -22.35902976989746, -20.88852882385254, -19.41802978515625, -17.947528839111328, -16.47702980041504, -15.00653076171875, -13.536030769348145, -12.065530776977539, -10.595030784606934, -9.124530792236328, -7.654031753540039, -6.183531761169434, -4.713031768798828, -3.242532730102539, -1.7720327377319336, -0.3015327453613281, 1.1689670085906982, 2.6394667625427246, 4.109966278076172, 5.580466270446777, 7.050966262817383, 8.521465301513672, 9.991965293884277, 11.462465286254883, 12.932965278625488, 14.403465270996094, 15.873964309692383, 17.344463348388672, 18.814964294433594, 20.285463333129883, 21.755962371826172, 23.226463317871094, 24.696962356567383, 26.167463302612305, 27.637962341308594, 29.108463287353516, 30.578962326049805, 32.049461364746094, 33.519962310791016, 34.99046325683594, 36.46096420288086, 37.931461334228516, 39.40196228027344, 40.87246322631836, 42.34296417236328, 43.81346130371094, 45.28396224975586, 46.754459381103516]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 4.0, 11.0, 9.0, 10.0, 14.0, 11.0, 21.0, 14.0, 20.0, 27.0, 29.0, 31.0, 38.0, 40.0, 25.0, 36.0, 51.0, 37.0, 38.0, 32.0, 35.0, 32.0, 44.0, 43.0, 35.0, 39.0, 39.0, 29.0, 26.0, 33.0, 15.0, 20.0, 9.0, 12.0, 13.0, 15.0, 12.0, 11.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-79.5, -77.1416015625, -74.783203125, -72.4248046875, -70.06640625, -67.7080078125, -65.349609375, -62.9912109375, -60.6328125, -58.2744140625, -55.916015625, -53.5576171875, -51.19921875, -48.8408203125, -46.482421875, -44.1240234375, -41.765625, -39.4072265625, -37.048828125, -34.6904296875, -32.33203125, -29.9736328125, -27.615234375, -25.2568359375, -22.8984375, -20.5400390625, -18.181640625, -15.8232421875, -13.46484375, -11.1064453125, -8.748046875, -6.3896484375, -4.03125, -1.6728515625, 0.685546875, 3.0439453125, 5.40234375, 7.7607421875, 10.119140625, 12.4775390625, 14.8359375, 17.1943359375, 19.552734375, 21.9111328125, 24.26953125, 26.6279296875, 28.986328125, 31.3447265625, 33.703125, 36.0615234375, 38.419921875, 40.7783203125, 43.13671875, 45.4951171875, 47.853515625, 50.2119140625, 52.5703125, 54.9287109375, 57.287109375, 59.6455078125, 62.00390625, 64.3623046875, 66.720703125, 69.0791015625, 71.4375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 7.0, 21.0, 19.0, 44.0, 47.0, 70.0, 112.0, 183.0, 242.0, 383.0, 551.0, 867.0, 1249.0, 1906.0, 2917.0, 4340.0, 6621.0, 10143.0, 15386.0, 23959.0, 36782.0, 56963.0, 87866.0, 139854.0, 200189.0, 163877.0, 103810.0, 66568.0, 42748.0, 27966.0, 18168.0, 11796.0, 7666.0, 5103.0, 3446.0, 2249.0, 1452.0, 998.0, 674.0, 407.0, 302.0, 203.0, 123.0, 90.0, 51.0, 46.0, 28.0, 16.0, 16.0, 5.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.3046875, -9.010986328125, -8.71728515625, -8.423583984375, -8.1298828125, -7.836181640625, -7.54248046875, -7.248779296875, -6.955078125, -6.661376953125, -6.36767578125, -6.073974609375, -5.7802734375, -5.486572265625, -5.19287109375, -4.899169921875, -4.60546875, -4.311767578125, -4.01806640625, -3.724365234375, -3.4306640625, -3.136962890625, -2.84326171875, -2.549560546875, -2.255859375, -1.962158203125, -1.66845703125, -1.374755859375, -1.0810546875, -0.787353515625, -0.49365234375, -0.199951171875, 0.09375, 0.387451171875, 0.68115234375, 0.974853515625, 1.2685546875, 1.562255859375, 1.85595703125, 2.149658203125, 2.443359375, 2.737060546875, 3.03076171875, 3.324462890625, 3.6181640625, 3.911865234375, 4.20556640625, 4.499267578125, 4.79296875, 5.086669921875, 5.38037109375, 5.674072265625, 5.9677734375, 6.261474609375, 6.55517578125, 6.848876953125, 7.142578125, 7.436279296875, 7.72998046875, 8.023681640625, 8.3173828125, 8.611083984375, 8.90478515625, 9.198486328125, 9.4921875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 6.0, 20.0, 15.0, 14.0, 14.0, 38.0, 28.0, 23.0, 27.0, 45.0, 43.0, 45.0, 34.0, 39.0, 36.0, 1072.0, 31.0, 47.0, 39.0, 40.0, 40.0, 35.0, 45.0, 40.0, 32.0, 34.0, 26.0, 18.0, 22.0, 17.0, 8.0, 13.0, 4.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.4375, -50.68896484375, -48.9404296875, -47.19189453125, -45.443359375, -43.69482421875, -41.9462890625, -40.19775390625, -38.44921875, -36.70068359375, -34.9521484375, -33.20361328125, -31.455078125, -29.70654296875, -27.9580078125, -26.20947265625, -24.4609375, -22.71240234375, -20.9638671875, -19.21533203125, -17.466796875, -15.71826171875, -13.9697265625, -12.22119140625, -10.47265625, -8.72412109375, -6.9755859375, -5.22705078125, -3.478515625, -1.72998046875, 0.0185546875, 1.76708984375, 3.515625, 5.26416015625, 7.0126953125, 8.76123046875, 10.509765625, 12.25830078125, 14.0068359375, 15.75537109375, 17.50390625, 19.25244140625, 21.0009765625, 22.74951171875, 24.498046875, 26.24658203125, 27.9951171875, 29.74365234375, 31.4921875, 33.24072265625, 34.9892578125, 36.73779296875, 38.486328125, 40.23486328125, 41.9833984375, 43.73193359375, 45.48046875, 47.22900390625, 48.9775390625, 50.72607421875, 52.474609375, 54.22314453125, 55.9716796875, 57.72021484375, 59.46875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 14.0, 13.0, 19.0, 25.0, 27.0, 48.0, 69.0, 114.0, 182.0, 274.0, 449.0, 606.0, 936.0, 1419.0, 2306.0, 3686.0, 5574.0, 8727.0, 13899.0, 21832.0, 34849.0, 55328.0, 87384.0, 137702.0, 1249852.0, 171688.0, 110311.0, 69297.0, 44518.0, 27784.0, 17545.0, 10943.0, 7030.0, 4538.0, 2911.0, 1827.0, 1193.0, 776.0, 471.0, 328.0, 213.0, 154.0, 102.0, 53.0, 44.0, 26.0, 19.0, 12.0, 11.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.34375, -9.0399169921875, -8.736083984375, -8.4322509765625, -8.12841796875, -7.8245849609375, -7.520751953125, -7.2169189453125, -6.9130859375, -6.6092529296875, -6.305419921875, -6.0015869140625, -5.69775390625, -5.3939208984375, -5.090087890625, -4.7862548828125, -4.482421875, -4.1785888671875, -3.874755859375, -3.5709228515625, -3.26708984375, -2.9632568359375, -2.659423828125, -2.3555908203125, -2.0517578125, -1.7479248046875, -1.444091796875, -1.1402587890625, -0.83642578125, -0.5325927734375, -0.228759765625, 0.0750732421875, 0.37890625, 0.6827392578125, 0.986572265625, 1.2904052734375, 1.59423828125, 1.8980712890625, 2.201904296875, 2.5057373046875, 2.8095703125, 3.1134033203125, 3.417236328125, 3.7210693359375, 4.02490234375, 4.3287353515625, 4.632568359375, 4.9364013671875, 5.240234375, 5.5440673828125, 5.847900390625, 6.1517333984375, 6.45556640625, 6.7593994140625, 7.063232421875, 7.3670654296875, 7.6708984375, 7.9747314453125, 8.278564453125, 8.5823974609375, 8.88623046875, 9.1900634765625, 9.493896484375, 9.7977294921875, 10.1015625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 12.0, 9.0, 12.0, 20.0, 33.0, 31.0, 30.0, 47.0, 50.0, 56.0, 61.0, 48.0, 54.0, 62.0, 51.0, 46.0, 38.0, 45.0, 45.0, 46.0, 37.0, 23.0, 27.0, 22.0, 14.0, 15.0, 10.0, 10.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.022674560546875, -0.02207040786743164, -0.02146625518798828, -0.020862102508544922, -0.020257949829101562, -0.019653797149658203, -0.019049644470214844, -0.018445491790771484, -0.017841339111328125, -0.017237186431884766, -0.016633033752441406, -0.016028881072998047, -0.015424728393554688, -0.014820575714111328, -0.014216423034667969, -0.01361227035522461, -0.01300811767578125, -0.01240396499633789, -0.011799812316894531, -0.011195659637451172, -0.010591506958007812, -0.009987354278564453, -0.009383201599121094, -0.008779048919677734, -0.008174896240234375, -0.007570743560791016, -0.006966590881347656, -0.006362438201904297, -0.0057582855224609375, -0.005154132843017578, -0.004549980163574219, -0.003945827484130859, -0.0033416748046875, -0.0027375221252441406, -0.0021333694458007812, -0.0015292167663574219, -0.0009250640869140625, -0.0003209114074707031, 0.00028324127197265625, 0.0008873939514160156, 0.001491546630859375, 0.0020956993103027344, 0.0026998519897460938, 0.003304004669189453, 0.0039081573486328125, 0.004512310028076172, 0.005116462707519531, 0.005720615386962891, 0.00632476806640625, 0.006928920745849609, 0.007533073425292969, 0.008137226104736328, 0.008741378784179688, 0.009345531463623047, 0.009949684143066406, 0.010553836822509766, 0.011157989501953125, 0.011762142181396484, 0.012366294860839844, 0.012970447540283203, 0.013574600219726562, 0.014178752899169922, 0.014782905578613281, 0.01538705825805664, 0.0159912109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 8.0, 9.0, 16.0, 22.0, 24.0, 55.0, 53.0, 76.0, 104.0, 156.0, 201.0, 305.0, 510.0, 1010.0, 2402.0, 8767.0, 47716.0, 351413.0, 530325.0, 84954.0, 13915.0, 3418.0, 1269.0, 649.0, 385.0, 243.0, 154.0, 116.0, 66.0, 68.0, 32.0, 27.0, 20.0, 12.0, 19.0, 12.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.156005859375, -0.15099716186523438, -0.14598846435546875, -0.14097976684570312, -0.1359710693359375, -0.13096237182617188, -0.12595367431640625, -0.12094497680664062, -0.115936279296875, -0.11092758178710938, -0.10591888427734375, -0.10091018676757812, -0.0959014892578125, -0.09089279174804688, -0.08588409423828125, -0.08087539672851562, -0.07586669921875, -0.07085800170898438, -0.06584930419921875, -0.060840606689453125, -0.0558319091796875, -0.050823211669921875, -0.04581451416015625, -0.040805816650390625, -0.035797119140625, -0.030788421630859375, -0.02577972412109375, -0.020771026611328125, -0.0157623291015625, -0.010753631591796875, -0.00574493408203125, -0.000736236572265625, 0.0042724609375, 0.009281158447265625, 0.01428985595703125, 0.019298553466796875, 0.0243072509765625, 0.029315948486328125, 0.03432464599609375, 0.039333343505859375, 0.044342041015625, 0.049350738525390625, 0.05435943603515625, 0.059368133544921875, 0.0643768310546875, 0.06938552856445312, 0.07439422607421875, 0.07940292358398438, 0.08441162109375, 0.08942031860351562, 0.09442901611328125, 0.09943771362304688, 0.1044464111328125, 0.10945510864257812, 0.11446380615234375, 0.11947250366210938, 0.124481201171875, 0.12948989868164062, 0.13449859619140625, 0.13950729370117188, 0.1445159912109375, 0.14952468872070312, 0.15453338623046875, 0.15954208374023438, 0.16455078125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 9.0, 17.0, 30.0, 38.0, 55.0, 83.0, 113.0, 131.0, 128.0, 107.0, 86.0, 68.0, 45.0, 26.0, 18.0, 12.0, 8.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014692848548293114, -0.014030023477971554, -0.013367198407649994, -0.012704374268651009, -0.012041548267006874, -0.011378724128007889, -0.010715899057686329, -0.010053073987364769, -0.009390248917043209, -0.00872742384672165, -0.00806459877640009, -0.007401774171739817, -0.006738949101418257, -0.006076124031096697, -0.005413299426436424, -0.004750474356114864, -0.0040876492857933044, -0.0034248242154717445, -0.0027619993779808283, -0.002099174540489912, -0.0014363494701683521, -0.0007735243998467922, -0.00011069979518651962, 0.0005521252751350403, 0.0012149503454566002, 0.0018777752993628383, 0.0025406002532690763, 0.0032034250907599926, 0.0038662501610815525, 0.004529075231403112, 0.005191899836063385, 0.005854724906384945, 0.006517549976706505, 0.007180375047028065, 0.007843200117349625, 0.00850602425634861, 0.009168850257992744, 0.00983167439699173, 0.01049449946731329, 0.01115732453763485, 0.01182014960795641, 0.01248297467827797, 0.01314579974859953, 0.01380862481892109, 0.014471448957920074, 0.015134274959564209, 0.015797099098563194, 0.01645992323756218, 0.017122749239206314, 0.0177855733782053, 0.018448399379849434, 0.01911122351884842, 0.019774049520492554, 0.02043687365949154, 0.021099697798490524, 0.02176252380013466, 0.022425349801778793, 0.02308817394077778, 0.023750999942421913, 0.0244138240814209, 0.025076650083065033, 0.025739474222064018, 0.026402298361063004, 0.027065124362707138, 0.027727948501706123]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 11.0, 10.0, 15.0, 10.0, 23.0, 18.0, 23.0, 24.0, 29.0, 25.0, 31.0, 37.0, 37.0, 43.0, 29.0, 45.0, 41.0, 37.0, 38.0, 32.0, 36.0, 39.0, 28.0, 28.0, 25.0, 22.0, 29.0, 25.0, 22.0, 24.0, 25.0, 18.0, 10.0, 11.0, 15.0, 9.0, 7.0, 8.0, 6.0, 3.0, 9.0, 4.0, 10.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.008817911148071289, -0.008537821471691132, -0.008257731795310974, -0.007977642118930817, -0.007697552442550659, -0.007417462766170502, -0.007137373089790344, -0.006857283413410187, -0.006577193737030029, -0.006297104060649872, -0.006017014384269714, -0.005736924707889557, -0.005456835031509399, -0.005176745355129242, -0.0048966556787490845, -0.004616566002368927, -0.0043364763259887695, -0.004056386649608612, -0.0037762969732284546, -0.003496207296848297, -0.0032161176204681396, -0.002936027944087982, -0.0026559382677078247, -0.0023758485913276672, -0.0020957589149475098, -0.0018156692385673523, -0.0015355795621871948, -0.0012554898858070374, -0.0009754002094268799, -0.0006953105330467224, -0.00041522085666656494, -0.00013513118028640747, 0.00014495849609375, 0.00042504817247390747, 0.0007051378488540649, 0.0009852275252342224, 0.0012653172016143799, 0.0015454068779945374, 0.0018254965543746948, 0.0021055862307548523, 0.0023856759071350098, 0.0026657655835151672, 0.0029458552598953247, 0.003225944936275482, 0.0035060346126556396, 0.003786124289035797, 0.004066213965415955, 0.004346303641796112, 0.0046263933181762695, 0.004906482994556427, 0.0051865726709365845, 0.005466662347316742, 0.005746752023696899, 0.006026841700077057, 0.006306931376457214, 0.006587021052837372, 0.006867110729217529, 0.007147200405597687, 0.007427290081977844, 0.007707379758358002, 0.00798746943473816, 0.008267559111118317, 0.008547648787498474, 0.008827738463878632, 0.009107828140258789]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 4.0, 11.0, 9.0, 10.0, 14.0, 11.0, 21.0, 14.0, 20.0, 27.0, 29.0, 32.0, 37.0, 40.0, 24.0, 37.0, 50.0, 38.0, 39.0, 31.0, 35.0, 32.0, 44.0, 42.0, 36.0, 39.0, 39.0, 30.0, 25.0, 33.0, 15.0, 20.0, 9.0, 12.0, 13.0, 15.0, 12.0, 11.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-79.5, -77.1416015625, -74.783203125, -72.4248046875, -70.06640625, -67.7080078125, -65.349609375, -62.9912109375, -60.6328125, -58.2744140625, -55.916015625, -53.5576171875, -51.19921875, -48.8408203125, -46.482421875, -44.1240234375, -41.765625, -39.4072265625, -37.048828125, -34.6904296875, -32.33203125, -29.9736328125, -27.615234375, -25.2568359375, -22.8984375, -20.5400390625, -18.181640625, -15.8232421875, -13.46484375, -11.1064453125, -8.748046875, -6.3896484375, -4.03125, -1.6728515625, 0.685546875, 3.0439453125, 5.40234375, 7.7607421875, 10.119140625, 12.4775390625, 14.8359375, 17.1943359375, 19.552734375, 21.9111328125, 24.26953125, 26.6279296875, 28.986328125, 31.3447265625, 33.703125, 36.0615234375, 38.419921875, 40.7783203125, 43.13671875, 45.4951171875, 47.853515625, 50.2119140625, 52.5703125, 54.9287109375, 57.287109375, 59.6455078125, 62.00390625, 64.3623046875, 66.720703125, 69.0791015625, 71.4375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 13.0, 7.0, 12.0, 15.0, 16.0, 23.0, 38.0, 39.0, 67.0, 91.0, 132.0, 202.0, 324.0, 580.0, 1063.0, 1980.0, 3812.0, 8782.0, 25291.0, 110499.0, 571110.0, 253422.0, 45993.0, 13569.0, 5454.0, 2632.0, 1353.0, 803.0, 434.0, 255.0, 156.0, 114.0, 76.0, 54.0, 22.0, 25.0, 23.0, 21.0, 14.0, 7.0, 11.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-21.390625, -20.75634765625, -20.1220703125, -19.48779296875, -18.853515625, -18.21923828125, -17.5849609375, -16.95068359375, -16.31640625, -15.68212890625, -15.0478515625, -14.41357421875, -13.779296875, -13.14501953125, -12.5107421875, -11.87646484375, -11.2421875, -10.60791015625, -9.9736328125, -9.33935546875, -8.705078125, -8.07080078125, -7.4365234375, -6.80224609375, -6.16796875, -5.53369140625, -4.8994140625, -4.26513671875, -3.630859375, -2.99658203125, -2.3623046875, -1.72802734375, -1.09375, -0.45947265625, 0.1748046875, 0.80908203125, 1.443359375, 2.07763671875, 2.7119140625, 3.34619140625, 3.98046875, 4.61474609375, 5.2490234375, 5.88330078125, 6.517578125, 7.15185546875, 7.7861328125, 8.42041015625, 9.0546875, 9.68896484375, 10.3232421875, 10.95751953125, 11.591796875, 12.22607421875, 12.8603515625, 13.49462890625, 14.12890625, 14.76318359375, 15.3974609375, 16.03173828125, 16.666015625, 17.30029296875, 17.9345703125, 18.56884765625, 19.203125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 8.0, 9.0, 13.0, 18.0, 25.0, 37.0, 36.0, 49.0, 51.0, 80.0, 69.0, 99.0, 2124.0, 74.0, 74.0, 63.0, 47.0, 44.0, 34.0, 20.0, 26.0, 11.0, 12.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-213.125, -206.33984375, -199.5546875, -192.76953125, -185.984375, -179.19921875, -172.4140625, -165.62890625, -158.84375, -152.05859375, -145.2734375, -138.48828125, -131.703125, -124.91796875, -118.1328125, -111.34765625, -104.5625, -97.77734375, -90.9921875, -84.20703125, -77.421875, -70.63671875, -63.8515625, -57.06640625, -50.28125, -43.49609375, -36.7109375, -29.92578125, -23.140625, -16.35546875, -9.5703125, -2.78515625, 4.0, 10.78515625, 17.5703125, 24.35546875, 31.140625, 37.92578125, 44.7109375, 51.49609375, 58.28125, 65.06640625, 71.8515625, 78.63671875, 85.421875, 92.20703125, 98.9921875, 105.77734375, 112.5625, 119.34765625, 126.1328125, 132.91796875, 139.703125, 146.48828125, 153.2734375, 160.05859375, 166.84375, 173.62890625, 180.4140625, 187.19921875, 193.984375, 200.76953125, 207.5546875, 214.33984375, 221.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 10.0, 9.0, 14.0, 16.0, 23.0, 36.0, 59.0, 80.0, 120.0, 190.0, 318.0, 627.0, 1446.0, 4216.0, 43993.0, 2984604.0, 99964.0, 6366.0, 1825.0, 773.0, 365.0, 212.0, 135.0, 99.0, 50.0, 39.0, 24.0, 22.0, 17.0, 8.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.21875, -44.7568359375, -43.294921875, -41.8330078125, -40.37109375, -38.9091796875, -37.447265625, -35.9853515625, -34.5234375, -33.0615234375, -31.599609375, -30.1376953125, -28.67578125, -27.2138671875, -25.751953125, -24.2900390625, -22.828125, -21.3662109375, -19.904296875, -18.4423828125, -16.98046875, -15.5185546875, -14.056640625, -12.5947265625, -11.1328125, -9.6708984375, -8.208984375, -6.7470703125, -5.28515625, -3.8232421875, -2.361328125, -0.8994140625, 0.5625, 2.0244140625, 3.486328125, 4.9482421875, 6.41015625, 7.8720703125, 9.333984375, 10.7958984375, 12.2578125, 13.7197265625, 15.181640625, 16.6435546875, 18.10546875, 19.5673828125, 21.029296875, 22.4912109375, 23.953125, 25.4150390625, 26.876953125, 28.3388671875, 29.80078125, 31.2626953125, 32.724609375, 34.1865234375, 35.6484375, 37.1103515625, 38.572265625, 40.0341796875, 41.49609375, 42.9580078125, 44.419921875, 45.8818359375, 47.34375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 35.0, 179.0, 642.0, 111.0, 18.0, 8.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1493.390869140625, -1466.4288330078125, -1439.466796875, -1412.5047607421875, -1385.542724609375, -1358.580810546875, -1331.6187744140625, -1304.65673828125, -1277.6947021484375, -1250.732666015625, -1223.7706298828125, -1196.80859375, -1169.8466796875, -1142.8846435546875, -1115.922607421875, -1088.9605712890625, -1061.99853515625, -1035.0364990234375, -1008.074462890625, -981.1124877929688, -954.1504516601562, -927.1884155273438, -900.2264404296875, -873.264404296875, -846.3023681640625, -819.34033203125, -792.3782958984375, -765.4163208007812, -738.4542846679688, -711.4922485351562, -684.5302734375, -657.5682373046875, -630.6062622070312, -603.6442260742188, -576.6822509765625, -549.72021484375, -522.7581787109375, -495.796142578125, -468.8341369628906, -441.87213134765625, -414.91009521484375, -387.94805908203125, -360.9860534667969, -334.0240478515625, -307.06201171875, -280.0999755859375, -253.13796997070312, -226.1759490966797, -199.21392822265625, -172.2519073486328, -145.28988647460938, -118.32786560058594, -91.3658447265625, -64.40382385253906, -37.441802978515625, -10.479782104492188, 16.48223876953125, 43.44425964355469, 70.40628051757812, 97.36830139160156, 124.330322265625, 151.29234313964844, 178.25436401367188, 205.2163848876953, 232.17840576171875]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 12.0, 4.0, 10.0, 13.0, 22.0, 18.0, 18.0, 24.0, 19.0, 32.0, 43.0, 44.0, 42.0, 39.0, 52.0, 58.0, 46.0, 54.0, 53.0, 44.0, 44.0, 53.0, 44.0, 24.0, 37.0, 24.0, 21.0, 19.0, 11.0, 20.0, 10.0, 10.0, 6.0, 4.0, 1.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-214.85885620117188, -208.4850311279297, -202.11122131347656, -195.73739624023438, -189.3635711669922, -182.98974609375, -176.61593627929688, -170.2421112060547, -163.8682861328125, -157.4944610595703, -151.1206512451172, -144.746826171875, -138.3730010986328, -131.99917602539062, -125.6253662109375, -119.25154113769531, -112.87773132324219, -106.50391387939453, -100.13008880615234, -93.75627136230469, -87.3824462890625, -81.00862884521484, -74.63481140136719, -68.260986328125, -61.887168884277344, -55.51334762573242, -49.1395263671875, -42.765708923339844, -36.39188766479492, -30.01806640625, -23.644248962402344, -17.270427703857422, -10.8966064453125, -4.5227861404418945, 1.851034164428711, 8.224853515625, 14.598674774169922, 20.972496032714844, 27.3463134765625, 33.72013473510742, 40.093955993652344, 46.467777252197266, 52.84159851074219, 59.215415954589844, 65.5892333984375, 71.96305847167969, 78.33687591552734, 84.710693359375, 91.08451843261719, 97.45833587646484, 103.83216094970703, 110.20597839355469, 116.57980346679688, 122.95362091064453, 129.3274383544922, 135.70126342773438, 142.0750732421875, 148.4488983154297, 154.8227081298828, 161.196533203125, 167.5703582763672, 173.94418334960938, 180.3179931640625, 186.6918182373047, 193.06564331054688]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 7.0, 17.0, 17.0, 24.0, 25.0, 33.0, 24.0, 46.0, 70.0, 92.0, 120.0, 168.0, 217.0, 295.0, 417.0, 640.0, 793.0, 1382.0, 1040823.0, 868.0, 637.0, 521.0, 339.0, 222.0, 187.0, 118.0, 92.0, 76.0, 57.0, 42.0, 41.0, 30.0, 21.0, 12.0, 13.0, 22.0, 11.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.26725387573242, -44.62516784667969, -42.98308181762695, -41.34099578857422, -39.69891357421875, -38.05682373046875, -36.41474151611328, -34.77265548706055, -33.13056945800781, -31.488483428955078, -29.846397399902344, -28.204313278198242, -26.562227249145508, -24.920141220092773, -23.278057098388672, -21.635971069335938, -19.993885040283203, -18.35179901123047, -16.709712982177734, -15.067628860473633, -13.425542831420898, -11.783456802368164, -10.141371726989746, -8.499286651611328, -6.857200622558594, -5.215115070343018, -3.5730295181274414, -1.9309439659118652, -0.28885841369628906, 1.3532276153564453, 2.9953126907348633, 4.637397766113281, 6.27947998046875, 7.921565532684326, 9.563651084899902, 11.20573616027832, 12.847822189331055, 14.489908218383789, 16.13199234008789, 17.774078369140625, 19.41616439819336, 21.058250427246094, 22.700336456298828, 24.34242057800293, 25.984506607055664, 27.6265926361084, 29.2686767578125, 30.910762786865234, 32.55284881591797, 34.1949348449707, 35.83702087402344, 37.47910690307617, 39.121192932128906, 40.763275146484375, 42.40536117553711, 44.047447204589844, 45.68953323364258, 47.33161926269531, 48.97370529174805, 50.61579132080078, 52.25787353515625, 53.89996337890625, 55.54204559326172, 57.18413162231445, 58.82621765136719]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 12.0, 12.0, 10.0, 11.0, 31.0, 149.0, 51462728.0, 114.0, 36.0, 12.0, 5.0, 5.0, 4.0, 4.0, 6.0, 3.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8412.0771484375, -8002.13037109375, -7592.18359375, -7182.2373046875, -6772.2900390625, -6362.34375, -5952.39697265625, -5542.4501953125, -5132.50341796875, -4722.556640625, -4312.60986328125, -3902.663330078125, -3492.716552734375, -3082.769775390625, -2672.8232421875, -2262.87646484375, -1852.9296875, -1442.98291015625, -1033.0362548828125, -623.089599609375, -213.142822265625, 196.803955078125, 606.75048828125, 1016.697265625, 1426.64404296875, 1836.5908203125, 2246.53759765625, 2656.484130859375, 3066.430908203125, 3476.377685546875, 3886.32421875, 4296.27099609375, 4706.216796875, 5116.16357421875, 5526.1103515625, 5936.056640625, 6346.00390625, 6755.9501953125, 7165.89697265625, 7575.84375, 7985.79052734375, 8395.7373046875, 8805.68359375, 9215.630859375, 9625.5771484375, 10035.5244140625, 10445.470703125, 10855.41796875, 11265.3642578125, 11675.310546875, 12085.2578125, 12495.2041015625, 12905.1513671875, 13315.09765625, 13725.044921875, 14134.9912109375, 14544.9375, 14954.8837890625, 15364.8310546875, 15774.77734375, 16184.724609375, 16594.671875, 17004.6171875, 17414.564453125, 17824.51171875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 7.0, 6.0, 18.0, 19.0, 27.0, 25.0, 54.0, 90.0, 114.0, 154.0, 237.0, 296.0, 427.0, 577.0, 944.0, 1491.0, 2099.0, 3120.0, 4744.0, 7354.0, 11174.0, 17590.0, 27807.0, 42489.0, 65475.0, 100597.0, 161749.0, 266913.0, 501835.0, 3710630.0, 589430.0, 292243.0, 175108.0, 109623.0, 69264.0, 44425.0, 28995.0, 18415.0, 12532.0, 7869.0, 5245.0, 3554.0, 2236.0, 1518.0, 987.0, 600.0, 470.0, 281.0, 176.0, 114.0, 87.0, 70.0, 49.0, 29.0, 28.0, 12.0, 7.0, 6.0, 5.0, 6.0, 2.0, 6.0], "bins": [-4.98046875, -4.82275390625, -4.6650390625, -4.50732421875, -4.349609375, -4.19189453125, -4.0341796875, -3.87646484375, -3.71875, -3.56103515625, -3.4033203125, -3.24560546875, -3.087890625, -2.93017578125, -2.7724609375, -2.61474609375, -2.45703125, -2.29931640625, -2.1416015625, -1.98388671875, -1.826171875, -1.66845703125, -1.5107421875, -1.35302734375, -1.1953125, -1.03759765625, -0.8798828125, -0.72216796875, -0.564453125, -0.40673828125, -0.2490234375, -0.09130859375, 0.06640625, 0.22412109375, 0.3818359375, 0.53955078125, 0.697265625, 0.85498046875, 1.0126953125, 1.17041015625, 1.328125, 1.48583984375, 1.6435546875, 1.80126953125, 1.958984375, 2.11669921875, 2.2744140625, 2.43212890625, 2.58984375, 2.74755859375, 2.9052734375, 3.06298828125, 3.220703125, 3.37841796875, 3.5361328125, 3.69384765625, 3.8515625, 4.00927734375, 4.1669921875, 4.32470703125, 4.482421875, 4.64013671875, 4.7978515625, 4.95556640625, 5.11328125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 6.0, 7.0, 8.0, 13.0, 9.0, 16.0, 10.0, 15.0, 18.0, 17.0, 22.0, 23.0, 28.0, 26.0, 20.0, 33.0, 39.0, 53.0, 47.0, 74.0, 342.0, 640.0, 120.0, 41.0, 29.0, 36.0, 47.0, 32.0, 46.0, 32.0, 25.0, 20.0, 26.0, 16.0, 15.0, 14.0, 16.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.500244140625, -15.95361328125, -15.406982421875, -14.8603515625, -14.313720703125, -13.76708984375, -13.220458984375, -12.673828125, -12.127197265625, -11.58056640625, -11.033935546875, -10.4873046875, -9.940673828125, -9.39404296875, -8.847412109375, -8.30078125, -7.754150390625, -7.20751953125, -6.660888671875, -6.1142578125, -5.567626953125, -5.02099609375, -4.474365234375, -3.927734375, -3.381103515625, -2.83447265625, -2.287841796875, -1.7412109375, -1.194580078125, -0.64794921875, -0.101318359375, 0.4453125, 0.991943359375, 1.53857421875, 2.085205078125, 2.6318359375, 3.178466796875, 3.72509765625, 4.271728515625, 4.818359375, 5.364990234375, 5.91162109375, 6.458251953125, 7.0048828125, 7.551513671875, 8.09814453125, 8.644775390625, 9.19140625, 9.738037109375, 10.28466796875, 10.831298828125, 11.3779296875, 11.924560546875, 12.47119140625, 13.017822265625, 13.564453125, 14.111083984375, 14.65771484375, 15.204345703125, 15.7509765625, 16.297607421875, 16.84423828125, 17.390869140625, 17.9375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 9.0, 17.0, 21.0, 21.0, 31.0, 37.0, 67.0, 118.0, 202.0, 307.0, 399.0, 527.0, 858.0, 1326.0, 2069.0, 2933.0, 4740.0, 7505.0, 11972.0, 19286.0, 33290.0, 58605.0, 107835.0, 215257.0, 488625.0, 3906621.0, 813894.0, 293322.0, 141828.0, 74140.0, 41390.0, 24292.0, 14582.0, 9115.0, 5665.0, 3522.0, 2427.0, 1550.0, 990.0, 642.0, 448.0, 309.0, 238.0, 167.0, 81.0, 53.0, 30.0, 17.0, 24.0, 13.0, 10.0, 17.0, 2.0, 0.0, 3.0], "bins": [-7.75, -7.52667236328125, -7.3033447265625, -7.08001708984375, -6.856689453125, -6.63336181640625, -6.4100341796875, -6.18670654296875, -5.96337890625, -5.74005126953125, -5.5167236328125, -5.29339599609375, -5.070068359375, -4.84674072265625, -4.6234130859375, -4.40008544921875, -4.1767578125, -3.95343017578125, -3.7301025390625, -3.50677490234375, -3.283447265625, -3.06011962890625, -2.8367919921875, -2.61346435546875, -2.39013671875, -2.16680908203125, -1.9434814453125, -1.72015380859375, -1.496826171875, -1.27349853515625, -1.0501708984375, -0.82684326171875, -0.603515625, -0.38018798828125, -0.1568603515625, 0.06646728515625, 0.289794921875, 0.51312255859375, 0.7364501953125, 0.95977783203125, 1.18310546875, 1.40643310546875, 1.6297607421875, 1.85308837890625, 2.076416015625, 2.29974365234375, 2.5230712890625, 2.74639892578125, 2.9697265625, 3.19305419921875, 3.4163818359375, 3.63970947265625, 3.863037109375, 4.08636474609375, 4.3096923828125, 4.53302001953125, 4.75634765625, 4.97967529296875, 5.2030029296875, 5.42633056640625, 5.649658203125, 5.87298583984375, 6.0963134765625, 6.31964111328125, 6.54296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 3.0, 9.0, 9.0, 8.0, 12.0, 7.0, 13.0, 16.0, 14.0, 21.0, 20.0, 22.0, 25.0, 32.0, 38.0, 41.0, 50.0, 60.0, 126.0, 531.0, 391.0, 119.0, 54.0, 35.0, 38.0, 33.0, 42.0, 39.0, 40.0, 28.0, 27.0, 23.0, 20.0, 16.0, 15.0, 8.0, 7.0, 5.0, 4.0, 5.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.5546875, -11.192138671875, -10.82958984375, -10.467041015625, -10.1044921875, -9.741943359375, -9.37939453125, -9.016845703125, -8.654296875, -8.291748046875, -7.92919921875, -7.566650390625, -7.2041015625, -6.841552734375, -6.47900390625, -6.116455078125, -5.75390625, -5.391357421875, -5.02880859375, -4.666259765625, -4.3037109375, -3.941162109375, -3.57861328125, -3.216064453125, -2.853515625, -2.490966796875, -2.12841796875, -1.765869140625, -1.4033203125, -1.040771484375, -0.67822265625, -0.315673828125, 0.046875, 0.409423828125, 0.77197265625, 1.134521484375, 1.4970703125, 1.859619140625, 2.22216796875, 2.584716796875, 2.947265625, 3.309814453125, 3.67236328125, 4.034912109375, 4.3974609375, 4.760009765625, 5.12255859375, 5.485107421875, 5.84765625, 6.210205078125, 6.57275390625, 6.935302734375, 7.2978515625, 7.660400390625, 8.02294921875, 8.385498046875, 8.748046875, 9.110595703125, 9.47314453125, 9.835693359375, 10.1982421875, 10.560791015625, 10.92333984375, 11.285888671875, 11.6484375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 4.0, 0.0, 9.0, 16.0, 10.0, 10.0, 17.0, 33.0, 40.0, 31.0, 42.0, 67.0, 102.0, 145.0, 125.0, 216.0, 237.0, 307.0, 483.0, 613.0, 800.0, 1146.0, 1709.0, 2496.0, 4286.0, 7230.0, 14983.0, 35570.0, 123251.0, 5875749.0, 144795.0, 39224.0, 16203.0, 7901.0, 4494.0, 2732.0, 1709.0, 1230.0, 943.0, 611.0, 434.0, 337.0, 241.0, 220.0, 161.0, 103.0, 77.0, 82.0, 53.0, 32.0, 30.0, 14.0, 18.0, 22.0, 11.0, 10.0, 5.0, 12.0, 9.0, 8.0], "bins": [-19.125, -18.554931640625, -17.98486328125, -17.414794921875, -16.8447265625, -16.274658203125, -15.70458984375, -15.134521484375, -14.564453125, -13.994384765625, -13.42431640625, -12.854248046875, -12.2841796875, -11.714111328125, -11.14404296875, -10.573974609375, -10.00390625, -9.433837890625, -8.86376953125, -8.293701171875, -7.7236328125, -7.153564453125, -6.58349609375, -6.013427734375, -5.443359375, -4.873291015625, -4.30322265625, -3.733154296875, -3.1630859375, -2.593017578125, -2.02294921875, -1.452880859375, -0.8828125, -0.312744140625, 0.25732421875, 0.827392578125, 1.3974609375, 1.967529296875, 2.53759765625, 3.107666015625, 3.677734375, 4.247802734375, 4.81787109375, 5.387939453125, 5.9580078125, 6.528076171875, 7.09814453125, 7.668212890625, 8.23828125, 8.808349609375, 9.37841796875, 9.948486328125, 10.5185546875, 11.088623046875, 11.65869140625, 12.228759765625, 12.798828125, 13.368896484375, 13.93896484375, 14.509033203125, 15.0791015625, 15.649169921875, 16.21923828125, 16.789306640625, 17.359375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 11.0, 9.0, 7.0, 6.0, 13.0, 22.0, 15.0, 25.0, 17.0, 19.0, 27.0, 28.0, 28.0, 29.0, 45.0, 56.0, 62.0, 108.0, 248.0, 465.0, 209.0, 95.0, 72.0, 41.0, 36.0, 33.0, 48.0, 28.0, 27.0, 30.0, 26.0, 15.0, 21.0, 12.0, 15.0, 10.0, 12.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.69140625, -7.46063232421875, -7.2298583984375, -6.99908447265625, -6.768310546875, -6.53753662109375, -6.3067626953125, -6.07598876953125, -5.84521484375, -5.61444091796875, -5.3836669921875, -5.15289306640625, -4.922119140625, -4.69134521484375, -4.4605712890625, -4.22979736328125, -3.9990234375, -3.76824951171875, -3.5374755859375, -3.30670166015625, -3.075927734375, -2.84515380859375, -2.6143798828125, -2.38360595703125, -2.15283203125, -1.92205810546875, -1.6912841796875, -1.46051025390625, -1.229736328125, -0.99896240234375, -0.7681884765625, -0.53741455078125, -0.306640625, -0.07586669921875, 0.1549072265625, 0.38568115234375, 0.616455078125, 0.84722900390625, 1.0780029296875, 1.30877685546875, 1.53955078125, 1.77032470703125, 2.0010986328125, 2.23187255859375, 2.462646484375, 2.69342041015625, 2.9241943359375, 3.15496826171875, 3.3857421875, 3.61651611328125, 3.8472900390625, 4.07806396484375, 4.308837890625, 4.53961181640625, 4.7703857421875, 5.00115966796875, 5.23193359375, 5.46270751953125, 5.6934814453125, 5.92425537109375, 6.155029296875, 6.38580322265625, 6.6165771484375, 6.84735107421875, 7.078125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 10.0, 40.0, 63.0, 115.0, 223.0, 242.0, 121.0, 77.0, 27.0, 23.0, 15.0, 12.0, 9.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.559688568115234, -26.752370834350586, -25.945053100585938, -25.137737274169922, -24.330419540405273, -23.523101806640625, -22.715784072875977, -21.908466339111328, -21.10114860534668, -20.29383087158203, -19.486513137817383, -18.679195404052734, -17.87187957763672, -17.06456184387207, -16.257244110107422, -15.449926376342773, -14.642609596252441, -13.835291862487793, -13.027975082397461, -12.220657348632812, -11.413339614868164, -10.606021881103516, -9.798705101013184, -8.991387367248535, -8.184070587158203, -7.376753330230713, -6.5694355964660645, -5.762118339538574, -4.954800605773926, -4.1474833488464355, -3.3401660919189453, -2.532848358154297, -1.7255306243896484, -0.9182131886482239, -0.11089575290679932, 0.6964216232299805, 1.5037391185760498, 2.311056613922119, 3.1183738708496094, 3.925691604614258, 4.733008861541748, 5.540326118469238, 6.347643852233887, 7.154961109161377, 7.962278366088867, 8.769596099853516, 9.576913833618164, 10.384231567382812, 11.191548347473145, 11.998866081237793, 12.806182861328125, 13.613500595092773, 14.420818328857422, 15.22813606262207, 16.03545379638672, 16.842769622802734, 17.650087356567383, 18.45740509033203, 19.26472282409668, 20.072040557861328, 20.879356384277344, 21.686674118041992, 22.49399185180664, 23.30130958557129, 24.108627319335938]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 10.0, 9.0, 10.0, 20.0, 13.0, 17.0, 24.0, 18.0, 29.0, 24.0, 29.0, 30.0, 41.0, 37.0, 43.0, 49.0, 50.0, 31.0, 45.0, 50.0, 41.0, 28.0, 52.0, 39.0, 39.0, 32.0, 36.0, 24.0, 22.0, 20.0, 11.0, 8.0, 15.0, 8.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.969585418701172, -11.603760719299316, -11.237936973571777, -10.872112274169922, -10.506288528442383, -10.140463829040527, -9.774639129638672, -9.408815383911133, -9.042990684509277, -8.677165985107422, -8.311342239379883, -7.945517539978027, -7.57969331741333, -7.213869094848633, -6.8480448722839355, -6.482220649719238, -6.116396427154541, -5.750572204589844, -5.3847479820251465, -5.018923759460449, -4.653099060058594, -4.2872748374938965, -3.921450614929199, -3.555626153945923, -3.1898019313812256, -2.8239777088165283, -2.458153247833252, -2.0923290252685547, -1.7265046834945679, -1.360680341720581, -0.9948561191558838, -0.6290316581726074, -0.26320743560791016, 0.10261687636375427, 0.4684411883354187, 0.8342654705047607, 1.2000898122787476, 1.5659141540527344, 1.9317383766174316, 2.297562837600708, 2.6633870601654053, 3.0292112827301025, 3.395035743713379, 3.760859966278076, 4.126684188842773, 4.492508888244629, 4.858332633972168, 5.224157333374023, 5.589981555938721, 5.955805778503418, 6.321630001068115, 6.6874542236328125, 7.053278923034668, 7.419103145599365, 7.7849273681640625, 8.150752067565918, 8.516575813293457, 8.882400512695312, 9.248224258422852, 9.614048957824707, 9.979872703552246, 10.345697402954102, 10.71152114868164, 11.077345848083496, 11.443170547485352]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 10.0, 19.0, 15.0, 21.0, 38.0, 40.0, 52.0, 73.0, 94.0, 109.0, 146.0, 197.0, 258.0, 315.0, 465.0, 651.0, 985.0, 1494.0, 2396.0, 4032.0, 7534.0, 15390.0, 40752.0, 3577404.0, 473719.0, 36671.0, 13747.0, 6909.0, 3680.0, 2245.0, 1445.0, 1049.0, 650.0, 448.0, 369.0, 248.0, 165.0, 129.0, 87.0, 67.0, 45.0, 30.0, 20.0, 23.0, 6.0, 9.0, 9.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.341796875, -0.3320159912109375, -0.322235107421875, -0.3124542236328125, -0.30267333984375, -0.2928924560546875, -0.283111572265625, -0.2733306884765625, -0.2635498046875, -0.2537689208984375, -0.243988037109375, -0.2342071533203125, -0.22442626953125, -0.2146453857421875, -0.204864501953125, -0.1950836181640625, -0.185302734375, -0.1755218505859375, -0.165740966796875, -0.1559600830078125, -0.14617919921875, -0.1363983154296875, -0.126617431640625, -0.1168365478515625, -0.1070556640625, -0.0972747802734375, -0.087493896484375, -0.0777130126953125, -0.06793212890625, -0.0581512451171875, -0.048370361328125, -0.0385894775390625, -0.02880859375, -0.0190277099609375, -0.009246826171875, 0.0005340576171875, 0.01031494140625, 0.0200958251953125, 0.029876708984375, 0.0396575927734375, 0.0494384765625, 0.0592193603515625, 0.069000244140625, 0.0787811279296875, 0.08856201171875, 0.0983428955078125, 0.108123779296875, 0.1179046630859375, 0.127685546875, 0.1374664306640625, 0.147247314453125, 0.1570281982421875, 0.16680908203125, 0.1765899658203125, 0.186370849609375, 0.1961517333984375, 0.2059326171875, 0.2157135009765625, 0.225494384765625, 0.2352752685546875, 0.24505615234375, 0.2548370361328125, 0.264617919921875, 0.2743988037109375, 0.2841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 9.0, 8.0, 5.0, 16.0, 19.0, 23.0, 510.0, 282.0, 31.0, 20.0, 10.0, 12.0, 10.0, 5.0, 8.0, 1.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.038909912109375, -0.0377955436706543, -0.036681175231933594, -0.03556680679321289, -0.03445243835449219, -0.033338069915771484, -0.03222370147705078, -0.031109333038330078, -0.029994964599609375, -0.028880596160888672, -0.02776622772216797, -0.026651859283447266, -0.025537490844726562, -0.02442312240600586, -0.023308753967285156, -0.022194385528564453, -0.02108001708984375, -0.019965648651123047, -0.018851280212402344, -0.01773691177368164, -0.016622543334960938, -0.015508174896240234, -0.014393806457519531, -0.013279438018798828, -0.012165069580078125, -0.011050701141357422, -0.009936332702636719, -0.008821964263916016, -0.0077075958251953125, -0.006593227386474609, -0.005478858947753906, -0.004364490509033203, -0.0032501220703125, -0.002135753631591797, -0.0010213851928710938, 9.298324584960938e-05, 0.0012073516845703125, 0.0023217201232910156, 0.0034360885620117188, 0.004550457000732422, 0.005664825439453125, 0.006779193878173828, 0.007893562316894531, 0.009007930755615234, 0.010122299194335938, 0.01123666763305664, 0.012351036071777344, 0.013465404510498047, 0.01457977294921875, 0.015694141387939453, 0.016808509826660156, 0.01792287826538086, 0.019037246704101562, 0.020151615142822266, 0.02126598358154297, 0.022380352020263672, 0.023494720458984375, 0.024609088897705078, 0.02572345733642578, 0.026837825775146484, 0.027952194213867188, 0.02906656265258789, 0.030180931091308594, 0.0312952995300293, 0.03240966796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 8.0, 13.0, 14.0, 16.0, 21.0, 23.0, 27.0, 51.0, 62.0, 103.0, 139.0, 249.0, 460.0, 1074.0, 3074.0, 12072.0, 60596.0, 848251.0, 3146459.0, 96679.0, 17528.0, 4555.0, 1552.0, 539.0, 255.0, 141.0, 75.0, 65.0, 44.0, 41.0, 22.0, 23.0, 14.0, 10.0, 9.0, 6.0, 1.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.51904296875, -0.5046730041503906, -0.49030303955078125, -0.4759330749511719, -0.4615631103515625, -0.4471931457519531, -0.43282318115234375, -0.4184532165527344, -0.404083251953125, -0.3897132873535156, -0.37534332275390625, -0.3609733581542969, -0.3466033935546875, -0.3322334289550781, -0.31786346435546875, -0.3034934997558594, -0.28912353515625, -0.2747535705566406, -0.26038360595703125, -0.24601364135742188, -0.2316436767578125, -0.21727371215820312, -0.20290374755859375, -0.18853378295898438, -0.174163818359375, -0.15979385375976562, -0.14542388916015625, -0.13105392456054688, -0.1166839599609375, -0.10231399536132812, -0.08794403076171875, -0.07357406616210938, -0.0592041015625, -0.044834136962890625, -0.03046417236328125, -0.016094207763671875, -0.0017242431640625, 0.012645721435546875, 0.02701568603515625, 0.041385650634765625, 0.055755615234375, 0.07012557983398438, 0.08449554443359375, 0.09886550903320312, 0.1132354736328125, 0.12760543823242188, 0.14197540283203125, 0.15634536743164062, 0.17071533203125, 0.18508529663085938, 0.19945526123046875, 0.21382522583007812, 0.2281951904296875, 0.24256515502929688, 0.25693511962890625, 0.2713050842285156, 0.285675048828125, 0.3000450134277344, 0.31441497802734375, 0.3287849426269531, 0.3431549072265625, 0.3575248718261719, 0.37189483642578125, 0.3862648010253906, 0.400634765625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 9.0, 5.0, 11.0, 16.0, 14.0, 15.0, 22.0, 29.0, 44.0, 45.0, 73.0, 79.0, 94.0, 111.0, 184.0, 267.0, 573.0, 1177.0, 423.0, 213.0, 150.0, 97.0, 83.0, 76.0, 46.0, 52.0, 30.0, 27.0, 27.0, 17.0, 12.0, 16.0, 11.0, 4.0, 4.0, 5.0, 2.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.08258056640625, -0.0803070068359375, -0.078033447265625, -0.0757598876953125, -0.073486328125, -0.0712127685546875, -0.068939208984375, -0.0666656494140625, -0.06439208984375, -0.0621185302734375, -0.059844970703125, -0.0575714111328125, -0.0552978515625, -0.0530242919921875, -0.050750732421875, -0.0484771728515625, -0.04620361328125, -0.0439300537109375, -0.041656494140625, -0.0393829345703125, -0.037109375, -0.0348358154296875, -0.032562255859375, -0.0302886962890625, -0.02801513671875, -0.0257415771484375, -0.023468017578125, -0.0211944580078125, -0.0189208984375, -0.0166473388671875, -0.014373779296875, -0.0121002197265625, -0.00982666015625, -0.0075531005859375, -0.005279541015625, -0.0030059814453125, -0.000732421875, 0.0015411376953125, 0.003814697265625, 0.0060882568359375, 0.00836181640625, 0.0106353759765625, 0.012908935546875, 0.0151824951171875, 0.0174560546875, 0.0197296142578125, 0.022003173828125, 0.0242767333984375, 0.02655029296875, 0.0288238525390625, 0.031097412109375, 0.0333709716796875, 0.03564453125, 0.0379180908203125, 0.040191650390625, 0.0424652099609375, 0.04473876953125, 0.0470123291015625, 0.049285888671875, 0.0515594482421875, 0.0538330078125, 0.0561065673828125, 0.058380126953125, 0.0606536865234375, 0.06292724609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 5.0, 12.0, 9.0, 14.0, 26.0, 47.0, 116.0, 201.0, 259.0, 121.0, 78.0, 39.0, 25.0, 22.0, 8.0, 9.0, 4.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4893340766429901, -0.4651179313659668, -0.44090181589126587, -0.41668567061424255, -0.39246952533721924, -0.3682534098625183, -0.344037264585495, -0.3198211193084717, -0.29560500383377075, -0.27138885855674744, -0.2471727430820465, -0.2229565978050232, -0.19874046742916107, -0.17452433705329895, -0.15030819177627563, -0.1260920614004135, -0.10187593102455139, -0.07765980064868927, -0.05344366282224655, -0.029227524995803833, -0.005011394619941711, 0.01920473575592041, 0.043420881032943726, 0.06763701140880585, 0.09185314178466797, 0.11606927216053009, 0.1402854025363922, 0.16450154781341553, 0.18871767818927765, 0.21293380856513977, 0.23714995384216309, 0.261366069316864, 0.28558218479156494, 0.30979833006858826, 0.3340144455432892, 0.3582305908203125, 0.3824467062950134, 0.40666285157203674, 0.43087899684906006, 0.455095112323761, 0.4793112576007843, 0.5035274028778076, 0.5277435183525085, 0.5519596338272095, 0.5761758089065552, 0.6003919243812561, 0.624608039855957, 0.6488242149353027, 0.6730403304100037, 0.6972564458847046, 0.7214726209640503, 0.7456887364387512, 0.7699048519134521, 0.7941210269927979, 0.8183371424674988, 0.8425532579421997, 0.8667694330215454, 0.8909855484962463, 0.915201723575592, 0.939417839050293, 0.9636339545249939, 0.9878500699996948, 1.0120662450790405, 1.0362824201583862, 1.0604984760284424]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 3.0, 5.0, 3.0, 11.0, 7.0, 9.0, 20.0, 11.0, 26.0, 23.0, 30.0, 25.0, 33.0, 39.0, 31.0, 51.0, 44.0, 64.0, 45.0, 59.0, 49.0, 42.0, 29.0, 39.0, 39.0, 43.0, 41.0, 32.0, 25.0, 19.0, 17.0, 20.0, 16.0, 13.0, 9.0, 7.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31900107860565186, -0.3084261119365692, -0.2978511452674866, -0.2872762084007263, -0.2767012417316437, -0.26612627506256104, -0.2555513083934784, -0.24497634172439575, -0.2344013750553131, -0.22382640838623047, -0.21325145661830902, -0.20267648994922638, -0.19210152328014374, -0.1815265715122223, -0.17095160484313965, -0.160376638174057, -0.14980168640613556, -0.13922671973705292, -0.12865176796913147, -0.11807680130004883, -0.10750183463096619, -0.09692687541246414, -0.0863519161939621, -0.07577694952487946, -0.06520199030637741, -0.05462702736258507, -0.044052064418792725, -0.03347710520029068, -0.022902142256498337, -0.012327179312705994, -0.001752220094203949, 0.008822746574878693, 0.019397705793380737, 0.02997266873717308, 0.040547631680965424, 0.05112259089946747, 0.06169755384325981, 0.07227251678705215, 0.0828474760055542, 0.09342244267463684, 0.10399740189313889, 0.11457236111164093, 0.12514732778072357, 0.13572227954864502, 0.14629724621772766, 0.1568722128868103, 0.16744717955589294, 0.17802214622497559, 0.18859709799289703, 0.19917206466197968, 0.20974701642990112, 0.22032198309898376, 0.2308969497680664, 0.24147191643714905, 0.2520468831062317, 0.26262181997299194, 0.2731967866420746, 0.2837717533111572, 0.29434671998023987, 0.3049216866493225, 0.31549662351608276, 0.3260715901851654, 0.33664655685424805, 0.3472215235233307, 0.35779649019241333]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 7.0, 11.0, 12.0, 14.0, 24.0, 36.0, 36.0, 56.0, 90.0, 127.0, 230.0, 349.0, 608.0, 1076.0, 2081.0, 4363.0, 11942.0, 78115.0, 886422.0, 45485.0, 9622.0, 3598.0, 1736.0, 943.0, 561.0, 337.0, 212.0, 147.0, 100.0, 66.0, 44.0, 28.0, 16.0, 12.0, 11.0, 6.0, 9.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3244590759277344, -0.31444549560546875, -0.3044319152832031, -0.2944183349609375, -0.2844047546386719, -0.27439117431640625, -0.2643775939941406, -0.254364013671875, -0.24435043334960938, -0.23433685302734375, -0.22432327270507812, -0.2143096923828125, -0.20429611206054688, -0.19428253173828125, -0.18426895141601562, -0.17425537109375, -0.16424179077148438, -0.15422821044921875, -0.14421463012695312, -0.1342010498046875, -0.12418746948242188, -0.11417388916015625, -0.10416030883789062, -0.094146728515625, -0.08413314819335938, -0.07411956787109375, -0.06410598754882812, -0.0540924072265625, -0.044078826904296875, -0.03406524658203125, -0.024051666259765625, -0.0140380859375, -0.004024505615234375, 0.00598907470703125, 0.016002655029296875, 0.0260162353515625, 0.036029815673828125, 0.04604339599609375, 0.056056976318359375, 0.066070556640625, 0.07608413696289062, 0.08609771728515625, 0.09611129760742188, 0.1061248779296875, 0.11613845825195312, 0.12615203857421875, 0.13616561889648438, 0.14617919921875, 0.15619277954101562, 0.16620635986328125, 0.17621994018554688, 0.1862335205078125, 0.19624710083007812, 0.20626068115234375, 0.21627426147460938, 0.226287841796875, 0.23630142211914062, 0.24631500244140625, 0.2563285827636719, 0.2663421630859375, 0.2763557434082031, 0.28636932373046875, 0.2963829040527344, 0.306396484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 6.0, 7.0, 12.0, 30.0, 85.0, 161.0, 248.0, 195.0, 118.0, 40.0, 29.0, 11.0, 6.0, 4.0, 2.0, 7.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03973388671875, -0.038556575775146484, -0.03737926483154297, -0.03620195388793945, -0.03502464294433594, -0.03384733200073242, -0.032670021057128906, -0.03149271011352539, -0.030315399169921875, -0.02913808822631836, -0.027960777282714844, -0.026783466339111328, -0.025606155395507812, -0.024428844451904297, -0.02325153350830078, -0.022074222564697266, -0.02089691162109375, -0.019719600677490234, -0.01854228973388672, -0.017364978790283203, -0.016187667846679688, -0.015010356903076172, -0.013833045959472656, -0.01265573501586914, -0.011478424072265625, -0.01030111312866211, -0.009123802185058594, -0.007946491241455078, -0.0067691802978515625, -0.005591869354248047, -0.004414558410644531, -0.0032372474670410156, -0.0020599365234375, -0.0008826255798339844, 0.00029468536376953125, 0.0014719963073730469, 0.0026493072509765625, 0.003826618194580078, 0.005003929138183594, 0.006181240081787109, 0.007358551025390625, 0.00853586196899414, 0.009713172912597656, 0.010890483856201172, 0.012067794799804688, 0.013245105743408203, 0.014422416687011719, 0.015599727630615234, 0.01677703857421875, 0.017954349517822266, 0.01913166046142578, 0.020308971405029297, 0.021486282348632812, 0.022663593292236328, 0.023840904235839844, 0.02501821517944336, 0.026195526123046875, 0.02737283706665039, 0.028550148010253906, 0.029727458953857422, 0.030904769897460938, 0.03208208084106445, 0.03325939178466797, 0.034436702728271484, 0.035614013671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 6.0, 7.0, 7.0, 13.0, 22.0, 30.0, 42.0, 62.0, 118.0, 243.0, 576.0, 1697.0, 7804.0, 76880.0, 886664.0, 64739.0, 6912.0, 1586.0, 554.0, 237.0, 134.0, 73.0, 48.0, 26.0, 19.0, 12.0, 9.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67236328125, -0.6516571044921875, -0.630950927734375, -0.6102447509765625, -0.58953857421875, -0.5688323974609375, -0.548126220703125, -0.5274200439453125, -0.5067138671875, -0.4860076904296875, -0.465301513671875, -0.4445953369140625, -0.42388916015625, -0.4031829833984375, -0.382476806640625, -0.3617706298828125, -0.341064453125, -0.3203582763671875, -0.299652099609375, -0.2789459228515625, -0.25823974609375, -0.2375335693359375, -0.216827392578125, -0.1961212158203125, -0.1754150390625, -0.1547088623046875, -0.134002685546875, -0.1132965087890625, -0.09259033203125, -0.0718841552734375, -0.051177978515625, -0.0304718017578125, -0.009765625, 0.0109405517578125, 0.031646728515625, 0.0523529052734375, 0.07305908203125, 0.0937652587890625, 0.114471435546875, 0.1351776123046875, 0.1558837890625, 0.1765899658203125, 0.197296142578125, 0.2180023193359375, 0.23870849609375, 0.2594146728515625, 0.280120849609375, 0.3008270263671875, 0.321533203125, 0.3422393798828125, 0.362945556640625, 0.3836517333984375, 0.40435791015625, 0.4250640869140625, 0.445770263671875, 0.4664764404296875, 0.4871826171875, 0.5078887939453125, 0.528594970703125, 0.5493011474609375, 0.57000732421875, 0.5907135009765625, 0.611419677734375, 0.6321258544921875, 0.65283203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 7.0, 13.0, 12.0, 10.0, 7.0, 12.0, 28.0, 18.0, 27.0, 16.0, 38.0, 30.0, 50.0, 42.0, 51.0, 55.0, 51.0, 36.0, 46.0, 48.0, 47.0, 40.0, 43.0, 33.0, 35.0, 39.0, 29.0, 17.0, 21.0, 17.0, 15.0, 9.0, 11.0, 9.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.2054443359375, -0.20029354095458984, -0.1951427459716797, -0.18999195098876953, -0.18484115600585938, -0.17969036102294922, -0.17453956604003906, -0.1693887710571289, -0.16423797607421875, -0.1590871810913086, -0.15393638610839844, -0.14878559112548828, -0.14363479614257812, -0.13848400115966797, -0.1333332061767578, -0.12818241119384766, -0.1230316162109375, -0.11788082122802734, -0.11273002624511719, -0.10757923126220703, -0.10242843627929688, -0.09727764129638672, -0.09212684631347656, -0.0869760513305664, -0.08182525634765625, -0.0766744613647461, -0.07152366638183594, -0.06637287139892578, -0.061222076416015625, -0.05607128143310547, -0.05092048645019531, -0.045769691467285156, -0.040618896484375, -0.035468101501464844, -0.030317306518554688, -0.02516651153564453, -0.020015716552734375, -0.014864921569824219, -0.009714126586914062, -0.004563331604003906, 0.00058746337890625, 0.005738258361816406, 0.010889053344726562, 0.01603984832763672, 0.021190643310546875, 0.02634143829345703, 0.03149223327636719, 0.036643028259277344, 0.0417938232421875, 0.046944618225097656, 0.05209541320800781, 0.05724620819091797, 0.062397003173828125, 0.06754779815673828, 0.07269859313964844, 0.0778493881225586, 0.08300018310546875, 0.0881509780883789, 0.09330177307128906, 0.09845256805419922, 0.10360336303710938, 0.10875415802001953, 0.11390495300292969, 0.11905574798583984, 0.12420654296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 9.0, 13.0, 26.0, 23.0, 60.0, 128.0, 310.0, 1042.0, 11773.0, 1028123.0, 5763.0, 787.0, 257.0, 92.0, 48.0, 30.0, 24.0, 12.0, 4.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3623046875, -1.310699462890625, -1.25909423828125, -1.207489013671875, -1.1558837890625, -1.104278564453125, -1.05267333984375, -1.001068115234375, -0.949462890625, -0.897857666015625, -0.84625244140625, -0.794647216796875, -0.7430419921875, -0.691436767578125, -0.63983154296875, -0.588226318359375, -0.53662109375, -0.485015869140625, -0.43341064453125, -0.381805419921875, -0.3302001953125, -0.278594970703125, -0.22698974609375, -0.175384521484375, -0.123779296875, -0.072174072265625, -0.02056884765625, 0.031036376953125, 0.0826416015625, 0.134246826171875, 0.18585205078125, 0.237457275390625, 0.2890625, 0.340667724609375, 0.39227294921875, 0.443878173828125, 0.4954833984375, 0.547088623046875, 0.59869384765625, 0.650299072265625, 0.701904296875, 0.753509521484375, 0.80511474609375, 0.856719970703125, 0.9083251953125, 0.959930419921875, 1.01153564453125, 1.063140869140625, 1.11474609375, 1.166351318359375, 1.21795654296875, 1.269561767578125, 1.3211669921875, 1.372772216796875, 1.42437744140625, 1.475982666015625, 1.527587890625, 1.579193115234375, 1.63079833984375, 1.682403564453125, 1.7340087890625, 1.785614013671875, 1.83721923828125, 1.888824462890625, 1.9404296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 9.0, 7.0, 12.0, 18.0, 19.0, 15.0, 40.0, 43.0, 50.0, 76.0, 88.0, 101.0, 121.0, 79.0, 88.0, 53.0, 50.0, 43.0, 17.0, 18.0, 13.0, 5.0, 11.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.390146255493164e-05, -2.3270025849342346e-05, -2.2638589143753052e-05, -2.2007152438163757e-05, -2.1375715732574463e-05, -2.074427902698517e-05, -2.0112842321395874e-05, -1.948140561580658e-05, -1.8849968910217285e-05, -1.821853220462799e-05, -1.7587095499038696e-05, -1.6955658793449402e-05, -1.6324222087860107e-05, -1.5692785382270813e-05, -1.5061348676681519e-05, -1.4429911971092224e-05, -1.379847526550293e-05, -1.3167038559913635e-05, -1.253560185432434e-05, -1.1904165148735046e-05, -1.1272728443145752e-05, -1.0641291737556458e-05, -1.0009855031967163e-05, -9.378418326377869e-06, -8.746981620788574e-06, -8.11554491519928e-06, -7.484108209609985e-06, -6.852671504020691e-06, -6.2212347984313965e-06, -5.589798092842102e-06, -4.958361387252808e-06, -4.326924681663513e-06, -3.6954879760742188e-06, -3.0640512704849243e-06, -2.43261456489563e-06, -1.8011778593063354e-06, -1.169741153717041e-06, -5.383044481277466e-07, 9.313225746154785e-08, 7.245689630508423e-07, 1.3560056686401367e-06, 1.987442374229431e-06, 2.6188790798187256e-06, 3.25031578540802e-06, 3.8817524909973145e-06, 4.513189196586609e-06, 5.144625902175903e-06, 5.776062607765198e-06, 6.407499313354492e-06, 7.038936018943787e-06, 7.670372724533081e-06, 8.301809430122375e-06, 8.93324613571167e-06, 9.564682841300964e-06, 1.0196119546890259e-05, 1.0827556252479553e-05, 1.1458992958068848e-05, 1.2090429663658142e-05, 1.2721866369247437e-05, 1.3353303074836731e-05, 1.3984739780426025e-05, 1.461617648601532e-05, 1.5247613191604614e-05, 1.587904989719391e-05, 1.6510486602783203e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 7.0, 12.0, 14.0, 26.0, 21.0, 34.0, 45.0, 69.0, 79.0, 129.0, 170.0, 274.0, 396.0, 635.0, 944.0, 1561.0, 2854.0, 5747.0, 14440.0, 66956.0, 748509.0, 165300.0, 23671.0, 7775.0, 3479.0, 1902.0, 1212.0, 723.0, 477.0, 331.0, 202.0, 164.0, 97.0, 87.0, 43.0, 38.0, 25.0, 25.0, 15.0, 14.0, 16.0, 9.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.278564453125, -0.27075958251953125, -0.2629547119140625, -0.25514984130859375, -0.247344970703125, -0.23954010009765625, -0.2317352294921875, -0.22393035888671875, -0.21612548828125, -0.20832061767578125, -0.2005157470703125, -0.19271087646484375, -0.184906005859375, -0.17710113525390625, -0.1692962646484375, -0.16149139404296875, -0.1536865234375, -0.14588165283203125, -0.1380767822265625, -0.13027191162109375, -0.122467041015625, -0.11466217041015625, -0.1068572998046875, -0.09905242919921875, -0.09124755859375, -0.08344268798828125, -0.0756378173828125, -0.06783294677734375, -0.060028076171875, -0.05222320556640625, -0.0444183349609375, -0.03661346435546875, -0.02880859375, -0.02100372314453125, -0.0131988525390625, -0.00539398193359375, 0.002410888671875, 0.01021575927734375, 0.0180206298828125, 0.02582550048828125, 0.03363037109375, 0.04143524169921875, 0.0492401123046875, 0.05704498291015625, 0.064849853515625, 0.07265472412109375, 0.0804595947265625, 0.08826446533203125, 0.0960693359375, 0.10387420654296875, 0.1116790771484375, 0.11948394775390625, 0.127288818359375, 0.13509368896484375, 0.1428985595703125, 0.15070343017578125, 0.15850830078125, 0.16631317138671875, 0.1741180419921875, 0.18192291259765625, 0.189727783203125, 0.19753265380859375, 0.2053375244140625, 0.21314239501953125, 0.220947265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 11.0, 30.0, 43.0, 71.0, 122.0, 226.0, 165.0, 110.0, 73.0, 45.0, 20.0, 16.0, 6.0, 11.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2047119140625, -0.19680213928222656, -0.18889236450195312, -0.1809825897216797, -0.17307281494140625, -0.1651630401611328, -0.15725326538085938, -0.14934349060058594, -0.1414337158203125, -0.13352394104003906, -0.12561416625976562, -0.11770439147949219, -0.10979461669921875, -0.10188484191894531, -0.09397506713867188, -0.08606529235839844, -0.078155517578125, -0.07024574279785156, -0.062335968017578125, -0.05442619323730469, -0.04651641845703125, -0.03860664367675781, -0.030696868896484375, -0.022787094116210938, -0.0148773193359375, -0.0069675445556640625, 0.000942230224609375, 0.008852005004882812, 0.01676177978515625, 0.024671554565429688, 0.032581329345703125, 0.04049110412597656, 0.04840087890625, 0.05631065368652344, 0.06422042846679688, 0.07213020324707031, 0.08003997802734375, 0.08794975280761719, 0.09585952758789062, 0.10376930236816406, 0.1116790771484375, 0.11958885192871094, 0.12749862670898438, 0.1354084014892578, 0.14331817626953125, 0.1512279510498047, 0.15913772583007812, 0.16704750061035156, 0.174957275390625, 0.18286705017089844, 0.19077682495117188, 0.1986865997314453, 0.20659637451171875, 0.2145061492919922, 0.22241592407226562, 0.23032569885253906, 0.2382354736328125, 0.24614524841308594, 0.2540550231933594, 0.2619647979736328, 0.26987457275390625, 0.2777843475341797, 0.2856941223144531, 0.29360389709472656, 0.301513671875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 11.0, 10.0, 15.0, 59.0, 251.0, 422.0, 131.0, 50.0, 23.0, 13.0, 11.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01239538192749, -3.870124340057373, -3.727853298187256, -3.5855822563171387, -3.4433112144470215, -3.3010401725769043, -3.158769130706787, -3.01649808883667, -2.8742270469665527, -2.7319560050964355, -2.5896849632263184, -2.447413921356201, -2.305142879486084, -2.162871837615967, -2.0206007957458496, -1.8783297538757324, -1.7360587120056152, -1.593787670135498, -1.4515166282653809, -1.3092455863952637, -1.1669745445251465, -1.0247035026550293, -0.8824324607849121, -0.7401614189147949, -0.5978903770446777, -0.45561933517456055, -0.31334829330444336, -0.17107725143432617, -0.028806209564208984, 0.1134648323059082, 0.2557358741760254, 0.3980069160461426, 0.540278434753418, 0.6825494766235352, 0.8248205184936523, 0.9670915603637695, 1.1093626022338867, 1.251633644104004, 1.393904685974121, 1.5361757278442383, 1.6784467697143555, 1.8207178115844727, 1.9629888534545898, 2.105259895324707, 2.247530937194824, 2.3898019790649414, 2.5320730209350586, 2.674344062805176, 2.816615104675293, 2.95888614654541, 3.1011571884155273, 3.2434282302856445, 3.3856992721557617, 3.527970314025879, 3.670241355895996, 3.8125123977661133, 3.9547834396362305, 4.097054481506348, 4.239325523376465, 4.381596565246582, 4.523867607116699, 4.666138648986816, 4.808409690856934, 4.950680732727051, 5.092951774597168]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 13.0, 12.0, 20.0, 30.0, 57.0, 101.0, 184.0, 210.0, 140.0, 101.0, 47.0, 20.0, 18.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.699883460998535, -3.581669807434082, -3.463456153869629, -3.345242500305176, -3.2270288467407227, -3.1088151931762695, -2.9906015396118164, -2.8723878860473633, -2.75417423248291, -2.635960578918457, -2.517746925354004, -2.399533271789551, -2.2813196182250977, -2.1631059646606445, -2.0448923110961914, -1.9266787767410278, -1.8084652423858643, -1.6902515888214111, -1.572037935256958, -1.4538242816925049, -1.3356106281280518, -1.2173969745635986, -1.099183440208435, -0.9809697866439819, -0.8627561330795288, -0.7445424795150757, -0.6263288259506226, -0.5081152319908142, -0.3899015784263611, -0.27168792486190796, -0.1534743309020996, -0.035260677337646484, 0.08295297622680664, 0.20116661489009857, 0.3193802535533905, 0.43759387731552124, 0.5558075308799744, 0.6740211844444275, 0.7922347784042358, 0.910448431968689, 1.028662085533142, 1.1468757390975952, 1.2650893926620483, 1.383302927017212, 1.501516580581665, 1.6197302341461182, 1.7379438877105713, 1.8561575412750244, 1.9743711948394775, 2.0925848484039307, 2.210798501968384, 2.329012155532837, 2.44722580909729, 2.565439462661743, 2.683652877807617, 2.8018665313720703, 2.9200801849365234, 3.0382938385009766, 3.1565074920654297, 3.274721145629883, 3.392934799194336, 3.511148452758789, 3.629362106323242, 3.7475757598876953, 3.8657894134521484]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 5.0, 7.0, 12.0, 16.0, 23.0, 64.0, 172.0, 1648.0, 4039815.0, 150873.0, 1316.0, 179.0, 51.0, 28.0, 19.0, 10.0, 11.0, 9.0, 4.0, 2.0, 2.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.71221923828125, -2.5885009765625, -2.46478271484375, -2.341064453125, -2.21734619140625, -2.0936279296875, -1.96990966796875, -1.84619140625, -1.72247314453125, -1.5987548828125, -1.47503662109375, -1.351318359375, -1.22760009765625, -1.1038818359375, -0.98016357421875, -0.8564453125, -0.73272705078125, -0.6090087890625, -0.48529052734375, -0.361572265625, -0.23785400390625, -0.1141357421875, 0.00958251953125, 0.13330078125, 0.25701904296875, 0.3807373046875, 0.50445556640625, 0.628173828125, 0.75189208984375, 0.8756103515625, 0.99932861328125, 1.123046875, 1.24676513671875, 1.3704833984375, 1.49420166015625, 1.617919921875, 1.74163818359375, 1.8653564453125, 1.98907470703125, 2.11279296875, 2.23651123046875, 2.3602294921875, 2.48394775390625, 2.607666015625, 2.73138427734375, 2.8551025390625, 2.97882080078125, 3.1025390625, 3.22625732421875, 3.3499755859375, 3.47369384765625, 3.597412109375, 3.72113037109375, 3.8448486328125, 3.96856689453125, 4.09228515625, 4.21600341796875, 4.3397216796875, 4.46343994140625, 4.587158203125, 4.71087646484375, 4.8345947265625, 4.95831298828125, 5.08203125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 0.0, 6.0, 5.0, 8.0, 7.0, 13.0, 13.0, 19.0, 29.0, 60.0, 80.0, 98.0, 127.0, 147.0, 121.0, 86.0, 67.0, 31.0, 17.0, 14.0, 11.0, 6.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0295562744140625, -0.028656959533691406, -0.027757644653320312, -0.02685832977294922, -0.025959014892578125, -0.02505970001220703, -0.024160385131835938, -0.023261070251464844, -0.02236175537109375, -0.021462440490722656, -0.020563125610351562, -0.01966381072998047, -0.018764495849609375, -0.01786518096923828, -0.016965866088867188, -0.016066551208496094, -0.015167236328125, -0.014267921447753906, -0.013368606567382812, -0.012469291687011719, -0.011569976806640625, -0.010670661926269531, -0.009771347045898438, -0.008872032165527344, -0.00797271728515625, -0.007073402404785156, -0.0061740875244140625, -0.005274772644042969, -0.004375457763671875, -0.0034761428833007812, -0.0025768280029296875, -0.0016775131225585938, -0.0007781982421875, 0.00012111663818359375, 0.0010204315185546875, 0.0019197463989257812, 0.002819061279296875, 0.0037183761596679688, 0.0046176910400390625, 0.005517005920410156, 0.00641632080078125, 0.007315635681152344, 0.008214950561523438, 0.009114265441894531, 0.010013580322265625, 0.010912895202636719, 0.011812210083007812, 0.012711524963378906, 0.01361083984375, 0.014510154724121094, 0.015409469604492188, 0.01630878448486328, 0.017208099365234375, 0.01810741424560547, 0.019006729125976562, 0.019906044006347656, 0.02080535888671875, 0.021704673767089844, 0.022603988647460938, 0.02350330352783203, 0.024402618408203125, 0.02530193328857422, 0.026201248168945312, 0.027100563049316406, 0.0279998779296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 8.0, 26.0, 19.0, 42.0, 54.0, 103.0, 174.0, 408.0, 964.0, 2701.0, 9447.0, 53191.0, 3809455.0, 289487.0, 20720.0, 4973.0, 1563.0, 535.0, 206.0, 82.0, 50.0, 24.0, 12.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.009765625, -0.9866905212402344, -0.9636154174804688, -0.9405403137207031, -0.9174652099609375, -0.8943901062011719, -0.8713150024414062, -0.8482398986816406, -0.825164794921875, -0.8020896911621094, -0.7790145874023438, -0.7559394836425781, -0.7328643798828125, -0.7097892761230469, -0.6867141723632812, -0.6636390686035156, -0.64056396484375, -0.6174888610839844, -0.5944137573242188, -0.5713386535644531, -0.5482635498046875, -0.5251884460449219, -0.5021133422851562, -0.4790382385253906, -0.455963134765625, -0.4328880310058594, -0.40981292724609375, -0.3867378234863281, -0.3636627197265625, -0.3405876159667969, -0.31751251220703125, -0.2944374084472656, -0.2713623046875, -0.24828720092773438, -0.22521209716796875, -0.20213699340820312, -0.1790618896484375, -0.15598678588867188, -0.13291168212890625, -0.10983657836914062, -0.086761474609375, -0.06368637084960938, -0.04061126708984375, -0.017536163330078125, 0.0055389404296875, 0.028614044189453125, 0.05168914794921875, 0.07476425170898438, 0.09783935546875, 0.12091445922851562, 0.14398956298828125, 0.16706466674804688, 0.1901397705078125, 0.21321487426757812, 0.23628997802734375, 0.2593650817871094, 0.282440185546875, 0.3055152893066406, 0.32859039306640625, 0.3516654968261719, 0.3747406005859375, 0.3978157043457031, 0.42089080810546875, 0.4439659118652344, 0.467041015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 4.0, 6.0, 0.0, 8.0, 10.0, 13.0, 17.0, 24.0, 32.0, 46.0, 77.0, 141.0, 392.0, 1618.0, 930.0, 280.0, 148.0, 80.0, 63.0, 33.0, 35.0, 23.0, 8.0, 10.0, 10.0, 7.0, 9.0, 8.0, 8.0, 5.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.056396484375, -0.054781436920166016, -0.05316638946533203, -0.05155134201049805, -0.04993629455566406, -0.04832124710083008, -0.046706199645996094, -0.04509115219116211, -0.043476104736328125, -0.04186105728149414, -0.040246009826660156, -0.03863096237182617, -0.03701591491699219, -0.0354008674621582, -0.03378582000732422, -0.032170772552490234, -0.03055572509765625, -0.028940677642822266, -0.02732563018798828, -0.025710582733154297, -0.024095535278320312, -0.022480487823486328, -0.020865440368652344, -0.01925039291381836, -0.017635345458984375, -0.01602029800415039, -0.014405250549316406, -0.012790203094482422, -0.011175155639648438, -0.009560108184814453, -0.007945060729980469, -0.006330013275146484, -0.0047149658203125, -0.0030999183654785156, -0.0014848709106445312, 0.00013017654418945312, 0.0017452239990234375, 0.003360271453857422, 0.004975318908691406, 0.006590366363525391, 0.008205413818359375, 0.00982046127319336, 0.011435508728027344, 0.013050556182861328, 0.014665603637695312, 0.016280651092529297, 0.01789569854736328, 0.019510746002197266, 0.02112579345703125, 0.022740840911865234, 0.02435588836669922, 0.025970935821533203, 0.027585983276367188, 0.029201030731201172, 0.030816078186035156, 0.03243112564086914, 0.034046173095703125, 0.03566122055053711, 0.037276268005371094, 0.03889131546020508, 0.04050636291503906, 0.04212141036987305, 0.04373645782470703, 0.045351505279541016, 0.046966552734375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 23.0, 582.0, 393.0, 12.0, 4.0], "bins": [-5.504264831542969, -5.414007186889648, -5.323750019073486, -5.233492374420166, -5.143235206604004, -5.052977561950684, -4.9627203941345215, -4.872462749481201, -4.782205581665039, -4.691947937011719, -4.601690769195557, -4.511433124542236, -4.421175956726074, -4.330918312072754, -4.240661144256592, -4.1504034996032715, -4.060146331787109, -3.969888925552368, -3.879631519317627, -3.7893741130828857, -3.6991167068481445, -3.6088593006134033, -3.518601894378662, -3.428344249725342, -3.3380866050720215, -3.2478291988372803, -3.157571792602539, -3.067314386367798, -2.9770569801330566, -2.8867995738983154, -2.796542167663574, -2.706284523010254, -2.6160271167755127, -2.5257697105407715, -2.4355123043060303, -2.345254898071289, -2.254997491836548, -2.1647400856018066, -2.0744824409484863, -1.9842251539230347, -1.893967866897583, -1.8037104606628418, -1.7134530544281006, -1.6231956481933594, -1.5329382419586182, -1.442680835723877, -1.3524233102798462, -1.262165904045105, -1.1719083786010742, -1.081650972366333, -0.9913935661315918, -0.9011361002922058, -0.8108786940574646, -0.7206212878227234, -0.6303638219833374, -0.5401064157485962, -0.44984906911849976, -0.35959166288375854, -0.26933422684669495, -0.17907679080963135, -0.08881938457489014, 0.0014380216598510742, 0.09169548749923706, 0.18195289373397827, 0.2722102999687195]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 1.0, 6.0, 10.0, 12.0, 27.0, 45.0, 64.0, 105.0, 128.0, 143.0, 119.0, 104.0, 74.0, 57.0, 34.0, 19.0, 10.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3847852945327759, -0.37370383739471436, -0.36262235045433044, -0.3515408933162689, -0.340459406375885, -0.3293779492378235, -0.31829649209976196, -0.30721500515937805, -0.29613354802131653, -0.285052090883255, -0.2739706039428711, -0.26288914680480957, -0.25180765986442566, -0.24072620272636414, -0.22964473068714142, -0.2185632586479187, -0.20748178660869598, -0.19640031456947327, -0.18531884253025055, -0.17423737049102783, -0.1631559133529663, -0.1520744413137436, -0.14099296927452087, -0.12991151213645935, -0.11883003264665604, -0.10774856060743332, -0.0966670960187912, -0.08558562397956848, -0.07450415194034576, -0.06342268735170364, -0.052341215312480927, -0.041259750723838806, -0.03017827868461609, -0.01909681037068367, -0.008015340194106102, 0.003066129982471466, 0.014147598296403885, 0.025229066610336304, 0.03631053864955902, 0.04739200323820114, 0.05847347527742386, 0.06955494731664658, 0.0806364119052887, 0.09171788394451141, 0.10279935598373413, 0.11388082057237625, 0.12496229261159897, 0.1360437572002411, 0.1471252292394638, 0.15820670127868652, 0.16928817331790924, 0.18036964535713196, 0.19145110249519348, 0.2025325745344162, 0.21361404657363892, 0.22469550371170044, 0.23577699065208435, 0.24685846269130707, 0.2579399347305298, 0.2690213918685913, 0.2801028788089752, 0.29118433594703674, 0.30226582288742065, 0.3133472800254822, 0.3244287371635437]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 7.0, 6.0, 10.0, 8.0, 23.0, 29.0, 44.0, 81.0, 96.0, 158.0, 237.0, 348.0, 539.0, 825.0, 1350.0, 2150.0, 3789.0, 6618.0, 12405.0, 27804.0, 76294.0, 292975.0, 445727.0, 106608.0, 35804.0, 15531.0, 7838.0, 4426.0, 2475.0, 1554.0, 952.0, 630.0, 417.0, 268.0, 185.0, 106.0, 71.0, 57.0, 47.0, 19.0, 19.0, 12.0, 9.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1591796875, -0.15437698364257812, -0.14957427978515625, -0.14477157592773438, -0.1399688720703125, -0.13516616821289062, -0.13036346435546875, -0.12556076049804688, -0.120758056640625, -0.11595535278320312, -0.11115264892578125, -0.10634994506835938, -0.1015472412109375, -0.09674453735351562, -0.09194183349609375, -0.08713912963867188, -0.08233642578125, -0.07753372192382812, -0.07273101806640625, -0.06792831420898438, -0.0631256103515625, -0.058322906494140625, -0.05352020263671875, -0.048717498779296875, -0.043914794921875, -0.039112091064453125, -0.03430938720703125, -0.029506683349609375, -0.0247039794921875, -0.019901275634765625, -0.01509857177734375, -0.010295867919921875, -0.0054931640625, -0.000690460205078125, 0.00411224365234375, 0.008914947509765625, 0.0137176513671875, 0.018520355224609375, 0.02332305908203125, 0.028125762939453125, 0.032928466796875, 0.037731170654296875, 0.04253387451171875, 0.047336578369140625, 0.0521392822265625, 0.056941986083984375, 0.06174468994140625, 0.06654739379882812, 0.07135009765625, 0.07615280151367188, 0.08095550537109375, 0.08575820922851562, 0.0905609130859375, 0.09536361694335938, 0.10016632080078125, 0.10496902465820312, 0.109771728515625, 0.11457443237304688, 0.11937713623046875, 0.12417984008789062, 0.1289825439453125, 0.13378524780273438, 0.13858795166015625, 0.14339065551757812, 0.148193359375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 4.0, 1.0, 6.0, 0.0, 9.0, 8.0, 13.0, 11.0, 13.0, 19.0, 32.0, 46.0, 43.0, 63.0, 74.0, 83.0, 78.0, 80.0, 84.0, 52.0, 48.0, 60.0, 41.0, 32.0, 19.0, 12.0, 10.0, 12.0, 8.0, 9.0, 2.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0170745849609375, -0.01655292510986328, -0.016031265258789062, -0.015509605407714844, -0.014987945556640625, -0.014466285705566406, -0.013944625854492188, -0.013422966003417969, -0.01290130615234375, -0.012379646301269531, -0.011857986450195312, -0.011336326599121094, -0.010814666748046875, -0.010293006896972656, -0.009771347045898438, -0.009249687194824219, -0.00872802734375, -0.008206367492675781, -0.0076847076416015625, -0.007163047790527344, -0.006641387939453125, -0.006119728088378906, -0.0055980682373046875, -0.005076408386230469, -0.00455474853515625, -0.004033088684082031, -0.0035114288330078125, -0.0029897689819335938, -0.002468109130859375, -0.0019464492797851562, -0.0014247894287109375, -0.0009031295776367188, -0.0003814697265625, 0.00014019012451171875, 0.0006618499755859375, 0.0011835098266601562, 0.001705169677734375, 0.0022268295288085938, 0.0027484893798828125, 0.0032701492309570312, 0.00379180908203125, 0.004313468933105469, 0.0048351287841796875, 0.005356788635253906, 0.005878448486328125, 0.006400108337402344, 0.0069217681884765625, 0.007443428039550781, 0.007965087890625, 0.008486747741699219, 0.009008407592773438, 0.009530067443847656, 0.010051727294921875, 0.010573387145996094, 0.011095046997070312, 0.011616706848144531, 0.01213836669921875, 0.012660026550292969, 0.013181686401367188, 0.013703346252441406, 0.014225006103515625, 0.014746665954589844, 0.015268325805664062, 0.01578998565673828, 0.0163116455078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 1.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 24.0, 86.0, 831.0, 24777.0, 969591.0, 51712.0, 1303.0, 109.0, 34.0, 9.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.523406982421875, -0.49798583984375, -0.472564697265625, -0.4471435546875, -0.421722412109375, -0.39630126953125, -0.370880126953125, -0.345458984375, -0.320037841796875, -0.29461669921875, -0.269195556640625, -0.2437744140625, -0.218353271484375, -0.19293212890625, -0.167510986328125, -0.14208984375, -0.116668701171875, -0.09124755859375, -0.065826416015625, -0.0404052734375, -0.014984130859375, 0.01043701171875, 0.035858154296875, 0.061279296875, 0.086700439453125, 0.11212158203125, 0.137542724609375, 0.1629638671875, 0.188385009765625, 0.21380615234375, 0.239227294921875, 0.2646484375, 0.290069580078125, 0.31549072265625, 0.340911865234375, 0.3663330078125, 0.391754150390625, 0.41717529296875, 0.442596435546875, 0.468017578125, 0.493438720703125, 0.51885986328125, 0.544281005859375, 0.5697021484375, 0.595123291015625, 0.62054443359375, 0.645965576171875, 0.67138671875, 0.696807861328125, 0.72222900390625, 0.747650146484375, 0.7730712890625, 0.798492431640625, 0.82391357421875, 0.849334716796875, 0.874755859375, 0.900177001953125, 0.92559814453125, 0.951019287109375, 0.9764404296875, 1.001861572265625, 1.02728271484375, 1.052703857421875, 1.078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 6.0, 5.0, 11.0, 10.0, 18.0, 15.0, 19.0, 18.0, 29.0, 15.0, 25.0, 37.0, 33.0, 33.0, 42.0, 28.0, 36.0, 46.0, 44.0, 41.0, 45.0, 30.0, 41.0, 43.0, 46.0, 32.0, 40.0, 27.0, 25.0, 26.0, 26.0, 14.0, 13.0, 15.0, 8.0, 11.0, 11.0, 7.0, 7.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.079833984375, -0.07739734649658203, -0.07496070861816406, -0.0725240707397461, -0.07008743286132812, -0.06765079498291016, -0.06521415710449219, -0.06277751922607422, -0.06034088134765625, -0.05790424346923828, -0.05546760559082031, -0.053030967712402344, -0.050594329833984375, -0.048157691955566406, -0.04572105407714844, -0.04328441619873047, -0.0408477783203125, -0.03841114044189453, -0.03597450256347656, -0.033537864685058594, -0.031101226806640625, -0.028664588928222656, -0.026227951049804688, -0.02379131317138672, -0.02135467529296875, -0.01891803741455078, -0.016481399536132812, -0.014044761657714844, -0.011608123779296875, -0.009171485900878906, -0.0067348480224609375, -0.004298210144042969, -0.001861572265625, 0.0005750656127929688, 0.0030117034912109375, 0.005448341369628906, 0.007884979248046875, 0.010321617126464844, 0.012758255004882812, 0.015194892883300781, 0.01763153076171875, 0.02006816864013672, 0.022504806518554688, 0.024941444396972656, 0.027378082275390625, 0.029814720153808594, 0.03225135803222656, 0.03468799591064453, 0.0371246337890625, 0.03956127166748047, 0.04199790954589844, 0.044434547424316406, 0.046871185302734375, 0.049307823181152344, 0.05174446105957031, 0.05418109893798828, 0.05661773681640625, 0.05905437469482422, 0.06149101257324219, 0.06392765045166016, 0.06636428833007812, 0.0688009262084961, 0.07123756408691406, 0.07367420196533203, 0.07611083984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 9.0, 12.0, 17.0, 43.0, 175.0, 1856.0, 1031695.0, 14203.0, 382.0, 81.0, 23.0, 17.0, 10.0, 8.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.12890625, -2.075286865234375, -2.02166748046875, -1.968048095703125, -1.9144287109375, -1.860809326171875, -1.80718994140625, -1.753570556640625, -1.699951171875, -1.646331787109375, -1.59271240234375, -1.539093017578125, -1.4854736328125, -1.431854248046875, -1.37823486328125, -1.324615478515625, -1.27099609375, -1.217376708984375, -1.16375732421875, -1.110137939453125, -1.0565185546875, -1.002899169921875, -0.94927978515625, -0.895660400390625, -0.842041015625, -0.788421630859375, -0.73480224609375, -0.681182861328125, -0.6275634765625, -0.573944091796875, -0.52032470703125, -0.466705322265625, -0.4130859375, -0.359466552734375, -0.30584716796875, -0.252227783203125, -0.1986083984375, -0.144989013671875, -0.09136962890625, -0.037750244140625, 0.015869140625, 0.069488525390625, 0.12310791015625, 0.176727294921875, 0.2303466796875, 0.283966064453125, 0.33758544921875, 0.391204833984375, 0.44482421875, 0.498443603515625, 0.55206298828125, 0.605682373046875, 0.6593017578125, 0.712921142578125, 0.76654052734375, 0.820159912109375, 0.873779296875, 0.927398681640625, 0.98101806640625, 1.034637451171875, 1.0882568359375, 1.141876220703125, 1.19549560546875, 1.249114990234375, 1.302734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 14.0, 20.0, 21.0, 53.0, 142.0, 335.0, 211.0, 78.0, 35.0, 25.0, 10.0, 10.0, 4.0, 7.0, 0.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.679794311523438e-05, -9.392388164997101e-05, -9.104982018470764e-05, -8.817575871944427e-05, -8.530169725418091e-05, -8.242763578891754e-05, -7.955357432365417e-05, -7.667951285839081e-05, -7.380545139312744e-05, -7.093138992786407e-05, -6.805732846260071e-05, -6.518326699733734e-05, -6.230920553207397e-05, -5.943514406681061e-05, -5.656108260154724e-05, -5.3687021136283875e-05, -5.081295967102051e-05, -4.793889820575714e-05, -4.5064836740493774e-05, -4.219077527523041e-05, -3.931671380996704e-05, -3.6442652344703674e-05, -3.356859087944031e-05, -3.069452941417694e-05, -2.7820467948913574e-05, -2.4946406483650208e-05, -2.207234501838684e-05, -1.9198283553123474e-05, -1.6324222087860107e-05, -1.345016062259674e-05, -1.0576099157333374e-05, -7.702037692070007e-06, -4.827976226806641e-06, -1.953914761543274e-06, 9.201467037200928e-07, 3.7942081689834595e-06, 6.668269634246826e-06, 9.542331099510193e-06, 1.241639256477356e-05, 1.5290454030036926e-05, 1.8164515495300293e-05, 2.103857696056366e-05, 2.3912638425827026e-05, 2.6786699891090393e-05, 2.966076135635376e-05, 3.2534822821617126e-05, 3.540888428688049e-05, 3.828294575214386e-05, 4.1157007217407227e-05, 4.403106868267059e-05, 4.690513014793396e-05, 4.977919161319733e-05, 5.265325307846069e-05, 5.552731454372406e-05, 5.840137600898743e-05, 6.12754374742508e-05, 6.414949893951416e-05, 6.702356040477753e-05, 6.98976218700409e-05, 7.277168333530426e-05, 7.564574480056763e-05, 7.8519806265831e-05, 8.139386773109436e-05, 8.426792919635773e-05, 8.71419906616211e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 12.0, 5.0, 14.0, 21.0, 28.0, 36.0, 64.0, 93.0, 166.0, 268.0, 473.0, 883.0, 2018.0, 5160.0, 16673.0, 73675.0, 505068.0, 368448.0, 54522.0, 13125.0, 4251.0, 1725.0, 768.0, 401.0, 255.0, 145.0, 90.0, 55.0, 35.0, 21.0, 15.0, 12.0, 12.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2310791015625, -0.22446060180664062, -0.21784210205078125, -0.21122360229492188, -0.2046051025390625, -0.19798660278320312, -0.19136810302734375, -0.18474960327148438, -0.178131103515625, -0.17151260375976562, -0.16489410400390625, -0.15827560424804688, -0.1516571044921875, -0.14503860473632812, -0.13842010498046875, -0.13180160522460938, -0.12518310546875, -0.11856460571289062, -0.11194610595703125, -0.10532760620117188, -0.0987091064453125, -0.09209060668945312, -0.08547210693359375, -0.07885360717773438, -0.072235107421875, -0.06561660766601562, -0.05899810791015625, -0.052379608154296875, -0.0457611083984375, -0.039142608642578125, -0.03252410888671875, -0.025905609130859375, -0.019287109375, -0.012668609619140625, -0.00605010986328125, 0.000568389892578125, 0.0071868896484375, 0.013805389404296875, 0.02042388916015625, 0.027042388916015625, 0.033660888671875, 0.040279388427734375, 0.04689788818359375, 0.053516387939453125, 0.0601348876953125, 0.06675338745117188, 0.07337188720703125, 0.07999038696289062, 0.08660888671875, 0.09322738647460938, 0.09984588623046875, 0.10646438598632812, 0.1130828857421875, 0.11970138549804688, 0.12631988525390625, 0.13293838500976562, 0.139556884765625, 0.14617538452148438, 0.15279388427734375, 0.15941238403320312, 0.1660308837890625, 0.17264938354492188, 0.17926788330078125, 0.18588638305664062, 0.1925048828125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 11.0, 10.0, 19.0, 37.0, 38.0, 42.0, 76.0, 116.0, 132.0, 140.0, 103.0, 78.0, 56.0, 37.0, 39.0, 22.0, 12.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1575927734375, -0.1531238555908203, -0.14865493774414062, -0.14418601989746094, -0.13971710205078125, -0.13524818420410156, -0.13077926635742188, -0.1263103485107422, -0.1218414306640625, -0.11737251281738281, -0.11290359497070312, -0.10843467712402344, -0.10396575927734375, -0.09949684143066406, -0.09502792358398438, -0.09055900573730469, -0.086090087890625, -0.08162117004394531, -0.07715225219726562, -0.07268333435058594, -0.06821441650390625, -0.06374549865722656, -0.059276580810546875, -0.05480766296386719, -0.0503387451171875, -0.04586982727050781, -0.041400909423828125, -0.03693199157714844, -0.03246307373046875, -0.027994155883789062, -0.023525238037109375, -0.019056320190429688, -0.01458740234375, -0.010118484497070312, -0.005649566650390625, -0.0011806488037109375, 0.00328826904296875, 0.0077571868896484375, 0.012226104736328125, 0.016695022583007812, 0.0211639404296875, 0.025632858276367188, 0.030101776123046875, 0.03457069396972656, 0.03903961181640625, 0.04350852966308594, 0.047977447509765625, 0.05244636535644531, 0.056915283203125, 0.06138420104980469, 0.06585311889648438, 0.07032203674316406, 0.07479095458984375, 0.07925987243652344, 0.08372879028320312, 0.08819770812988281, 0.0926666259765625, 0.09713554382324219, 0.10160446166992188, 0.10607337951660156, 0.11054229736328125, 0.11501121520996094, 0.11948013305664062, 0.12394905090332031, 0.12841796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 15.0, 35.0, 47.0, 158.0, 323.0, 230.0, 105.0, 41.0, 15.0, 8.0, 11.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8318114280700684, -1.7755467891693115, -1.7192820310592651, -1.6630172729492188, -1.606752634048462, -1.550487995147705, -1.4942232370376587, -1.4379584789276123, -1.3816938400268555, -1.3254292011260986, -1.2691644430160522, -1.2128996849060059, -1.156635046005249, -1.1003704071044922, -1.0441056489944458, -0.9878409504890442, -0.9315762519836426, -0.875311553478241, -0.8190468549728394, -0.7627821564674377, -0.7065174579620361, -0.6502527594566345, -0.5939880609512329, -0.5377233624458313, -0.4814586639404297, -0.4251939654350281, -0.36892926692962646, -0.31266456842422485, -0.25639986991882324, -0.20013517141342163, -0.14387047290802002, -0.08760577440261841, -0.03134119510650635, 0.024923503398895264, 0.08118820190429688, 0.1374529004096985, 0.1937175989151001, 0.2499822974205017, 0.3062469959259033, 0.36251169443130493, 0.41877639293670654, 0.47504109144210815, 0.5313057899475098, 0.5875704884529114, 0.643835186958313, 0.7000998854637146, 0.7563645839691162, 0.8126292824745178, 0.8688939809799194, 0.925158679485321, 0.9814233779907227, 1.0376880168914795, 1.0939527750015259, 1.1502175331115723, 1.206482172012329, 1.262746810913086, 1.3190115690231323, 1.3752763271331787, 1.4315409660339355, 1.4878056049346924, 1.5440703630447388, 1.6003351211547852, 1.656599760055542, 1.7128643989562988, 1.7691291570663452]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 3.0, 5.0, 5.0, 16.0, 13.0, 18.0, 25.0, 38.0, 47.0, 55.0, 63.0, 75.0, 82.0, 75.0, 74.0, 75.0, 53.0, 56.0, 54.0, 28.0, 25.0, 22.0, 19.0, 11.0, 10.0, 10.0, 7.0, 3.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9033595323562622, -0.8758248686790466, -0.848290205001831, -0.8207556009292603, -0.7932209372520447, -0.7656862735748291, -0.7381516098976135, -0.710616946220398, -0.6830823421478271, -0.6555476784706116, -0.628013014793396, -0.6004784107208252, -0.5729437470436096, -0.545409083366394, -0.5178744196891785, -0.4903397560119629, -0.4628050923347473, -0.43527042865753174, -0.40773579478263855, -0.380201131105423, -0.3526664972305298, -0.3251318335533142, -0.29759716987609863, -0.27006250619888306, -0.24252787232398987, -0.21499322354793549, -0.1874585747718811, -0.15992391109466553, -0.13238926231861115, -0.10485461354255676, -0.07731994986534119, -0.049785301089286804, -0.022250711917877197, 0.0052839405834674835, 0.032818593084812164, 0.060353249311447144, 0.08788789808750153, 0.11542254686355591, 0.14295721054077148, 0.17049185931682587, 0.19802650809288025, 0.22556115686893463, 0.253095805644989, 0.2806304693222046, 0.30816513299942017, 0.33569976687431335, 0.36323443055152893, 0.3907690644264221, 0.4183037281036377, 0.44583839178085327, 0.47337302565574646, 0.5009076595306396, 0.5284423232078552, 0.5559769868850708, 0.5835116505622864, 0.611046314239502, 0.6385809183120728, 0.6661155819892883, 0.6936502456665039, 0.7211848497390747, 0.7487195134162903, 0.7762541770935059, 0.8037888407707214, 0.831323504447937, 0.8588581681251526]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 8.0, 16.0, 12.0, 33.0, 49.0, 159.0, 2122.0, 3693807.0, 496830.0, 1054.0, 45.0, 33.0, 14.0, 14.0, 24.0, 16.0, 8.0, 10.0, 4.0, 6.0, 4.0, 6.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1328125, -2.050689697265625, -1.96856689453125, -1.886444091796875, -1.8043212890625, -1.722198486328125, -1.64007568359375, -1.557952880859375, -1.475830078125, -1.393707275390625, -1.31158447265625, -1.229461669921875, -1.1473388671875, -1.065216064453125, -0.98309326171875, -0.900970458984375, -0.81884765625, -0.736724853515625, -0.65460205078125, -0.572479248046875, -0.4903564453125, -0.408233642578125, -0.32611083984375, -0.243988037109375, -0.161865234375, -0.079742431640625, 0.00238037109375, 0.084503173828125, 0.1666259765625, 0.248748779296875, 0.33087158203125, 0.412994384765625, 0.4951171875, 0.577239990234375, 0.65936279296875, 0.741485595703125, 0.8236083984375, 0.905731201171875, 0.98785400390625, 1.069976806640625, 1.152099609375, 1.234222412109375, 1.31634521484375, 1.398468017578125, 1.4805908203125, 1.562713623046875, 1.64483642578125, 1.726959228515625, 1.80908203125, 1.891204833984375, 1.97332763671875, 2.055450439453125, 2.1375732421875, 2.219696044921875, 2.30181884765625, 2.383941650390625, 2.466064453125, 2.548187255859375, 2.63031005859375, 2.712432861328125, 2.7945556640625, 2.876678466796875, 2.95880126953125, 3.040924072265625, 3.123046875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 1.0, 3.0, 8.0, 6.0, 10.0, 12.0, 19.0, 18.0, 31.0, 35.0, 43.0, 44.0, 68.0, 61.0, 60.0, 74.0, 77.0, 65.0, 57.0, 54.0, 52.0, 50.0, 38.0, 24.0, 10.0, 10.0, 14.0, 9.0, 8.0, 10.0, 7.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0186614990234375, -0.01820194721221924, -0.017742395401000977, -0.017282843589782715, -0.016823291778564453, -0.01636373996734619, -0.01590418815612793, -0.015444636344909668, -0.014985084533691406, -0.014525532722473145, -0.014065980911254883, -0.013606429100036621, -0.01314687728881836, -0.012687325477600098, -0.012227773666381836, -0.011768221855163574, -0.011308670043945312, -0.01084911823272705, -0.010389566421508789, -0.009930014610290527, -0.009470462799072266, -0.009010910987854004, -0.008551359176635742, -0.00809180736541748, -0.007632255554199219, -0.007172703742980957, -0.006713151931762695, -0.006253600120544434, -0.005794048309326172, -0.00533449649810791, -0.0048749446868896484, -0.004415392875671387, -0.003955841064453125, -0.0034962892532348633, -0.0030367374420166016, -0.00257718563079834, -0.002117633819580078, -0.0016580820083618164, -0.0011985301971435547, -0.000738978385925293, -0.00027942657470703125, 0.00018012523651123047, 0.0006396770477294922, 0.001099228858947754, 0.0015587806701660156, 0.0020183324813842773, 0.002477884292602539, 0.0029374361038208008, 0.0033969879150390625, 0.0038565397262573242, 0.004316091537475586, 0.004775643348693848, 0.005235195159912109, 0.005694746971130371, 0.006154298782348633, 0.0066138505935668945, 0.007073402404785156, 0.007532954216003418, 0.00799250602722168, 0.008452057838439941, 0.008911609649658203, 0.009371161460876465, 0.009830713272094727, 0.010290265083312988, 0.01074981689453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 6.0, 14.0, 64.0, 125.0, 352.0, 2651.0, 990444.0, 3197039.0, 3020.0, 365.0, 129.0, 56.0, 16.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.445556640625, -0.3961753845214844, -0.34679412841796875, -0.2974128723144531, -0.2480316162109375, -0.19865036010742188, -0.14926910400390625, -0.09988784790039062, -0.050506591796875, -0.001125335693359375, 0.04825592041015625, 0.09763717651367188, 0.1470184326171875, 0.19639968872070312, 0.24578094482421875, 0.2951622009277344, 0.34454345703125, 0.3939247131347656, 0.44330596923828125, 0.4926872253417969, 0.5420684814453125, 0.5914497375488281, 0.6408309936523438, 0.6902122497558594, 0.739593505859375, 0.7889747619628906, 0.8383560180664062, 0.8877372741699219, 0.9371185302734375, 0.9864997863769531, 1.0358810424804688, 1.0852622985839844, 1.1346435546875, 1.1840248107910156, 1.2334060668945312, 1.2827873229980469, 1.3321685791015625, 1.3815498352050781, 1.4309310913085938, 1.4803123474121094, 1.529693603515625, 1.5790748596191406, 1.6284561157226562, 1.6778373718261719, 1.7272186279296875, 1.7765998840332031, 1.8259811401367188, 1.8753623962402344, 1.92474365234375, 1.9741249084472656, 2.0235061645507812, 2.072887420654297, 2.1222686767578125, 2.171649932861328, 2.2210311889648438, 2.2704124450683594, 2.319793701171875, 2.3691749572753906, 2.4185562133789062, 2.467937469482422, 2.5173187255859375, 2.566699981689453, 2.6160812377929688, 2.6654624938964844, 2.71484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 10.0, 14.0, 13.0, 16.0, 17.0, 28.0, 34.0, 39.0, 68.0, 124.0, 201.0, 395.0, 1714.0, 633.0, 249.0, 143.0, 112.0, 65.0, 52.0, 27.0, 28.0, 14.0, 17.0, 11.0, 6.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04986572265625, -0.04857921600341797, -0.04729270935058594, -0.046006202697753906, -0.044719696044921875, -0.043433189392089844, -0.04214668273925781, -0.04086017608642578, -0.03957366943359375, -0.03828716278076172, -0.03700065612792969, -0.035714149475097656, -0.034427642822265625, -0.033141136169433594, -0.03185462951660156, -0.03056812286376953, -0.0292816162109375, -0.02799510955810547, -0.026708602905273438, -0.025422096252441406, -0.024135589599609375, -0.022849082946777344, -0.021562576293945312, -0.02027606964111328, -0.01898956298828125, -0.01770305633544922, -0.016416549682617188, -0.015130043029785156, -0.013843536376953125, -0.012557029724121094, -0.011270523071289062, -0.009984016418457031, -0.008697509765625, -0.007411003112792969, -0.0061244964599609375, -0.004837989807128906, -0.003551483154296875, -0.0022649765014648438, -0.0009784698486328125, 0.00030803680419921875, 0.00159454345703125, 0.0028810501098632812, 0.0041675567626953125, 0.005454063415527344, 0.006740570068359375, 0.008027076721191406, 0.009313583374023438, 0.010600090026855469, 0.0118865966796875, 0.013173103332519531, 0.014459609985351562, 0.015746116638183594, 0.017032623291015625, 0.018319129943847656, 0.019605636596679688, 0.02089214324951172, 0.02217864990234375, 0.02346515655517578, 0.024751663208007812, 0.026038169860839844, 0.027324676513671875, 0.028611183166503906, 0.029897689819335938, 0.03118419647216797, 0.032470703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 6.0, 185.0, 765.0, 51.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7070081233978271, -0.5940101146697998, -0.4810120463371277, -0.36801400780677795, -0.2550159692764282, -0.14201796054840088, -0.02901989221572876, 0.08397817611694336, 0.1969761848449707, 0.30997422337532043, 0.42297226190567017, 0.5359703302383423, 0.6489683389663696, 0.761966347694397, 0.8749644160270691, 0.9879624843597412, 1.1009604930877686, 1.213958501815796, 1.3269565105438232, 1.4399546384811401, 1.5529526472091675, 1.6659506559371948, 1.7789487838745117, 1.891946792602539, 2.0049448013305664, 2.1179428100585938, 2.230940818786621, 2.3439388275146484, 2.456936836242676, 2.569934844970703, 2.6829330921173096, 2.795931100845337, 2.908928871154785, 3.0219268798828125, 3.13492488861084, 3.247922897338867, 3.3609209060668945, 3.473918914794922, 3.5869171619415283, 3.6999151706695557, 3.812913179397583, 3.9259111881256104, 4.038909435272217, 4.151907444000244, 4.2649054527282715, 4.377903461456299, 4.490901470184326, 4.6038994789123535, 4.716897487640381, 4.829895496368408, 4.9428935050964355, 5.055891513824463, 5.16888952255249, 5.281887531280518, 5.394885540008545, 5.5078840255737305, 5.620882034301758, 5.733880043029785, 5.8468780517578125, 5.95987606048584, 6.072874069213867, 6.1858720779418945, 6.298870086669922, 6.411868095397949, 6.524866104125977]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 10.0, 14.0, 17.0, 36.0, 45.0, 81.0, 101.0, 120.0, 117.0, 104.0, 95.0, 86.0, 76.0, 51.0, 23.0, 11.0, 8.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.555079460144043, -0.5425467491149902, -0.5300140380859375, -0.5174813270568848, -0.504948616027832, -0.4924158751964569, -0.4798831641674042, -0.46735045313835144, -0.4548177421092987, -0.44228503108024597, -0.42975232005119324, -0.4172195792198181, -0.4046868681907654, -0.39215415716171265, -0.3796214461326599, -0.3670887351036072, -0.35455602407455444, -0.3420233130455017, -0.329490602016449, -0.31695789098739624, -0.3044251501560211, -0.2918924391269684, -0.27935972809791565, -0.2668270170688629, -0.2542942762374878, -0.24176156520843506, -0.22922883927822113, -0.2166961282491684, -0.20416341722011566, -0.19163069128990173, -0.179097980260849, -0.16656526923179626, -0.15403255820274353, -0.1414998471736908, -0.12896712124347687, -0.11643441021442413, -0.1039016991853714, -0.09136898070573807, -0.07883626222610474, -0.066303551197052, -0.05377083271741867, -0.04123811796307564, -0.028705401346087456, -0.016172684729099274, -0.003639969974756241, 0.008892744779586792, 0.021425463259220123, 0.03395817428827286, 0.04649089276790619, 0.05902360752224922, 0.07155632227659225, 0.08408904075622559, 0.09662175178527832, 0.10915447026491165, 0.12168718874454498, 0.13421989977359772, 0.14675262570381165, 0.15928533673286438, 0.1718180626630783, 0.18435077369213104, 0.19688348472118378, 0.2094162106513977, 0.22194892168045044, 0.23448163270950317, 0.2470143437385559]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 3.0, 11.0, 6.0, 8.0, 19.0, 18.0, 23.0, 30.0, 36.0, 29.0, 41.0, 35.0, 51.0, 44.0, 41.0, 34651.0, 1013004.0, 73.0, 62.0, 47.0, 49.0, 44.0, 38.0, 37.0, 39.0, 28.0, 18.0, 12.0, 10.0, 6.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.986328125, -3.869537353515625, -3.75274658203125, -3.635955810546875, -3.5191650390625, -3.402374267578125, -3.28558349609375, -3.168792724609375, -3.052001953125, -2.935211181640625, -2.81842041015625, -2.701629638671875, -2.5848388671875, -2.468048095703125, -2.35125732421875, -2.234466552734375, -2.11767578125, -2.000885009765625, -1.88409423828125, -1.767303466796875, -1.6505126953125, -1.533721923828125, -1.41693115234375, -1.300140380859375, -1.183349609375, -1.066558837890625, -0.94976806640625, -0.832977294921875, -0.7161865234375, -0.599395751953125, -0.48260498046875, -0.365814208984375, -0.2490234375, -0.132232666015625, -0.01544189453125, 0.101348876953125, 0.2181396484375, 0.334930419921875, 0.45172119140625, 0.568511962890625, 0.685302734375, 0.802093505859375, 0.91888427734375, 1.035675048828125, 1.1524658203125, 1.269256591796875, 1.38604736328125, 1.502838134765625, 1.61962890625, 1.736419677734375, 1.85321044921875, 1.970001220703125, 2.0867919921875, 2.203582763671875, 2.32037353515625, 2.437164306640625, 2.553955078125, 2.670745849609375, 2.78753662109375, 2.904327392578125, 3.0211181640625, 3.137908935546875, 3.25469970703125, 3.371490478515625, 3.48828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 28.0, 132.0, 331.0, 348.0, 140.0, 34.0], "bins": [-0.1541748046875, -0.151644766330719, -0.149114727973938, -0.14658468961715698, -0.14405465126037598, -0.14152461290359497, -0.13899457454681396, -0.13646453619003296, -0.13393449783325195, -0.13140445947647095, -0.12887442111968994, -0.12634438276290894, -0.12381434440612793, -0.12128430604934692, -0.11875426769256592, -0.11622422933578491, -0.1136941909790039, -0.1111641526222229, -0.1086341142654419, -0.10610407590866089, -0.10357403755187988, -0.10104399919509888, -0.09851396083831787, -0.09598392248153687, -0.09345388412475586, -0.09092384576797485, -0.08839380741119385, -0.08586376905441284, -0.08333373069763184, -0.08080369234085083, -0.07827365398406982, -0.07574361562728882, -0.07321357727050781, -0.0706835389137268, -0.0681535005569458, -0.0656234622001648, -0.06309342384338379, -0.06056338548660278, -0.05803334712982178, -0.05550330877304077, -0.052973270416259766, -0.05044323205947876, -0.047913193702697754, -0.04538315534591675, -0.04285311698913574, -0.040323078632354736, -0.03779304027557373, -0.035263001918792725, -0.03273296356201172, -0.030202925205230713, -0.027672886848449707, -0.0251428484916687, -0.022612810134887695, -0.02008277177810669, -0.017552733421325684, -0.015022695064544678, -0.012492656707763672, -0.009962618350982666, -0.00743257999420166, -0.004902541637420654, -0.0023725032806396484, 0.00015753507614135742, 0.0026875734329223633, 0.005217611789703369, 0.007747650146484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 10.0, 7.0, 15.0, 19.0, 30.0, 49.0, 76.0, 108.0, 189.0, 334.0, 640.0, 1477.0, 3423.0, 9683.0, 36352.0, 227415.0, 652153.0, 87030.0, 19478.0, 5828.0, 2181.0, 922.0, 446.0, 256.0, 148.0, 90.0, 64.0, 26.0, 26.0, 22.0, 16.0, 9.0, 12.0, 3.0, 2.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8779296875, -0.8523101806640625, -0.826690673828125, -0.8010711669921875, -0.77545166015625, -0.7498321533203125, -0.724212646484375, -0.6985931396484375, -0.6729736328125, -0.6473541259765625, -0.621734619140625, -0.5961151123046875, -0.57049560546875, -0.5448760986328125, -0.519256591796875, -0.4936370849609375, -0.468017578125, -0.4423980712890625, -0.416778564453125, -0.3911590576171875, -0.36553955078125, -0.3399200439453125, -0.314300537109375, -0.2886810302734375, -0.2630615234375, -0.2374420166015625, -0.211822509765625, -0.1862030029296875, -0.16058349609375, -0.1349639892578125, -0.109344482421875, -0.0837249755859375, -0.05810546875, -0.0324859619140625, -0.006866455078125, 0.0187530517578125, 0.04437255859375, 0.0699920654296875, 0.095611572265625, 0.1212310791015625, 0.1468505859375, 0.1724700927734375, 0.198089599609375, 0.2237091064453125, 0.24932861328125, 0.2749481201171875, 0.300567626953125, 0.3261871337890625, 0.351806640625, 0.3774261474609375, 0.403045654296875, 0.4286651611328125, 0.45428466796875, 0.4799041748046875, 0.505523681640625, 0.5311431884765625, 0.5567626953125, 0.5823822021484375, 0.608001708984375, 0.6336212158203125, 0.65924072265625, 0.6848602294921875, 0.710479736328125, 0.7360992431640625, 0.76171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 1.0, 5.0, 8.0, 10.0, 13.0, 19.0, 16.0, 28.0, 33.0, 33.0, 42.0, 39.0, 60.0, 62.0, 76.0, 65.0, 59.0, 46.0, 57.0, 50.0, 54.0, 41.0, 29.0, 28.0, 20.0, 23.0, 26.0, 11.0, 15.0, 8.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1160888671875, -0.11192703247070312, -0.10776519775390625, -0.10360336303710938, -0.0994415283203125, -0.09527969360351562, -0.09111785888671875, -0.08695602416992188, -0.082794189453125, -0.07863235473632812, -0.07447052001953125, -0.07030868530273438, -0.0661468505859375, -0.061985015869140625, -0.05782318115234375, -0.053661346435546875, -0.04949951171875, -0.045337677001953125, -0.04117584228515625, -0.037014007568359375, -0.0328521728515625, -0.028690338134765625, -0.02452850341796875, -0.020366668701171875, -0.016204833984375, -0.012042999267578125, -0.00788116455078125, -0.003719329833984375, 0.0004425048828125, 0.004604339599609375, 0.00876617431640625, 0.012928009033203125, 0.01708984375, 0.021251678466796875, 0.02541351318359375, 0.029575347900390625, 0.0337371826171875, 0.037899017333984375, 0.04206085205078125, 0.046222686767578125, 0.050384521484375, 0.054546356201171875, 0.05870819091796875, 0.06287002563476562, 0.0670318603515625, 0.07119369506835938, 0.07535552978515625, 0.07951736450195312, 0.08367919921875, 0.08784103393554688, 0.09200286865234375, 0.09616470336914062, 0.1003265380859375, 0.10448837280273438, 0.10865020751953125, 0.11281204223632812, 0.116973876953125, 0.12113571166992188, 0.12529754638671875, 0.12945938110351562, 0.1336212158203125, 0.13778305053710938, 0.14194488525390625, 0.14610671997070312, 0.1502685546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 14.0, 23.0, 39.0, 72.0, 128.0, 238.0, 546.0, 1646.0, 5240.0, 22004.0, 149174.0, 744350.0, 101350.0, 17058.0, 4225.0, 1392.0, 523.0, 229.0, 100.0, 71.0, 43.0, 28.0, 12.0, 10.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.81500244140625, -0.7882080078125, -0.76141357421875, -0.734619140625, -0.70782470703125, -0.6810302734375, -0.65423583984375, -0.62744140625, -0.60064697265625, -0.5738525390625, -0.54705810546875, -0.520263671875, -0.49346923828125, -0.4666748046875, -0.43988037109375, -0.4130859375, -0.38629150390625, -0.3594970703125, -0.33270263671875, -0.305908203125, -0.27911376953125, -0.2523193359375, -0.22552490234375, -0.19873046875, -0.17193603515625, -0.1451416015625, -0.11834716796875, -0.091552734375, -0.06475830078125, -0.0379638671875, -0.01116943359375, 0.015625, 0.04241943359375, 0.0692138671875, 0.09600830078125, 0.122802734375, 0.14959716796875, 0.1763916015625, 0.20318603515625, 0.22998046875, 0.25677490234375, 0.2835693359375, 0.31036376953125, 0.337158203125, 0.36395263671875, 0.3907470703125, 0.41754150390625, 0.4443359375, 0.47113037109375, 0.4979248046875, 0.52471923828125, 0.551513671875, 0.57830810546875, 0.6051025390625, 0.63189697265625, 0.65869140625, 0.68548583984375, 0.7122802734375, 0.73907470703125, 0.765869140625, 0.79266357421875, 0.8194580078125, 0.84625244140625, 0.873046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 7.0, 8.0, 11.0, 18.0, 28.0, 50.0, 49.0, 62.0, 100.0, 100.0, 135.0, 126.0, 85.0, 51.0, 40.0, 33.0, 19.0, 14.0, 13.0, 11.0, 7.0, 5.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.97781753540039e-05, -9.717419743537903e-05, -9.457021951675415e-05, -9.196624159812927e-05, -8.93622636795044e-05, -8.675828576087952e-05, -8.415430784225464e-05, -8.155032992362976e-05, -7.894635200500488e-05, -7.634237408638e-05, -7.373839616775513e-05, -7.113441824913025e-05, -6.853044033050537e-05, -6.592646241188049e-05, -6.332248449325562e-05, -6.071850657463074e-05, -5.811452865600586e-05, -5.551055073738098e-05, -5.2906572818756104e-05, -5.0302594900131226e-05, -4.769861698150635e-05, -4.509463906288147e-05, -4.249066114425659e-05, -3.9886683225631714e-05, -3.7282705307006836e-05, -3.467872738838196e-05, -3.207474946975708e-05, -2.9470771551132202e-05, -2.6866793632507324e-05, -2.4262815713882446e-05, -2.165883779525757e-05, -1.905485987663269e-05, -1.6450881958007812e-05, -1.3846904039382935e-05, -1.1242926120758057e-05, -8.638948202133179e-06, -6.034970283508301e-06, -3.430992364883423e-06, -8.270144462585449e-07, 1.776963472366333e-06, 4.380941390991211e-06, 6.984919309616089e-06, 9.588897228240967e-06, 1.2192875146865845e-05, 1.4796853065490723e-05, 1.74008309841156e-05, 2.000480890274048e-05, 2.2608786821365356e-05, 2.5212764739990234e-05, 2.7816742658615112e-05, 3.042072057723999e-05, 3.302469849586487e-05, 3.5628676414489746e-05, 3.8232654333114624e-05, 4.08366322517395e-05, 4.344061017036438e-05, 4.604458808898926e-05, 4.8648566007614136e-05, 5.1252543926239014e-05, 5.385652184486389e-05, 5.646049976348877e-05, 5.906447768211365e-05, 6.166845560073853e-05, 6.42724335193634e-05, 6.687641143798828e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 11.0, 11.0, 30.0, 31.0, 49.0, 75.0, 120.0, 239.0, 480.0, 1254.0, 4431.0, 22258.0, 215788.0, 728916.0, 61454.0, 9680.0, 2296.0, 749.0, 315.0, 134.0, 99.0, 58.0, 26.0, 21.0, 11.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5582046508789062, -0.5319366455078125, -0.5056686401367188, -0.479400634765625, -0.45313262939453125, -0.4268646240234375, -0.40059661865234375, -0.37432861328125, -0.34806060791015625, -0.3217926025390625, -0.29552459716796875, -0.269256591796875, -0.24298858642578125, -0.2167205810546875, -0.19045257568359375, -0.1641845703125, -0.13791656494140625, -0.1116485595703125, -0.08538055419921875, -0.059112548828125, -0.03284454345703125, -0.0065765380859375, 0.01969146728515625, 0.04595947265625, 0.07222747802734375, 0.0984954833984375, 0.12476348876953125, 0.151031494140625, 0.17729949951171875, 0.2035675048828125, 0.22983551025390625, 0.256103515625, 0.28237152099609375, 0.3086395263671875, 0.33490753173828125, 0.361175537109375, 0.38744354248046875, 0.4137115478515625, 0.43997955322265625, 0.46624755859375, 0.49251556396484375, 0.5187835693359375, 0.5450515747070312, 0.571319580078125, 0.5975875854492188, 0.6238555908203125, 0.6501235961914062, 0.6763916015625, 0.7026596069335938, 0.7289276123046875, 0.7551956176757812, 0.781463623046875, 0.8077316284179688, 0.8339996337890625, 0.8602676391601562, 0.88653564453125, 0.9128036499023438, 0.9390716552734375, 0.9653396606445312, 0.991607666015625, 1.0178756713867188, 1.0441436767578125, 1.0704116821289062, 1.0966796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 13.0, 13.0, 14.0, 22.0, 27.0, 32.0, 43.0, 76.0, 94.0, 105.0, 112.0, 96.0, 73.0, 65.0, 36.0, 37.0, 26.0, 22.0, 17.0, 15.0, 15.0, 8.0, 15.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.34912109375, -0.34107208251953125, -0.3330230712890625, -0.32497406005859375, -0.316925048828125, -0.30887603759765625, -0.3008270263671875, -0.29277801513671875, -0.28472900390625, -0.27667999267578125, -0.2686309814453125, -0.26058197021484375, -0.252532958984375, -0.24448394775390625, -0.2364349365234375, -0.22838592529296875, -0.2203369140625, -0.21228790283203125, -0.2042388916015625, -0.19618988037109375, -0.188140869140625, -0.18009185791015625, -0.1720428466796875, -0.16399383544921875, -0.15594482421875, -0.14789581298828125, -0.1398468017578125, -0.13179779052734375, -0.123748779296875, -0.11569976806640625, -0.1076507568359375, -0.09960174560546875, -0.091552734375, -0.08350372314453125, -0.0754547119140625, -0.06740570068359375, -0.059356689453125, -0.05130767822265625, -0.0432586669921875, -0.03520965576171875, -0.02716064453125, -0.01911163330078125, -0.0110626220703125, -0.00301361083984375, 0.005035400390625, 0.01308441162109375, 0.0211334228515625, 0.02918243408203125, 0.0372314453125, 0.04528045654296875, 0.0533294677734375, 0.06137847900390625, 0.069427490234375, 0.07747650146484375, 0.0855255126953125, 0.09357452392578125, 0.10162353515625, 0.10967254638671875, 0.1177215576171875, 0.12577056884765625, 0.133819580078125, 0.14186859130859375, 0.1499176025390625, 0.15796661376953125, 0.166015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 21.0, 119.0, 625.0, 210.0, 20.0, 8.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.046420097351074, -6.597654342651367, -6.148888111114502, -5.700121879577637, -5.25135612487793, -4.802590370178223, -4.353824138641357, -3.9050581455230713, -3.456292152404785, -3.007526159286499, -2.558760166168213, -2.1099941730499268, -1.6612281799316406, -1.2124621868133545, -0.7636961936950684, -0.3149302005767822, 0.1338357925415039, 0.58260178565979, 1.0313677787780762, 1.4801337718963623, 1.9288997650146484, 2.3776657581329346, 2.8264317512512207, 3.275197744369507, 3.723963737487793, 4.1727294921875, 4.621495723724365, 5.0702619552612305, 5.5190277099609375, 5.9677934646606445, 6.41655969619751, 6.865325927734375, 7.314090728759766, 7.762856483459473, 8.21162223815918, 8.660388946533203, 9.10915470123291, 9.557920455932617, 10.00668716430664, 10.455452919006348, 10.904218673706055, 11.352984428405762, 11.801750183105469, 12.250516891479492, 12.6992826461792, 13.148048400878906, 13.59681510925293, 14.045580863952637, 14.494346618652344, 14.94311237335205, 15.391878128051758, 15.840644836425781, 16.289409637451172, 16.738176345825195, 17.18694305419922, 17.63570785522461, 18.084474563598633, 18.533241271972656, 18.982006072998047, 19.43077278137207, 19.879539489746094, 20.328304290771484, 20.777070999145508, 21.2258358001709, 21.674602508544922]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 9.0, 14.0, 25.0, 26.0, 38.0, 54.0, 39.0, 62.0, 59.0, 74.0, 81.0, 68.0, 82.0, 60.0, 74.0, 43.0, 58.0, 30.0, 29.0, 22.0, 15.0, 9.0, 9.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8026463985443115, -0.7644394040107727, -0.7262324094772339, -0.6880253553390503, -0.6498183608055115, -0.6116113662719727, -0.5734043121337891, -0.5351973176002502, -0.4969903230667114, -0.4587833285331726, -0.4205763041973114, -0.3823692798614502, -0.3441622853279114, -0.30595529079437256, -0.26774826645851135, -0.22954124212265015, -0.19133424758911133, -0.15312723815441132, -0.1149202287197113, -0.07671321928501129, -0.03850620985031128, -0.0002992004156112671, 0.037907809019088745, 0.07611483335494995, 0.11432182788848877, 0.15252883732318878, 0.1907358467578888, 0.2289428561925888, 0.2671498656272888, 0.30535686016082764, 0.34356388449668884, 0.38177090883255005, 0.41997790336608887, 0.4581848978996277, 0.4963919222354889, 0.5345989465713501, 0.5728059411048889, 0.6110129356384277, 0.6492199897766113, 0.6874269843101501, 0.725633978843689, 0.7638409733772278, 0.8020479679107666, 0.8402550220489502, 0.878462016582489, 0.9166690111160278, 0.9548760652542114, 0.9930830597877502, 1.031290054321289, 1.0694971084594727, 1.1077040433883667, 1.1459110975265503, 1.1841180324554443, 1.222325086593628, 1.2605321407318115, 1.2987391948699951, 1.3369461297988892, 1.3751531839370728, 1.4133601188659668, 1.4515671730041504, 1.489774227142334, 1.527981162071228, 1.5661882162094116, 1.6043951511383057, 1.6426022052764893]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 5.0, 7.0, 7.0, 8.0, 9.0, 13.0, 10.0, 25.0, 20.0, 17.0, 23.0, 34.0, 43.0, 41.0, 61.0, 55.0, 61.0, 120.0, 330.0, 17099.0, 4170215.0, 5442.0, 293.0, 110.0, 55.0, 43.0, 30.0, 19.0, 19.0, 22.0, 11.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.75, -5.59197998046875, -5.4339599609375, -5.27593994140625, -5.117919921875, -4.95989990234375, -4.8018798828125, -4.64385986328125, -4.48583984375, -4.32781982421875, -4.1697998046875, -4.01177978515625, -3.853759765625, -3.69573974609375, -3.5377197265625, -3.37969970703125, -3.2216796875, -3.06365966796875, -2.9056396484375, -2.74761962890625, -2.589599609375, -2.43157958984375, -2.2735595703125, -2.11553955078125, -1.95751953125, -1.79949951171875, -1.6414794921875, -1.48345947265625, -1.325439453125, -1.16741943359375, -1.0093994140625, -0.85137939453125, -0.693359375, -0.53533935546875, -0.3773193359375, -0.21929931640625, -0.061279296875, 0.09674072265625, 0.2547607421875, 0.41278076171875, 0.57080078125, 0.72882080078125, 0.8868408203125, 1.04486083984375, 1.202880859375, 1.36090087890625, 1.5189208984375, 1.67694091796875, 1.8349609375, 1.99298095703125, 2.1510009765625, 2.30902099609375, 2.467041015625, 2.62506103515625, 2.7830810546875, 2.94110107421875, 3.09912109375, 3.25714111328125, 3.4151611328125, 3.57318115234375, 3.731201171875, 3.88922119140625, 4.0472412109375, 4.20526123046875, 4.36328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 6.0, 15.0, 41.0, 86.0, 136.0, 179.0, 190.0, 158.0, 103.0, 61.0, 21.0, 10.0, 5.0, 3.0, 1.0], "bins": [-0.125732421875, -0.12345290184020996, -0.12117338180541992, -0.11889386177062988, -0.11661434173583984, -0.1143348217010498, -0.11205530166625977, -0.10977578163146973, -0.10749626159667969, -0.10521674156188965, -0.10293722152709961, -0.10065770149230957, -0.09837818145751953, -0.09609866142272949, -0.09381914138793945, -0.09153962135314941, -0.08926010131835938, -0.08698058128356934, -0.0847010612487793, -0.08242154121398926, -0.08014202117919922, -0.07786250114440918, -0.07558298110961914, -0.0733034610748291, -0.07102394104003906, -0.06874442100524902, -0.06646490097045898, -0.06418538093566895, -0.061905860900878906, -0.05962634086608887, -0.05734682083129883, -0.05506730079650879, -0.05278778076171875, -0.05050826072692871, -0.04822874069213867, -0.04594922065734863, -0.043669700622558594, -0.041390180587768555, -0.039110660552978516, -0.03683114051818848, -0.03455162048339844, -0.0322721004486084, -0.02999258041381836, -0.02771306037902832, -0.02543354034423828, -0.023154020309448242, -0.020874500274658203, -0.018594980239868164, -0.016315460205078125, -0.014035940170288086, -0.011756420135498047, -0.009476900100708008, -0.007197380065917969, -0.00491786003112793, -0.0026383399963378906, -0.00035881996154785156, 0.0019207000732421875, 0.0042002201080322266, 0.006479740142822266, 0.008759260177612305, 0.011038780212402344, 0.013318300247192383, 0.015597820281982422, 0.01787734031677246, 0.0201568603515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 11.0, 13.0, 23.0, 44.0, 104.0, 179.0, 444.0, 2418.0, 3961656.0, 227002.0, 1658.0, 345.0, 189.0, 90.0, 64.0, 26.0, 10.0, 10.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -3.9287109375, -3.646484375, -3.3642578125, -3.08203125, -2.7998046875, -2.517578125, -2.2353515625, -1.953125, -1.6708984375, -1.388671875, -1.1064453125, -0.82421875, -0.5419921875, -0.259765625, 0.0224609375, 0.3046875, 0.5869140625, 0.869140625, 1.1513671875, 1.43359375, 1.7158203125, 1.998046875, 2.2802734375, 2.5625, 2.8447265625, 3.126953125, 3.4091796875, 3.69140625, 3.9736328125, 4.255859375, 4.5380859375, 4.8203125, 5.1025390625, 5.384765625, 5.6669921875, 5.94921875, 6.2314453125, 6.513671875, 6.7958984375, 7.078125, 7.3603515625, 7.642578125, 7.9248046875, 8.20703125, 8.4892578125, 8.771484375, 9.0537109375, 9.3359375, 9.6181640625, 9.900390625, 10.1826171875, 10.46484375, 10.7470703125, 11.029296875, 11.3115234375, 11.59375, 11.8759765625, 12.158203125, 12.4404296875, 12.72265625, 13.0048828125, 13.287109375, 13.5693359375, 13.8515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 14.0, 72.0, 435.0, 3217.0, 253.0, 59.0, 19.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.24524688720703125, -0.2214508056640625, -0.19765472412109375, -0.173858642578125, -0.15006256103515625, -0.1262664794921875, -0.10247039794921875, -0.07867431640625, -0.05487823486328125, -0.0310821533203125, -0.00728607177734375, 0.016510009765625, 0.04030609130859375, 0.0641021728515625, 0.08789825439453125, 0.1116943359375, 0.13549041748046875, 0.1592864990234375, 0.18308258056640625, 0.206878662109375, 0.23067474365234375, 0.2544708251953125, 0.27826690673828125, 0.30206298828125, 0.32585906982421875, 0.3496551513671875, 0.37345123291015625, 0.397247314453125, 0.42104339599609375, 0.4448394775390625, 0.46863555908203125, 0.492431640625, 0.5162277221679688, 0.5400238037109375, 0.5638198852539062, 0.587615966796875, 0.6114120483398438, 0.6352081298828125, 0.6590042114257812, 0.68280029296875, 0.7065963745117188, 0.7303924560546875, 0.7541885375976562, 0.777984619140625, 0.8017807006835938, 0.8255767822265625, 0.8493728637695312, 0.8731689453125, 0.8969650268554688, 0.9207611083984375, 0.9445571899414062, 0.968353271484375, 0.9921493530273438, 1.0159454345703125, 1.0397415161132812, 1.06353759765625, 1.0873336791992188, 1.1111297607421875, 1.1349258422851562, 1.158721923828125, 1.1825180053710938, 1.2063140869140625, 1.2301101684570312, 1.25390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 10.0, 35.0, 164.0, 504.0, 222.0, 51.0, 15.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556102752685547, -3.3115787506103516, -3.0670547485351562, -2.822530746459961, -2.5780067443847656, -2.3334827423095703, -2.088958740234375, -1.8444346189498901, -1.5999106168746948, -1.3553866147994995, -1.1108626127243042, -0.8663385510444641, -0.6218145489692688, -0.3772904872894287, -0.1327664852142334, 0.11175751686096191, 0.3562815189361572, 0.6008055210113525, 0.8453295230865479, 1.0898535251617432, 1.3343775272369385, 1.5789016485214233, 1.8234256505966187, 2.0679497718811035, 2.312473773956299, 2.556997776031494, 2.8015217781066895, 3.0460457801818848, 3.29056978225708, 3.5350937843322754, 3.7796177864074707, 4.024141788482666, 4.268665790557861, 4.513189792633057, 4.757713794708252, 5.002237796783447, 5.246761798858643, 5.491285800933838, 5.735809803009033, 5.9803338050842285, 6.224857807159424, 6.469381809234619, 6.7139058113098145, 6.95842981338501, 7.202953815460205, 7.4474778175354, 7.692001819610596, 7.936525821685791, 8.181050300598145, 8.42557430267334, 8.670098304748535, 8.91462230682373, 9.159146308898926, 9.403670310974121, 9.648194313049316, 9.892718315124512, 10.137242317199707, 10.381766319274902, 10.626290321350098, 10.870814323425293, 11.115338325500488, 11.359862327575684, 11.604386329650879, 11.848910331726074, 12.09343433380127]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 12.0, 14.0, 36.0, 46.0, 57.0, 80.0, 89.0, 115.0, 98.0, 120.0, 100.0, 82.0, 44.0, 46.0, 28.0, 19.0, 5.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3043053150177, -2.23893404006958, -2.17356276512146, -2.108191728591919, -2.042820453643799, -1.9774491786956787, -1.9120779037475586, -1.846706748008728, -1.7813355922698975, -1.7159643173217773, -1.6505931615829468, -1.5852218866348267, -1.519850730895996, -1.454479455947876, -1.3891081809997559, -1.3237370252609253, -1.2583657503128052, -1.192994475364685, -1.1276233196258545, -1.0622520446777344, -0.9968808889389038, -0.9315096139907837, -0.8661383986473083, -0.800767183303833, -0.7353959679603577, -0.6700247526168823, -0.604653537273407, -0.5392823219299316, -0.4739110767841339, -0.40853986144065857, -0.34316861629486084, -0.2777974009513855, -0.2124263048171997, -0.14705508947372437, -0.08168385922908783, -0.016312628984451294, 0.04905858635902405, 0.11442980170249939, 0.17980104684829712, 0.24517226219177246, 0.3105434775352478, 0.37591469287872314, 0.4412859082221985, 0.5066571235656738, 0.572028398513794, 0.6373995542526245, 0.7027708292007446, 0.76814204454422, 0.8335132598876953, 0.8988844752311707, 0.964255690574646, 1.0296269655227661, 1.0949981212615967, 1.1603693962097168, 1.225740671157837, 1.2911118268966675, 1.356482982635498, 1.4218542575836182, 1.4872254133224487, 1.5525966882705688, 1.6179678440093994, 1.6833391189575195, 1.7487103939056396, 1.8140815496444702, 1.8794528245925903]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 9.0, 6.0, 8.0, 6.0, 13.0, 9.0, 15.0, 12.0, 20.0, 25.0, 27.0, 32.0, 41.0, 50.0, 75.0, 193.0, 644.0, 4761.0, 197226.0, 827408.0, 15974.0, 1278.0, 291.0, 102.0, 64.0, 58.0, 36.0, 32.0, 24.0, 21.0, 20.0, 14.0, 9.0, 13.0, 7.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-3.556640625, -3.455596923828125, -3.35455322265625, -3.253509521484375, -3.1524658203125, -3.051422119140625, -2.95037841796875, -2.849334716796875, -2.748291015625, -2.647247314453125, -2.54620361328125, -2.445159912109375, -2.3441162109375, -2.243072509765625, -2.14202880859375, -2.040985107421875, -1.93994140625, -1.838897705078125, -1.73785400390625, -1.636810302734375, -1.5357666015625, -1.434722900390625, -1.33367919921875, -1.232635498046875, -1.131591796875, -1.030548095703125, -0.92950439453125, -0.828460693359375, -0.7274169921875, -0.626373291015625, -0.52532958984375, -0.424285888671875, -0.3232421875, -0.222198486328125, -0.12115478515625, -0.020111083984375, 0.0809326171875, 0.181976318359375, 0.28302001953125, 0.384063720703125, 0.485107421875, 0.586151123046875, 0.68719482421875, 0.788238525390625, 0.8892822265625, 0.990325927734375, 1.09136962890625, 1.192413330078125, 1.29345703125, 1.394500732421875, 1.49554443359375, 1.596588134765625, 1.6976318359375, 1.798675537109375, 1.89971923828125, 2.000762939453125, 2.101806640625, 2.202850341796875, 2.30389404296875, 2.404937744140625, 2.5059814453125, 2.607025146484375, 2.70806884765625, 2.809112548828125, 2.91015625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 8.0, 5.0, 20.0, 25.0, 29.0, 33.0, 47.0, 52.0, 44.0, 63.0, 67.0, 79.0, 94.0, 74.0, 58.0, 55.0, 51.0, 39.0, 41.0, 30.0, 21.0, 17.0, 11.0, 9.0, 10.0, 3.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07733154296875, -0.07493400573730469, -0.07253646850585938, -0.07013893127441406, -0.06774139404296875, -0.06534385681152344, -0.06294631958007812, -0.06054878234863281, -0.0581512451171875, -0.05575370788574219, -0.053356170654296875, -0.05095863342285156, -0.04856109619140625, -0.04616355895996094, -0.043766021728515625, -0.04136848449707031, -0.038970947265625, -0.03657341003417969, -0.034175872802734375, -0.03177833557128906, -0.02938079833984375, -0.026983261108398438, -0.024585723876953125, -0.022188186645507812, -0.0197906494140625, -0.017393112182617188, -0.014995574951171875, -0.012598037719726562, -0.01020050048828125, -0.0078029632568359375, -0.005405426025390625, -0.0030078887939453125, -0.0006103515625, 0.0017871856689453125, 0.004184722900390625, 0.0065822601318359375, 0.00897979736328125, 0.011377334594726562, 0.013774871826171875, 0.016172409057617188, 0.0185699462890625, 0.020967483520507812, 0.023365020751953125, 0.025762557983398438, 0.02816009521484375, 0.030557632446289062, 0.032955169677734375, 0.03535270690917969, 0.037750244140625, 0.04014778137207031, 0.042545318603515625, 0.04494285583496094, 0.04734039306640625, 0.04973793029785156, 0.052135467529296875, 0.05453300476074219, 0.0569305419921875, 0.05932807922363281, 0.061725616455078125, 0.06412315368652344, 0.06652069091796875, 0.06891822814941406, 0.07131576538085938, 0.07371330261230469, 0.07611083984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 2.0, 9.0, 8.0, 12.0, 16.0, 15.0, 31.0, 42.0, 73.0, 102.0, 157.0, 238.0, 467.0, 891.0, 2072.0, 5699.0, 22023.0, 120938.0, 567262.0, 269340.0, 43576.0, 9747.0, 3070.0, 1243.0, 612.0, 320.0, 193.0, 119.0, 69.0, 62.0, 51.0, 21.0, 21.0, 12.0, 4.0, 7.0, 7.0, 9.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8369140625, -0.808746337890625, -0.78057861328125, -0.752410888671875, -0.7242431640625, -0.696075439453125, -0.66790771484375, -0.639739990234375, -0.611572265625, -0.583404541015625, -0.55523681640625, -0.527069091796875, -0.4989013671875, -0.470733642578125, -0.44256591796875, -0.414398193359375, -0.38623046875, -0.358062744140625, -0.32989501953125, -0.301727294921875, -0.2735595703125, -0.245391845703125, -0.21722412109375, -0.189056396484375, -0.160888671875, -0.132720947265625, -0.10455322265625, -0.076385498046875, -0.0482177734375, -0.020050048828125, 0.00811767578125, 0.036285400390625, 0.064453125, 0.092620849609375, 0.12078857421875, 0.148956298828125, 0.1771240234375, 0.205291748046875, 0.23345947265625, 0.261627197265625, 0.289794921875, 0.317962646484375, 0.34613037109375, 0.374298095703125, 0.4024658203125, 0.430633544921875, 0.45880126953125, 0.486968994140625, 0.51513671875, 0.543304443359375, 0.57147216796875, 0.599639892578125, 0.6278076171875, 0.655975341796875, 0.68414306640625, 0.712310791015625, 0.740478515625, 0.768646240234375, 0.79681396484375, 0.824981689453125, 0.8531494140625, 0.881317138671875, 0.90948486328125, 0.937652587890625, 0.9658203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 5.0, 3.0, 6.0, 12.0, 14.0, 17.0, 20.0, 27.0, 20.0, 27.0, 39.0, 57.0, 54.0, 61.0, 46.0, 58.0, 52.0, 62.0, 68.0, 57.0, 50.0, 40.0, 35.0, 36.0, 36.0, 24.0, 21.0, 12.0, 14.0, 11.0, 2.0, 5.0, 3.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.35791015625, -0.34685516357421875, -0.3358001708984375, -0.32474517822265625, -0.313690185546875, -0.30263519287109375, -0.2915802001953125, -0.28052520751953125, -0.26947021484375, -0.25841522216796875, -0.2473602294921875, -0.23630523681640625, -0.225250244140625, -0.21419525146484375, -0.2031402587890625, -0.19208526611328125, -0.1810302734375, -0.16997528076171875, -0.1589202880859375, -0.14786529541015625, -0.136810302734375, -0.12575531005859375, -0.1147003173828125, -0.10364532470703125, -0.09259033203125, -0.08153533935546875, -0.0704803466796875, -0.05942535400390625, -0.048370361328125, -0.03731536865234375, -0.0262603759765625, -0.01520538330078125, -0.004150390625, 0.00690460205078125, 0.0179595947265625, 0.02901458740234375, 0.040069580078125, 0.05112457275390625, 0.0621795654296875, 0.07323455810546875, 0.08428955078125, 0.09534454345703125, 0.1063995361328125, 0.11745452880859375, 0.128509521484375, 0.13956451416015625, 0.1506195068359375, 0.16167449951171875, 0.1727294921875, 0.18378448486328125, 0.1948394775390625, 0.20589447021484375, 0.216949462890625, 0.22800445556640625, 0.2390594482421875, 0.25011444091796875, 0.26116943359375, 0.27222442626953125, 0.2832794189453125, 0.29433441162109375, 0.305389404296875, 0.31644439697265625, 0.3274993896484375, 0.33855438232421875, 0.349609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 11.0, 8.0, 18.0, 20.0, 29.0, 57.0, 92.0, 113.0, 177.0, 380.0, 897.0, 2652.0, 12056.0, 159283.0, 819719.0, 43818.0, 6189.0, 1719.0, 591.0, 289.0, 147.0, 96.0, 55.0, 37.0, 28.0, 19.0, 16.0, 14.0, 5.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1501922607421875, -1.110931396484375, -1.0716705322265625, -1.03240966796875, -0.9931488037109375, -0.953887939453125, -0.9146270751953125, -0.8753662109375, -0.8361053466796875, -0.796844482421875, -0.7575836181640625, -0.71832275390625, -0.6790618896484375, -0.639801025390625, -0.6005401611328125, -0.561279296875, -0.5220184326171875, -0.482757568359375, -0.4434967041015625, -0.40423583984375, -0.3649749755859375, -0.325714111328125, -0.2864532470703125, -0.2471923828125, -0.2079315185546875, -0.168670654296875, -0.1294097900390625, -0.09014892578125, -0.0508880615234375, -0.011627197265625, 0.0276336669921875, 0.06689453125, 0.1061553955078125, 0.145416259765625, 0.1846771240234375, 0.22393798828125, 0.2631988525390625, 0.302459716796875, 0.3417205810546875, 0.3809814453125, 0.4202423095703125, 0.459503173828125, 0.4987640380859375, 0.53802490234375, 0.5772857666015625, 0.616546630859375, 0.6558074951171875, 0.695068359375, 0.7343292236328125, 0.773590087890625, 0.8128509521484375, 0.85211181640625, 0.8913726806640625, 0.930633544921875, 0.9698944091796875, 1.0091552734375, 1.0484161376953125, 1.087677001953125, 1.1269378662109375, 1.16619873046875, 1.2054595947265625, 1.244720458984375, 1.2839813232421875, 1.3232421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 9.0, 13.0, 16.0, 18.0, 26.0, 29.0, 44.0, 82.0, 124.0, 142.0, 132.0, 117.0, 72.0, 61.0, 39.0, 26.0, 10.0, 15.0, 12.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.08970832824707e-05, -8.710380643606186e-05, -8.331052958965302e-05, -7.951725274324417e-05, -7.572397589683533e-05, -7.193069905042648e-05, -6.813742220401764e-05, -6.43441453576088e-05, -6.055086851119995e-05, -5.675759166479111e-05, -5.296431481838226e-05, -4.917103797197342e-05, -4.5377761125564575e-05, -4.158448427915573e-05, -3.779120743274689e-05, -3.399793058633804e-05, -3.02046537399292e-05, -2.6411376893520355e-05, -2.261810004711151e-05, -1.8824823200702667e-05, -1.5031546354293823e-05, -1.123826950788498e-05, -7.444992661476135e-06, -3.6517158150672913e-06, 1.4156103134155273e-07, 3.934837877750397e-06, 7.72811472415924e-06, 1.1521391570568085e-05, 1.531466841697693e-05, 1.9107945263385773e-05, 2.2901222109794617e-05, 2.669449895620346e-05, 3.0487775802612305e-05, 3.428105264902115e-05, 3.807432949542999e-05, 4.186760634183884e-05, 4.566088318824768e-05, 4.9454160034656525e-05, 5.324743688106537e-05, 5.704071372747421e-05, 6.083399057388306e-05, 6.46272674202919e-05, 6.842054426670074e-05, 7.221382111310959e-05, 7.600709795951843e-05, 7.980037480592728e-05, 8.359365165233612e-05, 8.738692849874496e-05, 9.118020534515381e-05, 9.497348219156265e-05, 9.87667590379715e-05, 0.00010256003588438034, 0.00010635331273078918, 0.00011014658957719803, 0.00011393986642360687, 0.00011773314327001572, 0.00012152642011642456, 0.0001253196969628334, 0.00012911297380924225, 0.0001329062506556511, 0.00013669952750205994, 0.00014049280434846878, 0.00014428608119487762, 0.00014807935804128647, 0.0001518726348876953]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 5.0, 6.0, 11.0, 12.0, 11.0, 19.0, 23.0, 58.0, 75.0, 150.0, 246.0, 343.0, 713.0, 1486.0, 3869.0, 13118.0, 85473.0, 744060.0, 170582.0, 19627.0, 4909.0, 1887.0, 846.0, 404.0, 222.0, 133.0, 73.0, 56.0, 29.0, 26.0, 24.0, 10.0, 13.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69140625, -0.6672592163085938, -0.6431121826171875, -0.6189651489257812, -0.594818115234375, -0.5706710815429688, -0.5465240478515625, -0.5223770141601562, -0.49822998046875, -0.47408294677734375, -0.4499359130859375, -0.42578887939453125, -0.401641845703125, -0.37749481201171875, -0.3533477783203125, -0.32920074462890625, -0.3050537109375, -0.28090667724609375, -0.2567596435546875, -0.23261260986328125, -0.208465576171875, -0.18431854248046875, -0.1601715087890625, -0.13602447509765625, -0.11187744140625, -0.08773040771484375, -0.0635833740234375, -0.03943634033203125, -0.015289306640625, 0.00885772705078125, 0.0330047607421875, 0.05715179443359375, 0.081298828125, 0.10544586181640625, 0.1295928955078125, 0.15373992919921875, 0.177886962890625, 0.20203399658203125, 0.2261810302734375, 0.25032806396484375, 0.27447509765625, 0.29862213134765625, 0.3227691650390625, 0.34691619873046875, 0.371063232421875, 0.39521026611328125, 0.4193572998046875, 0.44350433349609375, 0.4676513671875, 0.49179840087890625, 0.5159454345703125, 0.5400924682617188, 0.564239501953125, 0.5883865356445312, 0.6125335693359375, 0.6366806030273438, 0.66082763671875, 0.6849746704101562, 0.7091217041015625, 0.7332687377929688, 0.757415771484375, 0.7815628051757812, 0.8057098388671875, 0.8298568725585938, 0.85400390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 14.0, 14.0, 14.0, 18.0, 26.0, 33.0, 40.0, 41.0, 59.0, 64.0, 79.0, 91.0, 119.0, 70.0, 62.0, 60.0, 47.0, 22.0, 25.0, 22.0, 9.0, 11.0, 7.0, 8.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.302490234375, -0.29425048828125, -0.2860107421875, -0.27777099609375, -0.26953125, -0.26129150390625, -0.2530517578125, -0.24481201171875, -0.236572265625, -0.22833251953125, -0.2200927734375, -0.21185302734375, -0.20361328125, -0.19537353515625, -0.1871337890625, -0.17889404296875, -0.170654296875, -0.16241455078125, -0.1541748046875, -0.14593505859375, -0.1376953125, -0.12945556640625, -0.1212158203125, -0.11297607421875, -0.104736328125, -0.09649658203125, -0.0882568359375, -0.08001708984375, -0.07177734375, -0.06353759765625, -0.0552978515625, -0.04705810546875, -0.038818359375, -0.03057861328125, -0.0223388671875, -0.01409912109375, -0.005859375, 0.00238037109375, 0.0106201171875, 0.01885986328125, 0.027099609375, 0.03533935546875, 0.0435791015625, 0.05181884765625, 0.06005859375, 0.06829833984375, 0.0765380859375, 0.08477783203125, 0.093017578125, 0.10125732421875, 0.1094970703125, 0.11773681640625, 0.1259765625, 0.13421630859375, 0.1424560546875, 0.15069580078125, 0.158935546875, 0.16717529296875, 0.1754150390625, 0.18365478515625, 0.19189453125, 0.20013427734375, 0.2083740234375, 0.21661376953125, 0.224853515625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 19.0, 83.0, 335.0, 433.0, 110.0, 21.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.385377883911133, -10.91618537902832, -10.446993827819824, -9.977801322937012, -9.5086088180542, -9.039417266845703, -8.57022476196289, -8.101032257080078, -7.631840229034424, -7.1626482009887695, -6.693455696105957, -6.224263668060303, -5.755071640014648, -5.285879135131836, -4.816687107086182, -4.347495079040527, -3.878302574157715, -3.4091103076934814, -2.939918041229248, -2.4707260131835938, -2.0015337467193604, -1.532341480255127, -1.0631494522094727, -0.5939571857452393, -0.12476491928100586, 0.34442728757858276, 0.8136194944381714, 1.2828116416931152, 1.7520039081573486, 2.221196174621582, 2.6903882026672363, 3.1595804691314697, 3.628772735595703, 4.097964763641357, 4.56715726852417, 5.036349296569824, 5.505541801452637, 5.974733829498291, 6.443925857543945, 6.913118362426758, 7.382310390472412, 7.851502418518066, 8.320694923400879, 8.789886474609375, 9.259078979492188, 9.728271484375, 10.197463989257812, 10.666655540466309, 11.135848045349121, 11.605040550231934, 12.07423210144043, 12.543424606323242, 13.012617111206055, 13.481809616088867, 13.951001167297363, 14.420193672180176, 14.889385223388672, 15.358577728271484, 15.82776927947998, 16.29696273803711, 16.76615333557129, 17.2353458404541, 17.704538345336914, 18.173730850219727, 18.64292335510254]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 5.0, 7.0, 6.0, 7.0, 10.0, 24.0, 17.0, 16.0, 22.0, 20.0, 27.0, 32.0, 31.0, 38.0, 43.0, 45.0, 36.0, 52.0, 39.0, 50.0, 63.0, 41.0, 37.0, 38.0, 35.0, 38.0, 35.0, 35.0, 21.0, 23.0, 14.0, 15.0, 8.0, 14.0, 14.0, 8.0, 7.0, 3.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.9695837497711182, -1.9022765159606934, -1.8349692821502686, -1.7676621675491333, -1.7003549337387085, -1.6330476999282837, -1.5657405853271484, -1.4984333515167236, -1.4311261177062988, -1.363818883895874, -1.2965116500854492, -1.229204535484314, -1.1618973016738892, -1.0945900678634644, -1.027282953262329, -0.9599757194519043, -0.8926684856414795, -0.8253612518310547, -0.7580540776252747, -0.6907469034194946, -0.6234396696090698, -0.556132435798645, -0.488825261592865, -0.4215180575847626, -0.35421085357666016, -0.28690364956855774, -0.21959644556045532, -0.1522892415523529, -0.08498203754425049, -0.01767483353614807, 0.049632370471954346, 0.11693957448005676, 0.18424701690673828, 0.2515542209148407, 0.3188614249229431, 0.38616862893104553, 0.45347583293914795, 0.5207830667495728, 0.5880902409553528, 0.6553974151611328, 0.7227046489715576, 0.7900118827819824, 0.8573190569877625, 0.9246262311935425, 0.9919334650039673, 1.059240698814392, 1.1265478134155273, 1.1938550472259521, 1.261162281036377, 1.3284695148468018, 1.3957767486572266, 1.4630838632583618, 1.5303910970687866, 1.5976983308792114, 1.6650054454803467, 1.7323126792907715, 1.7996199131011963, 1.866927146911621, 1.934234380722046, 2.0015416145324707, 2.0688486099243164, 2.136155843734741, 2.203463077545166, 2.270770311355591, 2.3380775451660156]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 4.0, 9.0, 10.0, 15.0, 9.0, 11.0, 15.0, 20.0, 13.0, 26.0, 19.0, 40.0, 31.0, 53.0, 91.0, 230.0, 1240.0, 21317.0, 4007391.0, 158001.0, 4634.0, 638.0, 185.0, 76.0, 56.0, 40.0, 36.0, 11.0, 16.0, 10.0, 10.0, 4.0, 8.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.28125, -4.164703369140625, -4.04815673828125, -3.931610107421875, -3.8150634765625, -3.698516845703125, -3.58197021484375, -3.465423583984375, -3.348876953125, -3.232330322265625, -3.11578369140625, -2.999237060546875, -2.8826904296875, -2.766143798828125, -2.64959716796875, -2.533050537109375, -2.41650390625, -2.299957275390625, -2.18341064453125, -2.066864013671875, -1.9503173828125, -1.833770751953125, -1.71722412109375, -1.600677490234375, -1.484130859375, -1.367584228515625, -1.25103759765625, -1.134490966796875, -1.0179443359375, -0.901397705078125, -0.78485107421875, -0.668304443359375, -0.5517578125, -0.435211181640625, -0.31866455078125, -0.202117919921875, -0.0855712890625, 0.030975341796875, 0.14752197265625, 0.264068603515625, 0.380615234375, 0.497161865234375, 0.61370849609375, 0.730255126953125, 0.8468017578125, 0.963348388671875, 1.07989501953125, 1.196441650390625, 1.31298828125, 1.429534912109375, 1.54608154296875, 1.662628173828125, 1.7791748046875, 1.895721435546875, 2.01226806640625, 2.128814697265625, 2.245361328125, 2.361907958984375, 2.47845458984375, 2.595001220703125, 2.7115478515625, 2.828094482421875, 2.94464111328125, 3.061187744140625, 3.177734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 5.0, 3.0, 4.0, 7.0, 7.0, 10.0, 24.0, 24.0, 32.0, 36.0, 44.0, 37.0, 53.0, 44.0, 62.0, 65.0, 58.0, 72.0, 68.0, 45.0, 53.0, 44.0, 40.0, 37.0, 26.0, 15.0, 17.0, 17.0, 9.0, 9.0, 9.0, 6.0, 3.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.05639028549194336, -0.05409526824951172, -0.05180025100708008, -0.04950523376464844, -0.0472102165222168, -0.044915199279785156, -0.042620182037353516, -0.040325164794921875, -0.038030147552490234, -0.035735130310058594, -0.03344011306762695, -0.031145095825195312, -0.028850078582763672, -0.02655506134033203, -0.02426004409790039, -0.02196502685546875, -0.01967000961303711, -0.01737499237060547, -0.015079975128173828, -0.012784957885742188, -0.010489940643310547, -0.008194923400878906, -0.005899906158447266, -0.003604888916015625, -0.0013098716735839844, 0.0009851455688476562, 0.003280162811279297, 0.0055751800537109375, 0.007870197296142578, 0.010165214538574219, 0.01246023178100586, 0.0147552490234375, 0.01705026626586914, 0.01934528350830078, 0.021640300750732422, 0.023935317993164062, 0.026230335235595703, 0.028525352478027344, 0.030820369720458984, 0.033115386962890625, 0.035410404205322266, 0.037705421447753906, 0.04000043869018555, 0.04229545593261719, 0.04459047317504883, 0.04688549041748047, 0.04918050765991211, 0.05147552490234375, 0.05377054214477539, 0.05606555938720703, 0.05836057662963867, 0.06065559387207031, 0.06295061111450195, 0.0652456283569336, 0.06754064559936523, 0.06983566284179688, 0.07213068008422852, 0.07442569732666016, 0.0767207145690918, 0.07901573181152344, 0.08131074905395508, 0.08360576629638672, 0.08590078353881836, 0.08819580078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 20.0, 111.0, 351.0, 1445.0, 132671.0, 4056925.0, 2124.0, 460.0, 117.0, 25.0, 16.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.16009521484375, -6.7850341796875, -6.40997314453125, -6.034912109375, -5.65985107421875, -5.2847900390625, -4.90972900390625, -4.53466796875, -4.15960693359375, -3.7845458984375, -3.40948486328125, -3.034423828125, -2.65936279296875, -2.2843017578125, -1.90924072265625, -1.5341796875, -1.15911865234375, -0.7840576171875, -0.40899658203125, -0.033935546875, 0.34112548828125, 0.7161865234375, 1.09124755859375, 1.46630859375, 1.84136962890625, 2.2164306640625, 2.59149169921875, 2.966552734375, 3.34161376953125, 3.7166748046875, 4.09173583984375, 4.466796875, 4.84185791015625, 5.2169189453125, 5.59197998046875, 5.967041015625, 6.34210205078125, 6.7171630859375, 7.09222412109375, 7.46728515625, 7.84234619140625, 8.2174072265625, 8.59246826171875, 8.967529296875, 9.34259033203125, 9.7176513671875, 10.09271240234375, 10.4677734375, 10.84283447265625, 11.2178955078125, 11.59295654296875, 11.968017578125, 12.34307861328125, 12.7181396484375, 13.09320068359375, 13.46826171875, 13.84332275390625, 14.2183837890625, 14.59344482421875, 14.968505859375, 15.34356689453125, 15.7186279296875, 16.09368896484375, 16.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 23.0, 57.0, 445.0, 3196.0, 286.0, 54.0, 16.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81884765625, -0.7852554321289062, -0.7516632080078125, -0.7180709838867188, -0.684478759765625, -0.6508865356445312, -0.6172943115234375, -0.5837020874023438, -0.55010986328125, -0.5165176391601562, -0.4829254150390625, -0.44933319091796875, -0.415740966796875, -0.38214874267578125, -0.3485565185546875, -0.31496429443359375, -0.2813720703125, -0.24777984619140625, -0.2141876220703125, -0.18059539794921875, -0.147003173828125, -0.11341094970703125, -0.0798187255859375, -0.04622650146484375, -0.01263427734375, 0.02095794677734375, 0.0545501708984375, 0.08814239501953125, 0.121734619140625, 0.15532684326171875, 0.1889190673828125, 0.22251129150390625, 0.256103515625, 0.28969573974609375, 0.3232879638671875, 0.35688018798828125, 0.390472412109375, 0.42406463623046875, 0.4576568603515625, 0.49124908447265625, 0.52484130859375, 0.5584335327148438, 0.5920257568359375, 0.6256179809570312, 0.659210205078125, 0.6928024291992188, 0.7263946533203125, 0.7599868774414062, 0.7935791015625, 0.8271713256835938, 0.8607635498046875, 0.8943557739257812, 0.927947998046875, 0.9615402221679688, 0.9951324462890625, 1.0287246704101562, 1.06231689453125, 1.0959091186523438, 1.1295013427734375, 1.1630935668945312, 1.196685791015625, 1.2302780151367188, 1.2638702392578125, 1.2974624633789062, 1.3310546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 19.0, 92.0, 423.0, 367.0, 66.0, 21.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-13.477032661437988, -13.195364952087402, -12.913697242736816, -12.632030487060547, -12.350362777709961, -12.068695068359375, -11.787027359008789, -11.505359649658203, -11.223692893981934, -10.942025184631348, -10.660357475280762, -10.378690719604492, -10.097023010253906, -9.81535530090332, -9.533687591552734, -9.252019882202148, -8.970352172851562, -8.688684463500977, -8.40701675415039, -8.125349998474121, -7.843682289123535, -7.562014579772949, -7.280346870422363, -6.9986796379089355, -6.717012405395508, -6.435344696044922, -6.153677463531494, -5.872009754180908, -5.5903425216674805, -5.3086748123168945, -5.027007102966309, -4.745339870452881, -4.463673114776611, -4.182005405426025, -3.9003381729125977, -3.6186704635620117, -3.337003231048584, -3.055335521697998, -2.773668050765991, -2.4920005798339844, -2.2103331089019775, -1.9286656379699707, -1.6469981670379639, -1.3653305768966675, -1.0836631059646606, -0.8019956350326538, -0.5203280448913574, -0.23866057395935059, 0.04300689697265625, 0.3246743977069855, 0.6063418984413147, 0.8880094289779663, 1.1696768999099731, 1.45134437084198, 1.7330119609832764, 2.014679431915283, 2.29634690284729, 2.578014373779297, 2.8596818447113037, 3.1413493156433105, 3.4230170249938965, 3.704684257507324, 3.98635196685791, 4.268019676208496, 4.549686908721924]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 11.0, 11.0, 35.0, 37.0, 38.0, 47.0, 62.0, 62.0, 69.0, 92.0, 81.0, 88.0, 59.0, 72.0, 56.0, 40.0, 39.0, 23.0, 26.0, 13.0, 10.0, 10.0, 7.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4030470848083496, -1.3432602882385254, -1.2834734916687012, -1.2236865758895874, -1.1638997793197632, -1.104112982749939, -1.0443260669708252, -0.984539270401001, -0.9247524738311768, -0.8649656772613525, -0.8051788210868835, -0.7453919649124146, -0.6856051683425903, -0.6258183717727661, -0.5660315155982971, -0.5062446594238281, -0.4464578628540039, -0.3866710364818573, -0.3268842101097107, -0.2670973837375641, -0.20731055736541748, -0.14752373099327087, -0.08773690462112427, -0.02795007824897766, 0.031836748123168945, 0.09162357449531555, 0.15141040086746216, 0.21119722723960876, 0.27098405361175537, 0.330770879983902, 0.3905577063560486, 0.4503445327281952, 0.5101313591003418, 0.569918155670166, 0.629705011844635, 0.689491868019104, 0.7492786645889282, 0.8090654611587524, 0.8688523173332214, 0.9286391735076904, 0.9884259700775146, 1.0482127666473389, 1.107999563217163, 1.1677864789962769, 1.227573275566101, 1.2873600721359253, 1.347146987915039, 1.4069337844848633, 1.4667205810546875, 1.5265073776245117, 1.586294174194336, 1.6460810899734497, 1.705867886543274, 1.7656546831130981, 1.825441598892212, 1.8852283954620361, 1.9450151920318604, 2.0048019886016846, 2.064588785171509, 2.124375581741333, 2.1841626167297363, 2.2439494132995605, 2.3037362098693848, 2.363523006439209, 2.423309803009033]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 8.0, 10.0, 9.0, 7.0, 15.0, 19.0, 23.0, 38.0, 56.0, 76.0, 107.0, 182.0, 340.0, 732.0, 1954.0, 9527.0, 121676.0, 813378.0, 89147.0, 7955.0, 1810.0, 594.0, 304.0, 197.0, 122.0, 60.0, 51.0, 38.0, 23.0, 23.0, 10.0, 11.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.971160888671875, -1.89935302734375, -1.827545166015625, -1.7557373046875, -1.683929443359375, -1.61212158203125, -1.540313720703125, -1.468505859375, -1.396697998046875, -1.32489013671875, -1.253082275390625, -1.1812744140625, -1.109466552734375, -1.03765869140625, -0.965850830078125, -0.89404296875, -0.822235107421875, -0.75042724609375, -0.678619384765625, -0.6068115234375, -0.535003662109375, -0.46319580078125, -0.391387939453125, -0.319580078125, -0.247772216796875, -0.17596435546875, -0.104156494140625, -0.0323486328125, 0.039459228515625, 0.11126708984375, 0.183074951171875, 0.2548828125, 0.326690673828125, 0.39849853515625, 0.470306396484375, 0.5421142578125, 0.613922119140625, 0.68572998046875, 0.757537841796875, 0.829345703125, 0.901153564453125, 0.97296142578125, 1.044769287109375, 1.1165771484375, 1.188385009765625, 1.26019287109375, 1.332000732421875, 1.40380859375, 1.475616455078125, 1.54742431640625, 1.619232177734375, 1.6910400390625, 1.762847900390625, 1.83465576171875, 1.906463623046875, 1.978271484375, 2.050079345703125, 2.12188720703125, 2.193695068359375, 2.2655029296875, 2.337310791015625, 2.40911865234375, 2.480926513671875, 2.552734375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 6.0, 8.0, 19.0, 19.0, 37.0, 33.0, 49.0, 48.0, 57.0, 74.0, 78.0, 83.0, 87.0, 66.0, 82.0, 60.0, 48.0, 35.0, 34.0, 22.0, 15.0, 15.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10760498046875, -0.10328388214111328, -0.09896278381347656, -0.09464168548583984, -0.09032058715820312, -0.0859994888305664, -0.08167839050292969, -0.07735729217529297, -0.07303619384765625, -0.06871509552001953, -0.06439399719238281, -0.060072898864746094, -0.055751800537109375, -0.051430702209472656, -0.04710960388183594, -0.04278850555419922, -0.0384674072265625, -0.03414630889892578, -0.029825210571289062, -0.025504112243652344, -0.021183013916015625, -0.016861915588378906, -0.012540817260742188, -0.008219718933105469, -0.00389862060546875, 0.00042247772216796875, 0.0047435760498046875, 0.009064674377441406, 0.013385772705078125, 0.017706871032714844, 0.022027969360351562, 0.02634906768798828, 0.030670166015625, 0.03499126434326172, 0.03931236267089844, 0.043633460998535156, 0.047954559326171875, 0.052275657653808594, 0.05659675598144531, 0.06091785430908203, 0.06523895263671875, 0.06956005096435547, 0.07388114929199219, 0.0782022476196289, 0.08252334594726562, 0.08684444427490234, 0.09116554260253906, 0.09548664093017578, 0.0998077392578125, 0.10412883758544922, 0.10844993591308594, 0.11277103424072266, 0.11709213256835938, 0.1214132308959961, 0.1257343292236328, 0.13005542755126953, 0.13437652587890625, 0.13869762420654297, 0.1430187225341797, 0.1473398208618164, 0.15166091918945312, 0.15598201751708984, 0.16030311584472656, 0.16462421417236328, 0.1689453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 7.0, 7.0, 5.0, 10.0, 8.0, 25.0, 18.0, 33.0, 43.0, 68.0, 103.0, 134.0, 243.0, 394.0, 681.0, 1370.0, 2874.0, 6649.0, 18708.0, 67751.0, 299323.0, 473365.0, 127284.0, 31236.0, 10022.0, 3999.0, 1810.0, 950.0, 544.0, 327.0, 180.0, 130.0, 72.0, 49.0, 36.0, 25.0, 22.0, 13.0, 10.0, 2.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.92578125, -0.8994903564453125, -0.873199462890625, -0.8469085693359375, -0.82061767578125, -0.7943267822265625, -0.768035888671875, -0.7417449951171875, -0.7154541015625, -0.6891632080078125, -0.662872314453125, -0.6365814208984375, -0.61029052734375, -0.5839996337890625, -0.557708740234375, -0.5314178466796875, -0.505126953125, -0.4788360595703125, -0.452545166015625, -0.4262542724609375, -0.39996337890625, -0.3736724853515625, -0.347381591796875, -0.3210906982421875, -0.2947998046875, -0.2685089111328125, -0.242218017578125, -0.2159271240234375, -0.18963623046875, -0.1633453369140625, -0.137054443359375, -0.1107635498046875, -0.08447265625, -0.0581817626953125, -0.031890869140625, -0.0055999755859375, 0.02069091796875, 0.0469818115234375, 0.073272705078125, 0.0995635986328125, 0.1258544921875, 0.1521453857421875, 0.178436279296875, 0.2047271728515625, 0.23101806640625, 0.2573089599609375, 0.283599853515625, 0.3098907470703125, 0.336181640625, 0.3624725341796875, 0.388763427734375, 0.4150543212890625, 0.44134521484375, 0.4676361083984375, 0.493927001953125, 0.5202178955078125, 0.5465087890625, 0.5727996826171875, 0.599090576171875, 0.6253814697265625, 0.65167236328125, 0.6779632568359375, 0.704254150390625, 0.7305450439453125, 0.7568359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 3.0, 11.0, 12.0, 7.0, 15.0, 13.0, 17.0, 21.0, 26.0, 27.0, 35.0, 42.0, 47.0, 47.0, 53.0, 56.0, 56.0, 57.0, 58.0, 51.0, 33.0, 45.0, 42.0, 38.0, 31.0, 26.0, 20.0, 25.0, 15.0, 8.0, 14.0, 16.0, 5.0, 2.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.5205078125, -0.5063667297363281, -0.49222564697265625, -0.4780845642089844, -0.4639434814453125, -0.4498023986816406, -0.43566131591796875, -0.4215202331542969, -0.407379150390625, -0.3932380676269531, -0.37909698486328125, -0.3649559020996094, -0.3508148193359375, -0.3366737365722656, -0.32253265380859375, -0.3083915710449219, -0.29425048828125, -0.2801094055175781, -0.26596832275390625, -0.2518272399902344, -0.2376861572265625, -0.22354507446289062, -0.20940399169921875, -0.19526290893554688, -0.181121826171875, -0.16698074340820312, -0.15283966064453125, -0.13869857788085938, -0.1245574951171875, -0.11041641235351562, -0.09627532958984375, -0.08213424682617188, -0.0679931640625, -0.053852081298828125, -0.03971099853515625, -0.025569915771484375, -0.0114288330078125, 0.002712249755859375, 0.01685333251953125, 0.030994415283203125, 0.045135498046875, 0.059276580810546875, 0.07341766357421875, 0.08755874633789062, 0.1016998291015625, 0.11584091186523438, 0.12998199462890625, 0.14412307739257812, 0.15826416015625, 0.17240524291992188, 0.18654632568359375, 0.20068740844726562, 0.2148284912109375, 0.22896957397460938, 0.24311065673828125, 0.2572517395019531, 0.271392822265625, 0.2855339050292969, 0.29967498779296875, 0.3138160705566406, 0.3279571533203125, 0.3420982360839844, 0.35623931884765625, 0.3703804016113281, 0.384521484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 2.0, 6.0, 3.0, 7.0, 4.0, 13.0, 17.0, 28.0, 40.0, 61.0, 114.0, 174.0, 485.0, 1438.0, 5390.0, 33847.0, 847142.0, 144494.0, 11270.0, 2563.0, 791.0, 300.0, 142.0, 73.0, 43.0, 24.0, 18.0, 20.0, 16.0, 3.0, 5.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-1.333984375, -1.2966461181640625, -1.259307861328125, -1.2219696044921875, -1.18463134765625, -1.1472930908203125, -1.109954833984375, -1.0726165771484375, -1.0352783203125, -0.9979400634765625, -0.960601806640625, -0.9232635498046875, -0.88592529296875, -0.8485870361328125, -0.811248779296875, -0.7739105224609375, -0.736572265625, -0.6992340087890625, -0.661895751953125, -0.6245574951171875, -0.58721923828125, -0.5498809814453125, -0.512542724609375, -0.4752044677734375, -0.4378662109375, -0.4005279541015625, -0.363189697265625, -0.3258514404296875, -0.28851318359375, -0.2511749267578125, -0.213836669921875, -0.1764984130859375, -0.13916015625, -0.1018218994140625, -0.064483642578125, -0.0271453857421875, 0.01019287109375, 0.0475311279296875, 0.084869384765625, 0.1222076416015625, 0.1595458984375, 0.1968841552734375, 0.234222412109375, 0.2715606689453125, 0.30889892578125, 0.3462371826171875, 0.383575439453125, 0.4209136962890625, 0.458251953125, 0.4955902099609375, 0.532928466796875, 0.5702667236328125, 0.60760498046875, 0.6449432373046875, 0.682281494140625, 0.7196197509765625, 0.7569580078125, 0.7942962646484375, 0.831634521484375, 0.8689727783203125, 0.90631103515625, 0.9436492919921875, 0.980987548828125, 1.0183258056640625, 1.0556640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 10.0, 6.0, 8.0, 9.0, 9.0, 23.0, 25.0, 34.0, 46.0, 69.0, 118.0, 110.0, 127.0, 121.0, 98.0, 62.0, 34.0, 21.0, 24.0, 11.0, 6.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.207559585571289e-05, -7.894355803728104e-05, -7.581152021884918e-05, -7.267948240041733e-05, -6.954744458198547e-05, -6.641540676355362e-05, -6.328336894512177e-05, -6.015133112668991e-05, -5.701929330825806e-05, -5.38872554898262e-05, -5.075521767139435e-05, -4.7623179852962494e-05, -4.449114203453064e-05, -4.1359104216098785e-05, -3.822706639766693e-05, -3.509502857923508e-05, -3.196299076080322e-05, -2.883095294237137e-05, -2.5698915123939514e-05, -2.256687730550766e-05, -1.9434839487075806e-05, -1.630280166864395e-05, -1.3170763850212097e-05, -1.0038726031780243e-05, -6.906688213348389e-06, -3.7746503949165344e-06, -6.426125764846802e-07, 2.489425241947174e-06, 5.621463060379028e-06, 8.753500878810883e-06, 1.1885538697242737e-05, 1.5017576515674591e-05, 1.8149614334106445e-05, 2.12816521525383e-05, 2.4413689970970154e-05, 2.7545727789402008e-05, 3.067776560783386e-05, 3.3809803426265717e-05, 3.694184124469757e-05, 4.0073879063129425e-05, 4.320591688156128e-05, 4.6337954699993134e-05, 4.946999251842499e-05, 5.260203033685684e-05, 5.5734068155288696e-05, 5.886610597372055e-05, 6.19981437921524e-05, 6.513018161058426e-05, 6.826221942901611e-05, 7.139425724744797e-05, 7.452629506587982e-05, 7.765833288431168e-05, 8.079037070274353e-05, 8.392240852117538e-05, 8.705444633960724e-05, 9.018648415803909e-05, 9.331852197647095e-05, 9.64505597949028e-05, 9.958259761333466e-05, 0.00010271463543176651, 0.00010584667325019836, 0.00010897871106863022, 0.00011211074888706207, 0.00011524278670549393, 0.00011837482452392578]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 9.0, 10.0, 11.0, 23.0, 28.0, 43.0, 73.0, 81.0, 142.0, 211.0, 443.0, 820.0, 1789.0, 4205.0, 11410.0, 47320.0, 555671.0, 374097.0, 35713.0, 9474.0, 3605.0, 1651.0, 734.0, 399.0, 232.0, 118.0, 75.0, 49.0, 22.0, 21.0, 16.0, 15.0, 10.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.65185546875, -0.6326370239257812, -0.6134185791015625, -0.5942001342773438, -0.574981689453125, -0.5557632446289062, -0.5365447998046875, -0.5173263549804688, -0.49810791015625, -0.47888946533203125, -0.4596710205078125, -0.44045257568359375, -0.421234130859375, -0.40201568603515625, -0.3827972412109375, -0.36357879638671875, -0.3443603515625, -0.32514190673828125, -0.3059234619140625, -0.28670501708984375, -0.267486572265625, -0.24826812744140625, -0.2290496826171875, -0.20983123779296875, -0.19061279296875, -0.17139434814453125, -0.1521759033203125, -0.13295745849609375, -0.113739013671875, -0.09452056884765625, -0.0753021240234375, -0.05608367919921875, -0.036865234375, -0.01764678955078125, 0.0015716552734375, 0.02079010009765625, 0.040008544921875, 0.05922698974609375, 0.0784454345703125, 0.09766387939453125, 0.11688232421875, 0.13610076904296875, 0.1553192138671875, 0.17453765869140625, 0.193756103515625, 0.21297454833984375, 0.2321929931640625, 0.25141143798828125, 0.2706298828125, 0.28984832763671875, 0.3090667724609375, 0.32828521728515625, 0.347503662109375, 0.36672210693359375, 0.3859405517578125, 0.40515899658203125, 0.42437744140625, 0.44359588623046875, 0.4628143310546875, 0.48203277587890625, 0.501251220703125, 0.5204696655273438, 0.5396881103515625, 0.5589065551757812, 0.578125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 6.0, 2.0, 5.0, 6.0, 6.0, 9.0, 14.0, 29.0, 42.0, 74.0, 134.0, 177.0, 178.0, 107.0, 80.0, 47.0, 26.0, 16.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486328125, -0.4715843200683594, -0.45684051513671875, -0.4420967102050781, -0.4273529052734375, -0.4126091003417969, -0.39786529541015625, -0.3831214904785156, -0.368377685546875, -0.3536338806152344, -0.33889007568359375, -0.3241462707519531, -0.3094024658203125, -0.2946586608886719, -0.27991485595703125, -0.2651710510253906, -0.25042724609375, -0.23568344116210938, -0.22093963623046875, -0.20619583129882812, -0.1914520263671875, -0.17670822143554688, -0.16196441650390625, -0.14722061157226562, -0.132476806640625, -0.11773300170898438, -0.10298919677734375, -0.08824539184570312, -0.0735015869140625, -0.058757781982421875, -0.04401397705078125, -0.029270172119140625, -0.0145263671875, 0.000217437744140625, 0.01496124267578125, 0.029705047607421875, 0.0444488525390625, 0.059192657470703125, 0.07393646240234375, 0.08868026733398438, 0.103424072265625, 0.11816787719726562, 0.13291168212890625, 0.14765548706054688, 0.1623992919921875, 0.17714309692382812, 0.19188690185546875, 0.20663070678710938, 0.22137451171875, 0.23611831665039062, 0.25086212158203125, 0.2656059265136719, 0.2803497314453125, 0.2950935363769531, 0.30983734130859375, 0.3245811462402344, 0.339324951171875, 0.3540687561035156, 0.36881256103515625, 0.3835563659667969, 0.3983001708984375, 0.4130439758300781, 0.42778778076171875, 0.4425315856933594, 0.457275390625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 7.0, 5.0, 32.0, 113.0, 239.0, 334.0, 171.0, 69.0, 20.0, 12.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.548263549804688, -9.185465812683105, -8.822668075561523, -8.459871292114258, -8.097073554992676, -7.734275817871094, -7.371478080749512, -7.008680820465088, -6.645883560180664, -6.283085823059082, -5.920288562774658, -5.557490825653076, -5.194693565368652, -4.83189582824707, -4.469098091125488, -4.1063008308410645, -3.7435030937194824, -3.3807055950164795, -3.0179080963134766, -2.6551103591918945, -2.2923130989074707, -1.9295154809951782, -1.5667178630828857, -1.2039203643798828, -0.8411228656768799, -0.47832533717155457, -0.11552780866622925, 0.24726974964141846, 0.6100672483444214, 0.9728647470474243, 1.3356623649597168, 1.6984598636627197, 2.0612573623657227, 2.4240548610687256, 2.7868523597717285, 3.1496500968933105, 3.5124473571777344, 3.8752450942993164, 4.238042831420898, 4.600840091705322, 4.963637351989746, 5.326435089111328, 5.689232349395752, 6.052030086517334, 6.414827346801758, 6.77762508392334, 7.140422821044922, 7.503220081329346, 7.866017818450928, 8.228815078735352, 8.591612815856934, 8.954410552978516, 9.317208290100098, 9.680005073547363, 10.042802810668945, 10.405600547790527, 10.76839828491211, 11.131196022033691, 11.493993759155273, 11.856790542602539, 12.219588279724121, 12.582386016845703, 12.945183753967285, 13.307981491088867, 13.670778274536133]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 7.0, 4.0, 7.0, 7.0, 12.0, 17.0, 16.0, 16.0, 25.0, 25.0, 34.0, 30.0, 39.0, 40.0, 39.0, 54.0, 46.0, 47.0, 61.0, 59.0, 43.0, 56.0, 52.0, 37.0, 44.0, 32.0, 31.0, 26.0, 23.0, 13.0, 14.0, 5.0, 14.0, 4.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0359015464782715, -2.949129104614258, -2.862356424331665, -2.7755839824676514, -2.6888115406036377, -2.602038860321045, -2.5152664184570312, -2.4284939765930176, -2.341721296310425, -2.254948854446411, -2.1681761741638184, -2.0814037322998047, -1.9946311712265015, -1.9078586101531982, -1.8210861682891846, -1.7343136072158813, -1.6475411653518677, -1.5607686042785645, -1.4739961624145508, -1.3872236013412476, -1.3004510402679443, -1.2136785984039307, -1.1269060373306274, -1.0401334762573242, -0.9533609747886658, -0.8665884733200073, -0.7798159122467041, -0.6930434107780457, -0.6062709093093872, -0.519498348236084, -0.43272584676742554, -0.3459532856941223, -0.25918078422546387, -0.17240825295448303, -0.08563573658466339, 0.00113677978515625, 0.08790931105613708, 0.17468184232711792, 0.26145434379577637, 0.3482269048690796, 0.43499940633773804, 0.5217719078063965, 0.6085444688796997, 0.6953169703483582, 0.7820894718170166, 0.8688620328903198, 0.9556345343589783, 1.0424070358276367, 1.12917959690094, 1.2159521579742432, 1.3027245998382568, 1.38949716091156, 1.4762697219848633, 1.563042163848877, 1.6498147249221802, 1.7365872859954834, 1.823359727859497, 1.9101322889328003, 1.996904730796814, 2.083677291870117, 2.170449733734131, 2.2572224140167236, 2.3439948558807373, 2.43076753616333, 2.5175399780273438]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 6.0, 6.0, 6.0, 5.0, 8.0, 13.0, 7.0, 11.0, 16.0, 22.0, 17.0, 26.0, 38.0, 70.0, 71.0, 128.0, 242.0, 496.0, 1420.0, 6761.0, 71579.0, 3989565.0, 110789.0, 9486.0, 2028.0, 674.0, 309.0, 170.0, 88.0, 78.0, 42.0, 28.0, 19.0, 20.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-3.2578125, -3.17547607421875, -3.0931396484375, -3.01080322265625, -2.928466796875, -2.84613037109375, -2.7637939453125, -2.68145751953125, -2.59912109375, -2.51678466796875, -2.4344482421875, -2.35211181640625, -2.269775390625, -2.18743896484375, -2.1051025390625, -2.02276611328125, -1.9404296875, -1.85809326171875, -1.7757568359375, -1.69342041015625, -1.611083984375, -1.52874755859375, -1.4464111328125, -1.36407470703125, -1.28173828125, -1.19940185546875, -1.1170654296875, -1.03472900390625, -0.952392578125, -0.87005615234375, -0.7877197265625, -0.70538330078125, -0.623046875, -0.54071044921875, -0.4583740234375, -0.37603759765625, -0.293701171875, -0.21136474609375, -0.1290283203125, -0.04669189453125, 0.03564453125, 0.11798095703125, 0.2003173828125, 0.28265380859375, 0.364990234375, 0.44732666015625, 0.5296630859375, 0.61199951171875, 0.6943359375, 0.77667236328125, 0.8590087890625, 0.94134521484375, 1.023681640625, 1.10601806640625, 1.1883544921875, 1.27069091796875, 1.35302734375, 1.43536376953125, 1.5177001953125, 1.60003662109375, 1.682373046875, 1.76470947265625, 1.8470458984375, 1.92938232421875, 2.01171875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 10.0, 12.0, 16.0, 18.0, 26.0, 34.0, 41.0, 41.0, 43.0, 45.0, 50.0, 55.0, 80.0, 60.0, 54.0, 69.0, 46.0, 47.0, 47.0, 31.0, 33.0, 27.0, 23.0, 22.0, 19.0, 19.0, 12.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08978271484375, -0.08627033233642578, -0.08275794982910156, -0.07924556732177734, -0.07573318481445312, -0.0722208023071289, -0.06870841979980469, -0.06519603729248047, -0.06168365478515625, -0.05817127227783203, -0.05465888977050781, -0.051146507263183594, -0.047634124755859375, -0.044121742248535156, -0.04060935974121094, -0.03709697723388672, -0.0335845947265625, -0.03007221221923828, -0.026559829711914062, -0.023047447204589844, -0.019535064697265625, -0.016022682189941406, -0.012510299682617188, -0.008997917175292969, -0.00548553466796875, -0.0019731521606445312, 0.0015392303466796875, 0.005051612854003906, 0.008563995361328125, 0.012076377868652344, 0.015588760375976562, 0.01910114288330078, 0.022613525390625, 0.02612590789794922, 0.029638290405273438, 0.033150672912597656, 0.036663055419921875, 0.040175437927246094, 0.04368782043457031, 0.04720020294189453, 0.05071258544921875, 0.05422496795654297, 0.05773735046386719, 0.061249732971191406, 0.06476211547851562, 0.06827449798583984, 0.07178688049316406, 0.07529926300048828, 0.0788116455078125, 0.08232402801513672, 0.08583641052246094, 0.08934879302978516, 0.09286117553710938, 0.0963735580444336, 0.09988594055175781, 0.10339832305908203, 0.10691070556640625, 0.11042308807373047, 0.11393547058105469, 0.1174478530883789, 0.12096023559570312, 0.12447261810302734, 0.12798500061035156, 0.13149738311767578, 0.135009765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 14.0, 22.0, 42.0, 101.0, 177.0, 442.0, 1090.0, 4229.0, 258600.0, 3920113.0, 7162.0, 1283.0, 514.0, 244.0, 106.0, 49.0, 38.0, 23.0, 13.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.55810546875, -2.4169921875, -2.27587890625, -2.134765625, -1.99365234375, -1.8525390625, -1.71142578125, -1.5703125, -1.42919921875, -1.2880859375, -1.14697265625, -1.005859375, -0.86474609375, -0.7236328125, -0.58251953125, -0.44140625, -0.30029296875, -0.1591796875, -0.01806640625, 0.123046875, 0.26416015625, 0.4052734375, 0.54638671875, 0.6875, 0.82861328125, 0.9697265625, 1.11083984375, 1.251953125, 1.39306640625, 1.5341796875, 1.67529296875, 1.81640625, 1.95751953125, 2.0986328125, 2.23974609375, 2.380859375, 2.52197265625, 2.6630859375, 2.80419921875, 2.9453125, 3.08642578125, 3.2275390625, 3.36865234375, 3.509765625, 3.65087890625, 3.7919921875, 3.93310546875, 4.07421875, 4.21533203125, 4.3564453125, 4.49755859375, 4.638671875, 4.77978515625, 4.9208984375, 5.06201171875, 5.203125, 5.34423828125, 5.4853515625, 5.62646484375, 5.767578125, 5.90869140625, 6.0498046875, 6.19091796875, 6.33203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 13.0, 34.0, 81.0, 366.0, 2830.0, 558.0, 132.0, 36.0, 12.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.49877166748046875, -0.4745941162109375, -0.45041656494140625, -0.426239013671875, -0.40206146240234375, -0.3778839111328125, -0.35370635986328125, -0.32952880859375, -0.30535125732421875, -0.2811737060546875, -0.25699615478515625, -0.232818603515625, -0.20864105224609375, -0.1844635009765625, -0.16028594970703125, -0.1361083984375, -0.11193084716796875, -0.0877532958984375, -0.06357574462890625, -0.039398193359375, -0.01522064208984375, 0.0089569091796875, 0.03313446044921875, 0.05731201171875, 0.08148956298828125, 0.1056671142578125, 0.12984466552734375, 0.154022216796875, 0.17819976806640625, 0.2023773193359375, 0.22655487060546875, 0.250732421875, 0.27490997314453125, 0.2990875244140625, 0.32326507568359375, 0.347442626953125, 0.37162017822265625, 0.3957977294921875, 0.41997528076171875, 0.44415283203125, 0.46833038330078125, 0.4925079345703125, 0.5166854858398438, 0.540863037109375, 0.5650405883789062, 0.5892181396484375, 0.6133956909179688, 0.6375732421875, 0.6617507934570312, 0.6859283447265625, 0.7101058959960938, 0.734283447265625, 0.7584609985351562, 0.7826385498046875, 0.8068161010742188, 0.83099365234375, 0.8551712036132812, 0.8793487548828125, 0.9035263061523438, 0.927703857421875, 0.9518814086914062, 0.9760589599609375, 1.0002365112304688, 1.0244140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 11.0, 54.0, 303.0, 467.0, 119.0, 33.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.450301647186279, -5.225833892822266, -5.00136661529541, -4.776899337768555, -4.552431583404541, -4.327963829040527, -4.103496551513672, -3.8790290355682373, -3.6545615196228027, -3.430094003677368, -3.2056264877319336, -2.981158971786499, -2.7566914558410645, -2.53222393989563, -2.3077564239501953, -2.0832889080047607, -1.8588213920593262, -1.6343538761138916, -1.409886360168457, -1.1854188442230225, -0.9609513282775879, -0.7364838123321533, -0.5120162963867188, -0.2875487804412842, -0.06308126449584961, 0.16138625144958496, 0.38585376739501953, 0.6103212833404541, 0.8347887992858887, 1.0592563152313232, 1.2837238311767578, 1.5081913471221924, 1.7326583862304688, 1.9571259021759033, 2.181593418121338, 2.4060609340667725, 2.630528450012207, 2.8549959659576416, 3.079463481903076, 3.3039309978485107, 3.5283985137939453, 3.75286602973938, 3.9773335456848145, 4.201801300048828, 4.426268577575684, 4.650735855102539, 4.875203609466553, 5.099671363830566, 5.324138641357422, 5.548605918884277, 5.773073673248291, 5.997541427612305, 6.22200870513916, 6.446475982666016, 6.670943737030029, 6.895411491394043, 7.119878768920898, 7.344346046447754, 7.568813800811768, 7.793281555175781, 8.017748832702637, 8.242216110229492, 8.466684341430664, 8.69115161895752, 8.915618896484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 15.0, 18.0, 13.0, 37.0, 40.0, 43.0, 49.0, 65.0, 74.0, 85.0, 69.0, 73.0, 64.0, 59.0, 60.0, 47.0, 39.0, 45.0, 35.0, 25.0, 11.0, 9.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6858141422271729, -1.6417864561080933, -1.5977587699890137, -1.5537312030792236, -1.509703516960144, -1.4656758308410645, -1.4216482639312744, -1.3776205778121948, -1.3335928916931152, -1.2895652055740356, -1.245537519454956, -1.201509952545166, -1.1574822664260864, -1.1134545803070068, -1.0694270133972168, -1.0253993272781372, -0.9813716411590576, -0.937343955039978, -0.8933163285255432, -0.8492887020111084, -0.8052610158920288, -0.7612333297729492, -0.7172057032585144, -0.6731780767440796, -0.629150390625, -0.5851227045059204, -0.5410950779914856, -0.4970674216747284, -0.4530397653579712, -0.409012109041214, -0.3649844527244568, -0.3209567964076996, -0.27692925930023193, -0.23290160298347473, -0.18887394666671753, -0.14484629034996033, -0.10081863403320312, -0.05679097771644592, -0.01276332139968872, 0.03126433491706848, 0.07529199123382568, 0.11931964755058289, 0.1633473038673401, 0.2073749601840973, 0.2514026165008545, 0.2954302728176117, 0.3394579291343689, 0.3834855854511261, 0.4275132417678833, 0.4715408980846405, 0.5155685544013977, 0.5595961809158325, 0.6036238670349121, 0.6476515531539917, 0.6916791796684265, 0.7357068061828613, 0.7797344923019409, 0.8237621784210205, 0.8677898049354553, 0.9118174314498901, 0.9558451175689697, 0.9998728036880493, 1.043900489807129, 1.087928056716919, 1.1319557428359985]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 2.0, 3.0, 7.0, 10.0, 8.0, 15.0, 13.0, 18.0, 30.0, 27.0, 37.0, 47.0, 83.0, 129.0, 205.0, 312.0, 642.0, 1413.0, 4215.0, 21046.0, 220978.0, 703656.0, 80267.0, 10441.0, 2671.0, 990.0, 481.0, 298.0, 165.0, 88.0, 64.0, 42.0, 34.0, 23.0, 27.0, 15.0, 12.0, 9.0, 3.0, 8.0, 1.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0], "bins": [-2.46875, -2.4025726318359375, -2.336395263671875, -2.2702178955078125, -2.20404052734375, -2.1378631591796875, -2.071685791015625, -2.0055084228515625, -1.9393310546875, -1.8731536865234375, -1.806976318359375, -1.7407989501953125, -1.67462158203125, -1.6084442138671875, -1.542266845703125, -1.4760894775390625, -1.409912109375, -1.3437347412109375, -1.277557373046875, -1.2113800048828125, -1.14520263671875, -1.0790252685546875, -1.012847900390625, -0.9466705322265625, -0.8804931640625, -0.8143157958984375, -0.748138427734375, -0.6819610595703125, -0.61578369140625, -0.5496063232421875, -0.483428955078125, -0.4172515869140625, -0.35107421875, -0.2848968505859375, -0.218719482421875, -0.1525421142578125, -0.08636474609375, -0.0201873779296875, 0.045989990234375, 0.1121673583984375, 0.1783447265625, 0.2445220947265625, 0.310699462890625, 0.3768768310546875, 0.44305419921875, 0.5092315673828125, 0.575408935546875, 0.6415863037109375, 0.707763671875, 0.7739410400390625, 0.840118408203125, 0.9062957763671875, 0.97247314453125, 1.0386505126953125, 1.104827880859375, 1.1710052490234375, 1.2371826171875, 1.3033599853515625, 1.369537353515625, 1.4357147216796875, 1.50189208984375, 1.5680694580078125, 1.634246826171875, 1.7004241943359375, 1.7666015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 19.0, 10.0, 22.0, 24.0, 38.0, 37.0, 54.0, 51.0, 62.0, 59.0, 65.0, 80.0, 66.0, 66.0, 49.0, 58.0, 56.0, 44.0, 32.0, 27.0, 20.0, 12.0, 8.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.1180868148803711, -0.11379814147949219, -0.10950946807861328, -0.10522079467773438, -0.10093212127685547, -0.09664344787597656, -0.09235477447509766, -0.08806610107421875, -0.08377742767333984, -0.07948875427246094, -0.07520008087158203, -0.07091140747070312, -0.06662273406982422, -0.06233406066894531, -0.058045387268066406, -0.0537567138671875, -0.049468040466308594, -0.04517936706542969, -0.04089069366455078, -0.036602020263671875, -0.03231334686279297, -0.028024673461914062, -0.023736000061035156, -0.01944732666015625, -0.015158653259277344, -0.010869979858398438, -0.006581306457519531, -0.002292633056640625, 0.0019960403442382812, 0.0062847137451171875, 0.010573387145996094, 0.014862060546875, 0.019150733947753906, 0.023439407348632812, 0.02772808074951172, 0.032016754150390625, 0.03630542755126953, 0.04059410095214844, 0.044882774353027344, 0.04917144775390625, 0.053460121154785156, 0.05774879455566406, 0.06203746795654297, 0.06632614135742188, 0.07061481475830078, 0.07490348815917969, 0.0791921615600586, 0.0834808349609375, 0.0877695083618164, 0.09205818176269531, 0.09634685516357422, 0.10063552856445312, 0.10492420196533203, 0.10921287536621094, 0.11350154876708984, 0.11779022216796875, 0.12207889556884766, 0.12636756896972656, 0.13065624237060547, 0.13494491577148438, 0.13923358917236328, 0.1435222625732422, 0.1478109359741211, 0.152099609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 5.0, 7.0, 4.0, 15.0, 19.0, 29.0, 47.0, 91.0, 152.0, 235.0, 432.0, 955.0, 2315.0, 6706.0, 28079.0, 237433.0, 653549.0, 95982.0, 14980.0, 4244.0, 1643.0, 727.0, 379.0, 197.0, 117.0, 58.0, 44.0, 35.0, 18.0, 10.0, 8.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.337890625, -1.2888946533203125, -1.239898681640625, -1.1909027099609375, -1.14190673828125, -1.0929107666015625, -1.043914794921875, -0.9949188232421875, -0.9459228515625, -0.8969268798828125, -0.847930908203125, -0.7989349365234375, -0.74993896484375, -0.7009429931640625, -0.651947021484375, -0.6029510498046875, -0.553955078125, -0.5049591064453125, -0.455963134765625, -0.4069671630859375, -0.35797119140625, -0.3089752197265625, -0.259979248046875, -0.2109832763671875, -0.1619873046875, -0.1129913330078125, -0.063995361328125, -0.0149993896484375, 0.03399658203125, 0.0829925537109375, 0.131988525390625, 0.1809844970703125, 0.22998046875, 0.2789764404296875, 0.327972412109375, 0.3769683837890625, 0.42596435546875, 0.4749603271484375, 0.523956298828125, 0.5729522705078125, 0.6219482421875, 0.6709442138671875, 0.719940185546875, 0.7689361572265625, 0.81793212890625, 0.8669281005859375, 0.915924072265625, 0.9649200439453125, 1.013916015625, 1.0629119873046875, 1.111907958984375, 1.1609039306640625, 1.20989990234375, 1.2588958740234375, 1.307891845703125, 1.3568878173828125, 1.4058837890625, 1.4548797607421875, 1.503875732421875, 1.5528717041015625, 1.60186767578125, 1.6508636474609375, 1.699859619140625, 1.7488555908203125, 1.7978515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 6.0, 2.0, 7.0, 5.0, 7.0, 5.0, 7.0, 15.0, 19.0, 14.0, 24.0, 30.0, 36.0, 44.0, 36.0, 49.0, 46.0, 54.0, 44.0, 55.0, 64.0, 49.0, 38.0, 56.0, 34.0, 46.0, 39.0, 29.0, 27.0, 20.0, 22.0, 15.0, 16.0, 9.0, 7.0, 7.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.418212890625, -0.4025154113769531, -0.38681793212890625, -0.3711204528808594, -0.3554229736328125, -0.3397254943847656, -0.32402801513671875, -0.3083305358886719, -0.292633056640625, -0.2769355773925781, -0.26123809814453125, -0.24554061889648438, -0.2298431396484375, -0.21414566040039062, -0.19844818115234375, -0.18275070190429688, -0.16705322265625, -0.15135574340820312, -0.13565826416015625, -0.11996078491210938, -0.1042633056640625, -0.08856582641601562, -0.07286834716796875, -0.057170867919921875, -0.041473388671875, -0.025775909423828125, -0.01007843017578125, 0.005619049072265625, 0.0213165283203125, 0.037014007568359375, 0.05271148681640625, 0.06840896606445312, 0.0841064453125, 0.09980392456054688, 0.11550140380859375, 0.13119888305664062, 0.1468963623046875, 0.16259384155273438, 0.17829132080078125, 0.19398880004882812, 0.209686279296875, 0.22538375854492188, 0.24108123779296875, 0.2567787170410156, 0.2724761962890625, 0.2881736755371094, 0.30387115478515625, 0.3195686340332031, 0.33526611328125, 0.3509635925292969, 0.36666107177734375, 0.3823585510253906, 0.3980560302734375, 0.4137535095214844, 0.42945098876953125, 0.4451484680175781, 0.460845947265625, 0.4765434265136719, 0.49224090576171875, 0.5079383850097656, 0.5236358642578125, 0.5393333435058594, 0.5550308227539062, 0.5707283020019531, 0.58642578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 11.0, 11.0, 22.0, 32.0, 50.0, 78.0, 136.0, 250.0, 390.0, 862.0, 2150.0, 7145.0, 38538.0, 397778.0, 535842.0, 51817.0, 8930.0, 2481.0, 932.0, 453.0, 226.0, 138.0, 85.0, 53.0, 27.0, 22.0, 26.0, 15.0, 11.0, 8.0, 3.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.68212890625, -0.662109375, -0.64208984375, -0.6220703125, -0.60205078125, -0.58203125, -0.56201171875, -0.5419921875, -0.52197265625, -0.501953125, -0.48193359375, -0.4619140625, -0.44189453125, -0.421875, -0.40185546875, -0.3818359375, -0.36181640625, -0.341796875, -0.32177734375, -0.3017578125, -0.28173828125, -0.26171875, -0.24169921875, -0.2216796875, -0.20166015625, -0.181640625, -0.16162109375, -0.1416015625, -0.12158203125, -0.1015625, -0.08154296875, -0.0615234375, -0.04150390625, -0.021484375, -0.00146484375, 0.0185546875, 0.03857421875, 0.05859375, 0.07861328125, 0.0986328125, 0.11865234375, 0.138671875, 0.15869140625, 0.1787109375, 0.19873046875, 0.21875, 0.23876953125, 0.2587890625, 0.27880859375, 0.298828125, 0.31884765625, 0.3388671875, 0.35888671875, 0.37890625, 0.39892578125, 0.4189453125, 0.43896484375, 0.458984375, 0.47900390625, 0.4990234375, 0.51904296875, 0.5390625, 0.55908203125, 0.5791015625, 0.59912109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 10.0, 7.0, 15.0, 11.0, 19.0, 18.0, 54.0, 49.0, 82.0, 110.0, 126.0, 112.0, 106.0, 87.0, 50.0, 34.0, 25.0, 24.0, 17.0, 11.0, 8.0, 4.0, 1.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.970499038696289e-05, -8.610356599092484e-05, -8.250214159488678e-05, -7.890071719884872e-05, -7.529929280281067e-05, -7.169786840677261e-05, -6.809644401073456e-05, -6.44950196146965e-05, -6.089359521865845e-05, -5.729217082262039e-05, -5.3690746426582336e-05, -5.008932203054428e-05, -4.6487897634506226e-05, -4.288647323846817e-05, -3.9285048842430115e-05, -3.568362444639206e-05, -3.2082200050354004e-05, -2.848077565431595e-05, -2.4879351258277893e-05, -2.1277926862239838e-05, -1.7676502466201782e-05, -1.4075078070163727e-05, -1.0473653674125671e-05, -6.872229278087616e-06, -3.2708048820495605e-06, 3.3061951398849487e-07, 3.93204391002655e-06, 7.533468306064606e-06, 1.1134892702102661e-05, 1.4736317098140717e-05, 1.8337741494178772e-05, 2.1939165890216827e-05, 2.5540590286254883e-05, 2.9142014682292938e-05, 3.2743439078330994e-05, 3.634486347436905e-05, 3.9946287870407104e-05, 4.354771226644516e-05, 4.7149136662483215e-05, 5.075056105852127e-05, 5.4351985454559326e-05, 5.795340985059738e-05, 6.155483424663544e-05, 6.515625864267349e-05, 6.875768303871155e-05, 7.23591074347496e-05, 7.596053183078766e-05, 7.956195622682571e-05, 8.316338062286377e-05, 8.676480501890182e-05, 9.036622941493988e-05, 9.396765381097794e-05, 9.756907820701599e-05, 0.00010117050260305405, 0.0001047719269990921, 0.00010837335139513016, 0.00011197477579116821, 0.00011557620018720627, 0.00011917762458324432, 0.00012277904897928238, 0.00012638047337532043, 0.0001299818977713585, 0.00013358332216739655, 0.0001371847465634346, 0.00014078617095947266]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 11.0, 17.0, 25.0, 25.0, 33.0, 64.0, 112.0, 168.0, 322.0, 567.0, 1201.0, 2762.0, 7178.0, 23697.0, 115303.0, 580359.0, 255268.0, 42346.0, 11530.0, 4090.0, 1732.0, 805.0, 366.0, 213.0, 122.0, 75.0, 50.0, 37.0, 19.0, 12.0, 10.0, 9.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36376953125, -0.35109710693359375, -0.3384246826171875, -0.32575225830078125, -0.313079833984375, -0.30040740966796875, -0.2877349853515625, -0.27506256103515625, -0.26239013671875, -0.24971771240234375, -0.2370452880859375, -0.22437286376953125, -0.211700439453125, -0.19902801513671875, -0.1863555908203125, -0.17368316650390625, -0.1610107421875, -0.14833831787109375, -0.1356658935546875, -0.12299346923828125, -0.110321044921875, -0.09764862060546875, -0.0849761962890625, -0.07230377197265625, -0.05963134765625, -0.04695892333984375, -0.0342864990234375, -0.02161407470703125, -0.008941650390625, 0.00373077392578125, 0.0164031982421875, 0.02907562255859375, 0.041748046875, 0.05442047119140625, 0.0670928955078125, 0.07976531982421875, 0.092437744140625, 0.10511016845703125, 0.1177825927734375, 0.13045501708984375, 0.14312744140625, 0.15579986572265625, 0.1684722900390625, 0.18114471435546875, 0.193817138671875, 0.20648956298828125, 0.2191619873046875, 0.23183441162109375, 0.2445068359375, 0.25717926025390625, 0.2698516845703125, 0.28252410888671875, 0.295196533203125, 0.30786895751953125, 0.3205413818359375, 0.33321380615234375, 0.34588623046875, 0.35855865478515625, 0.3712310791015625, 0.38390350341796875, 0.396575927734375, 0.40924835205078125, 0.4219207763671875, 0.43459320068359375, 0.447265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 9.0, 8.0, 9.0, 14.0, 20.0, 25.0, 37.0, 27.0, 28.0, 62.0, 52.0, 73.0, 78.0, 80.0, 80.0, 61.0, 49.0, 52.0, 46.0, 20.0, 30.0, 33.0, 20.0, 19.0, 18.0, 10.0, 5.0, 3.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2218017578125, -0.2152538299560547, -0.20870590209960938, -0.20215797424316406, -0.19561004638671875, -0.18906211853027344, -0.18251419067382812, -0.1759662628173828, -0.1694183349609375, -0.1628704071044922, -0.15632247924804688, -0.14977455139160156, -0.14322662353515625, -0.13667869567871094, -0.13013076782226562, -0.12358283996582031, -0.117034912109375, -0.11048698425292969, -0.10393905639648438, -0.09739112854003906, -0.09084320068359375, -0.08429527282714844, -0.07774734497070312, -0.07119941711425781, -0.0646514892578125, -0.05810356140136719, -0.051555633544921875, -0.04500770568847656, -0.03845977783203125, -0.03191184997558594, -0.025363922119140625, -0.018815994262695312, -0.01226806640625, -0.0057201385498046875, 0.000827789306640625, 0.0073757171630859375, 0.01392364501953125, 0.020471572875976562, 0.027019500732421875, 0.03356742858886719, 0.0401153564453125, 0.04666328430175781, 0.053211212158203125, 0.05975914001464844, 0.06630706787109375, 0.07285499572753906, 0.07940292358398438, 0.08595085144042969, 0.092498779296875, 0.09904670715332031, 0.10559463500976562, 0.11214256286621094, 0.11869049072265625, 0.12523841857910156, 0.13178634643554688, 0.1383342742919922, 0.1448822021484375, 0.1514301300048828, 0.15797805786132812, 0.16452598571777344, 0.17107391357421875, 0.17762184143066406, 0.18416976928710938, 0.1907176971435547, 0.197265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 42.0, 71.0, 222.0, 307.0, 208.0, 88.0, 34.0, 12.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.069975852966309, -8.64826774597168, -8.226558685302734, -7.8048505783081055, -7.38314151763916, -6.961433410644531, -6.539724826812744, -6.118016242980957, -5.69630765914917, -5.274599075317383, -4.852890491485596, -4.431181907653809, -4.00947380065918, -3.5877649784088135, -3.1660566329956055, -2.7443480491638184, -2.3226394653320312, -1.9009308815002441, -1.4792224168777466, -1.057513952255249, -0.6358053684234619, -0.2140967845916748, 0.2076115608215332, 0.6293201446533203, 1.0510287284851074, 1.4727373123168945, 1.894445776939392, 2.3161542415618896, 2.7378628253936768, 3.159571409225464, 3.581279754638672, 4.002988338470459, 4.42469596862793, 4.846404552459717, 5.268113136291504, 5.689821243286133, 6.111530303955078, 6.533238410949707, 6.954946994781494, 7.376655578613281, 7.798364162445068, 8.220072746276855, 8.641780853271484, 9.06348991394043, 9.485198020935059, 9.906907081604004, 10.328615188598633, 10.750324249267578, 11.172032356262207, 11.593740463256836, 12.015449523925781, 12.43715763092041, 12.858866691589355, 13.280574798583984, 13.70228385925293, 14.123991966247559, 14.545700073242188, 14.967408180236816, 15.389117240905762, 15.81082534790039, 16.232534408569336, 16.65424346923828, 17.075950622558594, 17.49765968322754, 17.919368743896484]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 9.0, 6.0, 12.0, 11.0, 15.0, 26.0, 36.0, 46.0, 45.0, 32.0, 50.0, 58.0, 62.0, 67.0, 57.0, 70.0, 53.0, 69.0, 46.0, 40.0, 40.0, 27.0, 27.0, 26.0, 26.0, 11.0, 13.0, 12.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.658356666564941, -4.537021160125732, -4.415685176849365, -4.294349670410156, -4.173013687133789, -4.05167818069458, -3.930342435836792, -3.809006690979004, -3.687670946121216, -3.5663352012634277, -3.4449994564056396, -3.3236637115478516, -3.2023282051086426, -3.0809924602508545, -2.9596567153930664, -2.8383209705352783, -2.7169852256774902, -2.595649480819702, -2.474313735961914, -2.352978229522705, -2.231642484664917, -2.110306739807129, -1.9889709949493408, -1.8676352500915527, -1.7462997436523438, -1.6249639987945557, -1.5036283731460571, -1.382292628288269, -1.260956883430481, -1.1396212577819824, -1.0182855129241943, -0.8969497680664062, -0.7756140232086182, -0.6542783379554749, -0.5329425930976868, -0.41160690784454346, -0.29027119278907776, -0.16893547773361206, -0.04759979248046875, 0.07373595237731934, 0.19507163763046265, 0.31640735268592834, 0.43774306774139404, 0.5590787529945374, 0.6804144382476807, 0.8017501831054688, 0.9230858683586121, 1.044421672821045, 1.1657572984695435, 1.2870930433273315, 1.40842866897583, 1.5297644138336182, 1.6511001586914062, 1.7724359035491943, 1.8937715291976929, 2.0151071548461914, 2.1364428997039795, 2.2577786445617676, 2.3791143894195557, 2.5004501342773438, 2.6217856407165527, 2.743121385574341, 2.864457130432129, 2.985792875289917, 3.107128620147705]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 7.0, 9.0, 2.0, 10.0, 10.0, 15.0, 17.0, 28.0, 34.0, 32.0, 40.0, 54.0, 83.0, 147.0, 244.0, 624.0, 1643.0, 7369.0, 67802.0, 3816608.0, 275915.0, 18254.0, 3367.0, 1021.0, 419.0, 212.0, 124.0, 68.0, 37.0, 25.0, 18.0, 13.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.27734375, -3.19482421875, -3.1123046875, -3.02978515625, -2.947265625, -2.86474609375, -2.7822265625, -2.69970703125, -2.6171875, -2.53466796875, -2.4521484375, -2.36962890625, -2.287109375, -2.20458984375, -2.1220703125, -2.03955078125, -1.95703125, -1.87451171875, -1.7919921875, -1.70947265625, -1.626953125, -1.54443359375, -1.4619140625, -1.37939453125, -1.296875, -1.21435546875, -1.1318359375, -1.04931640625, -0.966796875, -0.88427734375, -0.8017578125, -0.71923828125, -0.63671875, -0.55419921875, -0.4716796875, -0.38916015625, -0.306640625, -0.22412109375, -0.1416015625, -0.05908203125, 0.0234375, 0.10595703125, 0.1884765625, 0.27099609375, 0.353515625, 0.43603515625, 0.5185546875, 0.60107421875, 0.68359375, 0.76611328125, 0.8486328125, 0.93115234375, 1.013671875, 1.09619140625, 1.1787109375, 1.26123046875, 1.34375, 1.42626953125, 1.5087890625, 1.59130859375, 1.673828125, 1.75634765625, 1.8388671875, 1.92138671875, 2.00390625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 13.0, 7.0, 16.0, 16.0, 24.0, 19.0, 29.0, 40.0, 41.0, 49.0, 61.0, 61.0, 51.0, 58.0, 72.0, 62.0, 48.0, 56.0, 39.0, 46.0, 41.0, 34.0, 21.0, 19.0, 20.0, 12.0, 9.0, 7.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.12499237060546875, -0.1209564208984375, -0.11692047119140625, -0.112884521484375, -0.10884857177734375, -0.1048126220703125, -0.10077667236328125, -0.09674072265625, -0.09270477294921875, -0.0886688232421875, -0.08463287353515625, -0.080596923828125, -0.07656097412109375, -0.0725250244140625, -0.06848907470703125, -0.064453125, -0.06041717529296875, -0.0563812255859375, -0.05234527587890625, -0.048309326171875, -0.04427337646484375, -0.0402374267578125, -0.03620147705078125, -0.03216552734375, -0.02812957763671875, -0.0240936279296875, -0.02005767822265625, -0.016021728515625, -0.01198577880859375, -0.0079498291015625, -0.00391387939453125, 0.0001220703125, 0.00415802001953125, 0.0081939697265625, 0.01222991943359375, 0.016265869140625, 0.02030181884765625, 0.0243377685546875, 0.02837371826171875, 0.03240966796875, 0.03644561767578125, 0.0404815673828125, 0.04451751708984375, 0.048553466796875, 0.05258941650390625, 0.0566253662109375, 0.06066131591796875, 0.064697265625, 0.06873321533203125, 0.0727691650390625, 0.07680511474609375, 0.080841064453125, 0.08487701416015625, 0.0889129638671875, 0.09294891357421875, 0.09698486328125, 0.10102081298828125, 0.1050567626953125, 0.10909271240234375, 0.113128662109375, 0.11716461181640625, 0.1212005615234375, 0.12523651123046875, 0.1292724609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 9.0, 18.0, 24.0, 32.0, 77.0, 158.0, 411.0, 1338.0, 6758.0, 300493.0, 3872501.0, 9677.0, 1783.0, 551.0, 184.0, 97.0, 48.0, 38.0, 26.0, 21.0, 11.0, 16.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.72265625, -4.52679443359375, -4.3309326171875, -4.13507080078125, -3.939208984375, -3.74334716796875, -3.5474853515625, -3.35162353515625, -3.15576171875, -2.95989990234375, -2.7640380859375, -2.56817626953125, -2.372314453125, -2.17645263671875, -1.9805908203125, -1.78472900390625, -1.5888671875, -1.39300537109375, -1.1971435546875, -1.00128173828125, -0.805419921875, -0.60955810546875, -0.4136962890625, -0.21783447265625, -0.02197265625, 0.17388916015625, 0.3697509765625, 0.56561279296875, 0.761474609375, 0.95733642578125, 1.1531982421875, 1.34906005859375, 1.544921875, 1.74078369140625, 1.9366455078125, 2.13250732421875, 2.328369140625, 2.52423095703125, 2.7200927734375, 2.91595458984375, 3.11181640625, 3.30767822265625, 3.5035400390625, 3.69940185546875, 3.895263671875, 4.09112548828125, 4.2869873046875, 4.48284912109375, 4.6787109375, 4.87457275390625, 5.0704345703125, 5.26629638671875, 5.462158203125, 5.65802001953125, 5.8538818359375, 6.04974365234375, 6.24560546875, 6.44146728515625, 6.6373291015625, 6.83319091796875, 7.029052734375, 7.22491455078125, 7.4207763671875, 7.61663818359375, 7.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 6.0, 5.0, 8.0, 6.0, 14.0, 21.0, 20.0, 41.0, 62.0, 112.0, 226.0, 504.0, 1623.0, 791.0, 313.0, 122.0, 85.0, 42.0, 19.0, 17.0, 10.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49951171875, -0.48211669921875, -0.4647216796875, -0.44732666015625, -0.429931640625, -0.41253662109375, -0.3951416015625, -0.37774658203125, -0.3603515625, -0.34295654296875, -0.3255615234375, -0.30816650390625, -0.290771484375, -0.27337646484375, -0.2559814453125, -0.23858642578125, -0.22119140625, -0.20379638671875, -0.1864013671875, -0.16900634765625, -0.151611328125, -0.13421630859375, -0.1168212890625, -0.09942626953125, -0.08203125, -0.06463623046875, -0.0472412109375, -0.02984619140625, -0.012451171875, 0.00494384765625, 0.0223388671875, 0.03973388671875, 0.05712890625, 0.07452392578125, 0.0919189453125, 0.10931396484375, 0.126708984375, 0.14410400390625, 0.1614990234375, 0.17889404296875, 0.1962890625, 0.21368408203125, 0.2310791015625, 0.24847412109375, 0.265869140625, 0.28326416015625, 0.3006591796875, 0.31805419921875, 0.33544921875, 0.35284423828125, 0.3702392578125, 0.38763427734375, 0.405029296875, 0.42242431640625, 0.4398193359375, 0.45721435546875, 0.474609375, 0.49200439453125, 0.5093994140625, 0.52679443359375, 0.544189453125, 0.56158447265625, 0.5789794921875, 0.59637451171875, 0.61376953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 5.0, 20.0, 44.0, 137.0, 304.0, 322.0, 97.0, 33.0, 18.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.602534294128418, -14.303973197937012, -14.005412101745605, -13.706851959228516, -13.40829086303711, -13.109729766845703, -12.811168670654297, -12.51260757446289, -12.214046478271484, -11.915485382080078, -11.616924285888672, -11.318364143371582, -11.019803047180176, -10.72124195098877, -10.422680854797363, -10.124119758605957, -9.825559616088867, -9.526998519897461, -9.228437423706055, -8.929877281188965, -8.631316184997559, -8.332755088806152, -8.034193992614746, -7.73563289642334, -7.437072277069092, -7.1385111808776855, -6.8399505615234375, -6.541389465332031, -6.242828369140625, -5.944267749786377, -5.645706653594971, -5.347146034240723, -5.048583984375, -4.750022888183594, -4.451462268829346, -4.1529011726379395, -3.8543403148651123, -3.555779457092285, -3.257218360900879, -2.9586575031280518, -2.6600966453552246, -2.3615357875823975, -2.0629749298095703, -1.764413833618164, -1.465852975845337, -1.1672921180725098, -0.8687311410903931, -0.5701701641082764, -0.2716093063354492, 0.026951611042022705, 0.32551252841949463, 0.6240734457969666, 0.9226343631744385, 1.2211952209472656, 1.5197561979293823, 1.818317174911499, 2.116878032684326, 2.4154388904571533, 2.7139997482299805, 3.0125608444213867, 3.311121702194214, 3.609682559967041, 3.9082436561584473, 4.206804275512695, 4.505365371704102]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 11.0, 21.0, 11.0, 24.0, 44.0, 49.0, 42.0, 65.0, 50.0, 77.0, 65.0, 62.0, 73.0, 64.0, 63.0, 54.0, 51.0, 50.0, 39.0, 26.0, 15.0, 10.0, 7.0, 9.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830462694168091, -2.7550129890441895, -2.679563522338867, -2.604114055633545, -2.5286643505096436, -2.453214645385742, -2.37776517868042, -2.3023157119750977, -2.2268660068511963, -2.151416301727295, -2.0759668350219727, -2.0005173683166504, -1.925067663192749, -1.8496180772781372, -1.7741684913635254, -1.6987189054489136, -1.6232693195343018, -1.54781973361969, -1.4723701477050781, -1.3969205617904663, -1.3214709758758545, -1.2460213899612427, -1.1705718040466309, -1.095122218132019, -1.0196726322174072, -0.9442230463027954, -0.8687734603881836, -0.7933238744735718, -0.71787428855896, -0.6424247026443481, -0.5669751167297363, -0.4915255308151245, -0.4160761833190918, -0.34062659740448, -0.26517701148986816, -0.18972742557525635, -0.11427783966064453, -0.038828253746032715, 0.0366213321685791, 0.11207091808319092, 0.18752050399780273, 0.26297008991241455, 0.33841967582702637, 0.4138692617416382, 0.48931884765625, 0.5647684335708618, 0.6402180194854736, 0.7156676054000854, 0.7911171913146973, 0.8665667772293091, 0.9420163631439209, 1.0174659490585327, 1.0929155349731445, 1.1683651208877563, 1.2438147068023682, 1.31926429271698, 1.3947138786315918, 1.4701634645462036, 1.5456130504608154, 1.6210626363754272, 1.696512222290039, 1.7719618082046509, 1.8474113941192627, 1.9228609800338745, 1.9983105659484863]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 7.0, 10.0, 10.0, 20.0, 17.0, 23.0, 34.0, 40.0, 64.0, 84.0, 137.0, 156.0, 254.0, 390.0, 759.0, 1761.0, 7435.0, 65520.0, 681039.0, 264118.0, 20496.0, 3435.0, 1140.0, 553.0, 324.0, 200.0, 138.0, 91.0, 86.0, 53.0, 46.0, 25.0, 18.0, 18.0, 14.0, 12.0, 9.0, 6.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3203125, -2.249481201171875, -2.17864990234375, -2.107818603515625, -2.0369873046875, -1.966156005859375, -1.89532470703125, -1.824493408203125, -1.753662109375, -1.682830810546875, -1.61199951171875, -1.541168212890625, -1.4703369140625, -1.399505615234375, -1.32867431640625, -1.257843017578125, -1.18701171875, -1.116180419921875, -1.04534912109375, -0.974517822265625, -0.9036865234375, -0.832855224609375, -0.76202392578125, -0.691192626953125, -0.620361328125, -0.549530029296875, -0.47869873046875, -0.407867431640625, -0.3370361328125, -0.266204833984375, -0.19537353515625, -0.124542236328125, -0.0537109375, 0.017120361328125, 0.08795166015625, 0.158782958984375, 0.2296142578125, 0.300445556640625, 0.37127685546875, 0.442108154296875, 0.512939453125, 0.583770751953125, 0.65460205078125, 0.725433349609375, 0.7962646484375, 0.867095947265625, 0.93792724609375, 1.008758544921875, 1.07958984375, 1.150421142578125, 1.22125244140625, 1.292083740234375, 1.3629150390625, 1.433746337890625, 1.50457763671875, 1.575408935546875, 1.646240234375, 1.717071533203125, 1.78790283203125, 1.858734130859375, 1.9295654296875, 2.000396728515625, 2.07122802734375, 2.142059326171875, 2.212890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 6.0, 11.0, 21.0, 14.0, 27.0, 40.0, 65.0, 67.0, 95.0, 95.0, 88.0, 88.0, 97.0, 69.0, 57.0, 38.0, 32.0, 32.0, 20.0, 15.0, 10.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.263671875, -0.257354736328125, -0.25103759765625, -0.244720458984375, -0.2384033203125, -0.232086181640625, -0.22576904296875, -0.219451904296875, -0.213134765625, -0.206817626953125, -0.20050048828125, -0.194183349609375, -0.1878662109375, -0.181549072265625, -0.17523193359375, -0.168914794921875, -0.16259765625, -0.156280517578125, -0.14996337890625, -0.143646240234375, -0.1373291015625, -0.131011962890625, -0.12469482421875, -0.118377685546875, -0.112060546875, -0.105743408203125, -0.09942626953125, -0.093109130859375, -0.0867919921875, -0.080474853515625, -0.07415771484375, -0.067840576171875, -0.0615234375, -0.055206298828125, -0.04888916015625, -0.042572021484375, -0.0362548828125, -0.029937744140625, -0.02362060546875, -0.017303466796875, -0.010986328125, -0.004669189453125, 0.00164794921875, 0.007965087890625, 0.0142822265625, 0.020599365234375, 0.02691650390625, 0.033233642578125, 0.03955078125, 0.045867919921875, 0.05218505859375, 0.058502197265625, 0.0648193359375, 0.071136474609375, 0.07745361328125, 0.083770751953125, 0.090087890625, 0.096405029296875, 0.10272216796875, 0.109039306640625, 0.1153564453125, 0.121673583984375, 0.12799072265625, 0.134307861328125, 0.140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 6.0, 10.0, 13.0, 22.0, 30.0, 48.0, 46.0, 66.0, 87.0, 127.0, 211.0, 338.0, 479.0, 847.0, 1450.0, 2730.0, 5642.0, 12416.0, 29143.0, 73498.0, 180339.0, 318532.0, 242172.0, 105528.0, 41886.0, 17153.0, 7565.0, 3535.0, 1914.0, 1012.0, 618.0, 367.0, 203.0, 152.0, 108.0, 71.0, 56.0, 38.0, 23.0, 23.0, 18.0, 7.0, 9.0, 4.0, 2.0, 5.0, 7.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5341796875, -0.5167770385742188, -0.4993743896484375, -0.48197174072265625, -0.464569091796875, -0.44716644287109375, -0.4297637939453125, -0.41236114501953125, -0.39495849609375, -0.37755584716796875, -0.3601531982421875, -0.34275054931640625, -0.325347900390625, -0.30794525146484375, -0.2905426025390625, -0.27313995361328125, -0.2557373046875, -0.23833465576171875, -0.2209320068359375, -0.20352935791015625, -0.186126708984375, -0.16872406005859375, -0.1513214111328125, -0.13391876220703125, -0.11651611328125, -0.09911346435546875, -0.0817108154296875, -0.06430816650390625, -0.046905517578125, -0.02950286865234375, -0.0121002197265625, 0.00530242919921875, 0.022705078125, 0.04010772705078125, 0.0575103759765625, 0.07491302490234375, 0.092315673828125, 0.10971832275390625, 0.1271209716796875, 0.14452362060546875, 0.16192626953125, 0.17932891845703125, 0.1967315673828125, 0.21413421630859375, 0.231536865234375, 0.24893951416015625, 0.2663421630859375, 0.28374481201171875, 0.3011474609375, 0.31855010986328125, 0.3359527587890625, 0.35335540771484375, 0.370758056640625, 0.38816070556640625, 0.4055633544921875, 0.42296600341796875, 0.44036865234375, 0.45777130126953125, 0.4751739501953125, 0.49257659912109375, 0.509979248046875, 0.5273818969726562, 0.5447845458984375, 0.5621871948242188, 0.57958984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 4.0, 4.0, 14.0, 7.0, 7.0, 11.0, 17.0, 13.0, 16.0, 15.0, 10.0, 18.0, 30.0, 15.0, 32.0, 31.0, 31.0, 26.0, 31.0, 47.0, 33.0, 30.0, 41.0, 35.0, 47.0, 43.0, 40.0, 45.0, 30.0, 28.0, 30.0, 24.0, 28.0, 26.0, 17.0, 21.0, 14.0, 14.0, 12.0, 15.0, 9.0, 6.0, 9.0, 1.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.3818359375, -0.3686256408691406, -0.35541534423828125, -0.3422050476074219, -0.3289947509765625, -0.3157844543457031, -0.30257415771484375, -0.2893638610839844, -0.276153564453125, -0.2629432678222656, -0.24973297119140625, -0.23652267456054688, -0.2233123779296875, -0.21010208129882812, -0.19689178466796875, -0.18368148803710938, -0.17047119140625, -0.15726089477539062, -0.14405059814453125, -0.13084030151367188, -0.1176300048828125, -0.10441970825195312, -0.09120941162109375, -0.07799911499023438, -0.064788818359375, -0.051578521728515625, -0.03836822509765625, -0.025157928466796875, -0.0119476318359375, 0.001262664794921875, 0.01447296142578125, 0.027683258056640625, 0.0408935546875, 0.054103851318359375, 0.06731414794921875, 0.08052444458007812, 0.0937347412109375, 0.10694503784179688, 0.12015533447265625, 0.13336563110351562, 0.146575927734375, 0.15978622436523438, 0.17299652099609375, 0.18620681762695312, 0.1994171142578125, 0.21262741088867188, 0.22583770751953125, 0.23904800415039062, 0.25225830078125, 0.2654685974121094, 0.27867889404296875, 0.2918891906738281, 0.3050994873046875, 0.3183097839355469, 0.33152008056640625, 0.3447303771972656, 0.357940673828125, 0.3711509704589844, 0.38436126708984375, 0.3975715637207031, 0.4107818603515625, 0.4239921569824219, 0.43720245361328125, 0.4504127502441406, 0.463623046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 15.0, 16.0, 23.0, 34.0, 42.0, 71.0, 138.0, 295.0, 566.0, 1337.0, 3501.0, 12289.0, 67805.0, 414828.0, 450923.0, 76472.0, 13627.0, 3870.0, 1367.0, 654.0, 301.0, 168.0, 83.0, 42.0, 19.0, 21.0, 13.0, 3.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4325675964355469, -0.41713714599609375, -0.4017066955566406, -0.3862762451171875, -0.3708457946777344, -0.35541534423828125, -0.3399848937988281, -0.324554443359375, -0.3091239929199219, -0.29369354248046875, -0.2782630920410156, -0.2628326416015625, -0.24740219116210938, -0.23197174072265625, -0.21654129028320312, -0.20111083984375, -0.18568038940429688, -0.17024993896484375, -0.15481948852539062, -0.1393890380859375, -0.12395858764648438, -0.10852813720703125, -0.09309768676757812, -0.077667236328125, -0.062236785888671875, -0.04680633544921875, -0.031375885009765625, -0.0159454345703125, -0.000514984130859375, 0.01491546630859375, 0.030345916748046875, 0.0457763671875, 0.061206817626953125, 0.07663726806640625, 0.09206771850585938, 0.1074981689453125, 0.12292861938476562, 0.13835906982421875, 0.15378952026367188, 0.169219970703125, 0.18465042114257812, 0.20008087158203125, 0.21551132202148438, 0.2309417724609375, 0.24637222290039062, 0.26180267333984375, 0.2772331237792969, 0.29266357421875, 0.3080940246582031, 0.32352447509765625, 0.3389549255371094, 0.3543853759765625, 0.3698158264160156, 0.38524627685546875, 0.4006767272949219, 0.416107177734375, 0.4315376281738281, 0.44696807861328125, 0.4623985290527344, 0.4778289794921875, 0.4932594299316406, 0.5086898803710938, 0.5241203308105469, 0.53955078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 6.0, 10.0, 11.0, 23.0, 32.0, 35.0, 59.0, 74.0, 83.0, 102.0, 91.0, 105.0, 84.0, 70.0, 56.0, 35.0, 27.0, 19.0, 11.0, 12.0, 14.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.876489639282227e-05, -9.57949087023735e-05, -9.282492101192474e-05, -8.985493332147598e-05, -8.688494563102722e-05, -8.391495794057846e-05, -8.09449702501297e-05, -7.797498255968094e-05, -7.500499486923218e-05, -7.203500717878342e-05, -6.906501948833466e-05, -6.60950317978859e-05, -6.312504410743713e-05, -6.015505641698837e-05, -5.718506872653961e-05, -5.421508103609085e-05, -5.124509334564209e-05, -4.827510565519333e-05, -4.530511796474457e-05, -4.233513027429581e-05, -3.9365142583847046e-05, -3.6395154893398285e-05, -3.3425167202949524e-05, -3.0455179512500763e-05, -2.7485191822052002e-05, -2.451520413160324e-05, -2.154521644115448e-05, -1.857522875070572e-05, -1.5605241060256958e-05, -1.2635253369808197e-05, -9.665265679359436e-06, -6.695277988910675e-06, -3.725290298461914e-06, -7.553026080131531e-07, 2.214685082435608e-06, 5.184672772884369e-06, 8.15466046333313e-06, 1.1124648153781891e-05, 1.4094635844230652e-05, 1.7064623534679413e-05, 2.0034611225128174e-05, 2.3004598915576935e-05, 2.5974586606025696e-05, 2.8944574296474457e-05, 3.191456198692322e-05, 3.488454967737198e-05, 3.785453736782074e-05, 4.08245250582695e-05, 4.379451274871826e-05, 4.676450043916702e-05, 4.9734488129615784e-05, 5.2704475820064545e-05, 5.5674463510513306e-05, 5.864445120096207e-05, 6.161443889141083e-05, 6.458442658185959e-05, 6.755441427230835e-05, 7.052440196275711e-05, 7.349438965320587e-05, 7.646437734365463e-05, 7.94343650341034e-05, 8.240435272455215e-05, 8.537434041500092e-05, 8.834432810544968e-05, 9.131431579589844e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 9.0, 11.0, 14.0, 10.0, 26.0, 35.0, 48.0, 67.0, 125.0, 171.0, 327.0, 503.0, 898.0, 1600.0, 3587.0, 8780.0, 25332.0, 88457.0, 295079.0, 401113.0, 155607.0, 42930.0, 13548.0, 5245.0, 2243.0, 1176.0, 626.0, 359.0, 190.0, 144.0, 94.0, 63.0, 43.0, 32.0, 15.0, 13.0, 10.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.323486328125, -0.31479454040527344, -0.3061027526855469, -0.2974109649658203, -0.28871917724609375, -0.2800273895263672, -0.2713356018066406, -0.26264381408691406, -0.2539520263671875, -0.24526023864746094, -0.23656845092773438, -0.2278766632080078, -0.21918487548828125, -0.2104930877685547, -0.20180130004882812, -0.19310951232910156, -0.184417724609375, -0.17572593688964844, -0.16703414916992188, -0.1583423614501953, -0.14965057373046875, -0.1409587860107422, -0.13226699829101562, -0.12357521057128906, -0.1148834228515625, -0.10619163513183594, -0.09749984741210938, -0.08880805969238281, -0.08011627197265625, -0.07142448425292969, -0.06273269653320312, -0.05404090881347656, -0.04534912109375, -0.03665733337402344, -0.027965545654296875, -0.019273757934570312, -0.01058197021484375, -0.0018901824951171875, 0.006801605224609375, 0.015493392944335938, 0.0241851806640625, 0.03287696838378906, 0.041568756103515625, 0.05026054382324219, 0.05895233154296875, 0.06764411926269531, 0.07633590698242188, 0.08502769470214844, 0.093719482421875, 0.10241127014160156, 0.11110305786132812, 0.11979484558105469, 0.12848663330078125, 0.1371784210205078, 0.14587020874023438, 0.15456199645996094, 0.1632537841796875, 0.17194557189941406, 0.18063735961914062, 0.1893291473388672, 0.19802093505859375, 0.2067127227783203, 0.21540451049804688, 0.22409629821777344, 0.2327880859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 5.0, 7.0, 9.0, 11.0, 12.0, 11.0, 14.0, 29.0, 34.0, 39.0, 55.0, 55.0, 80.0, 66.0, 46.0, 62.0, 76.0, 55.0, 57.0, 58.0, 48.0, 34.0, 32.0, 22.0, 14.0, 14.0, 10.0, 9.0, 9.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.219482421875, -0.2124652862548828, -0.20544815063476562, -0.19843101501464844, -0.19141387939453125, -0.18439674377441406, -0.17737960815429688, -0.1703624725341797, -0.1633453369140625, -0.1563282012939453, -0.14931106567382812, -0.14229393005371094, -0.13527679443359375, -0.12825965881347656, -0.12124252319335938, -0.11422538757324219, -0.107208251953125, -0.10019111633300781, -0.09317398071289062, -0.08615684509277344, -0.07913970947265625, -0.07212257385253906, -0.06510543823242188, -0.05808830261230469, -0.0510711669921875, -0.04405403137207031, -0.037036895751953125, -0.030019760131835938, -0.02300262451171875, -0.015985488891601562, -0.008968353271484375, -0.0019512176513671875, 0.00506591796875, 0.012083053588867188, 0.019100189208984375, 0.026117324829101562, 0.03313446044921875, 0.04015159606933594, 0.047168731689453125, 0.05418586730957031, 0.0612030029296875, 0.06822013854980469, 0.07523727416992188, 0.08225440979003906, 0.08927154541015625, 0.09628868103027344, 0.10330581665039062, 0.11032295227050781, 0.117340087890625, 0.12435722351074219, 0.13137435913085938, 0.13839149475097656, 0.14540863037109375, 0.15242576599121094, 0.15944290161132812, 0.1664600372314453, 0.1734771728515625, 0.1804943084716797, 0.18751144409179688, 0.19452857971191406, 0.20154571533203125, 0.20856285095214844, 0.21557998657226562, 0.2225971221923828, 0.2296142578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 11.0, 40.0, 150.0, 298.0, 309.0, 134.0, 41.0, 12.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.177391052246094, -9.752223014831543, -9.327054023742676, -8.901885986328125, -8.476716995239258, -8.051548957824707, -7.626380920410156, -7.201212406158447, -6.776043891906738, -6.350875377655029, -5.92570686340332, -5.5005388259887695, -5.0753703117370605, -4.650201797485352, -4.225033760070801, -3.799865245819092, -3.374696731567383, -2.949528217315674, -2.524359941482544, -2.099191665649414, -1.674023151397705, -1.248854637145996, -0.8236863613128662, -0.39851808547973633, 0.026650428771972656, 0.4518188238143921, 0.8769872188568115, 1.302155613899231, 1.7273240089416504, 2.1524925231933594, 2.5776607990264893, 3.002829074859619, 3.427997589111328, 3.853166103363037, 4.278334617614746, 4.703502655029297, 5.128671169281006, 5.553839683532715, 5.979007720947266, 6.404176235198975, 6.829344749450684, 7.254513263702393, 7.679681777954102, 8.104849815368652, 8.530017852783203, 8.95518684387207, 9.380354881286621, 9.805522918701172, 10.230691909790039, 10.65585994720459, 11.081028938293457, 11.506196975708008, 11.931365966796875, 12.356534004211426, 12.781702041625977, 13.206871032714844, 13.632039070129395, 14.057207107543945, 14.482376098632812, 14.907544136047363, 15.332712173461914, 15.757881164550781, 16.18305015563965, 16.608217239379883, 17.03338623046875]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 0.0, 6.0, 6.0, 4.0, 7.0, 10.0, 14.0, 16.0, 25.0, 17.0, 28.0, 31.0, 31.0, 37.0, 33.0, 36.0, 36.0, 47.0, 57.0, 48.0, 49.0, 54.0, 43.0, 42.0, 36.0, 27.0, 27.0, 36.0, 30.0, 34.0, 17.0, 31.0, 13.0, 18.0, 13.0, 12.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.4539852142333984, -3.3572051525115967, -3.260425090789795, -3.1636452674865723, -3.0668652057647705, -2.9700851440429688, -2.873305082321167, -2.7765250205993652, -2.6797451972961426, -2.582965135574341, -2.486185073852539, -2.3894052505493164, -2.2926251888275146, -2.195845127105713, -2.099065065383911, -2.0022850036621094, -1.9055050611495972, -1.8087249994277954, -1.7119450569152832, -1.6151649951934814, -1.5183850526809692, -1.4216049909591675, -1.3248250484466553, -1.2280449867248535, -1.1312649250030518, -1.03448486328125, -0.9377049207687378, -0.840924859046936, -0.7441449165344238, -0.6473648548126221, -0.5505848526954651, -0.4538048505783081, -0.3570249080657959, -0.2602449059486389, -0.16346488893032074, -0.06668487191200256, 0.03009513020515442, 0.1268751323223114, 0.22365516424179077, 0.32043516635894775, 0.41721516847610474, 0.5139951705932617, 0.6107751727104187, 0.7075551748275757, 0.8043352365493774, 0.9011151790618896, 0.9978952407836914, 1.0946753025054932, 1.1914552450180054, 1.2882353067398071, 1.3850152492523193, 1.481795310974121, 1.5785752534866333, 1.675355315208435, 1.7721352577209473, 1.868915319442749, 1.9656953811645508, 2.0624754428863525, 2.1592555046081543, 2.256035327911377, 2.3528153896331787, 2.4495954513549805, 2.5463755130767822, 2.643155574798584, 2.7399353981018066]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 7.0, 8.0, 16.0, 11.0, 17.0, 13.0, 37.0, 27.0, 46.0, 55.0, 100.0, 141.0, 244.0, 517.0, 1334.0, 5396.0, 48937.0, 3988995.0, 134443.0, 10142.0, 2020.0, 762.0, 371.0, 204.0, 136.0, 88.0, 57.0, 44.0, 35.0, 19.0, 12.0, 7.0, 12.0, 7.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.181640625, -3.099334716796875, -3.01702880859375, -2.934722900390625, -2.8524169921875, -2.770111083984375, -2.68780517578125, -2.605499267578125, -2.523193359375, -2.440887451171875, -2.35858154296875, -2.276275634765625, -2.1939697265625, -2.111663818359375, -2.02935791015625, -1.947052001953125, -1.86474609375, -1.782440185546875, -1.70013427734375, -1.617828369140625, -1.5355224609375, -1.453216552734375, -1.37091064453125, -1.288604736328125, -1.206298828125, -1.123992919921875, -1.04168701171875, -0.959381103515625, -0.8770751953125, -0.794769287109375, -0.71246337890625, -0.630157470703125, -0.5478515625, -0.465545654296875, -0.38323974609375, -0.300933837890625, -0.2186279296875, -0.136322021484375, -0.05401611328125, 0.028289794921875, 0.110595703125, 0.192901611328125, 0.27520751953125, 0.357513427734375, 0.4398193359375, 0.522125244140625, 0.60443115234375, 0.686737060546875, 0.76904296875, 0.851348876953125, 0.93365478515625, 1.015960693359375, 1.0982666015625, 1.180572509765625, 1.26287841796875, 1.345184326171875, 1.427490234375, 1.509796142578125, 1.59210205078125, 1.674407958984375, 1.7567138671875, 1.839019775390625, 1.92132568359375, 2.003631591796875, 2.0859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 13.0, 17.0, 25.0, 21.0, 49.0, 40.0, 64.0, 72.0, 80.0, 76.0, 84.0, 83.0, 64.0, 59.0, 56.0, 44.0, 35.0, 29.0, 30.0, 14.0, 11.0, 10.0, 3.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2418212890625, -0.23584556579589844, -0.22986984252929688, -0.2238941192626953, -0.21791839599609375, -0.2119426727294922, -0.20596694946289062, -0.19999122619628906, -0.1940155029296875, -0.18803977966308594, -0.18206405639648438, -0.1760883331298828, -0.17011260986328125, -0.1641368865966797, -0.15816116333007812, -0.15218544006347656, -0.146209716796875, -0.14023399353027344, -0.13425827026367188, -0.1282825469970703, -0.12230682373046875, -0.11633110046386719, -0.11035537719726562, -0.10437965393066406, -0.0984039306640625, -0.09242820739746094, -0.08645248413085938, -0.08047676086425781, -0.07450103759765625, -0.06852531433105469, -0.06254959106445312, -0.05657386779785156, -0.05059814453125, -0.04462242126464844, -0.038646697998046875, -0.03267097473144531, -0.02669525146484375, -0.020719528198242188, -0.014743804931640625, -0.008768081665039062, -0.0027923583984375, 0.0031833648681640625, 0.009159088134765625, 0.015134811401367188, 0.02111053466796875, 0.027086257934570312, 0.033061981201171875, 0.03903770446777344, 0.045013427734375, 0.05098915100097656, 0.056964874267578125, 0.06294059753417969, 0.06891632080078125, 0.07489204406738281, 0.08086776733398438, 0.08684349060058594, 0.0928192138671875, 0.09879493713378906, 0.10477066040039062, 0.11074638366699219, 0.11672210693359375, 0.12269783020019531, 0.12867355346679688, 0.13464927673339844, 0.140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 11.0, 7.0, 8.0, 16.0, 18.0, 20.0, 26.0, 39.0, 61.0, 53.0, 78.0, 190.0, 8687.0, 4182926.0, 1606.0, 135.0, 77.0, 68.0, 50.0, 42.0, 38.0, 27.0, 22.0, 12.0, 15.0, 16.0, 11.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -11.07080078125, -10.7822265625, -10.49365234375, -10.205078125, -9.91650390625, -9.6279296875, -9.33935546875, -9.05078125, -8.76220703125, -8.4736328125, -8.18505859375, -7.896484375, -7.60791015625, -7.3193359375, -7.03076171875, -6.7421875, -6.45361328125, -6.1650390625, -5.87646484375, -5.587890625, -5.29931640625, -5.0107421875, -4.72216796875, -4.43359375, -4.14501953125, -3.8564453125, -3.56787109375, -3.279296875, -2.99072265625, -2.7021484375, -2.41357421875, -2.125, -1.83642578125, -1.5478515625, -1.25927734375, -0.970703125, -0.68212890625, -0.3935546875, -0.10498046875, 0.18359375, 0.47216796875, 0.7607421875, 1.04931640625, 1.337890625, 1.62646484375, 1.9150390625, 2.20361328125, 2.4921875, 2.78076171875, 3.0693359375, 3.35791015625, 3.646484375, 3.93505859375, 4.2236328125, 4.51220703125, 4.80078125, 5.08935546875, 5.3779296875, 5.66650390625, 5.955078125, 6.24365234375, 6.5322265625, 6.82080078125, 7.109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 55.0, 413.0, 3344.0, 219.0, 39.0, 13.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.2545433044433594, -0.19634246826171875, -0.13814163208007812, -0.0799407958984375, -0.021739959716796875, 0.03646087646484375, 0.09466171264648438, 0.152862548828125, 0.21106338500976562, 0.26926422119140625, 0.3274650573730469, 0.3856658935546875, 0.4438667297363281, 0.5020675659179688, 0.5602684020996094, 0.61846923828125, 0.6766700744628906, 0.7348709106445312, 0.7930717468261719, 0.8512725830078125, 0.9094734191894531, 0.9676742553710938, 1.0258750915527344, 1.084075927734375, 1.1422767639160156, 1.2004776000976562, 1.2586784362792969, 1.3168792724609375, 1.3750801086425781, 1.4332809448242188, 1.4914817810058594, 1.5496826171875, 1.6078834533691406, 1.6660842895507812, 1.7242851257324219, 1.7824859619140625, 1.8406867980957031, 1.8988876342773438, 1.9570884704589844, 2.015289306640625, 2.0734901428222656, 2.1316909790039062, 2.189891815185547, 2.2480926513671875, 2.306293487548828, 2.3644943237304688, 2.4226951599121094, 2.48089599609375, 2.5390968322753906, 2.5972976684570312, 2.655498504638672, 2.7136993408203125, 2.771900177001953, 2.8301010131835938, 2.8883018493652344, 2.946502685546875, 3.0047035217285156, 3.0629043579101562, 3.121105194091797, 3.1793060302734375, 3.237506866455078, 3.2957077026367188, 3.3539085388183594, 3.412109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 15.0, 418.0, 564.0, 14.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.514610290527344, -22.494400024414062, -21.47418785095215, -20.453975677490234, -19.433765411376953, -18.413555145263672, -17.393342971801758, -16.373130798339844, -15.352920532226562, -14.332709312438965, -13.312498092651367, -12.29228687286377, -11.272075653076172, -10.251864433288574, -9.231653213500977, -8.211441993713379, -7.191230773925781, -6.171019554138184, -5.150808334350586, -4.130597114562988, -3.1103858947753906, -2.090174674987793, -1.0699634552001953, -0.049752235412597656, 0.970458984375, 1.9906702041625977, 3.0108814239501953, 4.031092643737793, 5.051303863525391, 6.071515083312988, 7.091726303100586, 8.111937522888184, 9.132148742675781, 10.152359962463379, 11.172571182250977, 12.192782402038574, 13.212993621826172, 14.23320484161377, 15.253416061401367, 16.27362823486328, 17.293838500976562, 18.314048767089844, 19.334260940551758, 20.354473114013672, 21.374683380126953, 22.394893646240234, 23.41510581970215, 24.435317993164062, 25.455528259277344, 26.475738525390625, 27.49595069885254, 28.516162872314453, 29.536373138427734, 30.556583404541016, 31.57679557800293, 32.597007751464844, 33.617218017578125, 34.637428283691406, 35.65763854980469, 36.677852630615234, 37.698062896728516, 38.7182731628418, 39.738487243652344, 40.758697509765625, 41.778907775878906]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 28.0, 102.0, 163.0, 247.0, 222.0, 147.0, 56.0, 23.0, 8.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.795660972595215, -7.550102233886719, -7.304543972015381, -7.058985233306885, -6.813426494598389, -6.567868232727051, -6.322309494018555, -6.076750755310059, -5.8311920166015625, -5.585633277893066, -5.3400750160217285, -5.094516277313232, -4.848957538604736, -4.603399276733398, -4.357840538024902, -4.112281799316406, -3.8667232990264893, -3.6211647987365723, -3.375606060028076, -3.130047559738159, -2.884488821029663, -2.638930320739746, -2.39337158203125, -2.147813081741333, -1.9022544622421265, -1.65669584274292, -1.4111372232437134, -1.1655786037445068, -0.9200200438499451, -0.6744614839553833, -0.42890286445617676, -0.18334424495697021, 0.06221437454223633, 0.30777299404144287, 0.5533316135406494, 0.7988901734352112, 1.0444488525390625, 1.2900073528289795, 1.535565972328186, 1.7811245918273926, 2.0266833305358887, 2.2722418308258057, 2.5178005695343018, 2.7633590698242188, 3.008917808532715, 3.254476308822632, 3.500034809112549, 3.745593547821045, 3.991152048110962, 4.236710548400879, 4.482269287109375, 4.727828025817871, 4.973386287689209, 5.218945026397705, 5.464503765106201, 5.710062026977539, 5.955620765686035, 6.201179504394531, 6.446737766265869, 6.692296504974365, 6.937855243682861, 7.183413505554199, 7.428972244262695, 7.674530982971191, 7.9200897216796875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 10.0, 5.0, 11.0, 11.0, 17.0, 22.0, 25.0, 30.0, 58.0, 52.0, 88.0, 114.0, 146.0, 193.0, 320.0, 437.0, 748.0, 1647.0, 4071.0, 14459.0, 71888.0, 383818.0, 452045.0, 91667.0, 17609.0, 4785.0, 1754.0, 868.0, 501.0, 295.0, 220.0, 161.0, 106.0, 86.0, 62.0, 55.0, 31.0, 32.0, 24.0, 18.0, 22.0, 11.0, 12.0, 5.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.369140625, -1.326446533203125, -1.28375244140625, -1.241058349609375, -1.1983642578125, -1.155670166015625, -1.11297607421875, -1.070281982421875, -1.027587890625, -0.984893798828125, -0.94219970703125, -0.899505615234375, -0.8568115234375, -0.814117431640625, -0.77142333984375, -0.728729248046875, -0.68603515625, -0.643341064453125, -0.60064697265625, -0.557952880859375, -0.5152587890625, -0.472564697265625, -0.42987060546875, -0.387176513671875, -0.344482421875, -0.301788330078125, -0.25909423828125, -0.216400146484375, -0.1737060546875, -0.131011962890625, -0.08831787109375, -0.045623779296875, -0.0029296875, 0.039764404296875, 0.08245849609375, 0.125152587890625, 0.1678466796875, 0.210540771484375, 0.25323486328125, 0.295928955078125, 0.338623046875, 0.381317138671875, 0.42401123046875, 0.466705322265625, 0.5093994140625, 0.552093505859375, 0.59478759765625, 0.637481689453125, 0.68017578125, 0.722869873046875, 0.76556396484375, 0.808258056640625, 0.8509521484375, 0.893646240234375, 0.93634033203125, 0.979034423828125, 1.021728515625, 1.064422607421875, 1.10711669921875, 1.149810791015625, 1.1925048828125, 1.235198974609375, 1.27789306640625, 1.320587158203125, 1.36328125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 26.0, 33.0, 56.0, 74.0, 112.0, 127.0, 132.0, 99.0, 106.0, 70.0, 59.0, 31.0, 31.0, 13.0, 14.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23095703125, -0.22116851806640625, -0.2113800048828125, -0.20159149169921875, -0.191802978515625, -0.18201446533203125, -0.1722259521484375, -0.16243743896484375, -0.15264892578125, -0.14286041259765625, -0.1330718994140625, -0.12328338623046875, -0.113494873046875, -0.10370635986328125, -0.0939178466796875, -0.08412933349609375, -0.0743408203125, -0.06455230712890625, -0.0547637939453125, -0.04497528076171875, -0.035186767578125, -0.02539825439453125, -0.0156097412109375, -0.00582122802734375, 0.00396728515625, 0.01375579833984375, 0.0235443115234375, 0.03333282470703125, 0.043121337890625, 0.05290985107421875, 0.0626983642578125, 0.07248687744140625, 0.082275390625, 0.09206390380859375, 0.1018524169921875, 0.11164093017578125, 0.121429443359375, 0.13121795654296875, 0.1410064697265625, 0.15079498291015625, 0.16058349609375, 0.17037200927734375, 0.1801605224609375, 0.18994903564453125, 0.199737548828125, 0.20952606201171875, 0.2193145751953125, 0.22910308837890625, 0.2388916015625, 0.24868011474609375, 0.2584686279296875, 0.26825714111328125, 0.278045654296875, 0.28783416748046875, 0.2976226806640625, 0.30741119384765625, 0.31719970703125, 0.32698822021484375, 0.3367767333984375, 0.34656524658203125, 0.356353759765625, 0.36614227294921875, 0.3759307861328125, 0.38571929931640625, 0.3955078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 5.0, 4.0, 8.0, 12.0, 16.0, 22.0, 38.0, 34.0, 63.0, 87.0, 121.0, 203.0, 331.0, 561.0, 1111.0, 2135.0, 4593.0, 10903.0, 27920.0, 76585.0, 200099.0, 350379.0, 227734.0, 89768.0, 32946.0, 12473.0, 5090.0, 2394.0, 1147.0, 640.0, 396.0, 253.0, 159.0, 94.0, 65.0, 58.0, 27.0, 21.0, 23.0, 7.0, 11.0, 4.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5302734375, -0.51171875, -0.4931640625, -0.474609375, -0.4560546875, -0.4375, -0.4189453125, -0.400390625, -0.3818359375, -0.36328125, -0.3447265625, -0.326171875, -0.3076171875, -0.2890625, -0.2705078125, -0.251953125, -0.2333984375, -0.21484375, -0.1962890625, -0.177734375, -0.1591796875, -0.140625, -0.1220703125, -0.103515625, -0.0849609375, -0.06640625, -0.0478515625, -0.029296875, -0.0107421875, 0.0078125, 0.0263671875, 0.044921875, 0.0634765625, 0.08203125, 0.1005859375, 0.119140625, 0.1376953125, 0.15625, 0.1748046875, 0.193359375, 0.2119140625, 0.23046875, 0.2490234375, 0.267578125, 0.2861328125, 0.3046875, 0.3232421875, 0.341796875, 0.3603515625, 0.37890625, 0.3974609375, 0.416015625, 0.4345703125, 0.453125, 0.4716796875, 0.490234375, 0.5087890625, 0.52734375, 0.5458984375, 0.564453125, 0.5830078125, 0.6015625, 0.6201171875, 0.638671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 14.0, 10.0, 16.0, 9.0, 17.0, 19.0, 31.0, 20.0, 30.0, 33.0, 48.0, 45.0, 52.0, 41.0, 49.0, 47.0, 51.0, 60.0, 36.0, 46.0, 47.0, 41.0, 28.0, 32.0, 30.0, 32.0, 22.0, 13.0, 12.0, 15.0, 13.0, 6.0, 10.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.5058746337890625, -0.486358642578125, -0.4668426513671875, -0.44732666015625, -0.4278106689453125, -0.408294677734375, -0.3887786865234375, -0.3692626953125, -0.3497467041015625, -0.330230712890625, -0.3107147216796875, -0.29119873046875, -0.2716827392578125, -0.252166748046875, -0.2326507568359375, -0.213134765625, -0.1936187744140625, -0.174102783203125, -0.1545867919921875, -0.13507080078125, -0.1155548095703125, -0.096038818359375, -0.0765228271484375, -0.0570068359375, -0.0374908447265625, -0.017974853515625, 0.0015411376953125, 0.02105712890625, 0.0405731201171875, 0.060089111328125, 0.0796051025390625, 0.09912109375, 0.1186370849609375, 0.138153076171875, 0.1576690673828125, 0.17718505859375, 0.1967010498046875, 0.216217041015625, 0.2357330322265625, 0.2552490234375, 0.2747650146484375, 0.294281005859375, 0.3137969970703125, 0.33331298828125, 0.3528289794921875, 0.372344970703125, 0.3918609619140625, 0.411376953125, 0.4308929443359375, 0.450408935546875, 0.4699249267578125, 0.48944091796875, 0.5089569091796875, 0.528472900390625, 0.5479888916015625, 0.5675048828125, 0.5870208740234375, 0.606536865234375, 0.6260528564453125, 0.64556884765625, 0.6650848388671875, 0.684600830078125, 0.7041168212890625, 0.7236328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 6.0, 13.0, 31.0, 38.0, 62.0, 93.0, 137.0, 288.0, 431.0, 865.0, 1833.0, 4804.0, 22762.0, 284584.0, 654974.0, 63633.0, 8678.0, 2678.0, 1164.0, 598.0, 320.0, 205.0, 116.0, 78.0, 51.0, 27.0, 20.0, 14.0, 9.0, 10.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67236328125, -0.6527175903320312, -0.6330718994140625, -0.6134262084960938, -0.593780517578125, -0.5741348266601562, -0.5544891357421875, -0.5348434448242188, -0.51519775390625, -0.49555206298828125, -0.4759063720703125, -0.45626068115234375, -0.436614990234375, -0.41696929931640625, -0.3973236083984375, -0.37767791748046875, -0.3580322265625, -0.33838653564453125, -0.3187408447265625, -0.29909515380859375, -0.279449462890625, -0.25980377197265625, -0.2401580810546875, -0.22051239013671875, -0.20086669921875, -0.18122100830078125, -0.1615753173828125, -0.14192962646484375, -0.122283935546875, -0.10263824462890625, -0.0829925537109375, -0.06334686279296875, -0.043701171875, -0.02405548095703125, -0.0044097900390625, 0.01523590087890625, 0.034881591796875, 0.05452728271484375, 0.0741729736328125, 0.09381866455078125, 0.11346435546875, 0.13311004638671875, 0.1527557373046875, 0.17240142822265625, 0.192047119140625, 0.21169281005859375, 0.2313385009765625, 0.25098419189453125, 0.2706298828125, 0.29027557373046875, 0.3099212646484375, 0.32956695556640625, 0.349212646484375, 0.36885833740234375, 0.3885040283203125, 0.40814971923828125, 0.42779541015625, 0.44744110107421875, 0.4670867919921875, 0.48673248291015625, 0.506378173828125, 0.5260238647460938, 0.5456695556640625, 0.5653152465820312, 0.5849609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 7.0, 9.0, 12.0, 33.0, 54.0, 91.0, 126.0, 166.0, 166.0, 134.0, 74.0, 48.0, 26.0, 22.0, 9.0, 8.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011342763900756836, -0.00010887999087572098, -0.0001043323427438736, -9.978469461202621e-05, -9.523704648017883e-05, -9.068939834833145e-05, -8.614175021648407e-05, -8.159410208463669e-05, -7.70464539527893e-05, -7.249880582094193e-05, -6.795115768909454e-05, -6.340350955724716e-05, -5.885586142539978e-05, -5.43082132935524e-05, -4.976056516170502e-05, -4.5212917029857635e-05, -4.0665268898010254e-05, -3.611762076616287e-05, -3.156997263431549e-05, -2.702232450246811e-05, -2.2474676370620728e-05, -1.7927028238773346e-05, -1.3379380106925964e-05, -8.831731975078583e-06, -4.284083843231201e-06, 2.635642886161804e-07, 4.811212420463562e-06, 9.358860552310944e-06, 1.3906508684158325e-05, 1.8454156816005707e-05, 2.300180494785309e-05, 2.754945307970047e-05, 3.209710121154785e-05, 3.664474934339523e-05, 4.1192397475242615e-05, 4.5740045607089996e-05, 5.028769373893738e-05, 5.483534187078476e-05, 5.938299000263214e-05, 6.393063813447952e-05, 6.84782862663269e-05, 7.302593439817429e-05, 7.757358253002167e-05, 8.212123066186905e-05, 8.666887879371643e-05, 9.121652692556381e-05, 9.57641750574112e-05, 0.00010031182318925858, 0.00010485947132110596, 0.00010940711945295334, 0.00011395476758480072, 0.0001185024157166481, 0.00012305006384849548, 0.00012759771198034286, 0.00013214536011219025, 0.00013669300824403763, 0.000141240656375885, 0.0001457883045077324, 0.00015033595263957977, 0.00015488360077142715, 0.00015943124890327454, 0.00016397889703512192, 0.0001685265451669693, 0.00017307419329881668, 0.00017762184143066406]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 2.0, 12.0, 15.0, 18.0, 36.0, 50.0, 72.0, 127.0, 212.0, 367.0, 764.0, 1809.0, 4990.0, 19790.0, 138384.0, 632434.0, 211140.0, 27991.0, 6220.0, 2187.0, 881.0, 464.0, 207.0, 122.0, 84.0, 55.0, 35.0, 23.0, 10.0, 15.0, 12.0, 3.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.48779296875, -0.47369384765625, -0.4595947265625, -0.44549560546875, -0.431396484375, -0.41729736328125, -0.4031982421875, -0.38909912109375, -0.375, -0.36090087890625, -0.3468017578125, -0.33270263671875, -0.318603515625, -0.30450439453125, -0.2904052734375, -0.27630615234375, -0.26220703125, -0.24810791015625, -0.2340087890625, -0.21990966796875, -0.205810546875, -0.19171142578125, -0.1776123046875, -0.16351318359375, -0.1494140625, -0.13531494140625, -0.1212158203125, -0.10711669921875, -0.093017578125, -0.07891845703125, -0.0648193359375, -0.05072021484375, -0.03662109375, -0.02252197265625, -0.0084228515625, 0.00567626953125, 0.019775390625, 0.03387451171875, 0.0479736328125, 0.06207275390625, 0.076171875, 0.09027099609375, 0.1043701171875, 0.11846923828125, 0.132568359375, 0.14666748046875, 0.1607666015625, 0.17486572265625, 0.18896484375, 0.20306396484375, 0.2171630859375, 0.23126220703125, 0.245361328125, 0.25946044921875, 0.2735595703125, 0.28765869140625, 0.3017578125, 0.31585693359375, 0.3299560546875, 0.34405517578125, 0.358154296875, 0.37225341796875, 0.3863525390625, 0.40045166015625, 0.41455078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 13.0, 3.0, 11.0, 20.0, 35.0, 50.0, 59.0, 72.0, 76.0, 102.0, 91.0, 109.0, 82.0, 63.0, 50.0, 43.0, 41.0, 23.0, 14.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3896484375, -0.3786659240722656, -0.36768341064453125, -0.3567008972167969, -0.3457183837890625, -0.3347358703613281, -0.32375335693359375, -0.3127708435058594, -0.301788330078125, -0.2908058166503906, -0.27982330322265625, -0.2688407897949219, -0.2578582763671875, -0.24687576293945312, -0.23589324951171875, -0.22491073608398438, -0.21392822265625, -0.20294570922851562, -0.19196319580078125, -0.18098068237304688, -0.1699981689453125, -0.15901565551757812, -0.14803314208984375, -0.13705062866210938, -0.126068115234375, -0.11508560180664062, -0.10410308837890625, -0.09312057495117188, -0.0821380615234375, -0.07115554809570312, -0.06017303466796875, -0.049190521240234375, -0.0382080078125, -0.027225494384765625, -0.01624298095703125, -0.005260467529296875, 0.0057220458984375, 0.016704559326171875, 0.02768707275390625, 0.038669586181640625, 0.049652099609375, 0.060634613037109375, 0.07161712646484375, 0.08259963989257812, 0.0935821533203125, 0.10456466674804688, 0.11554718017578125, 0.12652969360351562, 0.13751220703125, 0.14849472045898438, 0.15947723388671875, 0.17045974731445312, 0.1814422607421875, 0.19242477416992188, 0.20340728759765625, 0.21438980102539062, 0.225372314453125, 0.23635482788085938, 0.24733734130859375, 0.2583198547363281, 0.2693023681640625, 0.2802848815917969, 0.29126739501953125, 0.3022499084472656, 0.313232421875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 24.0, 29.0, 65.0, 132.0, 205.0, 231.0, 137.0, 80.0, 46.0, 25.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.12966537475586, -8.84589672088623, -8.562128067016602, -8.278360366821289, -7.99459171295166, -7.710823059082031, -7.4270548820495605, -7.14328670501709, -6.859518051147461, -6.575749397277832, -6.291981220245361, -6.008213043212891, -5.724444389343262, -5.440675735473633, -5.156907558441162, -4.873139381408691, -4.5893707275390625, -4.305602073669434, -4.021833896636963, -3.738065481185913, -3.4542970657348633, -3.1705286502838135, -2.8867602348327637, -2.602991819381714, -2.319223403930664, -2.0354549884796143, -1.7516865730285645, -1.4679181575775146, -1.1841497421264648, -0.900381326675415, -0.6166129112243652, -0.33284449577331543, -0.049076080322265625, 0.23469233512878418, 0.518460750579834, 0.8022291660308838, 1.0859975814819336, 1.3697659969329834, 1.6535344123840332, 1.937302827835083, 2.221071243286133, 2.5048396587371826, 2.7886080741882324, 3.0723764896392822, 3.356144905090332, 3.639913320541382, 3.9236817359924316, 4.207449913024902, 4.491218566894531, 4.77498722076416, 5.058755397796631, 5.342523574829102, 5.6262922286987305, 5.910060882568359, 6.19382905960083, 6.477597236633301, 6.76136589050293, 7.045134544372559, 7.328902721405029, 7.6126708984375, 7.896439552307129, 8.180208206176758, 8.46397590637207, 8.7477445602417, 9.031513214111328]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 9.0, 4.0, 5.0, 12.0, 8.0, 7.0, 8.0, 17.0, 14.0, 8.0, 27.0, 20.0, 23.0, 27.0, 21.0, 33.0, 29.0, 29.0, 43.0, 40.0, 45.0, 34.0, 43.0, 30.0, 61.0, 31.0, 40.0, 34.0, 39.0, 29.0, 21.0, 32.0, 24.0, 24.0, 22.0, 13.0, 14.0, 19.0, 18.0, 15.0, 7.0, 4.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.2159557342529297, -3.117790460586548, -3.019625186920166, -2.9214601516723633, -2.8232948780059814, -2.7251296043395996, -2.6269643306732178, -2.528799057006836, -2.430633783340454, -2.3324685096740723, -2.2343032360076904, -2.1361379623413086, -2.037972927093506, -1.939807653427124, -1.8416423797607422, -1.7434771060943604, -1.645311951637268, -1.5471466779708862, -1.448981523513794, -1.350816249847412, -1.2526509761810303, -1.1544857025146484, -1.0563205480575562, -0.9581552743911743, -0.8599900603294373, -0.7618248462677002, -0.6636595726013184, -0.5654943585395813, -0.46732911467552185, -0.3691638708114624, -0.27099865674972534, -0.1728333830833435, -0.07466816902160645, 0.023497067391872406, 0.12166230380535126, 0.2198275327682495, 0.31799277663230896, 0.4161580204963684, 0.5143232345581055, 0.6124885082244873, 0.7106537222862244, 0.8088189363479614, 0.9069842100143433, 1.0051493644714355, 1.1033146381378174, 1.2014799118041992, 1.299645185470581, 1.397810459136963, 1.4959756135940552, 1.594140887260437, 1.6923060417175293, 1.7904713153839111, 1.888636589050293, 1.9868018627166748, 2.0849671363830566, 2.1831321716308594, 2.281297445297241, 2.379462718963623, 2.477627992630005, 2.5757932662963867, 2.6739583015441895, 2.7721235752105713, 2.870288848876953, 2.968454122543335, 3.066619396209717]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 8.0, 17.0, 18.0, 19.0, 34.0, 58.0, 79.0, 126.0, 204.0, 313.0, 623.0, 1272.0, 3190.0, 12583.0, 84874.0, 3743744.0, 310437.0, 26970.0, 5492.0, 1867.0, 879.0, 464.0, 293.0, 197.0, 126.0, 104.0, 62.0, 49.0, 31.0, 31.0, 29.0, 23.0, 13.0, 12.0, 8.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232421875, -1.2697296142578125, -1.216217041015625, -1.1627044677734375, -1.10919189453125, -1.0556793212890625, -1.002166748046875, -0.9486541748046875, -0.8951416015625, -0.8416290283203125, -0.788116455078125, -0.7346038818359375, -0.68109130859375, -0.6275787353515625, -0.574066162109375, -0.5205535888671875, -0.467041015625, -0.4135284423828125, -0.360015869140625, -0.3065032958984375, -0.25299072265625, -0.1994781494140625, -0.145965576171875, -0.0924530029296875, -0.0389404296875, 0.0145721435546875, 0.068084716796875, 0.1215972900390625, 0.17510986328125, 0.2286224365234375, 0.282135009765625, 0.3356475830078125, 0.38916015625, 0.4426727294921875, 0.496185302734375, 0.5496978759765625, 0.60321044921875, 0.6567230224609375, 0.710235595703125, 0.7637481689453125, 0.8172607421875, 0.8707733154296875, 0.924285888671875, 0.9777984619140625, 1.03131103515625, 1.0848236083984375, 1.138336181640625, 1.1918487548828125, 1.245361328125, 1.2988739013671875, 1.352386474609375, 1.4058990478515625, 1.45941162109375, 1.5129241943359375, 1.566436767578125, 1.6199493408203125, 1.6734619140625, 1.7269744873046875, 1.780487060546875, 1.8339996337890625, 1.88751220703125, 1.9410247802734375, 1.994537353515625, 2.0480499267578125, 2.1015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 6.0, 13.0, 12.0, 19.0, 26.0, 46.0, 78.0, 75.0, 85.0, 90.0, 96.0, 113.0, 82.0, 66.0, 46.0, 40.0, 49.0, 15.0, 15.0, 12.0, 8.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2257080078125, -0.21648597717285156, -0.20726394653320312, -0.1980419158935547, -0.18881988525390625, -0.1795978546142578, -0.17037582397460938, -0.16115379333496094, -0.1519317626953125, -0.14270973205566406, -0.13348770141601562, -0.12426567077636719, -0.11504364013671875, -0.10582160949707031, -0.09659957885742188, -0.08737754821777344, -0.078155517578125, -0.06893348693847656, -0.059711456298828125, -0.05048942565917969, -0.04126739501953125, -0.03204536437988281, -0.022823333740234375, -0.013601303100585938, -0.0043792724609375, 0.0048427581787109375, 0.014064788818359375, 0.023286819458007812, 0.03250885009765625, 0.04173088073730469, 0.050952911376953125, 0.06017494201660156, 0.06939697265625, 0.07861900329589844, 0.08784103393554688, 0.09706306457519531, 0.10628509521484375, 0.11550712585449219, 0.12472915649414062, 0.13395118713378906, 0.1431732177734375, 0.15239524841308594, 0.16161727905273438, 0.1708393096923828, 0.18006134033203125, 0.1892833709716797, 0.19850540161132812, 0.20772743225097656, 0.216949462890625, 0.22617149353027344, 0.23539352416992188, 0.2446155548095703, 0.25383758544921875, 0.2630596160888672, 0.2722816467285156, 0.28150367736816406, 0.2907257080078125, 0.29994773864746094, 0.3091697692871094, 0.3183917999267578, 0.32761383056640625, 0.3368358612060547, 0.3460578918457031, 0.35527992248535156, 0.364501953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 9.0, 8.0, 15.0, 29.0, 31.0, 40.0, 50.0, 103.0, 185.0, 330.0, 898.0, 2385.0, 9872.0, 67014.0, 3482397.0, 588440.0, 33130.0, 6091.0, 1757.0, 714.0, 331.0, 153.0, 87.0, 57.0, 45.0, 19.0, 20.0, 17.0, 12.0, 14.0, 6.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9033203125, -1.8530120849609375, -1.802703857421875, -1.7523956298828125, -1.70208740234375, -1.6517791748046875, -1.601470947265625, -1.5511627197265625, -1.5008544921875, -1.4505462646484375, -1.400238037109375, -1.3499298095703125, -1.29962158203125, -1.2493133544921875, -1.199005126953125, -1.1486968994140625, -1.098388671875, -1.0480804443359375, -0.997772216796875, -0.9474639892578125, -0.89715576171875, -0.8468475341796875, -0.796539306640625, -0.7462310791015625, -0.6959228515625, -0.6456146240234375, -0.595306396484375, -0.5449981689453125, -0.49468994140625, -0.4443817138671875, -0.394073486328125, -0.3437652587890625, -0.29345703125, -0.2431488037109375, -0.192840576171875, -0.1425323486328125, -0.09222412109375, -0.0419158935546875, 0.008392333984375, 0.0587005615234375, 0.1090087890625, 0.1593170166015625, 0.209625244140625, 0.2599334716796875, 0.31024169921875, 0.3605499267578125, 0.410858154296875, 0.4611663818359375, 0.511474609375, 0.5617828369140625, 0.612091064453125, 0.6623992919921875, 0.71270751953125, 0.7630157470703125, 0.813323974609375, 0.8636322021484375, 0.9139404296875, 0.9642486572265625, 1.014556884765625, 1.0648651123046875, 1.11517333984375, 1.1654815673828125, 1.215789794921875, 1.2660980224609375, 1.31640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 1.0, 4.0, 0.0, 3.0, 10.0, 8.0, 11.0, 27.0, 39.0, 62.0, 121.0, 187.0, 440.0, 1454.0, 894.0, 331.0, 183.0, 87.0, 62.0, 46.0, 26.0, 21.0, 10.0, 14.0, 7.0, 9.0, 0.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302734375, -0.28823089599609375, -0.2737274169921875, -0.25922393798828125, -0.244720458984375, -0.23021697998046875, -0.2157135009765625, -0.20121002197265625, -0.18670654296875, -0.17220306396484375, -0.1576995849609375, -0.14319610595703125, -0.128692626953125, -0.11418914794921875, -0.0996856689453125, -0.08518218994140625, -0.0706787109375, -0.05617523193359375, -0.0416717529296875, -0.02716827392578125, -0.012664794921875, 0.00183868408203125, 0.0163421630859375, 0.03084564208984375, 0.04534912109375, 0.05985260009765625, 0.0743560791015625, 0.08885955810546875, 0.103363037109375, 0.11786651611328125, 0.1323699951171875, 0.14687347412109375, 0.161376953125, 0.17588043212890625, 0.1903839111328125, 0.20488739013671875, 0.219390869140625, 0.23389434814453125, 0.2483978271484375, 0.26290130615234375, 0.27740478515625, 0.29190826416015625, 0.3064117431640625, 0.32091522216796875, 0.335418701171875, 0.34992218017578125, 0.3644256591796875, 0.37892913818359375, 0.3934326171875, 0.40793609619140625, 0.4224395751953125, 0.43694305419921875, 0.451446533203125, 0.46595001220703125, 0.4804534912109375, 0.49495697021484375, 0.50946044921875, 0.5239639282226562, 0.5384674072265625, 0.5529708862304688, 0.567474365234375, 0.5819778442382812, 0.5964813232421875, 0.6109848022460938, 0.62548828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 6.0, 16.0, 20.0, 67.0, 114.0, 164.0, 188.0, 156.0, 96.0, 68.0, 44.0, 12.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.503411293029785, -3.3913064002990723, -3.2792015075683594, -3.1670966148376465, -3.0549917221069336, -2.9428868293762207, -2.830781936645508, -2.718677043914795, -2.606572151184082, -2.494467258453369, -2.3823623657226562, -2.2702574729919434, -2.1581525802612305, -2.0460476875305176, -1.9339427947998047, -1.8218379020690918, -1.709733009338379, -1.597628116607666, -1.4855232238769531, -1.3734183311462402, -1.2613134384155273, -1.1492085456848145, -1.0371036529541016, -0.9249987602233887, -0.8128938674926758, -0.7007889747619629, -0.58868408203125, -0.4765791893005371, -0.3644742965698242, -0.25236940383911133, -0.14026451110839844, -0.028159618377685547, 0.08394527435302734, 0.19605016708374023, 0.3081550598144531, 0.420259952545166, 0.5323648452758789, 0.6444697380065918, 0.7565746307373047, 0.8686795234680176, 0.9807844161987305, 1.0928893089294434, 1.2049942016601562, 1.3170990943908691, 1.429203987121582, 1.541308879852295, 1.6534137725830078, 1.7655186653137207, 1.8776235580444336, 1.9897284507751465, 2.1018333435058594, 2.2139382362365723, 2.326043128967285, 2.438148021697998, 2.550252914428711, 2.662357807159424, 2.7744626998901367, 2.8865675926208496, 2.9986724853515625, 3.1107773780822754, 3.2228822708129883, 3.334987163543701, 3.447092056274414, 3.559196949005127, 3.67130184173584]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 6.0, 10.0, 11.0, 10.0, 29.0, 25.0, 31.0, 50.0, 32.0, 34.0, 33.0, 49.0, 50.0, 56.0, 44.0, 47.0, 47.0, 50.0, 40.0, 43.0, 44.0, 46.0, 33.0, 33.0, 26.0, 13.0, 20.0, 20.0, 17.0, 6.0, 6.0, 6.0, 11.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4813545942306519, -1.4335582256317139, -1.3857619762420654, -1.3379656076431274, -1.2901692390441895, -1.242372989654541, -1.194576621055603, -1.146780252456665, -1.0989840030670166, -1.0511876344680786, -1.0033913850784302, -0.9555950164794922, -0.907798707485199, -0.8600023984909058, -0.8122060298919678, -0.7644097208976746, -0.7166134119033813, -0.6688171029090881, -0.6210207939147949, -0.5732244253158569, -0.5254281163215637, -0.4776318073272705, -0.4298354685306549, -0.3820391297340393, -0.3342428207397461, -0.2864465117454529, -0.23865017294883728, -0.19085384905338287, -0.14305752515792847, -0.09526120126247406, -0.04746487736701965, 0.00033146142959594727, 0.04812788963317871, 0.09592421352863312, 0.14372053742408752, 0.19151686131954193, 0.23931318521499634, 0.28710949420928955, 0.33490583300590515, 0.38270217180252075, 0.43049848079681396, 0.4782947897911072, 0.5260910987854004, 0.5738874673843384, 0.6216837763786316, 0.6694800853729248, 0.7172764539718628, 0.765072762966156, 0.8128690719604492, 0.8606653809547424, 0.9084616899490356, 0.9562580585479736, 1.004054307937622, 1.05185067653656, 1.099647045135498, 1.1474432945251465, 1.1952396631240845, 1.2430360317230225, 1.290832281112671, 1.3386286497116089, 1.3864250183105469, 1.4342212677001953, 1.4820176362991333, 1.5298140048980713, 1.5776102542877197]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 10.0, 8.0, 13.0, 15.0, 24.0, 35.0, 84.0, 182.0, 337.0, 851.0, 2831.0, 19343.0, 380639.0, 608520.0, 29966.0, 3862.0, 1009.0, 399.0, 184.0, 98.0, 56.0, 35.0, 17.0, 9.0, 12.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.828125, -2.749755859375, -2.67138671875, -2.593017578125, -2.5146484375, -2.436279296875, -2.35791015625, -2.279541015625, -2.201171875, -2.122802734375, -2.04443359375, -1.966064453125, -1.8876953125, -1.809326171875, -1.73095703125, -1.652587890625, -1.57421875, -1.495849609375, -1.41748046875, -1.339111328125, -1.2607421875, -1.182373046875, -1.10400390625, -1.025634765625, -0.947265625, -0.868896484375, -0.79052734375, -0.712158203125, -0.6337890625, -0.555419921875, -0.47705078125, -0.398681640625, -0.3203125, -0.241943359375, -0.16357421875, -0.085205078125, -0.0068359375, 0.071533203125, 0.14990234375, 0.228271484375, 0.306640625, 0.385009765625, 0.46337890625, 0.541748046875, 0.6201171875, 0.698486328125, 0.77685546875, 0.855224609375, 0.93359375, 1.011962890625, 1.09033203125, 1.168701171875, 1.2470703125, 1.325439453125, 1.40380859375, 1.482177734375, 1.560546875, 1.638916015625, 1.71728515625, 1.795654296875, 1.8740234375, 1.952392578125, 2.03076171875, 2.109130859375, 2.1875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 11.0, 13.0, 29.0, 32.0, 55.0, 63.0, 94.0, 104.0, 96.0, 128.0, 84.0, 76.0, 71.0, 44.0, 37.0, 23.0, 13.0, 6.0, 4.0, 5.0, 9.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22119140625, -0.21104049682617188, -0.20088958740234375, -0.19073867797851562, -0.1805877685546875, -0.17043685913085938, -0.16028594970703125, -0.15013504028320312, -0.139984130859375, -0.12983322143554688, -0.11968231201171875, -0.10953140258789062, -0.0993804931640625, -0.08922958374023438, -0.07907867431640625, -0.06892776489257812, -0.05877685546875, -0.048625946044921875, -0.03847503662109375, -0.028324127197265625, -0.0181732177734375, -0.008022308349609375, 0.00212860107421875, 0.012279510498046875, 0.022430419921875, 0.032581329345703125, 0.04273223876953125, 0.052883148193359375, 0.0630340576171875, 0.07318496704101562, 0.08333587646484375, 0.09348678588867188, 0.1036376953125, 0.11378860473632812, 0.12393951416015625, 0.13409042358398438, 0.1442413330078125, 0.15439224243164062, 0.16454315185546875, 0.17469406127929688, 0.184844970703125, 0.19499588012695312, 0.20514678955078125, 0.21529769897460938, 0.2254486083984375, 0.23559951782226562, 0.24575042724609375, 0.2559013366699219, 0.26605224609375, 0.2762031555175781, 0.28635406494140625, 0.2965049743652344, 0.3066558837890625, 0.3168067932128906, 0.32695770263671875, 0.3371086120605469, 0.347259521484375, 0.3574104309082031, 0.36756134033203125, 0.3777122497558594, 0.3878631591796875, 0.3980140686035156, 0.40816497802734375, 0.4183158874511719, 0.428466796875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 13.0, 16.0, 20.0, 17.0, 30.0, 37.0, 75.0, 129.0, 242.0, 457.0, 1010.0, 2904.0, 9280.0, 39662.0, 208538.0, 564934.0, 174709.0, 33849.0, 8253.0, 2456.0, 939.0, 405.0, 214.0, 127.0, 64.0, 48.0, 35.0, 23.0, 19.0, 12.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1171875, -1.0856704711914062, -1.0541534423828125, -1.0226364135742188, -0.991119384765625, -0.9596023559570312, -0.9280853271484375, -0.8965682983398438, -0.86505126953125, -0.8335342407226562, -0.8020172119140625, -0.7705001831054688, -0.738983154296875, -0.7074661254882812, -0.6759490966796875, -0.6444320678710938, -0.6129150390625, -0.5813980102539062, -0.5498809814453125, -0.5183639526367188, -0.486846923828125, -0.45532989501953125, -0.4238128662109375, -0.39229583740234375, -0.36077880859375, -0.32926177978515625, -0.2977447509765625, -0.26622772216796875, -0.234710693359375, -0.20319366455078125, -0.1716766357421875, -0.14015960693359375, -0.108642578125, -0.07712554931640625, -0.0456085205078125, -0.01409149169921875, 0.017425537109375, 0.04894256591796875, 0.0804595947265625, 0.11197662353515625, 0.14349365234375, 0.17501068115234375, 0.2065277099609375, 0.23804473876953125, 0.269561767578125, 0.30107879638671875, 0.3325958251953125, 0.36411285400390625, 0.3956298828125, 0.42714691162109375, 0.4586639404296875, 0.49018096923828125, 0.521697998046875, 0.5532150268554688, 0.5847320556640625, 0.6162490844726562, 0.64776611328125, 0.6792831420898438, 0.7108001708984375, 0.7423171997070312, 0.773834228515625, 0.8053512573242188, 0.8368682861328125, 0.8683853149414062, 0.89990234375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 6.0, 6.0, 5.0, 16.0, 5.0, 15.0, 14.0, 11.0, 19.0, 23.0, 41.0, 27.0, 31.0, 39.0, 38.0, 45.0, 40.0, 50.0, 48.0, 55.0, 58.0, 51.0, 41.0, 40.0, 46.0, 31.0, 29.0, 22.0, 21.0, 26.0, 19.0, 22.0, 8.0, 12.0, 7.0, 12.0, 4.0, 8.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5660629272460938, -0.5452117919921875, -0.5243606567382812, -0.503509521484375, -0.48265838623046875, -0.4618072509765625, -0.44095611572265625, -0.42010498046875, -0.39925384521484375, -0.3784027099609375, -0.35755157470703125, -0.336700439453125, -0.31584930419921875, -0.2949981689453125, -0.27414703369140625, -0.2532958984375, -0.23244476318359375, -0.2115936279296875, -0.19074249267578125, -0.169891357421875, -0.14904022216796875, -0.1281890869140625, -0.10733795166015625, -0.08648681640625, -0.06563568115234375, -0.0447845458984375, -0.02393341064453125, -0.003082275390625, 0.01776885986328125, 0.0386199951171875, 0.05947113037109375, 0.080322265625, 0.10117340087890625, 0.1220245361328125, 0.14287567138671875, 0.163726806640625, 0.18457794189453125, 0.2054290771484375, 0.22628021240234375, 0.24713134765625, 0.26798248291015625, 0.2888336181640625, 0.30968475341796875, 0.330535888671875, 0.35138702392578125, 0.3722381591796875, 0.39308929443359375, 0.4139404296875, 0.43479156494140625, 0.4556427001953125, 0.47649383544921875, 0.497344970703125, 0.5181961059570312, 0.5390472412109375, 0.5598983764648438, 0.58074951171875, 0.6016006469726562, 0.6224517822265625, 0.6433029174804688, 0.664154052734375, 0.6850051879882812, 0.7058563232421875, 0.7267074584960938, 0.74755859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 11.0, 17.0, 53.0, 168.0, 415.0, 3352.0, 876505.0, 165968.0, 1585.0, 280.0, 124.0, 46.0, 13.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.888671875, -1.831207275390625, -1.77374267578125, -1.716278076171875, -1.6588134765625, -1.601348876953125, -1.54388427734375, -1.486419677734375, -1.428955078125, -1.371490478515625, -1.31402587890625, -1.256561279296875, -1.1990966796875, -1.141632080078125, -1.08416748046875, -1.026702880859375, -0.96923828125, -0.911773681640625, -0.85430908203125, -0.796844482421875, -0.7393798828125, -0.681915283203125, -0.62445068359375, -0.566986083984375, -0.509521484375, -0.452056884765625, -0.39459228515625, -0.337127685546875, -0.2796630859375, -0.222198486328125, -0.16473388671875, -0.107269287109375, -0.0498046875, 0.007659912109375, 0.06512451171875, 0.122589111328125, 0.1800537109375, 0.237518310546875, 0.29498291015625, 0.352447509765625, 0.409912109375, 0.467376708984375, 0.52484130859375, 0.582305908203125, 0.6397705078125, 0.697235107421875, 0.75469970703125, 0.812164306640625, 0.86962890625, 0.927093505859375, 0.98455810546875, 1.042022705078125, 1.0994873046875, 1.156951904296875, 1.21441650390625, 1.271881103515625, 1.329345703125, 1.386810302734375, 1.44427490234375, 1.501739501953125, 1.5592041015625, 1.616668701171875, 1.67413330078125, 1.731597900390625, 1.7890625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 11.0, 11.0, 21.0, 26.0, 49.0, 75.0, 91.0, 137.0, 162.0, 126.0, 108.0, 66.0, 49.0, 27.0, 17.0, 7.0, 10.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.259845733642578e-05, -6.901286542415619e-05, -6.54272735118866e-05, -6.1841681599617e-05, -5.825608968734741e-05, -5.467049777507782e-05, -5.108490586280823e-05, -4.7499313950538635e-05, -4.391372203826904e-05, -4.032813012599945e-05, -3.674253821372986e-05, -3.3156946301460266e-05, -2.9571354389190674e-05, -2.598576247692108e-05, -2.240017056465149e-05, -1.8814578652381897e-05, -1.5228986740112305e-05, -1.1643394827842712e-05, -8.05780291557312e-06, -4.472211003303528e-06, -8.866190910339355e-07, 2.6989728212356567e-06, 6.284564733505249e-06, 9.870156645774841e-06, 1.3455748558044434e-05, 1.7041340470314026e-05, 2.0626932382583618e-05, 2.421252429485321e-05, 2.7798116207122803e-05, 3.1383708119392395e-05, 3.496930003166199e-05, 3.855489194393158e-05, 4.214048385620117e-05, 4.5726075768470764e-05, 4.9311667680740356e-05, 5.289725959300995e-05, 5.648285150527954e-05, 6.006844341754913e-05, 6.365403532981873e-05, 6.723962724208832e-05, 7.082521915435791e-05, 7.44108110666275e-05, 7.79964029788971e-05, 8.158199489116669e-05, 8.516758680343628e-05, 8.875317871570587e-05, 9.233877062797546e-05, 9.592436254024506e-05, 9.950995445251465e-05, 0.00010309554636478424, 0.00010668113827705383, 0.00011026673018932343, 0.00011385232210159302, 0.00011743791401386261, 0.0001210235059261322, 0.0001246090978384018, 0.0001281946897506714, 0.00013178028166294098, 0.00013536587357521057, 0.00013895146548748016, 0.00014253705739974976, 0.00014612264931201935, 0.00014970824122428894, 0.00015329383313655853, 0.00015687942504882812]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 19.0, 55.0, 119.0, 346.0, 3380.0, 1033962.0, 9997.0, 424.0, 165.0, 61.0, 19.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.26904296875, -2.1923828125, -2.11572265625, -2.0390625, -1.96240234375, -1.8857421875, -1.80908203125, -1.732421875, -1.65576171875, -1.5791015625, -1.50244140625, -1.42578125, -1.34912109375, -1.2724609375, -1.19580078125, -1.119140625, -1.04248046875, -0.9658203125, -0.88916015625, -0.8125, -0.73583984375, -0.6591796875, -0.58251953125, -0.505859375, -0.42919921875, -0.3525390625, -0.27587890625, -0.19921875, -0.12255859375, -0.0458984375, 0.03076171875, 0.107421875, 0.18408203125, 0.2607421875, 0.33740234375, 0.4140625, 0.49072265625, 0.5673828125, 0.64404296875, 0.720703125, 0.79736328125, 0.8740234375, 0.95068359375, 1.02734375, 1.10400390625, 1.1806640625, 1.25732421875, 1.333984375, 1.41064453125, 1.4873046875, 1.56396484375, 1.640625, 1.71728515625, 1.7939453125, 1.87060546875, 1.947265625, 2.02392578125, 2.1005859375, 2.17724609375, 2.25390625, 2.33056640625, 2.4072265625, 2.48388671875, 2.560546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 9.0, 12.0, 95.0, 331.0, 406.0, 127.0, 20.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.4935455322265625, -1.442169189453125, -1.3907928466796875, -1.33941650390625, -1.2880401611328125, -1.236663818359375, -1.1852874755859375, -1.1339111328125, -1.0825347900390625, -1.031158447265625, -0.9797821044921875, -0.92840576171875, -0.8770294189453125, -0.825653076171875, -0.7742767333984375, -0.722900390625, -0.6715240478515625, -0.620147705078125, -0.5687713623046875, -0.51739501953125, -0.4660186767578125, -0.414642333984375, -0.3632659912109375, -0.3118896484375, -0.2605133056640625, -0.209136962890625, -0.1577606201171875, -0.10638427734375, -0.0550079345703125, -0.003631591796875, 0.0477447509765625, 0.09912109375, 0.1504974365234375, 0.201873779296875, 0.2532501220703125, 0.30462646484375, 0.3560028076171875, 0.407379150390625, 0.4587554931640625, 0.5101318359375, 0.5615081787109375, 0.612884521484375, 0.6642608642578125, 0.71563720703125, 0.7670135498046875, 0.818389892578125, 0.8697662353515625, 0.921142578125, 0.9725189208984375, 1.023895263671875, 1.0752716064453125, 1.12664794921875, 1.1780242919921875, 1.229400634765625, 1.2807769775390625, 1.3321533203125, 1.3835296630859375, 1.434906005859375, 1.4862823486328125, 1.53765869140625, 1.5890350341796875, 1.640411376953125, 1.6917877197265625, 1.7431640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 8.0, 12.0, 25.0, 95.0, 213.0, 310.0, 208.0, 87.0, 26.0, 16.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.107353210449219, -7.7137064933776855, -7.3200602531433105, -6.926413536071777, -6.532767295837402, -6.139120578765869, -5.745473861694336, -5.351827621459961, -4.958180904388428, -4.5645341873168945, -4.1708879470825195, -3.7772412300109863, -3.3835947513580322, -2.989948272705078, -2.596301555633545, -2.202655076980591, -1.8090085983276367, -1.4153621196746826, -1.021715521812439, -0.6280689239501953, -0.2344224452972412, 0.1592240333557129, 0.5528707504272461, 0.9465172290802002, 1.3401637077331543, 1.7338101863861084, 2.1274566650390625, 2.5211033821105957, 2.91474986076355, 3.308396339416504, 3.702043056488037, 4.09568977355957, 4.489336013793945, 4.8829827308654785, 5.2766289710998535, 5.670275688171387, 6.063921928405762, 6.457568645477295, 6.851215362548828, 7.244861602783203, 7.638508319854736, 8.03215503692627, 8.425801277160645, 8.819448471069336, 9.213094711303711, 9.606740951538086, 10.000387191772461, 10.394034385681152, 10.787680625915527, 11.181326866149902, 11.574974060058594, 11.968620300292969, 12.362266540527344, 12.755912780761719, 13.14955997467041, 13.543206214904785, 13.936853408813477, 14.330499649047852, 14.724146842956543, 15.117793083190918, 15.511439323425293, 15.905086517333984, 16.29873275756836, 16.692378997802734, 17.08602523803711]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 8.0, 10.0, 5.0, 13.0, 15.0, 7.0, 14.0, 23.0, 24.0, 21.0, 28.0, 29.0, 23.0, 38.0, 40.0, 35.0, 43.0, 36.0, 50.0, 32.0, 40.0, 43.0, 39.0, 36.0, 54.0, 39.0, 31.0, 34.0, 23.0, 27.0, 24.0, 21.0, 24.0, 12.0, 11.0, 7.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 5.0], "bins": [-3.5458197593688965, -3.450713872909546, -3.3556082248687744, -3.260502338409424, -3.1653966903686523, -3.0702908039093018, -2.975184917449951, -2.8800792694091797, -2.784973621368408, -2.6898677349090576, -2.594762086868286, -2.4996562004089355, -2.404550552368164, -2.3094446659088135, -2.214338779449463, -2.1192331314086914, -2.024127244949341, -1.9290214776992798, -1.8339157104492188, -1.7388098239898682, -1.6437041759490967, -1.548598289489746, -1.453492522239685, -1.358386754989624, -1.263280987739563, -1.168175220489502, -1.073069453239441, -0.9779636263847351, -0.8828578591346741, -0.787752091884613, -0.6926462650299072, -0.5975404977798462, -0.502434492111206, -0.407328724861145, -0.3122229278087616, -0.21711713075637817, -0.12201136350631714, -0.026905596256256104, 0.06820023059844971, 0.16330599784851074, 0.2584117650985718, 0.3535175323486328, 0.44862332940101624, 0.5437291264533997, 0.6388348937034607, 0.7339406609535217, 0.8290464878082275, 0.9241522550582886, 1.0192580223083496, 1.1143637895584106, 1.2094695568084717, 1.3045754432678223, 1.3996810913085938, 1.4947869777679443, 1.5898927450180054, 1.6849985122680664, 1.7801042795181274, 1.8752100467681885, 1.9703158140182495, 2.0654215812683105, 2.160527467727661, 2.2556331157684326, 2.350739002227783, 2.4458446502685547, 2.5409505367279053]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 9.0, 3.0, 11.0, 26.0, 31.0, 36.0, 62.0, 131.0, 196.0, 404.0, 861.0, 2048.0, 7225.0, 37962.0, 1496392.0, 2598875.0, 38647.0, 7203.0, 2167.0, 832.0, 411.0, 216.0, 147.0, 97.0, 61.0, 61.0, 39.0, 28.0, 22.0, 18.0, 15.0, 7.0, 9.0, 4.0, 4.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.4150390625, -1.3645172119140625, -1.313995361328125, -1.2634735107421875, -1.21295166015625, -1.1624298095703125, -1.111907958984375, -1.0613861083984375, -1.0108642578125, -0.9603424072265625, -0.909820556640625, -0.8592987060546875, -0.80877685546875, -0.7582550048828125, -0.707733154296875, -0.6572113037109375, -0.606689453125, -0.5561676025390625, -0.505645751953125, -0.4551239013671875, -0.40460205078125, -0.3540802001953125, -0.303558349609375, -0.2530364990234375, -0.2025146484375, -0.1519927978515625, -0.101470947265625, -0.0509490966796875, -0.00042724609375, 0.0500946044921875, 0.100616455078125, 0.1511383056640625, 0.20166015625, 0.2521820068359375, 0.302703857421875, 0.3532257080078125, 0.40374755859375, 0.4542694091796875, 0.504791259765625, 0.5553131103515625, 0.6058349609375, 0.6563568115234375, 0.706878662109375, 0.7574005126953125, 0.80792236328125, 0.8584442138671875, 0.908966064453125, 0.9594879150390625, 1.010009765625, 1.0605316162109375, 1.111053466796875, 1.1615753173828125, 1.21209716796875, 1.2626190185546875, 1.313140869140625, 1.3636627197265625, 1.4141845703125, 1.4647064208984375, 1.515228271484375, 1.5657501220703125, 1.61627197265625, 1.6667938232421875, 1.717315673828125, 1.7678375244140625, 1.818359375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 17.0, 14.0, 31.0, 63.0, 94.0, 98.0, 94.0, 112.0, 110.0, 77.0, 74.0, 72.0, 41.0, 37.0, 26.0, 12.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.2492218017578125, -0.237701416015625, -0.2261810302734375, -0.21466064453125, -0.2031402587890625, -0.191619873046875, -0.1800994873046875, -0.1685791015625, -0.1570587158203125, -0.145538330078125, -0.1340179443359375, -0.12249755859375, -0.1109771728515625, -0.099456787109375, -0.0879364013671875, -0.076416015625, -0.0648956298828125, -0.053375244140625, -0.0418548583984375, -0.03033447265625, -0.0188140869140625, -0.007293701171875, 0.0042266845703125, 0.0157470703125, 0.0272674560546875, 0.038787841796875, 0.0503082275390625, 0.06182861328125, 0.0733489990234375, 0.084869384765625, 0.0963897705078125, 0.10791015625, 0.1194305419921875, 0.130950927734375, 0.1424713134765625, 0.15399169921875, 0.1655120849609375, 0.177032470703125, 0.1885528564453125, 0.2000732421875, 0.2115936279296875, 0.223114013671875, 0.2346343994140625, 0.24615478515625, 0.2576751708984375, 0.269195556640625, 0.2807159423828125, 0.292236328125, 0.3037567138671875, 0.315277099609375, 0.3267974853515625, 0.33831787109375, 0.3498382568359375, 0.361358642578125, 0.3728790283203125, 0.3843994140625, 0.3959197998046875, 0.407440185546875, 0.4189605712890625, 0.43048095703125, 0.4420013427734375, 0.453521728515625, 0.4650421142578125, 0.4765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 9.0, 9.0, 22.0, 34.0, 63.0, 107.0, 184.0, 431.0, 876.0, 2335.0, 9067.0, 87146.0, 3931138.0, 145602.0, 12395.0, 2928.0, 1033.0, 448.0, 210.0, 108.0, 65.0, 35.0, 16.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5546875, -2.496063232421875, -2.43743896484375, -2.378814697265625, -2.3201904296875, -2.261566162109375, -2.20294189453125, -2.144317626953125, -2.085693359375, -2.027069091796875, -1.96844482421875, -1.909820556640625, -1.8511962890625, -1.792572021484375, -1.73394775390625, -1.675323486328125, -1.61669921875, -1.558074951171875, -1.49945068359375, -1.440826416015625, -1.3822021484375, -1.323577880859375, -1.26495361328125, -1.206329345703125, -1.147705078125, -1.089080810546875, -1.03045654296875, -0.971832275390625, -0.9132080078125, -0.854583740234375, -0.79595947265625, -0.737335205078125, -0.6787109375, -0.620086669921875, -0.56146240234375, -0.502838134765625, -0.4442138671875, -0.385589599609375, -0.32696533203125, -0.268341064453125, -0.209716796875, -0.151092529296875, -0.09246826171875, -0.033843994140625, 0.0247802734375, 0.083404541015625, 0.14202880859375, 0.200653076171875, 0.25927734375, 0.317901611328125, 0.37652587890625, 0.435150146484375, 0.4937744140625, 0.552398681640625, 0.61102294921875, 0.669647216796875, 0.728271484375, 0.786895751953125, 0.84552001953125, 0.904144287109375, 0.9627685546875, 1.021392822265625, 1.08001708984375, 1.138641357421875, 1.197265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 16.0, 15.0, 33.0, 51.0, 97.0, 272.0, 1411.0, 1590.0, 294.0, 106.0, 59.0, 53.0, 34.0, 10.0, 11.0, 4.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.623748779296875, -0.60540771484375, -0.587066650390625, -0.5687255859375, -0.550384521484375, -0.53204345703125, -0.513702392578125, -0.495361328125, -0.477020263671875, -0.45867919921875, -0.440338134765625, -0.4219970703125, -0.403656005859375, -0.38531494140625, -0.366973876953125, -0.3486328125, -0.330291748046875, -0.31195068359375, -0.293609619140625, -0.2752685546875, -0.256927490234375, -0.23858642578125, -0.220245361328125, -0.201904296875, -0.183563232421875, -0.16522216796875, -0.146881103515625, -0.1285400390625, -0.110198974609375, -0.09185791015625, -0.073516845703125, -0.05517578125, -0.036834716796875, -0.01849365234375, -0.000152587890625, 0.0181884765625, 0.036529541015625, 0.05487060546875, 0.073211669921875, 0.091552734375, 0.109893798828125, 0.12823486328125, 0.146575927734375, 0.1649169921875, 0.183258056640625, 0.20159912109375, 0.219940185546875, 0.23828125, 0.256622314453125, 0.27496337890625, 0.293304443359375, 0.3116455078125, 0.329986572265625, 0.34832763671875, 0.366668701171875, 0.385009765625, 0.403350830078125, 0.42169189453125, 0.440032958984375, 0.4583740234375, 0.476715087890625, 0.49505615234375, 0.513397216796875, 0.53173828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 7.0, 27.0, 105.0, 409.0, 342.0, 84.0, 18.0, 5.0, 7.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.522583961486816, -4.281192302703857, -4.039801120758057, -3.7984094619750977, -3.5570180416107178, -3.315626621246338, -3.074235200881958, -2.832843780517578, -2.591452121734619, -2.3500607013702393, -2.1086692810058594, -1.86727774143219, -1.6258862018585205, -1.3844947814941406, -1.1431033611297607, -0.9017118215560913, -0.660320520401001, -0.4189290404319763, -0.17753759026527405, 0.06385385990142822, 0.3052453398704529, 0.5466368198394775, 0.7880282402038574, 1.0294197797775269, 1.2708112001419067, 1.5122026205062866, 1.753594160079956, 1.994985580444336, 2.236377000808716, 2.4777684211730957, 2.7191600799560547, 2.9605515003204346, 3.2019429206848145, 3.4433343410491943, 3.684725761413574, 3.926117420196533, 4.167508602142334, 4.408900260925293, 4.650291442871094, 4.891683101654053, 5.133074760437012, 5.374466419219971, 5.6158576011657715, 5.8572492599487305, 6.098640441894531, 6.34003210067749, 6.581423759460449, 6.82281494140625, 7.064206123352051, 7.30559778213501, 7.5469889640808105, 7.7883806228637695, 8.02977180480957, 8.271163940429688, 8.512555122375488, 8.753946304321289, 8.995338439941406, 9.236729621887207, 9.478121757507324, 9.719512939453125, 9.960904121398926, 10.202295303344727, 10.443687438964844, 10.685078620910645, 10.926469802856445]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 9.0, 13.0, 17.0, 27.0, 39.0, 37.0, 57.0, 66.0, 74.0, 74.0, 84.0, 81.0, 89.0, 75.0, 56.0, 56.0, 30.0, 31.0, 31.0, 21.0, 12.0, 4.0, 4.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9352753162384033, -1.8642559051513672, -1.7932363748550415, -1.7222169637680054, -1.6511974334716797, -1.5801780223846436, -1.5091586112976074, -1.4381392002105713, -1.3671196699142456, -1.2961002588272095, -1.2250807285308838, -1.1540613174438477, -1.0830419063568115, -1.0120223760604858, -0.9410029649734497, -0.8699834942817688, -0.7989640235900879, -0.727944552898407, -0.6569250822067261, -0.5859056711196899, -0.514886200428009, -0.4438667297363281, -0.3728472888469696, -0.3018278479576111, -0.23080837726593018, -0.15978892147541046, -0.08876946568489075, -0.017750009894371033, 0.05326944589614868, 0.12428891658782959, 0.1953083574771881, 0.26632779836654663, 0.33734703063964844, 0.40836650133132935, 0.47938594222068787, 0.5504053831100464, 0.6214248538017273, 0.6924443244934082, 0.7634637355804443, 0.8344832062721252, 0.9055026769638062, 0.9765221476554871, 1.047541618347168, 1.118561029434204, 1.1895804405212402, 1.260599970817566, 1.331619381904602, 1.4026389122009277, 1.4736583232879639, 1.544677734375, 1.6156972646713257, 1.6867166757583618, 1.7577362060546875, 1.8287556171417236, 1.8997750282287598, 1.970794439315796, 2.041813850402832, 2.112833261489868, 2.1838526725769043, 2.2548723220825195, 2.3258917331695557, 2.396911144256592, 2.467930555343628, 2.538949966430664, 2.6099696159362793]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 9.0, 5.0, 8.0, 12.0, 16.0, 24.0, 42.0, 69.0, 73.0, 136.0, 223.0, 394.0, 888.0, 2432.0, 10022.0, 64780.0, 515307.0, 394771.0, 47751.0, 7851.0, 2055.0, 787.0, 353.0, 197.0, 102.0, 88.0, 42.0, 40.0, 22.0, 14.0, 9.0, 10.0, 9.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1728515625, -1.1216888427734375, -1.070526123046875, -1.0193634033203125, -0.96820068359375, -0.9170379638671875, -0.865875244140625, -0.8147125244140625, -0.7635498046875, -0.7123870849609375, -0.661224365234375, -0.6100616455078125, -0.55889892578125, -0.5077362060546875, -0.456573486328125, -0.4054107666015625, -0.354248046875, -0.3030853271484375, -0.251922607421875, -0.2007598876953125, -0.14959716796875, -0.0984344482421875, -0.047271728515625, 0.0038909912109375, 0.0550537109375, 0.1062164306640625, 0.157379150390625, 0.2085418701171875, 0.25970458984375, 0.3108673095703125, 0.362030029296875, 0.4131927490234375, 0.46435546875, 0.5155181884765625, 0.566680908203125, 0.6178436279296875, 0.66900634765625, 0.7201690673828125, 0.771331787109375, 0.8224945068359375, 0.8736572265625, 0.9248199462890625, 0.975982666015625, 1.0271453857421875, 1.07830810546875, 1.1294708251953125, 1.180633544921875, 1.2317962646484375, 1.282958984375, 1.3341217041015625, 1.385284423828125, 1.4364471435546875, 1.48760986328125, 1.5387725830078125, 1.589935302734375, 1.6410980224609375, 1.6922607421875, 1.7434234619140625, 1.794586181640625, 1.8457489013671875, 1.89691162109375, 1.9480743408203125, 1.999237060546875, 2.0503997802734375, 2.1015625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 11.0, 21.0, 31.0, 56.0, 74.0, 100.0, 105.0, 120.0, 127.0, 76.0, 100.0, 67.0, 45.0, 29.0, 17.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2683906555175781, -0.25479888916015625, -0.24120712280273438, -0.2276153564453125, -0.21402359008789062, -0.20043182373046875, -0.18684005737304688, -0.173248291015625, -0.15965652465820312, -0.14606475830078125, -0.13247299194335938, -0.1188812255859375, -0.10528945922851562, -0.09169769287109375, -0.07810592651367188, -0.06451416015625, -0.050922393798828125, -0.03733062744140625, -0.023738861083984375, -0.0101470947265625, 0.003444671630859375, 0.01703643798828125, 0.030628204345703125, 0.044219970703125, 0.057811737060546875, 0.07140350341796875, 0.08499526977539062, 0.0985870361328125, 0.11217880249023438, 0.12577056884765625, 0.13936233520507812, 0.1529541015625, 0.16654586791992188, 0.18013763427734375, 0.19372940063476562, 0.2073211669921875, 0.22091293334960938, 0.23450469970703125, 0.24809646606445312, 0.261688232421875, 0.2752799987792969, 0.28887176513671875, 0.3024635314941406, 0.3160552978515625, 0.3296470642089844, 0.34323883056640625, 0.3568305969238281, 0.37042236328125, 0.3840141296386719, 0.39760589599609375, 0.4111976623535156, 0.4247894287109375, 0.4383811950683594, 0.45197296142578125, 0.4655647277832031, 0.479156494140625, 0.4927482604980469, 0.5063400268554688, 0.5199317932128906, 0.5335235595703125, 0.5471153259277344, 0.5607070922851562, 0.5742988586425781, 0.587890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 13.0, 10.0, 28.0, 29.0, 45.0, 63.0, 113.0, 172.0, 352.0, 674.0, 1676.0, 4958.0, 17921.0, 73710.0, 318234.0, 466619.0, 122869.0, 28864.0, 7829.0, 2429.0, 931.0, 423.0, 195.0, 126.0, 74.0, 47.0, 39.0, 30.0, 15.0, 9.0, 11.0, 7.0, 4.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.9931640625, -0.9649276733398438, -0.9366912841796875, -0.9084548950195312, -0.880218505859375, -0.8519821166992188, -0.8237457275390625, -0.7955093383789062, -0.76727294921875, -0.7390365600585938, -0.7108001708984375, -0.6825637817382812, -0.654327392578125, -0.6260910034179688, -0.5978546142578125, -0.5696182250976562, -0.5413818359375, -0.5131454467773438, -0.4849090576171875, -0.45667266845703125, -0.428436279296875, -0.40019989013671875, -0.3719635009765625, -0.34372711181640625, -0.31549072265625, -0.28725433349609375, -0.2590179443359375, -0.23078155517578125, -0.202545166015625, -0.17430877685546875, -0.1460723876953125, -0.11783599853515625, -0.089599609375, -0.06136322021484375, -0.0331268310546875, -0.00489044189453125, 0.023345947265625, 0.05158233642578125, 0.0798187255859375, 0.10805511474609375, 0.13629150390625, 0.16452789306640625, 0.1927642822265625, 0.22100067138671875, 0.249237060546875, 0.27747344970703125, 0.3057098388671875, 0.33394622802734375, 0.3621826171875, 0.39041900634765625, 0.4186553955078125, 0.44689178466796875, 0.475128173828125, 0.5033645629882812, 0.5316009521484375, 0.5598373413085938, 0.58807373046875, 0.6163101196289062, 0.6445465087890625, 0.6727828979492188, 0.701019287109375, 0.7292556762695312, 0.7574920654296875, 0.7857284545898438, 0.81396484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 8.0, 4.0, 8.0, 6.0, 14.0, 14.0, 18.0, 18.0, 28.0, 25.0, 24.0, 30.0, 35.0, 46.0, 45.0, 54.0, 46.0, 45.0, 40.0, 39.0, 40.0, 41.0, 38.0, 47.0, 34.0, 30.0, 36.0, 18.0, 29.0, 25.0, 23.0, 16.0, 19.0, 13.0, 7.0, 5.0, 6.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6577529907226562, -0.6363067626953125, -0.6148605346679688, -0.593414306640625, -0.5719680786132812, -0.5505218505859375, -0.5290756225585938, -0.50762939453125, -0.48618316650390625, -0.4647369384765625, -0.44329071044921875, -0.421844482421875, -0.40039825439453125, -0.3789520263671875, -0.35750579833984375, -0.3360595703125, -0.31461334228515625, -0.2931671142578125, -0.27172088623046875, -0.250274658203125, -0.22882843017578125, -0.2073822021484375, -0.18593597412109375, -0.16448974609375, -0.14304351806640625, -0.1215972900390625, -0.10015106201171875, -0.078704833984375, -0.05725860595703125, -0.0358123779296875, -0.01436614990234375, 0.007080078125, 0.02852630615234375, 0.0499725341796875, 0.07141876220703125, 0.092864990234375, 0.11431121826171875, 0.1357574462890625, 0.15720367431640625, 0.17864990234375, 0.20009613037109375, 0.2215423583984375, 0.24298858642578125, 0.264434814453125, 0.28588104248046875, 0.3073272705078125, 0.32877349853515625, 0.3502197265625, 0.37166595458984375, 0.3931121826171875, 0.41455841064453125, 0.436004638671875, 0.45745086669921875, 0.4788970947265625, 0.5003433227539062, 0.52178955078125, 0.5432357788085938, 0.5646820068359375, 0.5861282348632812, 0.607574462890625, 0.6290206909179688, 0.6504669189453125, 0.6719131469726562, 0.693359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 10.0, 4.0, 10.0, 18.0, 18.0, 33.0, 58.0, 62.0, 113.0, 194.0, 427.0, 932.0, 3172.0, 19614.0, 243758.0, 692029.0, 76896.0, 8172.0, 1704.0, 592.0, 263.0, 159.0, 108.0, 67.0, 44.0, 38.0, 15.0, 16.0, 13.0, 3.0, 8.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.392578125, -0.3757171630859375, -0.358856201171875, -0.3419952392578125, -0.32513427734375, -0.3082733154296875, -0.291412353515625, -0.2745513916015625, -0.2576904296875, -0.2408294677734375, -0.223968505859375, -0.2071075439453125, -0.19024658203125, -0.1733856201171875, -0.156524658203125, -0.1396636962890625, -0.122802734375, -0.1059417724609375, -0.089080810546875, -0.0722198486328125, -0.05535888671875, -0.0384979248046875, -0.021636962890625, -0.0047760009765625, 0.0120849609375, 0.0289459228515625, 0.045806884765625, 0.0626678466796875, 0.07952880859375, 0.0963897705078125, 0.113250732421875, 0.1301116943359375, 0.14697265625, 0.1638336181640625, 0.180694580078125, 0.1975555419921875, 0.21441650390625, 0.2312774658203125, 0.248138427734375, 0.2649993896484375, 0.2818603515625, 0.2987213134765625, 0.315582275390625, 0.3324432373046875, 0.34930419921875, 0.3661651611328125, 0.383026123046875, 0.3998870849609375, 0.416748046875, 0.4336090087890625, 0.450469970703125, 0.4673309326171875, 0.48419189453125, 0.5010528564453125, 0.517913818359375, 0.5347747802734375, 0.5516357421875, 0.5684967041015625, 0.585357666015625, 0.6022186279296875, 0.61907958984375, 0.6359405517578125, 0.652801513671875, 0.6696624755859375, 0.6865234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 9.0, 19.0, 32.0, 49.0, 79.0, 144.0, 202.0, 182.0, 126.0, 71.0, 49.0, 15.0, 11.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.577108383178711e-05, -8.091423660516739e-05, -7.605738937854767e-05, -7.120054215192795e-05, -6.634369492530823e-05, -6.148684769868851e-05, -5.663000047206879e-05, -5.1773153245449066e-05, -4.6916306018829346e-05, -4.2059458792209625e-05, -3.7202611565589905e-05, -3.2345764338970184e-05, -2.7488917112350464e-05, -2.2632069885730743e-05, -1.7775222659111023e-05, -1.2918375432491302e-05, -8.061528205871582e-06, -3.2046809792518616e-06, 1.6521662473678589e-06, 6.509013473987579e-06, 1.13658607006073e-05, 1.622270792722702e-05, 2.107955515384674e-05, 2.593640238046646e-05, 3.079324960708618e-05, 3.56500968337059e-05, 4.050694406032562e-05, 4.536379128694534e-05, 5.0220638513565063e-05, 5.5077485740184784e-05, 5.9934332966804504e-05, 6.479118019342422e-05, 6.964802742004395e-05, 7.450487464666367e-05, 7.936172187328339e-05, 8.42185690999031e-05, 8.907541632652283e-05, 9.393226355314255e-05, 9.878911077976227e-05, 0.00010364595800638199, 0.00010850280523300171, 0.00011335965245962143, 0.00011821649968624115, 0.00012307334691286087, 0.0001279301941394806, 0.0001327870413661003, 0.00013764388859272003, 0.00014250073581933975, 0.00014735758304595947, 0.0001522144302725792, 0.00015707127749919891, 0.00016192812472581863, 0.00016678497195243835, 0.00017164181917905807, 0.0001764986664056778, 0.00018135551363229752, 0.00018621236085891724, 0.00019106920808553696, 0.00019592605531215668, 0.0002007829025387764, 0.00020563974976539612, 0.00021049659699201584, 0.00021535344421863556, 0.00022021029144525528, 0.000225067138671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 13.0, 18.0, 24.0, 69.0, 131.0, 320.0, 876.0, 4033.0, 59561.0, 861998.0, 113617.0, 6103.0, 1105.0, 368.0, 171.0, 74.0, 35.0, 16.0, 12.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85009765625, -0.827484130859375, -0.80487060546875, -0.782257080078125, -0.7596435546875, -0.737030029296875, -0.71441650390625, -0.691802978515625, -0.669189453125, -0.646575927734375, -0.62396240234375, -0.601348876953125, -0.5787353515625, -0.556121826171875, -0.53350830078125, -0.510894775390625, -0.48828125, -0.465667724609375, -0.44305419921875, -0.420440673828125, -0.3978271484375, -0.375213623046875, -0.35260009765625, -0.329986572265625, -0.307373046875, -0.284759521484375, -0.26214599609375, -0.239532470703125, -0.2169189453125, -0.194305419921875, -0.17169189453125, -0.149078369140625, -0.12646484375, -0.103851318359375, -0.08123779296875, -0.058624267578125, -0.0360107421875, -0.013397216796875, 0.00921630859375, 0.031829833984375, 0.054443359375, 0.077056884765625, 0.09967041015625, 0.122283935546875, 0.1448974609375, 0.167510986328125, 0.19012451171875, 0.212738037109375, 0.2353515625, 0.257965087890625, 0.28057861328125, 0.303192138671875, 0.3258056640625, 0.348419189453125, 0.37103271484375, 0.393646240234375, 0.416259765625, 0.438873291015625, 0.46148681640625, 0.484100341796875, 0.5067138671875, 0.529327392578125, 0.55194091796875, 0.574554443359375, 0.59716796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 12.0, 16.0, 31.0, 66.0, 121.0, 211.0, 217.0, 128.0, 95.0, 47.0, 25.0, 11.0, 9.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9072265625, -0.8871574401855469, -0.8670883178710938, -0.8470191955566406, -0.8269500732421875, -0.8068809509277344, -0.7868118286132812, -0.7667427062988281, -0.746673583984375, -0.7266044616699219, -0.7065353393554688, -0.6864662170410156, -0.6663970947265625, -0.6463279724121094, -0.6262588500976562, -0.6061897277832031, -0.58612060546875, -0.5660514831542969, -0.5459823608398438, -0.5259132385253906, -0.5058441162109375, -0.4857749938964844, -0.46570587158203125, -0.4456367492675781, -0.425567626953125, -0.4054985046386719, -0.38542938232421875, -0.3653602600097656, -0.3452911376953125, -0.3252220153808594, -0.30515289306640625, -0.2850837707519531, -0.2650146484375, -0.24494552612304688, -0.22487640380859375, -0.20480728149414062, -0.1847381591796875, -0.16466903686523438, -0.14459991455078125, -0.12453079223632812, -0.104461669921875, -0.08439254760742188, -0.06432342529296875, -0.044254302978515625, -0.0241851806640625, -0.004116058349609375, 0.01595306396484375, 0.036022186279296875, 0.05609130859375, 0.07616043090820312, 0.09622955322265625, 0.11629867553710938, 0.1363677978515625, 0.15643692016601562, 0.17650604248046875, 0.19657516479492188, 0.216644287109375, 0.23671340942382812, 0.25678253173828125, 0.2768516540527344, 0.2969207763671875, 0.3169898986816406, 0.33705902099609375, 0.3571281433105469, 0.377197265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 10.0, 15.0, 23.0, 47.0, 53.0, 84.0, 100.0, 141.0, 133.0, 117.0, 108.0, 54.0, 34.0, 25.0, 22.0, 6.0, 10.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.417672157287598, -7.24643611907959, -7.075200080871582, -6.903964042663574, -6.732728004455566, -6.561491966247559, -6.390255928039551, -6.219019889831543, -6.047783851623535, -5.876547813415527, -5.7053117752075195, -5.534075736999512, -5.362839698791504, -5.191603660583496, -5.020367622375488, -4.8491315841674805, -4.677895545959473, -4.506659507751465, -4.335423469543457, -4.164187431335449, -3.9929513931274414, -3.8217153549194336, -3.650479316711426, -3.479243278503418, -3.308006763458252, -3.136770725250244, -2.9655346870422363, -2.7942986488342285, -2.6230626106262207, -2.451826572418213, -2.280590534210205, -2.1093544960021973, -1.9381182193756104, -1.7668821811676025, -1.5956461429595947, -1.424410104751587, -1.253174066543579, -1.0819380283355713, -0.9107018709182739, -0.7394658327102661, -0.5682297945022583, -0.3969937562942505, -0.2257576882839203, -0.05452162027359009, 0.11671441793441772, 0.28795045614242554, 0.4591865539550781, 0.6304225921630859, 0.8016586303710938, 0.9728946685791016, 1.1441307067871094, 1.3153667449951172, 1.486602783203125, 1.6578388214111328, 1.8290749788284302, 2.0003108978271484, 2.1715469360351562, 2.342782974243164, 2.514019012451172, 2.6852550506591797, 2.8564910888671875, 3.0277271270751953, 3.198963165283203, 3.370199203491211, 3.541435480117798]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 4.0, 3.0, 8.0, 5.0, 7.0, 4.0, 9.0, 10.0, 18.0, 16.0, 15.0, 19.0, 26.0, 35.0, 47.0, 43.0, 43.0, 54.0, 43.0, 63.0, 36.0, 44.0, 43.0, 46.0, 37.0, 37.0, 38.0, 45.0, 34.0, 31.0, 25.0, 14.0, 27.0, 15.0, 12.0, 12.0, 10.0, 6.0, 5.0, 4.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.011470794677734, -3.9004287719726562, -3.7893869876861572, -3.678344964981079, -3.56730318069458, -3.456261157989502, -3.345219135284424, -3.2341771125793457, -3.1231353282928467, -3.0120933055877686, -2.9010515213012695, -2.7900094985961914, -2.6789674758911133, -2.5679256916046143, -2.456883668899536, -2.345841884613037, -2.234799861907959, -2.123757839202881, -2.012716054916382, -1.9016740322113037, -1.7906321287155151, -1.6795902252197266, -1.5685482025146484, -1.4575062990188599, -1.3464643955230713, -1.2354224920272827, -1.1243805885314941, -1.013338565826416, -0.9022966623306274, -0.7912547588348389, -0.6802127957344055, -0.5691708326339722, -0.4581291675567627, -0.34708723425865173, -0.23604530096054077, -0.1250033676624298, -0.013961434364318848, 0.09708046913146973, 0.20812243223190308, 0.3191643953323364, 0.430206298828125, 0.5412482023239136, 0.6522901654243469, 0.7633321285247803, 0.8743740320205688, 0.9854159355163574, 1.0964579582214355, 1.2074998617172241, 1.3185417652130127, 1.4295836687088013, 1.5406255722045898, 1.651667594909668, 1.7627094984054565, 1.8737514019012451, 1.9847934246063232, 2.0958352088928223, 2.2068772315979004, 2.3179192543029785, 2.4289610385894775, 2.5400030612945557, 2.6510448455810547, 2.762086868286133, 2.873128890991211, 2.984170913696289, 3.095212697982788]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 13.0, 6.0, 13.0, 39.0, 63.0, 101.0, 196.0, 384.0, 731.0, 1827.0, 5312.0, 24543.0, 286135.0, 3809320.0, 51449.0, 9171.0, 2628.0, 1067.0, 479.0, 275.0, 138.0, 110.0, 66.0, 49.0, 49.0, 23.0, 23.0, 17.0, 16.0, 9.0, 8.0, 6.0, 5.0, 1.0, 6.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.333587646484375, -1.27069091796875, -1.207794189453125, -1.1448974609375, -1.082000732421875, -1.01910400390625, -0.956207275390625, -0.893310546875, -0.830413818359375, -0.76751708984375, -0.704620361328125, -0.6417236328125, -0.578826904296875, -0.51593017578125, -0.453033447265625, -0.39013671875, -0.327239990234375, -0.26434326171875, -0.201446533203125, -0.1385498046875, -0.075653076171875, -0.01275634765625, 0.050140380859375, 0.113037109375, 0.175933837890625, 0.23883056640625, 0.301727294921875, 0.3646240234375, 0.427520751953125, 0.49041748046875, 0.553314208984375, 0.6162109375, 0.679107666015625, 0.74200439453125, 0.804901123046875, 0.8677978515625, 0.930694580078125, 0.99359130859375, 1.056488037109375, 1.119384765625, 1.182281494140625, 1.24517822265625, 1.308074951171875, 1.3709716796875, 1.433868408203125, 1.49676513671875, 1.559661865234375, 1.62255859375, 1.685455322265625, 1.74835205078125, 1.811248779296875, 1.8741455078125, 1.937042236328125, 1.99993896484375, 2.062835693359375, 2.125732421875, 2.188629150390625, 2.25152587890625, 2.314422607421875, 2.3773193359375, 2.440216064453125, 2.50311279296875, 2.566009521484375, 2.62890625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 13.0, 12.0, 25.0, 48.0, 52.0, 68.0, 80.0, 95.0, 94.0, 86.0, 94.0, 78.0, 72.0, 51.0, 40.0, 32.0, 23.0, 13.0, 13.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.24350357055664062, -0.23139190673828125, -0.21928024291992188, -0.2071685791015625, -0.19505691528320312, -0.18294525146484375, -0.17083358764648438, -0.158721923828125, -0.14661026000976562, -0.13449859619140625, -0.12238693237304688, -0.1102752685546875, -0.09816360473632812, -0.08605194091796875, -0.07394027709960938, -0.06182861328125, -0.049716949462890625, -0.03760528564453125, -0.025493621826171875, -0.0133819580078125, -0.001270294189453125, 0.01084136962890625, 0.022953033447265625, 0.035064697265625, 0.047176361083984375, 0.05928802490234375, 0.07139968872070312, 0.0835113525390625, 0.09562301635742188, 0.10773468017578125, 0.11984634399414062, 0.1319580078125, 0.14406967163085938, 0.15618133544921875, 0.16829299926757812, 0.1804046630859375, 0.19251632690429688, 0.20462799072265625, 0.21673965454101562, 0.228851318359375, 0.24096298217773438, 0.25307464599609375, 0.2651863098144531, 0.2772979736328125, 0.2894096374511719, 0.30152130126953125, 0.3136329650878906, 0.32574462890625, 0.3378562927246094, 0.34996795654296875, 0.3620796203613281, 0.3741912841796875, 0.3863029479980469, 0.39841461181640625, 0.4105262756347656, 0.422637939453125, 0.4347496032714844, 0.44686126708984375, 0.4589729309082031, 0.4710845947265625, 0.4831962585449219, 0.49530792236328125, 0.5074195861816406, 0.51953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 5.0, 8.0, 12.0, 24.0, 31.0, 39.0, 40.0, 91.0, 141.0, 251.0, 625.0, 2122.0, 9936.0, 79346.0, 3905699.0, 175619.0, 15778.0, 2922.0, 803.0, 327.0, 171.0, 87.0, 77.0, 36.0, 29.0, 22.0, 7.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.623046875, -2.5600433349609375, -2.497039794921875, -2.4340362548828125, -2.37103271484375, -2.3080291748046875, -2.245025634765625, -2.1820220947265625, -2.1190185546875, -2.0560150146484375, -1.993011474609375, -1.9300079345703125, -1.86700439453125, -1.8040008544921875, -1.740997314453125, -1.6779937744140625, -1.614990234375, -1.5519866943359375, -1.488983154296875, -1.4259796142578125, -1.36297607421875, -1.2999725341796875, -1.236968994140625, -1.1739654541015625, -1.1109619140625, -1.0479583740234375, -0.984954833984375, -0.9219512939453125, -0.85894775390625, -0.7959442138671875, -0.732940673828125, -0.6699371337890625, -0.60693359375, -0.5439300537109375, -0.480926513671875, -0.4179229736328125, -0.35491943359375, -0.2919158935546875, -0.228912353515625, -0.1659088134765625, -0.1029052734375, -0.0399017333984375, 0.023101806640625, 0.0861053466796875, 0.14910888671875, 0.2121124267578125, 0.275115966796875, 0.3381195068359375, 0.401123046875, 0.4641265869140625, 0.527130126953125, 0.5901336669921875, 0.65313720703125, 0.7161407470703125, 0.779144287109375, 0.8421478271484375, 0.9051513671875, 0.9681549072265625, 1.031158447265625, 1.0941619873046875, 1.15716552734375, 1.2201690673828125, 1.283172607421875, 1.3461761474609375, 1.4091796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 9.0, 3.0, 5.0, 17.0, 14.0, 21.0, 23.0, 46.0, 47.0, 94.0, 188.0, 381.0, 2179.0, 534.0, 205.0, 100.0, 59.0, 42.0, 31.0, 16.0, 13.0, 10.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.461669921875, -0.4483299255371094, -0.43498992919921875, -0.4216499328613281, -0.4083099365234375, -0.3949699401855469, -0.38162994384765625, -0.3682899475097656, -0.354949951171875, -0.3416099548339844, -0.32826995849609375, -0.3149299621582031, -0.3015899658203125, -0.2882499694824219, -0.27490997314453125, -0.2615699768066406, -0.24822998046875, -0.23488998413085938, -0.22154998779296875, -0.20820999145507812, -0.1948699951171875, -0.18152999877929688, -0.16819000244140625, -0.15485000610351562, -0.141510009765625, -0.12817001342773438, -0.11483001708984375, -0.10149002075195312, -0.0881500244140625, -0.07481002807617188, -0.06147003173828125, -0.048130035400390625, -0.0347900390625, -0.021450042724609375, -0.00811004638671875, 0.005229949951171875, 0.0185699462890625, 0.031909942626953125, 0.04524993896484375, 0.058589935302734375, 0.071929931640625, 0.08526992797851562, 0.09860992431640625, 0.11194992065429688, 0.1252899169921875, 0.13862991333007812, 0.15196990966796875, 0.16530990600585938, 0.17864990234375, 0.19198989868164062, 0.20532989501953125, 0.21866989135742188, 0.2320098876953125, 0.24534988403320312, 0.25868988037109375, 0.2720298767089844, 0.285369873046875, 0.2987098693847656, 0.31204986572265625, 0.3253898620605469, 0.3387298583984375, 0.3520698547363281, 0.36540985107421875, 0.3787498474121094, 0.39208984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 25.0, 100.0, 291.0, 348.0, 154.0, 38.0, 13.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.679964065551758, -7.4977874755859375, -7.315610885620117, -7.133434295654297, -6.951257705688477, -6.769081115722656, -6.586904525756836, -6.404727458953857, -6.222550868988037, -6.040374279022217, -5.8581976890563965, -5.676021099090576, -5.493844509124756, -5.311667442321777, -5.129490852355957, -4.947314262390137, -4.765137672424316, -4.582961082458496, -4.400784492492676, -4.2186079025268555, -4.036431312561035, -3.8542544841766357, -3.6720778942108154, -3.489901065826416, -3.307724952697754, -3.1255483627319336, -2.9433717727661133, -2.761195182800293, -2.5790183544158936, -2.3968417644500732, -2.214665174484253, -2.0324883460998535, -1.8503117561340332, -1.668135166168213, -1.485958456993103, -1.3037818670272827, -1.1216051578521729, -0.9394285678863525, -0.7572519779205322, -0.5750752687454224, -0.39289867877960205, -0.21072204411029816, -0.028545409440994263, 0.15363121032714844, 0.3358078598976135, 0.5179845094680786, 0.7001610994338989, 0.8823378086090088, 1.064514398574829, 1.2466909885406494, 1.4288676977157593, 1.6110442876815796, 1.7932209968566895, 1.9753975868225098, 2.15757417678833, 2.3397507667541504, 2.5219273567199707, 2.704103946685791, 2.8862805366516113, 3.0684571266174316, 3.250633955001831, 3.4328105449676514, 3.6149871349334717, 3.797163963317871, 3.9793405532836914]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 2.0, 1.0, 12.0, 7.0, 11.0, 11.0, 14.0, 19.0, 19.0, 27.0, 25.0, 39.0, 29.0, 38.0, 37.0, 41.0, 50.0, 57.0, 58.0, 49.0, 40.0, 38.0, 43.0, 37.0, 34.0, 31.0, 21.0, 18.0, 39.0, 27.0, 26.0, 14.0, 12.0, 14.0, 7.0, 8.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9652738571166992, -0.9320940971374512, -0.8989143371582031, -0.8657345771789551, -0.832554817199707, -0.799375057220459, -0.7661952376365662, -0.7330154776573181, -0.6998357176780701, -0.666655957698822, -0.633476197719574, -0.6002964377403259, -0.5671166181564331, -0.5339368581771851, -0.500757098197937, -0.46757733821868896, -0.4343975782394409, -0.40121781826019287, -0.3680380582809448, -0.3348582684993744, -0.30167850852012634, -0.2684987485408783, -0.23531897366046906, -0.20213919878005981, -0.16895943880081177, -0.13577967882156372, -0.10259990394115448, -0.06942013651132584, -0.03624036908149719, -0.0030606091022491455, 0.030119165778160095, 0.06329894065856934, 0.09647881984710693, 0.12965857982635498, 0.16283835470676422, 0.19601812958717346, 0.2291978895664215, 0.26237764954566956, 0.29555743932724, 0.32873719930648804, 0.3619169592857361, 0.39509671926498413, 0.4282764792442322, 0.4614562690258026, 0.49463602900505066, 0.5278158187866211, 0.5609955787658691, 0.5941753387451172, 0.6273550987243652, 0.6605348587036133, 0.6937146186828613, 0.7268943786621094, 0.7600741386413574, 0.7932538986206055, 0.8264337182044983, 0.8596134781837463, 0.8927932381629944, 0.9259729981422424, 0.9591527581214905, 0.9923325181007385, 1.0255123376846313, 1.0586920976638794, 1.0918718576431274, 1.1250516176223755, 1.1582313776016235]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 13.0, 26.0, 31.0, 39.0, 56.0, 70.0, 136.0, 229.0, 457.0, 922.0, 2628.0, 10068.0, 55531.0, 366282.0, 505056.0, 86754.0, 14443.0, 3468.0, 1138.0, 500.0, 248.0, 163.0, 109.0, 61.0, 35.0, 23.0, 16.0, 16.0, 9.0, 6.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7939453125, -1.74285888671875, -1.6917724609375, -1.64068603515625, -1.589599609375, -1.53851318359375, -1.4874267578125, -1.43634033203125, -1.38525390625, -1.33416748046875, -1.2830810546875, -1.23199462890625, -1.180908203125, -1.12982177734375, -1.0787353515625, -1.02764892578125, -0.9765625, -0.92547607421875, -0.8743896484375, -0.82330322265625, -0.772216796875, -0.72113037109375, -0.6700439453125, -0.61895751953125, -0.56787109375, -0.51678466796875, -0.4656982421875, -0.41461181640625, -0.363525390625, -0.31243896484375, -0.2613525390625, -0.21026611328125, -0.1591796875, -0.10809326171875, -0.0570068359375, -0.00592041015625, 0.045166015625, 0.09625244140625, 0.1473388671875, 0.19842529296875, 0.24951171875, 0.30059814453125, 0.3516845703125, 0.40277099609375, 0.453857421875, 0.50494384765625, 0.5560302734375, 0.60711669921875, 0.658203125, 0.70928955078125, 0.7603759765625, 0.81146240234375, 0.862548828125, 0.91363525390625, 0.9647216796875, 1.01580810546875, 1.06689453125, 1.11798095703125, 1.1690673828125, 1.22015380859375, 1.271240234375, 1.32232666015625, 1.3734130859375, 1.42449951171875, 1.4755859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 11.0, 18.0, 20.0, 27.0, 42.0, 71.0, 69.0, 83.0, 80.0, 82.0, 102.0, 88.0, 66.0, 51.0, 50.0, 49.0, 28.0, 21.0, 16.0, 15.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.23035621643066406, -0.21815872192382812, -0.2059612274169922, -0.19376373291015625, -0.1815662384033203, -0.16936874389648438, -0.15717124938964844, -0.1449737548828125, -0.13277626037597656, -0.12057876586914062, -0.10838127136230469, -0.09618377685546875, -0.08398628234863281, -0.07178878784179688, -0.05959129333496094, -0.047393798828125, -0.03519630432128906, -0.022998809814453125, -0.010801315307617188, 0.00139617919921875, 0.013593673706054688, 0.025791168212890625, 0.03798866271972656, 0.0501861572265625, 0.06238365173339844, 0.07458114624023438, 0.08677864074707031, 0.09897613525390625, 0.11117362976074219, 0.12337112426757812, 0.13556861877441406, 0.14776611328125, 0.15996360778808594, 0.17216110229492188, 0.1843585968017578, 0.19655609130859375, 0.2087535858154297, 0.22095108032226562, 0.23314857482910156, 0.2453460693359375, 0.25754356384277344, 0.2697410583496094, 0.2819385528564453, 0.29413604736328125, 0.3063335418701172, 0.3185310363769531, 0.33072853088378906, 0.342926025390625, 0.35512351989746094, 0.3673210144042969, 0.3795185089111328, 0.39171600341796875, 0.4039134979248047, 0.4161109924316406, 0.42830848693847656, 0.4405059814453125, 0.45270347595214844, 0.4649009704589844, 0.4770984649658203, 0.48929595947265625, 0.5014934539794922, 0.5136909484863281, 0.5258884429931641, 0.5380859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 7.0, 5.0, 11.0, 20.0, 19.0, 50.0, 59.0, 58.0, 114.0, 139.0, 231.0, 368.0, 624.0, 1043.0, 2085.0, 4271.0, 10501.0, 27113.0, 76137.0, 203748.0, 355504.0, 227574.0, 86225.0, 30853.0, 11790.0, 4867.0, 2253.0, 1129.0, 619.0, 383.0, 222.0, 170.0, 120.0, 83.0, 45.0, 30.0, 18.0, 17.0, 19.0, 15.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6474609375, -0.6269454956054688, -0.6064300537109375, -0.5859146118164062, -0.565399169921875, -0.5448837280273438, -0.5243682861328125, -0.5038528442382812, -0.48333740234375, -0.46282196044921875, -0.4423065185546875, -0.42179107666015625, -0.401275634765625, -0.38076019287109375, -0.3602447509765625, -0.33972930908203125, -0.3192138671875, -0.29869842529296875, -0.2781829833984375, -0.25766754150390625, -0.237152099609375, -0.21663665771484375, -0.1961212158203125, -0.17560577392578125, -0.15509033203125, -0.13457489013671875, -0.1140594482421875, -0.09354400634765625, -0.073028564453125, -0.05251312255859375, -0.0319976806640625, -0.01148223876953125, 0.009033203125, 0.02954864501953125, 0.0500640869140625, 0.07057952880859375, 0.091094970703125, 0.11161041259765625, 0.1321258544921875, 0.15264129638671875, 0.17315673828125, 0.19367218017578125, 0.2141876220703125, 0.23470306396484375, 0.255218505859375, 0.27573394775390625, 0.2962493896484375, 0.31676483154296875, 0.3372802734375, 0.35779571533203125, 0.3783111572265625, 0.39882659912109375, 0.419342041015625, 0.43985748291015625, 0.4603729248046875, 0.48088836669921875, 0.50140380859375, 0.5219192504882812, 0.5424346923828125, 0.5629501342773438, 0.583465576171875, 0.6039810180664062, 0.6244964599609375, 0.6450119018554688, 0.66552734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 6.0, 10.0, 9.0, 9.0, 16.0, 19.0, 14.0, 22.0, 28.0, 28.0, 37.0, 34.0, 38.0, 41.0, 35.0, 53.0, 41.0, 53.0, 50.0, 37.0, 44.0, 31.0, 52.0, 39.0, 33.0, 29.0, 32.0, 32.0, 24.0, 19.0, 14.0, 9.0, 14.0, 6.0, 6.0, 5.0, 10.0, 6.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.0204391479492188, -0.9900970458984375, -0.9597549438476562, -0.929412841796875, -0.8990707397460938, -0.8687286376953125, -0.8383865356445312, -0.80804443359375, -0.7777023315429688, -0.7473602294921875, -0.7170181274414062, -0.686676025390625, -0.6563339233398438, -0.6259918212890625, -0.5956497192382812, -0.5653076171875, -0.5349655151367188, -0.5046234130859375, -0.47428131103515625, -0.443939208984375, -0.41359710693359375, -0.3832550048828125, -0.35291290283203125, -0.32257080078125, -0.29222869873046875, -0.2618865966796875, -0.23154449462890625, -0.201202392578125, -0.17086029052734375, -0.1405181884765625, -0.11017608642578125, -0.079833984375, -0.04949188232421875, -0.0191497802734375, 0.01119232177734375, 0.041534423828125, 0.07187652587890625, 0.1022186279296875, 0.13256072998046875, 0.16290283203125, 0.19324493408203125, 0.2235870361328125, 0.25392913818359375, 0.284271240234375, 0.31461334228515625, 0.3449554443359375, 0.37529754638671875, 0.4056396484375, 0.43598175048828125, 0.4663238525390625, 0.49666595458984375, 0.527008056640625, 0.5573501586914062, 0.5876922607421875, 0.6180343627929688, 0.64837646484375, 0.6787185668945312, 0.7090606689453125, 0.7394027709960938, 0.769744873046875, 0.8000869750976562, 0.8304290771484375, 0.8607711791992188, 0.89111328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 11.0, 11.0, 13.0, 35.0, 79.0, 113.0, 231.0, 521.0, 1242.0, 4732.0, 31110.0, 359428.0, 579385.0, 61319.0, 7338.0, 1726.0, 638.0, 307.0, 149.0, 68.0, 50.0, 19.0, 13.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.626190185546875, -0.60784912109375, -0.589508056640625, -0.5711669921875, -0.552825927734375, -0.53448486328125, -0.516143798828125, -0.497802734375, -0.479461669921875, -0.46112060546875, -0.442779541015625, -0.4244384765625, -0.406097412109375, -0.38775634765625, -0.369415283203125, -0.35107421875, -0.332733154296875, -0.31439208984375, -0.296051025390625, -0.2777099609375, -0.259368896484375, -0.24102783203125, -0.222686767578125, -0.204345703125, -0.186004638671875, -0.16766357421875, -0.149322509765625, -0.1309814453125, -0.112640380859375, -0.09429931640625, -0.075958251953125, -0.0576171875, -0.039276123046875, -0.02093505859375, -0.002593994140625, 0.0157470703125, 0.034088134765625, 0.05242919921875, 0.070770263671875, 0.089111328125, 0.107452392578125, 0.12579345703125, 0.144134521484375, 0.1624755859375, 0.180816650390625, 0.19915771484375, 0.217498779296875, 0.23583984375, 0.254180908203125, 0.27252197265625, 0.290863037109375, 0.3092041015625, 0.327545166015625, 0.34588623046875, 0.364227294921875, 0.382568359375, 0.400909423828125, 0.41925048828125, 0.437591552734375, 0.4559326171875, 0.474273681640625, 0.49261474609375, 0.510955810546875, 0.529296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 17.0, 15.0, 14.0, 19.0, 20.0, 30.0, 35.0, 40.0, 53.0, 57.0, 41.0, 73.0, 65.0, 73.0, 50.0, 70.0, 56.0, 39.0, 46.0, 21.0, 23.0, 19.0, 20.0, 19.0, 7.0, 6.0, 9.0, 7.0, 7.0, 5.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.079673767089844e-05, -5.902908742427826e-05, -5.726143717765808e-05, -5.54937869310379e-05, -5.3726136684417725e-05, -5.1958486437797546e-05, -5.019083619117737e-05, -4.842318594455719e-05, -4.665553569793701e-05, -4.4887885451316833e-05, -4.3120235204696655e-05, -4.135258495807648e-05, -3.95849347114563e-05, -3.781728446483612e-05, -3.604963421821594e-05, -3.4281983971595764e-05, -3.2514333724975586e-05, -3.074668347835541e-05, -2.897903323173523e-05, -2.721138298511505e-05, -2.5443732738494873e-05, -2.3676082491874695e-05, -2.1908432245254517e-05, -2.014078199863434e-05, -1.837313175201416e-05, -1.6605481505393982e-05, -1.4837831258773804e-05, -1.3070181012153625e-05, -1.1302530765533447e-05, -9.534880518913269e-06, -7.76723027229309e-06, -5.999580025672913e-06, -4.231929779052734e-06, -2.464279532432556e-06, -6.966292858123779e-07, 1.0710209608078003e-06, 2.8386712074279785e-06, 4.606321454048157e-06, 6.373971700668335e-06, 8.141621947288513e-06, 9.909272193908691e-06, 1.167692244052887e-05, 1.3444572687149048e-05, 1.5212222933769226e-05, 1.6979873180389404e-05, 1.8747523427009583e-05, 2.051517367362976e-05, 2.228282392024994e-05, 2.4050474166870117e-05, 2.5818124413490295e-05, 2.7585774660110474e-05, 2.9353424906730652e-05, 3.112107515335083e-05, 3.288872539997101e-05, 3.4656375646591187e-05, 3.6424025893211365e-05, 3.819167613983154e-05, 3.995932638645172e-05, 4.17269766330719e-05, 4.349462687969208e-05, 4.5262277126312256e-05, 4.7029927372932434e-05, 4.879757761955261e-05, 5.056522786617279e-05, 5.233287811279297e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 13.0, 25.0, 33.0, 66.0, 110.0, 242.0, 428.0, 1153.0, 3507.0, 14737.0, 85230.0, 428693.0, 414948.0, 80004.0, 13810.0, 3457.0, 1117.0, 423.0, 229.0, 121.0, 79.0, 52.0, 21.0, 10.0, 18.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.56005859375, -0.5456924438476562, -0.5313262939453125, -0.5169601440429688, -0.502593994140625, -0.48822784423828125, -0.4738616943359375, -0.45949554443359375, -0.44512939453125, -0.43076324462890625, -0.4163970947265625, -0.40203094482421875, -0.387664794921875, -0.37329864501953125, -0.3589324951171875, -0.34456634521484375, -0.3302001953125, -0.31583404541015625, -0.3014678955078125, -0.28710174560546875, -0.272735595703125, -0.25836944580078125, -0.2440032958984375, -0.22963714599609375, -0.21527099609375, -0.20090484619140625, -0.1865386962890625, -0.17217254638671875, -0.157806396484375, -0.14344024658203125, -0.1290740966796875, -0.11470794677734375, -0.100341796875, -0.08597564697265625, -0.0716094970703125, -0.05724334716796875, -0.042877197265625, -0.02851104736328125, -0.0141448974609375, 0.00022125244140625, 0.01458740234375, 0.02895355224609375, 0.0433197021484375, 0.05768585205078125, 0.072052001953125, 0.08641815185546875, 0.1007843017578125, 0.11515045166015625, 0.1295166015625, 0.14388275146484375, 0.1582489013671875, 0.17261505126953125, 0.186981201171875, 0.20134735107421875, 0.2157135009765625, 0.23007965087890625, 0.24444580078125, 0.25881195068359375, 0.2731781005859375, 0.28754425048828125, 0.301910400390625, 0.31627655029296875, 0.3306427001953125, 0.34500885009765625, 0.359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 8.0, 3.0, 11.0, 13.0, 14.0, 23.0, 22.0, 26.0, 32.0, 43.0, 42.0, 69.0, 68.0, 62.0, 64.0, 69.0, 65.0, 59.0, 50.0, 47.0, 34.0, 44.0, 30.0, 21.0, 13.0, 18.0, 18.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342529296875, -0.3314857482910156, -0.32044219970703125, -0.3093986511230469, -0.2983551025390625, -0.2873115539550781, -0.27626800537109375, -0.2652244567871094, -0.254180908203125, -0.24313735961914062, -0.23209381103515625, -0.22105026245117188, -0.2100067138671875, -0.19896316528320312, -0.18791961669921875, -0.17687606811523438, -0.16583251953125, -0.15478897094726562, -0.14374542236328125, -0.13270187377929688, -0.1216583251953125, -0.11061477661132812, -0.09957122802734375, -0.08852767944335938, -0.077484130859375, -0.06644058227539062, -0.05539703369140625, -0.044353485107421875, -0.0333099365234375, -0.022266387939453125, -0.01122283935546875, -0.000179290771484375, 0.0108642578125, 0.021907806396484375, 0.03295135498046875, 0.043994903564453125, 0.0550384521484375, 0.06608200073242188, 0.07712554931640625, 0.08816909790039062, 0.099212646484375, 0.11025619506835938, 0.12129974365234375, 0.13234329223632812, 0.1433868408203125, 0.15443038940429688, 0.16547393798828125, 0.17651748657226562, 0.18756103515625, 0.19860458374023438, 0.20964813232421875, 0.22069168090820312, 0.2317352294921875, 0.24277877807617188, 0.25382232666015625, 0.2648658752441406, 0.275909423828125, 0.2869529724121094, 0.29799652099609375, 0.3090400695800781, 0.3200836181640625, 0.3311271667480469, 0.34217071533203125, 0.3532142639160156, 0.3642578125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 4.0, 12.0, 9.0, 18.0, 21.0, 37.0, 54.0, 70.0, 114.0, 119.0, 140.0, 125.0, 84.0, 69.0, 45.0, 22.0, 25.0, 9.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.03009033203125, -9.813689231872559, -9.597288131713867, -9.380887031555176, -9.164485931396484, -8.948084831237793, -8.731683731079102, -8.515283584594727, -8.298882484436035, -8.082481384277344, -7.866080284118652, -7.649679183959961, -7.433278560638428, -7.216877460479736, -7.000476360321045, -6.7840752601623535, -6.567673683166504, -6.3512725830078125, -6.134871482849121, -5.91847038269043, -5.7020697593688965, -5.485668659210205, -5.269267559051514, -5.052866458892822, -4.836465835571289, -4.620064735412598, -4.403663635253906, -4.187262535095215, -3.9708616733551025, -3.7544608116149902, -3.538059711456299, -3.3216586112976074, -3.105257272720337, -2.8888561725616455, -2.672455310821533, -2.456054210662842, -2.2396531105041504, -2.023252010345459, -1.8068511486053467, -1.5904500484466553, -1.3740490674972534, -1.1576480865478516, -0.9412469863891602, -0.7248460054397583, -0.5084449648857117, -0.29204392433166504, -0.07564294338226318, 0.14075815677642822, 0.3571591377258301, 0.5735601782798767, 0.7899612188339233, 1.0063621997833252, 1.2227632999420166, 1.4391642808914185, 1.6555652618408203, 1.8719663619995117, 2.088367462158203, 2.3047685623168945, 2.521169424057007, 2.7375705242156982, 2.9539716243743896, 3.170372486114502, 3.3867735862731934, 3.6031746864318848, 3.819575548171997]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 9.0, 13.0, 10.0, 9.0, 17.0, 22.0, 10.0, 26.0, 35.0, 28.0, 21.0, 28.0, 38.0, 35.0, 40.0, 34.0, 39.0, 50.0, 34.0, 37.0, 43.0, 39.0, 37.0, 38.0, 31.0, 31.0, 34.0, 29.0, 30.0, 19.0, 29.0, 13.0, 17.0, 15.0, 8.0, 12.0, 6.0, 12.0, 8.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.842136383056641, -4.691004753112793, -4.5398736000061035, -4.388741970062256, -4.237610816955566, -4.086479187011719, -3.935347557067871, -3.7842161655426025, -3.633084774017334, -3.4819533824920654, -3.330821990966797, -3.179690361022949, -3.0285589694976807, -2.877427577972412, -2.7262959480285645, -2.575164556503296, -2.4240331649780273, -2.272901773452759, -2.1217703819274902, -1.9706387519836426, -1.819507360458374, -1.6683759689331055, -1.5172444581985474, -1.3661129474639893, -1.2149815559387207, -1.0638501644134521, -0.912718653678894, -0.7615872025489807, -0.6104557514190674, -0.45932430028915405, -0.3081928491592407, -0.15706133842468262, -0.0059299468994140625, 0.14520150423049927, 0.2963329553604126, 0.4474644064903259, 0.5985958576202393, 0.7497273087501526, 0.9008587598800659, 1.051990270614624, 1.2031216621398926, 1.3542530536651611, 1.5053845643997192, 1.6565160751342773, 1.807647466659546, 1.9587788581848145, 2.109910488128662, 2.2610418796539307, 2.412173271179199, 2.5633046627044678, 2.7144360542297363, 2.865567684173584, 3.0166990756988525, 3.167830467224121, 3.3189620971679688, 3.4700934886932373, 3.621224880218506, 3.7723562717437744, 3.923487663269043, 4.074619293212891, 4.225750923156738, 4.376882076263428, 4.528013706207275, 4.679144859313965, 4.8302764892578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 7.0, 15.0, 16.0, 33.0, 82.0, 126.0, 293.0, 626.0, 1538.0, 4097.0, 14983.0, 91163.0, 3857692.0, 191567.0, 22471.0, 5678.0, 1926.0, 802.0, 440.0, 230.0, 138.0, 98.0, 68.0, 44.0, 35.0, 19.0, 26.0, 19.0, 9.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.8408203125, -1.7807464599609375, -1.720672607421875, -1.6605987548828125, -1.60052490234375, -1.5404510498046875, -1.480377197265625, -1.4203033447265625, -1.3602294921875, -1.3001556396484375, -1.240081787109375, -1.1800079345703125, -1.11993408203125, -1.0598602294921875, -0.999786376953125, -0.9397125244140625, -0.879638671875, -0.8195648193359375, -0.759490966796875, -0.6994171142578125, -0.63934326171875, -0.5792694091796875, -0.519195556640625, -0.4591217041015625, -0.3990478515625, -0.3389739990234375, -0.278900146484375, -0.2188262939453125, -0.15875244140625, -0.0986785888671875, -0.038604736328125, 0.0214691162109375, 0.08154296875, 0.1416168212890625, 0.201690673828125, 0.2617645263671875, 0.32183837890625, 0.3819122314453125, 0.441986083984375, 0.5020599365234375, 0.5621337890625, 0.6222076416015625, 0.682281494140625, 0.7423553466796875, 0.80242919921875, 0.8625030517578125, 0.922576904296875, 0.9826507568359375, 1.042724609375, 1.1027984619140625, 1.162872314453125, 1.2229461669921875, 1.28302001953125, 1.3430938720703125, 1.403167724609375, 1.4632415771484375, 1.5233154296875, 1.5833892822265625, 1.643463134765625, 1.7035369873046875, 1.76361083984375, 1.8236846923828125, 1.883758544921875, 1.9438323974609375, 2.00390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 8.0, 8.0, 11.0, 14.0, 6.0, 18.0, 40.0, 39.0, 54.0, 63.0, 68.0, 71.0, 73.0, 63.0, 81.0, 71.0, 76.0, 54.0, 41.0, 39.0, 36.0, 27.0, 10.0, 12.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26220703125, -0.2499847412109375, -0.237762451171875, -0.2255401611328125, -0.21331787109375, -0.2010955810546875, -0.188873291015625, -0.1766510009765625, -0.1644287109375, -0.1522064208984375, -0.139984130859375, -0.1277618408203125, -0.11553955078125, -0.1033172607421875, -0.091094970703125, -0.0788726806640625, -0.066650390625, -0.0544281005859375, -0.042205810546875, -0.0299835205078125, -0.01776123046875, -0.0055389404296875, 0.006683349609375, 0.0189056396484375, 0.0311279296875, 0.0433502197265625, 0.055572509765625, 0.0677947998046875, 0.08001708984375, 0.0922393798828125, 0.104461669921875, 0.1166839599609375, 0.12890625, 0.1411285400390625, 0.153350830078125, 0.1655731201171875, 0.17779541015625, 0.1900177001953125, 0.202239990234375, 0.2144622802734375, 0.2266845703125, 0.2389068603515625, 0.251129150390625, 0.2633514404296875, 0.27557373046875, 0.2877960205078125, 0.300018310546875, 0.3122406005859375, 0.324462890625, 0.3366851806640625, 0.348907470703125, 0.3611297607421875, 0.37335205078125, 0.3855743408203125, 0.397796630859375, 0.4100189208984375, 0.4222412109375, 0.4344635009765625, 0.446685791015625, 0.4589080810546875, 0.47113037109375, 0.4833526611328125, 0.495574951171875, 0.5077972412109375, 0.52001953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 12.0, 14.0, 14.0, 27.0, 43.0, 57.0, 84.0, 102.0, 148.0, 215.0, 304.0, 480.0, 833.0, 1623.0, 3656.0, 9095.0, 27929.0, 128337.0, 3483539.0, 456639.0, 54235.0, 15641.0, 5754.0, 2463.0, 1135.0, 637.0, 419.0, 244.0, 162.0, 135.0, 80.0, 65.0, 47.0, 25.0, 22.0, 20.0, 16.0, 6.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.3486328125, -1.3119354248046875, -1.275238037109375, -1.2385406494140625, -1.20184326171875, -1.1651458740234375, -1.128448486328125, -1.0917510986328125, -1.0550537109375, -1.0183563232421875, -0.981658935546875, -0.9449615478515625, -0.90826416015625, -0.8715667724609375, -0.834869384765625, -0.7981719970703125, -0.761474609375, -0.7247772216796875, -0.688079833984375, -0.6513824462890625, -0.61468505859375, -0.5779876708984375, -0.541290283203125, -0.5045928955078125, -0.4678955078125, -0.4311981201171875, -0.394500732421875, -0.3578033447265625, -0.32110595703125, -0.2844085693359375, -0.247711181640625, -0.2110137939453125, -0.17431640625, -0.1376190185546875, -0.100921630859375, -0.0642242431640625, -0.02752685546875, 0.0091705322265625, 0.045867919921875, 0.0825653076171875, 0.1192626953125, 0.1559600830078125, 0.192657470703125, 0.2293548583984375, 0.26605224609375, 0.3027496337890625, 0.339447021484375, 0.3761444091796875, 0.412841796875, 0.4495391845703125, 0.486236572265625, 0.5229339599609375, 0.55963134765625, 0.5963287353515625, 0.633026123046875, 0.6697235107421875, 0.7064208984375, 0.7431182861328125, 0.779815673828125, 0.8165130615234375, 0.85321044921875, 0.8899078369140625, 0.926605224609375, 0.9633026123046875, 1.0]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 13.0, 17.0, 35.0, 65.0, 110.0, 425.0, 2666.0, 473.0, 127.0, 51.0, 26.0, 22.0, 10.0, 6.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7392578125, -0.7064208984375, -0.673583984375, -0.6407470703125, -0.60791015625, -0.5750732421875, -0.542236328125, -0.5093994140625, -0.4765625, -0.4437255859375, -0.410888671875, -0.3780517578125, -0.34521484375, -0.3123779296875, -0.279541015625, -0.2467041015625, -0.2138671875, -0.1810302734375, -0.148193359375, -0.1153564453125, -0.08251953125, -0.0496826171875, -0.016845703125, 0.0159912109375, 0.048828125, 0.0816650390625, 0.114501953125, 0.1473388671875, 0.18017578125, 0.2130126953125, 0.245849609375, 0.2786865234375, 0.3115234375, 0.3443603515625, 0.377197265625, 0.4100341796875, 0.44287109375, 0.4757080078125, 0.508544921875, 0.5413818359375, 0.57421875, 0.6070556640625, 0.639892578125, 0.6727294921875, 0.70556640625, 0.7384033203125, 0.771240234375, 0.8040771484375, 0.8369140625, 0.8697509765625, 0.902587890625, 0.9354248046875, 0.96826171875, 1.0010986328125, 1.033935546875, 1.0667724609375, 1.099609375, 1.1324462890625, 1.165283203125, 1.1981201171875, 1.23095703125, 1.2637939453125, 1.296630859375, 1.3294677734375, 1.3623046875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 4.0, 4.0, 22.0, 42.0, 131.0, 204.0, 236.0, 174.0, 90.0, 51.0, 12.0, 8.0, 1.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.640812397003174, -5.475379943847656, -5.309947490692139, -5.144515037536621, -4.979082107543945, -4.813649654388428, -4.64821720123291, -4.482784748077393, -4.317352294921875, -4.151919841766357, -3.98648738861084, -3.821054697036743, -3.6556222438812256, -3.490189790725708, -3.3247570991516113, -3.1593246459960938, -2.993892192840576, -2.8284597396850586, -2.663027286529541, -2.4975945949554443, -2.3321621417999268, -2.166729688644409, -2.0012969970703125, -1.835864543914795, -1.6704320907592773, -1.5049996376037598, -1.3395670652389526, -1.1741344928741455, -1.008702039718628, -0.8432695269584656, -0.6778370141983032, -0.5124044418334961, -0.3469715118408203, -0.18153899908065796, -0.016106486320495605, 0.14932602643966675, 0.3147585391998291, 0.48019105195999146, 0.6456235647201538, 0.8110561370849609, 0.9764885902404785, 1.141921043395996, 1.3073536157608032, 1.4727861881256104, 1.638218641281128, 1.8036510944366455, 1.9690836668014526, 2.1345162391662598, 2.2999486923217773, 2.465381145477295, 2.6308135986328125, 2.796246290206909, 2.9616787433624268, 3.1271111965179443, 3.292543888092041, 3.4579763412475586, 3.623408794403076, 3.7888412475585938, 3.9542737007141113, 4.119706153869629, 4.285139083862305, 4.450571537017822, 4.61600399017334, 4.781436443328857, 4.946868896484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 6.0, 6.0, 8.0, 12.0, 14.0, 19.0, 21.0, 22.0, 21.0, 32.0, 30.0, 31.0, 45.0, 35.0, 37.0, 53.0, 52.0, 50.0, 40.0, 34.0, 47.0, 45.0, 32.0, 46.0, 45.0, 38.0, 27.0, 28.0, 8.0, 13.0, 16.0, 19.0, 14.0, 10.0, 19.0, 6.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.945880651473999, -1.8837227821350098, -1.8215649127960205, -1.7594070434570312, -1.697249174118042, -1.6350913047790527, -1.5729334354400635, -1.5107754468917847, -1.4486175775527954, -1.3864597082138062, -1.324301838874817, -1.2621439695358276, -1.1999861001968384, -1.1378281116485596, -1.0756702423095703, -1.013512372970581, -0.9513545632362366, -0.8891966938972473, -0.8270388245582581, -0.764880895614624, -0.7027230262756348, -0.6405651569366455, -0.5784072875976562, -0.516249418258667, -0.45409151911735535, -0.3919336497783661, -0.32977575063705444, -0.2676178812980652, -0.20545999705791473, -0.14330211281776428, -0.08114424347877502, -0.01898634433746338, 0.04317152500152588, 0.10532940924167633, 0.16748729348182678, 0.22964516282081604, 0.2918030619621277, 0.35396093130111694, 0.4161188006401062, 0.47827669978141785, 0.5404345989227295, 0.6025924682617188, 0.664750337600708, 0.7269082069396973, 0.7890661358833313, 0.8512240052223206, 0.9133818745613098, 0.9755398035049438, 1.0376975536346436, 1.0998554229736328, 1.162013292312622, 1.2241711616516113, 1.2863290309906006, 1.3484869003295898, 1.410644769668579, 1.472802758216858, 1.5349606275558472, 1.5971184968948364, 1.6592763662338257, 1.721434235572815, 1.7835921049118042, 1.845750093460083, 1.9079079627990723, 1.9700658321380615, 2.032223701477051]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 6.0, 6.0, 10.0, 6.0, 17.0, 14.0, 30.0, 44.0, 51.0, 90.0, 124.0, 211.0, 338.0, 650.0, 1336.0, 3216.0, 9036.0, 30256.0, 117819.0, 390587.0, 354929.0, 99997.0, 25977.0, 8103.0, 2935.0, 1288.0, 611.0, 327.0, 179.0, 122.0, 77.0, 50.0, 37.0, 22.0, 16.0, 11.0, 11.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.345703125, -1.3035736083984375, -1.261444091796875, -1.2193145751953125, -1.17718505859375, -1.1350555419921875, -1.092926025390625, -1.0507965087890625, -1.0086669921875, -0.9665374755859375, -0.924407958984375, -0.8822784423828125, -0.84014892578125, -0.7980194091796875, -0.755889892578125, -0.7137603759765625, -0.671630859375, -0.6295013427734375, -0.587371826171875, -0.5452423095703125, -0.50311279296875, -0.4609832763671875, -0.418853759765625, -0.3767242431640625, -0.3345947265625, -0.2924652099609375, -0.250335693359375, -0.2082061767578125, -0.16607666015625, -0.1239471435546875, -0.081817626953125, -0.0396881103515625, 0.00244140625, 0.0445709228515625, 0.086700439453125, 0.1288299560546875, 0.17095947265625, 0.2130889892578125, 0.255218505859375, 0.2973480224609375, 0.3394775390625, 0.3816070556640625, 0.423736572265625, 0.4658660888671875, 0.50799560546875, 0.5501251220703125, 0.592254638671875, 0.6343841552734375, 0.676513671875, 0.7186431884765625, 0.760772705078125, 0.8029022216796875, 0.84503173828125, 0.8871612548828125, 0.929290771484375, 0.9714202880859375, 1.0135498046875, 1.0556793212890625, 1.097808837890625, 1.1399383544921875, 1.18206787109375, 1.2241973876953125, 1.266326904296875, 1.3084564208984375, 1.3505859375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 11.0, 12.0, 21.0, 16.0, 28.0, 32.0, 50.0, 55.0, 67.0, 62.0, 62.0, 85.0, 73.0, 54.0, 62.0, 54.0, 52.0, 35.0, 41.0, 19.0, 25.0, 18.0, 9.0, 10.0, 10.0, 11.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2431640625, -0.2308502197265625, -0.218536376953125, -0.2062225341796875, -0.19390869140625, -0.1815948486328125, -0.169281005859375, -0.1569671630859375, -0.1446533203125, -0.1323394775390625, -0.120025634765625, -0.1077117919921875, -0.09539794921875, -0.0830841064453125, -0.070770263671875, -0.0584564208984375, -0.046142578125, -0.0338287353515625, -0.021514892578125, -0.0092010498046875, 0.00311279296875, 0.0154266357421875, 0.027740478515625, 0.0400543212890625, 0.0523681640625, 0.0646820068359375, 0.076995849609375, 0.0893096923828125, 0.10162353515625, 0.1139373779296875, 0.126251220703125, 0.1385650634765625, 0.15087890625, 0.1631927490234375, 0.175506591796875, 0.1878204345703125, 0.20013427734375, 0.2124481201171875, 0.224761962890625, 0.2370758056640625, 0.2493896484375, 0.2617034912109375, 0.274017333984375, 0.2863311767578125, 0.29864501953125, 0.3109588623046875, 0.323272705078125, 0.3355865478515625, 0.347900390625, 0.3602142333984375, 0.372528076171875, 0.3848419189453125, 0.39715576171875, 0.4094696044921875, 0.421783447265625, 0.4340972900390625, 0.4464111328125, 0.4587249755859375, 0.471038818359375, 0.4833526611328125, 0.49566650390625, 0.5079803466796875, 0.520294189453125, 0.5326080322265625, 0.544921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 8.0, 15.0, 18.0, 32.0, 55.0, 139.0, 340.0, 877.0, 3184.0, 14923.0, 97405.0, 598087.0, 286312.0, 37650.0, 6798.0, 1654.0, 567.0, 226.0, 100.0, 61.0, 34.0, 15.0, 14.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.09375, -2.0367889404296875, -1.979827880859375, -1.9228668212890625, -1.86590576171875, -1.8089447021484375, -1.751983642578125, -1.6950225830078125, -1.6380615234375, -1.5811004638671875, -1.524139404296875, -1.4671783447265625, -1.41021728515625, -1.3532562255859375, -1.296295166015625, -1.2393341064453125, -1.182373046875, -1.1254119873046875, -1.068450927734375, -1.0114898681640625, -0.95452880859375, -0.8975677490234375, -0.840606689453125, -0.7836456298828125, -0.7266845703125, -0.6697235107421875, -0.612762451171875, -0.5558013916015625, -0.49884033203125, -0.4418792724609375, -0.384918212890625, -0.3279571533203125, -0.27099609375, -0.2140350341796875, -0.157073974609375, -0.1001129150390625, -0.04315185546875, 0.0138092041015625, 0.070770263671875, 0.1277313232421875, 0.1846923828125, 0.2416534423828125, 0.298614501953125, 0.3555755615234375, 0.41253662109375, 0.4694976806640625, 0.526458740234375, 0.5834197998046875, 0.640380859375, 0.6973419189453125, 0.754302978515625, 0.8112640380859375, 0.86822509765625, 0.9251861572265625, 0.982147216796875, 1.0391082763671875, 1.0960693359375, 1.1530303955078125, 1.209991455078125, 1.2669525146484375, 1.32391357421875, 1.3808746337890625, 1.437835693359375, 1.4947967529296875, 1.5517578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 10.0, 6.0, 8.0, 9.0, 16.0, 14.0, 24.0, 18.0, 19.0, 35.0, 38.0, 48.0, 42.0, 36.0, 40.0, 44.0, 73.0, 56.0, 65.0, 47.0, 40.0, 44.0, 40.0, 39.0, 30.0, 37.0, 17.0, 23.0, 16.0, 17.0, 17.0, 10.0, 7.0, 3.0, 5.0, 3.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6591796875, -1.6095428466796875, -1.559906005859375, -1.5102691650390625, -1.46063232421875, -1.4109954833984375, -1.361358642578125, -1.3117218017578125, -1.2620849609375, -1.2124481201171875, -1.162811279296875, -1.1131744384765625, -1.06353759765625, -1.0139007568359375, -0.964263916015625, -0.9146270751953125, -0.864990234375, -0.8153533935546875, -0.765716552734375, -0.7160797119140625, -0.66644287109375, -0.6168060302734375, -0.567169189453125, -0.5175323486328125, -0.4678955078125, -0.4182586669921875, -0.368621826171875, -0.3189849853515625, -0.26934814453125, -0.2197113037109375, -0.170074462890625, -0.1204376220703125, -0.07080078125, -0.0211639404296875, 0.028472900390625, 0.0781097412109375, 0.12774658203125, 0.1773834228515625, 0.227020263671875, 0.2766571044921875, 0.3262939453125, 0.3759307861328125, 0.425567626953125, 0.4752044677734375, 0.52484130859375, 0.5744781494140625, 0.624114990234375, 0.6737518310546875, 0.723388671875, 0.7730255126953125, 0.822662353515625, 0.8722991943359375, 0.92193603515625, 0.9715728759765625, 1.021209716796875, 1.0708465576171875, 1.1204833984375, 1.1701202392578125, 1.219757080078125, 1.2693939208984375, 1.31903076171875, 1.3686676025390625, 1.418304443359375, 1.4679412841796875, 1.517578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 10.0, 14.0, 20.0, 48.0, 83.0, 144.0, 282.0, 565.0, 1452.0, 5571.0, 42230.0, 560387.0, 401976.0, 29098.0, 4410.0, 1167.0, 495.0, 266.0, 126.0, 80.0, 46.0, 32.0, 16.0, 13.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90234375, -0.8731613159179688, -0.8439788818359375, -0.8147964477539062, -0.785614013671875, -0.7564315795898438, -0.7272491455078125, -0.6980667114257812, -0.66888427734375, -0.6397018432617188, -0.6105194091796875, -0.5813369750976562, -0.552154541015625, -0.5229721069335938, -0.4937896728515625, -0.46460723876953125, -0.4354248046875, -0.40624237060546875, -0.3770599365234375, -0.34787750244140625, -0.318695068359375, -0.28951263427734375, -0.2603302001953125, -0.23114776611328125, -0.20196533203125, -0.17278289794921875, -0.1436004638671875, -0.11441802978515625, -0.085235595703125, -0.05605316162109375, -0.0268707275390625, 0.00231170654296875, 0.031494140625, 0.06067657470703125, 0.0898590087890625, 0.11904144287109375, 0.148223876953125, 0.17740631103515625, 0.2065887451171875, 0.23577117919921875, 0.26495361328125, 0.29413604736328125, 0.3233184814453125, 0.35250091552734375, 0.381683349609375, 0.41086578369140625, 0.4400482177734375, 0.46923065185546875, 0.4984130859375, 0.5275955200195312, 0.5567779541015625, 0.5859603881835938, 0.615142822265625, 0.6443252563476562, 0.6735076904296875, 0.7026901245117188, 0.73187255859375, 0.7610549926757812, 0.7902374267578125, 0.8194198608398438, 0.848602294921875, 0.8777847290039062, 0.9069671630859375, 0.9361495971679688, 0.96533203125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 7.0, 2.0, 5.0, 4.0, 5.0, 11.0, 14.0, 16.0, 31.0, 33.0, 33.0, 51.0, 60.0, 83.0, 91.0, 91.0, 78.0, 95.0, 63.0, 59.0, 44.0, 38.0, 16.0, 22.0, 16.0, 10.0, 4.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011032819747924805, -0.0001070583239197731, -0.00010378845036029816, -0.00010051857680082321, -9.724870324134827e-05, -9.397882968187332e-05, -9.070895612239838e-05, -8.743908256292343e-05, -8.416920900344849e-05, -8.089933544397354e-05, -7.76294618844986e-05, -7.435958832502365e-05, -7.10897147655487e-05, -6.781984120607376e-05, -6.454996764659882e-05, -6.128009408712387e-05, -5.8010220527648926e-05, -5.474034696817398e-05, -5.1470473408699036e-05, -4.820059984922409e-05, -4.4930726289749146e-05, -4.16608527302742e-05, -3.8390979170799255e-05, -3.512110561132431e-05, -3.1851232051849365e-05, -2.858135849237442e-05, -2.5311484932899475e-05, -2.204161137342453e-05, -1.8771737813949585e-05, -1.550186425447464e-05, -1.2231990694999695e-05, -8.96211713552475e-06, -5.692243576049805e-06, -2.4223700165748596e-06, 8.475035429000854e-07, 4.1173771023750305e-06, 7.387250661849976e-06, 1.065712422132492e-05, 1.3926997780799866e-05, 1.719687134027481e-05, 2.0466744899749756e-05, 2.37366184592247e-05, 2.7006492018699646e-05, 3.027636557817459e-05, 3.3546239137649536e-05, 3.681611269712448e-05, 4.0085986256599426e-05, 4.335585981607437e-05, 4.6625733375549316e-05, 4.989560693502426e-05, 5.3165480494499207e-05, 5.643535405397415e-05, 5.97052276134491e-05, 6.297510117292404e-05, 6.624497473239899e-05, 6.951484829187393e-05, 7.278472185134888e-05, 7.605459541082382e-05, 7.932446897029877e-05, 8.259434252977371e-05, 8.586421608924866e-05, 8.91340896487236e-05, 9.240396320819855e-05, 9.567383676767349e-05, 9.894371032714844e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 12.0, 17.0, 24.0, 45.0, 64.0, 88.0, 165.0, 238.0, 449.0, 845.0, 1801.0, 4846.0, 17208.0, 82133.0, 407130.0, 420703.0, 86377.0, 17492.0, 4945.0, 1858.0, 911.0, 500.0, 272.0, 163.0, 81.0, 62.0, 37.0, 18.0, 16.0, 8.0, 10.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4931640625, -0.476165771484375, -0.45916748046875, -0.442169189453125, -0.4251708984375, -0.408172607421875, -0.39117431640625, -0.374176025390625, -0.357177734375, -0.340179443359375, -0.32318115234375, -0.306182861328125, -0.2891845703125, -0.272186279296875, -0.25518798828125, -0.238189697265625, -0.22119140625, -0.204193115234375, -0.18719482421875, -0.170196533203125, -0.1531982421875, -0.136199951171875, -0.11920166015625, -0.102203369140625, -0.085205078125, -0.068206787109375, -0.05120849609375, -0.034210205078125, -0.0172119140625, -0.000213623046875, 0.01678466796875, 0.033782958984375, 0.05078125, 0.067779541015625, 0.08477783203125, 0.101776123046875, 0.1187744140625, 0.135772705078125, 0.15277099609375, 0.169769287109375, 0.186767578125, 0.203765869140625, 0.22076416015625, 0.237762451171875, 0.2547607421875, 0.271759033203125, 0.28875732421875, 0.305755615234375, 0.32275390625, 0.339752197265625, 0.35675048828125, 0.373748779296875, 0.3907470703125, 0.407745361328125, 0.42474365234375, 0.441741943359375, 0.458740234375, 0.475738525390625, 0.49273681640625, 0.509735107421875, 0.5267333984375, 0.543731689453125, 0.56072998046875, 0.577728271484375, 0.5947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 7.0, 13.0, 14.0, 18.0, 24.0, 30.0, 43.0, 71.0, 82.0, 127.0, 120.0, 121.0, 95.0, 64.0, 47.0, 40.0, 21.0, 18.0, 13.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.88134765625, -0.8557205200195312, -0.8300933837890625, -0.8044662475585938, -0.778839111328125, -0.7532119750976562, -0.7275848388671875, -0.7019577026367188, -0.67633056640625, -0.6507034301757812, -0.6250762939453125, -0.5994491577148438, -0.573822021484375, -0.5481948852539062, -0.5225677490234375, -0.49694061279296875, -0.4713134765625, -0.44568634033203125, -0.4200592041015625, -0.39443206787109375, -0.368804931640625, -0.34317779541015625, -0.3175506591796875, -0.29192352294921875, -0.26629638671875, -0.24066925048828125, -0.2150421142578125, -0.18941497802734375, -0.163787841796875, -0.13816070556640625, -0.1125335693359375, -0.08690643310546875, -0.061279296875, -0.03565216064453125, -0.0100250244140625, 0.01560211181640625, 0.041229248046875, 0.06685638427734375, 0.0924835205078125, 0.11811065673828125, 0.14373779296875, 0.16936492919921875, 0.1949920654296875, 0.22061920166015625, 0.246246337890625, 0.27187347412109375, 0.2975006103515625, 0.32312774658203125, 0.3487548828125, 0.37438201904296875, 0.4000091552734375, 0.42563629150390625, 0.451263427734375, 0.47689056396484375, 0.5025177001953125, 0.5281448364257812, 0.55377197265625, 0.5793991088867188, 0.6050262451171875, 0.6306533813476562, 0.656280517578125, 0.6819076538085938, 0.7075347900390625, 0.7331619262695312, 0.7587890625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 14.0, 14.0, 37.0, 64.0, 84.0, 156.0, 148.0, 163.0, 115.0, 74.0, 52.0, 32.0, 26.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.134284496307373, -5.749335289001465, -5.364386081695557, -4.979436874389648, -4.594487190246582, -4.209538459777832, -3.8245887756347656, -3.4396395683288574, -3.054690361022949, -2.669741153717041, -2.284791946411133, -1.8998425006866455, -1.5148932933807373, -1.129944086074829, -0.7449946403503418, -0.3600454330444336, 0.02490377426147461, 0.4098530411720276, 0.7948023080825806, 1.1797516345977783, 1.5647008419036865, 1.9496500492095947, 2.334599494934082, 2.7195487022399902, 3.1044979095458984, 3.4894471168518066, 3.874396324157715, 4.259346008300781, 4.644294738769531, 5.029244422912598, 5.414193630218506, 5.799142837524414, 6.184091567993164, 6.569040775299072, 6.9539899826049805, 7.338939666748047, 7.723888397216797, 8.108838081359863, 8.49378776550293, 8.87873649597168, 9.26368522644043, 9.648634910583496, 10.033583641052246, 10.418533325195312, 10.803482055664062, 11.188431739807129, 11.573381423950195, 11.958330154418945, 12.343279838562012, 12.728229522705078, 13.113178253173828, 13.498127937316895, 13.883076667785645, 14.268026351928711, 14.652975082397461, 15.037924766540527, 15.422874450683594, 15.80782413482666, 16.192773818969727, 16.577722549438477, 16.962671279907227, 17.347620010375977, 17.73257064819336, 18.11751937866211, 18.50246810913086]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 2.0, 3.0, 5.0, 9.0, 8.0, 10.0, 19.0, 14.0, 16.0, 24.0, 34.0, 22.0, 31.0, 32.0, 44.0, 37.0, 41.0, 48.0, 44.0, 41.0, 40.0, 57.0, 38.0, 45.0, 35.0, 42.0, 24.0, 32.0, 36.0, 21.0, 23.0, 18.0, 25.0, 14.0, 19.0, 10.0, 6.0, 8.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.193939208984375, -7.955328464508057, -7.7167181968688965, -7.478107452392578, -7.23949670791626, -7.0008864402771, -6.762275695800781, -6.523665428161621, -6.285054683685303, -6.046443939208984, -5.807833671569824, -5.569222927093506, -5.3306121826171875, -5.092001914978027, -4.853391170501709, -4.614780426025391, -4.3761701583862305, -4.137559413909912, -3.898948907852173, -3.6603384017944336, -3.4217278957366943, -3.183117389678955, -2.9445066452026367, -2.7058961391448975, -2.46728515625, -2.2286746501922607, -1.990064024925232, -1.7514533996582031, -1.5128428936004639, -1.274232268333435, -1.0356216430664062, -0.797011137008667, -0.5584006309509277, -0.3197900652885437, -0.08117946982383728, 0.15743112564086914, 0.3960416913032532, 0.6346522569656372, 0.873262882232666, 1.1118733882904053, 1.350484013557434, 1.589094638824463, 1.8277051448822021, 2.0663156509399414, 2.3049263954162598, 2.543536901473999, 2.7821474075317383, 3.0207581520080566, 3.259368658065796, 3.497979164123535, 3.7365899085998535, 3.9752004146575928, 4.213810920715332, 4.45242166519165, 4.691032409667969, 4.929642677307129, 5.168253421783447, 5.406864166259766, 5.645474433898926, 5.884085178375244, 6.1226959228515625, 6.361306190490723, 6.599916934967041, 6.838527679443359, 7.0771379470825195]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 21.0, 40.0, 67.0, 195.0, 809.0, 7667.0, 4162969.0, 20573.0, 1454.0, 287.0, 93.0, 45.0, 20.0, 16.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84765625, -5.6568603515625, -5.466064453125, -5.2752685546875, -5.08447265625, -4.8936767578125, -4.702880859375, -4.5120849609375, -4.3212890625, -4.1304931640625, -3.939697265625, -3.7489013671875, -3.55810546875, -3.3673095703125, -3.176513671875, -2.9857177734375, -2.794921875, -2.6041259765625, -2.413330078125, -2.2225341796875, -2.03173828125, -1.8409423828125, -1.650146484375, -1.4593505859375, -1.2685546875, -1.0777587890625, -0.886962890625, -0.6961669921875, -0.50537109375, -0.3145751953125, -0.123779296875, 0.0670166015625, 0.2578125, 0.4486083984375, 0.639404296875, 0.8302001953125, 1.02099609375, 1.2117919921875, 1.402587890625, 1.5933837890625, 1.7841796875, 1.9749755859375, 2.165771484375, 2.3565673828125, 2.54736328125, 2.7381591796875, 2.928955078125, 3.1197509765625, 3.310546875, 3.5013427734375, 3.692138671875, 3.8829345703125, 4.07373046875, 4.2645263671875, 4.455322265625, 4.6461181640625, 4.8369140625, 5.0277099609375, 5.218505859375, 5.4093017578125, 5.60009765625, 5.7908935546875, 5.981689453125, 6.1724853515625, 6.36328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 14.0, 9.0, 14.0, 18.0, 26.0, 28.0, 34.0, 39.0, 42.0, 51.0, 65.0, 50.0, 61.0, 56.0, 48.0, 52.0, 68.0, 57.0, 59.0, 55.0, 35.0, 28.0, 16.0, 17.0, 10.0, 11.0, 10.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34716796875, -0.3330841064453125, -0.319000244140625, -0.3049163818359375, -0.29083251953125, -0.2767486572265625, -0.262664794921875, -0.2485809326171875, -0.2344970703125, -0.2204132080078125, -0.206329345703125, -0.1922454833984375, -0.17816162109375, -0.1640777587890625, -0.149993896484375, -0.1359100341796875, -0.121826171875, -0.1077423095703125, -0.093658447265625, -0.0795745849609375, -0.06549072265625, -0.0514068603515625, -0.037322998046875, -0.0232391357421875, -0.0091552734375, 0.0049285888671875, 0.019012451171875, 0.0330963134765625, 0.04718017578125, 0.0612640380859375, 0.075347900390625, 0.0894317626953125, 0.103515625, 0.1175994873046875, 0.131683349609375, 0.1457672119140625, 0.15985107421875, 0.1739349365234375, 0.188018798828125, 0.2021026611328125, 0.2161865234375, 0.2302703857421875, 0.244354248046875, 0.2584381103515625, 0.27252197265625, 0.2866058349609375, 0.300689697265625, 0.3147735595703125, 0.328857421875, 0.3429412841796875, 0.357025146484375, 0.3711090087890625, 0.38519287109375, 0.3992767333984375, 0.413360595703125, 0.4274444580078125, 0.4415283203125, 0.4556121826171875, 0.469696044921875, 0.4837799072265625, 0.49786376953125, 0.5119476318359375, 0.526031494140625, 0.5401153564453125, 0.55419921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 11.0, 11.0, 30.0, 30.0, 36.0, 56.0, 78.0, 91.0, 150.0, 207.0, 268.0, 426.0, 671.0, 962.0, 1570.0, 2718.0, 5222.0, 11551.0, 40564.0, 3924259.0, 164373.0, 22715.0, 8103.0, 4003.0, 2185.0, 1297.0, 832.0, 542.0, 400.0, 241.0, 194.0, 132.0, 105.0, 78.0, 43.0, 33.0, 21.0, 18.0, 10.0, 12.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.53125, -1.48724365234375, -1.4432373046875, -1.39923095703125, -1.355224609375, -1.31121826171875, -1.2672119140625, -1.22320556640625, -1.17919921875, -1.13519287109375, -1.0911865234375, -1.04718017578125, -1.003173828125, -0.95916748046875, -0.9151611328125, -0.87115478515625, -0.8271484375, -0.78314208984375, -0.7391357421875, -0.69512939453125, -0.651123046875, -0.60711669921875, -0.5631103515625, -0.51910400390625, -0.47509765625, -0.43109130859375, -0.3870849609375, -0.34307861328125, -0.299072265625, -0.25506591796875, -0.2110595703125, -0.16705322265625, -0.123046875, -0.07904052734375, -0.0350341796875, 0.00897216796875, 0.052978515625, 0.09698486328125, 0.1409912109375, 0.18499755859375, 0.22900390625, 0.27301025390625, 0.3170166015625, 0.36102294921875, 0.405029296875, 0.44903564453125, 0.4930419921875, 0.53704833984375, 0.5810546875, 0.62506103515625, 0.6690673828125, 0.71307373046875, 0.757080078125, 0.80108642578125, 0.8450927734375, 0.88909912109375, 0.93310546875, 0.97711181640625, 1.0211181640625, 1.06512451171875, 1.109130859375, 1.15313720703125, 1.1971435546875, 1.24114990234375, 1.28515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 4.0, 7.0, 11.0, 20.0, 52.0, 137.0, 3525.0, 159.0, 57.0, 31.0, 10.0, 10.0, 14.0, 2.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.404052734375, -0.3926887512207031, -0.38132476806640625, -0.3699607849121094, -0.3585968017578125, -0.3472328186035156, -0.33586883544921875, -0.3245048522949219, -0.313140869140625, -0.3017768859863281, -0.29041290283203125, -0.2790489196777344, -0.2676849365234375, -0.2563209533691406, -0.24495697021484375, -0.23359298706054688, -0.22222900390625, -0.21086502075195312, -0.19950103759765625, -0.18813705444335938, -0.1767730712890625, -0.16540908813476562, -0.15404510498046875, -0.14268112182617188, -0.131317138671875, -0.11995315551757812, -0.10858917236328125, -0.09722518920898438, -0.0858612060546875, -0.07449722290039062, -0.06313323974609375, -0.051769256591796875, -0.0404052734375, -0.029041290283203125, -0.01767730712890625, -0.006313323974609375, 0.0050506591796875, 0.016414642333984375, 0.02777862548828125, 0.039142608642578125, 0.050506591796875, 0.061870574951171875, 0.07323455810546875, 0.08459854125976562, 0.0959625244140625, 0.10732650756835938, 0.11869049072265625, 0.13005447387695312, 0.14141845703125, 0.15278244018554688, 0.16414642333984375, 0.17551040649414062, 0.1868743896484375, 0.19823837280273438, 0.20960235595703125, 0.22096633911132812, 0.232330322265625, 0.24369430541992188, 0.25505828857421875, 0.2664222717285156, 0.2777862548828125, 0.2891502380371094, 0.30051422119140625, 0.3118782043457031, 0.3232421875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 31.0, 92.0, 237.0, 289.0, 190.0, 99.0, 32.0, 16.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0462324619293213, -0.9535099267959595, -0.8607873916625977, -0.7680649161338806, -0.6753423810005188, -0.582619845867157, -0.48989737033843994, -0.3971748352050781, -0.3044523000717163, -0.21172977983951569, -0.11900725960731506, -0.026284754276275635, 0.06643778085708618, 0.159160315990448, 0.25188279151916504, 0.34460532665252686, 0.43732786178588867, 0.5300503969192505, 0.6227729320526123, 0.7154954075813293, 0.8082179427146912, 0.900940477848053, 0.99366295337677, 1.0863854885101318, 1.1791080236434937, 1.2718305587768555, 1.3645530939102173, 1.457275629043579, 1.5499980449676514, 1.6427206993103027, 1.735443115234375, 1.8281656503677368, 1.9208884239196777, 2.01361083984375, 2.1063334941864014, 2.1990559101104736, 2.291778564453125, 2.3845009803771973, 2.4772233963012695, 2.569946050643921, 2.6626687049865723, 2.7553911209106445, 2.848113775253296, 2.940836191177368, 3.0335588455200195, 3.126281261444092, 3.219003677368164, 3.3117263317108154, 3.4044487476348877, 3.49717116355896, 3.5898938179016113, 3.6826162338256836, 3.775338888168335, 3.8680613040924072, 3.9607839584350586, 4.053506374359131, 4.146228790283203, 4.238951206207275, 4.331673622131348, 4.424396514892578, 4.51711893081665, 4.609841346740723, 4.702563762664795, 4.795286178588867, 4.888009071350098]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 11.0, 7.0, 13.0, 10.0, 11.0, 15.0, 12.0, 22.0, 34.0, 26.0, 31.0, 33.0, 43.0, 32.0, 52.0, 46.0, 66.0, 39.0, 38.0, 43.0, 37.0, 40.0, 36.0, 37.0, 33.0, 28.0, 24.0, 21.0, 28.0, 21.0, 22.0, 16.0, 14.0, 4.0, 11.0, 6.0, 2.0, 3.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.7976868748664856, -0.7757668495178223, -0.7538468241691589, -0.7319267988204956, -0.7100067734718323, -0.688086748123169, -0.6661666631698608, -0.6442466974258423, -0.6223266124725342, -0.6004065871238708, -0.5784865617752075, -0.5565665364265442, -0.5346465110778809, -0.5127264857292175, -0.4908064305782318, -0.4688864052295685, -0.44696640968322754, -0.4250463843345642, -0.4031263589859009, -0.38120633363723755, -0.3592863082885742, -0.3373662829399109, -0.31544622778892517, -0.29352620244026184, -0.2716061770915985, -0.24968615174293518, -0.22776612639427185, -0.20584608614444733, -0.183926060795784, -0.16200603544712067, -0.14008599519729614, -0.11816596984863281, -0.09624588489532471, -0.07432585954666138, -0.05240582674741745, -0.030485793948173523, -0.008565768599510193, 0.013354256749153137, 0.03527429699897766, 0.05719432234764099, 0.07911434769630432, 0.10103437304496765, 0.12295440584421158, 0.1448744386434555, 0.16679446399211884, 0.18871448934078217, 0.2106345295906067, 0.23255455493927002, 0.25447458028793335, 0.2763946056365967, 0.29831463098526, 0.32023465633392334, 0.34215468168258667, 0.36407470703125, 0.3859947621822357, 0.40791478753089905, 0.4298348128795624, 0.4517548382282257, 0.47367486357688904, 0.49559491872787476, 0.5175149440765381, 0.5394349694252014, 0.5613549947738647, 0.5832750201225281, 0.6051950454711914]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 7.0, 11.0, 6.0, 10.0, 15.0, 22.0, 21.0, 34.0, 63.0, 86.0, 115.0, 178.0, 326.0, 562.0, 1114.0, 2232.0, 5050.0, 11364.0, 27631.0, 66528.0, 154987.0, 286040.0, 263722.0, 131824.0, 55557.0, 22732.0, 9754.0, 4228.0, 1966.0, 1009.0, 517.0, 280.0, 192.0, 111.0, 70.0, 51.0, 36.0, 28.0, 21.0, 18.0, 14.0, 6.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96240234375, -0.9302139282226562, -0.8980255126953125, -0.8658370971679688, -0.833648681640625, -0.8014602661132812, -0.7692718505859375, -0.7370834350585938, -0.70489501953125, -0.6727066040039062, -0.6405181884765625, -0.6083297729492188, -0.576141357421875, -0.5439529418945312, -0.5117645263671875, -0.47957611083984375, -0.4473876953125, -0.41519927978515625, -0.3830108642578125, -0.35082244873046875, -0.318634033203125, -0.28644561767578125, -0.2542572021484375, -0.22206878662109375, -0.18988037109375, -0.15769195556640625, -0.1255035400390625, -0.09331512451171875, -0.061126708984375, -0.02893829345703125, 0.0032501220703125, 0.03543853759765625, 0.067626953125, 0.09981536865234375, 0.1320037841796875, 0.16419219970703125, 0.196380615234375, 0.22856903076171875, 0.2607574462890625, 0.29294586181640625, 0.32513427734375, 0.35732269287109375, 0.3895111083984375, 0.42169952392578125, 0.453887939453125, 0.48607635498046875, 0.5182647705078125, 0.5504531860351562, 0.5826416015625, 0.6148300170898438, 0.6470184326171875, 0.6792068481445312, 0.711395263671875, 0.7435836791992188, 0.7757720947265625, 0.8079605102539062, 0.84014892578125, 0.8723373413085938, 0.9045257568359375, 0.9367141723632812, 0.968902587890625, 1.0010910034179688, 1.0332794189453125, 1.0654678344726562, 1.09765625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 7.0, 13.0, 11.0, 11.0, 19.0, 24.0, 30.0, 36.0, 27.0, 40.0, 45.0, 51.0, 67.0, 70.0, 54.0, 40.0, 50.0, 63.0, 53.0, 60.0, 48.0, 34.0, 32.0, 27.0, 19.0, 8.0, 12.0, 13.0, 4.0, 2.0, 7.0, 12.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38720703125, -0.37223052978515625, -0.3572540283203125, -0.34227752685546875, -0.327301025390625, -0.31232452392578125, -0.2973480224609375, -0.28237152099609375, -0.26739501953125, -0.25241851806640625, -0.2374420166015625, -0.22246551513671875, -0.207489013671875, -0.19251251220703125, -0.1775360107421875, -0.16255950927734375, -0.1475830078125, -0.13260650634765625, -0.1176300048828125, -0.10265350341796875, -0.087677001953125, -0.07270050048828125, -0.0577239990234375, -0.04274749755859375, -0.02777099609375, -0.01279449462890625, 0.0021820068359375, 0.01715850830078125, 0.032135009765625, 0.04711151123046875, 0.0620880126953125, 0.07706451416015625, 0.092041015625, 0.10701751708984375, 0.1219940185546875, 0.13697052001953125, 0.151947021484375, 0.16692352294921875, 0.1819000244140625, 0.19687652587890625, 0.21185302734375, 0.22682952880859375, 0.2418060302734375, 0.25678253173828125, 0.271759033203125, 0.28673553466796875, 0.3017120361328125, 0.31668853759765625, 0.3316650390625, 0.34664154052734375, 0.3616180419921875, 0.37659454345703125, 0.391571044921875, 0.40654754638671875, 0.4215240478515625, 0.43650054931640625, 0.45147705078125, 0.46645355224609375, 0.4814300537109375, 0.49640655517578125, 0.511383056640625, 0.5263595581054688, 0.5413360595703125, 0.5563125610351562, 0.5712890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 3.0, 4.0, 7.0, 9.0, 22.0, 34.0, 36.0, 64.0, 93.0, 181.0, 348.0, 685.0, 1655.0, 4231.0, 12371.0, 41516.0, 152567.0, 438159.0, 282486.0, 79953.0, 22241.0, 7146.0, 2598.0, 1071.0, 472.0, 225.0, 126.0, 85.0, 59.0, 38.0, 25.0, 5.0, 10.0, 6.0, 5.0, 2.0, 4.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.49609375, -1.4517669677734375, -1.407440185546875, -1.3631134033203125, -1.31878662109375, -1.2744598388671875, -1.230133056640625, -1.1858062744140625, -1.1414794921875, -1.0971527099609375, -1.052825927734375, -1.0084991455078125, -0.96417236328125, -0.9198455810546875, -0.875518798828125, -0.8311920166015625, -0.786865234375, -0.7425384521484375, -0.698211669921875, -0.6538848876953125, -0.60955810546875, -0.5652313232421875, -0.520904541015625, -0.4765777587890625, -0.4322509765625, -0.3879241943359375, -0.343597412109375, -0.2992706298828125, -0.25494384765625, -0.2106170654296875, -0.166290283203125, -0.1219635009765625, -0.07763671875, -0.0333099365234375, 0.011016845703125, 0.0553436279296875, 0.09967041015625, 0.1439971923828125, 0.188323974609375, 0.2326507568359375, 0.2769775390625, 0.3213043212890625, 0.365631103515625, 0.4099578857421875, 0.45428466796875, 0.4986114501953125, 0.542938232421875, 0.5872650146484375, 0.631591796875, 0.6759185791015625, 0.720245361328125, 0.7645721435546875, 0.80889892578125, 0.8532257080078125, 0.897552490234375, 0.9418792724609375, 0.9862060546875, 1.0305328369140625, 1.074859619140625, 1.1191864013671875, 1.16351318359375, 1.2078399658203125, 1.252166748046875, 1.2964935302734375, 1.3408203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 4.0, 11.0, 19.0, 12.0, 15.0, 22.0, 24.0, 28.0, 32.0, 39.0, 38.0, 46.0, 33.0, 46.0, 39.0, 55.0, 44.0, 50.0, 54.0, 55.0, 55.0, 35.0, 49.0, 26.0, 26.0, 19.0, 26.0, 23.0, 13.0, 9.0, 8.0, 10.0, 5.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8316192626953125, -1.763824462890625, -1.6960296630859375, -1.62823486328125, -1.5604400634765625, -1.492645263671875, -1.4248504638671875, -1.3570556640625, -1.2892608642578125, -1.221466064453125, -1.1536712646484375, -1.08587646484375, -1.0180816650390625, -0.950286865234375, -0.8824920654296875, -0.814697265625, -0.7469024658203125, -0.679107666015625, -0.6113128662109375, -0.54351806640625, -0.4757232666015625, -0.407928466796875, -0.3401336669921875, -0.2723388671875, -0.2045440673828125, -0.136749267578125, -0.0689544677734375, -0.00115966796875, 0.0666351318359375, 0.134429931640625, 0.2022247314453125, 0.27001953125, 0.3378143310546875, 0.405609130859375, 0.4734039306640625, 0.54119873046875, 0.6089935302734375, 0.676788330078125, 0.7445831298828125, 0.8123779296875, 0.8801727294921875, 0.947967529296875, 1.0157623291015625, 1.08355712890625, 1.1513519287109375, 1.219146728515625, 1.2869415283203125, 1.354736328125, 1.4225311279296875, 1.490325927734375, 1.5581207275390625, 1.62591552734375, 1.6937103271484375, 1.761505126953125, 1.8292999267578125, 1.8970947265625, 1.9648895263671875, 2.032684326171875, 2.1004791259765625, 2.16827392578125, 2.2360687255859375, 2.303863525390625, 2.3716583251953125, 2.439453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 27.0, 48.0, 128.0, 316.0, 1101.0, 8330.0, 332230.0, 690169.0, 13981.0, 1547.0, 387.0, 156.0, 64.0, 22.0, 15.0, 8.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8671875, -1.8071441650390625, -1.747100830078125, -1.6870574951171875, -1.62701416015625, -1.5669708251953125, -1.506927490234375, -1.4468841552734375, -1.3868408203125, -1.3267974853515625, -1.266754150390625, -1.2067108154296875, -1.14666748046875, -1.0866241455078125, -1.026580810546875, -0.9665374755859375, -0.906494140625, -0.8464508056640625, -0.786407470703125, -0.7263641357421875, -0.66632080078125, -0.6062774658203125, -0.546234130859375, -0.4861907958984375, -0.4261474609375, -0.3661041259765625, -0.306060791015625, -0.2460174560546875, -0.18597412109375, -0.1259307861328125, -0.065887451171875, -0.0058441162109375, 0.05419921875, 0.1142425537109375, 0.174285888671875, 0.2343292236328125, 0.29437255859375, 0.3544158935546875, 0.414459228515625, 0.4745025634765625, 0.5345458984375, 0.5945892333984375, 0.654632568359375, 0.7146759033203125, 0.77471923828125, 0.8347625732421875, 0.894805908203125, 0.9548492431640625, 1.014892578125, 1.0749359130859375, 1.134979248046875, 1.1950225830078125, 1.25506591796875, 1.3151092529296875, 1.375152587890625, 1.4351959228515625, 1.4952392578125, 1.5552825927734375, 1.615325927734375, 1.6753692626953125, 1.73541259765625, 1.7954559326171875, 1.855499267578125, 1.9155426025390625, 1.9755859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 6.0, 9.0, 8.0, 10.0, 15.0, 29.0, 36.0, 38.0, 43.0, 65.0, 69.0, 70.0, 88.0, 86.0, 105.0, 86.0, 65.0, 53.0, 38.0, 17.0, 19.0, 10.0, 8.0, 11.0, 9.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010341405868530273, -9.95611771941185e-05, -9.570829570293427e-05, -9.185541421175003e-05, -8.80025327205658e-05, -8.414965122938156e-05, -8.029676973819733e-05, -7.644388824701309e-05, -7.259100675582886e-05, -6.873812526464462e-05, -6.488524377346039e-05, -6.1032362282276154e-05, -5.717948079109192e-05, -5.3326599299907684e-05, -4.947371780872345e-05, -4.5620836317539215e-05, -4.176795482635498e-05, -3.7915073335170746e-05, -3.406219184398651e-05, -3.0209310352802277e-05, -2.6356428861618042e-05, -2.2503547370433807e-05, -1.8650665879249573e-05, -1.4797784388065338e-05, -1.0944902896881104e-05, -7.092021405696869e-06, -3.2391399145126343e-06, 6.137415766716003e-07, 4.466623067855835e-06, 8.31950455904007e-06, 1.2172386050224304e-05, 1.602526754140854e-05, 1.9878149032592773e-05, 2.3731030523777008e-05, 2.7583912014961243e-05, 3.143679350614548e-05, 3.528967499732971e-05, 3.9142556488513947e-05, 4.299543797969818e-05, 4.6848319470882416e-05, 5.070120096206665e-05, 5.4554082453250885e-05, 5.840696394443512e-05, 6.225984543561935e-05, 6.611272692680359e-05, 6.996560841798782e-05, 7.381848990917206e-05, 7.767137140035629e-05, 8.152425289154053e-05, 8.537713438272476e-05, 8.9230015873909e-05, 9.308289736509323e-05, 9.693577885627747e-05, 0.0001007886603474617, 0.00010464154183864594, 0.00010849442332983017, 0.0001123473048210144, 0.00011620018631219864, 0.00012005306780338287, 0.0001239059492945671, 0.00012775883078575134, 0.00013161171227693558, 0.0001354645937681198, 0.00013931747525930405, 0.00014317035675048828]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 14.0, 24.0, 37.0, 80.0, 211.0, 484.0, 1405.0, 5472.0, 38059.0, 505359.0, 455582.0, 34629.0, 5050.0, 1314.0, 433.0, 190.0, 92.0, 45.0, 18.0, 14.0, 16.0, 4.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2314453125, -1.1981430053710938, -1.1648406982421875, -1.1315383911132812, -1.098236083984375, -1.0649337768554688, -1.0316314697265625, -0.9983291625976562, -0.96502685546875, -0.9317245483398438, -0.8984222412109375, -0.8651199340820312, -0.831817626953125, -0.7985153198242188, -0.7652130126953125, -0.7319107055664062, -0.6986083984375, -0.6653060913085938, -0.6320037841796875, -0.5987014770507812, -0.565399169921875, -0.5320968627929688, -0.4987945556640625, -0.46549224853515625, -0.43218994140625, -0.39888763427734375, -0.3655853271484375, -0.33228302001953125, -0.298980712890625, -0.26567840576171875, -0.2323760986328125, -0.19907379150390625, -0.165771484375, -0.13246917724609375, -0.0991668701171875, -0.06586456298828125, -0.032562255859375, 0.00074005126953125, 0.0340423583984375, 0.06734466552734375, 0.10064697265625, 0.13394927978515625, 0.1672515869140625, 0.20055389404296875, 0.233856201171875, 0.26715850830078125, 0.3004608154296875, 0.33376312255859375, 0.3670654296875, 0.40036773681640625, 0.4336700439453125, 0.46697235107421875, 0.500274658203125, 0.5335769653320312, 0.5668792724609375, 0.6001815795898438, 0.63348388671875, 0.6667861938476562, 0.7000885009765625, 0.7333908081054688, 0.766693115234375, 0.7999954223632812, 0.8332977294921875, 0.8666000366210938, 0.89990234375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 4.0, 1.0, 8.0, 8.0, 9.0, 19.0, 28.0, 38.0, 58.0, 75.0, 98.0, 101.0, 107.0, 107.0, 76.0, 66.0, 49.0, 38.0, 32.0, 19.0, 16.0, 7.0, 7.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1708984375, -1.138763427734375, -1.10662841796875, -1.074493408203125, -1.0423583984375, -1.010223388671875, -0.97808837890625, -0.945953369140625, -0.913818359375, -0.881683349609375, -0.84954833984375, -0.817413330078125, -0.7852783203125, -0.753143310546875, -0.72100830078125, -0.688873291015625, -0.65673828125, -0.624603271484375, -0.59246826171875, -0.560333251953125, -0.5281982421875, -0.496063232421875, -0.46392822265625, -0.431793212890625, -0.399658203125, -0.367523193359375, -0.33538818359375, -0.303253173828125, -0.2711181640625, -0.238983154296875, -0.20684814453125, -0.174713134765625, -0.142578125, -0.110443115234375, -0.07830810546875, -0.046173095703125, -0.0140380859375, 0.018096923828125, 0.05023193359375, 0.082366943359375, 0.114501953125, 0.146636962890625, 0.17877197265625, 0.210906982421875, 0.2430419921875, 0.275177001953125, 0.30731201171875, 0.339447021484375, 0.37158203125, 0.403717041015625, 0.43585205078125, 0.467987060546875, 0.5001220703125, 0.532257080078125, 0.56439208984375, 0.596527099609375, 0.628662109375, 0.660797119140625, 0.69293212890625, 0.725067138671875, 0.7572021484375, 0.789337158203125, 0.82147216796875, 0.853607177734375, 0.8857421875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 15.0, 34.0, 59.0, 71.0, 125.0, 130.0, 126.0, 144.0, 103.0, 63.0, 45.0, 22.0, 20.0, 8.0, 5.0, 11.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.77946949005127, -10.329562187194824, -9.879655838012695, -9.42974853515625, -8.979841232299805, -8.52993392944336, -8.080026626586914, -7.630120277404785, -7.18021297454834, -6.7303056716918945, -6.280398845672607, -5.83049201965332, -5.380584716796875, -4.93067741394043, -4.480770587921143, -4.0308637619018555, -3.58095645904541, -3.131049394607544, -2.6811423301696777, -2.2312352657318115, -1.7813282012939453, -1.331421136856079, -0.8815140724182129, -0.4316070079803467, 0.01830005645751953, 0.46820712089538574, 0.918114185333252, 1.3680212497711182, 1.8179283142089844, 2.2678353786468506, 2.717742443084717, 3.167649507522583, 3.617555618286133, 4.067462921142578, 4.517369747161865, 4.967276573181152, 5.417183876037598, 5.867091178894043, 6.31699800491333, 6.766904830932617, 7.2168121337890625, 7.666719436645508, 8.116626739501953, 8.566533088684082, 9.016440391540527, 9.466347694396973, 9.916254043579102, 10.366161346435547, 10.816068649291992, 11.265975952148438, 11.715883255004883, 12.165789604187012, 12.615696907043457, 13.065604209899902, 13.515510559082031, 13.965417861938477, 14.415325164794922, 14.865232467651367, 15.315139770507812, 15.765046119689941, 16.214954376220703, 16.664859771728516, 17.11476707458496, 17.564674377441406, 18.01458168029785]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 11.0, 13.0, 11.0, 2.0, 15.0, 13.0, 18.0, 28.0, 21.0, 29.0, 20.0, 42.0, 35.0, 45.0, 44.0, 42.0, 48.0, 46.0, 45.0, 52.0, 45.0, 41.0, 44.0, 40.0, 30.0, 34.0, 29.0, 24.0, 20.0, 16.0, 18.0, 12.0, 9.0, 10.0, 12.0, 7.0, 11.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.964408874511719, -9.643903732299805, -9.323399543762207, -9.002894401550293, -8.682389259338379, -8.361885070800781, -8.041379928588867, -7.720874786376953, -7.400370121002197, -7.079865455627441, -6.759360313415527, -6.4388556480407715, -6.118350982666016, -5.797845840454102, -5.477341175079346, -5.15683650970459, -4.836331367492676, -4.51582670211792, -4.195321559906006, -3.87481689453125, -3.554311990737915, -3.23380708694458, -2.913302421569824, -2.5927975177764893, -2.2722926139831543, -1.9517877101898193, -1.631282925605774, -1.3107781410217285, -0.9902732372283936, -0.6697683334350586, -0.3492635488510132, -0.028758764266967773, 0.2917461395263672, 0.6122509837150574, 0.9327558279037476, 1.253260612487793, 1.573765516281128, 1.894270420074463, 2.2147750854492188, 2.5352799892425537, 2.8557848930358887, 3.1762897968292236, 3.4967947006225586, 3.8172993659973145, 4.13780403137207, 4.458309173583984, 4.77881383895874, 5.099318504333496, 5.41982364654541, 5.740328311920166, 6.06083345413208, 6.381338119506836, 6.70184326171875, 7.022347927093506, 7.342852592468262, 7.663357734680176, 7.983862400054932, 8.304367065429688, 8.624872207641602, 8.945377349853516, 9.265881538391113, 9.586386680603027, 9.906891822814941, 10.227396011352539, 10.547901153564453]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 10.0, 8.0, 16.0, 24.0, 31.0, 43.0, 66.0, 99.0, 192.0, 337.0, 602.0, 1214.0, 2793.0, 7386.0, 28560.0, 3951876.0, 171251.0, 19420.0, 5743.0, 2191.0, 1026.0, 510.0, 343.0, 197.0, 109.0, 61.0, 51.0, 37.0, 23.0, 15.0, 11.0, 10.0, 8.0, 6.0, 5.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4375, -1.3819580078125, -1.326416015625, -1.2708740234375, -1.21533203125, -1.1597900390625, -1.104248046875, -1.0487060546875, -0.9931640625, -0.9376220703125, -0.882080078125, -0.8265380859375, -0.77099609375, -0.7154541015625, -0.659912109375, -0.6043701171875, -0.548828125, -0.4932861328125, -0.437744140625, -0.3822021484375, -0.32666015625, -0.2711181640625, -0.215576171875, -0.1600341796875, -0.1044921875, -0.0489501953125, 0.006591796875, 0.0621337890625, 0.11767578125, 0.1732177734375, 0.228759765625, 0.2843017578125, 0.33984375, 0.3953857421875, 0.450927734375, 0.5064697265625, 0.56201171875, 0.6175537109375, 0.673095703125, 0.7286376953125, 0.7841796875, 0.8397216796875, 0.895263671875, 0.9508056640625, 1.00634765625, 1.0618896484375, 1.117431640625, 1.1729736328125, 1.228515625, 1.2840576171875, 1.339599609375, 1.3951416015625, 1.45068359375, 1.5062255859375, 1.561767578125, 1.6173095703125, 1.6728515625, 1.7283935546875, 1.783935546875, 1.8394775390625, 1.89501953125, 1.9505615234375, 2.006103515625, 2.0616455078125, 2.1171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 8.0, 11.0, 16.0, 19.0, 19.0, 31.0, 30.0, 43.0, 48.0, 41.0, 51.0, 69.0, 72.0, 72.0, 62.0, 49.0, 56.0, 45.0, 39.0, 45.0, 27.0, 32.0, 29.0, 19.0, 18.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6240234375, -0.605438232421875, -0.58685302734375, -0.568267822265625, -0.5496826171875, -0.531097412109375, -0.51251220703125, -0.493927001953125, -0.475341796875, -0.456756591796875, -0.43817138671875, -0.419586181640625, -0.4010009765625, -0.382415771484375, -0.36383056640625, -0.345245361328125, -0.32666015625, -0.308074951171875, -0.28948974609375, -0.270904541015625, -0.2523193359375, -0.233734130859375, -0.21514892578125, -0.196563720703125, -0.177978515625, -0.159393310546875, -0.14080810546875, -0.122222900390625, -0.1036376953125, -0.085052490234375, -0.06646728515625, -0.047882080078125, -0.029296875, -0.010711669921875, 0.00787353515625, 0.026458740234375, 0.0450439453125, 0.063629150390625, 0.08221435546875, 0.100799560546875, 0.119384765625, 0.137969970703125, 0.15655517578125, 0.175140380859375, 0.1937255859375, 0.212310791015625, 0.23089599609375, 0.249481201171875, 0.26806640625, 0.286651611328125, 0.30523681640625, 0.323822021484375, 0.3424072265625, 0.360992431640625, 0.37957763671875, 0.398162841796875, 0.416748046875, 0.435333251953125, 0.45391845703125, 0.472503662109375, 0.4910888671875, 0.509674072265625, 0.52825927734375, 0.546844482421875, 0.5654296875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 10.0, 15.0, 17.0, 20.0, 28.0, 41.0, 59.0, 98.0, 141.0, 195.0, 296.0, 432.0, 664.0, 1064.0, 1658.0, 2761.0, 5155.0, 10648.0, 24686.0, 76959.0, 3766543.0, 223620.0, 44716.0, 16841.0, 7564.0, 3871.0, 2226.0, 1411.0, 801.0, 549.0, 394.0, 255.0, 187.0, 104.0, 70.0, 45.0, 37.0, 26.0, 29.0, 8.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1513671875, -1.115142822265625, -1.07891845703125, -1.042694091796875, -1.0064697265625, -0.970245361328125, -0.93402099609375, -0.897796630859375, -0.861572265625, -0.825347900390625, -0.78912353515625, -0.752899169921875, -0.7166748046875, -0.680450439453125, -0.64422607421875, -0.608001708984375, -0.57177734375, -0.535552978515625, -0.49932861328125, -0.463104248046875, -0.4268798828125, -0.390655517578125, -0.35443115234375, -0.318206787109375, -0.281982421875, -0.245758056640625, -0.20953369140625, -0.173309326171875, -0.1370849609375, -0.100860595703125, -0.06463623046875, -0.028411865234375, 0.0078125, 0.044036865234375, 0.08026123046875, 0.116485595703125, 0.1527099609375, 0.188934326171875, 0.22515869140625, 0.261383056640625, 0.297607421875, 0.333831787109375, 0.37005615234375, 0.406280517578125, 0.4425048828125, 0.478729248046875, 0.51495361328125, 0.551177978515625, 0.58740234375, 0.623626708984375, 0.65985107421875, 0.696075439453125, 0.7322998046875, 0.768524169921875, 0.80474853515625, 0.840972900390625, 0.877197265625, 0.913421630859375, 0.94964599609375, 0.985870361328125, 1.0220947265625, 1.058319091796875, 1.09454345703125, 1.130767822265625, 1.1669921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 4.0, 16.0, 20.0, 25.0, 46.0, 77.0, 166.0, 3302.0, 173.0, 80.0, 32.0, 37.0, 19.0, 11.0, 14.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.494140625, -0.48131561279296875, -0.4684906005859375, -0.45566558837890625, -0.442840576171875, -0.43001556396484375, -0.4171905517578125, -0.40436553955078125, -0.39154052734375, -0.37871551513671875, -0.3658905029296875, -0.35306549072265625, -0.340240478515625, -0.32741546630859375, -0.3145904541015625, -0.30176544189453125, -0.2889404296875, -0.27611541748046875, -0.2632904052734375, -0.25046539306640625, -0.237640380859375, -0.22481536865234375, -0.2119903564453125, -0.19916534423828125, -0.18634033203125, -0.17351531982421875, -0.1606903076171875, -0.14786529541015625, -0.135040283203125, -0.12221527099609375, -0.1093902587890625, -0.09656524658203125, -0.083740234375, -0.07091522216796875, -0.0580902099609375, -0.04526519775390625, -0.032440185546875, -0.01961517333984375, -0.0067901611328125, 0.00603485107421875, 0.01885986328125, 0.03168487548828125, 0.0445098876953125, 0.05733489990234375, 0.070159912109375, 0.08298492431640625, 0.0958099365234375, 0.10863494873046875, 0.1214599609375, 0.13428497314453125, 0.1471099853515625, 0.15993499755859375, 0.172760009765625, 0.18558502197265625, 0.1984100341796875, 0.21123504638671875, 0.22406005859375, 0.23688507080078125, 0.2497100830078125, 0.26253509521484375, 0.275360107421875, 0.28818511962890625, 0.3010101318359375, 0.31383514404296875, 0.32666015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 21.0, 90.0, 167.0, 231.0, 242.0, 137.0, 77.0, 29.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.519367218017578, -5.406399250030518, -5.293430805206299, -5.180462837219238, -5.0674943923950195, -4.954526424407959, -4.84155797958374, -4.72859001159668, -4.615621566772461, -4.5026535987854, -4.389685153961182, -4.276717185974121, -4.163748741149902, -4.050780773162842, -3.937812328338623, -3.8248443603515625, -3.711876153945923, -3.598907947540283, -3.4859397411346436, -3.372971534729004, -3.2600033283233643, -3.1470351219177246, -3.034067153930664, -2.9210987091064453, -2.8081307411193848, -2.695162534713745, -2.5821943283081055, -2.469226121902466, -2.356257915496826, -2.2432897090911865, -2.130321502685547, -2.0173535346984863, -1.9043848514556885, -1.7914166450500488, -1.6784484386444092, -1.5654802322387695, -1.4525120258331299, -1.3395438194274902, -1.2265757322311401, -1.1136075258255005, -1.0006393194198608, -0.8876711130142212, -0.7747029066085815, -0.6617347598075867, -0.548766553401947, -0.4357983469963074, -0.3228302001953125, -0.20986199378967285, -0.0968937873840332, 0.01607440412044525, 0.1290425956249237, 0.24201077222824097, 0.3549789786338806, 0.46794718503952026, 0.5809153318405151, 0.6938835382461548, 0.8068517446517944, 0.9198199510574341, 1.0327881574630737, 1.1457562446594238, 1.2587244510650635, 1.3716926574707031, 1.4846608638763428, 1.5976290702819824, 1.710597276687622]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 5.0, 6.0, 10.0, 10.0, 9.0, 8.0, 18.0, 12.0, 14.0, 15.0, 24.0, 26.0, 23.0, 23.0, 41.0, 33.0, 32.0, 36.0, 30.0, 44.0, 40.0, 51.0, 42.0, 41.0, 34.0, 40.0, 42.0, 33.0, 27.0, 22.0, 27.0, 29.0, 22.0, 28.0, 13.0, 16.0, 12.0, 11.0, 13.0, 10.0, 7.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.7974575161933899, -0.7742125391960144, -0.7509675621986389, -0.7277225852012634, -0.7044776082038879, -0.6812326312065125, -0.657987654209137, -0.6347426772117615, -0.611497700214386, -0.5882527232170105, -0.565007746219635, -0.5417627692222595, -0.518517792224884, -0.49527281522750854, -0.47202783823013306, -0.44878286123275757, -0.42553791403770447, -0.402292937040329, -0.3790479600429535, -0.355802983045578, -0.3325580060482025, -0.309313029050827, -0.2860680818557739, -0.26282310485839844, -0.23957811295986176, -0.21633313596248627, -0.19308815896511078, -0.16984319686889648, -0.146598219871521, -0.12335323542356491, -0.10010826587677002, -0.07686328887939453, -0.05361831188201904, -0.030373336747288704, -0.007128361612558365, 0.016116611659526825, 0.03936158865690231, 0.0626065656542778, 0.08585153520107269, 0.10909651219844818, 0.13234148919582367, 0.15558646619319916, 0.17883144319057465, 0.20207640528678894, 0.22532138228416443, 0.24856635928153992, 0.2718113362789154, 0.2950563132762909, 0.3183012902736664, 0.34154626727104187, 0.36479124426841736, 0.38803622126579285, 0.41128119826316833, 0.4345261752605438, 0.4577711224555969, 0.4810160994529724, 0.5042610764503479, 0.5275060534477234, 0.5507510304450989, 0.5739960074424744, 0.5972409844398499, 0.6204859614372253, 0.6437309384346008, 0.6669759154319763, 0.6902208924293518]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 13.0, 14.0, 24.0, 28.0, 55.0, 77.0, 118.0, 177.0, 262.0, 448.0, 742.0, 1192.0, 2261.0, 3898.0, 7331.0, 14877.0, 31939.0, 71406.0, 157678.0, 270853.0, 246870.0, 128387.0, 57304.0, 26131.0, 12321.0, 6144.0, 3373.0, 1779.0, 1077.0, 634.0, 383.0, 253.0, 195.0, 77.0, 82.0, 46.0, 35.0, 22.0, 9.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9306640625, -0.9005126953125, -0.870361328125, -0.8402099609375, -0.81005859375, -0.7799072265625, -0.749755859375, -0.7196044921875, -0.689453125, -0.6593017578125, -0.629150390625, -0.5989990234375, -0.56884765625, -0.5386962890625, -0.508544921875, -0.4783935546875, -0.4482421875, -0.4180908203125, -0.387939453125, -0.3577880859375, -0.32763671875, -0.2974853515625, -0.267333984375, -0.2371826171875, -0.20703125, -0.1768798828125, -0.146728515625, -0.1165771484375, -0.08642578125, -0.0562744140625, -0.026123046875, 0.0040283203125, 0.0341796875, 0.0643310546875, 0.094482421875, 0.1246337890625, 0.15478515625, 0.1849365234375, 0.215087890625, 0.2452392578125, 0.275390625, 0.3055419921875, 0.335693359375, 0.3658447265625, 0.39599609375, 0.4261474609375, 0.456298828125, 0.4864501953125, 0.5166015625, 0.5467529296875, 0.576904296875, 0.6070556640625, 0.63720703125, 0.6673583984375, 0.697509765625, 0.7276611328125, 0.7578125, 0.7879638671875, 0.818115234375, 0.8482666015625, 0.87841796875, 0.9085693359375, 0.938720703125, 0.9688720703125, 0.9990234375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 11.0, 18.0, 16.0, 10.0, 16.0, 31.0, 32.0, 37.0, 38.0, 41.0, 47.0, 52.0, 59.0, 59.0, 48.0, 62.0, 54.0, 57.0, 46.0, 34.0, 37.0, 28.0, 32.0, 26.0, 16.0, 11.0, 16.0, 12.0, 10.0, 9.0, 2.0, 7.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5171279907226562, -0.5000762939453125, -0.48302459716796875, -0.465972900390625, -0.44892120361328125, -0.4318695068359375, -0.41481781005859375, -0.39776611328125, -0.38071441650390625, -0.3636627197265625, -0.34661102294921875, -0.329559326171875, -0.31250762939453125, -0.2954559326171875, -0.27840423583984375, -0.2613525390625, -0.24430084228515625, -0.2272491455078125, -0.21019744873046875, -0.193145751953125, -0.17609405517578125, -0.1590423583984375, -0.14199066162109375, -0.12493896484375, -0.10788726806640625, -0.0908355712890625, -0.07378387451171875, -0.056732177734375, -0.03968048095703125, -0.0226287841796875, -0.00557708740234375, 0.011474609375, 0.02852630615234375, 0.0455780029296875, 0.06262969970703125, 0.079681396484375, 0.09673309326171875, 0.1137847900390625, 0.13083648681640625, 0.14788818359375, 0.16493988037109375, 0.1819915771484375, 0.19904327392578125, 0.216094970703125, 0.23314666748046875, 0.2501983642578125, 0.26725006103515625, 0.2843017578125, 0.30135345458984375, 0.3184051513671875, 0.33545684814453125, 0.352508544921875, 0.36956024169921875, 0.3866119384765625, 0.40366363525390625, 0.42071533203125, 0.43776702880859375, 0.4548187255859375, 0.47187042236328125, 0.488922119140625, 0.5059738159179688, 0.5230255126953125, 0.5400772094726562, 0.55712890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 10.0, 13.0, 24.0, 30.0, 29.0, 59.0, 72.0, 130.0, 214.0, 344.0, 677.0, 1508.0, 3974.0, 14159.0, 79042.0, 529606.0, 353847.0, 49202.0, 10021.0, 2994.0, 1216.0, 565.0, 312.0, 179.0, 99.0, 75.0, 50.0, 36.0, 16.0, 14.0, 8.0, 13.0, 2.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.478515625, -2.409423828125, -2.34033203125, -2.271240234375, -2.2021484375, -2.133056640625, -2.06396484375, -1.994873046875, -1.92578125, -1.856689453125, -1.78759765625, -1.718505859375, -1.6494140625, -1.580322265625, -1.51123046875, -1.442138671875, -1.373046875, -1.303955078125, -1.23486328125, -1.165771484375, -1.0966796875, -1.027587890625, -0.95849609375, -0.889404296875, -0.8203125, -0.751220703125, -0.68212890625, -0.613037109375, -0.5439453125, -0.474853515625, -0.40576171875, -0.336669921875, -0.267578125, -0.198486328125, -0.12939453125, -0.060302734375, 0.0087890625, 0.077880859375, 0.14697265625, 0.216064453125, 0.28515625, 0.354248046875, 0.42333984375, 0.492431640625, 0.5615234375, 0.630615234375, 0.69970703125, 0.768798828125, 0.837890625, 0.906982421875, 0.97607421875, 1.045166015625, 1.1142578125, 1.183349609375, 1.25244140625, 1.321533203125, 1.390625, 1.459716796875, 1.52880859375, 1.597900390625, 1.6669921875, 1.736083984375, 1.80517578125, 1.874267578125, 1.943359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 5.0, 10.0, 9.0, 15.0, 18.0, 15.0, 23.0, 23.0, 32.0, 38.0, 38.0, 51.0, 41.0, 49.0, 60.0, 43.0, 58.0, 50.0, 48.0, 43.0, 58.0, 44.0, 39.0, 37.0, 25.0, 18.0, 18.0, 15.0, 11.0, 14.0, 15.0, 12.0, 6.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.789031982421875, -2.71087646484375, -2.632720947265625, -2.5545654296875, -2.476409912109375, -2.39825439453125, -2.320098876953125, -2.241943359375, -2.163787841796875, -2.08563232421875, -2.007476806640625, -1.9293212890625, -1.851165771484375, -1.77301025390625, -1.694854736328125, -1.61669921875, -1.538543701171875, -1.46038818359375, -1.382232666015625, -1.3040771484375, -1.225921630859375, -1.14776611328125, -1.069610595703125, -0.991455078125, -0.913299560546875, -0.83514404296875, -0.756988525390625, -0.6788330078125, -0.600677490234375, -0.52252197265625, -0.444366455078125, -0.3662109375, -0.288055419921875, -0.20989990234375, -0.131744384765625, -0.0535888671875, 0.024566650390625, 0.10272216796875, 0.180877685546875, 0.259033203125, 0.337188720703125, 0.41534423828125, 0.493499755859375, 0.5716552734375, 0.649810791015625, 0.72796630859375, 0.806121826171875, 0.88427734375, 0.962432861328125, 1.04058837890625, 1.118743896484375, 1.1968994140625, 1.275054931640625, 1.35321044921875, 1.431365966796875, 1.509521484375, 1.587677001953125, 1.66583251953125, 1.743988037109375, 1.8221435546875, 1.900299072265625, 1.97845458984375, 2.056610107421875, 2.134765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 8.0, 13.0, 23.0, 35.0, 42.0, 85.0, 168.0, 373.0, 1198.0, 4844.0, 35516.0, 877468.0, 116884.0, 8941.0, 1988.0, 518.0, 192.0, 103.0, 54.0, 34.0, 24.0, 12.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8681640625, -1.8030242919921875, -1.737884521484375, -1.6727447509765625, -1.60760498046875, -1.5424652099609375, -1.477325439453125, -1.4121856689453125, -1.3470458984375, -1.2819061279296875, -1.216766357421875, -1.1516265869140625, -1.08648681640625, -1.0213470458984375, -0.956207275390625, -0.8910675048828125, -0.825927734375, -0.7607879638671875, -0.695648193359375, -0.6305084228515625, -0.56536865234375, -0.5002288818359375, -0.435089111328125, -0.3699493408203125, -0.3048095703125, -0.2396697998046875, -0.174530029296875, -0.1093902587890625, -0.04425048828125, 0.0208892822265625, 0.086029052734375, 0.1511688232421875, 0.21630859375, 0.2814483642578125, 0.346588134765625, 0.4117279052734375, 0.47686767578125, 0.5420074462890625, 0.607147216796875, 0.6722869873046875, 0.7374267578125, 0.8025665283203125, 0.867706298828125, 0.9328460693359375, 0.99798583984375, 1.0631256103515625, 1.128265380859375, 1.1934051513671875, 1.258544921875, 1.3236846923828125, 1.388824462890625, 1.4539642333984375, 1.51910400390625, 1.5842437744140625, 1.649383544921875, 1.7145233154296875, 1.7796630859375, 1.8448028564453125, 1.909942626953125, 1.9750823974609375, 2.04022216796875, 2.1053619384765625, 2.170501708984375, 2.2356414794921875, 2.30078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 10.0, 30.0, 24.0, 66.0, 107.0, 158.0, 182.0, 167.0, 110.0, 68.0, 26.0, 18.0, 10.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003380775451660156, -0.00033030658960342407, -0.0003225356340408325, -0.00031476467847824097, -0.0003069937229156494, -0.00029922276735305786, -0.0002914518117904663, -0.00028368085622787476, -0.0002759099006652832, -0.00026813894510269165, -0.0002603679895401001, -0.00025259703397750854, -0.000244826078414917, -0.00023705512285232544, -0.0002292841672897339, -0.00022151321172714233, -0.00021374225616455078, -0.00020597130060195923, -0.00019820034503936768, -0.00019042938947677612, -0.00018265843391418457, -0.00017488747835159302, -0.00016711652278900146, -0.0001593455672264099, -0.00015157461166381836, -0.0001438036561012268, -0.00013603270053863525, -0.0001282617449760437, -0.00012049078941345215, -0.0001127198338508606, -0.00010494887828826904, -9.717792272567749e-05, -8.940696716308594e-05, -8.163601160049438e-05, -7.386505603790283e-05, -6.609410047531128e-05, -5.8323144912719727e-05, -5.0552189350128174e-05, -4.278123378753662e-05, -3.501027822494507e-05, -2.7239322662353516e-05, -1.9468367099761963e-05, -1.169741153717041e-05, -3.926455974578857e-06, 3.844499588012695e-06, 1.1615455150604248e-05, 1.93864107131958e-05, 2.7157366275787354e-05, 3.4928321838378906e-05, 4.269927740097046e-05, 5.047023296356201e-05, 5.8241188526153564e-05, 6.601214408874512e-05, 7.378309965133667e-05, 8.155405521392822e-05, 8.932501077651978e-05, 9.709596633911133e-05, 0.00010486692190170288, 0.00011263787746429443, 0.00012040883302688599, 0.00012817978858947754, 0.0001359507441520691, 0.00014372169971466064, 0.0001514926552772522, 0.00015926361083984375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 6.0, 12.0, 18.0, 20.0, 34.0, 57.0, 58.0, 117.0, 199.0, 447.0, 1229.0, 4327.0, 23546.0, 599909.0, 394944.0, 18061.0, 3575.0, 1099.0, 398.0, 161.0, 98.0, 90.0, 46.0, 23.0, 16.0, 13.0, 11.0, 10.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.15625, -2.10357666015625, -2.0509033203125, -1.99822998046875, -1.945556640625, -1.89288330078125, -1.8402099609375, -1.78753662109375, -1.73486328125, -1.68218994140625, -1.6295166015625, -1.57684326171875, -1.524169921875, -1.47149658203125, -1.4188232421875, -1.36614990234375, -1.3134765625, -1.26080322265625, -1.2081298828125, -1.15545654296875, -1.102783203125, -1.05010986328125, -0.9974365234375, -0.94476318359375, -0.89208984375, -0.83941650390625, -0.7867431640625, -0.73406982421875, -0.681396484375, -0.62872314453125, -0.5760498046875, -0.52337646484375, -0.470703125, -0.41802978515625, -0.3653564453125, -0.31268310546875, -0.260009765625, -0.20733642578125, -0.1546630859375, -0.10198974609375, -0.04931640625, 0.00335693359375, 0.0560302734375, 0.10870361328125, 0.161376953125, 0.21405029296875, 0.2667236328125, 0.31939697265625, 0.3720703125, 0.42474365234375, 0.4774169921875, 0.53009033203125, 0.582763671875, 0.63543701171875, 0.6881103515625, 0.74078369140625, 0.79345703125, 0.84613037109375, 0.8988037109375, 0.95147705078125, 1.004150390625, 1.05682373046875, 1.1094970703125, 1.16217041015625, 1.21484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 8.0, 9.0, 6.0, 15.0, 27.0, 83.0, 142.0, 191.0, 177.0, 136.0, 89.0, 49.0, 30.0, 12.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.337890625, -3.266998291015625, -3.19610595703125, -3.125213623046875, -3.0543212890625, -2.983428955078125, -2.91253662109375, -2.841644287109375, -2.770751953125, -2.699859619140625, -2.62896728515625, -2.558074951171875, -2.4871826171875, -2.416290283203125, -2.34539794921875, -2.274505615234375, -2.20361328125, -2.132720947265625, -2.06182861328125, -1.990936279296875, -1.9200439453125, -1.849151611328125, -1.77825927734375, -1.707366943359375, -1.636474609375, -1.565582275390625, -1.49468994140625, -1.423797607421875, -1.3529052734375, -1.282012939453125, -1.21112060546875, -1.140228271484375, -1.0693359375, -0.998443603515625, -0.92755126953125, -0.856658935546875, -0.7857666015625, -0.714874267578125, -0.64398193359375, -0.573089599609375, -0.502197265625, -0.431304931640625, -0.36041259765625, -0.289520263671875, -0.2186279296875, -0.147735595703125, -0.07684326171875, -0.005950927734375, 0.06494140625, 0.135833740234375, 0.20672607421875, 0.277618408203125, 0.3485107421875, 0.419403076171875, 0.49029541015625, 0.561187744140625, 0.632080078125, 0.702972412109375, 0.77386474609375, 0.844757080078125, 0.9156494140625, 0.986541748046875, 1.05743408203125, 1.128326416015625, 1.19921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 9.0, 14.0, 38.0, 87.0, 169.0, 237.0, 192.0, 149.0, 55.0, 26.0, 16.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.055191040039062, -18.141637802124023, -17.228084564208984, -16.314531326293945, -15.400978088378906, -14.487424850463867, -13.573872566223145, -12.660319328308105, -11.746766090393066, -10.833212852478027, -9.919659614562988, -9.006107330322266, -8.092554092407227, -7.179000377655029, -6.265447616577148, -5.351894378662109, -4.43834114074707, -3.5247879028320312, -2.6112349033355713, -1.6976819038391113, -0.7841286659240723, 0.1294245719909668, 1.0429773330688477, 1.9565305709838867, 2.870083808898926, 3.783637046813965, 4.697190284729004, 5.610743045806885, 6.524296283721924, 7.437849521636963, 8.351402282714844, 9.264955520629883, 10.178508758544922, 11.092061996459961, 12.005615234375, 12.919168472290039, 13.832721710205078, 14.746274948120117, 15.65982723236084, 16.573379516601562, 17.486934661865234, 18.400487899780273, 19.314041137695312, 20.22759437561035, 21.14114761352539, 22.05470085144043, 22.96825408935547, 23.881805419921875, 24.795358657836914, 25.708911895751953, 26.622465133666992, 27.53601837158203, 28.44957160949707, 29.36312484741211, 30.276676177978516, 31.190231323242188, 32.103782653808594, 33.017333984375, 33.93088912963867, 34.84444046020508, 35.75799560546875, 36.671546936035156, 37.58510208129883, 38.498653411865234, 39.412208557128906]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 5.0, 14.0, 11.0, 11.0, 9.0, 21.0, 16.0, 30.0, 39.0, 30.0, 34.0, 38.0, 54.0, 59.0, 43.0, 51.0, 57.0, 50.0, 42.0, 53.0, 33.0, 41.0, 41.0, 23.0, 28.0, 24.0, 33.0, 24.0, 19.0, 14.0, 15.0, 5.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.899551391601562, -11.535235404968262, -11.170919418334961, -10.806602478027344, -10.442286491394043, -10.077970504760742, -9.713654518127441, -9.34933853149414, -8.985021591186523, -8.620705604553223, -8.256389617919922, -7.892073154449463, -7.527756690979004, -7.163440704345703, -6.799124717712402, -6.434808731079102, -6.070492744445801, -5.7061767578125, -5.341860294342041, -4.97754430770874, -4.613227844238281, -4.2489118576049805, -3.8845958709716797, -3.5202796459198, -3.15596342086792, -2.79164719581604, -2.42733097076416, -2.0630149841308594, -1.6986987590789795, -1.3343825340270996, -0.9700665473937988, -0.605750322341919, -0.24143505096435547, 0.12288111448287964, 0.48719727993011475, 0.8515133857727051, 1.215829610824585, 1.5801458358764648, 1.9444618225097656, 2.3087780475616455, 2.6730942726135254, 3.0374104976654053, 3.401726722717285, 3.766042709350586, 4.130358695983887, 4.494675159454346, 4.8589911460876465, 5.2233076095581055, 5.587623596191406, 5.951939582824707, 6.316256046295166, 6.680572032928467, 7.044888496398926, 7.409204483032227, 7.773520469665527, 8.137836456298828, 8.502153396606445, 8.866469383239746, 9.230785369873047, 9.595102310180664, 9.959418296813965, 10.323734283447266, 10.688050270080566, 11.052366256713867, 11.416682243347168]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 9.0, 11.0, 17.0, 25.0, 47.0, 43.0, 74.0, 142.0, 196.0, 400.0, 759.0, 1438.0, 3298.0, 9382.0, 54131.0, 4095279.0, 19096.0, 5416.0, 2199.0, 1022.0, 500.0, 298.0, 172.0, 114.0, 74.0, 45.0, 32.0, 16.0, 19.0, 14.0, 1.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.248046875, -2.168487548828125, -2.08892822265625, -2.009368896484375, -1.9298095703125, -1.850250244140625, -1.77069091796875, -1.691131591796875, -1.611572265625, -1.532012939453125, -1.45245361328125, -1.372894287109375, -1.2933349609375, -1.213775634765625, -1.13421630859375, -1.054656982421875, -0.97509765625, -0.895538330078125, -0.81597900390625, -0.736419677734375, -0.6568603515625, -0.577301025390625, -0.49774169921875, -0.418182373046875, -0.338623046875, -0.259063720703125, -0.17950439453125, -0.099945068359375, -0.0203857421875, 0.059173583984375, 0.13873291015625, 0.218292236328125, 0.2978515625, 0.377410888671875, 0.45697021484375, 0.536529541015625, 0.6160888671875, 0.695648193359375, 0.77520751953125, 0.854766845703125, 0.934326171875, 1.013885498046875, 1.09344482421875, 1.173004150390625, 1.2525634765625, 1.332122802734375, 1.41168212890625, 1.491241455078125, 1.57080078125, 1.650360107421875, 1.72991943359375, 1.809478759765625, 1.8890380859375, 1.968597412109375, 2.04815673828125, 2.127716064453125, 2.207275390625, 2.286834716796875, 2.36639404296875, 2.445953369140625, 2.5255126953125, 2.605072021484375, 2.68463134765625, 2.764190673828125, 2.84375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 7.0, 7.0, 10.0, 17.0, 24.0, 35.0, 34.0, 50.0, 80.0, 79.0, 108.0, 108.0, 98.0, 81.0, 73.0, 59.0, 45.0, 33.0, 22.0, 17.0, 5.0, 3.0, 3.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0107421875, -0.9796981811523438, -0.9486541748046875, -0.9176101684570312, -0.886566162109375, -0.8555221557617188, -0.8244781494140625, -0.7934341430664062, -0.76239013671875, -0.7313461303710938, -0.7003021240234375, -0.6692581176757812, -0.638214111328125, -0.6071701049804688, -0.5761260986328125, -0.5450820922851562, -0.5140380859375, -0.48299407958984375, -0.4519500732421875, -0.42090606689453125, -0.389862060546875, -0.35881805419921875, -0.3277740478515625, -0.29673004150390625, -0.26568603515625, -0.23464202880859375, -0.2035980224609375, -0.17255401611328125, -0.141510009765625, -0.11046600341796875, -0.0794219970703125, -0.04837799072265625, -0.017333984375, 0.01371002197265625, 0.0447540283203125, 0.07579803466796875, 0.106842041015625, 0.13788604736328125, 0.1689300537109375, 0.19997406005859375, 0.23101806640625, 0.26206207275390625, 0.2931060791015625, 0.32415008544921875, 0.355194091796875, 0.38623809814453125, 0.4172821044921875, 0.44832611083984375, 0.4793701171875, 0.5104141235351562, 0.5414581298828125, 0.5725021362304688, 0.603546142578125, 0.6345901489257812, 0.6656341552734375, 0.6966781616210938, 0.72772216796875, 0.7587661743164062, 0.7898101806640625, 0.8208541870117188, 0.851898193359375, 0.8829421997070312, 0.9139862060546875, 0.9450302124023438, 0.97607421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 10.0, 9.0, 11.0, 33.0, 35.0, 71.0, 74.0, 104.0, 177.0, 252.0, 471.0, 1065.0, 2525.0, 7156.0, 29387.0, 4053305.0, 79791.0, 12600.0, 3941.0, 1520.0, 723.0, 340.0, 203.0, 133.0, 100.0, 68.0, 50.0, 42.0, 29.0, 17.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.984375, -2.9052734375, -2.826171875, -2.7470703125, -2.66796875, -2.5888671875, -2.509765625, -2.4306640625, -2.3515625, -2.2724609375, -2.193359375, -2.1142578125, -2.03515625, -1.9560546875, -1.876953125, -1.7978515625, -1.71875, -1.6396484375, -1.560546875, -1.4814453125, -1.40234375, -1.3232421875, -1.244140625, -1.1650390625, -1.0859375, -1.0068359375, -0.927734375, -0.8486328125, -0.76953125, -0.6904296875, -0.611328125, -0.5322265625, -0.453125, -0.3740234375, -0.294921875, -0.2158203125, -0.13671875, -0.0576171875, 0.021484375, 0.1005859375, 0.1796875, 0.2587890625, 0.337890625, 0.4169921875, 0.49609375, 0.5751953125, 0.654296875, 0.7333984375, 0.8125, 0.8916015625, 0.970703125, 1.0498046875, 1.12890625, 1.2080078125, 1.287109375, 1.3662109375, 1.4453125, 1.5244140625, 1.603515625, 1.6826171875, 1.76171875, 1.8408203125, 1.919921875, 1.9990234375, 2.078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 13.0, 15.0, 30.0, 66.0, 3743.0, 104.0, 42.0, 22.0, 14.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393310546875, -0.3697242736816406, -0.34613800048828125, -0.3225517272949219, -0.2989654541015625, -0.2753791809082031, -0.25179290771484375, -0.22820663452148438, -0.204620361328125, -0.18103408813476562, -0.15744781494140625, -0.13386154174804688, -0.1102752685546875, -0.08668899536132812, -0.06310272216796875, -0.039516448974609375, -0.01593017578125, 0.007656097412109375, 0.03124237060546875, 0.054828643798828125, 0.0784149169921875, 0.10200119018554688, 0.12558746337890625, 0.14917373657226562, 0.172760009765625, 0.19634628295898438, 0.21993255615234375, 0.24351882934570312, 0.2671051025390625, 0.2906913757324219, 0.31427764892578125, 0.3378639221191406, 0.3614501953125, 0.3850364685058594, 0.40862274169921875, 0.4322090148925781, 0.4557952880859375, 0.4793815612792969, 0.5029678344726562, 0.5265541076660156, 0.550140380859375, 0.5737266540527344, 0.5973129272460938, 0.6208992004394531, 0.6444854736328125, 0.6680717468261719, 0.6916580200195312, 0.7152442932128906, 0.73883056640625, 0.7624168395996094, 0.7860031127929688, 0.8095893859863281, 0.8331756591796875, 0.8567619323730469, 0.8803482055664062, 0.9039344787597656, 0.927520751953125, 0.9511070251464844, 0.9746932983398438, 0.9982795715332031, 1.0218658447265625, 1.0454521179199219, 1.0690383911132812, 1.0926246643066406, 1.1162109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 13.0, 37.0, 140.0, 343.0, 275.0, 138.0, 43.0, 20.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.988763332366943, -5.83800745010376, -5.687251567840576, -5.536495685577393, -5.385740280151367, -5.234984397888184, -5.084228515625, -4.933472633361816, -4.782716751098633, -4.631960868835449, -4.481204986572266, -4.330449104309082, -4.179693222045898, -4.028937816619873, -3.8781819343566895, -3.727426052093506, -3.5766701698303223, -3.4259142875671387, -3.275158405303955, -3.1244027614593506, -2.973646879196167, -2.8228909969329834, -2.672135353088379, -2.5213794708251953, -2.3706235885620117, -2.219867706298828, -2.0691118240356445, -1.91835618019104, -1.7676002979278564, -1.6168444156646729, -1.4660886526107788, -1.3153328895568848, -1.164576530456543, -1.0138206481933594, -0.8630648851394653, -0.7123090624809265, -0.5615532398223877, -0.4107974171638489, -0.26004159450531006, -0.10928583145141602, 0.04147005081176758, 0.1922258734703064, 0.3429816961288452, 0.49373751878738403, 0.6444933414459229, 0.7952491641044617, 0.9460049867630005, 1.0967607498168945, 1.2475166320800781, 1.3982725143432617, 1.5490282773971558, 1.6997840404510498, 1.8505399227142334, 2.001295804977417, 2.1520514488220215, 2.302807331085205, 2.4535632133483887, 2.6043190956115723, 2.755074977874756, 2.9058306217193604, 3.056586503982544, 3.2073423862457275, 3.358098030090332, 3.5088539123535156, 3.659609794616699]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 4.0, 8.0, 6.0, 14.0, 6.0, 11.0, 23.0, 21.0, 27.0, 29.0, 17.0, 45.0, 43.0, 40.0, 39.0, 41.0, 38.0, 44.0, 42.0, 34.0, 39.0, 33.0, 46.0, 33.0, 41.0, 40.0, 27.0, 25.0, 27.0, 26.0, 20.0, 25.0, 17.0, 11.0, 12.0, 6.0, 11.0, 7.0, 8.0, 2.0, 2.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.998574435710907, -0.9680328369140625, -0.9374912977218628, -0.9069497585296631, -0.8764081597328186, -0.8458665609359741, -0.8153250217437744, -0.7847834825515747, -0.7542418837547302, -0.7237002849578857, -0.693158745765686, -0.6626172065734863, -0.6320756077766418, -0.6015340089797974, -0.5709924697875977, -0.540450930595398, -0.5099093317985535, -0.47936776280403137, -0.4488261938095093, -0.4182846248149872, -0.3877430558204651, -0.357201486825943, -0.3266599178314209, -0.2961183488368988, -0.2655767798423767, -0.23503521084785461, -0.20449364185333252, -0.17395207285881042, -0.14341050386428833, -0.11286893486976624, -0.08232736587524414, -0.051785796880722046, -0.02124422788619995, 0.009297341108322144, 0.03983891010284424, 0.07038047909736633, 0.10092204809188843, 0.13146361708641052, 0.16200518608093262, 0.1925467550754547, 0.2230883240699768, 0.2536298930644989, 0.284171462059021, 0.3147130310535431, 0.3452546000480652, 0.3757961690425873, 0.4063377380371094, 0.43687930703163147, 0.46742087602615356, 0.49796244502067566, 0.5285040140151978, 0.5590455532073975, 0.5895871520042419, 0.6201287508010864, 0.6506702899932861, 0.6812118291854858, 0.7117534279823303, 0.7422950267791748, 0.7728365659713745, 0.8033781051635742, 0.8339197039604187, 0.8644613027572632, 0.8950028419494629, 0.9255443811416626, 0.9560859799385071]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 11.0, 9.0, 33.0, 35.0, 53.0, 91.0, 193.0, 352.0, 746.0, 1516.0, 3649.0, 10522.0, 37583.0, 176774.0, 519201.0, 229328.0, 47665.0, 12790.0, 4449.0, 1823.0, 815.0, 410.0, 195.0, 132.0, 65.0, 36.0, 17.0, 22.0, 10.0, 10.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.0996246337890625, -2.035186767578125, -1.9707489013671875, -1.90631103515625, -1.8418731689453125, -1.777435302734375, -1.7129974365234375, -1.6485595703125, -1.5841217041015625, -1.519683837890625, -1.4552459716796875, -1.39080810546875, -1.3263702392578125, -1.261932373046875, -1.1974945068359375, -1.133056640625, -1.0686187744140625, -1.004180908203125, -0.9397430419921875, -0.87530517578125, -0.8108673095703125, -0.746429443359375, -0.6819915771484375, -0.6175537109375, -0.5531158447265625, -0.488677978515625, -0.4242401123046875, -0.35980224609375, -0.2953643798828125, -0.230926513671875, -0.1664886474609375, -0.10205078125, -0.0376129150390625, 0.026824951171875, 0.0912628173828125, 0.15570068359375, 0.2201385498046875, 0.284576416015625, 0.3490142822265625, 0.4134521484375, 0.4778900146484375, 0.542327880859375, 0.6067657470703125, 0.67120361328125, 0.7356414794921875, 0.800079345703125, 0.8645172119140625, 0.928955078125, 0.9933929443359375, 1.057830810546875, 1.1222686767578125, 1.18670654296875, 1.2511444091796875, 1.315582275390625, 1.3800201416015625, 1.4444580078125, 1.5088958740234375, 1.573333740234375, 1.6377716064453125, 1.70220947265625, 1.7666473388671875, 1.831085205078125, 1.8955230712890625, 1.9599609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 11.0, 13.0, 6.0, 18.0, 25.0, 39.0, 45.0, 62.0, 75.0, 89.0, 92.0, 104.0, 94.0, 70.0, 69.0, 62.0, 37.0, 29.0, 25.0, 14.0, 10.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.0931854248046875, -1.060394287109375, -1.0276031494140625, -0.99481201171875, -0.9620208740234375, -0.929229736328125, -0.8964385986328125, -0.8636474609375, -0.8308563232421875, -0.798065185546875, -0.7652740478515625, -0.73248291015625, -0.6996917724609375, -0.666900634765625, -0.6341094970703125, -0.601318359375, -0.5685272216796875, -0.535736083984375, -0.5029449462890625, -0.47015380859375, -0.4373626708984375, -0.404571533203125, -0.3717803955078125, -0.3389892578125, -0.3061981201171875, -0.273406982421875, -0.2406158447265625, -0.20782470703125, -0.1750335693359375, -0.142242431640625, -0.1094512939453125, -0.07666015625, -0.0438690185546875, -0.011077880859375, 0.0217132568359375, 0.05450439453125, 0.0872955322265625, 0.120086669921875, 0.1528778076171875, 0.1856689453125, 0.2184600830078125, 0.251251220703125, 0.2840423583984375, 0.31683349609375, 0.3496246337890625, 0.382415771484375, 0.4152069091796875, 0.447998046875, 0.4807891845703125, 0.513580322265625, 0.5463714599609375, 0.57916259765625, 0.6119537353515625, 0.644744873046875, 0.6775360107421875, 0.7103271484375, 0.7431182861328125, 0.775909423828125, 0.8087005615234375, 0.84149169921875, 0.8742828369140625, 0.907073974609375, 0.9398651123046875, 0.97265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 11.0, 21.0, 23.0, 53.0, 85.0, 169.0, 262.0, 532.0, 1233.0, 3648.0, 18914.0, 259042.0, 701770.0, 52358.0, 6961.0, 1917.0, 739.0, 335.0, 214.0, 108.0, 54.0, 39.0, 27.0, 17.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.296875, -3.1976318359375, -3.098388671875, -2.9991455078125, -2.89990234375, -2.8006591796875, -2.701416015625, -2.6021728515625, -2.5029296875, -2.4036865234375, -2.304443359375, -2.2052001953125, -2.10595703125, -2.0067138671875, -1.907470703125, -1.8082275390625, -1.708984375, -1.6097412109375, -1.510498046875, -1.4112548828125, -1.31201171875, -1.2127685546875, -1.113525390625, -1.0142822265625, -0.9150390625, -0.8157958984375, -0.716552734375, -0.6173095703125, -0.51806640625, -0.4188232421875, -0.319580078125, -0.2203369140625, -0.12109375, -0.0218505859375, 0.077392578125, 0.1766357421875, 0.27587890625, 0.3751220703125, 0.474365234375, 0.5736083984375, 0.6728515625, 0.7720947265625, 0.871337890625, 0.9705810546875, 1.06982421875, 1.1690673828125, 1.268310546875, 1.3675537109375, 1.466796875, 1.5660400390625, 1.665283203125, 1.7645263671875, 1.86376953125, 1.9630126953125, 2.062255859375, 2.1614990234375, 2.2607421875, 2.3599853515625, 2.459228515625, 2.5584716796875, 2.65771484375, 2.7569580078125, 2.856201171875, 2.9554443359375, 3.0546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 8.0, 3.0, 12.0, 13.0, 13.0, 21.0, 23.0, 26.0, 26.0, 44.0, 47.0, 51.0, 55.0, 56.0, 50.0, 44.0, 68.0, 63.0, 50.0, 55.0, 38.0, 46.0, 30.0, 35.0, 27.0, 15.0, 18.0, 10.0, 16.0, 11.0, 6.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.703125, -2.607452392578125, -2.51177978515625, -2.416107177734375, -2.3204345703125, -2.224761962890625, -2.12908935546875, -2.033416748046875, -1.937744140625, -1.842071533203125, -1.74639892578125, -1.650726318359375, -1.5550537109375, -1.459381103515625, -1.36370849609375, -1.268035888671875, -1.17236328125, -1.076690673828125, -0.98101806640625, -0.885345458984375, -0.7896728515625, -0.694000244140625, -0.59832763671875, -0.502655029296875, -0.406982421875, -0.311309814453125, -0.21563720703125, -0.119964599609375, -0.0242919921875, 0.071380615234375, 0.16705322265625, 0.262725830078125, 0.3583984375, 0.454071044921875, 0.54974365234375, 0.645416259765625, 0.7410888671875, 0.836761474609375, 0.93243408203125, 1.028106689453125, 1.123779296875, 1.219451904296875, 1.31512451171875, 1.410797119140625, 1.5064697265625, 1.602142333984375, 1.69781494140625, 1.793487548828125, 1.88916015625, 1.984832763671875, 2.08050537109375, 2.176177978515625, 2.2718505859375, 2.367523193359375, 2.46319580078125, 2.558868408203125, 2.654541015625, 2.750213623046875, 2.84588623046875, 2.941558837890625, 3.0372314453125, 3.132904052734375, 3.22857666015625, 3.324249267578125, 3.419921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 4.0, 5.0, 10.0, 15.0, 21.0, 51.0, 82.0, 176.0, 428.0, 1141.0, 4139.0, 35126.0, 930754.0, 68601.0, 5718.0, 1398.0, 468.0, 193.0, 99.0, 50.0, 23.0, 15.0, 16.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.255859375, -3.1756591796875, -3.095458984375, -3.0152587890625, -2.93505859375, -2.8548583984375, -2.774658203125, -2.6944580078125, -2.6142578125, -2.5340576171875, -2.453857421875, -2.3736572265625, -2.29345703125, -2.2132568359375, -2.133056640625, -2.0528564453125, -1.97265625, -1.8924560546875, -1.812255859375, -1.7320556640625, -1.65185546875, -1.5716552734375, -1.491455078125, -1.4112548828125, -1.3310546875, -1.2508544921875, -1.170654296875, -1.0904541015625, -1.01025390625, -0.9300537109375, -0.849853515625, -0.7696533203125, -0.689453125, -0.6092529296875, -0.529052734375, -0.4488525390625, -0.36865234375, -0.2884521484375, -0.208251953125, -0.1280517578125, -0.0478515625, 0.0323486328125, 0.112548828125, 0.1927490234375, 0.27294921875, 0.3531494140625, 0.433349609375, 0.5135498046875, 0.59375, 0.6739501953125, 0.754150390625, 0.8343505859375, 0.91455078125, 0.9947509765625, 1.074951171875, 1.1551513671875, 1.2353515625, 1.3155517578125, 1.395751953125, 1.4759521484375, 1.55615234375, 1.6363525390625, 1.716552734375, 1.7967529296875, 1.876953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 9.0, 7.0, 24.0, 43.0, 70.0, 137.0, 204.0, 207.0, 135.0, 84.0, 36.0, 16.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000324249267578125, -0.00031340867280960083, -0.00030256807804107666, -0.0002917274832725525, -0.0002808868885040283, -0.00027004629373550415, -0.00025920569896698, -0.0002483651041984558, -0.00023752450942993164, -0.00022668391466140747, -0.0002158433198928833, -0.00020500272512435913, -0.00019416213035583496, -0.0001833215355873108, -0.00017248094081878662, -0.00016164034605026245, -0.00015079975128173828, -0.0001399591565132141, -0.00012911856174468994, -0.00011827796697616577, -0.0001074373722076416, -9.659677743911743e-05, -8.575618267059326e-05, -7.491558790206909e-05, -6.407499313354492e-05, -5.323439836502075e-05, -4.239380359649658e-05, -3.155320882797241e-05, -2.0712614059448242e-05, -9.872019290924072e-06, 9.685754776000977e-07, 1.1809170246124268e-05, 2.2649765014648438e-05, 3.349035978317261e-05, 4.433095455169678e-05, 5.517154932022095e-05, 6.601214408874512e-05, 7.685273885726929e-05, 8.769333362579346e-05, 9.853392839431763e-05, 0.0001093745231628418, 0.00012021511793136597, 0.00013105571269989014, 0.0001418963074684143, 0.00015273690223693848, 0.00016357749700546265, 0.00017441809177398682, 0.00018525868654251099, 0.00019609928131103516, 0.00020693987607955933, 0.0002177804708480835, 0.00022862106561660767, 0.00023946166038513184, 0.000250302255153656, 0.0002611428499221802, 0.00027198344469070435, 0.0002828240394592285, 0.0002936646342277527, 0.00030450522899627686, 0.000315345823764801, 0.0003261864185333252, 0.00033702701330184937, 0.00034786760807037354, 0.0003587082028388977, 0.0003695487976074219]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 11.0, 14.0, 18.0, 14.0, 30.0, 39.0, 83.0, 107.0, 176.0, 288.0, 488.0, 924.0, 1735.0, 3686.0, 9150.0, 35437.0, 422761.0, 515914.0, 39976.0, 9954.0, 3828.0, 1683.0, 935.0, 491.0, 269.0, 184.0, 113.0, 75.0, 42.0, 41.0, 25.0, 12.0, 8.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.515625, -1.474700927734375, -1.43377685546875, -1.392852783203125, -1.3519287109375, -1.311004638671875, -1.27008056640625, -1.229156494140625, -1.188232421875, -1.147308349609375, -1.10638427734375, -1.065460205078125, -1.0245361328125, -0.983612060546875, -0.94268798828125, -0.901763916015625, -0.86083984375, -0.819915771484375, -0.77899169921875, -0.738067626953125, -0.6971435546875, -0.656219482421875, -0.61529541015625, -0.574371337890625, -0.533447265625, -0.492523193359375, -0.45159912109375, -0.410675048828125, -0.3697509765625, -0.328826904296875, -0.28790283203125, -0.246978759765625, -0.2060546875, -0.165130615234375, -0.12420654296875, -0.083282470703125, -0.0423583984375, -0.001434326171875, 0.03948974609375, 0.080413818359375, 0.121337890625, 0.162261962890625, 0.20318603515625, 0.244110107421875, 0.2850341796875, 0.325958251953125, 0.36688232421875, 0.407806396484375, 0.44873046875, 0.489654541015625, 0.53057861328125, 0.571502685546875, 0.6124267578125, 0.653350830078125, 0.69427490234375, 0.735198974609375, 0.776123046875, 0.817047119140625, 0.85797119140625, 0.898895263671875, 0.9398193359375, 0.980743408203125, 1.02166748046875, 1.062591552734375, 1.103515625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 4.0, 4.0, 6.0, 11.0, 14.0, 36.0, 65.0, 137.0, 171.0, 203.0, 142.0, 77.0, 47.0, 15.0, 6.0, 14.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37109375, -2.28717041015625, -2.2032470703125, -2.11932373046875, -2.035400390625, -1.95147705078125, -1.8675537109375, -1.78363037109375, -1.69970703125, -1.61578369140625, -1.5318603515625, -1.44793701171875, -1.364013671875, -1.28009033203125, -1.1961669921875, -1.11224365234375, -1.0283203125, -0.94439697265625, -0.8604736328125, -0.77655029296875, -0.692626953125, -0.60870361328125, -0.5247802734375, -0.44085693359375, -0.35693359375, -0.27301025390625, -0.1890869140625, -0.10516357421875, -0.021240234375, 0.06268310546875, 0.1466064453125, 0.23052978515625, 0.314453125, 0.39837646484375, 0.4822998046875, 0.56622314453125, 0.650146484375, 0.73406982421875, 0.8179931640625, 0.90191650390625, 0.98583984375, 1.06976318359375, 1.1536865234375, 1.23760986328125, 1.321533203125, 1.40545654296875, 1.4893798828125, 1.57330322265625, 1.6572265625, 1.74114990234375, 1.8250732421875, 1.90899658203125, 1.992919921875, 2.07684326171875, 2.1607666015625, 2.24468994140625, 2.32861328125, 2.41253662109375, 2.4964599609375, 2.58038330078125, 2.664306640625, 2.74822998046875, 2.8321533203125, 2.91607666015625, 3.0]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 11.0, 20.0, 28.0, 64.0, 106.0, 138.0, 144.0, 143.0, 118.0, 78.0, 63.0, 36.0, 32.0, 11.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.128128051757812, -23.487226486206055, -22.846324920654297, -22.20542335510254, -21.56452178955078, -20.923620223999023, -20.282718658447266, -19.641815185546875, -19.00091552734375, -18.360013961791992, -17.719112396240234, -17.078210830688477, -16.43730926513672, -15.796407699584961, -15.155505180358887, -14.514603614807129, -13.873701095581055, -13.232799530029297, -12.591897964477539, -11.950996398925781, -11.310094833374023, -10.669193267822266, -10.028290748596191, -9.387389183044434, -8.746487617492676, -8.105586051940918, -7.46468448638916, -6.823782444000244, -6.182880878448486, -5.5419793128967285, -4.9010772705078125, -4.260175704956055, -3.619274139404297, -2.978372573852539, -2.337470769882202, -1.6965690851211548, -1.0556674003601074, -0.4147658348083496, 0.2261359691619873, 0.8670377731323242, 1.507939338684082, 2.14884090423584, 2.7897427082061768, 3.4306445121765137, 4.0715460777282715, 4.712447643280029, 5.353349685668945, 5.994251251220703, 6.635152816772461, 7.276054382324219, 7.916955947875977, 8.557857513427734, 9.198759078979492, 9.83966064453125, 10.480563163757324, 11.121464729309082, 11.76236629486084, 12.403267860412598, 13.044169425964355, 13.685070991516113, 14.325973510742188, 14.966875076293945, 15.607776641845703, 16.24867820739746, 16.88957977294922]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 5.0, 3.0, 7.0, 9.0, 10.0, 14.0, 13.0, 18.0, 15.0, 21.0, 32.0, 36.0, 31.0, 19.0, 34.0, 23.0, 53.0, 36.0, 43.0, 39.0, 51.0, 43.0, 31.0, 34.0, 37.0, 43.0, 31.0, 32.0, 29.0, 19.0, 16.0, 27.0, 27.0, 14.0, 13.0, 19.0, 12.0, 13.0, 14.0, 8.0, 4.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.500033378601074, -12.127107620239258, -11.754181861877441, -11.381256103515625, -11.008330345153809, -10.635404586791992, -10.26247787475586, -9.88955307006836, -9.516626358032227, -9.14370059967041, -8.770774841308594, -8.397849082946777, -8.024923324584961, -7.6519975662231445, -7.27907133102417, -6.9061455726623535, -6.533220291137695, -6.160294532775879, -5.7873687744140625, -5.414443016052246, -5.04151725769043, -4.668591499328613, -4.295665264129639, -3.9227395057678223, -3.549813747406006, -3.1768879890441895, -2.803962230682373, -2.4310362339019775, -2.058110475540161, -1.6851847171783447, -1.3122587203979492, -0.9393329620361328, -0.5664081573486328, -0.19348233938217163, 0.17944347858428955, 0.5523693561553955, 0.9252951145172119, 1.2982208728790283, 1.6711468696594238, 2.0440726280212402, 2.4169983863830566, 2.789924144744873, 3.1628499031066895, 3.535775899887085, 3.9087016582489014, 4.281627655029297, 4.654553413391113, 5.02747917175293, 5.400404930114746, 5.7733306884765625, 6.146256446838379, 6.519182205200195, 6.892107963562012, 7.265033721923828, 7.637959957122803, 8.010885238647461, 8.383811950683594, 8.75673770904541, 9.129663467407227, 9.502589225769043, 9.87551498413086, 10.248440742492676, 10.621366500854492, 10.994293212890625, 11.367218017578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 9.0, 3.0, 3.0, 3.0, 8.0, 7.0, 17.0, 27.0, 24.0, 33.0, 53.0, 78.0, 130.0, 244.0, 352.0, 753.0, 1698.0, 4619.0, 16677.0, 115503.0, 3993591.0, 45691.0, 9351.0, 2974.0, 1166.0, 521.0, 252.0, 152.0, 101.0, 68.0, 43.0, 33.0, 27.0, 18.0, 12.0, 10.0, 3.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.68359375, -2.6053466796875, -2.527099609375, -2.4488525390625, -2.37060546875, -2.2923583984375, -2.214111328125, -2.1358642578125, -2.0576171875, -1.9793701171875, -1.901123046875, -1.8228759765625, -1.74462890625, -1.6663818359375, -1.588134765625, -1.5098876953125, -1.431640625, -1.3533935546875, -1.275146484375, -1.1968994140625, -1.11865234375, -1.0404052734375, -0.962158203125, -0.8839111328125, -0.8056640625, -0.7274169921875, -0.649169921875, -0.5709228515625, -0.49267578125, -0.4144287109375, -0.336181640625, -0.2579345703125, -0.1796875, -0.1014404296875, -0.023193359375, 0.0550537109375, 0.13330078125, 0.2115478515625, 0.289794921875, 0.3680419921875, 0.4462890625, 0.5245361328125, 0.602783203125, 0.6810302734375, 0.75927734375, 0.8375244140625, 0.915771484375, 0.9940185546875, 1.072265625, 1.1505126953125, 1.228759765625, 1.3070068359375, 1.38525390625, 1.4635009765625, 1.541748046875, 1.6199951171875, 1.6982421875, 1.7764892578125, 1.854736328125, 1.9329833984375, 2.01123046875, 2.0894775390625, 2.167724609375, 2.2459716796875, 2.32421875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 6.0, 17.0, 19.0, 25.0, 29.0, 35.0, 48.0, 48.0, 47.0, 47.0, 47.0, 65.0, 59.0, 49.0, 62.0, 53.0, 46.0, 45.0, 41.0, 24.0, 27.0, 22.0, 22.0, 20.0, 10.0, 11.0, 11.0, 6.0, 8.0, 8.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.701171875, -0.6803817749023438, -0.6595916748046875, -0.6388015747070312, -0.618011474609375, -0.5972213745117188, -0.5764312744140625, -0.5556411743164062, -0.53485107421875, -0.5140609741210938, -0.4932708740234375, -0.47248077392578125, -0.451690673828125, -0.43090057373046875, -0.4101104736328125, -0.38932037353515625, -0.3685302734375, -0.34774017333984375, -0.3269500732421875, -0.30615997314453125, -0.285369873046875, -0.26457977294921875, -0.2437896728515625, -0.22299957275390625, -0.20220947265625, -0.18141937255859375, -0.1606292724609375, -0.13983917236328125, -0.119049072265625, -0.09825897216796875, -0.0774688720703125, -0.05667877197265625, -0.035888671875, -0.01509857177734375, 0.0056915283203125, 0.02648162841796875, 0.047271728515625, 0.06806182861328125, 0.0888519287109375, 0.10964202880859375, 0.13043212890625, 0.15122222900390625, 0.1720123291015625, 0.19280242919921875, 0.213592529296875, 0.23438262939453125, 0.2551727294921875, 0.27596282958984375, 0.2967529296875, 0.31754302978515625, 0.3383331298828125, 0.35912322998046875, 0.379913330078125, 0.40070343017578125, 0.4214935302734375, 0.44228363037109375, 0.46307373046875, 0.48386383056640625, 0.5046539306640625, 0.5254440307617188, 0.546234130859375, 0.5670242309570312, 0.5878143310546875, 0.6086044311523438, 0.62939453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 4.0, 7.0, 6.0, 9.0, 11.0, 19.0, 33.0, 32.0, 37.0, 42.0, 64.0, 86.0, 99.0, 156.0, 208.0, 271.0, 530.0, 2414.0, 56787.0, 4120617.0, 10352.0, 1153.0, 383.0, 226.0, 164.0, 133.0, 108.0, 86.0, 62.0, 36.0, 29.0, 26.0, 23.0, 19.0, 12.0, 14.0, 4.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.625, -8.3734130859375, -8.121826171875, -7.8702392578125, -7.61865234375, -7.3670654296875, -7.115478515625, -6.8638916015625, -6.6123046875, -6.3607177734375, -6.109130859375, -5.8575439453125, -5.60595703125, -5.3543701171875, -5.102783203125, -4.8511962890625, -4.599609375, -4.3480224609375, -4.096435546875, -3.8448486328125, -3.59326171875, -3.3416748046875, -3.090087890625, -2.8385009765625, -2.5869140625, -2.3353271484375, -2.083740234375, -1.8321533203125, -1.58056640625, -1.3289794921875, -1.077392578125, -0.8258056640625, -0.57421875, -0.3226318359375, -0.071044921875, 0.1805419921875, 0.43212890625, 0.6837158203125, 0.935302734375, 1.1868896484375, 1.4384765625, 1.6900634765625, 1.941650390625, 2.1932373046875, 2.44482421875, 2.6964111328125, 2.947998046875, 3.1995849609375, 3.451171875, 3.7027587890625, 3.954345703125, 4.2059326171875, 4.45751953125, 4.7091064453125, 4.960693359375, 5.2122802734375, 5.4638671875, 5.7154541015625, 5.967041015625, 6.2186279296875, 6.47021484375, 6.7218017578125, 6.973388671875, 7.2249755859375, 7.4765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 18.0, 28.0, 114.0, 3492.0, 300.0, 81.0, 25.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-4.86328125, -4.7711181640625, -4.678955078125, -4.5867919921875, -4.49462890625, -4.4024658203125, -4.310302734375, -4.2181396484375, -4.1259765625, -4.0338134765625, -3.941650390625, -3.8494873046875, -3.75732421875, -3.6651611328125, -3.572998046875, -3.4808349609375, -3.388671875, -3.2965087890625, -3.204345703125, -3.1121826171875, -3.02001953125, -2.9278564453125, -2.835693359375, -2.7435302734375, -2.6513671875, -2.5592041015625, -2.467041015625, -2.3748779296875, -2.28271484375, -2.1905517578125, -2.098388671875, -2.0062255859375, -1.9140625, -1.8218994140625, -1.729736328125, -1.6375732421875, -1.54541015625, -1.4532470703125, -1.361083984375, -1.2689208984375, -1.1767578125, -1.0845947265625, -0.992431640625, -0.9002685546875, -0.80810546875, -0.7159423828125, -0.623779296875, -0.5316162109375, -0.439453125, -0.3472900390625, -0.255126953125, -0.1629638671875, -0.07080078125, 0.0213623046875, 0.113525390625, 0.2056884765625, 0.2978515625, 0.3900146484375, 0.482177734375, 0.5743408203125, 0.66650390625, 0.7586669921875, 0.850830078125, 0.9429931640625, 1.03515625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 5.0, 15.0, 20.0, 37.0, 42.0, 89.0, 138.0, 157.0, 159.0, 129.0, 82.0, 57.0, 22.0, 19.0, 8.0, 6.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.920400619506836, -8.658134460449219, -8.395867347717285, -8.133601188659668, -7.871334552764893, -7.609067916870117, -7.3468017578125, -7.084535121917725, -6.822268486022949, -6.560001850128174, -6.297735214233398, -6.035469055175781, -5.773202419281006, -5.5109357833862305, -5.248669624328613, -4.986402988433838, -4.7241363525390625, -4.461869716644287, -4.199603080749512, -3.9373369216918945, -3.675070285797119, -3.4128036499023438, -3.1505372524261475, -2.888270854949951, -2.626004219055176, -2.3637375831604004, -2.101471185684204, -1.8392046689987183, -1.5769381523132324, -1.3146716356277466, -1.0524051189422607, -0.7901386022567749, -0.5278730392456055, -0.26560652256011963, -0.003340005874633789, 0.25892651081085205, 0.5211930274963379, 0.7834595441818237, 1.0457260608673096, 1.3079925775527954, 1.5702590942382812, 1.832525610923767, 2.094792127609253, 2.357058525085449, 2.6193251609802246, 2.881591796875, 3.1438581943511963, 3.4061245918273926, 3.668391227722168, 3.9306578636169434, 4.192924499511719, 4.455190658569336, 4.717457294464111, 4.979723930358887, 5.241990089416504, 5.504256725311279, 5.766523361206055, 6.02878999710083, 6.2910566329956055, 6.553322792053223, 6.815589427947998, 7.077856063842773, 7.340122222900391, 7.602388858795166, 7.864655494689941]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 11.0, 7.0, 22.0, 52.0, 46.0, 60.0, 84.0, 86.0, 99.0, 110.0, 107.0, 84.0, 58.0, 54.0, 35.0, 24.0, 16.0, 17.0, 12.0, 3.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.068631172180176, -6.798524856567383, -6.528418064117432, -6.2583112716674805, -5.9882049560546875, -5.7180986404418945, -5.447991847991943, -5.177885055541992, -4.907778739929199, -4.637672424316406, -4.367565631866455, -4.097458839416504, -3.827352523803711, -3.557245969772339, -3.287139415740967, -3.0170328617095947, -2.7469263076782227, -2.4768197536468506, -2.2067131996154785, -1.9366066455841064, -1.6665000915527344, -1.3963935375213623, -1.1262869834899902, -0.8561804294586182, -0.5860738754272461, -0.315967321395874, -0.04586076736450195, 0.22424578666687012, 0.4943523406982422, 0.7644588947296143, 1.0345654487609863, 1.3046720027923584, 1.574777603149414, 1.8448841571807861, 2.114990711212158, 2.3850972652435303, 2.6552038192749023, 2.9253103733062744, 3.1954169273376465, 3.4655234813690186, 3.7356300354003906, 4.005736351013184, 4.275843143463135, 4.545949935913086, 4.816056251525879, 5.086162567138672, 5.356269359588623, 5.626376152038574, 5.896482467651367, 6.16658878326416, 6.436695575714111, 6.7068023681640625, 6.9769086837768555, 7.247014999389648, 7.5171217918396, 7.787228584289551, 8.057334899902344, 8.327441215515137, 8.59754753112793, 8.867654800415039, 9.137761116027832, 9.407867431640625, 9.677974700927734, 9.948081016540527, 10.21818733215332]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 13.0, 7.0, 13.0, 28.0, 42.0, 36.0, 51.0, 106.0, 130.0, 201.0, 326.0, 531.0, 942.0, 1697.0, 3225.0, 6500.0, 14332.0, 34550.0, 88887.0, 224228.0, 344565.0, 196975.0, 76066.0, 29661.0, 12738.0, 5896.0, 2945.0, 1594.0, 904.0, 484.0, 315.0, 175.0, 125.0, 73.0, 63.0, 41.0, 24.0, 20.0, 11.0, 9.0, 8.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1074981689453125, -1.065582275390625, -1.0236663818359375, -0.98175048828125, -0.9398345947265625, -0.897918701171875, -0.8560028076171875, -0.8140869140625, -0.7721710205078125, -0.730255126953125, -0.6883392333984375, -0.64642333984375, -0.6045074462890625, -0.562591552734375, -0.5206756591796875, -0.478759765625, -0.4368438720703125, -0.394927978515625, -0.3530120849609375, -0.31109619140625, -0.2691802978515625, -0.227264404296875, -0.1853485107421875, -0.1434326171875, -0.1015167236328125, -0.059600830078125, -0.0176849365234375, 0.02423095703125, 0.0661468505859375, 0.108062744140625, 0.1499786376953125, 0.19189453125, 0.2338104248046875, 0.275726318359375, 0.3176422119140625, 0.35955810546875, 0.4014739990234375, 0.443389892578125, 0.4853057861328125, 0.5272216796875, 0.5691375732421875, 0.611053466796875, 0.6529693603515625, 0.69488525390625, 0.7368011474609375, 0.778717041015625, 0.8206329345703125, 0.862548828125, 0.9044647216796875, 0.946380615234375, 0.9882965087890625, 1.03021240234375, 1.0721282958984375, 1.114044189453125, 1.1559600830078125, 1.1978759765625, 1.2397918701171875, 1.281707763671875, 1.3236236572265625, 1.36553955078125, 1.4074554443359375, 1.449371337890625, 1.4912872314453125, 1.533203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 2.0, 6.0, 10.0, 12.0, 15.0, 13.0, 25.0, 25.0, 30.0, 37.0, 31.0, 45.0, 40.0, 50.0, 71.0, 56.0, 62.0, 71.0, 64.0, 60.0, 39.0, 51.0, 32.0, 31.0, 26.0, 20.0, 14.0, 12.0, 9.0, 7.0, 8.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65673828125, -0.6317977905273438, -0.6068572998046875, -0.5819168090820312, -0.556976318359375, -0.5320358276367188, -0.5070953369140625, -0.48215484619140625, -0.45721435546875, -0.43227386474609375, -0.4073333740234375, -0.38239288330078125, -0.357452392578125, -0.33251190185546875, -0.3075714111328125, -0.28263092041015625, -0.2576904296875, -0.23274993896484375, -0.2078094482421875, -0.18286895751953125, -0.157928466796875, -0.13298797607421875, -0.1080474853515625, -0.08310699462890625, -0.05816650390625, -0.03322601318359375, -0.0082855224609375, 0.01665496826171875, 0.041595458984375, 0.06653594970703125, 0.0914764404296875, 0.11641693115234375, 0.141357421875, 0.16629791259765625, 0.1912384033203125, 0.21617889404296875, 0.241119384765625, 0.26605987548828125, 0.2910003662109375, 0.31594085693359375, 0.34088134765625, 0.36582183837890625, 0.3907623291015625, 0.41570281982421875, 0.440643310546875, 0.46558380126953125, 0.4905242919921875, 0.5154647827148438, 0.5404052734375, 0.5653457641601562, 0.5902862548828125, 0.6152267456054688, 0.640167236328125, 0.6651077270507812, 0.6900482177734375, 0.7149887084960938, 0.73992919921875, 0.7648696899414062, 0.7898101806640625, 0.8147506713867188, 0.839691162109375, 0.8646316528320312, 0.8895721435546875, 0.9145126342773438, 0.939453125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 9.0, 13.0, 38.0, 40.0, 87.0, 124.0, 183.0, 386.0, 911.0, 3824.0, 67998.0, 935323.0, 35122.0, 2889.0, 763.0, 338.0, 174.0, 119.0, 69.0, 49.0, 26.0, 20.0, 9.0, 9.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.61492919921875, -5.4173583984375, -5.21978759765625, -5.022216796875, -4.82464599609375, -4.6270751953125, -4.42950439453125, -4.23193359375, -4.03436279296875, -3.8367919921875, -3.63922119140625, -3.441650390625, -3.24407958984375, -3.0465087890625, -2.84893798828125, -2.6513671875, -2.45379638671875, -2.2562255859375, -2.05865478515625, -1.861083984375, -1.66351318359375, -1.4659423828125, -1.26837158203125, -1.07080078125, -0.87322998046875, -0.6756591796875, -0.47808837890625, -0.280517578125, -0.08294677734375, 0.1146240234375, 0.31219482421875, 0.509765625, 0.70733642578125, 0.9049072265625, 1.10247802734375, 1.300048828125, 1.49761962890625, 1.6951904296875, 1.89276123046875, 2.09033203125, 2.28790283203125, 2.4854736328125, 2.68304443359375, 2.880615234375, 3.07818603515625, 3.2757568359375, 3.47332763671875, 3.6708984375, 3.86846923828125, 4.0660400390625, 4.26361083984375, 4.461181640625, 4.65875244140625, 4.8563232421875, 5.05389404296875, 5.25146484375, 5.44903564453125, 5.6466064453125, 5.84417724609375, 6.041748046875, 6.23931884765625, 6.4368896484375, 6.63446044921875, 6.83203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 9.0, 12.0, 12.0, 13.0, 27.0, 27.0, 40.0, 43.0, 58.0, 52.0, 71.0, 97.0, 74.0, 84.0, 61.0, 73.0, 63.0, 52.0, 36.0, 29.0, 21.0, 16.0, 13.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.015625, -4.86053466796875, -4.7054443359375, -4.55035400390625, -4.395263671875, -4.24017333984375, -4.0850830078125, -3.92999267578125, -3.77490234375, -3.61981201171875, -3.4647216796875, -3.30963134765625, -3.154541015625, -2.99945068359375, -2.8443603515625, -2.68927001953125, -2.5341796875, -2.37908935546875, -2.2239990234375, -2.06890869140625, -1.913818359375, -1.75872802734375, -1.6036376953125, -1.44854736328125, -1.29345703125, -1.13836669921875, -0.9832763671875, -0.82818603515625, -0.673095703125, -0.51800537109375, -0.3629150390625, -0.20782470703125, -0.052734375, 0.10235595703125, 0.2574462890625, 0.41253662109375, 0.567626953125, 0.72271728515625, 0.8778076171875, 1.03289794921875, 1.18798828125, 1.34307861328125, 1.4981689453125, 1.65325927734375, 1.808349609375, 1.96343994140625, 2.1185302734375, 2.27362060546875, 2.4287109375, 2.58380126953125, 2.7388916015625, 2.89398193359375, 3.049072265625, 3.20416259765625, 3.3592529296875, 3.51434326171875, 3.66943359375, 3.82452392578125, 3.9796142578125, 4.13470458984375, 4.289794921875, 4.44488525390625, 4.5999755859375, 4.75506591796875, 4.91015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 10.0, 9.0, 15.0, 17.0, 44.0, 77.0, 136.0, 344.0, 1018.0, 4556.0, 63919.0, 922021.0, 50840.0, 3932.0, 915.0, 352.0, 150.0, 86.0, 34.0, 16.0, 17.0, 15.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.0872955322265625, -2.030059814453125, -1.9728240966796875, -1.91558837890625, -1.8583526611328125, -1.801116943359375, -1.7438812255859375, -1.6866455078125, -1.6294097900390625, -1.572174072265625, -1.5149383544921875, -1.45770263671875, -1.4004669189453125, -1.343231201171875, -1.2859954833984375, -1.228759765625, -1.1715240478515625, -1.114288330078125, -1.0570526123046875, -0.99981689453125, -0.9425811767578125, -0.885345458984375, -0.8281097412109375, -0.7708740234375, -0.7136383056640625, -0.656402587890625, -0.5991668701171875, -0.54193115234375, -0.4846954345703125, -0.427459716796875, -0.3702239990234375, -0.31298828125, -0.2557525634765625, -0.198516845703125, -0.1412811279296875, -0.08404541015625, -0.0268096923828125, 0.030426025390625, 0.0876617431640625, 0.1448974609375, 0.2021331787109375, 0.259368896484375, 0.3166046142578125, 0.37384033203125, 0.4310760498046875, 0.488311767578125, 0.5455474853515625, 0.602783203125, 0.6600189208984375, 0.717254638671875, 0.7744903564453125, 0.83172607421875, 0.8889617919921875, 0.946197509765625, 1.0034332275390625, 1.0606689453125, 1.1179046630859375, 1.175140380859375, 1.2323760986328125, 1.28961181640625, 1.3468475341796875, 1.404083251953125, 1.4613189697265625, 1.5185546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0, 5.0, 4.0, 9.0, 10.0, 10.0, 19.0, 24.0, 34.0, 42.0, 71.0, 92.0, 119.0, 112.0, 109.0, 103.0, 77.0, 39.0, 32.0, 21.0, 22.0, 7.0, 6.0, 11.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00023245811462402344, -0.00022589415311813354, -0.00021933019161224365, -0.00021276623010635376, -0.00020620226860046387, -0.00019963830709457397, -0.00019307434558868408, -0.0001865103840827942, -0.0001799464225769043, -0.0001733824610710144, -0.0001668184995651245, -0.00016025453805923462, -0.00015369057655334473, -0.00014712661504745483, -0.00014056265354156494, -0.00013399869203567505, -0.00012743473052978516, -0.00012087076902389526, -0.00011430680751800537, -0.00010774284601211548, -0.00010117888450622559, -9.46149230003357e-05, -8.80509614944458e-05, -8.148699998855591e-05, -7.492303848266602e-05, -6.835907697677612e-05, -6.179511547088623e-05, -5.523115396499634e-05, -4.8667192459106445e-05, -4.210323095321655e-05, -3.553926944732666e-05, -2.8975307941436768e-05, -2.2411346435546875e-05, -1.5847384929656982e-05, -9.28342342376709e-06, -2.7194619178771973e-06, 3.844499588012695e-06, 1.0408461093902588e-05, 1.697242259979248e-05, 2.3536384105682373e-05, 3.0100345611572266e-05, 3.666430711746216e-05, 4.322826862335205e-05, 4.979223012924194e-05, 5.6356191635131836e-05, 6.292015314102173e-05, 6.948411464691162e-05, 7.604807615280151e-05, 8.26120376586914e-05, 8.91759991645813e-05, 9.573996067047119e-05, 0.00010230392217636108, 0.00010886788368225098, 0.00011543184518814087, 0.00012199580669403076, 0.00012855976819992065, 0.00013512372970581055, 0.00014168769121170044, 0.00014825165271759033, 0.00015481561422348022, 0.00016137957572937012, 0.00016794353723526, 0.0001745074987411499, 0.0001810714602470398, 0.0001876354217529297]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 9.0, 7.0, 2.0, 9.0, 14.0, 29.0, 40.0, 58.0, 84.0, 182.0, 390.0, 820.0, 2496.0, 12710.0, 210623.0, 773386.0, 40026.0, 5149.0, 1377.0, 564.0, 247.0, 112.0, 82.0, 54.0, 29.0, 20.0, 13.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3692626953125, -1.325439453125, -1.2816162109375, -1.23779296875, -1.1939697265625, -1.150146484375, -1.1063232421875, -1.0625, -1.0186767578125, -0.974853515625, -0.9310302734375, -0.88720703125, -0.8433837890625, -0.799560546875, -0.7557373046875, -0.7119140625, -0.6680908203125, -0.624267578125, -0.5804443359375, -0.53662109375, -0.4927978515625, -0.448974609375, -0.4051513671875, -0.361328125, -0.3175048828125, -0.273681640625, -0.2298583984375, -0.18603515625, -0.1422119140625, -0.098388671875, -0.0545654296875, -0.0107421875, 0.0330810546875, 0.076904296875, 0.1207275390625, 0.16455078125, 0.2083740234375, 0.252197265625, 0.2960205078125, 0.33984375, 0.3836669921875, 0.427490234375, 0.4713134765625, 0.51513671875, 0.5589599609375, 0.602783203125, 0.6466064453125, 0.6904296875, 0.7342529296875, 0.778076171875, 0.8218994140625, 0.86572265625, 0.9095458984375, 0.953369140625, 0.9971923828125, 1.041015625, 1.0848388671875, 1.128662109375, 1.1724853515625, 1.21630859375, 1.2601318359375, 1.303955078125, 1.3477783203125, 1.3916015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 9.0, 11.0, 17.0, 35.0, 24.0, 58.0, 70.0, 86.0, 110.0, 118.0, 113.0, 93.0, 72.0, 60.0, 40.0, 21.0, 17.0, 11.0, 3.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.990234375, -0.952606201171875, -0.91497802734375, -0.877349853515625, -0.8397216796875, -0.802093505859375, -0.76446533203125, -0.726837158203125, -0.689208984375, -0.651580810546875, -0.61395263671875, -0.576324462890625, -0.5386962890625, -0.501068115234375, -0.46343994140625, -0.425811767578125, -0.38818359375, -0.350555419921875, -0.31292724609375, -0.275299072265625, -0.2376708984375, -0.200042724609375, -0.16241455078125, -0.124786376953125, -0.087158203125, -0.049530029296875, -0.01190185546875, 0.025726318359375, 0.0633544921875, 0.100982666015625, 0.13861083984375, 0.176239013671875, 0.2138671875, 0.251495361328125, 0.28912353515625, 0.326751708984375, 0.3643798828125, 0.402008056640625, 0.43963623046875, 0.477264404296875, 0.514892578125, 0.552520751953125, 0.59014892578125, 0.627777099609375, 0.6654052734375, 0.703033447265625, 0.74066162109375, 0.778289794921875, 0.81591796875, 0.853546142578125, 0.89117431640625, 0.928802490234375, 0.9664306640625, 1.004058837890625, 1.04168701171875, 1.079315185546875, 1.116943359375, 1.154571533203125, 1.19219970703125, 1.229827880859375, 1.2674560546875, 1.305084228515625, 1.34271240234375, 1.380340576171875, 1.41796875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 15.0, 17.0, 48.0, 104.0, 207.0, 276.0, 188.0, 76.0, 42.0, 24.0, 6.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.46487808227539, -16.038665771484375, -14.612455368041992, -13.186243057250977, -11.760031700134277, -10.333820343017578, -8.907608032226562, -7.481396675109863, -6.055185317993164, -4.628973960876465, -3.2027621269226074, -1.77655029296875, -0.3503389358520508, 1.0758724212646484, 2.502084732055664, 3.9282960891723633, 5.3545074462890625, 6.780718803405762, 8.206930160522461, 9.633142471313477, 11.059353828430176, 12.485565185546875, 13.91177749633789, 15.33798885345459, 16.76420021057129, 18.190412521362305, 19.616622924804688, 21.042835235595703, 22.46904754638672, 23.8952579498291, 25.321470260620117, 26.7476806640625, 28.17389678955078, 29.600109100341797, 31.02631950378418, 32.45252990722656, 33.87874221801758, 35.304954528808594, 36.73116683959961, 38.157379150390625, 39.583587646484375, 41.00979995727539, 42.436012268066406, 43.862220764160156, 45.28843307495117, 46.71464538574219, 48.1408576965332, 49.56707000732422, 50.993282318115234, 52.41949462890625, 53.845706939697266, 55.27191925048828, 56.69812774658203, 58.12434005737305, 59.55055236816406, 60.97676467895508, 62.402976989746094, 63.82918930053711, 65.25540161132812, 66.68161010742188, 68.10782623291016, 69.5340347290039, 70.96025085449219, 72.38645935058594, 73.81266784667969]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 5.0, 8.0, 10.0, 16.0, 18.0, 21.0, 20.0, 30.0, 37.0, 42.0, 59.0, 63.0, 61.0, 61.0, 51.0, 75.0, 64.0, 47.0, 51.0, 48.0, 51.0, 36.0, 23.0, 26.0, 14.0, 15.0, 9.0, 9.0, 9.0, 4.0, 7.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.036518096923828, -20.397083282470703, -19.757646560668945, -19.11821174621582, -18.478775024414062, -17.839340209960938, -17.199905395507812, -16.560470581054688, -15.92103385925293, -15.281598091125488, -14.642162322998047, -14.002727508544922, -13.36329174041748, -12.723855972290039, -12.084421157836914, -11.444985389709473, -10.805549621582031, -10.16611385345459, -9.526678085327148, -8.887243270874023, -8.247807502746582, -7.608371734619141, -6.968936443328857, -6.329501152038574, -5.690065383911133, -5.050629615783691, -4.411194324493408, -3.771758794784546, -3.1323232650756836, -2.4928877353668213, -1.853452205657959, -1.2140169143676758, -0.5745811462402344, 0.06485438346862793, 0.7042899131774902, 1.3437254428863525, 1.9831609725952148, 2.622596502304077, 3.2620320320129395, 3.9014673233032227, 4.540903091430664, 5.1803388595581055, 5.819774150848389, 6.459209442138672, 7.098645210266113, 7.738080978393555, 8.37751579284668, 9.016951560974121, 9.656387329101562, 10.295823097229004, 10.935258865356445, 11.57469367980957, 12.214129447937012, 12.853565216064453, 13.493000030517578, 14.13243579864502, 14.771871566772461, 15.411307334899902, 16.050743103027344, 16.69017791748047, 17.329612731933594, 17.96904945373535, 18.608484268188477, 19.247920989990234, 19.88735580444336]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 1.0, 2.0, 7.0, 6.0, 9.0, 9.0, 7.0, 11.0, 13.0, 19.0, 24.0, 33.0, 34.0, 41.0, 65.0, 110.0, 127.0, 223.0, 365.0, 682.0, 1260.0, 3059.0, 7999.0, 27231.0, 142278.0, 3218992.0, 697350.0, 66861.0, 17249.0, 5733.0, 2310.0, 1062.0, 495.0, 232.0, 144.0, 87.0, 53.0, 28.0, 20.0, 12.0, 12.0, 12.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.08203125, -2.030975341796875, -1.97991943359375, -1.928863525390625, -1.8778076171875, -1.826751708984375, -1.77569580078125, -1.724639892578125, -1.673583984375, -1.622528076171875, -1.57147216796875, -1.520416259765625, -1.4693603515625, -1.418304443359375, -1.36724853515625, -1.316192626953125, -1.26513671875, -1.214080810546875, -1.16302490234375, -1.111968994140625, -1.0609130859375, -1.009857177734375, -0.95880126953125, -0.907745361328125, -0.856689453125, -0.805633544921875, -0.75457763671875, -0.703521728515625, -0.6524658203125, -0.601409912109375, -0.55035400390625, -0.499298095703125, -0.4482421875, -0.397186279296875, -0.34613037109375, -0.295074462890625, -0.2440185546875, -0.192962646484375, -0.14190673828125, -0.090850830078125, -0.039794921875, 0.011260986328125, 0.06231689453125, 0.113372802734375, 0.1644287109375, 0.215484619140625, 0.26654052734375, 0.317596435546875, 0.36865234375, 0.419708251953125, 0.47076416015625, 0.521820068359375, 0.5728759765625, 0.623931884765625, 0.67498779296875, 0.726043701171875, 0.777099609375, 0.828155517578125, 0.87921142578125, 0.930267333984375, 0.9813232421875, 1.032379150390625, 1.08343505859375, 1.134490966796875, 1.185546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 20.0, 34.0, 61.0, 89.0, 103.0, 145.0, 142.0, 107.0, 115.0, 57.0, 53.0, 32.0, 11.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15625, -2.1038665771484375, -2.051483154296875, -1.9990997314453125, -1.94671630859375, -1.8943328857421875, -1.841949462890625, -1.7895660400390625, -1.7371826171875, -1.6847991943359375, -1.632415771484375, -1.5800323486328125, -1.52764892578125, -1.4752655029296875, -1.422882080078125, -1.3704986572265625, -1.318115234375, -1.2657318115234375, -1.213348388671875, -1.1609649658203125, -1.10858154296875, -1.0561981201171875, -1.003814697265625, -0.9514312744140625, -0.8990478515625, -0.8466644287109375, -0.794281005859375, -0.7418975830078125, -0.68951416015625, -0.6371307373046875, -0.584747314453125, -0.5323638916015625, -0.47998046875, -0.4275970458984375, -0.375213623046875, -0.3228302001953125, -0.27044677734375, -0.2180633544921875, -0.165679931640625, -0.1132965087890625, -0.0609130859375, -0.0085296630859375, 0.043853759765625, 0.0962371826171875, 0.14862060546875, 0.2010040283203125, 0.253387451171875, 0.3057708740234375, 0.358154296875, 0.4105377197265625, 0.462921142578125, 0.5153045654296875, 0.56768798828125, 0.6200714111328125, 0.672454833984375, 0.7248382568359375, 0.7772216796875, 0.8296051025390625, 0.881988525390625, 0.9343719482421875, 0.98675537109375, 1.0391387939453125, 1.091522216796875, 1.1439056396484375, 1.1962890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 7.0, 10.0, 14.0, 20.0, 23.0, 50.0, 73.0, 110.0, 232.0, 518.0, 1252.0, 3844.0, 15148.0, 104116.0, 3659443.0, 368966.0, 30547.0, 6449.0, 1981.0, 780.0, 301.0, 156.0, 85.0, 44.0, 21.0, 14.0, 13.0, 10.0, 6.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.833984375, -2.749908447265625, -2.66583251953125, -2.581756591796875, -2.4976806640625, -2.413604736328125, -2.32952880859375, -2.245452880859375, -2.161376953125, -2.077301025390625, -1.99322509765625, -1.909149169921875, -1.8250732421875, -1.740997314453125, -1.65692138671875, -1.572845458984375, -1.48876953125, -1.404693603515625, -1.32061767578125, -1.236541748046875, -1.1524658203125, -1.068389892578125, -0.98431396484375, -0.900238037109375, -0.816162109375, -0.732086181640625, -0.64801025390625, -0.563934326171875, -0.4798583984375, -0.395782470703125, -0.31170654296875, -0.227630615234375, -0.1435546875, -0.059478759765625, 0.02459716796875, 0.108673095703125, 0.1927490234375, 0.276824951171875, 0.36090087890625, 0.444976806640625, 0.529052734375, 0.613128662109375, 0.69720458984375, 0.781280517578125, 0.8653564453125, 0.949432373046875, 1.03350830078125, 1.117584228515625, 1.20166015625, 1.285736083984375, 1.36981201171875, 1.453887939453125, 1.5379638671875, 1.622039794921875, 1.70611572265625, 1.790191650390625, 1.874267578125, 1.958343505859375, 2.04241943359375, 2.126495361328125, 2.2105712890625, 2.294647216796875, 2.37872314453125, 2.462799072265625, 2.546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 8.0, 14.0, 15.0, 16.0, 20.0, 37.0, 63.0, 75.0, 147.0, 322.0, 856.0, 1215.0, 645.0, 257.0, 136.0, 66.0, 52.0, 29.0, 17.0, 21.0, 9.0, 7.0, 10.0, 4.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.41796875, -2.34332275390625, -2.2686767578125, -2.19403076171875, -2.119384765625, -2.04473876953125, -1.9700927734375, -1.89544677734375, -1.82080078125, -1.74615478515625, -1.6715087890625, -1.59686279296875, -1.522216796875, -1.44757080078125, -1.3729248046875, -1.29827880859375, -1.2236328125, -1.14898681640625, -1.0743408203125, -0.99969482421875, -0.925048828125, -0.85040283203125, -0.7757568359375, -0.70111083984375, -0.62646484375, -0.55181884765625, -0.4771728515625, -0.40252685546875, -0.327880859375, -0.25323486328125, -0.1785888671875, -0.10394287109375, -0.029296875, 0.04534912109375, 0.1199951171875, 0.19464111328125, 0.269287109375, 0.34393310546875, 0.4185791015625, 0.49322509765625, 0.56787109375, 0.64251708984375, 0.7171630859375, 0.79180908203125, 0.866455078125, 0.94110107421875, 1.0157470703125, 1.09039306640625, 1.1650390625, 1.23968505859375, 1.3143310546875, 1.38897705078125, 1.463623046875, 1.53826904296875, 1.6129150390625, 1.68756103515625, 1.76220703125, 1.83685302734375, 1.9114990234375, 1.98614501953125, 2.060791015625, 2.13543701171875, 2.2100830078125, 2.28472900390625, 2.359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 8.0, 14.0, 31.0, 94.0, 215.0, 285.0, 194.0, 99.0, 31.0, 9.0, 7.0, 6.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.81629180908203, -35.92899703979492, -35.04170227050781, -34.1544075012207, -33.267112731933594, -32.379817962646484, -31.492525100708008, -30.6052303314209, -29.71793556213379, -28.83064079284668, -27.94334602355957, -27.05605125427246, -26.168758392333984, -25.281463623046875, -24.394168853759766, -23.506874084472656, -22.619579315185547, -21.732284545898438, -20.844989776611328, -19.95769500732422, -19.07040023803711, -18.18310546875, -17.295812606811523, -16.408517837524414, -15.521223068237305, -14.633928298950195, -13.746633529663086, -12.859339714050293, -11.972044944763184, -11.084750175476074, -10.197456359863281, -9.310161590576172, -8.422868728637695, -7.535573959350586, -6.648279666900635, -5.760985374450684, -4.873690605163574, -3.986395835876465, -3.0991015434265137, -2.2118072509765625, -1.3245124816894531, -0.43721795082092285, 0.4500765800476074, 1.3373711109161377, 2.224665641784668, 3.1119604110717773, 3.9992547035217285, 4.88654899597168, 5.773843765258789, 6.661138534545898, 7.54843282699585, 8.4357271194458, 9.32302188873291, 10.21031665802002, 11.097610473632812, 11.984905242919922, 12.872200012207031, 13.75949478149414, 14.64678955078125, 15.534083366394043, 16.42137908935547, 17.308673858642578, 18.195966720581055, 19.083261489868164, 19.970556259155273]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 13.0, 18.0, 21.0, 19.0, 22.0, 36.0, 28.0, 45.0, 43.0, 48.0, 66.0, 54.0, 60.0, 62.0, 56.0, 52.0, 52.0, 40.0, 40.0, 39.0, 42.0, 21.0, 23.0, 23.0, 13.0, 12.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.543047904968262, -9.176339149475098, -8.809630393981934, -8.44292163848877, -8.076212882995605, -7.709504127502441, -7.342795372009277, -6.976086616516113, -6.609377861022949, -6.242669105529785, -5.875960350036621, -5.509251594543457, -5.142542839050293, -4.775834083557129, -4.409125328063965, -4.042416572570801, -3.6757073402404785, -3.3089985847473145, -2.9422898292541504, -2.5755810737609863, -2.2088723182678223, -1.8421634435653687, -1.475454568862915, -1.108745813369751, -0.7420370578765869, -0.37532827258110046, -0.008619487285614014, 0.3580893278121948, 0.7247980833053589, 1.091506838798523, 1.4582157135009766, 1.8249244689941406, 2.1916332244873047, 2.5583419799804688, 2.925050735473633, 3.291759490966797, 3.658468246459961, 4.025177001953125, 4.391885757446289, 4.758594512939453, 5.125303268432617, 5.492012023925781, 5.858720779418945, 6.225429534912109, 6.592138290405273, 6.9588470458984375, 7.325555801391602, 7.692264556884766, 8.05897331237793, 8.425682067871094, 8.792390823364258, 9.159099578857422, 9.525808334350586, 9.89251708984375, 10.259225845336914, 10.625934600830078, 10.992644309997559, 11.359353065490723, 11.726061820983887, 12.09277057647705, 12.459479331970215, 12.826188087463379, 13.192896842956543, 13.559605598449707, 13.926314353942871]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 5.0, 8.0, 8.0, 18.0, 35.0, 35.0, 70.0, 96.0, 178.0, 266.0, 411.0, 826.0, 1382.0, 2527.0, 5060.0, 10587.0, 23187.0, 53036.0, 118712.0, 230494.0, 278968.0, 173788.0, 81420.0, 35885.0, 16066.0, 7405.0, 3692.0, 1902.0, 989.0, 562.0, 343.0, 191.0, 141.0, 93.0, 48.0, 39.0, 29.0, 12.0, 9.0, 8.0, 6.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-1.09765625, -1.0656204223632812, -1.0335845947265625, -1.0015487670898438, -0.969512939453125, -0.9374771118164062, -0.9054412841796875, -0.8734054565429688, -0.84136962890625, -0.8093338012695312, -0.7772979736328125, -0.7452621459960938, -0.713226318359375, -0.6811904907226562, -0.6491546630859375, -0.6171188354492188, -0.5850830078125, -0.5530471801757812, -0.5210113525390625, -0.48897552490234375, -0.456939697265625, -0.42490386962890625, -0.3928680419921875, -0.36083221435546875, -0.32879638671875, -0.29676055908203125, -0.2647247314453125, -0.23268890380859375, -0.200653076171875, -0.16861724853515625, -0.1365814208984375, -0.10454559326171875, -0.072509765625, -0.04047393798828125, -0.0084381103515625, 0.02359771728515625, 0.055633544921875, 0.08766937255859375, 0.1197052001953125, 0.15174102783203125, 0.18377685546875, 0.21581268310546875, 0.2478485107421875, 0.27988433837890625, 0.311920166015625, 0.34395599365234375, 0.3759918212890625, 0.40802764892578125, 0.4400634765625, 0.47209930419921875, 0.5041351318359375, 0.5361709594726562, 0.568206787109375, 0.6002426147460938, 0.6322784423828125, 0.6643142700195312, 0.69635009765625, 0.7283859252929688, 0.7604217529296875, 0.7924575805664062, 0.824493408203125, 0.8565292358398438, 0.8885650634765625, 0.9206008911132812, 0.95263671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 12.0, 7.0, 15.0, 21.0, 18.0, 39.0, 61.0, 83.0, 81.0, 100.0, 115.0, 97.0, 86.0, 71.0, 65.0, 45.0, 29.0, 22.0, 13.0, 10.0, 10.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3935546875, -1.35540771484375, -1.3172607421875, -1.27911376953125, -1.240966796875, -1.20281982421875, -1.1646728515625, -1.12652587890625, -1.08837890625, -1.05023193359375, -1.0120849609375, -0.97393798828125, -0.935791015625, -0.89764404296875, -0.8594970703125, -0.82135009765625, -0.783203125, -0.74505615234375, -0.7069091796875, -0.66876220703125, -0.630615234375, -0.59246826171875, -0.5543212890625, -0.51617431640625, -0.47802734375, -0.43988037109375, -0.4017333984375, -0.36358642578125, -0.325439453125, -0.28729248046875, -0.2491455078125, -0.21099853515625, -0.1728515625, -0.13470458984375, -0.0965576171875, -0.05841064453125, -0.020263671875, 0.01788330078125, 0.0560302734375, 0.09417724609375, 0.13232421875, 0.17047119140625, 0.2086181640625, 0.24676513671875, 0.284912109375, 0.32305908203125, 0.3612060546875, 0.39935302734375, 0.4375, 0.47564697265625, 0.5137939453125, 0.55194091796875, 0.590087890625, 0.62823486328125, 0.6663818359375, 0.70452880859375, 0.74267578125, 0.78082275390625, 0.8189697265625, 0.85711669921875, 0.895263671875, 0.93341064453125, 0.9715576171875, 1.00970458984375, 1.0478515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 4.0, 17.0, 14.0, 24.0, 40.0, 44.0, 80.0, 122.0, 171.0, 280.0, 453.0, 743.0, 1439.0, 3079.0, 8967.0, 35384.0, 203057.0, 603385.0, 151022.0, 27166.0, 7176.0, 2705.0, 1258.0, 681.0, 423.0, 267.0, 157.0, 118.0, 69.0, 45.0, 43.0, 34.0, 23.0, 14.0, 8.0, 6.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71875, -1.6536865234375, -1.588623046875, -1.5235595703125, -1.45849609375, -1.3934326171875, -1.328369140625, -1.2633056640625, -1.1982421875, -1.1331787109375, -1.068115234375, -1.0030517578125, -0.93798828125, -0.8729248046875, -0.807861328125, -0.7427978515625, -0.677734375, -0.6126708984375, -0.547607421875, -0.4825439453125, -0.41748046875, -0.3524169921875, -0.287353515625, -0.2222900390625, -0.1572265625, -0.0921630859375, -0.027099609375, 0.0379638671875, 0.10302734375, 0.1680908203125, 0.233154296875, 0.2982177734375, 0.36328125, 0.4283447265625, 0.493408203125, 0.5584716796875, 0.62353515625, 0.6885986328125, 0.753662109375, 0.8187255859375, 0.8837890625, 0.9488525390625, 1.013916015625, 1.0789794921875, 1.14404296875, 1.2091064453125, 1.274169921875, 1.3392333984375, 1.404296875, 1.4693603515625, 1.534423828125, 1.5994873046875, 1.66455078125, 1.7296142578125, 1.794677734375, 1.8597412109375, 1.9248046875, 1.9898681640625, 2.054931640625, 2.1199951171875, 2.18505859375, 2.2501220703125, 2.315185546875, 2.3802490234375, 2.4453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0, 4.0, 7.0, 14.0, 12.0, 14.0, 17.0, 25.0, 17.0, 26.0, 28.0, 48.0, 46.0, 43.0, 46.0, 56.0, 52.0, 48.0, 42.0, 55.0, 42.0, 46.0, 43.0, 34.0, 43.0, 30.0, 27.0, 25.0, 13.0, 20.0, 18.0, 10.0, 12.0, 5.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9765625, -2.883453369140625, -2.79034423828125, -2.697235107421875, -2.6041259765625, -2.511016845703125, -2.41790771484375, -2.324798583984375, -2.231689453125, -2.138580322265625, -2.04547119140625, -1.952362060546875, -1.8592529296875, -1.766143798828125, -1.67303466796875, -1.579925537109375, -1.48681640625, -1.393707275390625, -1.30059814453125, -1.207489013671875, -1.1143798828125, -1.021270751953125, -0.92816162109375, -0.835052490234375, -0.741943359375, -0.648834228515625, -0.55572509765625, -0.462615966796875, -0.3695068359375, -0.276397705078125, -0.18328857421875, -0.090179443359375, 0.0029296875, 0.096038818359375, 0.18914794921875, 0.282257080078125, 0.3753662109375, 0.468475341796875, 0.56158447265625, 0.654693603515625, 0.747802734375, 0.840911865234375, 0.93402099609375, 1.027130126953125, 1.1202392578125, 1.213348388671875, 1.30645751953125, 1.399566650390625, 1.49267578125, 1.585784912109375, 1.67889404296875, 1.772003173828125, 1.8651123046875, 1.958221435546875, 2.05133056640625, 2.144439697265625, 2.237548828125, 2.330657958984375, 2.42376708984375, 2.516876220703125, 2.6099853515625, 2.703094482421875, 2.79620361328125, 2.889312744140625, 2.982421875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 1.0, 10.0, 24.0, 16.0, 25.0, 57.0, 61.0, 125.0, 234.0, 514.0, 1217.0, 4067.0, 21468.0, 300791.0, 670013.0, 40820.0, 6090.0, 1674.0, 624.0, 300.0, 169.0, 87.0, 54.0, 21.0, 28.0, 18.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2216796875, -1.1858978271484375, -1.150115966796875, -1.1143341064453125, -1.07855224609375, -1.0427703857421875, -1.006988525390625, -0.9712066650390625, -0.9354248046875, -0.8996429443359375, -0.863861083984375, -0.8280792236328125, -0.79229736328125, -0.7565155029296875, -0.720733642578125, -0.6849517822265625, -0.649169921875, -0.6133880615234375, -0.577606201171875, -0.5418243408203125, -0.50604248046875, -0.4702606201171875, -0.434478759765625, -0.3986968994140625, -0.3629150390625, -0.3271331787109375, -0.291351318359375, -0.2555694580078125, -0.21978759765625, -0.1840057373046875, -0.148223876953125, -0.1124420166015625, -0.07666015625, -0.0408782958984375, -0.005096435546875, 0.0306854248046875, 0.06646728515625, 0.1022491455078125, 0.138031005859375, 0.1738128662109375, 0.2095947265625, 0.2453765869140625, 0.281158447265625, 0.3169403076171875, 0.35272216796875, 0.3885040283203125, 0.424285888671875, 0.4600677490234375, 0.495849609375, 0.5316314697265625, 0.567413330078125, 0.6031951904296875, 0.63897705078125, 0.6747589111328125, 0.710540771484375, 0.7463226318359375, 0.7821044921875, 0.8178863525390625, 0.853668212890625, 0.8894500732421875, 0.92523193359375, 0.9610137939453125, 0.996795654296875, 1.0325775146484375, 1.068359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 7.0, 15.0, 20.0, 31.0, 40.0, 54.0, 74.0, 78.0, 126.0, 124.0, 109.0, 66.0, 63.0, 52.0, 28.0, 25.0, 19.0, 16.0, 9.0, 4.0, 4.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019669532775878906, -0.00019000470638275146, -0.00018331408500671387, -0.00017662346363067627, -0.00016993284225463867, -0.00016324222087860107, -0.00015655159950256348, -0.00014986097812652588, -0.00014317035675048828, -0.00013647973537445068, -0.00012978911399841309, -0.0001230984926223755, -0.00011640787124633789, -0.00010971724987030029, -0.0001030266284942627, -9.63360071182251e-05, -8.96453857421875e-05, -8.29547643661499e-05, -7.62641429901123e-05, -6.957352161407471e-05, -6.288290023803711e-05, -5.619227886199951e-05, -4.9501657485961914e-05, -4.2811036109924316e-05, -3.612041473388672e-05, -2.942979335784912e-05, -2.2739171981811523e-05, -1.6048550605773926e-05, -9.357929229736328e-06, -2.6673078536987305e-06, 4.023313522338867e-06, 1.0713934898376465e-05, 1.7404556274414062e-05, 2.409517765045166e-05, 3.078579902648926e-05, 3.7476420402526855e-05, 4.416704177856445e-05, 5.085766315460205e-05, 5.754828453063965e-05, 6.423890590667725e-05, 7.092952728271484e-05, 7.762014865875244e-05, 8.431077003479004e-05, 9.100139141082764e-05, 9.769201278686523e-05, 0.00010438263416290283, 0.00011107325553894043, 0.00011776387691497803, 0.00012445449829101562, 0.00013114511966705322, 0.00013783574104309082, 0.00014452636241912842, 0.00015121698379516602, 0.0001579076051712036, 0.0001645982265472412, 0.0001712888479232788, 0.0001779794692993164, 0.000184670090675354, 0.0001913607120513916, 0.0001980513334274292, 0.0002047419548034668, 0.0002114325761795044, 0.000218123197555542, 0.0002248138189315796, 0.0002315044403076172]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 4.0, 6.0, 12.0, 22.0, 24.0, 54.0, 86.0, 162.0, 279.0, 508.0, 1155.0, 3233.0, 11184.0, 80193.0, 722084.0, 200764.0, 20936.0, 4688.0, 1668.0, 705.0, 326.0, 163.0, 104.0, 68.0, 37.0, 25.0, 17.0, 14.0, 8.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9033203125, -0.8738784790039062, -0.8444366455078125, -0.8149948120117188, -0.785552978515625, -0.7561111450195312, -0.7266693115234375, -0.6972274780273438, -0.66778564453125, -0.6383438110351562, -0.6089019775390625, -0.5794601440429688, -0.550018310546875, -0.5205764770507812, -0.4911346435546875, -0.46169281005859375, -0.4322509765625, -0.40280914306640625, -0.3733673095703125, -0.34392547607421875, -0.314483642578125, -0.28504180908203125, -0.2555999755859375, -0.22615814208984375, -0.19671630859375, -0.16727447509765625, -0.1378326416015625, -0.10839080810546875, -0.078948974609375, -0.04950714111328125, -0.0200653076171875, 0.00937652587890625, 0.038818359375, 0.06826019287109375, 0.0977020263671875, 0.12714385986328125, 0.156585693359375, 0.18602752685546875, 0.2154693603515625, 0.24491119384765625, 0.27435302734375, 0.30379486083984375, 0.3332366943359375, 0.36267852783203125, 0.392120361328125, 0.42156219482421875, 0.4510040283203125, 0.48044586181640625, 0.5098876953125, 0.5393295288085938, 0.5687713623046875, 0.5982131958007812, 0.627655029296875, 0.6570968627929688, 0.6865386962890625, 0.7159805297851562, 0.74542236328125, 0.7748641967773438, 0.8043060302734375, 0.8337478637695312, 0.863189697265625, 0.8926315307617188, 0.9220733642578125, 0.9515151977539062, 0.98095703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 5.0, 8.0, 6.0, 13.0, 15.0, 21.0, 23.0, 33.0, 35.0, 50.0, 53.0, 66.0, 86.0, 80.0, 82.0, 71.0, 69.0, 77.0, 59.0, 30.0, 26.0, 29.0, 14.0, 10.0, 13.0, 9.0, 7.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.66455078125, -0.6380538940429688, -0.6115570068359375, -0.5850601196289062, -0.558563232421875, -0.5320663452148438, -0.5055694580078125, -0.47907257080078125, -0.45257568359375, -0.42607879638671875, -0.3995819091796875, -0.37308502197265625, -0.346588134765625, -0.32009124755859375, -0.2935943603515625, -0.26709747314453125, -0.2406005859375, -0.21410369873046875, -0.1876068115234375, -0.16110992431640625, -0.134613037109375, -0.10811614990234375, -0.0816192626953125, -0.05512237548828125, -0.02862548828125, -0.00212860107421875, 0.0243682861328125, 0.05086517333984375, 0.077362060546875, 0.10385894775390625, 0.1303558349609375, 0.15685272216796875, 0.183349609375, 0.20984649658203125, 0.2363433837890625, 0.26284027099609375, 0.289337158203125, 0.31583404541015625, 0.3423309326171875, 0.36882781982421875, 0.39532470703125, 0.42182159423828125, 0.4483184814453125, 0.47481536865234375, 0.501312255859375, 0.5278091430664062, 0.5543060302734375, 0.5808029174804688, 0.6072998046875, 0.6337966918945312, 0.6602935791015625, 0.6867904663085938, 0.713287353515625, 0.7397842407226562, 0.7662811279296875, 0.7927780151367188, 0.81927490234375, 0.8457717895507812, 0.8722686767578125, 0.8987655639648438, 0.925262451171875, 0.9517593383789062, 0.9782562255859375, 1.0047531127929688, 1.03125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 52.0, 240.0, 532.0, 164.0, 18.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.50355529785156, -74.56202697753906, -72.6205062866211, -70.6789779663086, -68.7374496459961, -66.79592895507812, -64.85440063476562, -62.91287612915039, -60.971351623535156, -59.02982711791992, -57.08829879760742, -55.14677429199219, -53.20524978637695, -51.26372528076172, -49.32219696044922, -47.380672454833984, -45.439144134521484, -43.49761962890625, -41.55609130859375, -39.614566802978516, -37.67304229736328, -35.73151397705078, -33.78998947143555, -31.848464965820312, -29.906938552856445, -27.965412139892578, -26.023887634277344, -24.082361221313477, -22.14083480834961, -20.199310302734375, -18.257783889770508, -16.31625747680664, -14.374736785888672, -12.433211326599121, -10.49168586730957, -8.550159454345703, -6.608633995056152, -4.667108535766602, -2.7255821228027344, -0.7840566635131836, 1.1574687957763672, 3.098994493484497, 5.040520191192627, 6.982046127319336, 8.923571586608887, 10.865097045898438, 12.806623458862305, 14.748148918151855, 16.689674377441406, 18.631200790405273, 20.572725296020508, 22.514251708984375, 24.45577621459961, 26.397302627563477, 28.338829040527344, 30.280353546142578, 32.22187805175781, 34.16340255737305, 36.10493087768555, 38.04645538330078, 39.987979888916016, 41.92950439453125, 43.87103271484375, 45.812557220458984, 47.754085540771484]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 11.0, 15.0, 25.0, 38.0, 40.0, 29.0, 57.0, 76.0, 74.0, 82.0, 96.0, 80.0, 75.0, 63.0, 53.0, 35.0, 27.0, 38.0, 27.0, 21.0, 10.0, 4.0, 8.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.208656311035156, -11.64046573638916, -11.072275161743164, -10.504084587097168, -9.935894012451172, -9.36770248413086, -8.799511909484863, -8.231321334838867, -7.663130760192871, -7.094940185546875, -6.526749610900879, -5.958558559417725, -5.3903679847717285, -4.822177410125732, -4.253986358642578, -3.685795783996582, -3.117605209350586, -2.54941463470459, -1.9812238216400146, -1.413033127784729, -0.8448424339294434, -0.27665185928344727, 0.29153895378112793, 0.8597297668457031, 1.4279203414916992, 1.9961110353469849, 2.5643017292022705, 3.1324925422668457, 3.700683116912842, 4.268873691558838, 4.837064743041992, 5.405255317687988, 5.973445892333984, 6.5416364669799805, 7.109827041625977, 7.678018093109131, 8.246208190917969, 8.814399719238281, 9.382590293884277, 9.950780868530273, 10.51897144317627, 11.087162017822266, 11.655352592468262, 12.223543167114258, 12.79173469543457, 13.35992431640625, 13.928115844726562, 14.496306419372559, 15.064496994018555, 15.63268756866455, 16.200878143310547, 16.76906967163086, 17.33725929260254, 17.90545082092285, 18.47364044189453, 19.041831970214844, 19.610023498535156, 20.17821502685547, 20.74640464782715, 21.31459617614746, 21.88278579711914, 22.450977325439453, 23.019166946411133, 23.587358474731445, 24.155548095703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 3.0, 5.0, 6.0, 13.0, 19.0, 28.0, 49.0, 86.0, 187.0, 374.0, 1018.0, 3378.0, 14450.0, 105262.0, 3593194.0, 439311.0, 27866.0, 5924.0, 1758.0, 675.0, 274.0, 155.0, 72.0, 55.0, 37.0, 26.0, 17.0, 10.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.033203125, -1.9746246337890625, -1.916046142578125, -1.8574676513671875, -1.79888916015625, -1.7403106689453125, -1.681732177734375, -1.6231536865234375, -1.5645751953125, -1.5059967041015625, -1.447418212890625, -1.3888397216796875, -1.33026123046875, -1.2716827392578125, -1.213104248046875, -1.1545257568359375, -1.095947265625, -1.0373687744140625, -0.978790283203125, -0.9202117919921875, -0.86163330078125, -0.8030548095703125, -0.744476318359375, -0.6858978271484375, -0.6273193359375, -0.5687408447265625, -0.510162353515625, -0.4515838623046875, -0.39300537109375, -0.3344268798828125, -0.275848388671875, -0.2172698974609375, -0.15869140625, -0.1001129150390625, -0.041534423828125, 0.0170440673828125, 0.07562255859375, 0.1342010498046875, 0.192779541015625, 0.2513580322265625, 0.3099365234375, 0.3685150146484375, 0.427093505859375, 0.4856719970703125, 0.54425048828125, 0.6028289794921875, 0.661407470703125, 0.7199859619140625, 0.778564453125, 0.8371429443359375, 0.895721435546875, 0.9542999267578125, 1.01287841796875, 1.0714569091796875, 1.130035400390625, 1.1886138916015625, 1.2471923828125, 1.3057708740234375, 1.364349365234375, 1.4229278564453125, 1.48150634765625, 1.5400848388671875, 1.598663330078125, 1.6572418212890625, 1.7158203125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 20.0, 21.0, 32.0, 44.0, 62.0, 94.0, 100.0, 118.0, 114.0, 93.0, 83.0, 68.0, 55.0, 30.0, 18.0, 21.0, 15.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6360549926757812, -0.5968170166015625, -0.5575790405273438, -0.518341064453125, -0.47910308837890625, -0.4398651123046875, -0.40062713623046875, -0.36138916015625, -0.32215118408203125, -0.2829132080078125, -0.24367523193359375, -0.204437255859375, -0.16519927978515625, -0.1259613037109375, -0.08672332763671875, -0.0474853515625, -0.00824737548828125, 0.0309906005859375, 0.07022857666015625, 0.109466552734375, 0.14870452880859375, 0.1879425048828125, 0.22718048095703125, 0.26641845703125, 0.30565643310546875, 0.3448944091796875, 0.38413238525390625, 0.423370361328125, 0.46260833740234375, 0.5018463134765625, 0.5410842895507812, 0.580322265625, 0.6195602416992188, 0.6587982177734375, 0.6980361938476562, 0.737274169921875, 0.7765121459960938, 0.8157501220703125, 0.8549880981445312, 0.89422607421875, 0.9334640502929688, 0.9727020263671875, 1.0119400024414062, 1.051177978515625, 1.0904159545898438, 1.1296539306640625, 1.1688919067382812, 1.2081298828125, 1.2473678588867188, 1.2866058349609375, 1.3258438110351562, 1.365081787109375, 1.4043197631835938, 1.4435577392578125, 1.4827957153320312, 1.52203369140625, 1.5612716674804688, 1.6005096435546875, 1.6397476196289062, 1.678985595703125, 1.7182235717773438, 1.7574615478515625, 1.7966995239257812, 1.8359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 7.0, 2.0, 1.0, 1.0, 12.0, 7.0, 17.0, 31.0, 35.0, 55.0, 108.0, 178.0, 311.0, 703.0, 1453.0, 3292.0, 7941.0, 21684.0, 82117.0, 899304.0, 2946036.0, 175515.0, 36060.0, 11405.0, 4438.0, 1889.0, 810.0, 391.0, 203.0, 108.0, 69.0, 38.0, 19.0, 18.0, 6.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5166015625, -1.472259521484375, -1.42791748046875, -1.383575439453125, -1.3392333984375, -1.294891357421875, -1.25054931640625, -1.206207275390625, -1.161865234375, -1.117523193359375, -1.07318115234375, -1.028839111328125, -0.9844970703125, -0.940155029296875, -0.89581298828125, -0.851470947265625, -0.80712890625, -0.762786865234375, -0.71844482421875, -0.674102783203125, -0.6297607421875, -0.585418701171875, -0.54107666015625, -0.496734619140625, -0.452392578125, -0.408050537109375, -0.36370849609375, -0.319366455078125, -0.2750244140625, -0.230682373046875, -0.18634033203125, -0.141998291015625, -0.09765625, -0.053314208984375, -0.00897216796875, 0.035369873046875, 0.0797119140625, 0.124053955078125, 0.16839599609375, 0.212738037109375, 0.257080078125, 0.301422119140625, 0.34576416015625, 0.390106201171875, 0.4344482421875, 0.478790283203125, 0.52313232421875, 0.567474365234375, 0.61181640625, 0.656158447265625, 0.70050048828125, 0.744842529296875, 0.7891845703125, 0.833526611328125, 0.87786865234375, 0.922210693359375, 0.966552734375, 1.010894775390625, 1.05523681640625, 1.099578857421875, 1.1439208984375, 1.188262939453125, 1.23260498046875, 1.276947021484375, 1.3212890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 7.0, 5.0, 8.0, 8.0, 16.0, 19.0, 23.0, 43.0, 43.0, 84.0, 144.0, 289.0, 648.0, 1122.0, 743.0, 334.0, 172.0, 121.0, 75.0, 43.0, 30.0, 20.0, 21.0, 12.0, 11.0, 6.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.958984375, -1.9055633544921875, -1.852142333984375, -1.7987213134765625, -1.74530029296875, -1.6918792724609375, -1.638458251953125, -1.5850372314453125, -1.5316162109375, -1.4781951904296875, -1.424774169921875, -1.3713531494140625, -1.31793212890625, -1.2645111083984375, -1.211090087890625, -1.1576690673828125, -1.104248046875, -1.0508270263671875, -0.997406005859375, -0.9439849853515625, -0.89056396484375, -0.8371429443359375, -0.783721923828125, -0.7303009033203125, -0.6768798828125, -0.6234588623046875, -0.570037841796875, -0.5166168212890625, -0.46319580078125, -0.4097747802734375, -0.356353759765625, -0.3029327392578125, -0.24951171875, -0.1960906982421875, -0.142669677734375, -0.0892486572265625, -0.03582763671875, 0.0175933837890625, 0.071014404296875, 0.1244354248046875, 0.1778564453125, 0.2312774658203125, 0.284698486328125, 0.3381195068359375, 0.39154052734375, 0.4449615478515625, 0.498382568359375, 0.5518035888671875, 0.605224609375, 0.6586456298828125, 0.712066650390625, 0.7654876708984375, 0.81890869140625, 0.8723297119140625, 0.925750732421875, 0.9791717529296875, 1.0325927734375, 1.0860137939453125, 1.139434814453125, 1.1928558349609375, 1.24627685546875, 1.2996978759765625, 1.353118896484375, 1.4065399169921875, 1.4599609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 20.0, 33.0, 106.0, 206.0, 255.0, 187.0, 93.0, 37.0, 22.0, 5.0, 8.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.511463165283203, -19.945589065551758, -19.379714965820312, -18.8138427734375, -18.247968673706055, -17.68209457397461, -17.116220474243164, -16.55034637451172, -15.984474182128906, -15.418600082397461, -14.852726936340332, -14.286852836608887, -13.720979690551758, -13.155105590820312, -12.589231491088867, -12.023358345031738, -11.457484245300293, -10.891610145568848, -10.325736999511719, -9.759862899780273, -9.193989753723145, -8.6281156539917, -8.06224250793457, -7.496368408203125, -6.930494785308838, -6.364621162414551, -5.798747539520264, -5.232873916625977, -4.666999816894531, -4.101126670837402, -3.535252571105957, -2.96937894821167, -2.403505325317383, -1.8376317024230957, -1.271757960319519, -0.7058842182159424, -0.14001059532165527, 0.42586302757263184, 0.991736888885498, 1.5576105117797852, 2.1234841346740723, 2.6893577575683594, 3.2552313804626465, 3.8211052417755127, 4.386979103088379, 4.952852249145508, 5.518726348876953, 6.08459997177124, 6.650473594665527, 7.2163472175598145, 7.782220840454102, 8.348094940185547, 8.913968086242676, 9.479842185974121, 10.04571533203125, 10.611589431762695, 11.17746353149414, 11.743337631225586, 12.309210777282715, 12.87508487701416, 13.440958023071289, 14.006832122802734, 14.57270622253418, 15.138579368591309, 15.704452514648438]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 9.0, 13.0, 17.0, 25.0, 26.0, 29.0, 43.0, 49.0, 54.0, 58.0, 68.0, 73.0, 44.0, 65.0, 57.0, 61.0, 49.0, 55.0, 41.0, 33.0, 27.0, 33.0, 13.0, 16.0, 5.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.97507095336914, -10.702346801757812, -10.4296236038208, -10.156900405883789, -9.884176254272461, -9.611452102661133, -9.338728904724121, -9.06600570678711, -8.793281555175781, -8.520557403564453, -8.247834205627441, -7.9751105308532715, -7.702386856079102, -7.429663181304932, -7.156939506530762, -6.884215831756592, -6.611492156982422, -6.338768482208252, -6.066044807434082, -5.793321132659912, -5.520597457885742, -5.247873783111572, -4.975150108337402, -4.702426433563232, -4.4297027587890625, -4.156979084014893, -3.8842554092407227, -3.6115317344665527, -3.338808059692383, -3.066084384918213, -2.793360710144043, -2.520637035369873, -2.2479124069213867, -1.9751887321472168, -1.7024650573730469, -1.429741382598877, -1.157017707824707, -0.8842940330505371, -0.6115703582763672, -0.33884668350219727, -0.06612300872802734, 0.20660066604614258, 0.4793243408203125, 0.7520480155944824, 1.0247716903686523, 1.2974953651428223, 1.5702190399169922, 1.842942714691162, 2.115666389465332, 2.388390064239502, 2.661113739013672, 2.933837413787842, 3.2065610885620117, 3.4792847633361816, 3.7520084381103516, 4.0247321128845215, 4.297455787658691, 4.570179462432861, 4.842903137207031, 5.115626811981201, 5.388350486755371, 5.661074161529541, 5.933797836303711, 6.206521511077881, 6.479245185852051]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 15.0, 10.0, 18.0, 16.0, 37.0, 72.0, 102.0, 179.0, 282.0, 548.0, 972.0, 1831.0, 3556.0, 7507.0, 16546.0, 39832.0, 97100.0, 224158.0, 319042.0, 194028.0, 81706.0, 33418.0, 14379.0, 6529.0, 3095.0, 1550.0, 895.0, 474.0, 277.0, 150.0, 91.0, 48.0, 26.0, 19.0, 15.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0791015625, -1.04473876953125, -1.0103759765625, -0.97601318359375, -0.941650390625, -0.90728759765625, -0.8729248046875, -0.83856201171875, -0.80419921875, -0.76983642578125, -0.7354736328125, -0.70111083984375, -0.666748046875, -0.63238525390625, -0.5980224609375, -0.56365966796875, -0.529296875, -0.49493408203125, -0.4605712890625, -0.42620849609375, -0.391845703125, -0.35748291015625, -0.3231201171875, -0.28875732421875, -0.25439453125, -0.22003173828125, -0.1856689453125, -0.15130615234375, -0.116943359375, -0.08258056640625, -0.0482177734375, -0.01385498046875, 0.0205078125, 0.05487060546875, 0.0892333984375, 0.12359619140625, 0.157958984375, 0.19232177734375, 0.2266845703125, 0.26104736328125, 0.29541015625, 0.32977294921875, 0.3641357421875, 0.39849853515625, 0.432861328125, 0.46722412109375, 0.5015869140625, 0.53594970703125, 0.5703125, 0.60467529296875, 0.6390380859375, 0.67340087890625, 0.707763671875, 0.74212646484375, 0.7764892578125, 0.81085205078125, 0.84521484375, 0.87957763671875, 0.9139404296875, 0.94830322265625, 0.982666015625, 1.01702880859375, 1.0513916015625, 1.08575439453125, 1.1201171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 9.0, 8.0, 10.0, 22.0, 19.0, 20.0, 23.0, 30.0, 31.0, 43.0, 45.0, 29.0, 41.0, 64.0, 44.0, 67.0, 46.0, 61.0, 43.0, 42.0, 37.0, 50.0, 43.0, 34.0, 20.0, 32.0, 15.0, 11.0, 12.0, 10.0, 13.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5615234375, -0.5419845581054688, -0.5224456787109375, -0.5029067993164062, -0.483367919921875, -0.46382904052734375, -0.4442901611328125, -0.42475128173828125, -0.40521240234375, -0.38567352294921875, -0.3661346435546875, -0.34659576416015625, -0.327056884765625, -0.30751800537109375, -0.2879791259765625, -0.26844024658203125, -0.2489013671875, -0.22936248779296875, -0.2098236083984375, -0.19028472900390625, -0.170745849609375, -0.15120697021484375, -0.1316680908203125, -0.11212921142578125, -0.09259033203125, -0.07305145263671875, -0.0535125732421875, -0.03397369384765625, -0.014434814453125, 0.00510406494140625, 0.0246429443359375, 0.04418182373046875, 0.063720703125, 0.08325958251953125, 0.1027984619140625, 0.12233734130859375, 0.141876220703125, 0.16141510009765625, 0.1809539794921875, 0.20049285888671875, 0.22003173828125, 0.23957061767578125, 0.2591094970703125, 0.27864837646484375, 0.298187255859375, 0.31772613525390625, 0.3372650146484375, 0.35680389404296875, 0.3763427734375, 0.39588165283203125, 0.4154205322265625, 0.43495941162109375, 0.454498291015625, 0.47403717041015625, 0.4935760498046875, 0.5131149291992188, 0.53265380859375, 0.5521926879882812, 0.5717315673828125, 0.5912704467773438, 0.610809326171875, 0.6303482055664062, 0.6498870849609375, 0.6694259643554688, 0.68896484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 7.0, 6.0, 11.0, 11.0, 23.0, 25.0, 34.0, 47.0, 87.0, 130.0, 231.0, 330.0, 692.0, 1330.0, 3303.0, 11159.0, 56850.0, 386073.0, 500787.0, 67930.0, 12789.0, 3620.0, 1365.0, 713.0, 381.0, 224.0, 132.0, 70.0, 57.0, 30.0, 35.0, 25.0, 18.0, 9.0, 6.0, 2.0, 2.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3125, -2.242523193359375, -2.17254638671875, -2.102569580078125, -2.0325927734375, -1.962615966796875, -1.89263916015625, -1.822662353515625, -1.752685546875, -1.682708740234375, -1.61273193359375, -1.542755126953125, -1.4727783203125, -1.402801513671875, -1.33282470703125, -1.262847900390625, -1.19287109375, -1.122894287109375, -1.05291748046875, -0.982940673828125, -0.9129638671875, -0.842987060546875, -0.77301025390625, -0.703033447265625, -0.633056640625, -0.563079833984375, -0.49310302734375, -0.423126220703125, -0.3531494140625, -0.283172607421875, -0.21319580078125, -0.143218994140625, -0.0732421875, -0.003265380859375, 0.06671142578125, 0.136688232421875, 0.2066650390625, 0.276641845703125, 0.34661865234375, 0.416595458984375, 0.486572265625, 0.556549072265625, 0.62652587890625, 0.696502685546875, 0.7664794921875, 0.836456298828125, 0.90643310546875, 0.976409912109375, 1.04638671875, 1.116363525390625, 1.18634033203125, 1.256317138671875, 1.3262939453125, 1.396270751953125, 1.46624755859375, 1.536224365234375, 1.606201171875, 1.676177978515625, 1.74615478515625, 1.816131591796875, 1.8861083984375, 1.956085205078125, 2.02606201171875, 2.096038818359375, 2.166015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 5.0, 8.0, 11.0, 10.0, 15.0, 18.0, 14.0, 18.0, 30.0, 20.0, 36.0, 26.0, 34.0, 40.0, 49.0, 47.0, 59.0, 46.0, 57.0, 52.0, 52.0, 52.0, 49.0, 46.0, 29.0, 32.0, 24.0, 19.0, 23.0, 20.0, 10.0, 13.0, 7.0, 8.0, 9.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.162109375, -2.086944580078125, -2.01177978515625, -1.936614990234375, -1.8614501953125, -1.786285400390625, -1.71112060546875, -1.635955810546875, -1.560791015625, -1.485626220703125, -1.41046142578125, -1.335296630859375, -1.2601318359375, -1.184967041015625, -1.10980224609375, -1.034637451171875, -0.95947265625, -0.884307861328125, -0.80914306640625, -0.733978271484375, -0.6588134765625, -0.583648681640625, -0.50848388671875, -0.433319091796875, -0.358154296875, -0.282989501953125, -0.20782470703125, -0.132659912109375, -0.0574951171875, 0.017669677734375, 0.09283447265625, 0.167999267578125, 0.2431640625, 0.318328857421875, 0.39349365234375, 0.468658447265625, 0.5438232421875, 0.618988037109375, 0.69415283203125, 0.769317626953125, 0.844482421875, 0.919647216796875, 0.99481201171875, 1.069976806640625, 1.1451416015625, 1.220306396484375, 1.29547119140625, 1.370635986328125, 1.44580078125, 1.520965576171875, 1.59613037109375, 1.671295166015625, 1.7464599609375, 1.821624755859375, 1.89678955078125, 1.971954345703125, 2.047119140625, 2.122283935546875, 2.19744873046875, 2.272613525390625, 2.3477783203125, 2.422943115234375, 2.49810791015625, 2.573272705078125, 2.6484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 11.0, 6.0, 4.0, 9.0, 22.0, 33.0, 54.0, 84.0, 195.0, 392.0, 1119.0, 4001.0, 26140.0, 404726.0, 572790.0, 32325.0, 4476.0, 1196.0, 481.0, 206.0, 112.0, 60.0, 38.0, 27.0, 14.0, 14.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.423828125, -1.3853912353515625, -1.346954345703125, -1.3085174560546875, -1.27008056640625, -1.2316436767578125, -1.193206787109375, -1.1547698974609375, -1.1163330078125, -1.0778961181640625, -1.039459228515625, -1.0010223388671875, -0.96258544921875, -0.9241485595703125, -0.885711669921875, -0.8472747802734375, -0.808837890625, -0.7704010009765625, -0.731964111328125, -0.6935272216796875, -0.65509033203125, -0.6166534423828125, -0.578216552734375, -0.5397796630859375, -0.5013427734375, -0.4629058837890625, -0.424468994140625, -0.3860321044921875, -0.34759521484375, -0.3091583251953125, -0.270721435546875, -0.2322845458984375, -0.19384765625, -0.1554107666015625, -0.116973876953125, -0.0785369873046875, -0.04010009765625, -0.0016632080078125, 0.036773681640625, 0.0752105712890625, 0.1136474609375, 0.1520843505859375, 0.190521240234375, 0.2289581298828125, 0.26739501953125, 0.3058319091796875, 0.344268798828125, 0.3827056884765625, 0.421142578125, 0.4595794677734375, 0.498016357421875, 0.5364532470703125, 0.57489013671875, 0.6133270263671875, 0.651763916015625, 0.6902008056640625, 0.7286376953125, 0.7670745849609375, 0.805511474609375, 0.8439483642578125, 0.88238525390625, 0.9208221435546875, 0.959259033203125, 0.9976959228515625, 1.0361328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 3.0, 10.0, 11.0, 22.0, 20.0, 30.0, 38.0, 55.0, 74.0, 107.0, 147.0, 121.0, 99.0, 90.0, 49.0, 32.0, 23.0, 17.0, 11.0, 12.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024509429931640625, -0.00023714080452919006, -0.00022918730974197388, -0.0002212338149547577, -0.0002132803201675415, -0.00020532682538032532, -0.00019737333059310913, -0.00018941983580589294, -0.00018146634101867676, -0.00017351284623146057, -0.00016555935144424438, -0.0001576058566570282, -0.000149652361869812, -0.00014169886708259583, -0.00013374537229537964, -0.00012579187750816345, -0.00011783838272094727, -0.00010988488793373108, -0.00010193139314651489, -9.39778983592987e-05, -8.602440357208252e-05, -7.807090878486633e-05, -7.011741399765015e-05, -6.216391921043396e-05, -5.4210424423217773e-05, -4.625692963600159e-05, -3.83034348487854e-05, -3.0349940061569214e-05, -2.2396445274353027e-05, -1.444295048713684e-05, -6.489455699920654e-06, 1.4640390872955322e-06, 9.417533874511719e-06, 1.7371028661727905e-05, 2.5324523448944092e-05, 3.327801823616028e-05, 4.1231513023376465e-05, 4.918500781059265e-05, 5.713850259780884e-05, 6.509199738502502e-05, 7.304549217224121e-05, 8.09989869594574e-05, 8.895248174667358e-05, 9.690597653388977e-05, 0.00010485947132110596, 0.00011281296610832214, 0.00012076646089553833, 0.00012871995568275452, 0.0001366734504699707, 0.0001446269452571869, 0.00015258044004440308, 0.00016053393483161926, 0.00016848742961883545, 0.00017644092440605164, 0.00018439441919326782, 0.000192347913980484, 0.0002003014087677002, 0.00020825490355491638, 0.00021620839834213257, 0.00022416189312934875, 0.00023211538791656494, 0.00024006888270378113, 0.0002480223774909973, 0.0002559758722782135, 0.0002639293670654297]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 8.0, 8.0, 10.0, 11.0, 11.0, 26.0, 26.0, 43.0, 56.0, 105.0, 145.0, 225.0, 362.0, 857.0, 1769.0, 4940.0, 17177.0, 89947.0, 563272.0, 304078.0, 48503.0, 10607.0, 3419.0, 1382.0, 615.0, 383.0, 223.0, 123.0, 63.0, 59.0, 28.0, 26.0, 17.0, 12.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.76513671875, -0.7418289184570312, -0.7185211181640625, -0.6952133178710938, -0.671905517578125, -0.6485977172851562, -0.6252899169921875, -0.6019821166992188, -0.57867431640625, -0.5553665161132812, -0.5320587158203125, -0.5087509155273438, -0.485443115234375, -0.46213531494140625, -0.4388275146484375, -0.41551971435546875, -0.3922119140625, -0.36890411376953125, -0.3455963134765625, -0.32228851318359375, -0.298980712890625, -0.27567291259765625, -0.2523651123046875, -0.22905731201171875, -0.20574951171875, -0.18244171142578125, -0.1591339111328125, -0.13582611083984375, -0.112518310546875, -0.08921051025390625, -0.0659027099609375, -0.04259490966796875, -0.019287109375, 0.00402069091796875, 0.0273284912109375, 0.05063629150390625, 0.073944091796875, 0.09725189208984375, 0.1205596923828125, 0.14386749267578125, 0.16717529296875, 0.19048309326171875, 0.2137908935546875, 0.23709869384765625, 0.260406494140625, 0.28371429443359375, 0.3070220947265625, 0.33032989501953125, 0.3536376953125, 0.37694549560546875, 0.4002532958984375, 0.42356109619140625, 0.446868896484375, 0.47017669677734375, 0.4934844970703125, 0.5167922973632812, 0.54010009765625, 0.5634078979492188, 0.5867156982421875, 0.6100234985351562, 0.633331298828125, 0.6566390991210938, 0.6799468994140625, 0.7032546997070312, 0.7265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 8.0, 9.0, 8.0, 5.0, 10.0, 22.0, 20.0, 29.0, 33.0, 42.0, 42.0, 61.0, 63.0, 64.0, 81.0, 82.0, 75.0, 59.0, 62.0, 57.0, 51.0, 33.0, 18.0, 15.0, 14.0, 7.0, 11.0, 5.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.90380859375, -0.8791961669921875, -0.854583740234375, -0.8299713134765625, -0.80535888671875, -0.7807464599609375, -0.756134033203125, -0.7315216064453125, -0.7069091796875, -0.6822967529296875, -0.657684326171875, -0.6330718994140625, -0.60845947265625, -0.5838470458984375, -0.559234619140625, -0.5346221923828125, -0.510009765625, -0.4853973388671875, -0.460784912109375, -0.4361724853515625, -0.41156005859375, -0.3869476318359375, -0.362335205078125, -0.3377227783203125, -0.3131103515625, -0.2884979248046875, -0.263885498046875, -0.2392730712890625, -0.21466064453125, -0.1900482177734375, -0.165435791015625, -0.1408233642578125, -0.1162109375, -0.0915985107421875, -0.066986083984375, -0.0423736572265625, -0.01776123046875, 0.0068511962890625, 0.031463623046875, 0.0560760498046875, 0.0806884765625, 0.1053009033203125, 0.129913330078125, 0.1545257568359375, 0.17913818359375, 0.2037506103515625, 0.228363037109375, 0.2529754638671875, 0.277587890625, 0.3022003173828125, 0.326812744140625, 0.3514251708984375, 0.37603759765625, 0.4006500244140625, 0.425262451171875, 0.4498748779296875, 0.4744873046875, 0.4990997314453125, 0.523712158203125, 0.5483245849609375, 0.57293701171875, 0.5975494384765625, 0.622161865234375, 0.6467742919921875, 0.67138671875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 20.0, 28.0, 68.0, 89.0, 136.0, 210.0, 173.0, 121.0, 70.0, 35.0, 19.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.06265640258789, -23.512418746948242, -22.962181091308594, -22.411943435668945, -21.861705780029297, -21.311466217041016, -20.76123046875, -20.21099090576172, -19.66075325012207, -19.110515594482422, -18.560277938842773, -18.010040283203125, -17.459802627563477, -16.909564971923828, -16.359325408935547, -15.809088706970215, -15.258851051330566, -14.708613395690918, -14.15837574005127, -13.608137130737305, -13.057899475097656, -12.507661819458008, -11.95742416381836, -11.407186508178711, -10.856948852539062, -10.306711196899414, -9.756473541259766, -9.206235885620117, -8.655997276306152, -8.105759620666504, -7.5555219650268555, -7.005284309387207, -6.455045700073242, -5.904808044433594, -5.354569911956787, -4.804332256317139, -4.254094123840332, -3.7038564682006836, -3.153618812561035, -2.6033809185028076, -2.05314302444458, -1.5029051303863525, -0.9526673555374146, -0.40242958068847656, 0.14780831336975098, 0.6980462074279785, 1.248283863067627, 1.7985217571258545, 2.348759651184082, 2.8989975452423096, 3.449235439300537, 3.9994730949401855, 4.549711227416992, 5.099948883056641, 5.650186538696289, 6.2004241943359375, 6.750662326812744, 7.300899982452393, 7.851138114929199, 8.401375770568848, 8.951613426208496, 9.501852035522461, 10.05208969116211, 10.602327346801758, 11.152565002441406]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 5.0, 11.0, 8.0, 11.0, 9.0, 19.0, 18.0, 21.0, 20.0, 26.0, 33.0, 30.0, 28.0, 44.0, 49.0, 47.0, 60.0, 74.0, 71.0, 53.0, 49.0, 44.0, 31.0, 37.0, 29.0, 27.0, 24.0, 23.0, 18.0, 19.0, 16.0, 16.0, 3.0, 9.0, 9.0, 0.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.196157455444336, -8.872919082641602, -8.549680709838867, -8.226442337036133, -7.90320348739624, -7.579965114593506, -7.256726264953613, -6.933487892150879, -6.6102495193481445, -6.28701114654541, -5.963772773742676, -5.640533924102783, -5.317295551300049, -4.9940571784973145, -4.670818328857422, -4.3475799560546875, -4.024341583251953, -3.7011032104492188, -3.3778645992279053, -3.054625988006592, -2.7313876152038574, -2.408149242401123, -2.0849106311798096, -1.761672019958496, -1.4384336471557617, -1.1151951551437378, -0.7919566631317139, -0.46871817111968994, -0.14547967910766602, 0.1777588129043579, 0.5009973049163818, 0.8242359161376953, 1.1474733352661133, 1.4707118272781372, 1.7939503192901611, 2.1171889305114746, 2.440427303314209, 2.7636656761169434, 3.086904287338257, 3.4101428985595703, 3.7333812713623047, 4.056619644165039, 4.379858016967773, 4.703096866607666, 5.0263352394104, 5.349573612213135, 5.672812461853027, 5.996050834655762, 6.319289207458496, 6.6425275802612305, 6.965765953063965, 7.289004802703857, 7.612243175506592, 7.935481548309326, 8.258720397949219, 8.581958770751953, 8.905197143554688, 9.228435516357422, 9.551673889160156, 9.87491226196289, 10.198150634765625, 10.521389961242676, 10.84462833404541, 11.167866706848145, 11.491105079650879]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 10.0, 5.0, 8.0, 26.0, 20.0, 55.0, 67.0, 118.0, 207.0, 378.0, 685.0, 1303.0, 2768.0, 6139.0, 15233.0, 44501.0, 174596.0, 1136800.0, 2258958.0, 428667.0, 81422.0, 24579.0, 9544.0, 3986.0, 1906.0, 963.0, 517.0, 291.0, 177.0, 100.0, 80.0, 55.0, 25.0, 23.0, 15.0, 15.0, 9.0, 8.0, 8.0, 4.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6260528564453125, -0.602203369140625, -0.5783538818359375, -0.55450439453125, -0.5306549072265625, -0.506805419921875, -0.4829559326171875, -0.4591064453125, -0.4352569580078125, -0.411407470703125, -0.3875579833984375, -0.36370849609375, -0.3398590087890625, -0.316009521484375, -0.2921600341796875, -0.268310546875, -0.2444610595703125, -0.220611572265625, -0.1967620849609375, -0.17291259765625, -0.1490631103515625, -0.125213623046875, -0.1013641357421875, -0.0775146484375, -0.0536651611328125, -0.029815673828125, -0.0059661865234375, 0.01788330078125, 0.0417327880859375, 0.065582275390625, 0.0894317626953125, 0.11328125, 0.1371307373046875, 0.160980224609375, 0.1848297119140625, 0.20867919921875, 0.2325286865234375, 0.256378173828125, 0.2802276611328125, 0.3040771484375, 0.3279266357421875, 0.351776123046875, 0.3756256103515625, 0.39947509765625, 0.4233245849609375, 0.447174072265625, 0.4710235595703125, 0.494873046875, 0.5187225341796875, 0.542572021484375, 0.5664215087890625, 0.59027099609375, 0.6141204833984375, 0.637969970703125, 0.6618194580078125, 0.6856689453125, 0.7095184326171875, 0.733367919921875, 0.7572174072265625, 0.78106689453125, 0.8049163818359375, 0.828765869140625, 0.8526153564453125, 0.87646484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 7.0, 6.0, 10.0, 13.0, 9.0, 14.0, 15.0, 31.0, 21.0, 34.0, 51.0, 57.0, 40.0, 44.0, 48.0, 59.0, 53.0, 56.0, 44.0, 44.0, 43.0, 43.0, 46.0, 35.0, 32.0, 29.0, 22.0, 30.0, 17.0, 8.0, 12.0, 10.0, 7.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45458984375, -0.43566131591796875, -0.4167327880859375, -0.39780426025390625, -0.378875732421875, -0.35994720458984375, -0.3410186767578125, -0.32209014892578125, -0.30316162109375, -0.28423309326171875, -0.2653045654296875, -0.24637603759765625, -0.227447509765625, -0.20851898193359375, -0.1895904541015625, -0.17066192626953125, -0.1517333984375, -0.13280487060546875, -0.1138763427734375, -0.09494781494140625, -0.076019287109375, -0.05709075927734375, -0.0381622314453125, -0.01923370361328125, -0.00030517578125, 0.01862335205078125, 0.0375518798828125, 0.05648040771484375, 0.075408935546875, 0.09433746337890625, 0.1132659912109375, 0.13219451904296875, 0.151123046875, 0.17005157470703125, 0.1889801025390625, 0.20790863037109375, 0.226837158203125, 0.24576568603515625, 0.2646942138671875, 0.28362274169921875, 0.30255126953125, 0.32147979736328125, 0.3404083251953125, 0.35933685302734375, 0.378265380859375, 0.39719390869140625, 0.4161224365234375, 0.43505096435546875, 0.4539794921875, 0.47290802001953125, 0.4918365478515625, 0.5107650756835938, 0.529693603515625, 0.5486221313476562, 0.5675506591796875, 0.5864791870117188, 0.60540771484375, 0.6243362426757812, 0.6432647705078125, 0.6621932983398438, 0.681121826171875, 0.7000503540039062, 0.7189788818359375, 0.7379074096679688, 0.7568359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 9.0, 8.0, 16.0, 18.0, 27.0, 37.0, 47.0, 80.0, 80.0, 141.0, 227.0, 442.0, 815.0, 1861.0, 4743.0, 14322.0, 56069.0, 385028.0, 3277127.0, 375236.0, 55818.0, 14281.0, 4440.0, 1652.0, 722.0, 369.0, 217.0, 132.0, 87.0, 78.0, 39.0, 36.0, 19.0, 24.0, 9.0, 6.0, 3.0, 5.0, 8.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.244415283203125, -1.20074462890625, -1.157073974609375, -1.1134033203125, -1.069732666015625, -1.02606201171875, -0.982391357421875, -0.938720703125, -0.895050048828125, -0.85137939453125, -0.807708740234375, -0.7640380859375, -0.720367431640625, -0.67669677734375, -0.633026123046875, -0.58935546875, -0.545684814453125, -0.50201416015625, -0.458343505859375, -0.4146728515625, -0.371002197265625, -0.32733154296875, -0.283660888671875, -0.239990234375, -0.196319580078125, -0.15264892578125, -0.108978271484375, -0.0653076171875, -0.021636962890625, 0.02203369140625, 0.065704345703125, 0.109375, 0.153045654296875, 0.19671630859375, 0.240386962890625, 0.2840576171875, 0.327728271484375, 0.37139892578125, 0.415069580078125, 0.458740234375, 0.502410888671875, 0.54608154296875, 0.589752197265625, 0.6334228515625, 0.677093505859375, 0.72076416015625, 0.764434814453125, 0.80810546875, 0.851776123046875, 0.89544677734375, 0.939117431640625, 0.9827880859375, 1.026458740234375, 1.07012939453125, 1.113800048828125, 1.157470703125, 1.201141357421875, 1.24481201171875, 1.288482666015625, 1.3321533203125, 1.375823974609375, 1.41949462890625, 1.463165283203125, 1.5068359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 8.0, 3.0, 5.0, 4.0, 15.0, 12.0, 14.0, 24.0, 21.0, 29.0, 41.0, 68.0, 96.0, 155.0, 213.0, 409.0, 624.0, 750.0, 538.0, 377.0, 201.0, 119.0, 82.0, 58.0, 47.0, 43.0, 23.0, 16.0, 16.0, 11.0, 14.0, 7.0, 11.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.689453125, -1.64306640625, -1.5966796875, -1.55029296875, -1.50390625, -1.45751953125, -1.4111328125, -1.36474609375, -1.318359375, -1.27197265625, -1.2255859375, -1.17919921875, -1.1328125, -1.08642578125, -1.0400390625, -0.99365234375, -0.947265625, -0.90087890625, -0.8544921875, -0.80810546875, -0.76171875, -0.71533203125, -0.6689453125, -0.62255859375, -0.576171875, -0.52978515625, -0.4833984375, -0.43701171875, -0.390625, -0.34423828125, -0.2978515625, -0.25146484375, -0.205078125, -0.15869140625, -0.1123046875, -0.06591796875, -0.01953125, 0.02685546875, 0.0732421875, 0.11962890625, 0.166015625, 0.21240234375, 0.2587890625, 0.30517578125, 0.3515625, 0.39794921875, 0.4443359375, 0.49072265625, 0.537109375, 0.58349609375, 0.6298828125, 0.67626953125, 0.72265625, 0.76904296875, 0.8154296875, 0.86181640625, 0.908203125, 0.95458984375, 1.0009765625, 1.04736328125, 1.09375, 1.14013671875, 1.1865234375, 1.23291015625, 1.279296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 5.0, 12.0, 21.0, 28.0, 54.0, 100.0, 130.0, 182.0, 158.0, 113.0, 84.0, 41.0, 19.0, 15.0, 8.0, 5.0, 5.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.191397666931152, -12.758180618286133, -12.324963569641113, -11.891746520996094, -11.458529472351074, -11.025312423706055, -10.592095375061035, -10.158878326416016, -9.725661277770996, -9.292444229125977, -8.859227180480957, -8.426010131835938, -7.992793083190918, -7.559576034545898, -7.126358985900879, -6.693141937255859, -6.25992488861084, -5.82670783996582, -5.393490791320801, -4.960273742675781, -4.527056694030762, -4.093839645385742, -3.6606225967407227, -3.227405548095703, -2.7941884994506836, -2.360971450805664, -1.9277544021606445, -1.494537353515625, -1.0613203048706055, -0.6281032562255859, -0.1948862075805664, 0.23833084106445312, 0.6715478897094727, 1.1047649383544922, 1.5379819869995117, 1.9711990356445312, 2.404416084289551, 2.8376331329345703, 3.27085018157959, 3.7040672302246094, 4.137284278869629, 4.570501327514648, 5.003718376159668, 5.4369354248046875, 5.870152473449707, 6.303369522094727, 6.736586570739746, 7.169803619384766, 7.603020668029785, 8.036237716674805, 8.469454765319824, 8.902671813964844, 9.335888862609863, 9.769105911254883, 10.202322959899902, 10.635540008544922, 11.068757057189941, 11.501974105834961, 11.93519115447998, 12.368408203125, 12.80162525177002, 13.234842300415039, 13.668059349060059, 14.101276397705078, 14.534493446350098]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 13.0, 8.0, 7.0, 12.0, 10.0, 21.0, 17.0, 24.0, 28.0, 39.0, 38.0, 38.0, 38.0, 46.0, 38.0, 71.0, 58.0, 66.0, 47.0, 46.0, 44.0, 38.0, 35.0, 39.0, 30.0, 24.0, 24.0, 20.0, 15.0, 18.0, 15.0, 10.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.024250030517578, -8.745893478393555, -8.467537879943848, -8.189181327819824, -7.910825252532959, -7.632469177246094, -7.3541131019592285, -7.075757026672363, -6.79740047454834, -6.519044399261475, -6.240688323974609, -5.962331771850586, -5.683975696563721, -5.4056196212768555, -5.12726354598999, -4.848907470703125, -4.57055139541626, -4.2921953201293945, -4.013839244842529, -3.735482931137085, -3.4571266174316406, -3.1787705421447754, -2.90041446685791, -2.622058391571045, -2.3437020778656006, -2.0653460025787354, -1.786989688873291, -1.5086336135864258, -1.230277419090271, -0.9519212245941162, -0.673565149307251, -0.3952089548110962, -0.1168527603149414, 0.161503404378891, 0.4398595690727234, 0.7182157039642334, 0.9965718984603882, 1.274928092956543, 1.5532841682434082, 1.831640362739563, 2.1099965572357178, 2.388352632522583, 2.6667089462280273, 2.9450650215148926, 3.223421096801758, 3.501777410507202, 3.7801334857940674, 4.058489799499512, 4.336845874786377, 4.615201950073242, 4.893558025360107, 5.171914100646973, 5.450270652770996, 5.728626728057861, 6.006982803344727, 6.285338878631592, 6.563694953918457, 6.842051029205322, 7.1204071044921875, 7.398763656616211, 7.677119731903076, 7.955475807189941, 8.233831405639648, 8.512187957763672, 8.790544509887695]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 11.0, 8.0, 25.0, 37.0, 44.0, 62.0, 100.0, 163.0, 267.0, 453.0, 824.0, 1639.0, 3148.0, 6639.0, 13501.0, 28535.0, 59200.0, 115867.0, 198792.0, 242167.0, 179416.0, 100163.0, 50216.0, 24290.0, 11616.0, 5507.0, 2657.0, 1410.0, 731.0, 422.0, 222.0, 131.0, 92.0, 55.0, 45.0, 32.0, 19.0, 12.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6698760986328125, -0.645416259765625, -0.6209564208984375, -0.59649658203125, -0.5720367431640625, -0.547576904296875, -0.5231170654296875, -0.4986572265625, -0.4741973876953125, -0.449737548828125, -0.4252777099609375, -0.40081787109375, -0.3763580322265625, -0.351898193359375, -0.3274383544921875, -0.302978515625, -0.2785186767578125, -0.254058837890625, -0.2295989990234375, -0.20513916015625, -0.1806793212890625, -0.156219482421875, -0.1317596435546875, -0.1072998046875, -0.0828399658203125, -0.058380126953125, -0.0339202880859375, -0.00946044921875, 0.0149993896484375, 0.039459228515625, 0.0639190673828125, 0.08837890625, 0.1128387451171875, 0.137298583984375, 0.1617584228515625, 0.18621826171875, 0.2106781005859375, 0.235137939453125, 0.2595977783203125, 0.2840576171875, 0.3085174560546875, 0.332977294921875, 0.3574371337890625, 0.38189697265625, 0.4063568115234375, 0.430816650390625, 0.4552764892578125, 0.479736328125, 0.5041961669921875, 0.528656005859375, 0.5531158447265625, 0.57757568359375, 0.6020355224609375, 0.626495361328125, 0.6509552001953125, 0.6754150390625, 0.6998748779296875, 0.724334716796875, 0.7487945556640625, 0.77325439453125, 0.7977142333984375, 0.822174072265625, 0.8466339111328125, 0.87109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 5.0, 15.0, 10.0, 19.0, 18.0, 27.0, 32.0, 19.0, 51.0, 49.0, 41.0, 50.0, 47.0, 51.0, 50.0, 63.0, 45.0, 38.0, 48.0, 43.0, 37.0, 26.0, 36.0, 39.0, 18.0, 28.0, 11.0, 12.0, 6.0, 15.0, 10.0, 8.0, 12.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.524017333984375, -0.50604248046875, -0.488067626953125, -0.4700927734375, -0.452117919921875, -0.43414306640625, -0.416168212890625, -0.398193359375, -0.380218505859375, -0.36224365234375, -0.344268798828125, -0.3262939453125, -0.308319091796875, -0.29034423828125, -0.272369384765625, -0.25439453125, -0.236419677734375, -0.21844482421875, -0.200469970703125, -0.1824951171875, -0.164520263671875, -0.14654541015625, -0.128570556640625, -0.110595703125, -0.092620849609375, -0.07464599609375, -0.056671142578125, -0.0386962890625, -0.020721435546875, -0.00274658203125, 0.015228271484375, 0.033203125, 0.051177978515625, 0.06915283203125, 0.087127685546875, 0.1051025390625, 0.123077392578125, 0.14105224609375, 0.159027099609375, 0.177001953125, 0.194976806640625, 0.21295166015625, 0.230926513671875, 0.2489013671875, 0.266876220703125, 0.28485107421875, 0.302825927734375, 0.32080078125, 0.338775634765625, 0.35675048828125, 0.374725341796875, 0.3927001953125, 0.410675048828125, 0.42864990234375, 0.446624755859375, 0.464599609375, 0.482574462890625, 0.50054931640625, 0.518524169921875, 0.5364990234375, 0.554473876953125, 0.57244873046875, 0.590423583984375, 0.6083984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 7.0, 5.0, 12.0, 15.0, 22.0, 30.0, 42.0, 52.0, 71.0, 95.0, 160.0, 186.0, 280.0, 420.0, 653.0, 968.0, 1886.0, 4207.0, 13477.0, 69533.0, 512282.0, 364195.0, 59317.0, 12055.0, 3947.0, 1798.0, 955.0, 602.0, 353.0, 236.0, 223.0, 119.0, 100.0, 70.0, 38.0, 32.0, 24.0, 15.0, 13.0, 14.0, 12.0, 13.0, 4.0, 3.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.62890625, -1.5684814453125, -1.508056640625, -1.4476318359375, -1.38720703125, -1.3267822265625, -1.266357421875, -1.2059326171875, -1.1455078125, -1.0850830078125, -1.024658203125, -0.9642333984375, -0.90380859375, -0.8433837890625, -0.782958984375, -0.7225341796875, -0.662109375, -0.6016845703125, -0.541259765625, -0.4808349609375, -0.42041015625, -0.3599853515625, -0.299560546875, -0.2391357421875, -0.1787109375, -0.1182861328125, -0.057861328125, 0.0025634765625, 0.06298828125, 0.1234130859375, 0.183837890625, 0.2442626953125, 0.3046875, 0.3651123046875, 0.425537109375, 0.4859619140625, 0.54638671875, 0.6068115234375, 0.667236328125, 0.7276611328125, 0.7880859375, 0.8485107421875, 0.908935546875, 0.9693603515625, 1.02978515625, 1.0902099609375, 1.150634765625, 1.2110595703125, 1.271484375, 1.3319091796875, 1.392333984375, 1.4527587890625, 1.51318359375, 1.5736083984375, 1.634033203125, 1.6944580078125, 1.7548828125, 1.8153076171875, 1.875732421875, 1.9361572265625, 1.99658203125, 2.0570068359375, 2.117431640625, 2.1778564453125, 2.23828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 12.0, 11.0, 17.0, 14.0, 23.0, 26.0, 30.0, 29.0, 45.0, 58.0, 40.0, 57.0, 59.0, 51.0, 58.0, 51.0, 47.0, 64.0, 55.0, 47.0, 39.0, 33.0, 27.0, 21.0, 20.0, 18.0, 11.0, 8.0, 2.0, 6.0, 4.0, 4.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.968658447265625, -1.87677001953125, -1.784881591796875, -1.6929931640625, -1.601104736328125, -1.50921630859375, -1.417327880859375, -1.325439453125, -1.233551025390625, -1.14166259765625, -1.049774169921875, -0.9578857421875, -0.865997314453125, -0.77410888671875, -0.682220458984375, -0.59033203125, -0.498443603515625, -0.40655517578125, -0.314666748046875, -0.2227783203125, -0.130889892578125, -0.03900146484375, 0.052886962890625, 0.144775390625, 0.236663818359375, 0.32855224609375, 0.420440673828125, 0.5123291015625, 0.604217529296875, 0.69610595703125, 0.787994384765625, 0.8798828125, 0.971771240234375, 1.06365966796875, 1.155548095703125, 1.2474365234375, 1.339324951171875, 1.43121337890625, 1.523101806640625, 1.614990234375, 1.706878662109375, 1.79876708984375, 1.890655517578125, 1.9825439453125, 2.074432373046875, 2.16632080078125, 2.258209228515625, 2.35009765625, 2.441986083984375, 2.53387451171875, 2.625762939453125, 2.7176513671875, 2.809539794921875, 2.90142822265625, 2.993316650390625, 3.085205078125, 3.177093505859375, 3.26898193359375, 3.360870361328125, 3.4527587890625, 3.544647216796875, 3.63653564453125, 3.728424072265625, 3.8203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 19.0, 35.0, 59.0, 83.0, 141.0, 293.0, 473.0, 1036.0, 2098.0, 4999.0, 15111.0, 139286.0, 840623.0, 30437.0, 7827.0, 3065.0, 1407.0, 717.0, 345.0, 215.0, 117.0, 72.0, 37.0, 24.0, 13.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.81640625, -1.756317138671875, -1.69622802734375, -1.636138916015625, -1.5760498046875, -1.515960693359375, -1.45587158203125, -1.395782470703125, -1.335693359375, -1.275604248046875, -1.21551513671875, -1.155426025390625, -1.0953369140625, -1.035247802734375, -0.97515869140625, -0.915069580078125, -0.85498046875, -0.794891357421875, -0.73480224609375, -0.674713134765625, -0.6146240234375, -0.554534912109375, -0.49444580078125, -0.434356689453125, -0.374267578125, -0.314178466796875, -0.25408935546875, -0.194000244140625, -0.1339111328125, -0.073822021484375, -0.01373291015625, 0.046356201171875, 0.1064453125, 0.166534423828125, 0.22662353515625, 0.286712646484375, 0.3468017578125, 0.406890869140625, 0.46697998046875, 0.527069091796875, 0.587158203125, 0.647247314453125, 0.70733642578125, 0.767425537109375, 0.8275146484375, 0.887603759765625, 0.94769287109375, 1.007781982421875, 1.06787109375, 1.127960205078125, 1.18804931640625, 1.248138427734375, 1.3082275390625, 1.368316650390625, 1.42840576171875, 1.488494873046875, 1.548583984375, 1.608673095703125, 1.66876220703125, 1.728851318359375, 1.7889404296875, 1.849029541015625, 1.90911865234375, 1.969207763671875, 2.029296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 14.0, 22.0, 94.0, 440.0, 325.0, 40.0, 21.0, 15.0, 8.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014066696166992188, -0.001362532377243042, -0.0013183951377868652, -0.0012742578983306885, -0.0012301206588745117, -0.001185983419418335, -0.0011418461799621582, -0.0010977089405059814, -0.0010535717010498047, -0.001009434461593628, -0.0009652972221374512, -0.0009211599826812744, -0.0008770227432250977, -0.0008328855037689209, -0.0007887482643127441, -0.0007446110248565674, -0.0007004737854003906, -0.0006563365459442139, -0.0006121993064880371, -0.0005680620670318604, -0.0005239248275756836, -0.00047978758811950684, -0.0004356503486633301, -0.0003915131092071533, -0.00034737586975097656, -0.0003032386302947998, -0.00025910139083862305, -0.0002149641513824463, -0.00017082691192626953, -0.00012668967247009277, -8.255243301391602e-05, -3.841519355773926e-05, 5.7220458984375e-06, 4.985928535461426e-05, 9.399652481079102e-05, 0.00013813376426696777, 0.00018227100372314453, 0.0002264082431793213, 0.00027054548263549805, 0.0003146827220916748, 0.00035881996154785156, 0.0004029572010040283, 0.0004470944404602051, 0.0004912316799163818, 0.0005353689193725586, 0.0005795061588287354, 0.0006236433982849121, 0.0006677806377410889, 0.0007119178771972656, 0.0007560551166534424, 0.0008001923561096191, 0.0008443295955657959, 0.0008884668350219727, 0.0009326040744781494, 0.0009767413139343262, 0.001020878553390503, 0.0010650157928466797, 0.0011091530323028564, 0.0011532902717590332, 0.00119742751121521, 0.0012415647506713867, 0.0012857019901275635, 0.0013298392295837402, 0.001373976469039917, 0.0014181137084960938]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 2.0, 11.0, 10.0, 13.0, 19.0, 23.0, 36.0, 82.0, 99.0, 166.0, 251.0, 465.0, 856.0, 1601.0, 3260.0, 7605.0, 21834.0, 235502.0, 726519.0, 31927.0, 9853.0, 4098.0, 1870.0, 1001.0, 565.0, 315.0, 177.0, 125.0, 70.0, 68.0, 36.0, 34.0, 13.0, 13.0, 9.0, 7.0, 4.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.529296875, -1.4844970703125, -1.439697265625, -1.3948974609375, -1.35009765625, -1.3052978515625, -1.260498046875, -1.2156982421875, -1.1708984375, -1.1260986328125, -1.081298828125, -1.0364990234375, -0.99169921875, -0.9468994140625, -0.902099609375, -0.8572998046875, -0.8125, -0.7677001953125, -0.722900390625, -0.6781005859375, -0.63330078125, -0.5885009765625, -0.543701171875, -0.4989013671875, -0.4541015625, -0.4093017578125, -0.364501953125, -0.3197021484375, -0.27490234375, -0.2301025390625, -0.185302734375, -0.1405029296875, -0.095703125, -0.0509033203125, -0.006103515625, 0.0386962890625, 0.08349609375, 0.1282958984375, 0.173095703125, 0.2178955078125, 0.2626953125, 0.3074951171875, 0.352294921875, 0.3970947265625, 0.44189453125, 0.4866943359375, 0.531494140625, 0.5762939453125, 0.62109375, 0.6658935546875, 0.710693359375, 0.7554931640625, 0.80029296875, 0.8450927734375, 0.889892578125, 0.9346923828125, 0.9794921875, 1.0242919921875, 1.069091796875, 1.1138916015625, 1.15869140625, 1.2034912109375, 1.248291015625, 1.2930908203125, 1.337890625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 9.0, 6.0, 10.0, 14.0, 20.0, 25.0, 38.0, 35.0, 57.0, 85.0, 100.0, 117.0, 109.0, 101.0, 65.0, 41.0, 37.0, 32.0, 16.0, 17.0, 9.0, 12.0, 4.0, 4.0, 5.0, 7.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2783203125, -1.2392730712890625, -1.200225830078125, -1.1611785888671875, -1.12213134765625, -1.0830841064453125, -1.044036865234375, -1.0049896240234375, -0.9659423828125, -0.9268951416015625, -0.887847900390625, -0.8488006591796875, -0.80975341796875, -0.7707061767578125, -0.731658935546875, -0.6926116943359375, -0.653564453125, -0.6145172119140625, -0.575469970703125, -0.5364227294921875, -0.49737548828125, -0.4583282470703125, -0.419281005859375, -0.3802337646484375, -0.3411865234375, -0.3021392822265625, -0.263092041015625, -0.2240447998046875, -0.18499755859375, -0.1459503173828125, -0.106903076171875, -0.0678558349609375, -0.02880859375, 0.0102386474609375, 0.049285888671875, 0.0883331298828125, 0.12738037109375, 0.1664276123046875, 0.205474853515625, 0.2445220947265625, 0.2835693359375, 0.3226165771484375, 0.361663818359375, 0.4007110595703125, 0.43975830078125, 0.4788055419921875, 0.517852783203125, 0.5569000244140625, 0.595947265625, 0.6349945068359375, 0.674041748046875, 0.7130889892578125, 0.75213623046875, 0.7911834716796875, 0.830230712890625, 0.8692779541015625, 0.9083251953125, 0.9473724365234375, 0.986419677734375, 1.0254669189453125, 1.06451416015625, 1.1035614013671875, 1.142608642578125, 1.1816558837890625, 1.220703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 9.0, 6.0, 10.0, 19.0, 24.0, 37.0, 44.0, 71.0, 107.0, 223.0, 183.0, 107.0, 72.0, 35.0, 13.0, 14.0, 5.0, 7.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.703315734863281, -14.059226036071777, -13.41513729095459, -12.771047592163086, -12.126957893371582, -11.482868194580078, -10.83877944946289, -10.194689750671387, -9.550600051879883, -8.906510353088379, -8.262421607971191, -7.6183319091796875, -6.974242210388184, -6.330152988433838, -5.686063766479492, -5.041974067687988, -4.397885322570801, -3.753795862197876, -3.109706401824951, -2.4656171798706055, -1.8215277194976807, -1.1774382591247559, -0.5333490371704102, 0.11074066162109375, 0.7548298835754395, 1.3989193439483643, 2.043008804321289, 2.6870980262756348, 3.3311874866485596, 3.9752769470214844, 4.61936616897583, 5.263455867767334, 5.90754508972168, 6.551634311676025, 7.195724010467529, 7.839813232421875, 8.483902931213379, 9.127992630004883, 9.77208137512207, 10.416171073913574, 11.060260772705078, 11.704350471496582, 12.34843921661377, 12.992528915405273, 13.636618614196777, 14.280708312988281, 14.924797058105469, 15.568886756896973, 16.212974548339844, 16.85706329345703, 17.50115394592285, 18.14524269104004, 18.789331436157227, 19.433422088623047, 20.077510833740234, 20.721599578857422, 21.365690231323242, 22.00977897644043, 22.65386962890625, 23.297958374023438, 23.942047119140625, 24.586137771606445, 25.230226516723633, 25.874317169189453, 26.51840591430664]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 3.0, 4.0, 9.0, 17.0, 11.0, 23.0, 20.0, 27.0, 31.0, 35.0, 34.0, 37.0, 50.0, 56.0, 72.0, 79.0, 80.0, 48.0, 52.0, 39.0, 33.0, 33.0, 33.0, 28.0, 27.0, 20.0, 19.0, 9.0, 10.0, 11.0, 12.0, 7.0, 4.0, 3.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.255025863647461, -13.868809700012207, -13.482592582702637, -13.096376419067383, -12.710159301757812, -12.323943138122559, -11.937726974487305, -11.551509857177734, -11.16529369354248, -10.779077529907227, -10.392860412597656, -10.006644248962402, -9.620427131652832, -9.234210968017578, -8.847993850708008, -8.461777687072754, -8.0755615234375, -7.689344882965088, -7.303128242492676, -6.916912078857422, -6.53069543838501, -6.144478797912598, -5.7582621574401855, -5.372045516967773, -4.985828399658203, -4.599611759185791, -4.213395118713379, -3.827178716659546, -3.440962314605713, -3.054745674133301, -2.6685290336608887, -2.2823126316070557, -1.8960962295532227, -1.5098797082901, -1.1236631870269775, -0.7374465465545654, -0.35123002529144287, 0.03498649597167969, 0.4212031364440918, 0.8074195384979248, 1.193636178970337, 1.5798527002334595, 1.966069221496582, 2.352285861968994, 2.7385025024414062, 3.1247189044952393, 3.5109355449676514, 3.8971519470214844, 4.2833685874938965, 4.669585227966309, 5.055801868438721, 5.442018508911133, 5.828234672546387, 6.214451313018799, 6.600667953491211, 6.986884117126465, 7.373101234436035, 7.759317874908447, 8.14553451538086, 8.531750679016113, 8.917967796325684, 9.304183959960938, 9.690401077270508, 10.076617240905762, 10.462833404541016]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 14.0, 11.0, 15.0, 27.0, 39.0, 35.0, 54.0, 86.0, 98.0, 189.0, 452.0, 1372.0, 7601.0, 72853.0, 2176094.0, 1859394.0, 64413.0, 8054.0, 2032.0, 745.0, 273.0, 131.0, 75.0, 56.0, 21.0, 27.0, 20.0, 29.0, 5.0, 11.0, 6.0, 11.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.546875, -1.495269775390625, -1.44366455078125, -1.392059326171875, -1.3404541015625, -1.288848876953125, -1.23724365234375, -1.185638427734375, -1.134033203125, -1.082427978515625, -1.03082275390625, -0.979217529296875, -0.9276123046875, -0.876007080078125, -0.82440185546875, -0.772796630859375, -0.72119140625, -0.669586181640625, -0.61798095703125, -0.566375732421875, -0.5147705078125, -0.463165283203125, -0.41156005859375, -0.359954833984375, -0.308349609375, -0.256744384765625, -0.20513916015625, -0.153533935546875, -0.1019287109375, -0.050323486328125, 0.00128173828125, 0.052886962890625, 0.1044921875, 0.156097412109375, 0.20770263671875, 0.259307861328125, 0.3109130859375, 0.362518310546875, 0.41412353515625, 0.465728759765625, 0.517333984375, 0.568939208984375, 0.62054443359375, 0.672149658203125, 0.7237548828125, 0.775360107421875, 0.82696533203125, 0.878570556640625, 0.93017578125, 0.981781005859375, 1.03338623046875, 1.084991455078125, 1.1365966796875, 1.188201904296875, 1.23980712890625, 1.291412353515625, 1.343017578125, 1.394622802734375, 1.44622802734375, 1.497833251953125, 1.5494384765625, 1.601043701171875, 1.65264892578125, 1.704254150390625, 1.755859375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 12.0, 22.0, 37.0, 64.0, 74.0, 133.0, 120.0, 140.0, 121.0, 106.0, 63.0, 41.0, 35.0, 17.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.376953125, -2.3304977416992188, -2.2840423583984375, -2.2375869750976562, -2.191131591796875, -2.1446762084960938, -2.0982208251953125, -2.0517654418945312, -2.00531005859375, -1.9588546752929688, -1.9123992919921875, -1.8659439086914062, -1.819488525390625, -1.7730331420898438, -1.7265777587890625, -1.6801223754882812, -1.6336669921875, -1.5872116088867188, -1.5407562255859375, -1.4943008422851562, -1.447845458984375, -1.4013900756835938, -1.3549346923828125, -1.3084793090820312, -1.26202392578125, -1.2155685424804688, -1.1691131591796875, -1.1226577758789062, -1.076202392578125, -1.0297470092773438, -0.9832916259765625, -0.9368362426757812, -0.890380859375, -0.8439254760742188, -0.7974700927734375, -0.7510147094726562, -0.704559326171875, -0.6581039428710938, -0.6116485595703125, -0.5651931762695312, -0.51873779296875, -0.47228240966796875, -0.4258270263671875, -0.37937164306640625, -0.332916259765625, -0.28646087646484375, -0.2400054931640625, -0.19355010986328125, -0.1470947265625, -0.10063934326171875, -0.0541839599609375, -0.00772857666015625, 0.038726806640625, 0.08518218994140625, 0.1316375732421875, 0.17809295654296875, 0.22454833984375, 0.27100372314453125, 0.3174591064453125, 0.36391448974609375, 0.410369873046875, 0.45682525634765625, 0.5032806396484375, 0.5497360229492188, 0.59619140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 16.0, 22.0, 33.0, 48.0, 80.0, 124.0, 177.0, 281.0, 636.0, 2786.0, 36136.0, 3736828.0, 403534.0, 11165.0, 1573.0, 450.0, 191.0, 90.0, 42.0, 27.0, 13.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.205078125, -3.097442626953125, -2.98980712890625, -2.882171630859375, -2.7745361328125, -2.666900634765625, -2.55926513671875, -2.451629638671875, -2.343994140625, -2.236358642578125, -2.12872314453125, -2.021087646484375, -1.9134521484375, -1.805816650390625, -1.69818115234375, -1.590545654296875, -1.48291015625, -1.375274658203125, -1.26763916015625, -1.160003662109375, -1.0523681640625, -0.944732666015625, -0.83709716796875, -0.729461669921875, -0.621826171875, -0.514190673828125, -0.40655517578125, -0.298919677734375, -0.1912841796875, -0.083648681640625, 0.02398681640625, 0.131622314453125, 0.2392578125, 0.346893310546875, 0.45452880859375, 0.562164306640625, 0.6697998046875, 0.777435302734375, 0.88507080078125, 0.992706298828125, 1.100341796875, 1.207977294921875, 1.31561279296875, 1.423248291015625, 1.5308837890625, 1.638519287109375, 1.74615478515625, 1.853790283203125, 1.96142578125, 2.069061279296875, 2.17669677734375, 2.284332275390625, 2.3919677734375, 2.499603271484375, 2.60723876953125, 2.714874267578125, 2.822509765625, 2.930145263671875, 3.03778076171875, 3.145416259765625, 3.2530517578125, 3.360687255859375, 3.46832275390625, 3.575958251953125, 3.68359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 15.0, 12.0, 12.0, 29.0, 68.0, 134.0, 346.0, 932.0, 1314.0, 693.0, 243.0, 123.0, 74.0, 36.0, 16.0, 10.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.39453125, -4.2976226806640625, -4.200714111328125, -4.1038055419921875, -4.00689697265625, -3.9099884033203125, -3.813079833984375, -3.7161712646484375, -3.6192626953125, -3.5223541259765625, -3.425445556640625, -3.3285369873046875, -3.23162841796875, -3.1347198486328125, -3.037811279296875, -2.9409027099609375, -2.843994140625, -2.7470855712890625, -2.650177001953125, -2.5532684326171875, -2.45635986328125, -2.3594512939453125, -2.262542724609375, -2.1656341552734375, -2.0687255859375, -1.9718170166015625, -1.874908447265625, -1.7779998779296875, -1.68109130859375, -1.5841827392578125, -1.487274169921875, -1.3903656005859375, -1.29345703125, -1.1965484619140625, -1.099639892578125, -1.0027313232421875, -0.90582275390625, -0.8089141845703125, -0.712005615234375, -0.6150970458984375, -0.5181884765625, -0.4212799072265625, -0.324371337890625, -0.2274627685546875, -0.13055419921875, -0.0336456298828125, 0.063262939453125, 0.1601715087890625, 0.257080078125, 0.3539886474609375, 0.450897216796875, 0.5478057861328125, 0.64471435546875, 0.7416229248046875, 0.838531494140625, 0.9354400634765625, 1.0323486328125, 1.1292572021484375, 1.226165771484375, 1.3230743408203125, 1.41998291015625, 1.5168914794921875, 1.613800048828125, 1.7107086181640625, 1.8076171875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 10.0, 13.0, 18.0, 49.0, 81.0, 131.0, 183.0, 198.0, 146.0, 93.0, 27.0, 15.0, 11.0, 5.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.392019271850586, -15.848381042480469, -15.304742813110352, -14.761104583740234, -14.217467308044434, -13.673829078674316, -13.1301908493042, -12.586552619934082, -12.042915344238281, -11.499277114868164, -10.955638885498047, -10.41200065612793, -9.868363380432129, -9.324725151062012, -8.781086921691895, -8.237448692321777, -7.69381046295166, -7.150172233581543, -6.606534481048584, -6.062896251678467, -5.519258499145508, -4.975620269775391, -4.431982040405273, -3.8883440494537354, -3.3447060585021973, -2.801068067550659, -2.257430076599121, -1.713791847229004, -1.1701538562774658, -0.6265158653259277, -0.08287763595581055, 0.46076035499572754, 1.0043983459472656, 1.5480363368988037, 2.091674327850342, 2.635312557220459, 3.178950548171997, 3.722588539123535, 4.266226768493652, 4.8098649978637695, 5.3535027503967285, 5.897140979766846, 6.440778732299805, 6.984416961669922, 7.528055191040039, 8.071693420410156, 8.615331649780273, 9.158968925476074, 9.702607154846191, 10.246245384216309, 10.789883613586426, 11.333520889282227, 11.877159118652344, 12.420797348022461, 12.964435577392578, 13.508073806762695, 14.051712036132812, 14.59535026550293, 15.138988494873047, 15.682626724243164, 16.22626495361328, 16.769901275634766, 17.313541412353516, 17.857177734375, 18.400815963745117]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 3.0, 11.0, 15.0, 15.0, 20.0, 27.0, 30.0, 47.0, 52.0, 59.0, 67.0, 70.0, 73.0, 75.0, 72.0, 87.0, 66.0, 49.0, 38.0, 39.0, 27.0, 16.0, 14.0, 6.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.370281219482422, -9.933174133300781, -9.496066093444824, -9.058959007263184, -8.621851921081543, -8.184743881225586, -7.747636795043945, -7.310529708862305, -6.873422145843506, -6.436314582824707, -5.999207496643066, -5.562099933624268, -5.124992370605469, -4.687885284423828, -4.250777721405029, -3.8136703968048096, -3.37656307220459, -2.93945574760437, -2.5023484230041504, -2.0652408599853516, -1.6281335353851318, -1.191026210784912, -0.7539186477661133, -0.31681132316589355, 0.12029600143432617, 0.5574033856391907, 0.9945107698440552, 1.4316182136535645, 1.8687255382537842, 2.305832862854004, 2.7429404258728027, 3.1800477504730225, 3.617155075073242, 4.054262638092041, 4.491369724273682, 4.9284772872924805, 5.365584373474121, 5.80269193649292, 6.239799499511719, 6.676906585693359, 7.114014148712158, 7.551121711730957, 7.988228797912598, 8.425336837768555, 8.862443923950195, 9.299551010131836, 9.736658096313477, 10.173766136169434, 10.610873222351074, 11.047980308532715, 11.485088348388672, 11.922195434570312, 12.359302520751953, 12.796409606933594, 13.23351764678955, 13.670624732971191, 14.107732772827148, 14.544839859008789, 14.981947898864746, 15.419054985046387, 15.856162071228027, 16.293270111083984, 16.730377197265625, 17.167484283447266, 17.604591369628906]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 13.0, 17.0, 31.0, 39.0, 73.0, 88.0, 123.0, 212.0, 294.0, 469.0, 761.0, 1185.0, 1915.0, 2948.0, 5029.0, 8687.0, 15109.0, 26355.0, 47191.0, 83182.0, 143071.0, 206311.0, 198500.0, 131061.0, 75399.0, 42442.0, 24242.0, 13709.0, 7799.0, 4687.0, 2801.0, 1755.0, 1121.0, 675.0, 423.0, 279.0, 181.0, 125.0, 76.0, 51.0, 46.0, 26.0, 7.0, 8.0, 8.0, 9.0, 4.0, 6.0, 1.0, 2.0], "bins": [-0.822265625, -0.7993698120117188, -0.7764739990234375, -0.7535781860351562, -0.730682373046875, -0.7077865600585938, -0.6848907470703125, -0.6619949340820312, -0.63909912109375, -0.6162033081054688, -0.5933074951171875, -0.5704116821289062, -0.547515869140625, -0.5246200561523438, -0.5017242431640625, -0.47882843017578125, -0.4559326171875, -0.43303680419921875, -0.4101409912109375, -0.38724517822265625, -0.364349365234375, -0.34145355224609375, -0.3185577392578125, -0.29566192626953125, -0.27276611328125, -0.24987030029296875, -0.2269744873046875, -0.20407867431640625, -0.181182861328125, -0.15828704833984375, -0.1353912353515625, -0.11249542236328125, -0.089599609375, -0.06670379638671875, -0.0438079833984375, -0.02091217041015625, 0.001983642578125, 0.02487945556640625, 0.0477752685546875, 0.07067108154296875, 0.09356689453125, 0.11646270751953125, 0.1393585205078125, 0.16225433349609375, 0.185150146484375, 0.20804595947265625, 0.2309417724609375, 0.25383758544921875, 0.2767333984375, 0.29962921142578125, 0.3225250244140625, 0.34542083740234375, 0.368316650390625, 0.39121246337890625, 0.4141082763671875, 0.43700408935546875, 0.45989990234375, 0.48279571533203125, 0.5056915283203125, 0.5285873413085938, 0.551483154296875, 0.5743789672851562, 0.5972747802734375, 0.6201705932617188, 0.64306640625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 4.0, 6.0, 1.0, 5.0, 8.0, 8.0, 12.0, 12.0, 19.0, 16.0, 17.0, 16.0, 30.0, 26.0, 30.0, 30.0, 30.0, 51.0, 52.0, 56.0, 53.0, 32.0, 53.0, 46.0, 62.0, 36.0, 47.0, 25.0, 35.0, 21.0, 22.0, 25.0, 22.0, 13.0, 13.0, 9.0, 6.0, 9.0, 5.0, 9.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.6796875, -0.6604156494140625, -0.641143798828125, -0.6218719482421875, -0.60260009765625, -0.5833282470703125, -0.564056396484375, -0.5447845458984375, -0.5255126953125, -0.5062408447265625, -0.486968994140625, -0.4676971435546875, -0.44842529296875, -0.4291534423828125, -0.409881591796875, -0.3906097412109375, -0.371337890625, -0.3520660400390625, -0.332794189453125, -0.3135223388671875, -0.29425048828125, -0.2749786376953125, -0.255706787109375, -0.2364349365234375, -0.2171630859375, -0.1978912353515625, -0.178619384765625, -0.1593475341796875, -0.14007568359375, -0.1208038330078125, -0.101531982421875, -0.0822601318359375, -0.06298828125, -0.0437164306640625, -0.024444580078125, -0.0051727294921875, 0.01409912109375, 0.0333709716796875, 0.052642822265625, 0.0719146728515625, 0.0911865234375, 0.1104583740234375, 0.129730224609375, 0.1490020751953125, 0.16827392578125, 0.1875457763671875, 0.206817626953125, 0.2260894775390625, 0.245361328125, 0.2646331787109375, 0.283905029296875, 0.3031768798828125, 0.32244873046875, 0.3417205810546875, 0.360992431640625, 0.3802642822265625, 0.3995361328125, 0.4188079833984375, 0.438079833984375, 0.4573516845703125, 0.47662353515625, 0.4958953857421875, 0.515167236328125, 0.5344390869140625, 0.5537109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 8.0, 9.0, 22.0, 29.0, 36.0, 55.0, 89.0, 141.0, 207.0, 311.0, 541.0, 1067.0, 2110.0, 6461.0, 35481.0, 379485.0, 569003.0, 41540.0, 7012.0, 2282.0, 1072.0, 581.0, 379.0, 196.0, 136.0, 79.0, 65.0, 51.0, 26.0, 21.0, 19.0, 6.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.670379638671875, -2.57513427734375, -2.479888916015625, -2.3846435546875, -2.289398193359375, -2.19415283203125, -2.098907470703125, -2.003662109375, -1.908416748046875, -1.81317138671875, -1.717926025390625, -1.6226806640625, -1.527435302734375, -1.43218994140625, -1.336944580078125, -1.24169921875, -1.146453857421875, -1.05120849609375, -0.955963134765625, -0.8607177734375, -0.765472412109375, -0.67022705078125, -0.574981689453125, -0.479736328125, -0.384490966796875, -0.28924560546875, -0.194000244140625, -0.0987548828125, -0.003509521484375, 0.09173583984375, 0.186981201171875, 0.2822265625, 0.377471923828125, 0.47271728515625, 0.567962646484375, 0.6632080078125, 0.758453369140625, 0.85369873046875, 0.948944091796875, 1.044189453125, 1.139434814453125, 1.23468017578125, 1.329925537109375, 1.4251708984375, 1.520416259765625, 1.61566162109375, 1.710906982421875, 1.80615234375, 1.901397705078125, 1.99664306640625, 2.091888427734375, 2.1871337890625, 2.282379150390625, 2.37762451171875, 2.472869873046875, 2.568115234375, 2.663360595703125, 2.75860595703125, 2.853851318359375, 2.9490966796875, 3.044342041015625, 3.13958740234375, 3.234832763671875, 3.330078125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 14.0, 13.0, 15.0, 7.0, 14.0, 22.0, 20.0, 28.0, 29.0, 28.0, 34.0, 39.0, 42.0, 60.0, 44.0, 56.0, 63.0, 43.0, 67.0, 57.0, 32.0, 30.0, 43.0, 32.0, 31.0, 22.0, 17.0, 22.0, 18.0, 7.0, 12.0, 9.0, 2.0, 4.0, 3.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.673828125, -3.57470703125, -3.4755859375, -3.37646484375, -3.27734375, -3.17822265625, -3.0791015625, -2.97998046875, -2.880859375, -2.78173828125, -2.6826171875, -2.58349609375, -2.484375, -2.38525390625, -2.2861328125, -2.18701171875, -2.087890625, -1.98876953125, -1.8896484375, -1.79052734375, -1.69140625, -1.59228515625, -1.4931640625, -1.39404296875, -1.294921875, -1.19580078125, -1.0966796875, -0.99755859375, -0.8984375, -0.79931640625, -0.7001953125, -0.60107421875, -0.501953125, -0.40283203125, -0.3037109375, -0.20458984375, -0.10546875, -0.00634765625, 0.0927734375, 0.19189453125, 0.291015625, 0.39013671875, 0.4892578125, 0.58837890625, 0.6875, 0.78662109375, 0.8857421875, 0.98486328125, 1.083984375, 1.18310546875, 1.2822265625, 1.38134765625, 1.48046875, 1.57958984375, 1.6787109375, 1.77783203125, 1.876953125, 1.97607421875, 2.0751953125, 2.17431640625, 2.2734375, 2.37255859375, 2.4716796875, 2.57080078125, 2.669921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 10.0, 12.0, 17.0, 44.0, 50.0, 99.0, 188.0, 440.0, 1219.0, 4560.0, 32037.0, 883045.0, 114669.0, 8966.0, 1982.0, 619.0, 274.0, 120.0, 74.0, 38.0, 29.0, 8.0, 16.0, 8.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5595703125, -1.4988861083984375, -1.438201904296875, -1.3775177001953125, -1.31683349609375, -1.2561492919921875, -1.195465087890625, -1.1347808837890625, -1.0740966796875, -1.0134124755859375, -0.952728271484375, -0.8920440673828125, -0.83135986328125, -0.7706756591796875, -0.709991455078125, -0.6493072509765625, -0.588623046875, -0.5279388427734375, -0.467254638671875, -0.4065704345703125, -0.34588623046875, -0.2852020263671875, -0.224517822265625, -0.1638336181640625, -0.1031494140625, -0.0424652099609375, 0.018218994140625, 0.0789031982421875, 0.13958740234375, 0.2002716064453125, 0.260955810546875, 0.3216400146484375, 0.38232421875, 0.4430084228515625, 0.503692626953125, 0.5643768310546875, 0.62506103515625, 0.6857452392578125, 0.746429443359375, 0.8071136474609375, 0.8677978515625, 0.9284820556640625, 0.989166259765625, 1.0498504638671875, 1.11053466796875, 1.1712188720703125, 1.231903076171875, 1.2925872802734375, 1.353271484375, 1.4139556884765625, 1.474639892578125, 1.5353240966796875, 1.59600830078125, 1.6566925048828125, 1.717376708984375, 1.7780609130859375, 1.8387451171875, 1.8994293212890625, 1.960113525390625, 2.0207977294921875, 2.08148193359375, 2.1421661376953125, 2.202850341796875, 2.2635345458984375, 2.32421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 7.0, 11.0, 26.0, 41.0, 97.0, 170.0, 260.0, 166.0, 113.0, 47.0, 22.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005397796630859375, -0.0005214959383010864, -0.0005032122135162354, -0.0004849284887313843, -0.0004666447639465332, -0.00044836103916168213, -0.00043007731437683105, -0.00041179358959198, -0.0003935098648071289, -0.00037522614002227783, -0.00035694241523742676, -0.0003386586904525757, -0.0003203749656677246, -0.00030209124088287354, -0.00028380751609802246, -0.0002655237913131714, -0.0002472400665283203, -0.00022895634174346924, -0.00021067261695861816, -0.0001923888921737671, -0.00017410516738891602, -0.00015582144260406494, -0.00013753771781921387, -0.00011925399303436279, -0.00010097026824951172, -8.268654346466064e-05, -6.440281867980957e-05, -4.6119093894958496e-05, -2.7835369110107422e-05, -9.551644325256348e-06, 8.732080459594727e-06, 2.70158052444458e-05, 4.5299530029296875e-05, 6.358325481414795e-05, 8.186697959899902e-05, 0.0001001507043838501, 0.00011843442916870117, 0.00013671815395355225, 0.00015500187873840332, 0.0001732856035232544, 0.00019156932830810547, 0.00020985305309295654, 0.00022813677787780762, 0.0002464205026626587, 0.00026470422744750977, 0.00028298795223236084, 0.0003012716770172119, 0.000319555401802063, 0.00033783912658691406, 0.00035612285137176514, 0.0003744065761566162, 0.0003926903009414673, 0.00041097402572631836, 0.00042925775051116943, 0.0004475414752960205, 0.0004658252000808716, 0.00048410892486572266, 0.0005023926496505737, 0.0005206763744354248, 0.0005389600992202759, 0.000557243824005127, 0.000575527548789978, 0.0005938112735748291, 0.0006120949983596802, 0.0006303787231445312]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 20.0, 27.0, 43.0, 101.0, 152.0, 380.0, 924.0, 2763.0, 13791.0, 242430.0, 755837.0, 25741.0, 4199.0, 1205.0, 496.0, 201.0, 87.0, 61.0, 23.0, 22.0, 10.0, 10.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4609375, -1.4124755859375, -1.364013671875, -1.3155517578125, -1.26708984375, -1.2186279296875, -1.170166015625, -1.1217041015625, -1.0732421875, -1.0247802734375, -0.976318359375, -0.9278564453125, -0.87939453125, -0.8309326171875, -0.782470703125, -0.7340087890625, -0.685546875, -0.6370849609375, -0.588623046875, -0.5401611328125, -0.49169921875, -0.4432373046875, -0.394775390625, -0.3463134765625, -0.2978515625, -0.2493896484375, -0.200927734375, -0.1524658203125, -0.10400390625, -0.0555419921875, -0.007080078125, 0.0413818359375, 0.08984375, 0.1383056640625, 0.186767578125, 0.2352294921875, 0.28369140625, 0.3321533203125, 0.380615234375, 0.4290771484375, 0.4775390625, 0.5260009765625, 0.574462890625, 0.6229248046875, 0.67138671875, 0.7198486328125, 0.768310546875, 0.8167724609375, 0.865234375, 0.9136962890625, 0.962158203125, 1.0106201171875, 1.05908203125, 1.1075439453125, 1.156005859375, 1.2044677734375, 1.2529296875, 1.3013916015625, 1.349853515625, 1.3983154296875, 1.44677734375, 1.4952392578125, 1.543701171875, 1.5921630859375, 1.640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 9.0, 10.0, 10.0, 10.0, 15.0, 19.0, 33.0, 50.0, 56.0, 85.0, 106.0, 121.0, 115.0, 89.0, 79.0, 47.0, 47.0, 24.0, 18.0, 16.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2119140625, -1.1768646240234375, -1.141815185546875, -1.1067657470703125, -1.07171630859375, -1.0366668701171875, -1.001617431640625, -0.9665679931640625, -0.9315185546875, -0.8964691162109375, -0.861419677734375, -0.8263702392578125, -0.79132080078125, -0.7562713623046875, -0.721221923828125, -0.6861724853515625, -0.651123046875, -0.6160736083984375, -0.581024169921875, -0.5459747314453125, -0.51092529296875, -0.4758758544921875, -0.440826416015625, -0.4057769775390625, -0.3707275390625, -0.3356781005859375, -0.300628662109375, -0.2655792236328125, -0.23052978515625, -0.1954803466796875, -0.160430908203125, -0.1253814697265625, -0.09033203125, -0.0552825927734375, -0.020233154296875, 0.0148162841796875, 0.04986572265625, 0.0849151611328125, 0.119964599609375, 0.1550140380859375, 0.1900634765625, 0.2251129150390625, 0.260162353515625, 0.2952117919921875, 0.33026123046875, 0.3653106689453125, 0.400360107421875, 0.4354095458984375, 0.470458984375, 0.5055084228515625, 0.540557861328125, 0.5756072998046875, 0.61065673828125, 0.6457061767578125, 0.680755615234375, 0.7158050537109375, 0.7508544921875, 0.7859039306640625, 0.820953369140625, 0.8560028076171875, 0.89105224609375, 0.9261016845703125, 0.961151123046875, 0.9962005615234375, 1.03125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 15.0, 16.0, 56.0, 146.0, 318.0, 195.0, 134.0, 53.0, 27.0, 16.0, 11.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.215835571289062, -29.22852897644043, -28.241222381591797, -27.253915786743164, -26.26660919189453, -25.27930450439453, -24.2919979095459, -23.304691314697266, -22.317384719848633, -21.330078125, -20.342771530151367, -19.355464935302734, -18.368160247802734, -17.38085174560547, -16.39354705810547, -15.406240463256836, -14.418933868408203, -13.43162727355957, -12.444320678710938, -11.457015037536621, -10.469708442687988, -9.482401847839355, -8.495096206665039, -7.507789611816406, -6.520483016967773, -5.533176422119141, -4.545870304107666, -3.5585639476776123, -2.5712575912475586, -1.5839509963989258, -0.5966448783874512, 0.39066123962402344, 1.3779678344726562, 2.36527419090271, 3.3525805473327637, 4.339886665344238, 5.327193260192871, 6.314499855041504, 7.3018059730529785, 8.289112091064453, 9.276418685913086, 10.263725280761719, 11.251031875610352, 12.238337516784668, 13.2256441116333, 14.212950706481934, 15.20025634765625, 16.187562942504883, 17.174869537353516, 18.16217613220215, 19.14948272705078, 20.136789321899414, 21.124095916748047, 22.111400604248047, 23.09870719909668, 24.086013793945312, 25.073320388793945, 26.060626983642578, 27.04793357849121, 28.035240173339844, 29.022544860839844, 30.00985336303711, 30.99715805053711, 31.984464645385742, 32.971771240234375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 2.0, 8.0, 6.0, 7.0, 11.0, 17.0, 14.0, 19.0, 21.0, 32.0, 43.0, 38.0, 48.0, 43.0, 60.0, 117.0, 92.0, 78.0, 63.0, 45.0, 40.0, 29.0, 36.0, 22.0, 27.0, 16.0, 18.0, 12.0, 10.0, 4.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.239904403686523, -14.637977600097656, -14.036050796508789, -13.434123992919922, -12.832198143005371, -12.230271339416504, -11.628344535827637, -11.026418685913086, -10.424491882324219, -9.822565078735352, -9.220638275146484, -8.618711471557617, -8.016785621643066, -7.414858818054199, -6.812932014465332, -6.211005687713623, -5.609078407287598, -5.0071516036987305, -4.4052252769470215, -3.8032984733581543, -3.201371908187866, -2.599445343017578, -1.997518539428711, -1.395592212677002, -0.7936654090881348, -0.1917387843132019, 0.41018784046173096, 1.0121145248413086, 1.6140410900115967, 2.2159676551818848, 2.817894458770752, 3.419820785522461, 4.021747589111328, 4.623674392700195, 5.225600719451904, 5.8275275230407715, 6.4294538497924805, 7.031380653381348, 7.633307456970215, 8.235233306884766, 8.837160110473633, 9.4390869140625, 10.041013717651367, 10.642940521240234, 11.244866371154785, 11.846793174743652, 12.44871997833252, 13.05064582824707, 13.652573585510254, 14.254500389099121, 14.856427192687988, 15.458353042602539, 16.060279846191406, 16.662206649780273, 17.26413345336914, 17.866060256958008, 18.467987060546875, 19.069913864135742, 19.67184066772461, 20.273767471313477, 20.875694274902344, 21.477619171142578, 22.079547882080078, 22.681472778320312, 23.28339958190918]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 11.0, 24.0, 30.0, 43.0, 80.0, 103.0, 165.0, 271.0, 575.0, 1392.0, 3839.0, 15375.0, 113253.0, 1639912.0, 2225719.0, 165510.0, 20355.0, 4649.0, 1492.0, 630.0, 310.0, 166.0, 138.0, 67.0, 46.0, 34.0, 22.0, 17.0, 6.0, 9.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.09326171875, -1.0556640625, -1.01806640625, -0.98046875, -0.94287109375, -0.9052734375, -0.86767578125, -0.830078125, -0.79248046875, -0.7548828125, -0.71728515625, -0.6796875, -0.64208984375, -0.6044921875, -0.56689453125, -0.529296875, -0.49169921875, -0.4541015625, -0.41650390625, -0.37890625, -0.34130859375, -0.3037109375, -0.26611328125, -0.228515625, -0.19091796875, -0.1533203125, -0.11572265625, -0.078125, -0.04052734375, -0.0029296875, 0.03466796875, 0.072265625, 0.10986328125, 0.1474609375, 0.18505859375, 0.22265625, 0.26025390625, 0.2978515625, 0.33544921875, 0.373046875, 0.41064453125, 0.4482421875, 0.48583984375, 0.5234375, 0.56103515625, 0.5986328125, 0.63623046875, 0.673828125, 0.71142578125, 0.7490234375, 0.78662109375, 0.82421875, 0.86181640625, 0.8994140625, 0.93701171875, 0.974609375, 1.01220703125, 1.0498046875, 1.08740234375, 1.125, 1.16259765625, 1.2001953125, 1.23779296875, 1.275390625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 10.0, 13.0, 16.0, 15.0, 31.0, 23.0, 44.0, 37.0, 29.0, 49.0, 50.0, 51.0, 56.0, 73.0, 45.0, 43.0, 59.0, 50.0, 42.0, 42.0, 51.0, 32.0, 23.0, 23.0, 26.0, 13.0, 10.0, 7.0, 7.0, 10.0, 3.0, 1.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.759765625, -0.7361373901367188, -0.7125091552734375, -0.6888809204101562, -0.665252685546875, -0.6416244506835938, -0.6179962158203125, -0.5943679809570312, -0.57073974609375, -0.5471115112304688, -0.5234832763671875, -0.49985504150390625, -0.476226806640625, -0.45259857177734375, -0.4289703369140625, -0.40534210205078125, -0.3817138671875, -0.35808563232421875, -0.3344573974609375, -0.31082916259765625, -0.287200927734375, -0.26357269287109375, -0.2399444580078125, -0.21631622314453125, -0.19268798828125, -0.16905975341796875, -0.1454315185546875, -0.12180328369140625, -0.098175048828125, -0.07454681396484375, -0.0509185791015625, -0.02729034423828125, -0.003662109375, 0.01996612548828125, 0.0435943603515625, 0.06722259521484375, 0.090850830078125, 0.11447906494140625, 0.1381072998046875, 0.16173553466796875, 0.18536376953125, 0.20899200439453125, 0.2326202392578125, 0.25624847412109375, 0.279876708984375, 0.30350494384765625, 0.3271331787109375, 0.35076141357421875, 0.3743896484375, 0.39801788330078125, 0.4216461181640625, 0.44527435302734375, 0.468902587890625, 0.49253082275390625, 0.5161590576171875, 0.5397872924804688, 0.56341552734375, 0.5870437622070312, 0.6106719970703125, 0.6343002319335938, 0.657928466796875, 0.6815567016601562, 0.7051849365234375, 0.7288131713867188, 0.75244140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 7.0, 7.0, 15.0, 25.0, 43.0, 81.0, 123.0, 203.0, 357.0, 694.0, 2163.0, 22211.0, 3815071.0, 343682.0, 6976.0, 1379.0, 501.0, 304.0, 143.0, 96.0, 61.0, 37.0, 25.0, 15.0, 17.0, 8.0, 7.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.482574462890625, -3.36163330078125, -3.240692138671875, -3.1197509765625, -2.998809814453125, -2.87786865234375, -2.756927490234375, -2.635986328125, -2.515045166015625, -2.39410400390625, -2.273162841796875, -2.1522216796875, -2.031280517578125, -1.91033935546875, -1.789398193359375, -1.66845703125, -1.547515869140625, -1.42657470703125, -1.305633544921875, -1.1846923828125, -1.063751220703125, -0.94281005859375, -0.821868896484375, -0.700927734375, -0.579986572265625, -0.45904541015625, -0.338104248046875, -0.2171630859375, -0.096221923828125, 0.02471923828125, 0.145660400390625, 0.2666015625, 0.387542724609375, 0.50848388671875, 0.629425048828125, 0.7503662109375, 0.871307373046875, 0.99224853515625, 1.113189697265625, 1.234130859375, 1.355072021484375, 1.47601318359375, 1.596954345703125, 1.7178955078125, 1.838836669921875, 1.95977783203125, 2.080718994140625, 2.20166015625, 2.322601318359375, 2.44354248046875, 2.564483642578125, 2.6854248046875, 2.806365966796875, 2.92730712890625, 3.048248291015625, 3.169189453125, 3.290130615234375, 3.41107177734375, 3.532012939453125, 3.6529541015625, 3.773895263671875, 3.89483642578125, 4.015777587890625, 4.13671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 14.0, 30.0, 69.0, 154.0, 534.0, 1596.0, 1183.0, 316.0, 97.0, 52.0, 20.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.832794189453125, -3.70855712890625, -3.584320068359375, -3.4600830078125, -3.335845947265625, -3.21160888671875, -3.087371826171875, -2.963134765625, -2.838897705078125, -2.71466064453125, -2.590423583984375, -2.4661865234375, -2.341949462890625, -2.21771240234375, -2.093475341796875, -1.96923828125, -1.845001220703125, -1.72076416015625, -1.596527099609375, -1.4722900390625, -1.348052978515625, -1.22381591796875, -1.099578857421875, -0.975341796875, -0.851104736328125, -0.72686767578125, -0.602630615234375, -0.4783935546875, -0.354156494140625, -0.22991943359375, -0.105682373046875, 0.0185546875, 0.142791748046875, 0.26702880859375, 0.391265869140625, 0.5155029296875, 0.639739990234375, 0.76397705078125, 0.888214111328125, 1.012451171875, 1.136688232421875, 1.26092529296875, 1.385162353515625, 1.5093994140625, 1.633636474609375, 1.75787353515625, 1.882110595703125, 2.00634765625, 2.130584716796875, 2.25482177734375, 2.379058837890625, 2.5032958984375, 2.627532958984375, 2.75177001953125, 2.876007080078125, 3.000244140625, 3.124481201171875, 3.24871826171875, 3.372955322265625, 3.4971923828125, 3.621429443359375, 3.74566650390625, 3.869903564453125, 3.994140625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 8.0, 10.0, 22.0, 60.0, 186.0, 276.0, 224.0, 119.0, 53.0, 19.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.307045936584473, -12.55985164642334, -11.812658309936523, -11.06546401977539, -10.318269729614258, -9.571075439453125, -8.823881149291992, -8.076687812805176, -7.329493522644043, -6.58229923248291, -5.8351054191589355, -5.087911605834961, -4.340717315673828, -3.5935232639312744, -2.8463292121887207, -2.099135398864746, -1.3519411087036133, -0.6047470569610596, 0.14244699478149414, 0.8896410465240479, 1.6368350982666016, 2.3840291500091553, 3.131223201751709, 3.8784170150756836, 4.625611305236816, 5.372805595397949, 6.119999408721924, 6.867193222045898, 7.614387512207031, 8.361581802368164, 9.108776092529297, 9.855969429016113, 10.603164672851562, 11.350358963012695, 12.097553253173828, 12.844746589660645, 13.591940879821777, 14.33913516998291, 15.086328506469727, 15.83352279663086, 16.580717086791992, 17.327911376953125, 18.075105667114258, 18.82229995727539, 19.56949234008789, 20.316686630249023, 21.063880920410156, 21.81107521057129, 22.558269500732422, 23.305463790893555, 24.052658081054688, 24.79985237121582, 25.547046661376953, 26.294239044189453, 27.041433334350586, 27.78862762451172, 28.53582191467285, 29.283016204833984, 30.030210494995117, 30.77740478515625, 31.52459716796875, 32.271793365478516, 33.018985748291016, 33.76618194580078, 34.51337432861328]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 6.0, 5.0, 11.0, 9.0, 6.0, 15.0, 17.0, 24.0, 18.0, 29.0, 28.0, 34.0, 54.0, 48.0, 57.0, 43.0, 49.0, 38.0, 49.0, 60.0, 51.0, 53.0, 58.0, 28.0, 34.0, 41.0, 32.0, 22.0, 23.0, 12.0, 12.0, 9.0, 9.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-10.2860746383667, -10.0123872756958, -9.738698959350586, -9.465011596679688, -9.191324234008789, -8.91763687133789, -8.643948554992676, -8.370261192321777, -8.096573829650879, -7.822885990142822, -7.549198627471924, -7.275510787963867, -7.001823425292969, -6.728135585784912, -6.4544477462768555, -6.180760383605957, -5.9070725440979, -5.633384704589844, -5.359697341918945, -5.086009502410889, -4.81232213973999, -4.538634300231934, -4.264946937561035, -3.9912590980529785, -3.717571496963501, -3.4438838958740234, -3.170196294784546, -2.8965086936950684, -2.6228208541870117, -2.3491334915161133, -2.0754456520080566, -1.801758050918579, -1.5280704498291016, -1.254382848739624, -0.9806951880455017, -0.7070075273513794, -0.43331992626190186, -0.15963232517242432, 0.11405539512634277, 0.3877429962158203, 0.6614305973052979, 0.9351181983947754, 1.208805799484253, 1.48249351978302, 1.7561811208724976, 2.0298686027526855, 2.303556442260742, 2.5772440433502197, 2.8509316444396973, 3.124619245529175, 3.3983068466186523, 3.671994686126709, 3.9456820487976074, 4.219369888305664, 4.4930572509765625, 4.766745090484619, 5.040432929992676, 5.314120769500732, 5.587808132171631, 5.8614959716796875, 6.135183334350586, 6.408871173858643, 6.682559013366699, 6.956246376037598, 7.229933738708496]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 8.0, 20.0, 20.0, 30.0, 40.0, 77.0, 130.0, 182.0, 297.0, 473.0, 794.0, 1454.0, 2482.0, 4490.0, 8647.0, 16863.0, 34537.0, 68646.0, 129081.0, 203231.0, 224588.0, 163753.0, 92608.0, 47174.0, 23429.0, 11892.0, 5846.0, 3316.0, 1769.0, 1007.0, 636.0, 372.0, 248.0, 137.0, 85.0, 64.0, 44.0, 26.0, 14.0, 10.0, 12.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7451171875, -0.7204666137695312, -0.6958160400390625, -0.6711654663085938, -0.646514892578125, -0.6218643188476562, -0.5972137451171875, -0.5725631713867188, -0.54791259765625, -0.5232620239257812, -0.4986114501953125, -0.47396087646484375, -0.449310302734375, -0.42465972900390625, -0.4000091552734375, -0.37535858154296875, -0.3507080078125, -0.32605743408203125, -0.3014068603515625, -0.27675628662109375, -0.252105712890625, -0.22745513916015625, -0.2028045654296875, -0.17815399169921875, -0.15350341796875, -0.12885284423828125, -0.1042022705078125, -0.07955169677734375, -0.054901123046875, -0.03025054931640625, -0.0055999755859375, 0.01905059814453125, 0.043701171875, 0.06835174560546875, 0.0930023193359375, 0.11765289306640625, 0.142303466796875, 0.16695404052734375, 0.1916046142578125, 0.21625518798828125, 0.24090576171875, 0.26555633544921875, 0.2902069091796875, 0.31485748291015625, 0.339508056640625, 0.36415863037109375, 0.3888092041015625, 0.41345977783203125, 0.4381103515625, 0.46276092529296875, 0.4874114990234375, 0.5120620727539062, 0.536712646484375, 0.5613632202148438, 0.5860137939453125, 0.6106643676757812, 0.63531494140625, 0.6599655151367188, 0.6846160888671875, 0.7092666625976562, 0.733917236328125, 0.7585678100585938, 0.7832183837890625, 0.8078689575195312, 0.83251953125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 10.0, 13.0, 11.0, 18.0, 10.0, 18.0, 21.0, 33.0, 27.0, 33.0, 29.0, 41.0, 38.0, 45.0, 35.0, 47.0, 48.0, 41.0, 58.0, 43.0, 35.0, 38.0, 42.0, 38.0, 34.0, 38.0, 30.0, 23.0, 19.0, 15.0, 23.0, 8.0, 10.0, 11.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71337890625, -0.691925048828125, -0.67047119140625, -0.649017333984375, -0.6275634765625, -0.606109619140625, -0.58465576171875, -0.563201904296875, -0.541748046875, -0.520294189453125, -0.49884033203125, -0.477386474609375, -0.4559326171875, -0.434478759765625, -0.41302490234375, -0.391571044921875, -0.3701171875, -0.348663330078125, -0.32720947265625, -0.305755615234375, -0.2843017578125, -0.262847900390625, -0.24139404296875, -0.219940185546875, -0.198486328125, -0.177032470703125, -0.15557861328125, -0.134124755859375, -0.1126708984375, -0.091217041015625, -0.06976318359375, -0.048309326171875, -0.02685546875, -0.005401611328125, 0.01605224609375, 0.037506103515625, 0.0589599609375, 0.080413818359375, 0.10186767578125, 0.123321533203125, 0.144775390625, 0.166229248046875, 0.18768310546875, 0.209136962890625, 0.2305908203125, 0.252044677734375, 0.27349853515625, 0.294952392578125, 0.31640625, 0.337860107421875, 0.35931396484375, 0.380767822265625, 0.4022216796875, 0.423675537109375, 0.44512939453125, 0.466583251953125, 0.488037109375, 0.509490966796875, 0.53094482421875, 0.552398681640625, 0.5738525390625, 0.595306396484375, 0.61676025390625, 0.638214111328125, 0.65966796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 11.0, 13.0, 31.0, 36.0, 46.0, 103.0, 189.0, 401.0, 1028.0, 3925.0, 24854.0, 263316.0, 685095.0, 58954.0, 7819.0, 1643.0, 532.0, 240.0, 121.0, 74.0, 44.0, 22.0, 13.0, 12.0, 13.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.7652587890625, -3.669189453125, -3.5731201171875, -3.47705078125, -3.3809814453125, -3.284912109375, -3.1888427734375, -3.0927734375, -2.9967041015625, -2.900634765625, -2.8045654296875, -2.70849609375, -2.6124267578125, -2.516357421875, -2.4202880859375, -2.32421875, -2.2281494140625, -2.132080078125, -2.0360107421875, -1.93994140625, -1.8438720703125, -1.747802734375, -1.6517333984375, -1.5556640625, -1.4595947265625, -1.363525390625, -1.2674560546875, -1.17138671875, -1.0753173828125, -0.979248046875, -0.8831787109375, -0.787109375, -0.6910400390625, -0.594970703125, -0.4989013671875, -0.40283203125, -0.3067626953125, -0.210693359375, -0.1146240234375, -0.0185546875, 0.0775146484375, 0.173583984375, 0.2696533203125, 0.36572265625, 0.4617919921875, 0.557861328125, 0.6539306640625, 0.75, 0.8460693359375, 0.942138671875, 1.0382080078125, 1.13427734375, 1.2303466796875, 1.326416015625, 1.4224853515625, 1.5185546875, 1.6146240234375, 1.710693359375, 1.8067626953125, 1.90283203125, 1.9989013671875, 2.094970703125, 2.1910400390625, 2.287109375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 5.0, 4.0, 8.0, 5.0, 16.0, 14.0, 19.0, 13.0, 24.0, 23.0, 28.0, 36.0, 38.0, 36.0, 26.0, 53.0, 42.0, 54.0, 34.0, 59.0, 63.0, 34.0, 48.0, 35.0, 35.0, 40.0, 32.0, 25.0, 23.0, 29.0, 18.0, 16.0, 7.0, 4.0, 6.0, 5.0, 8.0, 3.0, 5.0, 6.0, 1.0, 6.0, 2.0, 2.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.318359375, -2.241180419921875, -2.16400146484375, -2.086822509765625, -2.0096435546875, -1.932464599609375, -1.85528564453125, -1.778106689453125, -1.700927734375, -1.623748779296875, -1.54656982421875, -1.469390869140625, -1.3922119140625, -1.315032958984375, -1.23785400390625, -1.160675048828125, -1.08349609375, -1.006317138671875, -0.92913818359375, -0.851959228515625, -0.7747802734375, -0.697601318359375, -0.62042236328125, -0.543243408203125, -0.466064453125, -0.388885498046875, -0.31170654296875, -0.234527587890625, -0.1573486328125, -0.080169677734375, -0.00299072265625, 0.074188232421875, 0.1513671875, 0.228546142578125, 0.30572509765625, 0.382904052734375, 0.4600830078125, 0.537261962890625, 0.61444091796875, 0.691619873046875, 0.768798828125, 0.845977783203125, 0.92315673828125, 1.000335693359375, 1.0775146484375, 1.154693603515625, 1.23187255859375, 1.309051513671875, 1.38623046875, 1.463409423828125, 1.54058837890625, 1.617767333984375, 1.6949462890625, 1.772125244140625, 1.84930419921875, 1.926483154296875, 2.003662109375, 2.080841064453125, 2.15802001953125, 2.235198974609375, 2.3123779296875, 2.389556884765625, 2.46673583984375, 2.543914794921875, 2.62109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 20.0, 17.0, 31.0, 57.0, 99.0, 176.0, 290.0, 518.0, 1058.0, 2246.0, 5096.0, 13239.0, 37278.0, 126909.0, 552656.0, 214808.0, 60576.0, 19974.0, 7337.0, 3089.0, 1434.0, 693.0, 386.0, 217.0, 109.0, 76.0, 40.0, 39.0, 16.0, 19.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4990234375, -0.4822235107421875, -0.465423583984375, -0.4486236572265625, -0.43182373046875, -0.4150238037109375, -0.398223876953125, -0.3814239501953125, -0.3646240234375, -0.3478240966796875, -0.331024169921875, -0.3142242431640625, -0.29742431640625, -0.2806243896484375, -0.263824462890625, -0.2470245361328125, -0.230224609375, -0.2134246826171875, -0.196624755859375, -0.1798248291015625, -0.16302490234375, -0.1462249755859375, -0.129425048828125, -0.1126251220703125, -0.0958251953125, -0.0790252685546875, -0.062225341796875, -0.0454254150390625, -0.02862548828125, -0.0118255615234375, 0.004974365234375, 0.0217742919921875, 0.03857421875, 0.0553741455078125, 0.072174072265625, 0.0889739990234375, 0.10577392578125, 0.1225738525390625, 0.139373779296875, 0.1561737060546875, 0.1729736328125, 0.1897735595703125, 0.206573486328125, 0.2233734130859375, 0.24017333984375, 0.2569732666015625, 0.273773193359375, 0.2905731201171875, 0.307373046875, 0.3241729736328125, 0.340972900390625, 0.3577728271484375, 0.37457275390625, 0.3913726806640625, 0.408172607421875, 0.4249725341796875, 0.4417724609375, 0.4585723876953125, 0.475372314453125, 0.4921722412109375, 0.50897216796875, 0.5257720947265625, 0.542572021484375, 0.5593719482421875, 0.576171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 17.0, 19.0, 39.0, 56.0, 109.0, 147.0, 154.0, 145.0, 101.0, 64.0, 43.0, 30.0, 16.0, 16.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003688335418701172, -0.0003575049340724945, -0.0003461763262748718, -0.00033484771847724915, -0.00032351911067962646, -0.0003121905028820038, -0.0003008618950843811, -0.0002895332872867584, -0.00027820467948913574, -0.00026687607169151306, -0.0002555474638938904, -0.0002442188560962677, -0.00023289024829864502, -0.00022156164050102234, -0.00021023303270339966, -0.00019890442490577698, -0.0001875758171081543, -0.00017624720931053162, -0.00016491860151290894, -0.00015358999371528625, -0.00014226138591766357, -0.0001309327781200409, -0.00011960417032241821, -0.00010827556252479553, -9.694695472717285e-05, -8.561834692955017e-05, -7.428973913192749e-05, -6.296113133430481e-05, -5.163252353668213e-05, -4.030391573905945e-05, -2.8975307941436768e-05, -1.7646700143814087e-05, -6.318092346191406e-06, 5.010515451431274e-06, 1.6339123249053955e-05, 2.7667731046676636e-05, 3.8996338844299316e-05, 5.0324946641922e-05, 6.165355443954468e-05, 7.298216223716736e-05, 8.431077003479004e-05, 9.563937783241272e-05, 0.0001069679856300354, 0.00011829659342765808, 0.00012962520122528076, 0.00014095380902290344, 0.00015228241682052612, 0.0001636110246181488, 0.00017493963241577148, 0.00018626824021339417, 0.00019759684801101685, 0.00020892545580863953, 0.0002202540636062622, 0.0002315826714038849, 0.00024291127920150757, 0.00025423988699913025, 0.00026556849479675293, 0.0002768971025943756, 0.0002882257103919983, 0.00029955431818962097, 0.00031088292598724365, 0.00032221153378486633, 0.000333540141582489, 0.0003448687493801117, 0.0003561973571777344]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 12.0, 25.0, 33.0, 74.0, 137.0, 292.0, 722.0, 2157.0, 8946.0, 52022.0, 392390.0, 524518.0, 54376.0, 9289.0, 2265.0, 688.0, 284.0, 138.0, 57.0, 42.0, 15.0, 16.0, 16.0, 5.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -1.0019607543945312, -0.9756011962890625, -0.9492416381835938, -0.922882080078125, -0.8965225219726562, -0.8701629638671875, -0.8438034057617188, -0.81744384765625, -0.7910842895507812, -0.7647247314453125, -0.7383651733398438, -0.712005615234375, -0.6856460571289062, -0.6592864990234375, -0.6329269409179688, -0.6065673828125, -0.5802078247070312, -0.5538482666015625, -0.5274887084960938, -0.501129150390625, -0.47476959228515625, -0.4484100341796875, -0.42205047607421875, -0.39569091796875, -0.36933135986328125, -0.3429718017578125, -0.31661224365234375, -0.290252685546875, -0.26389312744140625, -0.2375335693359375, -0.21117401123046875, -0.184814453125, -0.15845489501953125, -0.1320953369140625, -0.10573577880859375, -0.079376220703125, -0.05301666259765625, -0.0266571044921875, -0.00029754638671875, 0.02606201171875, 0.05242156982421875, 0.0787811279296875, 0.10514068603515625, 0.131500244140625, 0.15785980224609375, 0.1842193603515625, 0.21057891845703125, 0.2369384765625, 0.26329803466796875, 0.2896575927734375, 0.31601715087890625, 0.342376708984375, 0.36873626708984375, 0.3950958251953125, 0.42145538330078125, 0.44781494140625, 0.47417449951171875, 0.5005340576171875, 0.5268936157226562, 0.553253173828125, 0.5796127319335938, 0.6059722900390625, 0.6323318481445312, 0.65869140625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 10.0, 6.0, 13.0, 17.0, 18.0, 23.0, 33.0, 43.0, 41.0, 73.0, 75.0, 89.0, 93.0, 71.0, 74.0, 69.0, 53.0, 46.0, 39.0, 33.0, 22.0, 18.0, 15.0, 15.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.5546722412109375, -0.531219482421875, -0.5077667236328125, -0.48431396484375, -0.4608612060546875, -0.437408447265625, -0.4139556884765625, -0.3905029296875, -0.3670501708984375, -0.343597412109375, -0.3201446533203125, -0.29669189453125, -0.2732391357421875, -0.249786376953125, -0.2263336181640625, -0.202880859375, -0.1794281005859375, -0.155975341796875, -0.1325225830078125, -0.10906982421875, -0.0856170654296875, -0.062164306640625, -0.0387115478515625, -0.0152587890625, 0.0081939697265625, 0.031646728515625, 0.0550994873046875, 0.07855224609375, 0.1020050048828125, 0.125457763671875, 0.1489105224609375, 0.17236328125, 0.1958160400390625, 0.219268798828125, 0.2427215576171875, 0.26617431640625, 0.2896270751953125, 0.313079833984375, 0.3365325927734375, 0.3599853515625, 0.3834381103515625, 0.406890869140625, 0.4303436279296875, 0.45379638671875, 0.4772491455078125, 0.500701904296875, 0.5241546630859375, 0.547607421875, 0.5710601806640625, 0.594512939453125, 0.6179656982421875, 0.64141845703125, 0.6648712158203125, 0.688323974609375, 0.7117767333984375, 0.7352294921875, 0.7586822509765625, 0.782135009765625, 0.8055877685546875, 0.82904052734375, 0.8524932861328125, 0.875946044921875, 0.8993988037109375, 0.9228515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 14.0, 21.0, 40.0, 99.0, 166.0, 329.0, 192.0, 81.0, 29.0, 14.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.855045318603516, -34.05562210083008, -33.256202697753906, -32.45677947998047, -31.657358169555664, -30.85793685913086, -30.058513641357422, -29.259092330932617, -28.459671020507812, -27.660249710083008, -26.860828399658203, -26.061405181884766, -25.26198387145996, -24.462562561035156, -23.66313934326172, -22.863718032836914, -22.06429672241211, -21.264875411987305, -20.4654541015625, -19.666030883789062, -18.866609573364258, -18.067188262939453, -17.267765045166016, -16.46834373474121, -15.668922424316406, -14.869501113891602, -14.07007884979248, -13.27065658569336, -12.471235275268555, -11.67181396484375, -10.872391700744629, -10.072969436645508, -9.273548126220703, -8.474126815795898, -7.674704551696777, -6.8752827644348145, -6.075860977172852, -5.276439189910889, -4.477017402648926, -3.677595615386963, -2.878173828125, -2.078752040863037, -1.2793302536010742, -0.47990846633911133, 0.31951332092285156, 1.1189351081848145, 1.9183568954467773, 2.7177786827087402, 3.517200469970703, 4.316622257232666, 5.116044044494629, 5.915465831756592, 6.714887619018555, 7.514309406280518, 8.31373119354248, 9.113153457641602, 9.912574768066406, 10.711996078491211, 11.511418342590332, 12.310840606689453, 13.110261917114258, 13.909683227539062, 14.709105491638184, 15.508527755737305, 16.30794906616211]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 7.0, 6.0, 9.0, 12.0, 7.0, 11.0, 18.0, 17.0, 15.0, 29.0, 33.0, 33.0, 24.0, 33.0, 38.0, 44.0, 44.0, 77.0, 73.0, 75.0, 50.0, 39.0, 44.0, 30.0, 22.0, 31.0, 27.0, 17.0, 22.0, 14.0, 16.0, 11.0, 10.0, 15.0, 7.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.15542221069336, -10.822574615478516, -10.489727020263672, -10.156880378723145, -9.8240327835083, -9.491185188293457, -9.158337593078613, -8.825490951538086, -8.492643356323242, -8.159795761108398, -7.826948642730713, -7.494101047515869, -7.161253929138184, -6.82840633392334, -6.495558738708496, -6.1627116203308105, -5.829864025115967, -5.497016429901123, -5.1641693115234375, -4.831321716308594, -4.498474597930908, -4.1656270027160645, -3.8327796459198, -3.499932289123535, -3.1670849323272705, -2.834237575531006, -2.501390218734741, -2.1685428619384766, -1.8356953859329224, -1.5028480291366577, -1.1700005531311035, -0.8371531963348389, -0.5043058395385742, -0.17145845293998718, 0.16138893365859985, 0.4942363500595093, 0.8270837068557739, 1.1599310636520386, 1.4927785396575928, 1.8256258964538574, 2.158473253250122, 2.4913206100463867, 2.8241679668426514, 3.157015323638916, 3.4898629188537598, 3.8227100372314453, 4.155557632446289, 4.488405227661133, 4.821252346038818, 5.154099941253662, 5.486947059631348, 5.819794654846191, 6.152641773223877, 6.485489368438721, 6.818336486816406, 7.15118408203125, 7.484031677246094, 7.8168792724609375, 8.149726867675781, 8.482573509216309, 8.815421104431152, 9.148268699645996, 9.48111629486084, 9.813962936401367, 10.146810531616211]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 19.0, 19.0, 22.0, 33.0, 68.0, 99.0, 158.0, 250.0, 389.0, 620.0, 1185.0, 2440.0, 5490.0, 15645.0, 57658.0, 274725.0, 1244048.0, 1866085.0, 566245.0, 115034.0, 27873.0, 8877.0, 3519.0, 1668.0, 897.0, 459.0, 284.0, 172.0, 88.0, 68.0, 47.0, 24.0, 22.0, 15.0, 6.0, 16.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.75439453125, -0.7329788208007812, -0.7115631103515625, -0.6901473999023438, -0.668731689453125, -0.6473159790039062, -0.6259002685546875, -0.6044845581054688, -0.58306884765625, -0.5616531372070312, -0.5402374267578125, -0.5188217163085938, -0.497406005859375, -0.47599029541015625, -0.4545745849609375, -0.43315887451171875, -0.4117431640625, -0.39032745361328125, -0.3689117431640625, -0.34749603271484375, -0.326080322265625, -0.30466461181640625, -0.2832489013671875, -0.26183319091796875, -0.24041748046875, -0.21900177001953125, -0.1975860595703125, -0.17617034912109375, -0.154754638671875, -0.13333892822265625, -0.1119232177734375, -0.09050750732421875, -0.069091796875, -0.04767608642578125, -0.0262603759765625, -0.00484466552734375, 0.016571044921875, 0.03798675537109375, 0.0594024658203125, 0.08081817626953125, 0.10223388671875, 0.12364959716796875, 0.1450653076171875, 0.16648101806640625, 0.187896728515625, 0.20931243896484375, 0.2307281494140625, 0.25214385986328125, 0.2735595703125, 0.29497528076171875, 0.3163909912109375, 0.33780670166015625, 0.359222412109375, 0.38063812255859375, 0.4020538330078125, 0.42346954345703125, 0.44488525390625, 0.46630096435546875, 0.4877166748046875, 0.5091323852539062, 0.530548095703125, 0.5519638061523438, 0.5733795166015625, 0.5947952270507812, 0.6162109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 3.0, 1.0, 9.0, 6.0, 14.0, 10.0, 9.0, 23.0, 23.0, 22.0, 21.0, 35.0, 29.0, 48.0, 28.0, 42.0, 43.0, 47.0, 55.0, 37.0, 49.0, 55.0, 45.0, 35.0, 40.0, 48.0, 31.0, 31.0, 32.0, 18.0, 20.0, 21.0, 11.0, 14.0, 8.0, 7.0, 8.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6595535278320312, -0.6399078369140625, -0.6202621459960938, -0.600616455078125, -0.5809707641601562, -0.5613250732421875, -0.5416793823242188, -0.52203369140625, -0.5023880004882812, -0.4827423095703125, -0.46309661865234375, -0.443450927734375, -0.42380523681640625, -0.4041595458984375, -0.38451385498046875, -0.3648681640625, -0.34522247314453125, -0.3255767822265625, -0.30593109130859375, -0.286285400390625, -0.26663970947265625, -0.2469940185546875, -0.22734832763671875, -0.20770263671875, -0.18805694580078125, -0.1684112548828125, -0.14876556396484375, -0.129119873046875, -0.10947418212890625, -0.0898284912109375, -0.07018280029296875, -0.050537109375, -0.03089141845703125, -0.0112457275390625, 0.00839996337890625, 0.028045654296875, 0.04769134521484375, 0.0673370361328125, 0.08698272705078125, 0.10662841796875, 0.12627410888671875, 0.1459197998046875, 0.16556549072265625, 0.185211181640625, 0.20485687255859375, 0.2245025634765625, 0.24414825439453125, 0.2637939453125, 0.28343963623046875, 0.3030853271484375, 0.32273101806640625, 0.342376708984375, 0.36202239990234375, 0.3816680908203125, 0.40131378173828125, 0.42095947265625, 0.44060516357421875, 0.4602508544921875, 0.47989654541015625, 0.499542236328125, 0.5191879272460938, 0.5388336181640625, 0.5584793090820312, 0.578125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 15.0, 16.0, 20.0, 46.0, 73.0, 117.0, 220.0, 516.0, 1163.0, 3633.0, 26255.0, 1113403.0, 2991733.0, 49127.0, 5288.0, 1451.0, 578.0, 288.0, 159.0, 74.0, 36.0, 15.0, 17.0, 5.0, 9.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.240234375, -2.168243408203125, -2.09625244140625, -2.024261474609375, -1.9522705078125, -1.880279541015625, -1.80828857421875, -1.736297607421875, -1.664306640625, -1.592315673828125, -1.52032470703125, -1.448333740234375, -1.3763427734375, -1.304351806640625, -1.23236083984375, -1.160369873046875, -1.08837890625, -1.016387939453125, -0.94439697265625, -0.872406005859375, -0.8004150390625, -0.728424072265625, -0.65643310546875, -0.584442138671875, -0.512451171875, -0.440460205078125, -0.36846923828125, -0.296478271484375, -0.2244873046875, -0.152496337890625, -0.08050537109375, -0.008514404296875, 0.0634765625, 0.135467529296875, 0.20745849609375, 0.279449462890625, 0.3514404296875, 0.423431396484375, 0.49542236328125, 0.567413330078125, 0.639404296875, 0.711395263671875, 0.78338623046875, 0.855377197265625, 0.9273681640625, 0.999359130859375, 1.07135009765625, 1.143341064453125, 1.21533203125, 1.287322998046875, 1.35931396484375, 1.431304931640625, 1.5032958984375, 1.575286865234375, 1.64727783203125, 1.719268798828125, 1.791259765625, 1.863250732421875, 1.93524169921875, 2.007232666015625, 2.0792236328125, 2.151214599609375, 2.22320556640625, 2.295196533203125, 2.3671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 14.0, 11.0, 20.0, 31.0, 44.0, 60.0, 118.0, 217.0, 355.0, 607.0, 800.0, 698.0, 455.0, 250.0, 134.0, 83.0, 48.0, 42.0, 32.0, 15.0, 6.0, 9.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802734375, -1.7476654052734375, -1.692596435546875, -1.6375274658203125, -1.58245849609375, -1.5273895263671875, -1.472320556640625, -1.4172515869140625, -1.3621826171875, -1.3071136474609375, -1.252044677734375, -1.1969757080078125, -1.14190673828125, -1.0868377685546875, -1.031768798828125, -0.9766998291015625, -0.921630859375, -0.8665618896484375, -0.811492919921875, -0.7564239501953125, -0.70135498046875, -0.6462860107421875, -0.591217041015625, -0.5361480712890625, -0.4810791015625, -0.4260101318359375, -0.370941162109375, -0.3158721923828125, -0.26080322265625, -0.2057342529296875, -0.150665283203125, -0.0955963134765625, -0.04052734375, 0.0145416259765625, 0.069610595703125, 0.1246795654296875, 0.17974853515625, 0.2348175048828125, 0.289886474609375, 0.3449554443359375, 0.4000244140625, 0.4550933837890625, 0.510162353515625, 0.5652313232421875, 0.62030029296875, 0.6753692626953125, 0.730438232421875, 0.7855072021484375, 0.840576171875, 0.8956451416015625, 0.950714111328125, 1.0057830810546875, 1.06085205078125, 1.1159210205078125, 1.170989990234375, 1.2260589599609375, 1.2811279296875, 1.3361968994140625, 1.391265869140625, 1.4463348388671875, 1.50140380859375, 1.5564727783203125, 1.611541748046875, 1.6666107177734375, 1.7216796875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 4.0, 8.0, 19.0, 26.0, 48.0, 79.0, 151.0, 143.0, 159.0, 133.0, 108.0, 61.0, 25.0, 13.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.149273872375488, -7.768694877624512, -7.388116359710693, -7.007537364959717, -6.626958847045898, -6.246379852294922, -5.865800857543945, -5.485221862792969, -5.10464334487915, -4.724064350128174, -4.3434858322143555, -3.962906837463379, -3.5823280811309814, -3.201749324798584, -2.8211703300476074, -2.44059157371521, -2.0600128173828125, -1.679434061050415, -1.298855185508728, -0.918276309967041, -0.5376975536346436, -0.1571187973022461, 0.22346019744873047, 0.6040389537811279, 0.9846177101135254, 1.3651964664459229, 1.7457753419876099, 2.126354217529297, 2.5069329738616943, 2.887511730194092, 3.2680907249450684, 3.648669481277466, 4.02924919128418, 4.409828186035156, 4.790406703948975, 5.170985698699951, 5.5515642166137695, 5.932143211364746, 6.312722206115723, 6.693301200866699, 7.073879718780518, 7.454458713531494, 7.8350372314453125, 8.215616226196289, 8.596195220947266, 8.976774215698242, 9.357353210449219, 9.737931251525879, 10.118510246276855, 10.499089241027832, 10.879668235778809, 11.260246276855469, 11.640825271606445, 12.021404266357422, 12.401983261108398, 12.782562255859375, 13.163141250610352, 13.543720245361328, 13.924299240112305, 14.304878234863281, 14.685456275939941, 15.066035270690918, 15.446614265441895, 15.827193260192871, 16.20777130126953]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 15.0, 17.0, 16.0, 21.0, 27.0, 32.0, 30.0, 49.0, 50.0, 38.0, 56.0, 73.0, 60.0, 72.0, 53.0, 59.0, 49.0, 46.0, 32.0, 32.0, 33.0, 30.0, 17.0, 16.0, 19.0, 11.0, 7.0, 12.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.081058502197266, -6.836199760437012, -6.591341495513916, -6.346482753753662, -6.101624488830566, -5.8567657470703125, -5.611907005310059, -5.367048740386963, -5.122190475463867, -4.877331733703613, -4.632473468780518, -4.387614727020264, -4.142756462097168, -3.897897720336914, -3.6530392169952393, -3.4081807136535645, -3.1633219718933105, -2.9184634685516357, -2.673604965209961, -2.428746223449707, -2.1838879585266113, -1.939029335975647, -1.6941707134246826, -1.4493122100830078, -1.204453706741333, -0.9595952033996582, -0.7147366404533386, -0.46987807750701904, -0.22501957416534424, 0.019838929176330566, 0.2646975517272949, 0.5095560550689697, 0.7544145584106445, 0.9992730617523193, 1.2441315650939941, 1.4889901876449585, 1.7338486909866333, 1.978707194328308, 2.2235658168792725, 2.4684243202209473, 2.713282823562622, 2.958141326904297, 3.2029998302459717, 3.4478583335876465, 3.6927170753479004, 3.937575340270996, 4.18243408203125, 4.427292823791504, 4.6721510887146, 4.9170098304748535, 5.161868095397949, 5.406726837158203, 5.651585102081299, 5.896443843841553, 6.141302108764648, 6.386160850524902, 6.631019592285156, 6.87587833404541, 7.120736598968506, 7.36559534072876, 7.6104536056518555, 7.855312347412109, 8.100171089172363, 8.345029830932617, 8.589887619018555]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 13.0, 22.0, 16.0, 30.0, 57.0, 62.0, 113.0, 152.0, 266.0, 410.0, 635.0, 1103.0, 1959.0, 3326.0, 6205.0, 11379.0, 21732.0, 41598.0, 79800.0, 146213.0, 223435.0, 215456.0, 137174.0, 74127.0, 38934.0, 20326.0, 10693.0, 5625.0, 3067.0, 1754.0, 1114.0, 629.0, 376.0, 255.0, 151.0, 106.0, 67.0, 45.0, 36.0, 22.0, 13.0, 15.0, 11.0, 5.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.7548828125, -0.7326431274414062, -0.7104034423828125, -0.6881637573242188, -0.665924072265625, -0.6436843872070312, -0.6214447021484375, -0.5992050170898438, -0.57696533203125, -0.5547256469726562, -0.5324859619140625, -0.5102462768554688, -0.488006591796875, -0.46576690673828125, -0.4435272216796875, -0.42128753662109375, -0.3990478515625, -0.37680816650390625, -0.3545684814453125, -0.33232879638671875, -0.310089111328125, -0.28784942626953125, -0.2656097412109375, -0.24337005615234375, -0.22113037109375, -0.19889068603515625, -0.1766510009765625, -0.15441131591796875, -0.132171630859375, -0.10993194580078125, -0.0876922607421875, -0.06545257568359375, -0.043212890625, -0.02097320556640625, 0.0012664794921875, 0.02350616455078125, 0.045745849609375, 0.06798553466796875, 0.0902252197265625, 0.11246490478515625, 0.13470458984375, 0.15694427490234375, 0.1791839599609375, 0.20142364501953125, 0.223663330078125, 0.24590301513671875, 0.2681427001953125, 0.29038238525390625, 0.3126220703125, 0.33486175537109375, 0.3571014404296875, 0.37934112548828125, 0.401580810546875, 0.42382049560546875, 0.4460601806640625, 0.46829986572265625, 0.49053955078125, 0.5127792358398438, 0.5350189208984375, 0.5572586059570312, 0.579498291015625, 0.6017379760742188, 0.6239776611328125, 0.6462173461914062, 0.66845703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 7.0, 3.0, 6.0, 14.0, 18.0, 22.0, 20.0, 24.0, 36.0, 29.0, 44.0, 53.0, 48.0, 68.0, 48.0, 61.0, 57.0, 51.0, 60.0, 48.0, 36.0, 55.0, 34.0, 43.0, 17.0, 15.0, 25.0, 13.0, 11.0, 9.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8759765625, -0.8508224487304688, -0.8256683349609375, -0.8005142211914062, -0.775360107421875, -0.7502059936523438, -0.7250518798828125, -0.6998977661132812, -0.67474365234375, -0.6495895385742188, -0.6244354248046875, -0.5992813110351562, -0.574127197265625, -0.5489730834960938, -0.5238189697265625, -0.49866485595703125, -0.4735107421875, -0.44835662841796875, -0.4232025146484375, -0.39804840087890625, -0.372894287109375, -0.34774017333984375, -0.3225860595703125, -0.29743194580078125, -0.27227783203125, -0.24712371826171875, -0.2219696044921875, -0.19681549072265625, -0.171661376953125, -0.14650726318359375, -0.1213531494140625, -0.09619903564453125, -0.071044921875, -0.04589080810546875, -0.0207366943359375, 0.00441741943359375, 0.029571533203125, 0.05472564697265625, 0.0798797607421875, 0.10503387451171875, 0.13018798828125, 0.15534210205078125, 0.1804962158203125, 0.20565032958984375, 0.230804443359375, 0.25595855712890625, 0.2811126708984375, 0.30626678466796875, 0.3314208984375, 0.35657501220703125, 0.3817291259765625, 0.40688323974609375, 0.432037353515625, 0.45719146728515625, 0.4823455810546875, 0.5074996948242188, 0.53265380859375, 0.5578079223632812, 0.5829620361328125, 0.6081161499023438, 0.633270263671875, 0.6584243774414062, 0.6835784912109375, 0.7087326049804688, 0.73388671875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 4.0, 5.0, 11.0, 14.0, 16.0, 19.0, 33.0, 40.0, 62.0, 111.0, 180.0, 274.0, 465.0, 850.0, 2159.0, 6746.0, 35104.0, 281289.0, 646502.0, 59388.0, 10001.0, 2802.0, 1067.0, 576.0, 288.0, 185.0, 126.0, 75.0, 44.0, 37.0, 24.0, 19.0, 8.0, 6.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.56640625, -2.48895263671875, -2.4114990234375, -2.33404541015625, -2.256591796875, -2.17913818359375, -2.1016845703125, -2.02423095703125, -1.94677734375, -1.86932373046875, -1.7918701171875, -1.71441650390625, -1.636962890625, -1.55950927734375, -1.4820556640625, -1.40460205078125, -1.3271484375, -1.24969482421875, -1.1722412109375, -1.09478759765625, -1.017333984375, -0.93988037109375, -0.8624267578125, -0.78497314453125, -0.70751953125, -0.63006591796875, -0.5526123046875, -0.47515869140625, -0.397705078125, -0.32025146484375, -0.2427978515625, -0.16534423828125, -0.087890625, -0.01043701171875, 0.0670166015625, 0.14447021484375, 0.221923828125, 0.29937744140625, 0.3768310546875, 0.45428466796875, 0.53173828125, 0.60919189453125, 0.6866455078125, 0.76409912109375, 0.841552734375, 0.91900634765625, 0.9964599609375, 1.07391357421875, 1.1513671875, 1.22882080078125, 1.3062744140625, 1.38372802734375, 1.461181640625, 1.53863525390625, 1.6160888671875, 1.69354248046875, 1.77099609375, 1.84844970703125, 1.9259033203125, 2.00335693359375, 2.080810546875, 2.15826416015625, 2.2357177734375, 2.31317138671875, 2.390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 10.0, 10.0, 9.0, 19.0, 23.0, 14.0, 30.0, 36.0, 39.0, 43.0, 51.0, 75.0, 57.0, 80.0, 60.0, 56.0, 62.0, 60.0, 45.0, 37.0, 34.0, 38.0, 24.0, 15.0, 16.0, 9.0, 8.0, 6.0, 0.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73828125, -2.633453369140625, -2.52862548828125, -2.423797607421875, -2.3189697265625, -2.214141845703125, -2.10931396484375, -2.004486083984375, -1.899658203125, -1.794830322265625, -1.69000244140625, -1.585174560546875, -1.4803466796875, -1.375518798828125, -1.27069091796875, -1.165863037109375, -1.06103515625, -0.956207275390625, -0.85137939453125, -0.746551513671875, -0.6417236328125, -0.536895751953125, -0.43206787109375, -0.327239990234375, -0.222412109375, -0.117584228515625, -0.01275634765625, 0.092071533203125, 0.1968994140625, 0.301727294921875, 0.40655517578125, 0.511383056640625, 0.6162109375, 0.721038818359375, 0.82586669921875, 0.930694580078125, 1.0355224609375, 1.140350341796875, 1.24517822265625, 1.350006103515625, 1.454833984375, 1.559661865234375, 1.66448974609375, 1.769317626953125, 1.8741455078125, 1.978973388671875, 2.08380126953125, 2.188629150390625, 2.29345703125, 2.398284912109375, 2.50311279296875, 2.607940673828125, 2.7127685546875, 2.817596435546875, 2.92242431640625, 3.027252197265625, 3.132080078125, 3.236907958984375, 3.34173583984375, 3.446563720703125, 3.5513916015625, 3.656219482421875, 3.76104736328125, 3.865875244140625, 3.970703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 7.0, 7.0, 8.0, 3.0, 14.0, 19.0, 17.0, 24.0, 37.0, 61.0, 98.0, 125.0, 234.0, 386.0, 786.0, 1553.0, 3600.0, 9300.0, 27990.0, 100194.0, 610582.0, 213967.0, 52849.0, 16244.0, 5755.0, 2314.0, 1040.0, 500.0, 300.0, 186.0, 111.0, 73.0, 41.0, 33.0, 28.0, 20.0, 17.0, 11.0, 7.0, 2.0, 8.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5517578125, -0.5363273620605469, -0.5208969116210938, -0.5054664611816406, -0.4900360107421875, -0.4746055603027344, -0.45917510986328125, -0.4437446594238281, -0.428314208984375, -0.4128837585449219, -0.39745330810546875, -0.3820228576660156, -0.3665924072265625, -0.3511619567871094, -0.33573150634765625, -0.3203010559082031, -0.30487060546875, -0.2894401550292969, -0.27400970458984375, -0.2585792541503906, -0.2431488037109375, -0.22771835327148438, -0.21228790283203125, -0.19685745239257812, -0.181427001953125, -0.16599655151367188, -0.15056610107421875, -0.13513565063476562, -0.1197052001953125, -0.10427474975585938, -0.08884429931640625, -0.07341384887695312, -0.0579833984375, -0.042552947998046875, -0.02712249755859375, -0.011692047119140625, 0.0037384033203125, 0.019168853759765625, 0.03459930419921875, 0.050029754638671875, 0.065460205078125, 0.08089065551757812, 0.09632110595703125, 0.11175155639648438, 0.1271820068359375, 0.14261245727539062, 0.15804290771484375, 0.17347335815429688, 0.18890380859375, 0.20433425903320312, 0.21976470947265625, 0.23519515991210938, 0.2506256103515625, 0.2660560607910156, 0.28148651123046875, 0.2969169616699219, 0.312347412109375, 0.3277778625488281, 0.34320831298828125, 0.3586387634277344, 0.3740692138671875, 0.3894996643066406, 0.40493011474609375, 0.4203605651855469, 0.435791015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 3.0, 8.0, 6.0, 14.0, 6.0, 15.0, 17.0, 20.0, 35.0, 50.0, 61.0, 86.0, 103.0, 93.0, 115.0, 78.0, 55.0, 45.0, 47.0, 31.0, 28.0, 25.0, 18.0, 8.0, 7.0, 4.0, 5.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0001710653305053711, -0.00016509182751178741, -0.00015911832451820374, -0.00015314482152462006, -0.00014717131853103638, -0.0001411978155374527, -0.00013522431254386902, -0.00012925080955028534, -0.00012327730655670166, -0.00011730380356311798, -0.0001113303005695343, -0.00010535679757595062, -9.938329458236694e-05, -9.340979158878326e-05, -8.743628859519958e-05, -8.14627856016159e-05, -7.548928260803223e-05, -6.951577961444855e-05, -6.354227662086487e-05, -5.756877362728119e-05, -5.159527063369751e-05, -4.562176764011383e-05, -3.964826464653015e-05, -3.367476165294647e-05, -2.7701258659362793e-05, -2.1727755665779114e-05, -1.5754252672195435e-05, -9.780749678611755e-06, -3.807246685028076e-06, 2.166256308555603e-06, 8.139759302139282e-06, 1.4113262295722961e-05, 2.008676528930664e-05, 2.606026828289032e-05, 3.2033771276474e-05, 3.800727427005768e-05, 4.398077726364136e-05, 4.995428025722504e-05, 5.5927783250808716e-05, 6.19012862443924e-05, 6.787478923797607e-05, 7.384829223155975e-05, 7.982179522514343e-05, 8.579529821872711e-05, 9.176880121231079e-05, 9.774230420589447e-05, 0.00010371580719947815, 0.00010968931019306183, 0.00011566281318664551, 0.00012163631618022919, 0.00012760981917381287, 0.00013358332216739655, 0.00013955682516098022, 0.0001455303281545639, 0.00015150383114814758, 0.00015747733414173126, 0.00016345083713531494, 0.00016942434012889862, 0.0001753978431224823, 0.00018137134611606598, 0.00018734484910964966, 0.00019331835210323334, 0.00019929185509681702, 0.0002052653580904007, 0.00021123886108398438]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 8.0, 3.0, 9.0, 23.0, 19.0, 25.0, 34.0, 58.0, 115.0, 220.0, 329.0, 569.0, 1303.0, 3572.0, 12524.0, 61871.0, 630410.0, 280794.0, 42019.0, 9425.0, 2808.0, 1139.0, 582.0, 282.0, 140.0, 90.0, 71.0, 41.0, 15.0, 12.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66943359375, -0.649078369140625, -0.62872314453125, -0.608367919921875, -0.5880126953125, -0.567657470703125, -0.54730224609375, -0.526947021484375, -0.506591796875, -0.486236572265625, -0.46588134765625, -0.445526123046875, -0.4251708984375, -0.404815673828125, -0.38446044921875, -0.364105224609375, -0.34375, -0.323394775390625, -0.30303955078125, -0.282684326171875, -0.2623291015625, -0.241973876953125, -0.22161865234375, -0.201263427734375, -0.180908203125, -0.160552978515625, -0.14019775390625, -0.119842529296875, -0.0994873046875, -0.079132080078125, -0.05877685546875, -0.038421630859375, -0.01806640625, 0.002288818359375, 0.02264404296875, 0.042999267578125, 0.0633544921875, 0.083709716796875, 0.10406494140625, 0.124420166015625, 0.144775390625, 0.165130615234375, 0.18548583984375, 0.205841064453125, 0.2261962890625, 0.246551513671875, 0.26690673828125, 0.287261962890625, 0.3076171875, 0.327972412109375, 0.34832763671875, 0.368682861328125, 0.3890380859375, 0.409393310546875, 0.42974853515625, 0.450103759765625, 0.470458984375, 0.490814208984375, 0.51116943359375, 0.531524658203125, 0.5518798828125, 0.572235107421875, 0.59259033203125, 0.612945556640625, 0.63330078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 9.0, 5.0, 10.0, 8.0, 11.0, 10.0, 13.0, 22.0, 20.0, 20.0, 40.0, 43.0, 48.0, 76.0, 80.0, 86.0, 66.0, 72.0, 66.0, 59.0, 42.0, 38.0, 32.0, 23.0, 12.0, 22.0, 10.0, 6.0, 6.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.5023002624511719, -0.48653411865234375, -0.4707679748535156, -0.4550018310546875, -0.4392356872558594, -0.42346954345703125, -0.4077033996582031, -0.391937255859375, -0.3761711120605469, -0.36040496826171875, -0.3446388244628906, -0.3288726806640625, -0.3131065368652344, -0.29734039306640625, -0.2815742492675781, -0.26580810546875, -0.2500419616699219, -0.23427581787109375, -0.21850967407226562, -0.2027435302734375, -0.18697738647460938, -0.17121124267578125, -0.15544509887695312, -0.139678955078125, -0.12391281127929688, -0.10814666748046875, -0.09238052368164062, -0.0766143798828125, -0.060848236083984375, -0.04508209228515625, -0.029315948486328125, -0.0135498046875, 0.002216339111328125, 0.01798248291015625, 0.033748626708984375, 0.0495147705078125, 0.06528091430664062, 0.08104705810546875, 0.09681320190429688, 0.112579345703125, 0.12834548950195312, 0.14411163330078125, 0.15987777709960938, 0.1756439208984375, 0.19141006469726562, 0.20717620849609375, 0.22294235229492188, 0.23870849609375, 0.2544746398925781, 0.27024078369140625, 0.2860069274902344, 0.3017730712890625, 0.3175392150878906, 0.33330535888671875, 0.3490715026855469, 0.364837646484375, 0.3806037902832031, 0.39636993408203125, 0.4121360778808594, 0.4279022216796875, 0.4436683654785156, 0.45943450927734375, 0.4752006530761719, 0.490966796875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 18.0, 10.0, 29.0, 51.0, 102.0, 170.0, 298.0, 132.0, 79.0, 58.0, 23.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.802608489990234, -20.228418350219727, -19.65422821044922, -19.08003807067871, -18.505847930908203, -17.931657791137695, -17.357467651367188, -16.783279418945312, -16.209087371826172, -15.634897232055664, -15.060707092285156, -14.486516952514648, -13.91232681274414, -13.338136672973633, -12.763947486877441, -12.189757347106934, -11.615568161010742, -11.041378021240234, -10.467187881469727, -9.892997741699219, -9.318807601928711, -8.744617462158203, -8.170428276062012, -7.596238136291504, -7.022047996520996, -6.447857856750488, -5.8736677169799805, -5.299478054046631, -4.725287914276123, -4.151097774505615, -3.5769078731536865, -3.002717971801758, -2.428529739379883, -1.8543397188186646, -1.2801496982574463, -0.705959677696228, -0.13176965713500977, 0.44242048263549805, 1.0166103839874268, 1.5908002853393555, 2.1649904251098633, 2.739180564880371, 3.3133704662323, 3.8875603675842285, 4.461750507354736, 5.035940647125244, 5.610130310058594, 6.184320449829102, 6.758510589599609, 7.332700729370117, 7.906890869140625, 8.481081008911133, 9.05527114868164, 9.629461288452148, 10.20365047454834, 10.777840614318848, 11.352030754089355, 11.926220893859863, 12.500411033630371, 13.074601173400879, 13.64879035949707, 14.222980499267578, 14.797170639038086, 15.371360778808594, 15.945550918579102]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 8.0, 12.0, 12.0, 16.0, 22.0, 27.0, 30.0, 22.0, 29.0, 22.0, 32.0, 41.0, 50.0, 81.0, 116.0, 99.0, 57.0, 44.0, 38.0, 32.0, 34.0, 25.0, 31.0, 19.0, 14.0, 9.0, 8.0, 8.0, 11.0, 8.0, 2.0, 7.0, 10.0, 1.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.73277759552002, -12.387369155883789, -12.041961669921875, -11.696554183959961, -11.35114574432373, -11.0057373046875, -10.660329818725586, -10.314922332763672, -9.969513893127441, -9.624105453491211, -9.278697967529297, -8.933290481567383, -8.587882041931152, -8.242473602294922, -7.897066116333008, -7.5516581535339355, -7.206250190734863, -6.860842227935791, -6.515434265136719, -6.1700263023376465, -5.824618339538574, -5.479210376739502, -5.13380241394043, -4.788394451141357, -4.442986488342285, -4.097578525543213, -3.7521705627441406, -3.4067625999450684, -3.061354637145996, -2.715946674346924, -2.3705387115478516, -2.0251307487487793, -1.679722785949707, -1.3343148231506348, -0.9889068603515625, -0.6434988975524902, -0.29809093475341797, 0.0473170280456543, 0.39272499084472656, 0.7381329536437988, 1.083540916442871, 1.4289488792419434, 1.7743568420410156, 2.119764804840088, 2.46517276763916, 2.8105807304382324, 3.1559886932373047, 3.501396656036377, 3.846804618835449, 4.1922125816345215, 4.537620544433594, 4.883028507232666, 5.228436470031738, 5.5738444328308105, 5.919252395629883, 6.264660358428955, 6.610068321228027, 6.9554762840271, 7.300884246826172, 7.646292209625244, 7.991700172424316, 8.337108612060547, 8.682516098022461, 9.027923583984375, 9.373332023620605]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 11.0, 21.0, 15.0, 26.0, 58.0, 59.0, 93.0, 165.0, 260.0, 455.0, 853.0, 1549.0, 3761.0, 10311.0, 36010.0, 164310.0, 869684.0, 2086854.0, 810885.0, 157041.0, 34599.0, 10060.0, 3675.0, 1571.0, 784.0, 436.0, 288.0, 156.0, 81.0, 75.0, 44.0, 29.0, 21.0, 9.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.6380157470703125, -0.613922119140625, -0.5898284912109375, -0.56573486328125, -0.5416412353515625, -0.517547607421875, -0.4934539794921875, -0.4693603515625, -0.4452667236328125, -0.421173095703125, -0.3970794677734375, -0.37298583984375, -0.3488922119140625, -0.324798583984375, -0.3007049560546875, -0.276611328125, -0.2525177001953125, -0.228424072265625, -0.2043304443359375, -0.18023681640625, -0.1561431884765625, -0.132049560546875, -0.1079559326171875, -0.0838623046875, -0.0597686767578125, -0.035675048828125, -0.0115814208984375, 0.01251220703125, 0.0366058349609375, 0.060699462890625, 0.0847930908203125, 0.10888671875, 0.1329803466796875, 0.157073974609375, 0.1811676025390625, 0.20526123046875, 0.2293548583984375, 0.253448486328125, 0.2775421142578125, 0.3016357421875, 0.3257293701171875, 0.349822998046875, 0.3739166259765625, 0.39801025390625, 0.4221038818359375, 0.446197509765625, 0.4702911376953125, 0.494384765625, 0.5184783935546875, 0.542572021484375, 0.5666656494140625, 0.59075927734375, 0.6148529052734375, 0.638946533203125, 0.6630401611328125, 0.6871337890625, 0.7112274169921875, 0.735321044921875, 0.7594146728515625, 0.78350830078125, 0.8076019287109375, 0.831695556640625, 0.8557891845703125, 0.8798828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 10.0, 6.0, 9.0, 10.0, 17.0, 19.0, 19.0, 24.0, 32.0, 37.0, 37.0, 32.0, 64.0, 44.0, 57.0, 53.0, 57.0, 61.0, 55.0, 48.0, 41.0, 44.0, 48.0, 29.0, 29.0, 27.0, 20.0, 12.0, 18.0, 7.0, 9.0, 11.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76513671875, -0.7414627075195312, -0.7177886962890625, -0.6941146850585938, -0.670440673828125, -0.6467666625976562, -0.6230926513671875, -0.5994186401367188, -0.57574462890625, -0.5520706176757812, -0.5283966064453125, -0.5047225952148438, -0.481048583984375, -0.45737457275390625, -0.4337005615234375, -0.41002655029296875, -0.3863525390625, -0.36267852783203125, -0.3390045166015625, -0.31533050537109375, -0.291656494140625, -0.26798248291015625, -0.2443084716796875, -0.22063446044921875, -0.19696044921875, -0.17328643798828125, -0.1496124267578125, -0.12593841552734375, -0.102264404296875, -0.07859039306640625, -0.0549163818359375, -0.03124237060546875, -0.007568359375, 0.01610565185546875, 0.0397796630859375, 0.06345367431640625, 0.087127685546875, 0.11080169677734375, 0.1344757080078125, 0.15814971923828125, 0.18182373046875, 0.20549774169921875, 0.2291717529296875, 0.25284576416015625, 0.276519775390625, 0.30019378662109375, 0.3238677978515625, 0.34754180908203125, 0.3712158203125, 0.39488983154296875, 0.4185638427734375, 0.44223785400390625, 0.465911865234375, 0.48958587646484375, 0.5132598876953125, 0.5369338989257812, 0.56060791015625, 0.5842819213867188, 0.6079559326171875, 0.6316299438476562, 0.655303955078125, 0.6789779663085938, 0.7026519775390625, 0.7263259887695312, 0.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 12.0, 10.0, 36.0, 83.0, 181.0, 338.0, 912.0, 11294.0, 4045942.0, 132319.0, 2155.0, 510.0, 266.0, 120.0, 56.0, 26.0, 12.0, 13.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25, -3.08526611328125, -2.9205322265625, -2.75579833984375, -2.591064453125, -2.42633056640625, -2.2615966796875, -2.09686279296875, -1.93212890625, -1.76739501953125, -1.6026611328125, -1.43792724609375, -1.273193359375, -1.10845947265625, -0.9437255859375, -0.77899169921875, -0.6142578125, -0.44952392578125, -0.2847900390625, -0.12005615234375, 0.044677734375, 0.20941162109375, 0.3741455078125, 0.53887939453125, 0.70361328125, 0.86834716796875, 1.0330810546875, 1.19781494140625, 1.362548828125, 1.52728271484375, 1.6920166015625, 1.85675048828125, 2.021484375, 2.18621826171875, 2.3509521484375, 2.51568603515625, 2.680419921875, 2.84515380859375, 3.0098876953125, 3.17462158203125, 3.33935546875, 3.50408935546875, 3.6688232421875, 3.83355712890625, 3.998291015625, 4.16302490234375, 4.3277587890625, 4.49249267578125, 4.6572265625, 4.82196044921875, 4.9866943359375, 5.15142822265625, 5.316162109375, 5.48089599609375, 5.6456298828125, 5.81036376953125, 5.97509765625, 6.13983154296875, 6.3045654296875, 6.46929931640625, 6.634033203125, 6.79876708984375, 6.9635009765625, 7.12823486328125, 7.29296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 10.0, 13.0, 21.0, 61.0, 133.0, 280.0, 686.0, 1243.0, 869.0, 420.0, 156.0, 81.0, 30.0, 29.0, 8.0, 16.0, 6.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.869140625, -1.773895263671875, -1.67864990234375, -1.583404541015625, -1.4881591796875, -1.392913818359375, -1.29766845703125, -1.202423095703125, -1.107177734375, -1.011932373046875, -0.91668701171875, -0.821441650390625, -0.7261962890625, -0.630950927734375, -0.53570556640625, -0.440460205078125, -0.34521484375, -0.249969482421875, -0.15472412109375, -0.059478759765625, 0.0357666015625, 0.131011962890625, 0.22625732421875, 0.321502685546875, 0.416748046875, 0.511993408203125, 0.60723876953125, 0.702484130859375, 0.7977294921875, 0.892974853515625, 0.98822021484375, 1.083465576171875, 1.1787109375, 1.273956298828125, 1.36920166015625, 1.464447021484375, 1.5596923828125, 1.654937744140625, 1.75018310546875, 1.845428466796875, 1.940673828125, 2.035919189453125, 2.13116455078125, 2.226409912109375, 2.3216552734375, 2.416900634765625, 2.51214599609375, 2.607391357421875, 2.70263671875, 2.797882080078125, 2.89312744140625, 2.988372802734375, 3.0836181640625, 3.178863525390625, 3.27410888671875, 3.369354248046875, 3.464599609375, 3.559844970703125, 3.65509033203125, 3.750335693359375, 3.8455810546875, 3.940826416015625, 4.03607177734375, 4.131317138671875, 4.2265625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 23.0, 60.0, 237.0, 376.0, 198.0, 47.0, 29.0, 10.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.704120635986328, -22.638961791992188, -21.573802947998047, -20.508642196655273, -19.443483352661133, -18.378324508666992, -17.31316375732422, -16.248004913330078, -15.182846069335938, -14.117687225341797, -13.05252742767334, -11.987367630004883, -10.922208786010742, -9.857049942016602, -8.791890144348145, -7.726730823516846, -6.661571502685547, -5.596412181854248, -4.531252861022949, -3.4660935401916504, -2.4009342193603516, -1.3357748985290527, -0.2706155776977539, 0.7945437431335449, 1.8597030639648438, 2.9248623847961426, 3.9900217056274414, 5.05518102645874, 6.120340347290039, 7.185499668121338, 8.250658988952637, 9.315818786621094, 10.380973815917969, 11.44613265991211, 12.511292457580566, 13.576452255249023, 14.641611099243164, 15.706769943237305, 16.771930694580078, 17.83708953857422, 18.90224838256836, 19.9674072265625, 21.03256607055664, 22.097726821899414, 23.162885665893555, 24.228044509887695, 25.29320526123047, 26.35836410522461, 27.42352294921875, 28.48868179321289, 29.55384063720703, 30.619001388549805, 31.684160232543945, 32.74932098388672, 33.81447982788086, 34.879638671875, 35.94479751586914, 37.00995635986328, 38.07511520385742, 39.14027404785156, 40.20543670654297, 41.27059555053711, 42.33575439453125, 43.40091323852539, 44.46607208251953]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 7.0, 8.0, 8.0, 17.0, 18.0, 17.0, 14.0, 34.0, 30.0, 38.0, 21.0, 27.0, 33.0, 39.0, 49.0, 56.0, 44.0, 47.0, 59.0, 46.0, 53.0, 44.0, 32.0, 35.0, 22.0, 33.0, 35.0, 22.0, 21.0, 16.0, 12.0, 12.0, 10.0, 7.0, 6.0, 10.0, 8.0, 0.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0], "bins": [-9.743474960327148, -9.488177299499512, -9.232880592346191, -8.977582931518555, -8.722286224365234, -8.466988563537598, -8.211691856384277, -7.956394195556641, -7.701097011566162, -7.445799827575684, -7.190502643585205, -6.935205459594727, -6.67990779876709, -6.4246110916137695, -6.169313430786133, -5.914016246795654, -5.658719062805176, -5.403421878814697, -5.148124694824219, -4.89282751083374, -4.637530326843262, -4.382232666015625, -4.1269354820251465, -3.871638298034668, -3.6163411140441895, -3.361043930053711, -3.1057467460632324, -2.850449323654175, -2.5951521396636963, -2.3398549556732178, -2.08455753326416, -1.8292603492736816, -1.5739641189575195, -1.318666934967041, -1.063369631767273, -0.8080723881721497, -0.5527751445770264, -0.29747796058654785, -0.042180657386779785, 0.21311664581298828, 0.4684138298034668, 0.7237110733985901, 0.9790083169937134, 1.2343056201934814, 1.48960280418396, 1.7448999881744385, 2.000197410583496, 2.2554945945739746, 2.510791778564453, 2.7660889625549316, 3.02138614654541, 3.2766835689544678, 3.5319807529449463, 3.787277936935425, 4.042575359344482, 4.297872543334961, 4.5531697273254395, 4.808466911315918, 5.0637640953063965, 5.319061279296875, 5.574358940124512, 5.829655647277832, 6.084953308105469, 6.340250492095947, 6.595547676086426]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 9.0, 13.0, 17.0, 39.0, 41.0, 71.0, 83.0, 164.0, 259.0, 401.0, 648.0, 1150.0, 1962.0, 3512.0, 6453.0, 12196.0, 24648.0, 53073.0, 124137.0, 276367.0, 292264.0, 136779.0, 58551.0, 26963.0, 13142.0, 6809.0, 3757.0, 2046.0, 1200.0, 646.0, 404.0, 255.0, 172.0, 104.0, 62.0, 42.0, 33.0, 22.0, 18.0, 10.0, 6.0, 4.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1015625, -1.064910888671875, -1.02825927734375, -0.991607666015625, -0.9549560546875, -0.918304443359375, -0.88165283203125, -0.845001220703125, -0.808349609375, -0.771697998046875, -0.73504638671875, -0.698394775390625, -0.6617431640625, -0.625091552734375, -0.58843994140625, -0.551788330078125, -0.51513671875, -0.478485107421875, -0.44183349609375, -0.405181884765625, -0.3685302734375, -0.331878662109375, -0.29522705078125, -0.258575439453125, -0.221923828125, -0.185272216796875, -0.14862060546875, -0.111968994140625, -0.0753173828125, -0.038665771484375, -0.00201416015625, 0.034637451171875, 0.0712890625, 0.107940673828125, 0.14459228515625, 0.181243896484375, 0.2178955078125, 0.254547119140625, 0.29119873046875, 0.327850341796875, 0.364501953125, 0.401153564453125, 0.43780517578125, 0.474456787109375, 0.5111083984375, 0.547760009765625, 0.58441162109375, 0.621063232421875, 0.65771484375, 0.694366455078125, 0.73101806640625, 0.767669677734375, 0.8043212890625, 0.840972900390625, 0.87762451171875, 0.914276123046875, 0.950927734375, 0.987579345703125, 1.02423095703125, 1.060882568359375, 1.0975341796875, 1.134185791015625, 1.17083740234375, 1.207489013671875, 1.244140625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 8.0, 2.0, 2.0, 7.0, 7.0, 8.0, 12.0, 14.0, 10.0, 11.0, 10.0, 12.0, 23.0, 31.0, 33.0, 24.0, 26.0, 30.0, 63.0, 42.0, 58.0, 43.0, 57.0, 52.0, 37.0, 42.0, 44.0, 46.0, 24.0, 38.0, 27.0, 23.0, 29.0, 16.0, 20.0, 17.0, 17.0, 8.0, 9.0, 9.0, 3.0, 6.0, 1.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.69580078125, -0.6737747192382812, -0.6517486572265625, -0.6297225952148438, -0.607696533203125, -0.5856704711914062, -0.5636444091796875, -0.5416183471679688, -0.51959228515625, -0.49756622314453125, -0.4755401611328125, -0.45351409912109375, -0.431488037109375, -0.40946197509765625, -0.3874359130859375, -0.36540985107421875, -0.3433837890625, -0.32135772705078125, -0.2993316650390625, -0.27730560302734375, -0.255279541015625, -0.23325347900390625, -0.2112274169921875, -0.18920135498046875, -0.16717529296875, -0.14514923095703125, -0.1231231689453125, -0.10109710693359375, -0.079071044921875, -0.05704498291015625, -0.0350189208984375, -0.01299285888671875, 0.009033203125, 0.03105926513671875, 0.0530853271484375, 0.07511138916015625, 0.097137451171875, 0.11916351318359375, 0.1411895751953125, 0.16321563720703125, 0.18524169921875, 0.20726776123046875, 0.2292938232421875, 0.25131988525390625, 0.273345947265625, 0.29537200927734375, 0.3173980712890625, 0.33942413330078125, 0.3614501953125, 0.38347625732421875, 0.4055023193359375, 0.42752838134765625, 0.449554443359375, 0.47158050537109375, 0.4936065673828125, 0.5156326293945312, 0.53765869140625, 0.5596847534179688, 0.5817108154296875, 0.6037368774414062, 0.625762939453125, 0.6477890014648438, 0.6698150634765625, 0.6918411254882812, 0.7138671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 11.0, 9.0, 12.0, 28.0, 41.0, 72.0, 134.0, 221.0, 465.0, 981.0, 2311.0, 9354.0, 111561.0, 863263.0, 50755.0, 5923.0, 1764.0, 777.0, 392.0, 213.0, 110.0, 62.0, 39.0, 22.0, 12.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.544921875, -3.419952392578125, -3.29498291015625, -3.170013427734375, -3.0450439453125, -2.920074462890625, -2.79510498046875, -2.670135498046875, -2.545166015625, -2.420196533203125, -2.29522705078125, -2.170257568359375, -2.0452880859375, -1.920318603515625, -1.79534912109375, -1.670379638671875, -1.54541015625, -1.420440673828125, -1.29547119140625, -1.170501708984375, -1.0455322265625, -0.920562744140625, -0.79559326171875, -0.670623779296875, -0.545654296875, -0.420684814453125, -0.29571533203125, -0.170745849609375, -0.0457763671875, 0.079193115234375, 0.20416259765625, 0.329132080078125, 0.4541015625, 0.579071044921875, 0.70404052734375, 0.829010009765625, 0.9539794921875, 1.078948974609375, 1.20391845703125, 1.328887939453125, 1.453857421875, 1.578826904296875, 1.70379638671875, 1.828765869140625, 1.9537353515625, 2.078704833984375, 2.20367431640625, 2.328643798828125, 2.45361328125, 2.578582763671875, 2.70355224609375, 2.828521728515625, 2.9534912109375, 3.078460693359375, 3.20343017578125, 3.328399658203125, 3.453369140625, 3.578338623046875, 3.70330810546875, 3.828277587890625, 3.9532470703125, 4.078216552734375, 4.20318603515625, 4.328155517578125, 4.453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 8.0, 16.0, 14.0, 30.0, 38.0, 56.0, 66.0, 61.0, 74.0, 89.0, 98.0, 99.0, 85.0, 71.0, 52.0, 32.0, 28.0, 22.0, 14.0, 12.0, 13.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.302734375, -3.153839111328125, -3.00494384765625, -2.856048583984375, -2.7071533203125, -2.558258056640625, -2.40936279296875, -2.260467529296875, -2.111572265625, -1.962677001953125, -1.81378173828125, -1.664886474609375, -1.5159912109375, -1.367095947265625, -1.21820068359375, -1.069305419921875, -0.92041015625, -0.771514892578125, -0.62261962890625, -0.473724365234375, -0.3248291015625, -0.175933837890625, -0.02703857421875, 0.121856689453125, 0.270751953125, 0.419647216796875, 0.56854248046875, 0.717437744140625, 0.8663330078125, 1.015228271484375, 1.16412353515625, 1.313018798828125, 1.4619140625, 1.610809326171875, 1.75970458984375, 1.908599853515625, 2.0574951171875, 2.206390380859375, 2.35528564453125, 2.504180908203125, 2.653076171875, 2.801971435546875, 2.95086669921875, 3.099761962890625, 3.2486572265625, 3.397552490234375, 3.54644775390625, 3.695343017578125, 3.84423828125, 3.993133544921875, 4.14202880859375, 4.290924072265625, 4.4398193359375, 4.588714599609375, 4.73760986328125, 4.886505126953125, 5.035400390625, 5.184295654296875, 5.33319091796875, 5.482086181640625, 5.6309814453125, 5.779876708984375, 5.92877197265625, 6.077667236328125, 6.2265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 6.0, 5.0, 7.0, 23.0, 27.0, 40.0, 51.0, 114.0, 234.0, 469.0, 1113.0, 3112.0, 11848.0, 72676.0, 792554.0, 140268.0, 18943.0, 4427.0, 1424.0, 613.0, 251.0, 140.0, 63.0, 55.0, 28.0, 24.0, 12.0, 6.0, 8.0, 11.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6572265625, -0.6315994262695312, -0.6059722900390625, -0.5803451538085938, -0.554718017578125, -0.5290908813476562, -0.5034637451171875, -0.47783660888671875, -0.45220947265625, -0.42658233642578125, -0.4009552001953125, -0.37532806396484375, -0.349700927734375, -0.32407379150390625, -0.2984466552734375, -0.27281951904296875, -0.2471923828125, -0.22156524658203125, -0.1959381103515625, -0.17031097412109375, -0.144683837890625, -0.11905670166015625, -0.0934295654296875, -0.06780242919921875, -0.04217529296875, -0.01654815673828125, 0.0090789794921875, 0.03470611572265625, 0.060333251953125, 0.08596038818359375, 0.1115875244140625, 0.13721466064453125, 0.162841796875, 0.18846893310546875, 0.2140960693359375, 0.23972320556640625, 0.265350341796875, 0.29097747802734375, 0.3166046142578125, 0.34223175048828125, 0.36785888671875, 0.39348602294921875, 0.4191131591796875, 0.44474029541015625, 0.470367431640625, 0.49599456787109375, 0.5216217041015625, 0.5472488403320312, 0.5728759765625, 0.5985031127929688, 0.6241302490234375, 0.6497573852539062, 0.675384521484375, 0.7010116577148438, 0.7266387939453125, 0.7522659301757812, 0.77789306640625, 0.8035202026367188, 0.8291473388671875, 0.8547744750976562, 0.880401611328125, 0.9060287475585938, 0.9316558837890625, 0.9572830200195312, 0.98291015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 11.0, 11.0, 11.0, 31.0, 35.0, 42.0, 77.0, 112.0, 173.0, 166.0, 115.0, 58.0, 37.0, 36.0, 19.0, 12.0, 16.0, 14.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038623809814453125, -0.00037449970841407776, -0.00036276131868362427, -0.0003510229289531708, -0.0003392845392227173, -0.0003275461494922638, -0.0003158077597618103, -0.0003040693700313568, -0.0002923309803009033, -0.00028059259057044983, -0.00026885420083999634, -0.00025711581110954285, -0.00024537742137908936, -0.00023363903164863586, -0.00022190064191818237, -0.00021016225218772888, -0.0001984238624572754, -0.0001866854727268219, -0.0001749470829963684, -0.00016320869326591492, -0.00015147030353546143, -0.00013973191380500793, -0.00012799352407455444, -0.00011625513434410095, -0.00010451674461364746, -9.277835488319397e-05, -8.103996515274048e-05, -6.930157542228699e-05, -5.7563185691833496e-05, -4.5824795961380005e-05, -3.4086406230926514e-05, -2.2348016500473022e-05, -1.0609626770019531e-05, 1.12876296043396e-06, 1.2867152690887451e-05, 2.4605542421340942e-05, 3.6343932151794434e-05, 4.8082321882247925e-05, 5.9820711612701416e-05, 7.155910134315491e-05, 8.32974910736084e-05, 9.503588080406189e-05, 0.00010677427053451538, 0.00011851266026496887, 0.00013025104999542236, 0.00014198943972587585, 0.00015372782945632935, 0.00016546621918678284, 0.00017720460891723633, 0.00018894299864768982, 0.0002006813883781433, 0.0002124197781085968, 0.0002241581678390503, 0.00023589655756950378, 0.0002476349472999573, 0.00025937333703041077, 0.00027111172676086426, 0.00028285011649131775, 0.00029458850622177124, 0.00030632689595222473, 0.0003180652856826782, 0.0003298036754131317, 0.0003415420651435852, 0.0003532804548740387, 0.0003650188446044922]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 4.0, 3.0, 6.0, 7.0, 17.0, 22.0, 29.0, 38.0, 58.0, 79.0, 178.0, 290.0, 448.0, 920.0, 2232.0, 6509.0, 28665.0, 224388.0, 709796.0, 58325.0, 10637.0, 3198.0, 1277.0, 584.0, 315.0, 187.0, 109.0, 82.0, 46.0, 32.0, 28.0, 10.0, 7.0, 9.0, 3.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63671875, -0.616302490234375, -0.59588623046875, -0.575469970703125, -0.5550537109375, -0.534637451171875, -0.51422119140625, -0.493804931640625, -0.473388671875, -0.452972412109375, -0.43255615234375, -0.412139892578125, -0.3917236328125, -0.371307373046875, -0.35089111328125, -0.330474853515625, -0.31005859375, -0.289642333984375, -0.26922607421875, -0.248809814453125, -0.2283935546875, -0.207977294921875, -0.18756103515625, -0.167144775390625, -0.146728515625, -0.126312255859375, -0.10589599609375, -0.085479736328125, -0.0650634765625, -0.044647216796875, -0.02423095703125, -0.003814697265625, 0.0166015625, 0.037017822265625, 0.05743408203125, 0.077850341796875, 0.0982666015625, 0.118682861328125, 0.13909912109375, 0.159515380859375, 0.179931640625, 0.200347900390625, 0.22076416015625, 0.241180419921875, 0.2615966796875, 0.282012939453125, 0.30242919921875, 0.322845458984375, 0.34326171875, 0.363677978515625, 0.38409423828125, 0.404510498046875, 0.4249267578125, 0.445343017578125, 0.46575927734375, 0.486175537109375, 0.506591796875, 0.527008056640625, 0.54742431640625, 0.567840576171875, 0.5882568359375, 0.608673095703125, 0.62908935546875, 0.649505615234375, 0.669921875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 5.0, 8.0, 3.0, 3.0, 10.0, 11.0, 21.0, 23.0, 27.0, 26.0, 37.0, 44.0, 52.0, 62.0, 76.0, 79.0, 81.0, 88.0, 64.0, 49.0, 48.0, 40.0, 30.0, 30.0, 19.0, 15.0, 9.0, 9.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5638885498046875, -0.547210693359375, -0.5305328369140625, -0.51385498046875, -0.4971771240234375, -0.480499267578125, -0.4638214111328125, -0.4471435546875, -0.4304656982421875, -0.413787841796875, -0.3971099853515625, -0.38043212890625, -0.3637542724609375, -0.347076416015625, -0.3303985595703125, -0.313720703125, -0.2970428466796875, -0.280364990234375, -0.2636871337890625, -0.24700927734375, -0.2303314208984375, -0.213653564453125, -0.1969757080078125, -0.1802978515625, -0.1636199951171875, -0.146942138671875, -0.1302642822265625, -0.11358642578125, -0.0969085693359375, -0.080230712890625, -0.0635528564453125, -0.046875, -0.0301971435546875, -0.013519287109375, 0.0031585693359375, 0.01983642578125, 0.0365142822265625, 0.053192138671875, 0.0698699951171875, 0.0865478515625, 0.1032257080078125, 0.119903564453125, 0.1365814208984375, 0.15325927734375, 0.1699371337890625, 0.186614990234375, 0.2032928466796875, 0.219970703125, 0.2366485595703125, 0.253326416015625, 0.2700042724609375, 0.28668212890625, 0.3033599853515625, 0.320037841796875, 0.3367156982421875, 0.3533935546875, 0.3700714111328125, 0.386749267578125, 0.4034271240234375, 0.42010498046875, 0.4367828369140625, 0.453460693359375, 0.4701385498046875, 0.48681640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 11.0, 42.0, 60.0, 126.0, 382.0, 180.0, 96.0, 47.0, 21.0, 9.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.90968132019043, -23.1590576171875, -22.40843391418457, -21.65781021118164, -20.907188415527344, -20.156564712524414, -19.405941009521484, -18.655317306518555, -17.904693603515625, -17.154069900512695, -16.403446197509766, -15.652823448181152, -14.902199745178223, -14.151576042175293, -13.40095329284668, -12.65032958984375, -11.89970588684082, -11.14908218383789, -10.398458480834961, -9.647835731506348, -8.897212028503418, -8.146588325500488, -7.395965099334717, -6.645341873168945, -5.894718170166016, -5.144094467163086, -4.3934712409973145, -3.642847776412964, -2.8922243118286133, -2.1416008472442627, -1.390977382659912, -0.6403541564941406, 0.11027145385742188, 0.8608949184417725, 1.611518383026123, 2.3621418476104736, 3.112765312194824, 3.863388776779175, 4.614012241363525, 5.364635467529297, 6.115259170532227, 6.865882873535156, 7.616506099700928, 8.3671293258667, 9.117753028869629, 9.868376731872559, 10.618999481201172, 11.369623184204102, 12.120246887207031, 12.870870590209961, 13.62149429321289, 14.372117042541504, 15.122740745544434, 15.873364448547363, 16.623987197875977, 17.374610900878906, 18.125234603881836, 18.875858306884766, 19.626482009887695, 20.377105712890625, 21.127727508544922, 21.87835121154785, 22.62897491455078, 23.37959861755371, 24.13022232055664]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 10.0, 15.0, 13.0, 15.0, 17.0, 27.0, 28.0, 29.0, 31.0, 44.0, 36.0, 48.0, 161.0, 167.0, 59.0, 41.0, 37.0, 27.0, 24.0, 36.0, 15.0, 24.0, 19.0, 15.0, 12.0, 10.0, 12.0, 4.0, 3.0, 7.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.678079605102539, -15.230937004089355, -14.783794403076172, -14.336651802062988, -13.889509201049805, -13.442366600036621, -12.995223999023438, -12.548081398010254, -12.10093879699707, -11.653796195983887, -11.206653594970703, -10.75951099395752, -10.312368392944336, -9.865225791931152, -9.418083190917969, -8.970940589904785, -8.523797988891602, -8.076655387878418, -7.629512786865234, -7.182370185852051, -6.735227584838867, -6.288084983825684, -5.8409423828125, -5.393799781799316, -4.946658134460449, -4.499515533447266, -4.052372932434082, -3.6052303314208984, -3.158087730407715, -2.7109453678131104, -2.2638027667999268, -1.8166601657867432, -1.3695173263549805, -0.9223747253417969, -0.47523218393325806, -0.02808964252471924, 0.41905295848846436, 0.8661954402923584, 1.313338041305542, 1.7604806423187256, 2.207623243331909, 2.6547658443450928, 3.1019084453582764, 3.549050807952881, 3.9961934089660645, 4.443336009979248, 4.890478610992432, 5.337621212005615, 5.784763813018799, 6.231906414031982, 6.679049015045166, 7.12619161605835, 7.573334217071533, 8.020476341247559, 8.467618942260742, 8.914761543273926, 9.36190414428711, 9.809046745300293, 10.256189346313477, 10.70333194732666, 11.150474548339844, 11.597617149353027, 12.044759750366211, 12.491902351379395, 12.939044952392578]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 4.0, 5.0, 6.0, 10.0, 13.0, 18.0, 35.0, 43.0, 57.0, 77.0, 113.0, 156.0, 227.0, 334.0, 507.0, 770.0, 1087.0, 1849.0, 3190.0, 5680.0, 11227.0, 24845.0, 62065.0, 173317.0, 488745.0, 1094812.0, 1272543.0, 646446.0, 253231.0, 88605.0, 32848.0, 14271.0, 7064.0, 3948.0, 2168.0, 1299.0, 849.0, 552.0, 376.0, 243.0, 176.0, 128.0, 97.0, 66.0, 45.0, 40.0, 27.0, 18.0, 17.0, 9.0, 16.0, 7.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.62744140625, -0.605926513671875, -0.58441162109375, -0.562896728515625, -0.5413818359375, -0.519866943359375, -0.49835205078125, -0.476837158203125, -0.455322265625, -0.433807373046875, -0.41229248046875, -0.390777587890625, -0.3692626953125, -0.347747802734375, -0.32623291015625, -0.304718017578125, -0.283203125, -0.261688232421875, -0.24017333984375, -0.218658447265625, -0.1971435546875, -0.175628662109375, -0.15411376953125, -0.132598876953125, -0.111083984375, -0.089569091796875, -0.06805419921875, -0.046539306640625, -0.0250244140625, -0.003509521484375, 0.01800537109375, 0.039520263671875, 0.06103515625, 0.082550048828125, 0.10406494140625, 0.125579833984375, 0.1470947265625, 0.168609619140625, 0.19012451171875, 0.211639404296875, 0.233154296875, 0.254669189453125, 0.27618408203125, 0.297698974609375, 0.3192138671875, 0.340728759765625, 0.36224365234375, 0.383758544921875, 0.4052734375, 0.426788330078125, 0.44830322265625, 0.469818115234375, 0.4913330078125, 0.512847900390625, 0.53436279296875, 0.555877685546875, 0.577392578125, 0.598907470703125, 0.62042236328125, 0.641937255859375, 0.6634521484375, 0.684967041015625, 0.70648193359375, 0.727996826171875, 0.74951171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 14.0, 14.0, 10.0, 11.0, 23.0, 15.0, 20.0, 27.0, 18.0, 28.0, 25.0, 22.0, 48.0, 39.0, 39.0, 41.0, 44.0, 47.0, 45.0, 45.0, 43.0, 44.0, 49.0, 34.0, 34.0, 32.0, 30.0, 28.0, 22.0, 13.0, 18.0, 8.0, 17.0, 7.0, 4.0, 6.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.59228515625, -0.5721893310546875, -0.552093505859375, -0.5319976806640625, -0.51190185546875, -0.4918060302734375, -0.471710205078125, -0.4516143798828125, -0.4315185546875, -0.4114227294921875, -0.391326904296875, -0.3712310791015625, -0.35113525390625, -0.3310394287109375, -0.310943603515625, -0.2908477783203125, -0.270751953125, -0.2506561279296875, -0.230560302734375, -0.2104644775390625, -0.19036865234375, -0.1702728271484375, -0.150177001953125, -0.1300811767578125, -0.1099853515625, -0.0898895263671875, -0.069793701171875, -0.0496978759765625, -0.02960205078125, -0.0095062255859375, 0.010589599609375, 0.0306854248046875, 0.05078125, 0.0708770751953125, 0.090972900390625, 0.1110687255859375, 0.13116455078125, 0.1512603759765625, 0.171356201171875, 0.1914520263671875, 0.2115478515625, 0.2316436767578125, 0.251739501953125, 0.2718353271484375, 0.29193115234375, 0.3120269775390625, 0.332122802734375, 0.3522186279296875, 0.372314453125, 0.3924102783203125, 0.412506103515625, 0.4326019287109375, 0.45269775390625, 0.4727935791015625, 0.492889404296875, 0.5129852294921875, 0.5330810546875, 0.5531768798828125, 0.573272705078125, 0.5933685302734375, 0.61346435546875, 0.6335601806640625, 0.653656005859375, 0.6737518310546875, 0.69384765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 6.0, 19.0, 26.0, 42.0, 61.0, 101.0, 173.0, 344.0, 654.0, 1270.0, 3741.0, 28064.0, 3798826.0, 347729.0, 8903.0, 2278.0, 941.0, 483.0, 259.0, 159.0, 74.0, 47.0, 21.0, 17.0, 12.0, 6.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.09765625, -4.9510498046875, -4.804443359375, -4.6578369140625, -4.51123046875, -4.3646240234375, -4.218017578125, -4.0714111328125, -3.9248046875, -3.7781982421875, -3.631591796875, -3.4849853515625, -3.33837890625, -3.1917724609375, -3.045166015625, -2.8985595703125, -2.751953125, -2.6053466796875, -2.458740234375, -2.3121337890625, -2.16552734375, -2.0189208984375, -1.872314453125, -1.7257080078125, -1.5791015625, -1.4324951171875, -1.285888671875, -1.1392822265625, -0.99267578125, -0.8460693359375, -0.699462890625, -0.5528564453125, -0.40625, -0.2596435546875, -0.113037109375, 0.0335693359375, 0.18017578125, 0.3267822265625, 0.473388671875, 0.6199951171875, 0.7666015625, 0.9132080078125, 1.059814453125, 1.2064208984375, 1.35302734375, 1.4996337890625, 1.646240234375, 1.7928466796875, 1.939453125, 2.0860595703125, 2.232666015625, 2.3792724609375, 2.52587890625, 2.6724853515625, 2.819091796875, 2.9656982421875, 3.1123046875, 3.2589111328125, 3.405517578125, 3.5521240234375, 3.69873046875, 3.8453369140625, 3.991943359375, 4.1385498046875, 4.28515625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 12.0, 9.0, 15.0, 24.0, 36.0, 48.0, 73.0, 120.0, 197.0, 255.0, 403.0, 587.0, 679.0, 554.0, 368.0, 222.0, 135.0, 117.0, 65.0, 58.0, 31.0, 19.0, 16.0, 10.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.07421875, -1.989105224609375, -1.90399169921875, -1.818878173828125, -1.7337646484375, -1.648651123046875, -1.56353759765625, -1.478424072265625, -1.393310546875, -1.308197021484375, -1.22308349609375, -1.137969970703125, -1.0528564453125, -0.967742919921875, -0.88262939453125, -0.797515869140625, -0.71240234375, -0.627288818359375, -0.54217529296875, -0.457061767578125, -0.3719482421875, -0.286834716796875, -0.20172119140625, -0.116607666015625, -0.031494140625, 0.053619384765625, 0.13873291015625, 0.223846435546875, 0.3089599609375, 0.394073486328125, 0.47918701171875, 0.564300537109375, 0.6494140625, 0.734527587890625, 0.81964111328125, 0.904754638671875, 0.9898681640625, 1.074981689453125, 1.16009521484375, 1.245208740234375, 1.330322265625, 1.415435791015625, 1.50054931640625, 1.585662841796875, 1.6707763671875, 1.755889892578125, 1.84100341796875, 1.926116943359375, 2.01123046875, 2.096343994140625, 2.18145751953125, 2.266571044921875, 2.3516845703125, 2.436798095703125, 2.52191162109375, 2.607025146484375, 2.692138671875, 2.777252197265625, 2.86236572265625, 2.947479248046875, 3.0325927734375, 3.117706298828125, 3.20281982421875, 3.287933349609375, 3.373046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 12.0, 28.0, 70.0, 215.0, 372.0, 201.0, 66.0, 22.0, 9.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.13917541503906, -50.42607879638672, -48.71297836303711, -46.999881744384766, -45.286781311035156, -43.57368469238281, -41.86058807373047, -40.14748764038086, -38.434391021728516, -36.72129440307617, -35.00819396972656, -33.29509735107422, -31.581998825073242, -29.868900299072266, -28.15580177307129, -26.442703247070312, -24.729604721069336, -23.01650619506836, -21.303407669067383, -19.590309143066406, -17.877212524414062, -16.164113998413086, -14.45101547241211, -12.73791790008545, -11.024819374084473, -9.311720848083496, -7.598623275756836, -5.885524749755859, -4.172426700592041, -2.4593286514282227, -0.7462301254272461, 0.9668674468994141, 2.6799659729003906, 4.393064022064209, 6.106162071228027, 7.819260597229004, 9.532358169555664, 11.24545669555664, 12.958555221557617, 14.671652793884277, 16.384750366210938, 18.097848892211914, 19.81094741821289, 21.524044036865234, 23.23714256286621, 24.950241088867188, 26.663339614868164, 28.37643814086914, 30.089536666870117, 31.802635192871094, 33.51573181152344, 35.22883224487305, 36.94192886352539, 38.655029296875, 40.368125915527344, 42.08122253417969, 43.7943229675293, 45.50741958618164, 47.22052001953125, 48.933616638183594, 50.6467170715332, 52.35981369018555, 54.072914123535156, 55.7860107421875, 57.499107360839844]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 11.0, 8.0, 14.0, 17.0, 22.0, 16.0, 28.0, 30.0, 32.0, 50.0, 40.0, 52.0, 45.0, 66.0, 68.0, 60.0, 52.0, 39.0, 58.0, 36.0, 44.0, 49.0, 23.0, 28.0, 25.0, 18.0, 15.0, 8.0, 15.0, 6.0, 11.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.97799301147461, -15.527382850646973, -15.076772689819336, -14.626163482666016, -14.175553321838379, -13.724943161010742, -13.274333953857422, -12.823723793029785, -12.373113632202148, -11.922503471374512, -11.471893310546875, -11.021284103393555, -10.570673942565918, -10.120063781738281, -9.669454574584961, -9.218844413757324, -8.768234252929688, -8.31762409210205, -7.867014408111572, -7.416404724121094, -6.965794563293457, -6.51518440246582, -6.064574718475342, -5.613965034484863, -5.163354873657227, -4.71274471282959, -4.262135028839111, -3.8115251064300537, -3.360915184020996, -2.9103052616119385, -2.459695339202881, -2.0090854167938232, -1.558476448059082, -1.1078665256500244, -0.6572566032409668, -0.20664668083190918, 0.24396324157714844, 0.694573163986206, 1.1451830863952637, 1.5957930088043213, 2.046402931213379, 2.4970128536224365, 2.947622776031494, 3.3982326984405518, 3.8488426208496094, 4.299452781677246, 4.750062465667725, 5.200672149658203, 5.65128231048584, 6.101892471313477, 6.552502155303955, 7.003111839294434, 7.45372200012207, 7.904332160949707, 8.354942321777344, 8.805551528930664, 9.2561616897583, 9.706771850585938, 10.157381057739258, 10.607991218566895, 11.058601379394531, 11.509211540222168, 11.959821701049805, 12.410430908203125, 12.861041069030762]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 11.0, 19.0, 22.0, 26.0, 46.0, 83.0, 123.0, 226.0, 385.0, 703.0, 1305.0, 2775.0, 5966.0, 14075.0, 36857.0, 109745.0, 470004.0, 284189.0, 75438.0, 26602.0, 10569.0, 4651.0, 2230.0, 1048.0, 587.0, 353.0, 177.0, 108.0, 72.0, 49.0, 28.0, 16.0, 11.0, 14.0, 14.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4453125, -1.3999176025390625, -1.354522705078125, -1.3091278076171875, -1.26373291015625, -1.2183380126953125, -1.172943115234375, -1.1275482177734375, -1.0821533203125, -1.0367584228515625, -0.991363525390625, -0.9459686279296875, -0.90057373046875, -0.8551788330078125, -0.809783935546875, -0.7643890380859375, -0.718994140625, -0.6735992431640625, -0.628204345703125, -0.5828094482421875, -0.53741455078125, -0.4920196533203125, -0.446624755859375, -0.4012298583984375, -0.3558349609375, -0.3104400634765625, -0.265045166015625, -0.2196502685546875, -0.17425537109375, -0.1288604736328125, -0.083465576171875, -0.0380706787109375, 0.00732421875, 0.0527191162109375, 0.098114013671875, 0.1435089111328125, 0.18890380859375, 0.2342987060546875, 0.279693603515625, 0.3250885009765625, 0.3704833984375, 0.4158782958984375, 0.461273193359375, 0.5066680908203125, 0.55206298828125, 0.5974578857421875, 0.642852783203125, 0.6882476806640625, 0.733642578125, 0.7790374755859375, 0.824432373046875, 0.8698272705078125, 0.91522216796875, 0.9606170654296875, 1.006011962890625, 1.0514068603515625, 1.0968017578125, 1.1421966552734375, 1.187591552734375, 1.2329864501953125, 1.27838134765625, 1.3237762451171875, 1.369171142578125, 1.4145660400390625, 1.4599609375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 16.0, 15.0, 11.0, 17.0, 26.0, 25.0, 33.0, 39.0, 44.0, 49.0, 62.0, 67.0, 63.0, 57.0, 59.0, 55.0, 54.0, 51.0, 45.0, 44.0, 37.0, 32.0, 19.0, 23.0, 10.0, 11.0, 11.0, 8.0, 8.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2626953125, -1.2306671142578125, -1.198638916015625, -1.1666107177734375, -1.13458251953125, -1.1025543212890625, -1.070526123046875, -1.0384979248046875, -1.0064697265625, -0.9744415283203125, -0.942413330078125, -0.9103851318359375, -0.87835693359375, -0.8463287353515625, -0.814300537109375, -0.7822723388671875, -0.750244140625, -0.7182159423828125, -0.686187744140625, -0.6541595458984375, -0.62213134765625, -0.5901031494140625, -0.558074951171875, -0.5260467529296875, -0.4940185546875, -0.4619903564453125, -0.429962158203125, -0.3979339599609375, -0.36590576171875, -0.3338775634765625, -0.301849365234375, -0.2698211669921875, -0.23779296875, -0.2057647705078125, -0.173736572265625, -0.1417083740234375, -0.10968017578125, -0.0776519775390625, -0.045623779296875, -0.0135955810546875, 0.0184326171875, 0.0504608154296875, 0.082489013671875, 0.1145172119140625, 0.14654541015625, 0.1785736083984375, 0.210601806640625, 0.2426300048828125, 0.274658203125, 0.3066864013671875, 0.338714599609375, 0.3707427978515625, 0.40277099609375, 0.4347991943359375, 0.466827392578125, 0.4988555908203125, 0.5308837890625, 0.5629119873046875, 0.594940185546875, 0.6269683837890625, 0.65899658203125, 0.6910247802734375, 0.723052978515625, 0.7550811767578125, 0.787109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 14.0, 14.0, 11.0, 9.0, 29.0, 31.0, 48.0, 86.0, 104.0, 193.0, 240.0, 417.0, 767.0, 1629.0, 4390.0, 17265.0, 108547.0, 838035.0, 59868.0, 10805.0, 3122.0, 1250.0, 635.0, 360.0, 223.0, 143.0, 74.0, 66.0, 44.0, 36.0, 30.0, 26.0, 11.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8878326416015625, -1.823516845703125, -1.7592010498046875, -1.69488525390625, -1.6305694580078125, -1.566253662109375, -1.5019378662109375, -1.4376220703125, -1.3733062744140625, -1.308990478515625, -1.2446746826171875, -1.18035888671875, -1.1160430908203125, -1.051727294921875, -0.9874114990234375, -0.923095703125, -0.8587799072265625, -0.794464111328125, -0.7301483154296875, -0.66583251953125, -0.6015167236328125, -0.537200927734375, -0.4728851318359375, -0.4085693359375, -0.3442535400390625, -0.279937744140625, -0.2156219482421875, -0.15130615234375, -0.0869903564453125, -0.022674560546875, 0.0416412353515625, 0.10595703125, 0.1702728271484375, 0.234588623046875, 0.2989044189453125, 0.36322021484375, 0.4275360107421875, 0.491851806640625, 0.5561676025390625, 0.6204833984375, 0.6847991943359375, 0.749114990234375, 0.8134307861328125, 0.87774658203125, 0.9420623779296875, 1.006378173828125, 1.0706939697265625, 1.135009765625, 1.1993255615234375, 1.263641357421875, 1.3279571533203125, 1.39227294921875, 1.4565887451171875, 1.520904541015625, 1.5852203369140625, 1.6495361328125, 1.7138519287109375, 1.778167724609375, 1.8424835205078125, 1.90679931640625, 1.9711151123046875, 2.035430908203125, 2.0997467041015625, 2.1640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 8.0, 6.0, 14.0, 6.0, 7.0, 9.0, 19.0, 16.0, 18.0, 19.0, 18.0, 28.0, 24.0, 22.0, 34.0, 40.0, 46.0, 52.0, 78.0, 67.0, 71.0, 58.0, 57.0, 32.0, 40.0, 29.0, 19.0, 27.0, 10.0, 20.0, 13.0, 9.0, 12.0, 10.0, 12.0, 9.0, 11.0, 7.0, 3.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-3.1796875, -3.087432861328125, -2.99517822265625, -2.902923583984375, -2.8106689453125, -2.718414306640625, -2.62615966796875, -2.533905029296875, -2.441650390625, -2.349395751953125, -2.25714111328125, -2.164886474609375, -2.0726318359375, -1.980377197265625, -1.88812255859375, -1.795867919921875, -1.70361328125, -1.611358642578125, -1.51910400390625, -1.426849365234375, -1.3345947265625, -1.242340087890625, -1.15008544921875, -1.057830810546875, -0.965576171875, -0.873321533203125, -0.78106689453125, -0.688812255859375, -0.5965576171875, -0.504302978515625, -0.41204833984375, -0.319793701171875, -0.2275390625, -0.135284423828125, -0.04302978515625, 0.049224853515625, 0.1414794921875, 0.233734130859375, 0.32598876953125, 0.418243408203125, 0.510498046875, 0.602752685546875, 0.69500732421875, 0.787261962890625, 0.8795166015625, 0.971771240234375, 1.06402587890625, 1.156280517578125, 1.24853515625, 1.340789794921875, 1.43304443359375, 1.525299072265625, 1.6175537109375, 1.709808349609375, 1.80206298828125, 1.894317626953125, 1.986572265625, 2.078826904296875, 2.17108154296875, 2.263336181640625, 2.3555908203125, 2.447845458984375, 2.54010009765625, 2.632354736328125, 2.724609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 11.0, 12.0, 12.0, 18.0, 22.0, 24.0, 35.0, 43.0, 54.0, 108.0, 156.0, 266.0, 523.0, 1078.0, 2669.0, 7526.0, 29994.0, 719766.0, 247471.0, 27092.0, 7039.0, 2428.0, 955.0, 481.0, 274.0, 135.0, 97.0, 60.0, 46.0, 34.0, 31.0, 15.0, 17.0, 9.0, 9.0, 10.0, 7.0, 3.0, 2.0, 4.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.47802734375, -0.4635276794433594, -0.44902801513671875, -0.4345283508300781, -0.4200286865234375, -0.4055290222167969, -0.39102935791015625, -0.3765296936035156, -0.362030029296875, -0.3475303649902344, -0.33303070068359375, -0.3185310363769531, -0.3040313720703125, -0.2895317077636719, -0.27503204345703125, -0.2605323791503906, -0.24603271484375, -0.23153305053710938, -0.21703338623046875, -0.20253372192382812, -0.1880340576171875, -0.17353439331054688, -0.15903472900390625, -0.14453506469726562, -0.130035400390625, -0.11553573608398438, -0.10103607177734375, -0.08653640747070312, -0.0720367431640625, -0.057537078857421875, -0.04303741455078125, -0.028537750244140625, -0.0140380859375, 0.000461578369140625, 0.01496124267578125, 0.029460906982421875, 0.0439605712890625, 0.058460235595703125, 0.07295989990234375, 0.08745956420898438, 0.101959228515625, 0.11645889282226562, 0.13095855712890625, 0.14545822143554688, 0.1599578857421875, 0.17445755004882812, 0.18895721435546875, 0.20345687866210938, 0.21795654296875, 0.23245620727539062, 0.24695587158203125, 0.2614555358886719, 0.2759552001953125, 0.2904548645019531, 0.30495452880859375, 0.3194541931152344, 0.333953857421875, 0.3484535217285156, 0.36295318603515625, 0.3774528503417969, 0.3919525146484375, 0.4064521789550781, 0.42095184326171875, 0.4354515075683594, 0.449951171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 7.0, 12.0, 10.0, 14.0, 20.0, 18.0, 22.0, 59.0, 100.0, 149.0, 186.0, 145.0, 77.0, 43.0, 30.0, 24.0, 16.0, 12.0, 4.0, 11.0, 8.0, 1.0, 6.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00027751922607421875, -0.00026943907141685486, -0.00026135891675949097, -0.0002532787621021271, -0.0002451986074447632, -0.0002371184527873993, -0.0002290382981300354, -0.0002209581434726715, -0.00021287798881530762, -0.00020479783415794373, -0.00019671767950057983, -0.00018863752484321594, -0.00018055737018585205, -0.00017247721552848816, -0.00016439706087112427, -0.00015631690621376038, -0.00014823675155639648, -0.0001401565968990326, -0.0001320764422416687, -0.0001239962875843048, -0.00011591613292694092, -0.00010783597826957703, -9.975582361221313e-05, -9.167566895484924e-05, -8.359551429748535e-05, -7.551535964012146e-05, -6.743520498275757e-05, -5.935505032539368e-05, -5.1274895668029785e-05, -4.3194741010665894e-05, -3.5114586353302e-05, -2.703443169593811e-05, -1.895427703857422e-05, -1.0874122381210327e-05, -2.7939677238464355e-06, 5.286186933517456e-06, 1.3366341590881348e-05, 2.144649624824524e-05, 2.952665090560913e-05, 3.760680556297302e-05, 4.5686960220336914e-05, 5.3767114877700806e-05, 6.18472695350647e-05, 6.992742419242859e-05, 7.800757884979248e-05, 8.608773350715637e-05, 9.416788816452026e-05, 0.00010224804282188416, 0.00011032819747924805, 0.00011840835213661194, 0.00012648850679397583, 0.00013456866145133972, 0.0001426488161087036, 0.0001507289707660675, 0.0001588091254234314, 0.0001668892800807953, 0.00017496943473815918, 0.00018304958939552307, 0.00019112974405288696, 0.00019920989871025085, 0.00020729005336761475, 0.00021537020802497864, 0.00022345036268234253, 0.00023153051733970642, 0.0002396106719970703]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 3.0, 16.0, 25.0, 23.0, 41.0, 36.0, 42.0, 79.0, 119.0, 210.0, 291.0, 497.0, 755.0, 1265.0, 2390.0, 4719.0, 9941.0, 24780.0, 83697.0, 757233.0, 109867.0, 29464.0, 11438.0, 5209.0, 2671.0, 1458.0, 815.0, 545.0, 312.0, 198.0, 131.0, 87.0, 59.0, 35.0, 25.0, 21.0, 16.0, 10.0, 11.0, 8.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.2587890625, -0.2510833740234375, -0.243377685546875, -0.2356719970703125, -0.22796630859375, -0.2202606201171875, -0.212554931640625, -0.2048492431640625, -0.1971435546875, -0.1894378662109375, -0.181732177734375, -0.1740264892578125, -0.16632080078125, -0.1586151123046875, -0.150909423828125, -0.1432037353515625, -0.135498046875, -0.1277923583984375, -0.120086669921875, -0.1123809814453125, -0.10467529296875, -0.0969696044921875, -0.089263916015625, -0.0815582275390625, -0.0738525390625, -0.0661468505859375, -0.058441162109375, -0.0507354736328125, -0.04302978515625, -0.0353240966796875, -0.027618408203125, -0.0199127197265625, -0.01220703125, -0.0045013427734375, 0.003204345703125, 0.0109100341796875, 0.01861572265625, 0.0263214111328125, 0.034027099609375, 0.0417327880859375, 0.0494384765625, 0.0571441650390625, 0.064849853515625, 0.0725555419921875, 0.08026123046875, 0.0879669189453125, 0.095672607421875, 0.1033782958984375, 0.111083984375, 0.1187896728515625, 0.126495361328125, 0.1342010498046875, 0.14190673828125, 0.1496124267578125, 0.157318115234375, 0.1650238037109375, 0.1727294921875, 0.1804351806640625, 0.188140869140625, 0.1958465576171875, 0.20355224609375, 0.2112579345703125, 0.218963623046875, 0.2266693115234375, 0.234375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 5.0, 6.0, 3.0, 6.0, 6.0, 4.0, 10.0, 10.0, 21.0, 17.0, 40.0, 34.0, 58.0, 67.0, 106.0, 110.0, 109.0, 87.0, 87.0, 52.0, 42.0, 29.0, 18.0, 15.0, 12.0, 7.0, 6.0, 1.0, 7.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5185546875, -0.5045013427734375, -0.490447998046875, -0.4763946533203125, -0.46234130859375, -0.4482879638671875, -0.434234619140625, -0.4201812744140625, -0.4061279296875, -0.3920745849609375, -0.378021240234375, -0.3639678955078125, -0.34991455078125, -0.3358612060546875, -0.321807861328125, -0.3077545166015625, -0.293701171875, -0.2796478271484375, -0.265594482421875, -0.2515411376953125, -0.23748779296875, -0.2234344482421875, -0.209381103515625, -0.1953277587890625, -0.1812744140625, -0.1672210693359375, -0.153167724609375, -0.1391143798828125, -0.12506103515625, -0.1110076904296875, -0.096954345703125, -0.0829010009765625, -0.06884765625, -0.0547943115234375, -0.040740966796875, -0.0266876220703125, -0.01263427734375, 0.0014190673828125, 0.015472412109375, 0.0295257568359375, 0.0435791015625, 0.0576324462890625, 0.071685791015625, 0.0857391357421875, 0.09979248046875, 0.1138458251953125, 0.127899169921875, 0.1419525146484375, 0.156005859375, 0.1700592041015625, 0.184112548828125, 0.1981658935546875, 0.21221923828125, 0.2262725830078125, 0.240325927734375, 0.2543792724609375, 0.2684326171875, 0.2824859619140625, 0.296539306640625, 0.3105926513671875, 0.32464599609375, 0.3386993408203125, 0.352752685546875, 0.3668060302734375, 0.380859375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 12.0, 20.0, 60.0, 128.0, 627.0, 98.0, 36.0, 17.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.526641845703125, -32.52521896362305, -31.523794174194336, -30.522369384765625, -29.520946502685547, -28.519521713256836, -27.518096923828125, -26.516674041748047, -25.51525115966797, -24.513826370239258, -23.51240348815918, -22.51097869873047, -21.50955581665039, -20.50813102722168, -19.50670623779297, -18.50528335571289, -17.50385856628418, -16.50243377685547, -15.50101089477539, -14.49958610534668, -13.498163223266602, -12.49673843383789, -11.495314598083496, -10.493890762329102, -9.492466926574707, -8.491043090820312, -7.489619255065918, -6.488194942474365, -5.486771106719971, -4.485347270965576, -3.4839229583740234, -2.482499122619629, -1.4810733795166016, -0.4796494245529175, 0.5217745304107666, 1.5231986045837402, 2.5246224403381348, 3.5260462760925293, 4.527470588684082, 5.528894424438477, 6.530318260192871, 7.531742095947266, 8.53316593170166, 9.534589767456055, 10.536014556884766, 11.537437438964844, 12.538862228393555, 13.54028606414795, 14.541709899902344, 15.543133735656738, 16.544557571411133, 17.545982360839844, 18.547405242919922, 19.548830032348633, 20.550254821777344, 21.551677703857422, 22.5531005859375, 23.55452537536621, 24.55594825744629, 25.557373046875, 26.558795928955078, 27.56022071838379, 28.5616455078125, 29.563068389892578, 30.56449317932129]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 4.0, 6.0, 9.0, 12.0, 8.0, 11.0, 22.0, 15.0, 23.0, 25.0, 27.0, 31.0, 27.0, 43.0, 238.0, 230.0, 49.0, 32.0, 24.0, 28.0, 23.0, 17.0, 16.0, 8.0, 15.0, 11.0, 2.0, 4.0, 9.0, 5.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.442407608032227, -8.129712104797363, -7.8170166015625, -7.504321098327637, -7.191625595092773, -6.87893009185791, -6.566235065460205, -6.253539562225342, -5.9408440589904785, -5.628148555755615, -5.315453052520752, -5.002757549285889, -4.690062522888184, -4.37736701965332, -4.064671516418457, -3.7519760131835938, -3.4392805099487305, -3.126585006713867, -2.813889503479004, -2.5011942386627197, -2.1884987354278564, -1.8758032321929932, -1.5631078481674194, -1.2504124641418457, -0.9377169609069824, -0.6250215172767639, -0.3123260736465454, 0.0003693699836730957, 0.3130648136138916, 0.6257603168487549, 0.9384557008743286, 1.2511510848999023, 1.563847541809082, 1.8765430450439453, 2.1892385482788086, 2.5019338130950928, 2.814629316329956, 3.1273248195648193, 3.4400200843811035, 3.752715587615967, 4.06541109085083, 4.378106594085693, 4.690802097320557, 5.00349760055542, 5.316192626953125, 5.628888130187988, 5.941583633422852, 6.254279136657715, 6.566974639892578, 6.879670143127441, 7.192365646362305, 7.505061149597168, 7.817756652832031, 8.130452156066895, 8.443147659301758, 8.755842208862305, 9.068538665771484, 9.381234169006348, 9.693929672241211, 10.006625175476074, 10.319320678710938, 10.6320161819458, 10.944711685180664, 11.257406234741211, 11.570101737976074]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 9.0, 5.0, 6.0, 10.0, 13.0, 11.0, 27.0, 28.0, 46.0, 40.0, 63.0, 126.0, 287.0, 93.0, 57.0, 51.0, 27.0, 30.0, 21.0, 18.0, 6.0, 11.0, 6.0, 5.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1708984375, -1.133514404296875, -1.09613037109375, -1.058746337890625, -1.0213623046875, -0.983978271484375, -0.94659423828125, -0.909210205078125, -0.871826171875, -0.834442138671875, -0.79705810546875, -0.759674072265625, -0.7222900390625, -0.684906005859375, -0.64752197265625, -0.610137939453125, -0.57275390625, -0.535369873046875, -0.49798583984375, -0.460601806640625, -0.4232177734375, -0.385833740234375, -0.34844970703125, -0.311065673828125, -0.273681640625, -0.236297607421875, -0.19891357421875, -0.161529541015625, -0.1241455078125, -0.086761474609375, -0.04937744140625, -0.011993408203125, 0.025390625, 0.062774658203125, 0.10015869140625, 0.137542724609375, 0.1749267578125, 0.212310791015625, 0.24969482421875, 0.287078857421875, 0.324462890625, 0.361846923828125, 0.39923095703125, 0.436614990234375, 0.4739990234375, 0.511383056640625, 0.54876708984375, 0.586151123046875, 0.62353515625, 0.660919189453125, 0.69830322265625, 0.735687255859375, 0.7730712890625, 0.810455322265625, 0.84783935546875, 0.885223388671875, 0.922607421875, 0.959991455078125, 0.99737548828125, 1.034759521484375, 1.0721435546875, 1.109527587890625, 1.14691162109375, 1.184295654296875, 1.2216796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 4.0, 8.0, 11.0, 13.0, 12.0, 28.0, 31.0, 61.0, 102.0, 156.0, 349.0, 989.0, 3840.0, 36363.0, 8334536.0, 9000.0, 1898.0, 605.0, 215.0, 126.0, 84.0, 61.0, 22.0, 15.0, 6.0, 8.0, 4.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.785748481750488, -9.500036239624023, -9.214324951171875, -8.92861270904541, -8.642901420593262, -8.357189178466797, -8.071477890014648, -7.785765647888184, -7.500053882598877, -7.21434211730957, -6.928630352020264, -6.642918586730957, -6.357206344604492, -6.071495056152344, -5.785782814025879, -5.500071048736572, -5.214359283447266, -4.928647518157959, -4.642935752868652, -4.357223987579346, -4.071512222290039, -3.7858002185821533, -3.5000882148742676, -3.214376449584961, -2.9286646842956543, -2.6429529190063477, -2.357241153717041, -2.0715291500091553, -1.7858173847198486, -1.500105619430542, -1.2143937349319458, -0.9286818504333496, -0.642970085144043, -0.35725826025009155, -0.07154643535614014, 0.21416538953781128, 0.4998772144317627, 0.7855889797210693, 1.0713008642196655, 1.3570127487182617, 1.6427245140075684, 1.928436279296875, 2.2141480445861816, 2.4998600482940674, 2.785571813583374, 3.0712835788726807, 3.3569955825805664, 3.642707347869873, 3.9284191131591797, 4.214130878448486, 4.499842643737793, 4.7855544090271, 5.071266174316406, 5.356978416442871, 5.642690181732178, 5.928401947021484, 6.214113712310791, 6.499825477600098, 6.785537242889404, 7.071249008178711, 7.356961250305176, 7.642672538757324, 7.928384780883789, 8.214096069335938, 8.499808311462402]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 6.0, 2.0, 4.0, 8.0, 8.0, 2.0, 4.0, 4.0, 5.0, 9.0, 5.0, 3.0, 6.0, 2.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.060517311096191, -8.824185371398926, -8.58785343170166, -8.351521492004395, -8.115188598632812, -7.878857135772705, -7.642524719238281, -7.406192779541016, -7.16986083984375, -6.933528900146484, -6.697196960449219, -6.460864543914795, -6.224532604217529, -5.988200664520264, -5.75186824798584, -5.515536308288574, -5.279204368591309, -5.042872428894043, -4.806540489196777, -4.5702080726623535, -4.333876132965088, -4.097544193267822, -3.8612120151519775, -3.624879837036133, -3.388547897338867, -3.1522159576416016, -2.915883779525757, -2.679551601409912, -2.4432196617126465, -2.206887722015381, -1.9705555438995361, -1.734223484992981, -1.497891902923584, -1.2615598440170288, -1.0252277851104736, -0.7888957262039185, -0.5525636672973633, -0.3162316083908081, -0.07989954948425293, 0.15643250942230225, 0.3927645683288574, 0.6290966272354126, 0.8654286861419678, 1.101760745048523, 1.3380928039550781, 1.5744248628616333, 1.8107569217681885, 2.047089099884033, 2.283421039581299, 2.5197529792785645, 2.756085157394409, 2.992417335510254, 3.2287492752075195, 3.465081214904785, 3.70141339302063, 3.9377455711364746, 4.17407751083374, 4.410409450531006, 4.64674186706543, 4.883073806762695, 5.119405746459961, 5.355737686157227, 5.592069625854492, 5.828402042388916, 6.064733982086182]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 11.0, 14.0, 11.0, 21.0, 41.0, 46.0, 64.0, 106.0, 153.0, 289.0, 652.0, 1545.0, 4948.0, 18767.0, 85491.0, 268832.0, 109989.0, 23745.0, 6111.0, 1860.0, 733.0, 352.0, 185.0, 117.0, 68.0, 39.0, 28.0, 15.0, 5.0, 7.0, 4.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0859375, -10.7828369140625, -10.479736328125, -10.1766357421875, -9.87353515625, -9.5704345703125, -9.267333984375, -8.9642333984375, -8.6611328125, -8.3580322265625, -8.054931640625, -7.7518310546875, -7.44873046875, -7.1456298828125, -6.842529296875, -6.5394287109375, -6.236328125, -5.9332275390625, -5.630126953125, -5.3270263671875, -5.02392578125, -4.7208251953125, -4.417724609375, -4.1146240234375, -3.8115234375, -3.5084228515625, -3.205322265625, -2.9022216796875, -2.59912109375, -2.2960205078125, -1.992919921875, -1.6898193359375, -1.38671875, -1.0836181640625, -0.780517578125, -0.4774169921875, -0.17431640625, 0.1287841796875, 0.431884765625, 0.7349853515625, 1.0380859375, 1.3411865234375, 1.644287109375, 1.9473876953125, 2.25048828125, 2.5535888671875, 2.856689453125, 3.1597900390625, 3.462890625, 3.7659912109375, 4.069091796875, 4.3721923828125, 4.67529296875, 4.9783935546875, 5.281494140625, 5.5845947265625, 5.8876953125, 6.1907958984375, 6.493896484375, 6.7969970703125, 7.10009765625, 7.4031982421875, 7.706298828125, 8.0093994140625, 8.3125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 5.0, 11.0, 13.0, 24.0, 24.0, 25.0, 32.0, 57.0, 47.0, 69.0, 68.0, 75.0, 80.0, 74.0, 79.0, 67.0, 46.0, 51.0, 31.0, 24.0, 23.0, 21.0, 14.0, 8.0, 8.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447265625, -1.3103790283203125, -1.276031494140625, -1.2416839599609375, -1.20733642578125, -1.1729888916015625, -1.138641357421875, -1.1042938232421875, -1.0699462890625, -1.0355987548828125, -1.001251220703125, -0.9669036865234375, -0.93255615234375, -0.8982086181640625, -0.863861083984375, -0.8295135498046875, -0.795166015625, -0.7608184814453125, -0.726470947265625, -0.6921234130859375, -0.65777587890625, -0.6234283447265625, -0.589080810546875, -0.5547332763671875, -0.5203857421875, -0.4860382080078125, -0.451690673828125, -0.4173431396484375, -0.38299560546875, -0.3486480712890625, -0.314300537109375, -0.2799530029296875, -0.24560546875, -0.2112579345703125, -0.176910400390625, -0.1425628662109375, -0.10821533203125, -0.0738677978515625, -0.039520263671875, -0.0051727294921875, 0.0291748046875, 0.0635223388671875, 0.097869873046875, 0.1322174072265625, 0.16656494140625, 0.2009124755859375, 0.235260009765625, 0.2696075439453125, 0.303955078125, 0.3383026123046875, 0.372650146484375, 0.4069976806640625, 0.44134521484375, 0.4756927490234375, 0.510040283203125, 0.5443878173828125, 0.5787353515625, 0.6130828857421875, 0.647430419921875, 0.6817779541015625, 0.71612548828125, 0.7504730224609375, 0.784820556640625, 0.8191680908203125, 0.853515625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 10.0, 11.0, 19.0, 29.0, 55.0, 82.0, 105.0, 71.0, 43.0, 16.0, 11.0, 10.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.611623764038086, -11.331544876098633, -11.051466941833496, -10.771388053894043, -10.491310119628906, -10.211231231689453, -9.931153297424316, -9.651074409484863, -9.370996475219727, -9.090917587280273, -8.810839653015137, -8.530760765075684, -8.250682830810547, -7.970603942871094, -7.690525531768799, -7.410447120666504, -7.130368232727051, -6.850289821624756, -6.570211410522461, -6.290132999420166, -6.010054588317871, -5.729975700378418, -5.449897289276123, -5.169818878173828, -4.889740467071533, -4.609662055969238, -4.329583644866943, -4.049505233764648, -3.7694265842437744, -3.4893481731414795, -3.2092695236206055, -2.9291911125183105, -2.649113655090332, -2.369035243988037, -2.088956832885742, -1.8088781833648682, -1.5287997722625732, -1.2487213611602783, -0.9686428308486938, -0.6885643005371094, -0.40848588943481445, -0.12840741872787476, 0.15167105197906494, 0.43174952268600464, 0.7118279933929443, 0.9919064044952393, 1.2719849348068237, 1.5520634651184082, 1.8321418762207031, 2.112220287322998, 2.392298698425293, 2.672377347946167, 2.952455759048462, 3.232534170150757, 3.512612819671631, 3.792691230773926, 4.072769641876221, 4.352848052978516, 4.6329264640808105, 4.9130048751831055, 5.193083763122559, 5.473161697387695, 5.753240585327148, 6.033318996429443, 6.313397407531738]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 16.0, 13.0, 29.0, 53.0, 92.0, 93.0, 70.0, 34.0, 20.0, 10.0, 10.0, 4.0, 5.0, 2.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.147286891937256, -4.965672969818115, -4.784059047698975, -4.602445125579834, -4.420830726623535, -4.2392168045043945, -4.057602882385254, -3.8759889602661133, -3.6943750381469727, -3.512761116027832, -3.3311471939086914, -3.1495330333709717, -2.967919111251831, -2.7863051891326904, -2.6046910285949707, -2.42307710647583, -2.2414631843566895, -2.059849262237549, -1.8782352209091187, -1.6966211795806885, -1.5150072574615479, -1.3333933353424072, -1.151779294013977, -0.9701652526855469, -0.7885513305664062, -0.6069373488426208, -0.42532336711883545, -0.24370938539505005, -0.06209540367126465, 0.11951857805252075, 0.30113255977630615, 0.48274660110473633, 0.6643600463867188, 0.8459740281105042, 1.0275880098342896, 1.2092020511627197, 1.3908159732818604, 1.572429895401001, 1.7540439367294312, 1.9356579780578613, 2.117271900177002, 2.2988858222961426, 2.480499744415283, 2.662113904953003, 2.8437278270721436, 3.025341749191284, 3.206955909729004, 3.3885698318481445, 3.570183753967285, 3.751797676086426, 3.9334115982055664, 4.115025520324707, 4.296639442443848, 4.4782538414001465, 4.659867763519287, 4.841481685638428, 5.023095607757568, 5.204709529876709, 5.38632345199585, 5.56793737411499, 5.749551773071289, 5.93116569519043, 6.11277961730957, 6.294393539428711, 6.476007461547852]}, "eval/loss": 4.160531044006348, "eval/wer": 2.4565450218167393, "eval/runtime": 1155.2061, "eval/samples_per_second": 2.287, "eval/steps_per_second": 0.287, "train/train_runtime": 8769.6328, "train/train_samples_per_second": 3.254, "train/train_steps_per_second": 0.203, "train/total_flos": 0.0, "train/train_loss": 4.241978131735806} \ No newline at end of file +{"train/loss": 3.5732, "train/learning_rate": 3.1152647975077883e-08, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 10136, "_timestamp": 1646051161, "_step": 1788, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 9.0, 346.0, 631.0, 30.0, 2.0, 1.0], "bins": [-641.971923828125, -631.305908203125, -620.639892578125, -609.973876953125, -599.307861328125, -588.641845703125, -577.975830078125, -567.309814453125, -556.643798828125, -545.977783203125, -535.311767578125, -524.645751953125, -513.979736328125, -503.313720703125, -492.647705078125, -481.981689453125, -471.315673828125, -460.649658203125, -449.983642578125, -439.317626953125, -428.651611328125, -417.985595703125, -407.319580078125, -396.653564453125, -385.987548828125, -375.321533203125, -364.655517578125, -353.989501953125, -343.323486328125, -332.657470703125, -321.991455078125, -311.325439453125, -300.6593933105469, -289.9933776855469, -279.3273620605469, -268.6613464355469, -257.9953308105469, -247.32931518554688, -236.66329956054688, -225.99728393554688, -215.33126831054688, -204.66525268554688, -193.99923706054688, -183.33322143554688, -172.66720581054688, -162.00119018554688, -151.33517456054688, -140.66915893554688, -130.00314331054688, -119.33712768554688, -108.67111206054688, -98.00509643554688, -87.33908081054688, -76.67306518554688, -66.00704956054688, -55.341033935546875, -44.67502212524414, -34.00900650024414, -23.34299087524414, -12.67697525024414, -2.0109596252441406, 8.65505599975586, 19.32107162475586, 29.98708724975586, 40.65310287475586]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 10.0, 8.0, 10.0, 19.0, 21.0, 16.0, 27.0, 24.0, 29.0, 34.0, 38.0, 42.0, 38.0, 39.0, 44.0, 47.0, 51.0, 52.0, 45.0, 44.0, 38.0, 46.0, 33.0, 29.0, 45.0, 18.0, 31.0, 22.0, 13.0, 15.0, 10.0, 20.0, 11.0, 6.0, 4.0, 8.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-75.822509765625, -73.62486267089844, -71.4272232055664, -69.22957611083984, -67.03193664550781, -64.83428955078125, -62.63664627075195, -60.439002990722656, -58.24135971069336, -56.04371643066406, -53.846073150634766, -51.64842987060547, -49.450782775878906, -47.253143310546875, -45.05549621582031, -42.857852935791016, -40.66020965576172, -38.46256637573242, -36.264923095703125, -34.06727981567383, -31.8696346282959, -29.6719913482666, -27.474346160888672, -25.276702880859375, -23.079059600830078, -20.88141632080078, -18.683773040771484, -16.486127853393555, -14.288484573364258, -12.090841293334961, -9.893197059631348, -7.695552825927734, -5.4979095458984375, -3.3002657890319824, -1.1026220321655273, 1.0950217247009277, 3.292665481567383, 5.49030876159668, 7.687952995300293, 9.885597229003906, 12.083240509033203, 14.2808837890625, 16.478527069091797, 18.676172256469727, 20.873815536499023, 23.07145881652832, 25.26910400390625, 27.466747283935547, 29.664390563964844, 31.86203384399414, 34.05967712402344, 36.257320404052734, 38.45496368408203, 40.652610778808594, 42.85025405883789, 45.04789733886719, 47.245540618896484, 49.44318389892578, 51.64082717895508, 53.838470458984375, 56.03611755371094, 58.23375701904297, 60.43140411376953, 62.62904739379883, 64.82669067382812]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 4.0, 8.0, 11.0, 16.0, 21.0, 32.0, 31.0, 38.0, 38.0, 50.0, 49.0, 55.0, 53.0, 54.0, 61.0, 48.0, 71.0, 50.0, 42.0, 49.0, 33.0, 43.0, 48.0, 24.0, 18.0, 14.0, 15.0, 7.0, 8.0, 7.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-8.375, -8.1734619140625, -7.971923828125, -7.7703857421875, -7.56884765625, -7.3673095703125, -7.165771484375, -6.9642333984375, -6.7626953125, -6.5611572265625, -6.359619140625, -6.1580810546875, -5.95654296875, -5.7550048828125, -5.553466796875, -5.3519287109375, -5.150390625, -4.9488525390625, -4.747314453125, -4.5457763671875, -4.34423828125, -4.1427001953125, -3.941162109375, -3.7396240234375, -3.5380859375, -3.3365478515625, -3.135009765625, -2.9334716796875, -2.73193359375, -2.5303955078125, -2.328857421875, -2.1273193359375, -1.92578125, -1.7242431640625, -1.522705078125, -1.3211669921875, -1.11962890625, -0.9180908203125, -0.716552734375, -0.5150146484375, -0.3134765625, -0.1119384765625, 0.089599609375, 0.2911376953125, 0.49267578125, 0.6942138671875, 0.895751953125, 1.0972900390625, 1.298828125, 1.5003662109375, 1.701904296875, 1.9034423828125, 2.10498046875, 2.3065185546875, 2.508056640625, 2.7095947265625, 2.9111328125, 3.1126708984375, 3.314208984375, 3.5157470703125, 3.71728515625, 3.9188232421875, 4.120361328125, 4.3218994140625, 4.5234375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 3.0, 2.0, 9.0, 6.0, 10.0, 12.0, 25.0, 27.0, 37.0, 68.0, 93.0, 165.0, 224.0, 442.0, 815.0, 1724.0, 4296.0, 14068.0, 99545.0, 2388338.0, 1594739.0, 70897.0, 11734.0, 3624.0, 1570.0, 781.0, 417.0, 250.0, 135.0, 84.0, 51.0, 38.0, 25.0, 10.0, 11.0, 3.0, 5.0, 3.0, 0.0, 2.0], "bins": [-27.78125, -27.148681640625, -26.51611328125, -25.883544921875, -25.2509765625, -24.618408203125, -23.98583984375, -23.353271484375, -22.720703125, -22.088134765625, -21.45556640625, -20.822998046875, -20.1904296875, -19.557861328125, -18.92529296875, -18.292724609375, -17.66015625, -17.027587890625, -16.39501953125, -15.762451171875, -15.1298828125, -14.497314453125, -13.86474609375, -13.232177734375, -12.599609375, -11.967041015625, -11.33447265625, -10.701904296875, -10.0693359375, -9.436767578125, -8.80419921875, -8.171630859375, -7.5390625, -6.906494140625, -6.27392578125, -5.641357421875, -5.0087890625, -4.376220703125, -3.74365234375, -3.111083984375, -2.478515625, -1.845947265625, -1.21337890625, -0.580810546875, 0.0517578125, 0.684326171875, 1.31689453125, 1.949462890625, 2.58203125, 3.214599609375, 3.84716796875, 4.479736328125, 5.1123046875, 5.744873046875, 6.37744140625, 7.010009765625, 7.642578125, 8.275146484375, 8.90771484375, 9.540283203125, 10.1728515625, 10.805419921875, 11.43798828125, 12.070556640625, 12.703125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 11.0, 23.0, 24.0, 57.0, 84.0, 139.0, 236.0, 372.0, 679.0, 886.0, 624.0, 364.0, 231.0, 126.0, 80.0, 38.0, 22.0, 20.0, 24.0, 10.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.734375, -22.9287109375, -22.123046875, -21.3173828125, -20.51171875, -19.7060546875, -18.900390625, -18.0947265625, -17.2890625, -16.4833984375, -15.677734375, -14.8720703125, -14.06640625, -13.2607421875, -12.455078125, -11.6494140625, -10.84375, -10.0380859375, -9.232421875, -8.4267578125, -7.62109375, -6.8154296875, -6.009765625, -5.2041015625, -4.3984375, -3.5927734375, -2.787109375, -1.9814453125, -1.17578125, -0.3701171875, 0.435546875, 1.2412109375, 2.046875, 2.8525390625, 3.658203125, 4.4638671875, 5.26953125, 6.0751953125, 6.880859375, 7.6865234375, 8.4921875, 9.2978515625, 10.103515625, 10.9091796875, 11.71484375, 12.5205078125, 13.326171875, 14.1318359375, 14.9375, 15.7431640625, 16.548828125, 17.3544921875, 18.16015625, 18.9658203125, 19.771484375, 20.5771484375, 21.3828125, 22.1884765625, 22.994140625, 23.7998046875, 24.60546875, 25.4111328125, 26.216796875, 27.0224609375, 27.828125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 16.0, 14.0, 22.0, 40.0, 66.0, 96.0, 225.0, 408.0, 869.0, 2223.0, 22720.0, 4086441.0, 76007.0, 2997.0, 1028.0, 486.0, 245.0, 123.0, 97.0, 56.0, 23.0, 17.0, 15.0, 8.0, 5.0, 5.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0625, -71.3798828125, -68.697265625, -66.0146484375, -63.33203125, -60.6494140625, -57.966796875, -55.2841796875, -52.6015625, -49.9189453125, -47.236328125, -44.5537109375, -41.87109375, -39.1884765625, -36.505859375, -33.8232421875, -31.140625, -28.4580078125, -25.775390625, -23.0927734375, -20.41015625, -17.7275390625, -15.044921875, -12.3623046875, -9.6796875, -6.9970703125, -4.314453125, -1.6318359375, 1.05078125, 3.7333984375, 6.416015625, 9.0986328125, 11.78125, 14.4638671875, 17.146484375, 19.8291015625, 22.51171875, 25.1943359375, 27.876953125, 30.5595703125, 33.2421875, 35.9248046875, 38.607421875, 41.2900390625, 43.97265625, 46.6552734375, 49.337890625, 52.0205078125, 54.703125, 57.3857421875, 60.068359375, 62.7509765625, 65.43359375, 68.1162109375, 70.798828125, 73.4814453125, 76.1640625, 78.8466796875, 81.529296875, 84.2119140625, 86.89453125, 89.5771484375, 92.259765625, 94.9423828125, 97.625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 81.0, 553.0, 353.0, 21.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.17755126953125, -262.1882629394531, -254.198974609375, -246.20968627929688, -238.22039794921875, -230.23110961914062, -222.2418212890625, -214.25253295898438, -206.26324462890625, -198.27395629882812, -190.28466796875, -182.29537963867188, -174.30609130859375, -166.31680297851562, -158.3275146484375, -150.33822631835938, -142.3489532470703, -134.3596649169922, -126.37037658691406, -118.38108825683594, -110.39179992675781, -102.40251159667969, -94.4132308959961, -86.42394256591797, -78.43465423583984, -70.44536590576172, -62.456077575683594, -54.466793060302734, -46.47750473022461, -38.488216400146484, -30.498931884765625, -22.5096435546875, -14.520339965820312, -6.531052589416504, 1.4582347869873047, 9.447521209716797, 17.436809539794922, 25.426097869873047, 33.415382385253906, 41.40467071533203, 49.393959045410156, 57.38324737548828, 65.3725357055664, 73.36181640625, 81.35110473632812, 89.34039306640625, 97.32968139648438, 105.3189697265625, 113.30825805664062, 121.29754638671875, 129.28683471679688, 137.276123046875, 145.26541137695312, 153.25469970703125, 161.24398803710938, 169.2332763671875, 177.22256469726562, 185.21185302734375, 193.20114135742188, 201.1904296875, 209.17971801757812, 217.16900634765625, 225.15829467773438, 233.1475830078125, 241.13685607910156]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 0.0, 4.0, 3.0, 2.0, 10.0, 9.0, 4.0, 8.0, 8.0, 9.0, 15.0, 16.0, 7.0, 27.0, 25.0, 17.0, 24.0, 28.0, 22.0, 29.0, 36.0, 44.0, 38.0, 38.0, 34.0, 32.0, 49.0, 38.0, 45.0, 48.0, 40.0, 34.0, 32.0, 24.0, 24.0, 18.0, 21.0, 26.0, 16.0, 12.0, 20.0, 11.0, 14.0, 9.0, 8.0, 5.0, 4.0, 9.0, 6.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-49.61613464355469, -48.13227462768555, -46.64841842651367, -45.16455841064453, -43.68069839477539, -42.19683837890625, -40.712982177734375, -39.229122161865234, -37.745262145996094, -36.26140213012695, -34.77754592895508, -33.29368591308594, -31.809825897216797, -30.32596778869629, -28.84210968017578, -27.35824966430664, -25.874391555786133, -24.390533447265625, -22.906673431396484, -21.422815322875977, -19.938955307006836, -18.455097198486328, -16.971237182617188, -15.48737907409668, -14.003520011901855, -12.519660949707031, -11.035801887512207, -9.551942825317383, -8.068084716796875, -6.584225177764893, -5.100366592407227, -3.6165075302124023, -2.132648468017578, -0.6487895250320435, 0.8350694179534912, 2.3189282417297363, 3.8027873039245605, 5.286646366119385, 6.770504951477051, 8.254364013671875, 9.7382230758667, 11.222082138061523, 12.705941200256348, 14.189800262451172, 15.67365837097168, 17.15751838684082, 18.641376495361328, 20.12523651123047, 21.609094619750977, 23.092952728271484, 24.576812744140625, 26.060670852661133, 27.544530868530273, 29.02838897705078, 30.512248992919922, 31.99610710144043, 33.47996520996094, 34.96382522583008, 36.44768142700195, 37.931541442871094, 39.415401458740234, 40.899261474609375, 42.38311767578125, 43.86697769165039, 45.35083770751953]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 10.0, 12.0, 17.0, 25.0, 24.0, 32.0, 29.0, 34.0, 53.0, 54.0, 40.0, 52.0, 48.0, 64.0, 45.0, 62.0, 44.0, 41.0, 58.0, 35.0, 41.0, 39.0, 40.0, 27.0, 13.0, 16.0, 17.0, 12.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.24139404296875, -7.0335693359375, -6.82574462890625, -6.617919921875, -6.41009521484375, -6.2022705078125, -5.99444580078125, -5.78662109375, -5.57879638671875, -5.3709716796875, -5.16314697265625, -4.955322265625, -4.74749755859375, -4.5396728515625, -4.33184814453125, -4.1240234375, -3.91619873046875, -3.7083740234375, -3.50054931640625, -3.292724609375, -3.08489990234375, -2.8770751953125, -2.66925048828125, -2.46142578125, -2.25360107421875, -2.0457763671875, -1.83795166015625, -1.630126953125, -1.42230224609375, -1.2144775390625, -1.00665283203125, -0.798828125, -0.59100341796875, -0.3831787109375, -0.17535400390625, 0.032470703125, 0.24029541015625, 0.4481201171875, 0.65594482421875, 0.86376953125, 1.07159423828125, 1.2794189453125, 1.48724365234375, 1.695068359375, 1.90289306640625, 2.1107177734375, 2.31854248046875, 2.5263671875, 2.73419189453125, 2.9420166015625, 3.14984130859375, 3.357666015625, 3.56549072265625, 3.7733154296875, 3.98114013671875, 4.18896484375, 4.39678955078125, 4.6046142578125, 4.81243896484375, 5.020263671875, 5.22808837890625, 5.4359130859375, 5.64373779296875, 5.8515625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 9.0, 10.0, 16.0, 22.0, 27.0, 41.0, 78.0, 98.0, 160.0, 212.0, 344.0, 494.0, 814.0, 1440.0, 2241.0, 3882.0, 6698.0, 11812.0, 20901.0, 36784.0, 65891.0, 114348.0, 199263.0, 246334.0, 144137.0, 82930.0, 47360.0, 26393.0, 14927.0, 8406.0, 5019.0, 2796.0, 1710.0, 1104.0, 640.0, 434.0, 259.0, 164.0, 142.0, 81.0, 39.0, 29.0, 21.0, 17.0, 14.0, 13.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8323135375976562, -0.8047637939453125, -0.7772140502929688, -0.749664306640625, -0.7221145629882812, -0.6945648193359375, -0.6670150756835938, -0.63946533203125, -0.6119155883789062, -0.5843658447265625, -0.5568161010742188, -0.529266357421875, -0.5017166137695312, -0.4741668701171875, -0.44661712646484375, -0.4190673828125, -0.39151763916015625, -0.3639678955078125, -0.33641815185546875, -0.308868408203125, -0.28131866455078125, -0.2537689208984375, -0.22621917724609375, -0.19866943359375, -0.17111968994140625, -0.1435699462890625, -0.11602020263671875, -0.088470458984375, -0.06092071533203125, -0.0333709716796875, -0.00582122802734375, 0.021728515625, 0.04927825927734375, 0.0768280029296875, 0.10437774658203125, 0.131927490234375, 0.15947723388671875, 0.1870269775390625, 0.21457672119140625, 0.24212646484375, 0.26967620849609375, 0.2972259521484375, 0.32477569580078125, 0.352325439453125, 0.37987518310546875, 0.4074249267578125, 0.43497467041015625, 0.4625244140625, 0.49007415771484375, 0.5176239013671875, 0.5451736450195312, 0.572723388671875, 0.6002731323242188, 0.6278228759765625, 0.6553726196289062, 0.68292236328125, 0.7104721069335938, 0.7380218505859375, 0.7655715942382812, 0.793121337890625, 0.8206710815429688, 0.8482208251953125, 0.8757705688476562, 0.9033203125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 5.0, 2.0, 11.0, 7.0, 16.0, 15.0, 13.0, 7.0, 16.0, 20.0, 19.0, 31.0, 23.0, 25.0, 29.0, 27.0, 39.0, 34.0, 46.0, 43.0, 34.0, 1062.0, 40.0, 44.0, 37.0, 30.0, 31.0, 32.0, 26.0, 35.0, 26.0, 21.0, 25.0, 16.0, 18.0, 23.0, 15.0, 14.0, 5.0, 10.0, 7.0, 5.0, 5.0, 7.0, 8.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.92578125, -2.833282470703125, -2.74078369140625, -2.648284912109375, -2.5557861328125, -2.463287353515625, -2.37078857421875, -2.278289794921875, -2.185791015625, -2.093292236328125, -2.00079345703125, -1.908294677734375, -1.8157958984375, -1.723297119140625, -1.63079833984375, -1.538299560546875, -1.44580078125, -1.353302001953125, -1.26080322265625, -1.168304443359375, -1.0758056640625, -0.983306884765625, -0.89080810546875, -0.798309326171875, -0.705810546875, -0.613311767578125, -0.52081298828125, -0.428314208984375, -0.3358154296875, -0.243316650390625, -0.15081787109375, -0.058319091796875, 0.0341796875, 0.126678466796875, 0.21917724609375, 0.311676025390625, 0.4041748046875, 0.496673583984375, 0.58917236328125, 0.681671142578125, 0.774169921875, 0.866668701171875, 0.95916748046875, 1.051666259765625, 1.1441650390625, 1.236663818359375, 1.32916259765625, 1.421661376953125, 1.51416015625, 1.606658935546875, 1.69915771484375, 1.791656494140625, 1.8841552734375, 1.976654052734375, 2.06915283203125, 2.161651611328125, 2.254150390625, 2.346649169921875, 2.43914794921875, 2.531646728515625, 2.6241455078125, 2.716644287109375, 2.80914306640625, 2.901641845703125, 2.994140625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 8.0, 11.0, 12.0, 26.0, 32.0, 55.0, 75.0, 105.0, 198.0, 248.0, 379.0, 566.0, 840.0, 1308.0, 1928.0, 2883.0, 4379.0, 7044.0, 10684.0, 16859.0, 26844.0, 42249.0, 67583.0, 108797.0, 176921.0, 1259102.0, 137087.0, 85135.0, 53181.0, 33406.0, 21081.0, 13297.0, 8725.0, 5455.0, 3610.0, 2356.0, 1571.0, 1032.0, 685.0, 476.0, 294.0, 196.0, 142.0, 101.0, 58.0, 40.0, 23.0, 15.0, 9.0, 16.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0], "bins": [-0.66650390625, -0.646453857421875, -0.62640380859375, -0.606353759765625, -0.5863037109375, -0.566253662109375, -0.54620361328125, -0.526153564453125, -0.506103515625, -0.486053466796875, -0.46600341796875, -0.445953369140625, -0.4259033203125, -0.405853271484375, -0.38580322265625, -0.365753173828125, -0.345703125, -0.325653076171875, -0.30560302734375, -0.285552978515625, -0.2655029296875, -0.245452880859375, -0.22540283203125, -0.205352783203125, -0.185302734375, -0.165252685546875, -0.14520263671875, -0.125152587890625, -0.1051025390625, -0.085052490234375, -0.06500244140625, -0.044952392578125, -0.02490234375, -0.004852294921875, 0.01519775390625, 0.035247802734375, 0.0552978515625, 0.075347900390625, 0.09539794921875, 0.115447998046875, 0.135498046875, 0.155548095703125, 0.17559814453125, 0.195648193359375, 0.2156982421875, 0.235748291015625, 0.25579833984375, 0.275848388671875, 0.2958984375, 0.315948486328125, 0.33599853515625, 0.356048583984375, 0.3760986328125, 0.396148681640625, 0.41619873046875, 0.436248779296875, 0.456298828125, 0.476348876953125, 0.49639892578125, 0.516448974609375, 0.5364990234375, 0.556549072265625, 0.57659912109375, 0.596649169921875, 0.61669921875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 4.0, 4.0, 5.0, 12.0, 8.0, 8.0, 16.0, 23.0, 19.0, 27.0, 33.0, 36.0, 41.0, 54.0, 46.0, 49.0, 63.0, 69.0, 63.0, 51.0, 59.0, 31.0, 43.0, 31.0, 39.0, 18.0, 27.0, 21.0, 31.0, 12.0, 10.0, 9.0, 8.0, 8.0, 8.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001129150390625, -0.0010925531387329102, -0.0010559558868408203, -0.0010193586349487305, -0.0009827613830566406, -0.0009461641311645508, -0.0009095668792724609, -0.0008729696273803711, -0.0008363723754882812, -0.0007997751235961914, -0.0007631778717041016, -0.0007265806198120117, -0.0006899833679199219, -0.000653386116027832, -0.0006167888641357422, -0.0005801916122436523, -0.0005435943603515625, -0.0005069971084594727, -0.0004703998565673828, -0.00043380260467529297, -0.0003972053527832031, -0.0003606081008911133, -0.00032401084899902344, -0.0002874135971069336, -0.00025081634521484375, -0.0002142190933227539, -0.00017762184143066406, -0.00014102458953857422, -0.00010442733764648438, -6.783008575439453e-05, -3.123283386230469e-05, 5.364418029785156e-06, 4.1961669921875e-05, 7.855892181396484e-05, 0.00011515617370605469, 0.00015175342559814453, 0.00018835067749023438, 0.00022494792938232422, 0.00026154518127441406, 0.0002981424331665039, 0.00033473968505859375, 0.0003713369369506836, 0.00040793418884277344, 0.0004445314407348633, 0.0004811286926269531, 0.000517725944519043, 0.0005543231964111328, 0.0005909204483032227, 0.0006275177001953125, 0.0006641149520874023, 0.0007007122039794922, 0.000737309455871582, 0.0007739067077636719, 0.0008105039596557617, 0.0008471012115478516, 0.0008836984634399414, 0.0009202957153320312, 0.0009568929672241211, 0.000993490219116211, 0.0010300874710083008, 0.0010666847229003906, 0.0011032819747924805, 0.0011398792266845703, 0.0011764764785766602, 0.00121307373046875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 7.0, 18.0, 20.0, 14.0, 23.0, 27.0, 41.0, 48.0, 68.0, 75.0, 117.0, 129.0, 200.0, 225.0, 287.0, 558.0, 1094.0, 968621.0, 74439.0, 819.0, 463.0, 256.0, 220.0, 149.0, 134.0, 119.0, 85.0, 66.0, 50.0, 35.0, 19.0, 24.0, 19.0, 13.0, 14.0, 4.0, 7.0, 11.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02197265625, -0.02128291130065918, -0.02059316635131836, -0.01990342140197754, -0.01921367645263672, -0.0185239315032959, -0.017834186553955078, -0.017144441604614258, -0.016454696655273438, -0.015764951705932617, -0.015075206756591797, -0.014385461807250977, -0.013695716857910156, -0.013005971908569336, -0.012316226959228516, -0.011626482009887695, -0.010936737060546875, -0.010246992111206055, -0.009557247161865234, -0.008867502212524414, -0.008177757263183594, -0.0074880123138427734, -0.006798267364501953, -0.006108522415161133, -0.0054187774658203125, -0.004729032516479492, -0.004039287567138672, -0.0033495426177978516, -0.0026597976684570312, -0.001970052719116211, -0.0012803077697753906, -0.0005905628204345703, 9.918212890625e-05, 0.0007889270782470703, 0.0014786720275878906, 0.002168416976928711, 0.0028581619262695312, 0.0035479068756103516, 0.004237651824951172, 0.004927396774291992, 0.0056171417236328125, 0.006306886672973633, 0.006996631622314453, 0.0076863765716552734, 0.008376121520996094, 0.009065866470336914, 0.009755611419677734, 0.010445356369018555, 0.011135101318359375, 0.011824846267700195, 0.012514591217041016, 0.013204336166381836, 0.013894081115722656, 0.014583826065063477, 0.015273571014404297, 0.015963315963745117, 0.016653060913085938, 0.017342805862426758, 0.018032550811767578, 0.0187222957611084, 0.01941204071044922, 0.02010178565979004, 0.02079153060913086, 0.02148127555847168, 0.0221710205078125]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 8.0, 160.0, 786.0, 61.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006038642022758722, -0.0004914011806249619, -0.000378938129870221, -0.0002664750791154802, -0.0001540120574645698, -4.154903581365943e-05, 7.091404404491186e-05, 0.00018337706569582224, 0.0002958400873467326, 0.000408303108997643, 0.0005207661306485534, 0.0006332292105071247, 0.000745692232158035, 0.0008581552538089454, 0.0009706183336675167, 0.001083081355318427, 0.0011955443769693375, 0.0013080073986202478, 0.0014204704202711582, 0.0015329334419220686, 0.001645396463572979, 0.0017578594852238894, 0.0018703226232901216, 0.0019827857613563538, 0.0020952485501766205, 0.002207711571827531, 0.0023201745934784412, 0.0024326376151293516, 0.002545100636780262, 0.0026575636584311724, 0.0027700266800820827, 0.0028824899345636368, 0.0029949527233839035, 0.003107415745034814, 0.0032198787666857243, 0.0033323417883366346, 0.003444804809987545, 0.0035572678316384554, 0.0036697308532893658, 0.00378219410777092, 0.0038946568965911865, 0.0040071201510727406, 0.004119582939893007, 0.004232046194374561, 0.004344508983194828, 0.004456972237676382, 0.004569435026496649, 0.004681898280978203, 0.0047943610697984695, 0.004906824324280024, 0.00501928711310029, 0.005131750367581844, 0.005244213156402111, 0.005356676410883665, 0.005469139199703932, 0.005581602454185486, 0.00569406570866704, 0.005806528963148594, 0.005918991751968861, 0.006031455006450415, 0.006143917795270681, 0.006256381049752235, 0.006368843838572502, 0.006481307093054056, 0.006593769881874323]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 7.0, 2.0, 5.0, 6.0, 10.0, 19.0, 15.0, 19.0, 20.0, 24.0, 24.0, 33.0, 40.0, 43.0, 44.0, 39.0, 44.0, 46.0, 53.0, 55.0, 47.0, 53.0, 53.0, 34.0, 32.0, 35.0, 23.0, 32.0, 24.0, 19.0, 23.0, 19.0, 19.0, 10.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005924105644226074, -0.0005711764097213745, -0.0005499422550201416, -0.0005287081003189087, -0.0005074739456176758, -0.00048623979091644287, -0.00046500563621520996, -0.00044377148151397705, -0.00042253732681274414, -0.00040130317211151123, -0.0003800690174102783, -0.0003588348627090454, -0.0003376007080078125, -0.0003163665533065796, -0.0002951323986053467, -0.00027389824390411377, -0.00025266408920288086, -0.00023142993450164795, -0.00021019577980041504, -0.00018896162509918213, -0.00016772747039794922, -0.0001464933156967163, -0.0001252591609954834, -0.00010402500629425049, -8.279085159301758e-05, -6.155669689178467e-05, -4.032254219055176e-05, -1.9088387489318848e-05, 2.1457672119140625e-06, 2.3379921913146973e-05, 4.461407661437988e-05, 6.584823131561279e-05, 8.70823860168457e-05, 0.00010831654071807861, 0.00012955069541931152, 0.00015078485012054443, 0.00017201900482177734, 0.00019325315952301025, 0.00021448731422424316, 0.00023572146892547607, 0.000256955623626709, 0.0002781897783279419, 0.0002994239330291748, 0.0003206580877304077, 0.0003418922424316406, 0.00036312639713287354, 0.00038436055183410645, 0.00040559470653533936, 0.00042682886123657227, 0.0004480630159378052, 0.0004692971706390381, 0.000490531325340271, 0.0005117654800415039, 0.0005329996347427368, 0.0005542337894439697, 0.0005754679441452026, 0.0005967020988464355, 0.0006179362535476685, 0.0006391704082489014, 0.0006604045629501343, 0.0006816387176513672, 0.0007028728723526001, 0.000724107027053833, 0.0007453411817550659, 0.0007665753364562988]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 5.0, 10.0, 12.0, 17.0, 25.0, 24.0, 32.0, 29.0, 34.0, 53.0, 54.0, 40.0, 52.0, 48.0, 64.0, 45.0, 62.0, 44.0, 41.0, 58.0, 35.0, 41.0, 39.0, 40.0, 27.0, 13.0, 16.0, 17.0, 12.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.24139404296875, -7.0335693359375, -6.82574462890625, -6.617919921875, -6.41009521484375, -6.2022705078125, -5.99444580078125, -5.78662109375, -5.57879638671875, -5.3709716796875, -5.16314697265625, -4.955322265625, -4.74749755859375, -4.5396728515625, -4.33184814453125, -4.1240234375, -3.91619873046875, -3.7083740234375, -3.50054931640625, -3.292724609375, -3.08489990234375, -2.8770751953125, -2.66925048828125, -2.46142578125, -2.25360107421875, -2.0457763671875, -1.83795166015625, -1.630126953125, -1.42230224609375, -1.2144775390625, -1.00665283203125, -0.798828125, -0.59100341796875, -0.3831787109375, -0.17535400390625, 0.032470703125, 0.24029541015625, 0.4481201171875, 0.65594482421875, 0.86376953125, 1.07159423828125, 1.2794189453125, 1.48724365234375, 1.695068359375, 1.90289306640625, 2.1107177734375, 2.31854248046875, 2.5263671875, 2.73419189453125, 2.9420166015625, 3.14984130859375, 3.357666015625, 3.56549072265625, 3.7733154296875, 3.98114013671875, 4.18896484375, 4.39678955078125, 4.6046142578125, 4.81243896484375, 5.020263671875, 5.22808837890625, 5.4359130859375, 5.64373779296875, 5.8515625]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 9.0, 9.0, 10.0, 24.0, 35.0, 36.0, 50.0, 85.0, 115.0, 160.0, 244.0, 363.0, 486.0, 791.0, 1204.0, 2002.0, 3282.0, 5929.0, 13351.0, 58343.0, 879129.0, 55084.0, 13095.0, 5950.0, 3223.0, 1927.0, 1235.0, 733.0, 528.0, 341.0, 224.0, 173.0, 114.0, 72.0, 60.0, 33.0, 34.0, 21.0, 16.0, 12.0, 7.0, 8.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.22509765625, -34.1064453125, -32.98779296875, -31.869140625, -30.75048828125, -29.6318359375, -28.51318359375, -27.39453125, -26.27587890625, -25.1572265625, -24.03857421875, -22.919921875, -21.80126953125, -20.6826171875, -19.56396484375, -18.4453125, -17.32666015625, -16.2080078125, -15.08935546875, -13.970703125, -12.85205078125, -11.7333984375, -10.61474609375, -9.49609375, -8.37744140625, -7.2587890625, -6.14013671875, -5.021484375, -3.90283203125, -2.7841796875, -1.66552734375, -0.546875, 0.57177734375, 1.6904296875, 2.80908203125, 3.927734375, 5.04638671875, 6.1650390625, 7.28369140625, 8.40234375, 9.52099609375, 10.6396484375, 11.75830078125, 12.876953125, 13.99560546875, 15.1142578125, 16.23291015625, 17.3515625, 18.47021484375, 19.5888671875, 20.70751953125, 21.826171875, 22.94482421875, 24.0634765625, 25.18212890625, 26.30078125, 27.41943359375, 28.5380859375, 29.65673828125, 30.775390625, 31.89404296875, 33.0126953125, 34.13134765625, 35.25]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 2.0, 5.0, 8.0, 15.0, 17.0, 14.0, 13.0, 26.0, 26.0, 33.0, 24.0, 41.0, 38.0, 59.0, 50.0, 43.0, 103.0, 299.0, 1620.0, 179.0, 62.0, 51.0, 40.0, 44.0, 39.0, 29.0, 32.0, 20.0, 18.0, 17.0, 22.0, 10.0, 7.0, 14.0, 7.0, 5.0, 0.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-20.0625, -19.524169921875, -18.98583984375, -18.447509765625, -17.9091796875, -17.370849609375, -16.83251953125, -16.294189453125, -15.755859375, -15.217529296875, -14.67919921875, -14.140869140625, -13.6025390625, -13.064208984375, -12.52587890625, -11.987548828125, -11.44921875, -10.910888671875, -10.37255859375, -9.834228515625, -9.2958984375, -8.757568359375, -8.21923828125, -7.680908203125, -7.142578125, -6.604248046875, -6.06591796875, -5.527587890625, -4.9892578125, -4.450927734375, -3.91259765625, -3.374267578125, -2.8359375, -2.297607421875, -1.75927734375, -1.220947265625, -0.6826171875, -0.144287109375, 0.39404296875, 0.932373046875, 1.470703125, 2.009033203125, 2.54736328125, 3.085693359375, 3.6240234375, 4.162353515625, 4.70068359375, 5.239013671875, 5.77734375, 6.315673828125, 6.85400390625, 7.392333984375, 7.9306640625, 8.468994140625, 9.00732421875, 9.545654296875, 10.083984375, 10.622314453125, 11.16064453125, 11.698974609375, 12.2373046875, 12.775634765625, 13.31396484375, 13.852294921875, 14.390625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 9.0, 11.0, 9.0, 12.0, 14.0, 16.0, 18.0, 28.0, 31.0, 27.0, 42.0, 55.0, 59.0, 140.0, 396.0, 2664.0, 3119780.0, 20947.0, 750.0, 229.0, 101.0, 79.0, 56.0, 35.0, 29.0, 29.0, 19.0, 18.0, 21.0, 14.0, 16.0, 15.0, 7.0, 7.0, 3.0, 5.0, 2.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.9375, -63.556640625, -61.17578125, -58.794921875, -56.4140625, -54.033203125, -51.65234375, -49.271484375, -46.890625, -44.509765625, -42.12890625, -39.748046875, -37.3671875, -34.986328125, -32.60546875, -30.224609375, -27.84375, -25.462890625, -23.08203125, -20.701171875, -18.3203125, -15.939453125, -13.55859375, -11.177734375, -8.796875, -6.416015625, -4.03515625, -1.654296875, 0.7265625, 3.107421875, 5.48828125, 7.869140625, 10.25, 12.630859375, 15.01171875, 17.392578125, 19.7734375, 22.154296875, 24.53515625, 26.916015625, 29.296875, 31.677734375, 34.05859375, 36.439453125, 38.8203125, 41.201171875, 43.58203125, 45.962890625, 48.34375, 50.724609375, 53.10546875, 55.486328125, 57.8671875, 60.248046875, 62.62890625, 65.009765625, 67.390625, 69.771484375, 72.15234375, 74.533203125, 76.9140625, 79.294921875, 81.67578125, 84.056640625, 86.4375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 134.0, 874.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.75433349609375, -229.62741088867188, -222.50048828125, -215.37355041503906, -208.2466278076172, -201.1197052001953, -193.99276733398438, -186.8658447265625, -179.73892211914062, -172.61199951171875, -165.48507690429688, -158.35813903808594, -151.23121643066406, -144.1042938232422, -136.97735595703125, -129.85043334960938, -122.7235107421875, -115.59658813476562, -108.46965789794922, -101.34272766113281, -94.21580505371094, -87.08888244628906, -79.96195220947266, -72.83502197265625, -65.70809936523438, -58.581172943115234, -51.454246520996094, -44.32732009887695, -37.20039367675781, -30.073467254638672, -22.94654083251953, -15.81961441040039, -8.692672729492188, -1.5657463073730469, 5.561180114746094, 12.688106536865234, 19.815032958984375, 26.941959381103516, 34.068885803222656, 41.1958122253418, 48.32273864746094, 55.44966506958008, 62.57659149169922, 69.70352172851562, 76.8304443359375, 83.95736694335938, 91.08429718017578, 98.21122741699219, 105.33815002441406, 112.46507263183594, 119.59200286865234, 126.71893310546875, 133.84585571289062, 140.9727783203125, 148.09970092773438, 155.2266387939453, 162.3535614013672, 169.48048400878906, 176.607421875, 183.73434448242188, 190.86126708984375, 197.98818969726562, 205.1151123046875, 212.24205017089844, 219.3689727783203]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 6.0, 17.0, 5.0, 16.0, 10.0, 17.0, 21.0, 20.0, 31.0, 32.0, 16.0, 27.0, 25.0, 26.0, 54.0, 40.0, 53.0, 33.0, 51.0, 33.0, 35.0, 42.0, 40.0, 33.0, 29.0, 52.0, 38.0, 28.0, 26.0, 22.0, 17.0, 19.0, 13.0, 12.0, 9.0, 13.0, 6.0, 5.0, 6.0, 5.0, 8.0, 3.0, 3.0, 2.0, 0.0, 3.0], "bins": [-66.52519226074219, -64.83065032958984, -63.13611602783203, -61.44157409667969, -59.74703598022461, -58.05249786376953, -56.35795593261719, -54.66341781616211, -52.96887969970703, -51.27434158325195, -49.579803466796875, -47.88526153564453, -46.19072341918945, -44.496185302734375, -42.80164337158203, -41.10710525512695, -39.412567138671875, -37.7180290222168, -36.02349090576172, -34.328948974609375, -32.6344108581543, -30.93987274169922, -29.245332717895508, -27.550792694091797, -25.85625457763672, -24.16171646118164, -22.46717643737793, -20.77263641357422, -19.07809829711914, -17.383560180664062, -15.689020156860352, -13.994481086730957, -12.299945831298828, -10.605406761169434, -8.910867691040039, -7.2163286209106445, -5.52178955078125, -3.8272504806518555, -2.132711410522461, -0.4381723403930664, 1.2563667297363281, 2.9509057998657227, 4.645444869995117, 6.339983940124512, 8.034523010253906, 9.7290620803833, 11.423601150512695, 13.11814022064209, 14.812679290771484, 16.507217407226562, 18.201757431030273, 19.896297454833984, 21.590835571289062, 23.28537368774414, 24.97991371154785, 26.674453735351562, 28.36899185180664, 30.06352996826172, 31.75806999206543, 33.45261001586914, 35.14714813232422, 36.8416862487793, 38.536224365234375, 40.23076629638672, 41.9253044128418]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 4.0, 10.0, 15.0, 11.0, 13.0, 26.0, 20.0, 37.0, 27.0, 41.0, 45.0, 32.0, 55.0, 52.0, 40.0, 45.0, 57.0, 61.0, 49.0, 36.0, 53.0, 35.0, 51.0, 37.0, 27.0, 33.0, 25.0, 19.0, 11.0, 16.0, 11.0, 5.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.22265625, -7.01123046875, -6.7998046875, -6.58837890625, -6.376953125, -6.16552734375, -5.9541015625, -5.74267578125, -5.53125, -5.31982421875, -5.1083984375, -4.89697265625, -4.685546875, -4.47412109375, -4.2626953125, -4.05126953125, -3.83984375, -3.62841796875, -3.4169921875, -3.20556640625, -2.994140625, -2.78271484375, -2.5712890625, -2.35986328125, -2.1484375, -1.93701171875, -1.7255859375, -1.51416015625, -1.302734375, -1.09130859375, -0.8798828125, -0.66845703125, -0.45703125, -0.24560546875, -0.0341796875, 0.17724609375, 0.388671875, 0.60009765625, 0.8115234375, 1.02294921875, 1.234375, 1.44580078125, 1.6572265625, 1.86865234375, 2.080078125, 2.29150390625, 2.5029296875, 2.71435546875, 2.92578125, 3.13720703125, 3.3486328125, 3.56005859375, 3.771484375, 3.98291015625, 4.1943359375, 4.40576171875, 4.6171875, 4.82861328125, 5.0400390625, 5.25146484375, 5.462890625, 5.67431640625, 5.8857421875, 6.09716796875, 6.30859375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 11.0, 15.0, 22.0, 32.0, 45.0, 81.0, 132.0, 239.0, 383.0, 819.0, 1857.0, 4844.0, 15047.0, 81848.0, 3400880.0, 640020.0, 33620.0, 8549.0, 3156.0, 1293.0, 598.0, 309.0, 175.0, 107.0, 64.0, 41.0, 27.0, 17.0, 18.0, 5.0, 8.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.3125, -41.095703125, -39.87890625, -38.662109375, -37.4453125, -36.228515625, -35.01171875, -33.794921875, -32.578125, -31.361328125, -30.14453125, -28.927734375, -27.7109375, -26.494140625, -25.27734375, -24.060546875, -22.84375, -21.626953125, -20.41015625, -19.193359375, -17.9765625, -16.759765625, -15.54296875, -14.326171875, -13.109375, -11.892578125, -10.67578125, -9.458984375, -8.2421875, -7.025390625, -5.80859375, -4.591796875, -3.375, -2.158203125, -0.94140625, 0.275390625, 1.4921875, 2.708984375, 3.92578125, 5.142578125, 6.359375, 7.576171875, 8.79296875, 10.009765625, 11.2265625, 12.443359375, 13.66015625, 14.876953125, 16.09375, 17.310546875, 18.52734375, 19.744140625, 20.9609375, 22.177734375, 23.39453125, 24.611328125, 25.828125, 27.044921875, 28.26171875, 29.478515625, 30.6953125, 31.912109375, 33.12890625, 34.345703125, 35.5625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 3.0, 10.0, 11.0, 21.0, 19.0, 40.0, 55.0, 101.0, 160.0, 253.0, 427.0, 704.0, 828.0, 590.0, 332.0, 201.0, 121.0, 64.0, 40.0, 30.0, 29.0, 15.0, 8.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.25, -33.221435546875, -32.19287109375, -31.164306640625, -30.1357421875, -29.107177734375, -28.07861328125, -27.050048828125, -26.021484375, -24.992919921875, -23.96435546875, -22.935791015625, -21.9072265625, -20.878662109375, -19.85009765625, -18.821533203125, -17.79296875, -16.764404296875, -15.73583984375, -14.707275390625, -13.6787109375, -12.650146484375, -11.62158203125, -10.593017578125, -9.564453125, -8.535888671875, -7.50732421875, -6.478759765625, -5.4501953125, -4.421630859375, -3.39306640625, -2.364501953125, -1.3359375, -0.307373046875, 0.72119140625, 1.749755859375, 2.7783203125, 3.806884765625, 4.83544921875, 5.864013671875, 6.892578125, 7.921142578125, 8.94970703125, 9.978271484375, 11.0068359375, 12.035400390625, 13.06396484375, 14.092529296875, 15.12109375, 16.149658203125, 17.17822265625, 18.206787109375, 19.2353515625, 20.263916015625, 21.29248046875, 22.321044921875, 23.349609375, 24.378173828125, 25.40673828125, 26.435302734375, 27.4638671875, 28.492431640625, 29.52099609375, 30.549560546875, 31.578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 8.0, 5.0, 11.0, 18.0, 19.0, 25.0, 51.0, 85.0, 118.0, 208.0, 425.0, 1958.0, 3494723.0, 694082.0, 1523.0, 433.0, 216.0, 133.0, 71.0, 59.0, 23.0, 31.0, 17.0, 15.0, 5.0, 5.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.125, -93.845703125, -89.56640625, -85.287109375, -81.0078125, -76.728515625, -72.44921875, -68.169921875, -63.890625, -59.611328125, -55.33203125, -51.052734375, -46.7734375, -42.494140625, -38.21484375, -33.935546875, -29.65625, -25.376953125, -21.09765625, -16.818359375, -12.5390625, -8.259765625, -3.98046875, 0.298828125, 4.578125, 8.857421875, 13.13671875, 17.416015625, 21.6953125, 25.974609375, 30.25390625, 34.533203125, 38.8125, 43.091796875, 47.37109375, 51.650390625, 55.9296875, 60.208984375, 64.48828125, 68.767578125, 73.046875, 77.326171875, 81.60546875, 85.884765625, 90.1640625, 94.443359375, 98.72265625, 103.001953125, 107.28125, 111.560546875, 115.83984375, 120.119140625, 124.3984375, 128.677734375, 132.95703125, 137.236328125, 141.515625, 145.794921875, 150.07421875, 154.353515625, 158.6328125, 162.912109375, 167.19140625, 171.470703125, 175.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 82.0, 619.0, 298.0, 12.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-526.989501953125, -517.1840209960938, -507.37847900390625, -497.5729675292969, -487.7674560546875, -477.9619445800781, -468.15643310546875, -458.3509521484375, -448.54541015625, -438.7398986816406, -428.93438720703125, -419.1288757324219, -409.3233642578125, -399.5178527832031, -389.71234130859375, -379.9068603515625, -370.1013488769531, -360.29583740234375, -350.4903259277344, -340.684814453125, -330.8793029785156, -321.07379150390625, -311.2682800292969, -301.4627685546875, -291.65728759765625, -281.8517761230469, -272.0462646484375, -262.2407531738281, -252.43524169921875, -242.62973022460938, -232.82423400878906, -223.0187225341797, -213.2132110595703, -203.40769958496094, -193.60218811035156, -183.7966766357422, -173.99118041992188, -164.1856689453125, -154.38015747070312, -144.57464599609375, -134.76913452148438, -124.963623046875, -115.15811157226562, -105.35260772705078, -95.5470962524414, -85.74158477783203, -75.93608093261719, -66.13056945800781, -56.32505798339844, -46.51954650878906, -36.71403884887695, -26.90852928161621, -17.10301971435547, -7.297508239746094, 2.5079994201660156, 12.313507080078125, 22.1190185546875, 31.924528121948242, 41.730037689208984, 51.535545349121094, 61.34105682373047, 71.14656829833984, 80.95207214355469, 90.75758361816406, 100.56309509277344]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 4.0, 2.0, 5.0, 5.0, 4.0, 5.0, 7.0, 11.0, 22.0, 24.0, 18.0, 30.0, 25.0, 38.0, 40.0, 42.0, 41.0, 45.0, 55.0, 54.0, 46.0, 43.0, 50.0, 53.0, 42.0, 34.0, 43.0, 25.0, 32.0, 20.0, 31.0, 24.0, 21.0, 22.0, 12.0, 7.0, 7.0, 4.0, 10.0, 3.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.2261962890625, -72.79197692871094, -70.35775756835938, -67.92353057861328, -65.48931121826172, -63.055091857910156, -60.620872497558594, -58.18665313720703, -55.7524299621582, -53.31821060180664, -50.88398742675781, -48.44976806640625, -46.01554870605469, -43.58132553100586, -41.1471061706543, -38.71288299560547, -36.278663635253906, -33.844444274902344, -31.410221099853516, -28.976001739501953, -26.541780471801758, -24.107559204101562, -21.67333984375, -19.239118576049805, -16.80489730834961, -14.370676040649414, -11.936455726623535, -9.502235412597656, -7.068014144897461, -4.633792877197266, -2.1995725631713867, 0.2346477508544922, 2.6688613891601562, 5.103082180023193, 7.5373029708862305, 9.97152328491211, 12.405744552612305, 14.8399658203125, 17.274185180664062, 19.708406448364258, 22.142627716064453, 24.57684898376465, 27.011070251464844, 29.445289611816406, 31.8795108795166, 34.3137321472168, 36.74795150756836, 39.18217468261719, 41.61639404296875, 44.05061340332031, 46.48483657836914, 48.9190559387207, 51.35327911376953, 53.787498474121094, 56.221717834472656, 58.65593719482422, 61.09016036987305, 63.52437973022461, 65.95860290527344, 68.392822265625, 70.82704162597656, 73.26126098632812, 75.69548797607422, 78.12970733642578, 80.56392669677734]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 16.0, 17.0, 17.0, 23.0, 19.0, 19.0, 27.0, 38.0, 34.0, 41.0, 47.0, 43.0, 43.0, 36.0, 49.0, 52.0, 64.0, 41.0, 48.0, 41.0, 42.0, 36.0, 36.0, 25.0, 34.0, 22.0, 16.0, 16.0, 19.0, 9.0, 7.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.01800537109375, -5.8172607421875, -5.61651611328125, -5.415771484375, -5.21502685546875, -5.0142822265625, -4.81353759765625, -4.61279296875, -4.41204833984375, -4.2113037109375, -4.01055908203125, -3.809814453125, -3.60906982421875, -3.4083251953125, -3.20758056640625, -3.0068359375, -2.80609130859375, -2.6053466796875, -2.40460205078125, -2.203857421875, -2.00311279296875, -1.8023681640625, -1.60162353515625, -1.40087890625, -1.20013427734375, -0.9993896484375, -0.79864501953125, -0.597900390625, -0.39715576171875, -0.1964111328125, 0.00433349609375, 0.205078125, 0.40582275390625, 0.6065673828125, 0.80731201171875, 1.008056640625, 1.20880126953125, 1.4095458984375, 1.61029052734375, 1.81103515625, 2.01177978515625, 2.2125244140625, 2.41326904296875, 2.614013671875, 2.81475830078125, 3.0155029296875, 3.21624755859375, 3.4169921875, 3.61773681640625, 3.8184814453125, 4.01922607421875, 4.219970703125, 4.42071533203125, 4.6214599609375, 4.82220458984375, 5.02294921875, 5.22369384765625, 5.4244384765625, 5.62518310546875, 5.825927734375, 6.02667236328125, 6.2274169921875, 6.42816162109375, 6.62890625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 14.0, 11.0, 26.0, 49.0, 61.0, 105.0, 136.0, 232.0, 335.0, 551.0, 846.0, 1300.0, 2074.0, 3348.0, 5380.0, 8925.0, 14475.0, 24006.0, 39963.0, 66798.0, 109409.0, 176064.0, 225560.0, 144446.0, 88432.0, 53493.0, 32439.0, 19450.0, 11754.0, 7115.0, 4385.0, 2761.0, 1677.0, 1039.0, 665.0, 408.0, 253.0, 196.0, 111.0, 67.0, 54.0, 48.0, 24.0, 20.0, 18.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.85546875, -0.8289718627929688, -0.8024749755859375, -0.7759780883789062, -0.749481201171875, -0.7229843139648438, -0.6964874267578125, -0.6699905395507812, -0.64349365234375, -0.6169967651367188, -0.5904998779296875, -0.5640029907226562, -0.537506103515625, -0.5110092163085938, -0.4845123291015625, -0.45801544189453125, -0.4315185546875, -0.40502166748046875, -0.3785247802734375, -0.35202789306640625, -0.325531005859375, -0.29903411865234375, -0.2725372314453125, -0.24604034423828125, -0.21954345703125, -0.19304656982421875, -0.1665496826171875, -0.14005279541015625, -0.113555908203125, -0.08705902099609375, -0.0605621337890625, -0.03406524658203125, -0.007568359375, 0.01892852783203125, 0.0454254150390625, 0.07192230224609375, 0.098419189453125, 0.12491607666015625, 0.1514129638671875, 0.17790985107421875, 0.20440673828125, 0.23090362548828125, 0.2574005126953125, 0.28389739990234375, 0.310394287109375, 0.33689117431640625, 0.3633880615234375, 0.38988494873046875, 0.4163818359375, 0.44287872314453125, 0.4693756103515625, 0.49587249755859375, 0.522369384765625, 0.5488662719726562, 0.5753631591796875, 0.6018600463867188, 0.62835693359375, 0.6548538208007812, 0.6813507080078125, 0.7078475952148438, 0.734344482421875, 0.7608413696289062, 0.7873382568359375, 0.8138351440429688, 0.84033203125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 7.0, 1.0, 6.0, 3.0, 8.0, 15.0, 7.0, 17.0, 10.0, 14.0, 25.0, 33.0, 34.0, 19.0, 26.0, 34.0, 40.0, 35.0, 39.0, 47.0, 36.0, 1061.0, 51.0, 46.0, 40.0, 45.0, 42.0, 42.0, 32.0, 29.0, 29.0, 18.0, 20.0, 19.0, 23.0, 16.0, 10.0, 15.0, 7.0, 5.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.576171875, -3.466796875, -3.357421875, -3.248046875, -3.138671875, -3.029296875, -2.919921875, -2.810546875, -2.701171875, -2.591796875, -2.482421875, -2.373046875, -2.263671875, -2.154296875, -2.044921875, -1.935546875, -1.826171875, -1.716796875, -1.607421875, -1.498046875, -1.388671875, -1.279296875, -1.169921875, -1.060546875, -0.951171875, -0.841796875, -0.732421875, -0.623046875, -0.513671875, -0.404296875, -0.294921875, -0.185546875, -0.076171875, 0.033203125, 0.142578125, 0.251953125, 0.361328125, 0.470703125, 0.580078125, 0.689453125, 0.798828125, 0.908203125, 1.017578125, 1.126953125, 1.236328125, 1.345703125, 1.455078125, 1.564453125, 1.673828125, 1.783203125, 1.892578125, 2.001953125, 2.111328125, 2.220703125, 2.330078125, 2.439453125, 2.548828125, 2.658203125, 2.767578125, 2.876953125, 2.986328125, 3.095703125, 3.205078125, 3.314453125, 3.423828125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 1.0, 2.0, 8.0, 6.0, 14.0, 21.0, 32.0, 40.0, 60.0, 104.0, 150.0, 224.0, 330.0, 512.0, 776.0, 1231.0, 1898.0, 2983.0, 4656.0, 7609.0, 11910.0, 19415.0, 31709.0, 51009.0, 83708.0, 133248.0, 1253794.0, 185341.0, 116215.0, 72561.0, 44711.0, 27564.0, 16985.0, 10397.0, 6547.0, 4056.0, 2569.0, 1624.0, 1060.0, 692.0, 474.0, 299.0, 212.0, 136.0, 87.0, 47.0, 40.0, 24.0, 17.0, 18.0, 9.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65576171875, -0.6337966918945312, -0.6118316650390625, -0.5898666381835938, -0.567901611328125, -0.5459365844726562, -0.5239715576171875, -0.5020065307617188, -0.48004150390625, -0.45807647705078125, -0.4361114501953125, -0.41414642333984375, -0.392181396484375, -0.37021636962890625, -0.3482513427734375, -0.32628631591796875, -0.3043212890625, -0.28235626220703125, -0.2603912353515625, -0.23842620849609375, -0.216461181640625, -0.19449615478515625, -0.1725311279296875, -0.15056610107421875, -0.12860107421875, -0.10663604736328125, -0.0846710205078125, -0.06270599365234375, -0.040740966796875, -0.01877593994140625, 0.0031890869140625, 0.02515411376953125, 0.047119140625, 0.06908416748046875, 0.0910491943359375, 0.11301422119140625, 0.134979248046875, 0.15694427490234375, 0.1789093017578125, 0.20087432861328125, 0.22283935546875, 0.24480438232421875, 0.2667694091796875, 0.28873443603515625, 0.310699462890625, 0.33266448974609375, 0.3546295166015625, 0.37659454345703125, 0.3985595703125, 0.42052459716796875, 0.4424896240234375, 0.46445465087890625, 0.486419677734375, 0.5083847045898438, 0.5303497314453125, 0.5523147583007812, 0.57427978515625, 0.5962448120117188, 0.6182098388671875, 0.6401748657226562, 0.662139892578125, 0.6841049194335938, 0.7060699462890625, 0.7280349731445312, 0.75]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 8.0, 8.0, 9.0, 17.0, 14.0, 25.0, 18.0, 33.0, 46.0, 50.0, 73.0, 59.0, 70.0, 85.0, 88.0, 79.0, 60.0, 51.0, 45.0, 36.0, 27.0, 17.0, 11.0, 19.0, 11.0, 11.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0014743804931640625, -0.001429229974746704, -0.0013840794563293457, -0.0013389289379119873, -0.001293778419494629, -0.0012486279010772705, -0.0012034773826599121, -0.0011583268642425537, -0.0011131763458251953, -0.001068025827407837, -0.0010228753089904785, -0.0009777247905731201, -0.0009325742721557617, -0.0008874237537384033, -0.0008422732353210449, -0.0007971227169036865, -0.0007519721984863281, -0.0007068216800689697, -0.0006616711616516113, -0.0006165206432342529, -0.0005713701248168945, -0.0005262196063995361, -0.00048106908798217773, -0.00043591856956481934, -0.00039076805114746094, -0.00034561753273010254, -0.00030046701431274414, -0.00025531649589538574, -0.00021016597747802734, -0.00016501545906066895, -0.00011986494064331055, -7.471442222595215e-05, -2.956390380859375e-05, 1.558661460876465e-05, 6.073713302612305e-05, 0.00010588765144348145, 0.00015103816986083984, 0.00019618868827819824, 0.00024133920669555664, 0.00028648972511291504, 0.00033164024353027344, 0.00037679076194763184, 0.00042194128036499023, 0.00046709179878234863, 0.000512242317199707, 0.0005573928356170654, 0.0006025433540344238, 0.0006476938724517822, 0.0006928443908691406, 0.000737994909286499, 0.0007831454277038574, 0.0008282959461212158, 0.0008734464645385742, 0.0009185969829559326, 0.000963747501373291, 0.0010088980197906494, 0.0010540485382080078, 0.0010991990566253662, 0.0011443495750427246, 0.001189500093460083, 0.0012346506118774414, 0.0012798011302947998, 0.0013249516487121582, 0.0013701021671295166, 0.001415252685546875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 7.0, 12.0, 20.0, 14.0, 19.0, 22.0, 34.0, 43.0, 48.0, 69.0, 123.0, 164.0, 181.0, 264.0, 642.0, 8181.0, 1034501.0, 2754.0, 499.0, 268.0, 199.0, 116.0, 86.0, 74.0, 47.0, 35.0, 23.0, 14.0, 17.0, 12.0, 12.0, 18.0, 7.0, 6.0, 1.0, 6.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025634765625, -0.024762630462646484, -0.02389049530029297, -0.023018360137939453, -0.022146224975585938, -0.021274089813232422, -0.020401954650878906, -0.01952981948852539, -0.018657684326171875, -0.01778554916381836, -0.016913414001464844, -0.016041278839111328, -0.015169143676757812, -0.014297008514404297, -0.013424873352050781, -0.012552738189697266, -0.01168060302734375, -0.010808467864990234, -0.009936332702636719, -0.009064197540283203, -0.008192062377929688, -0.007319927215576172, -0.006447792053222656, -0.005575656890869141, -0.004703521728515625, -0.0038313865661621094, -0.0029592514038085938, -0.002087116241455078, -0.0012149810791015625, -0.0003428459167480469, 0.0005292892456054688, 0.0014014244079589844, 0.0022735595703125, 0.0031456947326660156, 0.004017829895019531, 0.004889965057373047, 0.0057621002197265625, 0.006634235382080078, 0.007506370544433594, 0.00837850570678711, 0.009250640869140625, 0.01012277603149414, 0.010994911193847656, 0.011867046356201172, 0.012739181518554688, 0.013611316680908203, 0.014483451843261719, 0.015355587005615234, 0.01622772216796875, 0.017099857330322266, 0.01797199249267578, 0.018844127655029297, 0.019716262817382812, 0.020588397979736328, 0.021460533142089844, 0.02233266830444336, 0.023204803466796875, 0.02407693862915039, 0.024949073791503906, 0.025821208953857422, 0.026693344116210938, 0.027565479278564453, 0.02843761444091797, 0.029309749603271484, 0.030181884765625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 47.0, 370.0, 497.0, 81.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0035810621920973063, -0.0034896391443908215, -0.0033982160966843367, -0.003306793048977852, -0.0032153702341020107, -0.003123947186395526, -0.003032524138689041, -0.0029411010909825563, -0.0028496780432760715, -0.0027582549955695868, -0.002666831947863102, -0.002575408900156617, -0.0024839858524501324, -0.0023925630375742912, -0.0023011399898678064, -0.0022097169421613216, -0.002118293894454837, -0.002026870846748352, -0.0019354477990418673, -0.0018440248677507043, -0.0017526018200442195, -0.0016611787723377347, -0.0015697558410465717, -0.001478332793340087, -0.0013869097456336021, -0.0012954866979271173, -0.0012040636502206326, -0.0011126407189294696, -0.0010212176712229848, -0.0009297946235165, -0.0008383716340176761, -0.0007469486445188522, -0.0006555255968123674, -0.0005641025491058826, -0.00047267955960705876, -0.0003812565410044044, -0.0002898335224017501, -0.00019841050379909575, -0.00010698748519644141, -1.556449569761753e-05, 7.585855200886726e-05, 0.0001672815706115216, 0.00025870458921417594, 0.0003501276078168303, 0.0004415506264194846, 0.0005329736741259694, 0.0006243966636247933, 0.0007158196531236172, 0.000807242700830102, 0.0008986657485365868, 0.0009900887962430716, 0.0010815117275342345, 0.0011729347752407193, 0.0012643578229472041, 0.001355780754238367, 0.0014472038019448519, 0.0015386268496513367, 0.0016300498973578215, 0.0017214729450643063, 0.0018128958763554692, 0.001904318924061954, 0.001995741855353117, 0.002087164903059602, 0.0021785879507660866, 0.0022700109984725714]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 4.0, 12.0, 9.0, 11.0, 17.0, 18.0, 22.0, 22.0, 41.0, 27.0, 26.0, 21.0, 39.0, 29.0, 40.0, 38.0, 45.0, 46.0, 47.0, 53.0, 49.0, 40.0, 29.0, 37.0, 24.0, 34.0, 37.0, 24.0, 22.0, 21.0, 15.0, 21.0, 10.0, 12.0, 9.0, 9.0, 6.0, 11.0, 5.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0005835890769958496, -0.0005641374737024307, -0.0005446858704090118, -0.000525234267115593, -0.0005057826638221741, -0.0004863310605287552, -0.0004668794572353363, -0.0004474278539419174, -0.00042797625064849854, -0.00040852464735507965, -0.00038907304406166077, -0.0003696214407682419, -0.000350169837474823, -0.0003307182341814041, -0.00031126663088798523, -0.00029181502759456635, -0.00027236342430114746, -0.0002529118210077286, -0.0002334602177143097, -0.0002140086144208908, -0.00019455701112747192, -0.00017510540783405304, -0.00015565380454063416, -0.00013620220124721527, -0.00011675059795379639, -9.72989946603775e-05, -7.784739136695862e-05, -5.8395788073539734e-05, -3.894418478012085e-05, -1.9492581486701965e-05, -4.0978193283081055e-08, 1.9410625100135803e-05, 3.886222839355469e-05, 5.831383168697357e-05, 7.776543498039246e-05, 9.721703827381134e-05, 0.00011666864156723022, 0.0001361202448606491, 0.000155571848154068, 0.00017502345144748688, 0.00019447505474090576, 0.00021392665803432465, 0.00023337826132774353, 0.0002528298646211624, 0.0002722814679145813, 0.0002917330712080002, 0.00031118467450141907, 0.00033063627779483795, 0.00035008788108825684, 0.0003695394843816757, 0.0003889910876750946, 0.0004084426909685135, 0.0004278942942619324, 0.00044734589755535126, 0.00046679750084877014, 0.000486249104142189, 0.0005057007074356079, 0.0005251523107290268, 0.0005446039140224457, 0.0005640555173158646, 0.0005835071206092834, 0.0006029587239027023, 0.0006224103271961212, 0.0006418619304895401, 0.000661313533782959]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 16.0, 17.0, 17.0, 23.0, 19.0, 19.0, 27.0, 38.0, 34.0, 41.0, 47.0, 43.0, 43.0, 36.0, 49.0, 52.0, 64.0, 41.0, 48.0, 41.0, 42.0, 36.0, 36.0, 25.0, 34.0, 22.0, 16.0, 16.0, 19.0, 9.0, 7.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.21875, -6.01800537109375, -5.8172607421875, -5.61651611328125, -5.415771484375, -5.21502685546875, -5.0142822265625, -4.81353759765625, -4.61279296875, -4.41204833984375, -4.2113037109375, -4.01055908203125, -3.809814453125, -3.60906982421875, -3.4083251953125, -3.20758056640625, -3.0068359375, -2.80609130859375, -2.6053466796875, -2.40460205078125, -2.203857421875, -2.00311279296875, -1.8023681640625, -1.60162353515625, -1.40087890625, -1.20013427734375, -0.9993896484375, -0.79864501953125, -0.597900390625, -0.39715576171875, -0.1964111328125, 0.00433349609375, 0.205078125, 0.40582275390625, 0.6065673828125, 0.80731201171875, 1.008056640625, 1.20880126953125, 1.4095458984375, 1.61029052734375, 1.81103515625, 2.01177978515625, 2.2125244140625, 2.41326904296875, 2.614013671875, 2.81475830078125, 3.0155029296875, 3.21624755859375, 3.4169921875, 3.61773681640625, 3.8184814453125, 4.01922607421875, 4.219970703125, 4.42071533203125, 4.6214599609375, 4.82220458984375, 5.02294921875, 5.22369384765625, 5.4244384765625, 5.62518310546875, 5.825927734375, 6.02667236328125, 6.2274169921875, 6.42816162109375, 6.62890625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 8.0, 13.0, 10.0, 22.0, 32.0, 47.0, 61.0, 85.0, 132.0, 197.0, 293.0, 442.0, 809.0, 1523.0, 3349.0, 9449.0, 33706.0, 160917.0, 589902.0, 190129.0, 39143.0, 10620.0, 3719.0, 1649.0, 835.0, 518.0, 293.0, 203.0, 138.0, 101.0, 70.0, 46.0, 24.0, 20.0, 19.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.28515625, -6.0859375, -5.88671875, -5.6875, -5.48828125, -5.2890625, -5.08984375, -4.890625, -4.69140625, -4.4921875, -4.29296875, -4.09375, -3.89453125, -3.6953125, -3.49609375, -3.296875, -3.09765625, -2.8984375, -2.69921875, -2.5, -2.30078125, -2.1015625, -1.90234375, -1.703125, -1.50390625, -1.3046875, -1.10546875, -0.90625, -0.70703125, -0.5078125, -0.30859375, -0.109375, 0.08984375, 0.2890625, 0.48828125, 0.6875, 0.88671875, 1.0859375, 1.28515625, 1.484375, 1.68359375, 1.8828125, 2.08203125, 2.28125, 2.48046875, 2.6796875, 2.87890625, 3.078125, 3.27734375, 3.4765625, 3.67578125, 3.875, 4.07421875, 4.2734375, 4.47265625, 4.671875, 4.87109375, 5.0703125, 5.26953125, 5.46875, 5.66796875, 5.8671875, 6.06640625, 6.265625, 6.46484375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 2.0, 9.0, 9.0, 4.0, 14.0, 13.0, 21.0, 18.0, 18.0, 26.0, 40.0, 29.0, 45.0, 48.0, 47.0, 51.0, 64.0, 354.0, 1728.0, 91.0, 63.0, 40.0, 23.0, 52.0, 41.0, 34.0, 25.0, 26.0, 18.0, 16.0, 18.0, 16.0, 9.0, 6.0, 7.0, 8.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.890625, -22.219970703125, -21.54931640625, -20.878662109375, -20.2080078125, -19.537353515625, -18.86669921875, -18.196044921875, -17.525390625, -16.854736328125, -16.18408203125, -15.513427734375, -14.8427734375, -14.172119140625, -13.50146484375, -12.830810546875, -12.16015625, -11.489501953125, -10.81884765625, -10.148193359375, -9.4775390625, -8.806884765625, -8.13623046875, -7.465576171875, -6.794921875, -6.124267578125, -5.45361328125, -4.782958984375, -4.1123046875, -3.441650390625, -2.77099609375, -2.100341796875, -1.4296875, -0.759033203125, -0.08837890625, 0.582275390625, 1.2529296875, 1.923583984375, 2.59423828125, 3.264892578125, 3.935546875, 4.606201171875, 5.27685546875, 5.947509765625, 6.6181640625, 7.288818359375, 7.95947265625, 8.630126953125, 9.30078125, 9.971435546875, 10.64208984375, 11.312744140625, 11.9833984375, 12.654052734375, 13.32470703125, 13.995361328125, 14.666015625, 15.336669921875, 16.00732421875, 16.677978515625, 17.3486328125, 18.019287109375, 18.68994140625, 19.360595703125, 20.03125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 5.0, 8.0, 7.0, 13.0, 14.0, 15.0, 12.0, 20.0, 24.0, 22.0, 48.0, 50.0, 74.0, 68.0, 127.0, 356.0, 1040.0, 47212.0, 3092069.0, 3242.0, 563.0, 218.0, 108.0, 81.0, 64.0, 40.0, 40.0, 28.0, 23.0, 20.0, 16.0, 12.0, 17.0, 8.0, 5.0, 6.0, 6.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.6875, -42.24365234375, -40.7998046875, -39.35595703125, -37.912109375, -36.46826171875, -35.0244140625, -33.58056640625, -32.13671875, -30.69287109375, -29.2490234375, -27.80517578125, -26.361328125, -24.91748046875, -23.4736328125, -22.02978515625, -20.5859375, -19.14208984375, -17.6982421875, -16.25439453125, -14.810546875, -13.36669921875, -11.9228515625, -10.47900390625, -9.03515625, -7.59130859375, -6.1474609375, -4.70361328125, -3.259765625, -1.81591796875, -0.3720703125, 1.07177734375, 2.515625, 3.95947265625, 5.4033203125, 6.84716796875, 8.291015625, 9.73486328125, 11.1787109375, 12.62255859375, 14.06640625, 15.51025390625, 16.9541015625, 18.39794921875, 19.841796875, 21.28564453125, 22.7294921875, 24.17333984375, 25.6171875, 27.06103515625, 28.5048828125, 29.94873046875, 31.392578125, 32.83642578125, 34.2802734375, 35.72412109375, 37.16796875, 38.61181640625, 40.0556640625, 41.49951171875, 42.943359375, 44.38720703125, 45.8310546875, 47.27490234375, 48.71875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 27.0, 778.0, 207.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.676727294921875, -34.175716400146484, -30.674705505371094, -27.17369270324707, -23.67268180847168, -20.17167091369629, -16.670658111572266, -13.169647216796875, -9.668636322021484, -6.1676249504089355, -2.6666135787963867, 0.8343982696533203, 4.335409164428711, 7.836420059204102, 11.337432861328125, 14.838443756103516, 18.339454650878906, 21.840465545654297, 25.341476440429688, 28.84248924255371, 32.34349822998047, 35.844512939453125, 39.345523834228516, 42.846534729003906, 46.3475456237793, 49.84855651855469, 53.34956741333008, 56.85057830810547, 60.351593017578125, 63.85260009765625, 67.3536148071289, 70.85462951660156, 74.35563659667969, 77.85665130615234, 81.35765838623047, 84.85867309570312, 88.35968017578125, 91.8606948852539, 95.36170959472656, 98.86271667480469, 102.36372375488281, 105.86473846435547, 109.3657455444336, 112.86676025390625, 116.36776733398438, 119.86878204345703, 123.36979675292969, 126.87080383300781, 130.371826171875, 133.87283325195312, 137.3738555908203, 140.87486267089844, 144.37586975097656, 147.8768768310547, 151.37789916992188, 154.87890625, 158.37991333007812, 161.88092041015625, 165.38194274902344, 168.88294982910156, 172.3839569091797, 175.8849639892578, 179.385986328125, 182.88699340820312, 186.38800048828125]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 6.0, 6.0, 8.0, 9.0, 7.0, 16.0, 19.0, 18.0, 19.0, 27.0, 25.0, 38.0, 44.0, 38.0, 41.0, 46.0, 54.0, 30.0, 51.0, 53.0, 47.0, 39.0, 52.0, 50.0, 28.0, 40.0, 36.0, 37.0, 21.0, 18.0, 16.0, 12.0, 18.0, 9.0, 3.0, 8.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.67066955566406, -55.525943756103516, -53.38121795654297, -51.23649215698242, -49.091766357421875, -46.94703674316406, -44.802310943603516, -42.65758514404297, -40.51285934448242, -38.368133544921875, -36.22340774536133, -34.07868194580078, -31.9339542388916, -29.789228439331055, -27.644500732421875, -25.499774932861328, -23.35504913330078, -21.210323333740234, -19.065597534179688, -16.920869827270508, -14.776144027709961, -12.631418228149414, -10.48669147491455, -8.341964721679688, -6.197238922119141, -4.0525126457214355, -1.9077863693237305, 0.2369399070739746, 2.3816661834716797, 4.526391983032227, 6.67111873626709, 8.815845489501953, 10.9605712890625, 13.105297088623047, 15.25002384185791, 17.394750595092773, 19.53947639465332, 21.684202194213867, 23.828929901123047, 25.973655700683594, 28.11838150024414, 30.263107299804688, 32.407833099365234, 34.55255889892578, 36.697288513183594, 38.842010498046875, 40.98674011230469, 43.131465911865234, 45.27619171142578, 47.42091751098633, 49.565643310546875, 51.71036911010742, 53.85509490966797, 55.99982452392578, 58.14455032348633, 60.289276123046875, 62.43400192260742, 64.57872772216797, 66.72345733642578, 68.86817932128906, 71.01290893554688, 73.15763092041016, 75.30236053466797, 77.44708251953125, 79.59181213378906]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 8.0, 18.0, 13.0, 17.0, 22.0, 21.0, 20.0, 25.0, 33.0, 48.0, 30.0, 49.0, 45.0, 40.0, 38.0, 52.0, 62.0, 44.0, 46.0, 43.0, 55.0, 34.0, 42.0, 31.0, 29.0, 27.0, 27.0, 13.0, 13.0, 17.0, 9.0, 11.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.11328125, -5.90863037109375, -5.7039794921875, -5.49932861328125, -5.294677734375, -5.09002685546875, -4.8853759765625, -4.68072509765625, -4.47607421875, -4.27142333984375, -4.0667724609375, -3.86212158203125, -3.657470703125, -3.45281982421875, -3.2481689453125, -3.04351806640625, -2.8388671875, -2.63421630859375, -2.4295654296875, -2.22491455078125, -2.020263671875, -1.81561279296875, -1.6109619140625, -1.40631103515625, -1.20166015625, -0.99700927734375, -0.7923583984375, -0.58770751953125, -0.383056640625, -0.17840576171875, 0.0262451171875, 0.23089599609375, 0.435546875, 0.64019775390625, 0.8448486328125, 1.04949951171875, 1.254150390625, 1.45880126953125, 1.6634521484375, 1.86810302734375, 2.07275390625, 2.27740478515625, 2.4820556640625, 2.68670654296875, 2.891357421875, 3.09600830078125, 3.3006591796875, 3.50531005859375, 3.7099609375, 3.91461181640625, 4.1192626953125, 4.32391357421875, 4.528564453125, 4.73321533203125, 4.9378662109375, 5.14251708984375, 5.34716796875, 5.55181884765625, 5.7564697265625, 5.96112060546875, 6.165771484375, 6.37042236328125, 6.5750732421875, 6.77972412109375, 6.984375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 3.0, 8.0, 13.0, 5.0, 15.0, 22.0, 25.0, 37.0, 41.0, 65.0, 100.0, 141.0, 274.0, 667.0, 2686.0, 21747.0, 643685.0, 3342953.0, 169786.0, 9406.0, 1518.0, 476.0, 212.0, 121.0, 73.0, 47.0, 30.0, 35.0, 27.0, 19.0, 10.0, 9.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.4375, -24.696533203125, -23.95556640625, -23.214599609375, -22.4736328125, -21.732666015625, -20.99169921875, -20.250732421875, -19.509765625, -18.768798828125, -18.02783203125, -17.286865234375, -16.5458984375, -15.804931640625, -15.06396484375, -14.322998046875, -13.58203125, -12.841064453125, -12.10009765625, -11.359130859375, -10.6181640625, -9.877197265625, -9.13623046875, -8.395263671875, -7.654296875, -6.913330078125, -6.17236328125, -5.431396484375, -4.6904296875, -3.949462890625, -3.20849609375, -2.467529296875, -1.7265625, -0.985595703125, -0.24462890625, 0.496337890625, 1.2373046875, 1.978271484375, 2.71923828125, 3.460205078125, 4.201171875, 4.942138671875, 5.68310546875, 6.424072265625, 7.1650390625, 7.906005859375, 8.64697265625, 9.387939453125, 10.12890625, 10.869873046875, 11.61083984375, 12.351806640625, 13.0927734375, 13.833740234375, 14.57470703125, 15.315673828125, 16.056640625, 16.797607421875, 17.53857421875, 18.279541015625, 19.0205078125, 19.761474609375, 20.50244140625, 21.243408203125, 21.984375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 14.0, 25.0, 32.0, 53.0, 89.0, 115.0, 180.0, 268.0, 407.0, 607.0, 660.0, 523.0, 354.0, 265.0, 156.0, 95.0, 75.0, 47.0, 32.0, 17.0, 15.0, 12.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.34375, -24.560546875, -23.77734375, -22.994140625, -22.2109375, -21.427734375, -20.64453125, -19.861328125, -19.078125, -18.294921875, -17.51171875, -16.728515625, -15.9453125, -15.162109375, -14.37890625, -13.595703125, -12.8125, -12.029296875, -11.24609375, -10.462890625, -9.6796875, -8.896484375, -8.11328125, -7.330078125, -6.546875, -5.763671875, -4.98046875, -4.197265625, -3.4140625, -2.630859375, -1.84765625, -1.064453125, -0.28125, 0.501953125, 1.28515625, 2.068359375, 2.8515625, 3.634765625, 4.41796875, 5.201171875, 5.984375, 6.767578125, 7.55078125, 8.333984375, 9.1171875, 9.900390625, 10.68359375, 11.466796875, 12.25, 13.033203125, 13.81640625, 14.599609375, 15.3828125, 16.166015625, 16.94921875, 17.732421875, 18.515625, 19.298828125, 20.08203125, 20.865234375, 21.6484375, 22.431640625, 23.21484375, 23.998046875, 24.78125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 8.0, 7.0, 12.0, 10.0, 31.0, 52.0, 77.0, 122.0, 208.0, 359.0, 780.0, 4845.0, 1651574.0, 2528988.0, 5417.0, 868.0, 365.0, 207.0, 121.0, 75.0, 53.0, 36.0, 22.0, 14.0, 12.0, 7.0, 4.0, 0.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.25, -56.6767578125, -54.103515625, -51.5302734375, -48.95703125, -46.3837890625, -43.810546875, -41.2373046875, -38.6640625, -36.0908203125, -33.517578125, -30.9443359375, -28.37109375, -25.7978515625, -23.224609375, -20.6513671875, -18.078125, -15.5048828125, -12.931640625, -10.3583984375, -7.78515625, -5.2119140625, -2.638671875, -0.0654296875, 2.5078125, 5.0810546875, 7.654296875, 10.2275390625, 12.80078125, 15.3740234375, 17.947265625, 20.5205078125, 23.09375, 25.6669921875, 28.240234375, 30.8134765625, 33.38671875, 35.9599609375, 38.533203125, 41.1064453125, 43.6796875, 46.2529296875, 48.826171875, 51.3994140625, 53.97265625, 56.5458984375, 59.119140625, 61.6923828125, 64.265625, 66.8388671875, 69.412109375, 71.9853515625, 74.55859375, 77.1318359375, 79.705078125, 82.2783203125, 84.8515625, 87.4248046875, 89.998046875, 92.5712890625, 95.14453125, 97.7177734375, 100.291015625, 102.8642578125, 105.4375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 106.0, 490.0, 356.0, 59.0, 5.0], "bins": [-534.0560302734375, -525.2754516601562, -516.494873046875, -507.71429443359375, -498.9337158203125, -490.15313720703125, -481.37255859375, -472.5919494628906, -463.8113708496094, -455.0307922363281, -446.2502136230469, -437.4696350097656, -428.6890563964844, -419.908447265625, -411.12786865234375, -402.3472900390625, -393.56671142578125, -384.7861328125, -376.00555419921875, -367.2249755859375, -358.44439697265625, -349.663818359375, -340.88323974609375, -332.1026306152344, -323.32208251953125, -314.54150390625, -305.76092529296875, -296.9803466796875, -288.19976806640625, -279.419189453125, -270.63861083984375, -261.8580017089844, -253.0774383544922, -244.29685974121094, -235.5162811279297, -226.73568725585938, -217.95510864257812, -209.17453002929688, -200.39395141601562, -191.61337280273438, -182.83277893066406, -174.0522003173828, -165.27162170410156, -156.49102783203125, -147.71044921875, -138.92987060546875, -130.1492919921875, -121.36871337890625, -112.58812713623047, -103.80754852294922, -95.02696228027344, -86.24638366699219, -77.46580505371094, -68.68521881103516, -59.904640197753906, -51.12405776977539, -42.343475341796875, -33.56289291381836, -24.782312393188477, -16.001731872558594, -7.221149444580078, 1.5594329833984375, 10.340011596679688, 19.120594024658203, 27.901174545288086]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 2.0, 4.0, 3.0, 3.0, 8.0, 14.0, 8.0, 8.0, 17.0, 18.0, 27.0, 20.0, 37.0, 24.0, 37.0, 33.0, 17.0, 32.0, 38.0, 27.0, 46.0, 34.0, 41.0, 41.0, 28.0, 35.0, 41.0, 48.0, 38.0, 26.0, 26.0, 29.0, 24.0, 26.0, 16.0, 20.0, 15.0, 10.0, 11.0, 17.0, 6.0, 7.0, 10.0, 6.0, 10.0, 4.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-62.429046630859375, -60.59641647338867, -58.76378631591797, -56.93115997314453, -55.09852981567383, -53.265899658203125, -51.43326950073242, -49.60063934326172, -47.76801300048828, -45.93538284301758, -44.102752685546875, -42.27012634277344, -40.437496185302734, -38.60486602783203, -36.77223587036133, -34.939605712890625, -33.10697555541992, -31.27434539794922, -29.44171714782715, -27.609086990356445, -25.776458740234375, -23.943828582763672, -22.11119842529297, -20.278568267822266, -18.445940017700195, -16.613309860229492, -14.780681610107422, -12.948051452636719, -11.115422248840332, -9.282793045043945, -7.450162887573242, -5.6175336837768555, -3.7849044799804688, -1.952275037765503, -0.11964559555053711, 1.7129840850830078, 3.5456132888793945, 5.378242492675781, 7.210872650146484, 9.043501853942871, 10.876131057739258, 12.708760261535645, 14.541389465332031, 16.374019622802734, 18.206649780273438, 20.039278030395508, 21.87190818786621, 23.70453643798828, 25.537166595458984, 27.369796752929688, 29.202425003051758, 31.03505516052246, 32.86768341064453, 34.700313568115234, 36.53294372558594, 38.36557388305664, 40.198204040527344, 42.03083419799805, 43.86346435546875, 45.69609069824219, 47.52872085571289, 49.361351013183594, 51.1939811706543, 53.026611328125, 54.85923767089844]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 14.0, 10.0, 9.0, 17.0, 10.0, 25.0, 24.0, 27.0, 27.0, 30.0, 32.0, 32.0, 44.0, 43.0, 46.0, 49.0, 45.0, 44.0, 46.0, 57.0, 42.0, 37.0, 49.0, 37.0, 32.0, 34.0, 23.0, 20.0, 23.0, 14.0, 14.0, 8.0, 9.0, 11.0, 6.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.7542724609375, -5.555419921875, -5.3565673828125, -5.15771484375, -4.9588623046875, -4.760009765625, -4.5611572265625, -4.3623046875, -4.1634521484375, -3.964599609375, -3.7657470703125, -3.56689453125, -3.3680419921875, -3.169189453125, -2.9703369140625, -2.771484375, -2.5726318359375, -2.373779296875, -2.1749267578125, -1.97607421875, -1.7772216796875, -1.578369140625, -1.3795166015625, -1.1806640625, -0.9818115234375, -0.782958984375, -0.5841064453125, -0.38525390625, -0.1864013671875, 0.012451171875, 0.2113037109375, 0.41015625, 0.6090087890625, 0.807861328125, 1.0067138671875, 1.20556640625, 1.4044189453125, 1.603271484375, 1.8021240234375, 2.0009765625, 2.1998291015625, 2.398681640625, 2.5975341796875, 2.79638671875, 2.9952392578125, 3.194091796875, 3.3929443359375, 3.591796875, 3.7906494140625, 3.989501953125, 4.1883544921875, 4.38720703125, 4.5860595703125, 4.784912109375, 4.9837646484375, 5.1826171875, 5.3814697265625, 5.580322265625, 5.7791748046875, 5.97802734375, 6.1768798828125, 6.375732421875, 6.5745849609375, 6.7734375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 10.0, 6.0, 7.0, 11.0, 31.0, 31.0, 53.0, 73.0, 128.0, 187.0, 308.0, 481.0, 718.0, 1219.0, 1949.0, 3326.0, 5491.0, 8985.0, 15255.0, 25142.0, 42550.0, 71816.0, 120532.0, 192259.0, 215563.0, 137405.0, 83017.0, 49137.0, 29052.0, 17386.0, 10431.0, 6310.0, 3739.0, 2252.0, 1402.0, 861.0, 544.0, 289.0, 209.0, 128.0, 96.0, 49.0, 42.0, 35.0, 11.0, 17.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0], "bins": [-1.0087890625, -0.9808731079101562, -0.9529571533203125, -0.9250411987304688, -0.897125244140625, -0.8692092895507812, -0.8412933349609375, -0.8133773803710938, -0.78546142578125, -0.7575454711914062, -0.7296295166015625, -0.7017135620117188, -0.673797607421875, -0.6458816528320312, -0.6179656982421875, -0.5900497436523438, -0.5621337890625, -0.5342178344726562, -0.5063018798828125, -0.47838592529296875, -0.450469970703125, -0.42255401611328125, -0.3946380615234375, -0.36672210693359375, -0.33880615234375, -0.31089019775390625, -0.2829742431640625, -0.25505828857421875, -0.227142333984375, -0.19922637939453125, -0.1713104248046875, -0.14339447021484375, -0.115478515625, -0.08756256103515625, -0.0596466064453125, -0.03173065185546875, -0.003814697265625, 0.02410125732421875, 0.0520172119140625, 0.07993316650390625, 0.10784912109375, 0.13576507568359375, 0.1636810302734375, 0.19159698486328125, 0.219512939453125, 0.24742889404296875, 0.2753448486328125, 0.30326080322265625, 0.3311767578125, 0.35909271240234375, 0.3870086669921875, 0.41492462158203125, 0.442840576171875, 0.47075653076171875, 0.4986724853515625, 0.5265884399414062, 0.55450439453125, 0.5824203491210938, 0.6103363037109375, 0.6382522583007812, 0.666168212890625, 0.6940841674804688, 0.7220001220703125, 0.7499160766601562, 0.77783203125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 5.0, 7.0, 13.0, 14.0, 16.0, 22.0, 27.0, 18.0, 27.0, 29.0, 29.0, 33.0, 36.0, 46.0, 42.0, 53.0, 44.0, 45.0, 1068.0, 33.0, 40.0, 32.0, 32.0, 26.0, 31.0, 30.0, 28.0, 34.0, 29.0, 29.0, 20.0, 16.0, 14.0, 10.0, 10.0, 10.0, 4.0, 6.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.908203125, -3.791839599609375, -3.67547607421875, -3.559112548828125, -3.4427490234375, -3.326385498046875, -3.21002197265625, -3.093658447265625, -2.977294921875, -2.860931396484375, -2.74456787109375, -2.628204345703125, -2.5118408203125, -2.395477294921875, -2.27911376953125, -2.162750244140625, -2.04638671875, -1.930023193359375, -1.81365966796875, -1.697296142578125, -1.5809326171875, -1.464569091796875, -1.34820556640625, -1.231842041015625, -1.115478515625, -0.999114990234375, -0.88275146484375, -0.766387939453125, -0.6500244140625, -0.533660888671875, -0.41729736328125, -0.300933837890625, -0.1845703125, -0.068206787109375, 0.04815673828125, 0.164520263671875, 0.2808837890625, 0.397247314453125, 0.51361083984375, 0.629974365234375, 0.746337890625, 0.862701416015625, 0.97906494140625, 1.095428466796875, 1.2117919921875, 1.328155517578125, 1.44451904296875, 1.560882568359375, 1.67724609375, 1.793609619140625, 1.90997314453125, 2.026336669921875, 2.1427001953125, 2.259063720703125, 2.37542724609375, 2.491790771484375, 2.608154296875, 2.724517822265625, 2.84088134765625, 2.957244873046875, 3.0736083984375, 3.189971923828125, 3.30633544921875, 3.422698974609375, 3.5390625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 13.0, 11.0, 8.0, 32.0, 35.0, 52.0, 101.0, 130.0, 201.0, 291.0, 437.0, 679.0, 1078.0, 1655.0, 2535.0, 4038.0, 6038.0, 9627.0, 14721.0, 22083.0, 34451.0, 54376.0, 85770.0, 136089.0, 1251012.0, 171601.0, 108281.0, 68698.0, 43321.0, 28185.0, 18023.0, 11866.0, 7501.0, 4983.0, 3203.0, 2126.0, 1313.0, 904.0, 571.0, 341.0, 255.0, 158.0, 108.0, 67.0, 71.0, 33.0, 26.0, 18.0, 6.0, 10.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7021484375, -0.6800384521484375, -0.657928466796875, -0.6358184814453125, -0.61370849609375, -0.5915985107421875, -0.569488525390625, -0.5473785400390625, -0.5252685546875, -0.5031585693359375, -0.481048583984375, -0.4589385986328125, -0.43682861328125, -0.4147186279296875, -0.392608642578125, -0.3704986572265625, -0.348388671875, -0.3262786865234375, -0.304168701171875, -0.2820587158203125, -0.25994873046875, -0.2378387451171875, -0.215728759765625, -0.1936187744140625, -0.1715087890625, -0.1493988037109375, -0.127288818359375, -0.1051788330078125, -0.08306884765625, -0.0609588623046875, -0.038848876953125, -0.0167388916015625, 0.00537109375, 0.0274810791015625, 0.049591064453125, 0.0717010498046875, 0.09381103515625, 0.1159210205078125, 0.138031005859375, 0.1601409912109375, 0.1822509765625, 0.2043609619140625, 0.226470947265625, 0.2485809326171875, 0.27069091796875, 0.2928009033203125, 0.314910888671875, 0.3370208740234375, 0.359130859375, 0.3812408447265625, 0.403350830078125, 0.4254608154296875, 0.44757080078125, 0.4696807861328125, 0.491790771484375, 0.5139007568359375, 0.5360107421875, 0.5581207275390625, 0.580230712890625, 0.6023406982421875, 0.62445068359375, 0.6465606689453125, 0.668670654296875, 0.6907806396484375, 0.712890625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 7.0, 5.0, 4.0, 5.0, 9.0, 8.0, 14.0, 29.0, 24.0, 27.0, 56.0, 61.0, 80.0, 90.0, 79.0, 99.0, 83.0, 70.0, 58.0, 44.0, 33.0, 29.0, 21.0, 14.0, 13.0, 4.0, 6.0, 7.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001674652099609375, -0.0016166865825653076, -0.0015587210655212402, -0.0015007555484771729, -0.0014427900314331055, -0.001384824514389038, -0.0013268589973449707, -0.0012688934803009033, -0.001210927963256836, -0.0011529624462127686, -0.0010949969291687012, -0.0010370314121246338, -0.0009790658950805664, -0.000921100378036499, -0.0008631348609924316, -0.0008051693439483643, -0.0007472038269042969, -0.0006892383098602295, -0.0006312727928161621, -0.0005733072757720947, -0.0005153417587280273, -0.00045737624168395996, -0.0003994107246398926, -0.0003414452075958252, -0.0002834796905517578, -0.00022551417350769043, -0.00016754865646362305, -0.00010958313941955566, -5.161762237548828e-05, 6.3478946685791016e-06, 6.431341171264648e-05, 0.00012227892875671387, 0.00018024444580078125, 0.00023820996284484863, 0.000296175479888916, 0.0003541409969329834, 0.0004121065139770508, 0.00047007203102111816, 0.0005280375480651855, 0.0005860030651092529, 0.0006439685821533203, 0.0007019340991973877, 0.0007598996162414551, 0.0008178651332855225, 0.0008758306503295898, 0.0009337961673736572, 0.0009917616844177246, 0.001049727201461792, 0.0011076927185058594, 0.0011656582355499268, 0.0012236237525939941, 0.0012815892696380615, 0.001339554786682129, 0.0013975203037261963, 0.0014554858207702637, 0.001513451337814331, 0.0015714168548583984, 0.0016293823719024658, 0.0016873478889465332, 0.0017453134059906006, 0.001803278923034668, 0.0018612444400787354, 0.0019192099571228027, 0.00197717547416687, 0.0020351409912109375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 0.0, 5.0, 6.0, 6.0, 10.0, 7.0, 13.0, 18.0, 20.0, 23.0, 57.0, 72.0, 106.0, 163.0, 295.0, 536.0, 15372.0, 1029790.0, 1100.0, 342.0, 212.0, 120.0, 78.0, 70.0, 36.0, 23.0, 20.0, 10.0, 7.0, 8.0, 8.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.044464111328125, -0.04320240020751953, -0.04194068908691406, -0.040678977966308594, -0.039417266845703125, -0.038155555725097656, -0.03689384460449219, -0.03563213348388672, -0.03437042236328125, -0.03310871124267578, -0.03184700012207031, -0.030585289001464844, -0.029323577880859375, -0.028061866760253906, -0.026800155639648438, -0.02553844451904297, -0.0242767333984375, -0.02301502227783203, -0.021753311157226562, -0.020491600036621094, -0.019229888916015625, -0.017968177795410156, -0.016706466674804688, -0.015444755554199219, -0.01418304443359375, -0.012921333312988281, -0.011659622192382812, -0.010397911071777344, -0.009136199951171875, -0.007874488830566406, -0.0066127777099609375, -0.005351066589355469, -0.00408935546875, -0.0028276443481445312, -0.0015659332275390625, -0.00030422210693359375, 0.000957489013671875, 0.0022192001342773438, 0.0034809112548828125, 0.004742622375488281, 0.00600433349609375, 0.007266044616699219, 0.008527755737304688, 0.009789466857910156, 0.011051177978515625, 0.012312889099121094, 0.013574600219726562, 0.014836311340332031, 0.0160980224609375, 0.01735973358154297, 0.018621444702148438, 0.019883155822753906, 0.021144866943359375, 0.022406578063964844, 0.023668289184570312, 0.02493000030517578, 0.02619171142578125, 0.02745342254638672, 0.028715133666992188, 0.029976844787597656, 0.031238555908203125, 0.032500267028808594, 0.03376197814941406, 0.03502368927001953, 0.036285400390625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 20.0, 409.0, 543.0, 44.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004643936641514301, -0.004494477994740009, -0.004345019347965717, -0.004195560701191425, -0.004046102054417133, -0.0038966434076428413, -0.0037471847608685493, -0.0035977261140942574, -0.0034482674673199654, -0.0032988088205456734, -0.0031493501737713814, -0.0029998915269970894, -0.0028504328802227974, -0.0027009742334485054, -0.0025515155866742134, -0.0024020569398999214, -0.0022525980602949858, -0.0021031394135206938, -0.001953680766746402, -0.0018042221199721098, -0.0016547634731978178, -0.0015053048264235258, -0.001355846063233912, -0.00120638741645962, -0.001056928769685328, -0.000907470122911036, -0.000758011476136744, -0.0006085527711547911, -0.0004590941243804991, -0.00030963547760620713, -0.00016017677262425423, -1.0718125849962234e-05, 0.00013874052092432976, 0.00028819916769862175, 0.0004376578435767442, 0.0005871165194548666, 0.0007365751662291586, 0.0008860338130034506, 0.0010354925179854035, 0.0011849511647596955, 0.0013344098115339875, 0.0014838684583082795, 0.0016333271050825715, 0.0017827858682721853, 0.0019322445150464773, 0.0020817031618207693, 0.0022311618085950613, 0.0023806204553693533, 0.0025300791021436453, 0.0026795377489179373, 0.0028289963956922293, 0.0029784550424665213, 0.0031279136892408133, 0.0032773723360151052, 0.003426831215620041, 0.003576289862394333, 0.003725748509168625, 0.003875207155942917, 0.004024665802717209, 0.004174124449491501, 0.004323583096265793, 0.004473041743040085, 0.004622500389814377, 0.004771959036588669, 0.004921417683362961]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 8.0, 4.0, 5.0, 8.0, 9.0, 3.0, 12.0, 16.0, 15.0, 19.0, 28.0, 24.0, 28.0, 33.0, 22.0, 37.0, 29.0, 41.0, 48.0, 36.0, 47.0, 37.0, 52.0, 42.0, 36.0, 31.0, 38.0, 33.0, 36.0, 34.0, 31.0, 21.0, 17.0, 29.0, 10.0, 10.0, 11.0, 12.0, 12.0, 8.0, 2.0, 3.0, 5.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0007987618446350098, -0.000775020569562912, -0.0007512792944908142, -0.0007275380194187164, -0.0007037967443466187, -0.0006800554692745209, -0.0006563141942024231, -0.0006325729191303253, -0.0006088316440582275, -0.0005850903689861298, -0.000561349093914032, -0.0005376078188419342, -0.0005138665437698364, -0.0004901252686977386, -0.00046638399362564087, -0.0004426427185535431, -0.0004189014434814453, -0.00039516016840934753, -0.00037141889333724976, -0.000347677618265152, -0.0003239363431930542, -0.0003001950681209564, -0.00027645379304885864, -0.00025271251797676086, -0.00022897124290466309, -0.0002052299678325653, -0.00018148869276046753, -0.00015774741768836975, -0.00013400614261627197, -0.0001102648675441742, -8.652359247207642e-05, -6.278231739997864e-05, -3.904104232788086e-05, -1.529976725578308e-05, 8.441507816314697e-06, 3.2182782888412476e-05, 5.5924057960510254e-05, 7.966533303260803e-05, 0.00010340660810470581, 0.0001271478831768036, 0.00015088915824890137, 0.00017463043332099915, 0.00019837170839309692, 0.0002221129834651947, 0.0002458542585372925, 0.00026959553360939026, 0.00029333680868148804, 0.0003170780837535858, 0.0003408193588256836, 0.00036456063389778137, 0.00038830190896987915, 0.00041204318404197693, 0.0004357844591140747, 0.0004595257341861725, 0.00048326700925827026, 0.000507008284330368, 0.0005307495594024658, 0.0005544908344745636, 0.0005782321095466614, 0.0006019733846187592, 0.0006257146596908569, 0.0006494559347629547, 0.0006731972098350525, 0.0006969384849071503, 0.000720679759979248]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 14.0, 10.0, 9.0, 17.0, 10.0, 25.0, 24.0, 27.0, 27.0, 30.0, 32.0, 32.0, 44.0, 43.0, 46.0, 49.0, 45.0, 44.0, 46.0, 57.0, 42.0, 37.0, 49.0, 37.0, 32.0, 34.0, 23.0, 20.0, 23.0, 14.0, 14.0, 8.0, 9.0, 11.0, 6.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.953125, -5.7542724609375, -5.555419921875, -5.3565673828125, -5.15771484375, -4.9588623046875, -4.760009765625, -4.5611572265625, -4.3623046875, -4.1634521484375, -3.964599609375, -3.7657470703125, -3.56689453125, -3.3680419921875, -3.169189453125, -2.9703369140625, -2.771484375, -2.5726318359375, -2.373779296875, -2.1749267578125, -1.97607421875, -1.7772216796875, -1.578369140625, -1.3795166015625, -1.1806640625, -0.9818115234375, -0.782958984375, -0.5841064453125, -0.38525390625, -0.1864013671875, 0.012451171875, 0.2113037109375, 0.41015625, 0.6090087890625, 0.807861328125, 1.0067138671875, 1.20556640625, 1.4044189453125, 1.603271484375, 1.8021240234375, 2.0009765625, 2.1998291015625, 2.398681640625, 2.5975341796875, 2.79638671875, 2.9952392578125, 3.194091796875, 3.3929443359375, 3.591796875, 3.7906494140625, 3.989501953125, 4.1883544921875, 4.38720703125, 4.5860595703125, 4.784912109375, 4.9837646484375, 5.1826171875, 5.3814697265625, 5.580322265625, 5.7791748046875, 5.97802734375, 6.1768798828125, 6.375732421875, 6.5745849609375, 6.7734375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 7.0, 17.0, 43.0, 31.0, 49.0, 97.0, 129.0, 282.0, 395.0, 728.0, 1294.0, 2335.0, 4368.0, 8990.0, 20549.0, 55672.0, 215835.0, 530116.0, 136491.0, 40039.0, 15741.0, 7175.0, 3595.0, 1880.0, 1143.0, 617.0, 342.0, 231.0, 156.0, 72.0, 51.0, 28.0, 19.0, 14.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9140625, -4.77099609375, -4.6279296875, -4.48486328125, -4.341796875, -4.19873046875, -4.0556640625, -3.91259765625, -3.76953125, -3.62646484375, -3.4833984375, -3.34033203125, -3.197265625, -3.05419921875, -2.9111328125, -2.76806640625, -2.625, -2.48193359375, -2.3388671875, -2.19580078125, -2.052734375, -1.90966796875, -1.7666015625, -1.62353515625, -1.48046875, -1.33740234375, -1.1943359375, -1.05126953125, -0.908203125, -0.76513671875, -0.6220703125, -0.47900390625, -0.3359375, -0.19287109375, -0.0498046875, 0.09326171875, 0.236328125, 0.37939453125, 0.5224609375, 0.66552734375, 0.80859375, 0.95166015625, 1.0947265625, 1.23779296875, 1.380859375, 1.52392578125, 1.6669921875, 1.81005859375, 1.953125, 2.09619140625, 2.2392578125, 2.38232421875, 2.525390625, 2.66845703125, 2.8115234375, 2.95458984375, 3.09765625, 3.24072265625, 3.3837890625, 3.52685546875, 3.669921875, 3.81298828125, 3.9560546875, 4.09912109375, 4.2421875]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 3.0, 8.0, 6.0, 7.0, 16.0, 16.0, 10.0, 18.0, 20.0, 24.0, 27.0, 26.0, 34.0, 38.0, 37.0, 39.0, 63.0, 85.0, 1715.0, 336.0, 77.0, 51.0, 45.0, 38.0, 48.0, 37.0, 24.0, 25.0, 26.0, 28.0, 21.0, 20.0, 21.0, 18.0, 11.0, 3.0, 6.0, 5.0, 7.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.109375, -17.435791015625, -16.76220703125, -16.088623046875, -15.4150390625, -14.741455078125, -14.06787109375, -13.394287109375, -12.720703125, -12.047119140625, -11.37353515625, -10.699951171875, -10.0263671875, -9.352783203125, -8.67919921875, -8.005615234375, -7.33203125, -6.658447265625, -5.98486328125, -5.311279296875, -4.6376953125, -3.964111328125, -3.29052734375, -2.616943359375, -1.943359375, -1.269775390625, -0.59619140625, 0.077392578125, 0.7509765625, 1.424560546875, 2.09814453125, 2.771728515625, 3.4453125, 4.118896484375, 4.79248046875, 5.466064453125, 6.1396484375, 6.813232421875, 7.48681640625, 8.160400390625, 8.833984375, 9.507568359375, 10.18115234375, 10.854736328125, 11.5283203125, 12.201904296875, 12.87548828125, 13.549072265625, 14.22265625, 14.896240234375, 15.56982421875, 16.243408203125, 16.9169921875, 17.590576171875, 18.26416015625, 18.937744140625, 19.611328125, 20.284912109375, 20.95849609375, 21.632080078125, 22.3056640625, 22.979248046875, 23.65283203125, 24.326416015625, 25.0]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 3.0, 6.0, 14.0, 19.0, 20.0, 14.0, 28.0, 28.0, 34.0, 37.0, 43.0, 72.0, 92.0, 156.0, 260.0, 556.0, 2719.0, 140098.0, 2990659.0, 8915.0, 1032.0, 323.0, 151.0, 107.0, 78.0, 43.0, 25.0, 34.0, 26.0, 17.0, 16.0, 10.0, 16.0, 15.0, 3.0, 8.0, 7.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0], "bins": [-41.75, -40.628173828125, -39.50634765625, -38.384521484375, -37.2626953125, -36.140869140625, -35.01904296875, -33.897216796875, -32.775390625, -31.653564453125, -30.53173828125, -29.409912109375, -28.2880859375, -27.166259765625, -26.04443359375, -24.922607421875, -23.80078125, -22.678955078125, -21.55712890625, -20.435302734375, -19.3134765625, -18.191650390625, -17.06982421875, -15.947998046875, -14.826171875, -13.704345703125, -12.58251953125, -11.460693359375, -10.3388671875, -9.217041015625, -8.09521484375, -6.973388671875, -5.8515625, -4.729736328125, -3.60791015625, -2.486083984375, -1.3642578125, -0.242431640625, 0.87939453125, 2.001220703125, 3.123046875, 4.244873046875, 5.36669921875, 6.488525390625, 7.6103515625, 8.732177734375, 9.85400390625, 10.975830078125, 12.09765625, 13.219482421875, 14.34130859375, 15.463134765625, 16.5849609375, 17.706787109375, 18.82861328125, 19.950439453125, 21.072265625, 22.194091796875, 23.31591796875, 24.437744140625, 25.5595703125, 26.681396484375, 27.80322265625, 28.925048828125, 30.046875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [19.0, 846.0, 152.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.61663818359375, -4.067175388336182, 1.4822874069213867, 7.031749725341797, 12.581212997436523, 18.13067626953125, 23.680137634277344, 29.229602813720703, 34.7790641784668, 40.32852554321289, 45.87799072265625, 51.427452087402344, 56.97691345214844, 62.5263786315918, 68.07583618164062, 73.62530517578125, 79.17476654052734, 84.72422790527344, 90.27368927001953, 95.82315063476562, 101.37261962890625, 106.92208099365234, 112.47154235839844, 118.02101135253906, 123.57046508789062, 129.11993408203125, 134.6693878173828, 140.21885681152344, 145.768310546875, 151.31777954101562, 156.86724853515625, 162.4167022705078, 167.96617126464844, 173.51564025878906, 179.06509399414062, 184.61456298828125, 190.1640167236328, 195.71348571777344, 201.262939453125, 206.81240844726562, 212.36187744140625, 217.91134643554688, 223.46080017089844, 229.01026916503906, 234.55972290039062, 240.10919189453125, 245.65866088867188, 251.20811462402344, 256.757568359375, 262.3070373535156, 267.85650634765625, 273.40594482421875, 278.9554138183594, 284.5048828125, 290.0543518066406, 295.60382080078125, 301.1532897949219, 306.7027587890625, 312.2522277832031, 317.8016662597656, 323.35113525390625, 328.9006042480469, 334.4500732421875, 339.9995422363281, 345.5489807128906]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 8.0, 4.0, 7.0, 9.0, 8.0, 9.0, 11.0, 16.0, 23.0, 15.0, 18.0, 13.0, 32.0, 19.0, 31.0, 47.0, 40.0, 35.0, 37.0, 44.0, 40.0, 39.0, 44.0, 33.0, 49.0, 37.0, 37.0, 51.0, 26.0, 34.0, 28.0, 27.0, 24.0, 18.0, 17.0, 23.0, 20.0, 6.0, 4.0, 10.0, 8.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-76.71792602539062, -74.57952880859375, -72.44113159179688, -70.30274200439453, -68.16434478759766, -66.02594757080078, -63.88755416870117, -61.74916076660156, -59.61076354980469, -57.47236633300781, -55.3339729309082, -53.195579528808594, -51.05718231201172, -48.918785095214844, -46.780391693115234, -44.641998291015625, -42.50360107421875, -40.365203857421875, -38.226810455322266, -36.088417053222656, -33.95001983642578, -31.81162452697754, -29.673229217529297, -27.534833908081055, -25.396438598632812, -23.25804328918457, -21.119647979736328, -18.981252670288086, -16.842857360839844, -14.704462051391602, -12.56606674194336, -10.427671432495117, -8.289268493652344, -6.150873184204102, -4.012477874755859, -1.8740825653076172, 0.264312744140625, 2.402708053588867, 4.541103363037109, 6.679498672485352, 8.817893981933594, 10.956289291381836, 13.094684600830078, 15.23307991027832, 17.371475219726562, 19.509870529174805, 21.648265838623047, 23.78666114807129, 25.92505645751953, 28.063451766967773, 30.201847076416016, 32.340240478515625, 34.4786376953125, 36.617034912109375, 38.755428314208984, 40.893821716308594, 43.03221893310547, 45.170616149902344, 47.30900955200195, 49.44740295410156, 51.58580017089844, 53.72419738769531, 55.86259078979492, 58.00098419189453, 60.139381408691406]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 10.0, 11.0, 9.0, 16.0, 13.0, 15.0, 34.0, 17.0, 28.0, 32.0, 29.0, 43.0, 36.0, 45.0, 39.0, 45.0, 42.0, 49.0, 58.0, 52.0, 46.0, 39.0, 33.0, 46.0, 33.0, 27.0, 29.0, 26.0, 17.0, 20.0, 13.0, 8.0, 8.0, 11.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.171875, -5.96710205078125, -5.7623291015625, -5.55755615234375, -5.352783203125, -5.14801025390625, -4.9432373046875, -4.73846435546875, -4.53369140625, -4.32891845703125, -4.1241455078125, -3.91937255859375, -3.714599609375, -3.50982666015625, -3.3050537109375, -3.10028076171875, -2.8955078125, -2.69073486328125, -2.4859619140625, -2.28118896484375, -2.076416015625, -1.87164306640625, -1.6668701171875, -1.46209716796875, -1.25732421875, -1.05255126953125, -0.8477783203125, -0.64300537109375, -0.438232421875, -0.23345947265625, -0.0286865234375, 0.17608642578125, 0.380859375, 0.58563232421875, 0.7904052734375, 0.99517822265625, 1.199951171875, 1.40472412109375, 1.6094970703125, 1.81427001953125, 2.01904296875, 2.22381591796875, 2.4285888671875, 2.63336181640625, 2.838134765625, 3.04290771484375, 3.2476806640625, 3.45245361328125, 3.6572265625, 3.86199951171875, 4.0667724609375, 4.27154541015625, 4.476318359375, 4.68109130859375, 4.8858642578125, 5.09063720703125, 5.29541015625, 5.50018310546875, 5.7049560546875, 5.90972900390625, 6.114501953125, 6.31927490234375, 6.5240478515625, 6.72882080078125, 6.93359375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 8.0, 14.0, 18.0, 17.0, 18.0, 28.0, 19.0, 26.0, 33.0, 29.0, 49.0, 44.0, 128.0, 695.0, 17168.0, 3430917.0, 740289.0, 4115.0, 262.0, 80.0, 42.0, 28.0, 42.0, 32.0, 41.0, 25.0, 22.0, 20.0, 15.0, 7.0, 10.0, 8.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.28125, -38.0068359375, -36.732421875, -35.4580078125, -34.18359375, -32.9091796875, -31.634765625, -30.3603515625, -29.0859375, -27.8115234375, -26.537109375, -25.2626953125, -23.98828125, -22.7138671875, -21.439453125, -20.1650390625, -18.890625, -17.6162109375, -16.341796875, -15.0673828125, -13.79296875, -12.5185546875, -11.244140625, -9.9697265625, -8.6953125, -7.4208984375, -6.146484375, -4.8720703125, -3.59765625, -2.3232421875, -1.048828125, 0.2255859375, 1.5, 2.7744140625, 4.048828125, 5.3232421875, 6.59765625, 7.8720703125, 9.146484375, 10.4208984375, 11.6953125, 12.9697265625, 14.244140625, 15.5185546875, 16.79296875, 18.0673828125, 19.341796875, 20.6162109375, 21.890625, 23.1650390625, 24.439453125, 25.7138671875, 26.98828125, 28.2626953125, 29.537109375, 30.8115234375, 32.0859375, 33.3603515625, 34.634765625, 35.9091796875, 37.18359375, 38.4580078125, 39.732421875, 41.0068359375, 42.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 11.0, 16.0, 24.0, 38.0, 51.0, 72.0, 134.0, 222.0, 334.0, 511.0, 763.0, 662.0, 463.0, 308.0, 182.0, 111.0, 56.0, 42.0, 34.0, 23.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-38.75, -37.92236328125, -37.0947265625, -36.26708984375, -35.439453125, -34.61181640625, -33.7841796875, -32.95654296875, -32.12890625, -31.30126953125, -30.4736328125, -29.64599609375, -28.818359375, -27.99072265625, -27.1630859375, -26.33544921875, -25.5078125, -24.68017578125, -23.8525390625, -23.02490234375, -22.197265625, -21.36962890625, -20.5419921875, -19.71435546875, -18.88671875, -18.05908203125, -17.2314453125, -16.40380859375, -15.576171875, -14.74853515625, -13.9208984375, -13.09326171875, -12.265625, -11.43798828125, -10.6103515625, -9.78271484375, -8.955078125, -8.12744140625, -7.2998046875, -6.47216796875, -5.64453125, -4.81689453125, -3.9892578125, -3.16162109375, -2.333984375, -1.50634765625, -0.6787109375, 0.14892578125, 0.9765625, 1.80419921875, 2.6318359375, 3.45947265625, 4.287109375, 5.11474609375, 5.9423828125, 6.77001953125, 7.59765625, 8.42529296875, 9.2529296875, 10.08056640625, 10.908203125, 11.73583984375, 12.5634765625, 13.39111328125, 14.21875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 10.0, 8.0, 21.0, 35.0, 53.0, 106.0, 189.0, 256.0, 576.0, 4542.0, 3904237.0, 281852.0, 1420.0, 394.0, 211.0, 141.0, 86.0, 44.0, 36.0, 33.0, 20.0, 6.0, 6.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.0, -41.744140625, -38.48828125, -35.232421875, -31.9765625, -28.720703125, -25.46484375, -22.208984375, -18.953125, -15.697265625, -12.44140625, -9.185546875, -5.9296875, -2.673828125, 0.58203125, 3.837890625, 7.09375, 10.349609375, 13.60546875, 16.861328125, 20.1171875, 23.373046875, 26.62890625, 29.884765625, 33.140625, 36.396484375, 39.65234375, 42.908203125, 46.1640625, 49.419921875, 52.67578125, 55.931640625, 59.1875, 62.443359375, 65.69921875, 68.955078125, 72.2109375, 75.466796875, 78.72265625, 81.978515625, 85.234375, 88.490234375, 91.74609375, 95.001953125, 98.2578125, 101.513671875, 104.76953125, 108.025390625, 111.28125, 114.537109375, 117.79296875, 121.048828125, 124.3046875, 127.560546875, 130.81640625, 134.072265625, 137.328125, 140.583984375, 143.83984375, 147.095703125, 150.3515625, 153.607421875, 156.86328125, 160.119140625, 163.375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 12.0, 52.0, 155.0, 306.0, 292.0, 130.0, 50.0, 13.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-261.0731201171875, -256.14556884765625, -251.21800231933594, -246.2904510498047, -241.36289978027344, -236.4353485107422, -231.50778198242188, -226.58023071289062, -221.65267944335938, -216.72512817382812, -211.7975616455078, -206.87001037597656, -201.9424591064453, -197.01490783691406, -192.08734130859375, -187.1597900390625, -182.23223876953125, -177.3046875, -172.3771209716797, -167.44956970214844, -162.5220184326172, -157.59446716308594, -152.66690063476562, -147.73934936523438, -142.81178283691406, -137.8842315673828, -132.9566650390625, -128.02911376953125, -123.1015625, -118.17400360107422, -113.24644470214844, -108.31889343261719, -103.39134216308594, -98.46378326416016, -93.5362319946289, -88.60867309570312, -83.68112182617188, -78.7535629272461, -73.82600402832031, -68.89845275878906, -63.97089767456055, -59.04334259033203, -54.115787506103516, -49.188232421875, -44.26067352294922, -39.33312225341797, -34.40556335449219, -29.478008270263672, -24.550453186035156, -19.62289810180664, -14.695342063903809, -9.767786026000977, -4.840230941772461, 0.08732414245605469, 5.014881134033203, 9.942436218261719, 14.869991302490234, 19.79754638671875, 24.725101470947266, 29.652658462524414, 34.58021545410156, 39.50776672363281, 44.435325622558594, 49.36288070678711, 54.290435791015625]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 10.0, 7.0, 6.0, 7.0, 9.0, 10.0, 20.0, 15.0, 17.0, 27.0, 25.0, 29.0, 34.0, 31.0, 36.0, 38.0, 45.0, 46.0, 45.0, 40.0, 40.0, 47.0, 33.0, 42.0, 43.0, 35.0, 39.0, 35.0, 30.0, 20.0, 12.0, 31.0, 16.0, 20.0, 16.0, 9.0, 10.0, 10.0, 5.0, 8.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.0679931640625, -53.16908645629883, -51.27018356323242, -49.37127685546875, -47.472373962402344, -45.57346725463867, -43.674560546875, -41.775657653808594, -39.87675476074219, -37.977848052978516, -36.07894515991211, -34.18003845214844, -32.28113555908203, -30.38222885131836, -28.48332405090332, -26.58441925048828, -24.68551254272461, -22.78660774230957, -20.88770294189453, -18.98879623413086, -17.089893341064453, -15.190987586975098, -13.292081832885742, -11.393177032470703, -9.494272232055664, -7.595367431640625, -5.696462154388428, -3.7975568771362305, -1.8986520767211914, 0.00025272369384765625, 1.8991584777832031, 3.798063278198242, 5.696968078613281, 7.59587287902832, 9.49477767944336, 11.393683433532715, 13.292588233947754, 15.191493034362793, 17.09039878845215, 18.989303588867188, 20.888208389282227, 22.787113189697266, 24.686017990112305, 26.584922790527344, 28.483829498291016, 30.382732391357422, 32.281639099121094, 34.1805419921875, 36.07944869995117, 37.978355407714844, 39.87725830078125, 41.77616500854492, 43.67506790161133, 45.573974609375, 47.472877502441406, 49.37178421020508, 51.27069091796875, 53.16959762573242, 55.06850051879883, 56.9674072265625, 58.866310119628906, 60.76521682739258, 62.66412353515625, 64.56302642822266, 66.46192932128906]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 12.0, 15.0, 14.0, 14.0, 11.0, 20.0, 33.0, 24.0, 22.0, 26.0, 37.0, 33.0, 41.0, 39.0, 39.0, 43.0, 34.0, 45.0, 46.0, 55.0, 46.0, 43.0, 41.0, 33.0, 30.0, 26.0, 23.0, 26.0, 23.0, 16.0, 19.0, 19.0, 8.0, 6.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.64495849609375, -5.4500732421875, -5.25518798828125, -5.060302734375, -4.86541748046875, -4.6705322265625, -4.47564697265625, -4.28076171875, -4.08587646484375, -3.8909912109375, -3.69610595703125, -3.501220703125, -3.30633544921875, -3.1114501953125, -2.91656494140625, -2.7216796875, -2.52679443359375, -2.3319091796875, -2.13702392578125, -1.942138671875, -1.74725341796875, -1.5523681640625, -1.35748291015625, -1.16259765625, -0.96771240234375, -0.7728271484375, -0.57794189453125, -0.383056640625, -0.18817138671875, 0.0067138671875, 0.20159912109375, 0.396484375, 0.59136962890625, 0.7862548828125, 0.98114013671875, 1.176025390625, 1.37091064453125, 1.5657958984375, 1.76068115234375, 1.95556640625, 2.15045166015625, 2.3453369140625, 2.54022216796875, 2.735107421875, 2.92999267578125, 3.1248779296875, 3.31976318359375, 3.5146484375, 3.70953369140625, 3.9044189453125, 4.09930419921875, 4.294189453125, 4.48907470703125, 4.6839599609375, 4.87884521484375, 5.07373046875, 5.26861572265625, 5.4635009765625, 5.65838623046875, 5.853271484375, 6.04815673828125, 6.2430419921875, 6.43792724609375, 6.6328125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 7.0, 8.0, 10.0, 18.0, 24.0, 59.0, 93.0, 157.0, 210.0, 310.0, 542.0, 892.0, 1488.0, 2488.0, 4343.0, 7467.0, 12771.0, 23088.0, 41299.0, 74690.0, 137901.0, 242062.0, 223268.0, 122775.0, 66783.0, 36434.0, 21030.0, 11919.0, 6722.0, 3880.0, 2323.0, 1384.0, 814.0, 515.0, 286.0, 188.0, 111.0, 60.0, 49.0, 29.0, 21.0, 18.0, 12.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1513671875, -1.1183853149414062, -1.0854034423828125, -1.0524215698242188, -1.019439697265625, -0.9864578247070312, -0.9534759521484375, -0.9204940795898438, -0.88751220703125, -0.8545303344726562, -0.8215484619140625, -0.7885665893554688, -0.755584716796875, -0.7226028442382812, -0.6896209716796875, -0.6566390991210938, -0.6236572265625, -0.5906753540039062, -0.5576934814453125, -0.5247116088867188, -0.491729736328125, -0.45874786376953125, -0.4257659912109375, -0.39278411865234375, -0.35980224609375, -0.32682037353515625, -0.2938385009765625, -0.26085662841796875, -0.227874755859375, -0.19489288330078125, -0.1619110107421875, -0.12892913818359375, -0.095947265625, -0.06296539306640625, -0.0299835205078125, 0.00299835205078125, 0.035980224609375, 0.06896209716796875, 0.1019439697265625, 0.13492584228515625, 0.16790771484375, 0.20088958740234375, 0.2338714599609375, 0.26685333251953125, 0.299835205078125, 0.33281707763671875, 0.3657989501953125, 0.39878082275390625, 0.4317626953125, 0.46474456787109375, 0.4977264404296875, 0.5307083129882812, 0.563690185546875, 0.5966720581054688, 0.6296539306640625, 0.6626358032226562, 0.69561767578125, 0.7285995483398438, 0.7615814208984375, 0.7945632934570312, 0.827545166015625, 0.8605270385742188, 0.8935089111328125, 0.9264907836914062, 0.95947265625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 4.0, 5.0, 10.0, 12.0, 12.0, 11.0, 18.0, 23.0, 22.0, 35.0, 25.0, 27.0, 28.0, 34.0, 35.0, 39.0, 43.0, 41.0, 42.0, 1066.0, 37.0, 42.0, 46.0, 47.0, 34.0, 45.0, 29.0, 28.0, 24.0, 24.0, 20.0, 8.0, 15.0, 12.0, 13.0, 9.0, 11.0, 10.0, 10.0, 6.0, 2.0, 5.0, 2.0, 7.0, 4.0, 1.0], "bins": [-4.39453125, -4.27777099609375, -4.1610107421875, -4.04425048828125, -3.927490234375, -3.81072998046875, -3.6939697265625, -3.57720947265625, -3.46044921875, -3.34368896484375, -3.2269287109375, -3.11016845703125, -2.993408203125, -2.87664794921875, -2.7598876953125, -2.64312744140625, -2.5263671875, -2.40960693359375, -2.2928466796875, -2.17608642578125, -2.059326171875, -1.94256591796875, -1.8258056640625, -1.70904541015625, -1.59228515625, -1.47552490234375, -1.3587646484375, -1.24200439453125, -1.125244140625, -1.00848388671875, -0.8917236328125, -0.77496337890625, -0.658203125, -0.54144287109375, -0.4246826171875, -0.30792236328125, -0.191162109375, -0.07440185546875, 0.0423583984375, 0.15911865234375, 0.27587890625, 0.39263916015625, 0.5093994140625, 0.62615966796875, 0.742919921875, 0.85968017578125, 0.9764404296875, 1.09320068359375, 1.2099609375, 1.32672119140625, 1.4434814453125, 1.56024169921875, 1.677001953125, 1.79376220703125, 1.9105224609375, 2.02728271484375, 2.14404296875, 2.26080322265625, 2.3775634765625, 2.49432373046875, 2.611083984375, 2.72784423828125, 2.8446044921875, 2.96136474609375, 3.078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 13.0, 9.0, 9.0, 26.0, 34.0, 45.0, 87.0, 133.0, 196.0, 328.0, 517.0, 799.0, 1169.0, 1949.0, 3048.0, 4881.0, 7780.0, 12343.0, 20200.0, 33590.0, 55066.0, 92722.0, 158816.0, 1281879.0, 170331.0, 99590.0, 58753.0, 35364.0, 21679.0, 13362.0, 8288.0, 5202.0, 3226.0, 1993.0, 1375.0, 850.0, 520.0, 339.0, 224.0, 129.0, 110.0, 52.0, 44.0, 26.0, 9.0, 16.0, 7.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.89453125, -0.86865234375, -0.8427734375, -0.81689453125, -0.791015625, -0.76513671875, -0.7392578125, -0.71337890625, -0.6875, -0.66162109375, -0.6357421875, -0.60986328125, -0.583984375, -0.55810546875, -0.5322265625, -0.50634765625, -0.48046875, -0.45458984375, -0.4287109375, -0.40283203125, -0.376953125, -0.35107421875, -0.3251953125, -0.29931640625, -0.2734375, -0.24755859375, -0.2216796875, -0.19580078125, -0.169921875, -0.14404296875, -0.1181640625, -0.09228515625, -0.06640625, -0.04052734375, -0.0146484375, 0.01123046875, 0.037109375, 0.06298828125, 0.0888671875, 0.11474609375, 0.140625, 0.16650390625, 0.1923828125, 0.21826171875, 0.244140625, 0.27001953125, 0.2958984375, 0.32177734375, 0.34765625, 0.37353515625, 0.3994140625, 0.42529296875, 0.451171875, 0.47705078125, 0.5029296875, 0.52880859375, 0.5546875, 0.58056640625, 0.6064453125, 0.63232421875, 0.658203125, 0.68408203125, 0.7099609375, 0.73583984375, 0.76171875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 4.0, 7.0, 6.0, 11.0, 10.0, 20.0, 23.0, 26.0, 28.0, 22.0, 29.0, 36.0, 38.0, 37.0, 50.0, 46.0, 67.0, 56.0, 50.0, 46.0, 47.0, 39.0, 40.0, 55.0, 30.0, 35.0, 23.0, 27.0, 21.0, 13.0, 12.0, 11.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0009469985961914062, -0.0009155869483947754, -0.0008841753005981445, -0.0008527636528015137, -0.0008213520050048828, -0.000789940357208252, -0.0007585287094116211, -0.0007271170616149902, -0.0006957054138183594, -0.0006642937660217285, -0.0006328821182250977, -0.0006014704704284668, -0.0005700588226318359, -0.0005386471748352051, -0.0005072355270385742, -0.00047582387924194336, -0.0004444122314453125, -0.00041300058364868164, -0.0003815889358520508, -0.0003501772880554199, -0.00031876564025878906, -0.0002873539924621582, -0.00025594234466552734, -0.00022453069686889648, -0.00019311904907226562, -0.00016170740127563477, -0.0001302957534790039, -9.888410568237305e-05, -6.747245788574219e-05, -3.606081008911133e-05, -4.649162292480469e-06, 2.676248550415039e-05, 5.817413330078125e-05, 8.958578109741211e-05, 0.00012099742889404297, 0.00015240907669067383, 0.0001838207244873047, 0.00021523237228393555, 0.0002466440200805664, 0.00027805566787719727, 0.0003094673156738281, 0.000340878963470459, 0.00037229061126708984, 0.0004037022590637207, 0.00043511390686035156, 0.0004665255546569824, 0.0004979372024536133, 0.0005293488502502441, 0.000560760498046875, 0.0005921721458435059, 0.0006235837936401367, 0.0006549954414367676, 0.0006864070892333984, 0.0007178187370300293, 0.0007492303848266602, 0.000780642032623291, 0.0008120536804199219, 0.0008434653282165527, 0.0008748769760131836, 0.0009062886238098145, 0.0009377002716064453, 0.0009691119194030762, 0.001000523567199707, 0.0010319352149963379, 0.0010633468627929688]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 7.0, 2.0, 2.0, 2.0, 10.0, 7.0, 7.0, 14.0, 12.0, 39.0, 46.0, 57.0, 73.0, 126.0, 194.0, 331.0, 587.0, 6652.0, 1035684.0, 3267.0, 566.0, 301.0, 178.0, 94.0, 58.0, 56.0, 48.0, 22.0, 25.0, 29.0, 15.0, 13.0, 8.0, 7.0, 6.0, 1.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02850341796875, -0.027624845504760742, -0.026746273040771484, -0.025867700576782227, -0.02498912811279297, -0.02411055564880371, -0.023231983184814453, -0.022353410720825195, -0.021474838256835938, -0.02059626579284668, -0.019717693328857422, -0.018839120864868164, -0.017960548400878906, -0.01708197593688965, -0.01620340347290039, -0.015324831008911133, -0.014446258544921875, -0.013567686080932617, -0.01268911361694336, -0.011810541152954102, -0.010931968688964844, -0.010053396224975586, -0.009174823760986328, -0.00829625129699707, -0.0074176788330078125, -0.006539106369018555, -0.005660533905029297, -0.004781961441040039, -0.0039033889770507812, -0.0030248165130615234, -0.0021462440490722656, -0.0012676715850830078, -0.00038909912109375, 0.0004894733428955078, 0.0013680458068847656, 0.0022466182708740234, 0.0031251907348632812, 0.004003763198852539, 0.004882335662841797, 0.005760908126831055, 0.0066394805908203125, 0.00751805305480957, 0.008396625518798828, 0.009275197982788086, 0.010153770446777344, 0.011032342910766602, 0.01191091537475586, 0.012789487838745117, 0.013668060302734375, 0.014546632766723633, 0.01542520523071289, 0.01630377769470215, 0.017182350158691406, 0.018060922622680664, 0.018939495086669922, 0.01981806755065918, 0.020696640014648438, 0.021575212478637695, 0.022453784942626953, 0.02333235740661621, 0.02421092987060547, 0.025089502334594727, 0.025968074798583984, 0.026846647262573242, 0.0277252197265625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 48.0, 252.0, 519.0, 172.0, 14.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001175920944660902, -0.0010878217872232199, -0.000999722513370216, -0.0009116233559325337, -0.0008235241402871907, -0.0007354249246418476, -0.0006473257672041655, -0.0005592265515588224, -0.00047112733591347933, -0.00038302812026813626, -0.00029492893372662365, -0.00020682974718511105, -0.00011873053153976798, -3.0631315894424915e-05, 5.7467841543257236e-05, 0.0001455670571886003, 0.00023366627283394337, 0.00032176548847928643, 0.00040986467502079904, 0.0004979638615623116, 0.0005860630772076547, 0.0006741622928529978, 0.0007622614502906799, 0.000850360665936023, 0.0009384598815813661, 0.0010265590390190482, 0.0011146583128720522, 0.0012027574703097343, 0.0012908566277474165, 0.0013789559016004205, 0.0014670550590381026, 0.0015551543328911066, 0.0016432534903287888, 0.001731352647766471, 0.0018194519216194749, 0.001907551079057157, 0.001995650352910161, 0.002083749510347843, 0.0021718486677855253, 0.0022599478252232075, 0.0023480472154915333, 0.0024361463729292154, 0.0025242455303668976, 0.0026123449206352234, 0.0027004440780729055, 0.0027885432355105877, 0.00287664239294827, 0.002964741550385952, 0.003052840707823634, 0.0031409398652613163, 0.0032290390226989985, 0.0033171381801366806, 0.0034052375704050064, 0.0034933367278426886, 0.0035814358852803707, 0.003669535042718053, 0.003757634200155735, 0.003845733357593417, 0.003933832515031099, 0.004021931905299425, 0.004110030829906464, 0.004198130220174789, 0.004286229610443115, 0.004374328535050154, 0.0044624279253184795]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 6.0, 3.0, 4.0, 12.0, 13.0, 11.0, 14.0, 12.0, 18.0, 16.0, 26.0, 19.0, 31.0, 23.0, 34.0, 30.0, 29.0, 34.0, 27.0, 48.0, 34.0, 33.0, 38.0, 31.0, 46.0, 41.0, 46.0, 30.0, 32.0, 30.0, 29.0, 24.0, 27.0, 28.0, 22.0, 17.0, 11.0, 16.0, 8.0, 9.0, 10.0, 7.0, 4.0, 11.0, 1.0, 7.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0005563497543334961, -0.0005402639508247375, -0.000524178147315979, -0.0005080923438072205, -0.0004920065402984619, -0.00047592073678970337, -0.0004598349332809448, -0.0004437491297721863, -0.00042766332626342773, -0.0004115775227546692, -0.00039549171924591064, -0.0003794059157371521, -0.00036332011222839355, -0.000347234308719635, -0.00033114850521087646, -0.0003150627017021179, -0.0002989768981933594, -0.00028289109468460083, -0.0002668052911758423, -0.00025071948766708374, -0.0002346336841583252, -0.00021854788064956665, -0.0002024620771408081, -0.00018637627363204956, -0.00017029047012329102, -0.00015420466661453247, -0.00013811886310577393, -0.00012203305959701538, -0.00010594725608825684, -8.986145257949829e-05, -7.377564907073975e-05, -5.76898455619812e-05, -4.1604042053222656e-05, -2.551823854446411e-05, -9.432435035705566e-06, 6.6533684730529785e-06, 2.2739171981811523e-05, 3.882497549057007e-05, 5.491077899932861e-05, 7.099658250808716e-05, 8.70823860168457e-05, 0.00010316818952560425, 0.00011925399303436279, 0.00013533979654312134, 0.00015142560005187988, 0.00016751140356063843, 0.00018359720706939697, 0.00019968301057815552, 0.00021576881408691406, 0.0002318546175956726, 0.00024794042110443115, 0.0002640262246131897, 0.00028011202812194824, 0.0002961978316307068, 0.00031228363513946533, 0.0003283694386482239, 0.0003444552421569824, 0.00036054104566574097, 0.0003766268491744995, 0.00039271265268325806, 0.0004087984561920166, 0.00042488425970077515, 0.0004409700632095337, 0.00045705586671829224, 0.0004731416702270508]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 1.0, 5.0, 8.0, 12.0, 15.0, 14.0, 14.0, 11.0, 20.0, 33.0, 24.0, 22.0, 26.0, 37.0, 33.0, 41.0, 39.0, 39.0, 43.0, 34.0, 45.0, 46.0, 55.0, 46.0, 43.0, 41.0, 33.0, 30.0, 26.0, 23.0, 26.0, 23.0, 16.0, 19.0, 19.0, 8.0, 6.0, 4.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83984375, -5.64495849609375, -5.4500732421875, -5.25518798828125, -5.060302734375, -4.86541748046875, -4.6705322265625, -4.47564697265625, -4.28076171875, -4.08587646484375, -3.8909912109375, -3.69610595703125, -3.501220703125, -3.30633544921875, -3.1114501953125, -2.91656494140625, -2.7216796875, -2.52679443359375, -2.3319091796875, -2.13702392578125, -1.942138671875, -1.74725341796875, -1.5523681640625, -1.35748291015625, -1.16259765625, -0.96771240234375, -0.7728271484375, -0.57794189453125, -0.383056640625, -0.18817138671875, 0.0067138671875, 0.20159912109375, 0.396484375, 0.59136962890625, 0.7862548828125, 0.98114013671875, 1.176025390625, 1.37091064453125, 1.5657958984375, 1.76068115234375, 1.95556640625, 2.15045166015625, 2.3453369140625, 2.54022216796875, 2.735107421875, 2.92999267578125, 3.1248779296875, 3.31976318359375, 3.5146484375, 3.70953369140625, 3.9044189453125, 4.09930419921875, 4.294189453125, 4.48907470703125, 4.6839599609375, 4.87884521484375, 5.07373046875, 5.26861572265625, 5.4635009765625, 5.65838623046875, 5.853271484375, 6.04815673828125, 6.2430419921875, 6.43792724609375, 6.6328125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 7.0, 10.0, 6.0, 11.0, 9.0, 22.0, 29.0, 45.0, 51.0, 81.0, 106.0, 166.0, 228.0, 348.0, 548.0, 910.0, 1476.0, 2709.0, 5431.0, 12255.0, 30655.0, 104704.0, 471814.0, 307115.0, 67895.0, 22397.0, 9278.0, 4458.0, 2206.0, 1284.0, 737.0, 517.0, 293.0, 205.0, 172.0, 114.0, 66.0, 56.0, 40.0, 28.0, 21.0, 18.0, 12.0, 13.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.35546875, -4.21868896484375, -4.0819091796875, -3.94512939453125, -3.808349609375, -3.67156982421875, -3.5347900390625, -3.39801025390625, -3.26123046875, -3.12445068359375, -2.9876708984375, -2.85089111328125, -2.714111328125, -2.57733154296875, -2.4405517578125, -2.30377197265625, -2.1669921875, -2.03021240234375, -1.8934326171875, -1.75665283203125, -1.619873046875, -1.48309326171875, -1.3463134765625, -1.20953369140625, -1.07275390625, -0.93597412109375, -0.7991943359375, -0.66241455078125, -0.525634765625, -0.38885498046875, -0.2520751953125, -0.11529541015625, 0.021484375, 0.15826416015625, 0.2950439453125, 0.43182373046875, 0.568603515625, 0.70538330078125, 0.8421630859375, 0.97894287109375, 1.11572265625, 1.25250244140625, 1.3892822265625, 1.52606201171875, 1.662841796875, 1.79962158203125, 1.9364013671875, 2.07318115234375, 2.2099609375, 2.34674072265625, 2.4835205078125, 2.62030029296875, 2.757080078125, 2.89385986328125, 3.0306396484375, 3.16741943359375, 3.30419921875, 3.44097900390625, 3.5777587890625, 3.71453857421875, 3.851318359375, 3.98809814453125, 4.1248779296875, 4.26165771484375, 4.3984375]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 8.0, 3.0, 5.0, 10.0, 8.0, 9.0, 20.0, 22.0, 20.0, 22.0, 26.0, 36.0, 36.0, 45.0, 32.0, 55.0, 60.0, 67.0, 162.0, 1857.0, 119.0, 55.0, 43.0, 37.0, 45.0, 40.0, 34.0, 37.0, 23.0, 23.0, 21.0, 12.0, 11.0, 14.0, 9.0, 10.0, 4.0, 4.0, 6.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -24.251953125, -23.56640625, -22.880859375, -22.1953125, -21.509765625, -20.82421875, -20.138671875, -19.453125, -18.767578125, -18.08203125, -17.396484375, -16.7109375, -16.025390625, -15.33984375, -14.654296875, -13.96875, -13.283203125, -12.59765625, -11.912109375, -11.2265625, -10.541015625, -9.85546875, -9.169921875, -8.484375, -7.798828125, -7.11328125, -6.427734375, -5.7421875, -5.056640625, -4.37109375, -3.685546875, -3.0, -2.314453125, -1.62890625, -0.943359375, -0.2578125, 0.427734375, 1.11328125, 1.798828125, 2.484375, 3.169921875, 3.85546875, 4.541015625, 5.2265625, 5.912109375, 6.59765625, 7.283203125, 7.96875, 8.654296875, 9.33984375, 10.025390625, 10.7109375, 11.396484375, 12.08203125, 12.767578125, 13.453125, 14.138671875, 14.82421875, 15.509765625, 16.1953125, 16.880859375, 17.56640625, 18.251953125, 18.9375]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 6.0, 6.0, 7.0, 9.0, 13.0, 10.0, 10.0, 20.0, 18.0, 22.0, 38.0, 42.0, 58.0, 88.0, 111.0, 149.0, 274.0, 659.0, 3229.0, 267982.0, 2865153.0, 5869.0, 880.0, 370.0, 209.0, 114.0, 72.0, 56.0, 41.0, 29.0, 29.0, 26.0, 20.0, 19.0, 19.0, 9.0, 10.0, 7.0, 4.0, 2.0, 8.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.65625, -28.6376953125, -27.619140625, -26.6005859375, -25.58203125, -24.5634765625, -23.544921875, -22.5263671875, -21.5078125, -20.4892578125, -19.470703125, -18.4521484375, -17.43359375, -16.4150390625, -15.396484375, -14.3779296875, -13.359375, -12.3408203125, -11.322265625, -10.3037109375, -9.28515625, -8.2666015625, -7.248046875, -6.2294921875, -5.2109375, -4.1923828125, -3.173828125, -2.1552734375, -1.13671875, -0.1181640625, 0.900390625, 1.9189453125, 2.9375, 3.9560546875, 4.974609375, 5.9931640625, 7.01171875, 8.0302734375, 9.048828125, 10.0673828125, 11.0859375, 12.1044921875, 13.123046875, 14.1416015625, 15.16015625, 16.1787109375, 17.197265625, 18.2158203125, 19.234375, 20.2529296875, 21.271484375, 22.2900390625, 23.30859375, 24.3271484375, 25.345703125, 26.3642578125, 27.3828125, 28.4013671875, 29.419921875, 30.4384765625, 31.45703125, 32.4755859375, 33.494140625, 34.5126953125, 35.53125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 39.0, 641.0, 324.0, 10.0], "bins": [-212.79217529296875, -209.34825134277344, -205.90432739257812, -202.46038818359375, -199.01646423339844, -195.57254028320312, -192.1286163330078, -188.6846923828125, -185.24075317382812, -181.7968292236328, -178.3529052734375, -174.90896606445312, -171.4650421142578, -168.0211181640625, -164.5771942138672, -161.13327026367188, -157.6893310546875, -154.2454071044922, -150.80148315429688, -147.3575439453125, -143.9136199951172, -140.46969604492188, -137.02577209472656, -133.58184814453125, -130.13792419433594, -126.69400024414062, -123.25006866455078, -119.80614471435547, -116.36221313476562, -112.91828918457031, -109.474365234375, -106.03043365478516, -102.58650207519531, -99.142578125, -95.69864654541016, -92.25472259521484, -88.810791015625, -85.36686706542969, -81.92294311523438, -78.47901153564453, -75.03507995605469, -71.59115600585938, -68.14722442626953, -64.70330047607422, -61.259368896484375, -57.81544494628906, -54.371517181396484, -50.927589416503906, -47.48366165161133, -44.03973388671875, -40.59580612182617, -37.151878356933594, -33.70795440673828, -30.26402473449707, -26.820098876953125, -23.376171112060547, -19.93224334716797, -16.48831558227539, -13.044388771057129, -9.600461959838867, -6.156534194946289, -2.712606430053711, 0.7313194274902344, 4.1752471923828125, 7.619174003601074]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 3.0, 6.0, 7.0, 12.0, 7.0, 11.0, 16.0, 25.0, 17.0, 15.0, 21.0, 21.0, 27.0, 28.0, 27.0, 28.0, 42.0, 42.0, 45.0, 37.0, 43.0, 26.0, 31.0, 30.0, 30.0, 34.0, 32.0, 34.0, 30.0, 20.0, 31.0, 26.0, 26.0, 23.0, 20.0, 19.0, 21.0, 17.0, 10.0, 14.0, 8.0, 6.0, 5.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0], "bins": [-63.172271728515625, -61.31330871582031, -59.454345703125, -57.59538269042969, -55.736419677734375, -53.87745666503906, -52.01849365234375, -50.15953063964844, -48.300567626953125, -46.44160461425781, -44.5826416015625, -42.72367858886719, -40.864715576171875, -39.00575256347656, -37.14678955078125, -35.28782653808594, -33.42886734008789, -31.569904327392578, -29.710941314697266, -27.851978302001953, -25.99301528930664, -24.134052276611328, -22.27509117126465, -20.416128158569336, -18.557165145874023, -16.69820213317871, -14.839239120483398, -12.980277061462402, -11.12131404876709, -9.262351036071777, -7.403388977050781, -5.544425964355469, -3.685466766357422, -1.8265039920806885, 0.03245878219604492, 1.8914213180541992, 3.7503843307495117, 5.609347343444824, 7.46830940246582, 9.327272415161133, 11.186235427856445, 13.045198440551758, 14.90416145324707, 16.76312255859375, 18.622085571289062, 20.481048583984375, 22.340011596679688, 24.198974609375, 26.057937622070312, 27.916900634765625, 29.775863647460938, 31.63482666015625, 33.49378967285156, 35.352752685546875, 37.21171569824219, 39.0706787109375, 40.92964172363281, 42.788604736328125, 44.64756774902344, 46.50653076171875, 48.36549377441406, 50.224456787109375, 52.08341979980469, 53.9423828125, 55.80134201049805]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 15.0, 13.0, 13.0, 15.0, 20.0, 20.0, 31.0, 22.0, 27.0, 38.0, 40.0, 34.0, 43.0, 39.0, 37.0, 36.0, 45.0, 58.0, 45.0, 49.0, 47.0, 38.0, 34.0, 34.0, 22.0, 26.0, 17.0, 22.0, 21.0, 15.0, 18.0, 15.0, 4.0, 7.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0390625, -5.8382568359375, -5.637451171875, -5.4366455078125, -5.23583984375, -5.0350341796875, -4.834228515625, -4.6334228515625, -4.4326171875, -4.2318115234375, -4.031005859375, -3.8302001953125, -3.62939453125, -3.4285888671875, -3.227783203125, -3.0269775390625, -2.826171875, -2.6253662109375, -2.424560546875, -2.2237548828125, -2.02294921875, -1.8221435546875, -1.621337890625, -1.4205322265625, -1.2197265625, -1.0189208984375, -0.818115234375, -0.6173095703125, -0.41650390625, -0.2156982421875, -0.014892578125, 0.1859130859375, 0.38671875, 0.5875244140625, 0.788330078125, 0.9891357421875, 1.18994140625, 1.3907470703125, 1.591552734375, 1.7923583984375, 1.9931640625, 2.1939697265625, 2.394775390625, 2.5955810546875, 2.79638671875, 2.9971923828125, 3.197998046875, 3.3988037109375, 3.599609375, 3.8004150390625, 4.001220703125, 4.2020263671875, 4.40283203125, 4.6036376953125, 4.804443359375, 5.0052490234375, 5.2060546875, 5.4068603515625, 5.607666015625, 5.8084716796875, 6.00927734375, 6.2100830078125, 6.410888671875, 6.6116943359375, 6.8125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 7.0, 7.0, 5.0, 14.0, 11.0, 16.0, 20.0, 21.0, 26.0, 56.0, 80.0, 164.0, 309.0, 621.0, 1497.0, 4457.0, 16046.0, 82897.0, 729731.0, 2446273.0, 794242.0, 94145.0, 16699.0, 4306.0, 1391.0, 536.0, 283.0, 133.0, 80.0, 54.0, 32.0, 22.0, 25.0, 20.0, 16.0, 12.0, 6.0, 7.0, 2.0, 8.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.899169921875, -11.50927734375, -11.119384765625, -10.7294921875, -10.339599609375, -9.94970703125, -9.559814453125, -9.169921875, -8.780029296875, -8.39013671875, -8.000244140625, -7.6103515625, -7.220458984375, -6.83056640625, -6.440673828125, -6.05078125, -5.660888671875, -5.27099609375, -4.881103515625, -4.4912109375, -4.101318359375, -3.71142578125, -3.321533203125, -2.931640625, -2.541748046875, -2.15185546875, -1.761962890625, -1.3720703125, -0.982177734375, -0.59228515625, -0.202392578125, 0.1875, 0.577392578125, 0.96728515625, 1.357177734375, 1.7470703125, 2.136962890625, 2.52685546875, 2.916748046875, 3.306640625, 3.696533203125, 4.08642578125, 4.476318359375, 4.8662109375, 5.256103515625, 5.64599609375, 6.035888671875, 6.42578125, 6.815673828125, 7.20556640625, 7.595458984375, 7.9853515625, 8.375244140625, 8.76513671875, 9.155029296875, 9.544921875, 9.934814453125, 10.32470703125, 10.714599609375, 11.1044921875, 11.494384765625, 11.88427734375, 12.274169921875, 12.6640625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 10.0, 14.0, 21.0, 21.0, 39.0, 50.0, 81.0, 107.0, 139.0, 189.0, 258.0, 420.0, 577.0, 554.0, 478.0, 339.0, 235.0, 143.0, 107.0, 84.0, 63.0, 37.0, 29.0, 22.0, 17.0, 11.0, 8.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.515625, -18.890380859375, -18.26513671875, -17.639892578125, -17.0146484375, -16.389404296875, -15.76416015625, -15.138916015625, -14.513671875, -13.888427734375, -13.26318359375, -12.637939453125, -12.0126953125, -11.387451171875, -10.76220703125, -10.136962890625, -9.51171875, -8.886474609375, -8.26123046875, -7.635986328125, -7.0107421875, -6.385498046875, -5.76025390625, -5.135009765625, -4.509765625, -3.884521484375, -3.25927734375, -2.634033203125, -2.0087890625, -1.383544921875, -0.75830078125, -0.133056640625, 0.4921875, 1.117431640625, 1.74267578125, 2.367919921875, 2.9931640625, 3.618408203125, 4.24365234375, 4.868896484375, 5.494140625, 6.119384765625, 6.74462890625, 7.369873046875, 7.9951171875, 8.620361328125, 9.24560546875, 9.870849609375, 10.49609375, 11.121337890625, 11.74658203125, 12.371826171875, 12.9970703125, 13.622314453125, 14.24755859375, 14.872802734375, 15.498046875, 16.123291015625, 16.74853515625, 17.373779296875, 17.9990234375, 18.624267578125, 19.24951171875, 19.874755859375, 20.5]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 6.0, 2.0, 4.0, 2.0, 7.0, 6.0, 9.0, 11.0, 14.0, 11.0, 17.0, 38.0, 26.0, 40.0, 49.0, 61.0, 73.0, 112.0, 178.0, 250.0, 484.0, 1149.0, 7787.0, 304715.0, 3818826.0, 55206.0, 3285.0, 723.0, 373.0, 216.0, 147.0, 90.0, 78.0, 75.0, 40.0, 36.0, 24.0, 22.0, 28.0, 15.0, 11.0, 9.0, 9.0, 5.0, 5.0, 6.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-49.34375, -47.66015625, -45.9765625, -44.29296875, -42.609375, -40.92578125, -39.2421875, -37.55859375, -35.875, -34.19140625, -32.5078125, -30.82421875, -29.140625, -27.45703125, -25.7734375, -24.08984375, -22.40625, -20.72265625, -19.0390625, -17.35546875, -15.671875, -13.98828125, -12.3046875, -10.62109375, -8.9375, -7.25390625, -5.5703125, -3.88671875, -2.203125, -0.51953125, 1.1640625, 2.84765625, 4.53125, 6.21484375, 7.8984375, 9.58203125, 11.265625, 12.94921875, 14.6328125, 16.31640625, 18.0, 19.68359375, 21.3671875, 23.05078125, 24.734375, 26.41796875, 28.1015625, 29.78515625, 31.46875, 33.15234375, 34.8359375, 36.51953125, 38.203125, 39.88671875, 41.5703125, 43.25390625, 44.9375, 46.62109375, 48.3046875, 49.98828125, 51.671875, 53.35546875, 55.0390625, 56.72265625, 58.40625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 11.0, 21.0, 55.0, 127.0, 174.0, 221.0, 201.0, 108.0, 51.0, 27.0, 11.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.68533325195312, -105.13290405273438, -101.58047485351562, -98.02804565429688, -94.47562408447266, -90.9231948852539, -87.37076568603516, -83.8183364868164, -80.26591491699219, -76.71348571777344, -73.16105651855469, -69.60862731933594, -66.05620574951172, -62.50377655029297, -58.95134735107422, -55.39891815185547, -51.84648895263672, -48.29405975341797, -44.741634368896484, -41.189205169677734, -37.63677978515625, -34.0843505859375, -30.53192138671875, -26.979494094848633, -23.427066802978516, -19.8746395111084, -16.32221221923828, -12.769783020019531, -9.217355728149414, -5.664928436279297, -2.112499237060547, 1.4399280548095703, 4.992362976074219, 8.544790267944336, 12.09721851348877, 15.649646759033203, 19.20207405090332, 22.754501342773438, 26.306930541992188, 29.859357833862305, 33.41178512573242, 36.96421432495117, 40.516639709472656, 44.069068908691406, 47.621498107910156, 51.17392349243164, 54.72635269165039, 58.278778076171875, 61.831207275390625, 65.38363647460938, 68.93606567382812, 72.48849487304688, 76.0409164428711, 79.59334564208984, 83.1457748413086, 86.69820404052734, 90.25062561035156, 93.80305480957031, 97.35548400878906, 100.90791320800781, 104.46033477783203, 108.01276397705078, 111.56519317626953, 115.11762237548828, 118.67005157470703]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 7.0, 1.0, 0.0, 4.0, 7.0, 8.0, 16.0, 16.0, 11.0, 17.0, 12.0, 17.0, 30.0, 24.0, 39.0, 38.0, 38.0, 48.0, 32.0, 49.0, 43.0, 35.0, 43.0, 46.0, 40.0, 42.0, 57.0, 39.0, 32.0, 30.0, 41.0, 19.0, 21.0, 19.0, 21.0, 18.0, 10.0, 9.0, 5.0, 5.0, 3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.154117584228516, -58.234718322753906, -56.31531524658203, -54.39591598510742, -52.47651290893555, -50.55711364746094, -48.63771057128906, -46.71831130981445, -44.798912048339844, -42.879512786865234, -40.96010971069336, -39.04071044921875, -37.121307373046875, -35.201908111572266, -33.282508850097656, -31.36310577392578, -29.443702697753906, -27.524301528930664, -25.604900360107422, -23.685501098632812, -21.766098022460938, -19.846698760986328, -17.927297592163086, -16.007896423339844, -14.088495254516602, -12.16909408569336, -10.249692916870117, -8.330292701721191, -6.410891532897949, -4.491490364074707, -2.5720901489257812, -0.6526889801025391, 1.2667160034179688, 3.186116933822632, 5.105517864227295, 7.024918556213379, 8.944319725036621, 10.863720893859863, 12.783121109008789, 14.702522277832031, 16.621923446655273, 18.541324615478516, 20.460725784301758, 22.380126953125, 24.29952621459961, 26.218929290771484, 28.138328552246094, 30.057729721069336, 31.977130889892578, 33.89653015136719, 35.81593322753906, 37.73533248901367, 39.65473556518555, 41.574134826660156, 43.49353790283203, 45.41293716430664, 47.33233642578125, 49.25173568725586, 51.171138763427734, 53.090538024902344, 55.00994110107422, 56.92934036254883, 58.84873962402344, 60.76814270019531, 62.68754577636719]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 10.0, 4.0, 9.0, 11.0, 13.0, 12.0, 15.0, 16.0, 29.0, 22.0, 27.0, 21.0, 35.0, 41.0, 33.0, 40.0, 46.0, 39.0, 45.0, 51.0, 31.0, 44.0, 52.0, 47.0, 44.0, 34.0, 27.0, 29.0, 35.0, 29.0, 18.0, 20.0, 15.0, 11.0, 10.0, 10.0, 11.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.48150634765625, -6.2755126953125, -6.06951904296875, -5.863525390625, -5.65753173828125, -5.4515380859375, -5.24554443359375, -5.03955078125, -4.83355712890625, -4.6275634765625, -4.42156982421875, -4.215576171875, -4.00958251953125, -3.8035888671875, -3.59759521484375, -3.3916015625, -3.18560791015625, -2.9796142578125, -2.77362060546875, -2.567626953125, -2.36163330078125, -2.1556396484375, -1.94964599609375, -1.74365234375, -1.53765869140625, -1.3316650390625, -1.12567138671875, -0.919677734375, -0.71368408203125, -0.5076904296875, -0.30169677734375, -0.095703125, 0.11029052734375, 0.3162841796875, 0.52227783203125, 0.728271484375, 0.93426513671875, 1.1402587890625, 1.34625244140625, 1.55224609375, 1.75823974609375, 1.9642333984375, 2.17022705078125, 2.376220703125, 2.58221435546875, 2.7882080078125, 2.99420166015625, 3.2001953125, 3.40618896484375, 3.6121826171875, 3.81817626953125, 4.024169921875, 4.23016357421875, 4.4361572265625, 4.64215087890625, 4.84814453125, 5.05413818359375, 5.2601318359375, 5.46612548828125, 5.672119140625, 5.87811279296875, 6.0841064453125, 6.29010009765625, 6.49609375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 10.0, 8.0, 14.0, 16.0, 28.0, 39.0, 47.0, 87.0, 115.0, 150.0, 229.0, 298.0, 493.0, 730.0, 1093.0, 1545.0, 2266.0, 3231.0, 4886.0, 6998.0, 10406.0, 15536.0, 23018.0, 34757.0, 53455.0, 83133.0, 129901.0, 194971.0, 168794.0, 108059.0, 69322.0, 44760.0, 29310.0, 19771.0, 13135.0, 8878.0, 6074.0, 4118.0, 2789.0, 1916.0, 1361.0, 858.0, 622.0, 387.0, 316.0, 184.0, 147.0, 81.0, 74.0, 42.0, 34.0, 24.0, 17.0, 15.0, 4.0, 2.0, 4.0, 4.0], "bins": [-0.85888671875, -0.8334732055664062, -0.8080596923828125, -0.7826461791992188, -0.757232666015625, -0.7318191528320312, -0.7064056396484375, -0.6809921264648438, -0.65557861328125, -0.6301651000976562, -0.6047515869140625, -0.5793380737304688, -0.553924560546875, -0.5285110473632812, -0.5030975341796875, -0.47768402099609375, -0.4522705078125, -0.42685699462890625, -0.4014434814453125, -0.37602996826171875, -0.350616455078125, -0.32520294189453125, -0.2997894287109375, -0.27437591552734375, -0.24896240234375, -0.22354888916015625, -0.1981353759765625, -0.17272186279296875, -0.147308349609375, -0.12189483642578125, -0.0964813232421875, -0.07106781005859375, -0.045654296875, -0.02024078369140625, 0.0051727294921875, 0.03058624267578125, 0.055999755859375, 0.08141326904296875, 0.1068267822265625, 0.13224029541015625, 0.15765380859375, 0.18306732177734375, 0.2084808349609375, 0.23389434814453125, 0.259307861328125, 0.28472137451171875, 0.3101348876953125, 0.33554840087890625, 0.3609619140625, 0.38637542724609375, 0.4117889404296875, 0.43720245361328125, 0.462615966796875, 0.48802947998046875, 0.5134429931640625, 0.5388565063476562, 0.56427001953125, 0.5896835327148438, 0.6150970458984375, 0.6405105590820312, 0.665924072265625, 0.6913375854492188, 0.7167510986328125, 0.7421646118164062, 0.767578125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 0.0, 6.0, 3.0, 4.0, 6.0, 5.0, 8.0, 10.0, 13.0, 9.0, 13.0, 15.0, 29.0, 15.0, 27.0, 26.0, 34.0, 41.0, 42.0, 35.0, 38.0, 42.0, 29.0, 45.0, 32.0, 1072.0, 43.0, 35.0, 42.0, 31.0, 25.0, 31.0, 29.0, 23.0, 25.0, 32.0, 17.0, 17.0, 12.0, 16.0, 13.0, 8.0, 9.0, 6.0, 5.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.578125, -3.45892333984375, -3.3397216796875, -3.22052001953125, -3.101318359375, -2.98211669921875, -2.8629150390625, -2.74371337890625, -2.62451171875, -2.50531005859375, -2.3861083984375, -2.26690673828125, -2.147705078125, -2.02850341796875, -1.9093017578125, -1.79010009765625, -1.6708984375, -1.55169677734375, -1.4324951171875, -1.31329345703125, -1.194091796875, -1.07489013671875, -0.9556884765625, -0.83648681640625, -0.71728515625, -0.59808349609375, -0.4788818359375, -0.35968017578125, -0.240478515625, -0.12127685546875, -0.0020751953125, 0.11712646484375, 0.236328125, 0.35552978515625, 0.4747314453125, 0.59393310546875, 0.713134765625, 0.83233642578125, 0.9515380859375, 1.07073974609375, 1.18994140625, 1.30914306640625, 1.4283447265625, 1.54754638671875, 1.666748046875, 1.78594970703125, 1.9051513671875, 2.02435302734375, 2.1435546875, 2.26275634765625, 2.3819580078125, 2.50115966796875, 2.620361328125, 2.73956298828125, 2.8587646484375, 2.97796630859375, 3.09716796875, 3.21636962890625, 3.3355712890625, 3.45477294921875, 3.573974609375, 3.69317626953125, 3.8123779296875, 3.93157958984375, 4.05078125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 8.0, 14.0, 20.0, 25.0, 37.0, 59.0, 91.0, 168.0, 208.0, 324.0, 524.0, 803.0, 1189.0, 1887.0, 2908.0, 4392.0, 6967.0, 10612.0, 16581.0, 25456.0, 40176.0, 63115.0, 100232.0, 156474.0, 1251585.0, 150536.0, 95168.0, 60107.0, 38257.0, 24304.0, 15801.0, 10185.0, 6650.0, 4226.0, 2780.0, 1878.0, 1214.0, 757.0, 547.0, 315.0, 180.0, 132.0, 97.0, 49.0, 35.0, 31.0, 16.0, 6.0, 6.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.728515625, -0.70458984375, -0.6806640625, -0.65673828125, -0.6328125, -0.60888671875, -0.5849609375, -0.56103515625, -0.537109375, -0.51318359375, -0.4892578125, -0.46533203125, -0.44140625, -0.41748046875, -0.3935546875, -0.36962890625, -0.345703125, -0.32177734375, -0.2978515625, -0.27392578125, -0.25, -0.22607421875, -0.2021484375, -0.17822265625, -0.154296875, -0.13037109375, -0.1064453125, -0.08251953125, -0.05859375, -0.03466796875, -0.0107421875, 0.01318359375, 0.037109375, 0.06103515625, 0.0849609375, 0.10888671875, 0.1328125, 0.15673828125, 0.1806640625, 0.20458984375, 0.228515625, 0.25244140625, 0.2763671875, 0.30029296875, 0.32421875, 0.34814453125, 0.3720703125, 0.39599609375, 0.419921875, 0.44384765625, 0.4677734375, 0.49169921875, 0.515625, 0.53955078125, 0.5634765625, 0.58740234375, 0.611328125, 0.63525390625, 0.6591796875, 0.68310546875, 0.70703125, 0.73095703125, 0.7548828125, 0.77880859375, 0.802734375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 7.0, 8.0, 5.0, 8.0, 14.0, 14.0, 11.0, 27.0, 20.0, 30.0, 32.0, 53.0, 42.0, 48.0, 78.0, 76.0, 60.0, 55.0, 65.0, 60.0, 56.0, 37.0, 35.0, 38.0, 27.0, 22.0, 14.0, 11.0, 10.0, 13.0, 10.0, 5.0, 3.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014467239379882812, -0.001399114727973938, -0.0013515055179595947, -0.0013038963079452515, -0.0012562870979309082, -0.001208677887916565, -0.0011610686779022217, -0.0011134594678878784, -0.0010658502578735352, -0.001018241047859192, -0.0009706318378448486, -0.0009230226278305054, -0.0008754134178161621, -0.0008278042078018188, -0.0007801949977874756, -0.0007325857877731323, -0.0006849765777587891, -0.0006373673677444458, -0.0005897581577301025, -0.0005421489477157593, -0.000494539737701416, -0.00044693052768707275, -0.0003993213176727295, -0.00035171210765838623, -0.00030410289764404297, -0.0002564936876296997, -0.00020888447761535645, -0.00016127526760101318, -0.00011366605758666992, -6.605684757232666e-05, -1.84476375579834e-05, 2.9161572456359863e-05, 7.677078247070312e-05, 0.0001243799924850464, 0.00017198920249938965, 0.0002195984125137329, 0.00026720762252807617, 0.00031481683254241943, 0.0003624260425567627, 0.00041003525257110596, 0.0004576444625854492, 0.0005052536725997925, 0.0005528628826141357, 0.000600472092628479, 0.0006480813026428223, 0.0006956905126571655, 0.0007432997226715088, 0.000790908932685852, 0.0008385181427001953, 0.0008861273527145386, 0.0009337365627288818, 0.000981345772743225, 0.0010289549827575684, 0.0010765641927719116, 0.0011241734027862549, 0.0011717826128005981, 0.0012193918228149414, 0.0012670010328292847, 0.001314610242843628, 0.0013622194528579712, 0.0014098286628723145, 0.0014574378728866577, 0.001505047082901001, 0.0015526562929153442, 0.0016002655029296875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 8.0, 9.0, 8.0, 16.0, 28.0, 37.0, 53.0, 85.0, 105.0, 148.0, 227.0, 380.0, 1016.0, 243418.0, 800426.0, 1392.0, 428.0, 220.0, 177.0, 114.0, 59.0, 50.0, 37.0, 29.0, 19.0, 19.0, 12.0, 8.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.040985107421875, -0.039879560470581055, -0.03877401351928711, -0.037668466567993164, -0.03656291961669922, -0.03545737266540527, -0.03435182571411133, -0.03324627876281738, -0.03214073181152344, -0.031035184860229492, -0.029929637908935547, -0.0288240909576416, -0.027718544006347656, -0.02661299705505371, -0.025507450103759766, -0.02440190315246582, -0.023296356201171875, -0.02219080924987793, -0.021085262298583984, -0.01997971534729004, -0.018874168395996094, -0.01776862144470215, -0.016663074493408203, -0.015557527542114258, -0.014451980590820312, -0.013346433639526367, -0.012240886688232422, -0.011135339736938477, -0.010029792785644531, -0.008924245834350586, -0.00781869888305664, -0.006713151931762695, -0.00560760498046875, -0.004502058029174805, -0.0033965110778808594, -0.002290964126586914, -0.0011854171752929688, -7.987022399902344e-05, 0.0010256767272949219, 0.002131223678588867, 0.0032367706298828125, 0.004342317581176758, 0.005447864532470703, 0.0065534114837646484, 0.007658958435058594, 0.008764505386352539, 0.009870052337646484, 0.01097559928894043, 0.012081146240234375, 0.01318669319152832, 0.014292240142822266, 0.015397787094116211, 0.016503334045410156, 0.0176088809967041, 0.018714427947998047, 0.019819974899291992, 0.020925521850585938, 0.022031068801879883, 0.023136615753173828, 0.024242162704467773, 0.02534770965576172, 0.026453256607055664, 0.02755880355834961, 0.028664350509643555, 0.0297698974609375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 11.0, 44.0, 94.0, 236.0, 290.0, 207.0, 87.0, 29.0, 11.0, 2.0, 2.0], "bins": [-0.0037928707897663116, -0.0037267417646944523, -0.003660612739622593, -0.00359448348172009, -0.0035283544566482306, -0.003462225431576371, -0.003396096173673868, -0.003329967148602009, -0.0032638381235301495, -0.00319770909845829, -0.0031315800733864307, -0.0030654508154839277, -0.0029993217904120684, -0.002933192765340209, -0.002867063507437706, -0.0028009344823658466, -0.0027348054572939873, -0.002668676432222128, -0.0026025474071502686, -0.0025364181492477655, -0.002470289124175906, -0.002404160099104047, -0.002338030841201544, -0.0022719018161296844, -0.002205772791057825, -0.0021396437659859657, -0.0020735147409141064, -0.0020073854830116034, -0.001941256457939744, -0.0018751274328678846, -0.0018089982913807034, -0.0017428691498935223, -0.001676740124821663, -0.0016106110997498035, -0.0015444819582626224, -0.0014783528167754412, -0.0014122237917035818, -0.0013460947666317225, -0.0012799656251445413, -0.00121383648365736, -0.0011477074585855007, -0.0010815784335136414, -0.0010154492920264602, -0.0009493202087469399, -0.0008831911254674196, -0.0008170620421878994, -0.0007509329589083791, -0.0006848038756288588, -0.0006186748505569994, -0.0005525457672774792, -0.0004864166839979589, -0.0004202876007184386, -0.00035415851743891835, -0.0002880294341593981, -0.0002219003508798778, -0.00015577126760035753, -8.964218432083726e-05, -2.3513101041316986e-05, 4.261598223820329e-05, 0.00010874506551772356, 0.00017487414879724383, 0.0002410032320767641, 0.0003071323153562844, 0.00037326139863580465, 0.0004393904819153249]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 1.0, 6.0, 7.0, 14.0, 11.0, 5.0, 11.0, 16.0, 19.0, 17.0, 26.0, 29.0, 25.0, 23.0, 24.0, 21.0, 34.0, 34.0, 27.0, 30.0, 33.0, 28.0, 42.0, 32.0, 34.0, 31.0, 38.0, 31.0, 40.0, 20.0, 39.0, 33.0, 22.0, 22.0, 13.0, 15.0, 25.0, 15.0, 13.0, 11.0, 16.0, 13.0, 11.0, 7.0, 6.0, 9.0, 6.0, 2.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.000608980655670166, -0.000590234063565731, -0.0005714874714612961, -0.0005527408793568611, -0.0005339942872524261, -0.0005152476951479912, -0.0004965011030435562, -0.00047775451093912125, -0.0004590079188346863, -0.0004402613267302513, -0.00042151473462581635, -0.0004027681425213814, -0.0003840215504169464, -0.00036527495831251144, -0.0003465283662080765, -0.0003277817741036415, -0.00030903518199920654, -0.0002902885898947716, -0.0002715419977903366, -0.00025279540568590164, -0.00023404881358146667, -0.0002153022214770317, -0.00019655562937259674, -0.00017780903726816177, -0.0001590624451637268, -0.00014031585305929184, -0.00012156926095485687, -0.0001028226688504219, -8.407607674598694e-05, -6.532948464155197e-05, -4.6582892537117004e-05, -2.7836300432682037e-05, -9.08970832824707e-06, 9.656883776187897e-06, 2.8403475880622864e-05, 4.715006798505783e-05, 6.58966600894928e-05, 8.464325219392776e-05, 0.00010338984429836273, 0.0001221364364027977, 0.00014088302850723267, 0.00015962962061166763, 0.0001783762127161026, 0.00019712280482053757, 0.00021586939692497253, 0.0002346159890294075, 0.00025336258113384247, 0.00027210917323827744, 0.0002908557653427124, 0.00030960235744714737, 0.00032834894955158234, 0.0003470955416560173, 0.00036584213376045227, 0.00038458872586488724, 0.0004033353179693222, 0.00042208191007375717, 0.00044082850217819214, 0.0004595750942826271, 0.00047832168638706207, 0.000497068278491497, 0.000515814870595932, 0.000534561462700367, 0.0005533080548048019, 0.0005720546469092369, 0.0005908012390136719]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 10.0, 4.0, 9.0, 11.0, 13.0, 12.0, 15.0, 16.0, 29.0, 22.0, 27.0, 21.0, 35.0, 41.0, 33.0, 40.0, 46.0, 39.0, 45.0, 51.0, 31.0, 44.0, 52.0, 46.0, 45.0, 34.0, 27.0, 29.0, 35.0, 29.0, 18.0, 20.0, 15.0, 11.0, 10.0, 10.0, 11.0, 5.0, 3.0, 1.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6875, -6.48150634765625, -6.2755126953125, -6.06951904296875, -5.863525390625, -5.65753173828125, -5.4515380859375, -5.24554443359375, -5.03955078125, -4.83355712890625, -4.6275634765625, -4.42156982421875, -4.215576171875, -4.00958251953125, -3.8035888671875, -3.59759521484375, -3.3916015625, -3.18560791015625, -2.9796142578125, -2.77362060546875, -2.567626953125, -2.36163330078125, -2.1556396484375, -1.94964599609375, -1.74365234375, -1.53765869140625, -1.3316650390625, -1.12567138671875, -0.919677734375, -0.71368408203125, -0.5076904296875, -0.30169677734375, -0.095703125, 0.11029052734375, 0.3162841796875, 0.52227783203125, 0.728271484375, 0.93426513671875, 1.1402587890625, 1.34625244140625, 1.55224609375, 1.75823974609375, 1.9642333984375, 2.17022705078125, 2.376220703125, 2.58221435546875, 2.7882080078125, 2.99420166015625, 3.2001953125, 3.40618896484375, 3.6121826171875, 3.81817626953125, 4.024169921875, 4.23016357421875, 4.4361572265625, 4.64215087890625, 4.84814453125, 5.05413818359375, 5.2601318359375, 5.46612548828125, 5.672119140625, 5.87811279296875, 6.0841064453125, 6.29010009765625, 6.49609375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 9.0, 6.0, 9.0, 22.0, 14.0, 31.0, 40.0, 52.0, 74.0, 122.0, 145.0, 224.0, 353.0, 512.0, 817.0, 1328.0, 2160.0, 3745.0, 7003.0, 14664.0, 37347.0, 118126.0, 416637.0, 307477.0, 83308.0, 28204.0, 11842.0, 5972.0, 3203.0, 1832.0, 1119.0, 700.0, 482.0, 311.0, 208.0, 135.0, 110.0, 46.0, 42.0, 42.0, 29.0, 15.0, 11.0, 4.0, 7.0, 7.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.0078125, -3.88201904296875, -3.7562255859375, -3.63043212890625, -3.504638671875, -3.37884521484375, -3.2530517578125, -3.12725830078125, -3.00146484375, -2.87567138671875, -2.7498779296875, -2.62408447265625, -2.498291015625, -2.37249755859375, -2.2467041015625, -2.12091064453125, -1.9951171875, -1.86932373046875, -1.7435302734375, -1.61773681640625, -1.491943359375, -1.36614990234375, -1.2403564453125, -1.11456298828125, -0.98876953125, -0.86297607421875, -0.7371826171875, -0.61138916015625, -0.485595703125, -0.35980224609375, -0.2340087890625, -0.10821533203125, 0.017578125, 0.14337158203125, 0.2691650390625, 0.39495849609375, 0.520751953125, 0.64654541015625, 0.7723388671875, 0.89813232421875, 1.02392578125, 1.14971923828125, 1.2755126953125, 1.40130615234375, 1.527099609375, 1.65289306640625, 1.7786865234375, 1.90447998046875, 2.0302734375, 2.15606689453125, 2.2818603515625, 2.40765380859375, 2.533447265625, 2.65924072265625, 2.7850341796875, 2.91082763671875, 3.03662109375, 3.16241455078125, 3.2882080078125, 3.41400146484375, 3.539794921875, 3.66558837890625, 3.7913818359375, 3.91717529296875, 4.04296875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 5.0, 6.0, 11.0, 10.0, 9.0, 15.0, 14.0, 15.0, 19.0, 22.0, 27.0, 34.0, 38.0, 51.0, 39.0, 41.0, 55.0, 80.0, 1584.0, 491.0, 76.0, 47.0, 42.0, 33.0, 32.0, 43.0, 30.0, 33.0, 20.0, 26.0, 23.0, 19.0, 12.0, 14.0, 7.0, 5.0, 8.0, 6.0, 5.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.9375, -22.17236328125, -21.4072265625, -20.64208984375, -19.876953125, -19.11181640625, -18.3466796875, -17.58154296875, -16.81640625, -16.05126953125, -15.2861328125, -14.52099609375, -13.755859375, -12.99072265625, -12.2255859375, -11.46044921875, -10.6953125, -9.93017578125, -9.1650390625, -8.39990234375, -7.634765625, -6.86962890625, -6.1044921875, -5.33935546875, -4.57421875, -3.80908203125, -3.0439453125, -2.27880859375, -1.513671875, -0.74853515625, 0.0166015625, 0.78173828125, 1.546875, 2.31201171875, 3.0771484375, 3.84228515625, 4.607421875, 5.37255859375, 6.1376953125, 6.90283203125, 7.66796875, 8.43310546875, 9.1982421875, 9.96337890625, 10.728515625, 11.49365234375, 12.2587890625, 13.02392578125, 13.7890625, 14.55419921875, 15.3193359375, 16.08447265625, 16.849609375, 17.61474609375, 18.3798828125, 19.14501953125, 19.91015625, 20.67529296875, 21.4404296875, 22.20556640625, 22.970703125, 23.73583984375, 24.5009765625, 25.26611328125, 26.03125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 6.0, 10.0, 18.0, 22.0, 22.0, 30.0, 36.0, 36.0, 58.0, 71.0, 92.0, 152.0, 285.0, 554.0, 2765.0, 573221.0, 2563095.0, 3719.0, 618.0, 288.0, 139.0, 100.0, 81.0, 63.0, 49.0, 29.0, 20.0, 24.0, 10.0, 11.0, 13.0, 8.0, 10.0, 10.0, 5.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-42.21875, -40.97900390625, -39.7392578125, -38.49951171875, -37.259765625, -36.02001953125, -34.7802734375, -33.54052734375, -32.30078125, -31.06103515625, -29.8212890625, -28.58154296875, -27.341796875, -26.10205078125, -24.8623046875, -23.62255859375, -22.3828125, -21.14306640625, -19.9033203125, -18.66357421875, -17.423828125, -16.18408203125, -14.9443359375, -13.70458984375, -12.46484375, -11.22509765625, -9.9853515625, -8.74560546875, -7.505859375, -6.26611328125, -5.0263671875, -3.78662109375, -2.546875, -1.30712890625, -0.0673828125, 1.17236328125, 2.412109375, 3.65185546875, 4.8916015625, 6.13134765625, 7.37109375, 8.61083984375, 9.8505859375, 11.09033203125, 12.330078125, 13.56982421875, 14.8095703125, 16.04931640625, 17.2890625, 18.52880859375, 19.7685546875, 21.00830078125, 22.248046875, 23.48779296875, 24.7275390625, 25.96728515625, 27.20703125, 28.44677734375, 29.6865234375, 30.92626953125, 32.166015625, 33.40576171875, 34.6455078125, 35.88525390625, 37.125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [5.0, 167.0, 768.0, 78.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.039982795715332, -5.830307483673096, -1.6206321716308594, 2.589043617248535, 6.798718452453613, 11.008393287658691, 15.218070030212402, 19.427745819091797, 23.637420654296875, 27.847095489501953, 32.05677032470703, 36.266448974609375, 40.47611999511719, 44.68579864501953, 48.89547348022461, 53.10514831542969, 57.314823150634766, 61.524497985839844, 65.73417663574219, 69.94384765625, 74.15352630615234, 78.36319732666016, 82.5728759765625, 86.78254699707031, 90.99222564697266, 95.201904296875, 99.41157531738281, 103.62125396728516, 107.83092498779297, 112.04060363769531, 116.25027465820312, 120.45995330810547, 124.66963195800781, 128.87930297851562, 133.0889892578125, 137.2986602783203, 141.50833129882812, 145.71800231933594, 149.9276885986328, 154.13735961914062, 158.34703063964844, 162.55670166015625, 166.76638793945312, 170.97605895996094, 175.18572998046875, 179.39540100097656, 183.60508728027344, 187.81475830078125, 192.02444458007812, 196.23411560058594, 200.4438018798828, 204.65347290039062, 208.86314392089844, 213.07281494140625, 217.28250122070312, 221.49217224121094, 225.70184326171875, 229.91151428222656, 234.12120056152344, 238.33087158203125, 242.54054260253906, 246.75021362304688, 250.95989990234375, 255.16957092285156, 259.3792419433594]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 8.0, 7.0, 2.0, 7.0, 3.0, 13.0, 7.0, 11.0, 13.0, 19.0, 21.0, 17.0, 16.0, 25.0, 21.0, 24.0, 31.0, 30.0, 24.0, 37.0, 37.0, 41.0, 39.0, 48.0, 35.0, 40.0, 45.0, 43.0, 25.0, 41.0, 44.0, 28.0, 22.0, 20.0, 27.0, 13.0, 15.0, 9.0, 14.0, 17.0, 18.0, 14.0, 7.0, 3.0, 5.0, 9.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-72.71269226074219, -70.53578186035156, -68.35887145996094, -66.18196105957031, -64.00505065917969, -61.82814025878906, -59.6512336730957, -57.47432327270508, -55.29741287231445, -53.12050247192383, -50.9435920715332, -48.76668167114258, -46.58977508544922, -44.412864685058594, -42.23595428466797, -40.059043884277344, -37.88213348388672, -35.705223083496094, -33.52831268310547, -31.351404190063477, -29.17449378967285, -26.997583389282227, -24.820674896240234, -22.64376449584961, -20.466854095458984, -18.28994369506836, -16.113033294677734, -13.936124801635742, -11.759214401245117, -9.582304000854492, -7.405394554138184, -5.228485107421875, -3.0515823364257812, -0.8746724128723145, 1.3022375106811523, 3.479147434234619, 5.656057357788086, 7.832967758178711, 10.00987720489502, 12.186786651611328, 14.363697052001953, 16.540607452392578, 18.717517852783203, 20.894426345825195, 23.07133674621582, 25.248247146606445, 27.425155639648438, 29.602066040039062, 31.778976440429688, 33.95588684082031, 36.13279724121094, 38.30970764160156, 40.48661804199219, 42.66352844238281, 44.84043502807617, 47.0173454284668, 49.19425582885742, 51.37116622924805, 53.54807662963867, 55.7249870300293, 57.901893615722656, 60.07880401611328, 62.255714416503906, 64.43262481689453, 66.60953521728516]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 5.0, 10.0, 10.0, 13.0, 16.0, 10.0, 19.0, 24.0, 19.0, 34.0, 26.0, 31.0, 33.0, 39.0, 36.0, 43.0, 52.0, 32.0, 43.0, 45.0, 47.0, 48.0, 36.0, 47.0, 40.0, 20.0, 33.0, 31.0, 28.0, 24.0, 21.0, 15.0, 9.0, 10.0, 11.0, 12.0, 5.0, 1.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.71875, -6.51177978515625, -6.3048095703125, -6.09783935546875, -5.890869140625, -5.68389892578125, -5.4769287109375, -5.26995849609375, -5.06298828125, -4.85601806640625, -4.6490478515625, -4.44207763671875, -4.235107421875, -4.02813720703125, -3.8211669921875, -3.61419677734375, -3.4072265625, -3.20025634765625, -2.9932861328125, -2.78631591796875, -2.579345703125, -2.37237548828125, -2.1654052734375, -1.95843505859375, -1.75146484375, -1.54449462890625, -1.3375244140625, -1.13055419921875, -0.923583984375, -0.71661376953125, -0.5096435546875, -0.30267333984375, -0.095703125, 0.11126708984375, 0.3182373046875, 0.52520751953125, 0.732177734375, 0.93914794921875, 1.1461181640625, 1.35308837890625, 1.56005859375, 1.76702880859375, 1.9739990234375, 2.18096923828125, 2.387939453125, 2.59490966796875, 2.8018798828125, 3.00885009765625, 3.2158203125, 3.42279052734375, 3.6297607421875, 3.83673095703125, 4.043701171875, 4.25067138671875, 4.4576416015625, 4.66461181640625, 4.87158203125, 5.07855224609375, 5.2855224609375, 5.49249267578125, 5.699462890625, 5.90643310546875, 6.1134033203125, 6.32037353515625, 6.52734375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 12.0, 13.0, 17.0, 16.0, 17.0, 15.0, 26.0, 28.0, 45.0, 76.0, 111.0, 193.0, 390.0, 1623.0, 8971.0, 108092.0, 2442870.0, 1564272.0, 59460.0, 6003.0, 1107.0, 376.0, 171.0, 94.0, 65.0, 37.0, 29.0, 37.0, 14.0, 16.0, 7.0, 15.0, 12.0, 9.0, 7.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.140625, -20.498046875, -19.85546875, -19.212890625, -18.5703125, -17.927734375, -17.28515625, -16.642578125, -16.0, -15.357421875, -14.71484375, -14.072265625, -13.4296875, -12.787109375, -12.14453125, -11.501953125, -10.859375, -10.216796875, -9.57421875, -8.931640625, -8.2890625, -7.646484375, -7.00390625, -6.361328125, -5.71875, -5.076171875, -4.43359375, -3.791015625, -3.1484375, -2.505859375, -1.86328125, -1.220703125, -0.578125, 0.064453125, 0.70703125, 1.349609375, 1.9921875, 2.634765625, 3.27734375, 3.919921875, 4.5625, 5.205078125, 5.84765625, 6.490234375, 7.1328125, 7.775390625, 8.41796875, 9.060546875, 9.703125, 10.345703125, 10.98828125, 11.630859375, 12.2734375, 12.916015625, 13.55859375, 14.201171875, 14.84375, 15.486328125, 16.12890625, 16.771484375, 17.4140625, 18.056640625, 18.69921875, 19.341796875, 19.984375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 3.0, 12.0, 21.0, 22.0, 33.0, 63.0, 101.0, 127.0, 196.0, 268.0, 441.0, 569.0, 624.0, 524.0, 380.0, 231.0, 148.0, 99.0, 74.0, 42.0, 32.0, 26.0, 11.0, 7.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.546875, -23.848876953125, -23.15087890625, -22.452880859375, -21.7548828125, -21.056884765625, -20.35888671875, -19.660888671875, -18.962890625, -18.264892578125, -17.56689453125, -16.868896484375, -16.1708984375, -15.472900390625, -14.77490234375, -14.076904296875, -13.37890625, -12.680908203125, -11.98291015625, -11.284912109375, -10.5869140625, -9.888916015625, -9.19091796875, -8.492919921875, -7.794921875, -7.096923828125, -6.39892578125, -5.700927734375, -5.0029296875, -4.304931640625, -3.60693359375, -2.908935546875, -2.2109375, -1.512939453125, -0.81494140625, -0.116943359375, 0.5810546875, 1.279052734375, 1.97705078125, 2.675048828125, 3.373046875, 4.071044921875, 4.76904296875, 5.467041015625, 6.1650390625, 6.863037109375, 7.56103515625, 8.259033203125, 8.95703125, 9.655029296875, 10.35302734375, 11.051025390625, 11.7490234375, 12.447021484375, 13.14501953125, 13.843017578125, 14.541015625, 15.239013671875, 15.93701171875, 16.635009765625, 17.3330078125, 18.031005859375, 18.72900390625, 19.427001953125, 20.125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 7.0, 3.0, 5.0, 8.0, 18.0, 18.0, 24.0, 36.0, 52.0, 70.0, 97.0, 136.0, 193.0, 345.0, 944.0, 6419.0, 1688217.0, 2487962.0, 7783.0, 932.0, 327.0, 207.0, 134.0, 94.0, 71.0, 52.0, 37.0, 25.0, 24.0, 19.0, 5.0, 5.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.78125, -50.58447265625, -48.3876953125, -46.19091796875, -43.994140625, -41.79736328125, -39.6005859375, -37.40380859375, -35.20703125, -33.01025390625, -30.8134765625, -28.61669921875, -26.419921875, -24.22314453125, -22.0263671875, -19.82958984375, -17.6328125, -15.43603515625, -13.2392578125, -11.04248046875, -8.845703125, -6.64892578125, -4.4521484375, -2.25537109375, -0.05859375, 2.13818359375, 4.3349609375, 6.53173828125, 8.728515625, 10.92529296875, 13.1220703125, 15.31884765625, 17.515625, 19.71240234375, 21.9091796875, 24.10595703125, 26.302734375, 28.49951171875, 30.6962890625, 32.89306640625, 35.08984375, 37.28662109375, 39.4833984375, 41.68017578125, 43.876953125, 46.07373046875, 48.2705078125, 50.46728515625, 52.6640625, 54.86083984375, 57.0576171875, 59.25439453125, 61.451171875, 63.64794921875, 65.8447265625, 68.04150390625, 70.23828125, 72.43505859375, 74.6318359375, 76.82861328125, 79.025390625, 81.22216796875, 83.4189453125, 85.61572265625, 87.8125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 12.0, 46.0, 105.0, 197.0, 272.0, 196.0, 111.0, 52.0, 13.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.05514526367188, -158.57041931152344, -154.08570861816406, -149.60098266601562, -145.11627197265625, -140.6315460205078, -136.14682006835938, -131.662109375, -127.17738342285156, -122.69266510009766, -118.20794677734375, -113.72322082519531, -109.2385025024414, -104.7537841796875, -100.26905822753906, -95.78433990478516, -91.29962158203125, -86.81490325927734, -82.33018493652344, -77.845458984375, -73.3607406616211, -68.87602233886719, -64.39129638671875, -59.906578063964844, -55.42185974121094, -50.93714141845703, -46.45241928100586, -41.96769714355469, -37.48297882080078, -32.998260498046875, -28.513538360595703, -24.028818130493164, -19.544097900390625, -15.059377670288086, -10.574657440185547, -6.089937210083008, -1.6052169799804688, 2.8795032501220703, 7.364223480224609, 11.848943710327148, 16.333663940429688, 20.818384170532227, 25.303104400634766, 29.787824630737305, 34.272544860839844, 38.75726318359375, 43.24198532104492, 47.726707458496094, 52.21142578125, 56.696144104003906, 61.18086624145508, 65.66558837890625, 70.15030670166016, 74.63502502441406, 79.1197509765625, 83.6044692993164, 88.08918762207031, 92.57390594482422, 97.05862426757812, 101.54335021972656, 106.02806854248047, 110.51278686523438, 114.99751281738281, 119.48223114013672, 123.96694946289062]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 7.0, 7.0, 11.0, 8.0, 13.0, 11.0, 21.0, 20.0, 22.0, 22.0, 20.0, 25.0, 30.0, 26.0, 26.0, 28.0, 37.0, 36.0, 43.0, 37.0, 32.0, 31.0, 41.0, 44.0, 44.0, 41.0, 35.0, 23.0, 30.0, 24.0, 22.0, 22.0, 21.0, 26.0, 20.0, 20.0, 16.0, 10.0, 10.0, 10.0, 5.0, 8.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.805999755859375, -49.17817687988281, -47.550350189208984, -45.922523498535156, -44.294700622558594, -42.66687774658203, -41.0390510559082, -39.411224365234375, -37.78340148925781, -36.15557861328125, -34.52775192260742, -32.899925231933594, -31.27210235595703, -29.644277572631836, -28.01645278930664, -26.388628005981445, -24.76080322265625, -23.132978439331055, -21.50515365600586, -19.877328872680664, -18.24950408935547, -16.621679306030273, -14.993854522705078, -13.366029739379883, -11.738204956054688, -10.110380172729492, -8.482555389404297, -6.854730606079102, -5.226905822753906, -3.599081039428711, -1.9712562561035156, -0.3434314727783203, 1.284393310546875, 2.9122180938720703, 4.540042877197266, 6.167867660522461, 7.795692443847656, 9.423517227172852, 11.051342010498047, 12.679166793823242, 14.306991577148438, 15.934816360473633, 17.562641143798828, 19.190465927124023, 20.81829071044922, 22.446115493774414, 24.07394027709961, 25.701765060424805, 27.32958984375, 28.957414627075195, 30.58523941040039, 32.21306610107422, 33.84088897705078, 35.468711853027344, 37.09653854370117, 38.724365234375, 40.35218811035156, 41.980010986328125, 43.60783767700195, 45.23566436767578, 46.863487243652344, 48.491310119628906, 50.119136810302734, 51.74696350097656, 53.374786376953125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 10.0, 7.0, 17.0, 20.0, 16.0, 21.0, 19.0, 30.0, 25.0, 34.0, 29.0, 31.0, 39.0, 41.0, 36.0, 35.0, 46.0, 43.0, 48.0, 39.0, 37.0, 40.0, 32.0, 29.0, 37.0, 29.0, 35.0, 21.0, 23.0, 11.0, 15.0, 21.0, 9.0, 9.0, 12.0, 8.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.68359375, -6.48138427734375, -6.2791748046875, -6.07696533203125, -5.874755859375, -5.67254638671875, -5.4703369140625, -5.26812744140625, -5.06591796875, -4.86370849609375, -4.6614990234375, -4.45928955078125, -4.257080078125, -4.05487060546875, -3.8526611328125, -3.65045166015625, -3.4482421875, -3.24603271484375, -3.0438232421875, -2.84161376953125, -2.639404296875, -2.43719482421875, -2.2349853515625, -2.03277587890625, -1.83056640625, -1.62835693359375, -1.4261474609375, -1.22393798828125, -1.021728515625, -0.81951904296875, -0.6173095703125, -0.41510009765625, -0.212890625, -0.01068115234375, 0.1915283203125, 0.39373779296875, 0.595947265625, 0.79815673828125, 1.0003662109375, 1.20257568359375, 1.40478515625, 1.60699462890625, 1.8092041015625, 2.01141357421875, 2.213623046875, 2.41583251953125, 2.6180419921875, 2.82025146484375, 3.0224609375, 3.22467041015625, 3.4268798828125, 3.62908935546875, 3.831298828125, 4.03350830078125, 4.2357177734375, 4.43792724609375, 4.64013671875, 4.84234619140625, 5.0445556640625, 5.24676513671875, 5.448974609375, 5.65118408203125, 5.8533935546875, 6.05560302734375, 6.2578125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 6.0, 5.0, 12.0, 20.0, 25.0, 26.0, 43.0, 66.0, 100.0, 154.0, 188.0, 256.0, 410.0, 610.0, 863.0, 1221.0, 1764.0, 2702.0, 3810.0, 5770.0, 8495.0, 12696.0, 19409.0, 29798.0, 46139.0, 72337.0, 113949.0, 180878.0, 196869.0, 125031.0, 78774.0, 50229.0, 32163.0, 21011.0, 13904.0, 9401.0, 6178.0, 4119.0, 2787.0, 1977.0, 1382.0, 888.0, 647.0, 432.0, 324.0, 198.0, 159.0, 113.0, 78.0, 52.0, 32.0, 26.0, 11.0, 12.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0], "bins": [-0.86572265625, -0.8387527465820312, -0.8117828369140625, -0.7848129272460938, -0.757843017578125, -0.7308731079101562, -0.7039031982421875, -0.6769332885742188, -0.64996337890625, -0.6229934692382812, -0.5960235595703125, -0.5690536499023438, -0.542083740234375, -0.5151138305664062, -0.4881439208984375, -0.46117401123046875, -0.4342041015625, -0.40723419189453125, -0.3802642822265625, -0.35329437255859375, -0.326324462890625, -0.29935455322265625, -0.2723846435546875, -0.24541473388671875, -0.21844482421875, -0.19147491455078125, -0.1645050048828125, -0.13753509521484375, -0.110565185546875, -0.08359527587890625, -0.0566253662109375, -0.02965545654296875, -0.002685546875, 0.02428436279296875, 0.0512542724609375, 0.07822418212890625, 0.105194091796875, 0.13216400146484375, 0.1591339111328125, 0.18610382080078125, 0.21307373046875, 0.24004364013671875, 0.2670135498046875, 0.29398345947265625, 0.320953369140625, 0.34792327880859375, 0.3748931884765625, 0.40186309814453125, 0.4288330078125, 0.45580291748046875, 0.4827728271484375, 0.5097427368164062, 0.536712646484375, 0.5636825561523438, 0.5906524658203125, 0.6176223754882812, 0.64459228515625, 0.6715621948242188, 0.6985321044921875, 0.7255020141601562, 0.752471923828125, 0.7794418334960938, 0.8064117431640625, 0.8333816528320312, 0.8603515625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 5.0, 4.0, 6.0, 4.0, 5.0, 6.0, 12.0, 5.0, 7.0, 13.0, 20.0, 18.0, 29.0, 24.0, 31.0, 15.0, 33.0, 31.0, 42.0, 35.0, 33.0, 36.0, 49.0, 36.0, 1065.0, 45.0, 43.0, 43.0, 36.0, 29.0, 31.0, 20.0, 32.0, 28.0, 26.0, 19.0, 17.0, 16.0, 17.0, 14.0, 9.0, 13.0, 10.0, 7.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.140625, -4.021087646484375, -3.90155029296875, -3.782012939453125, -3.6624755859375, -3.542938232421875, -3.42340087890625, -3.303863525390625, -3.184326171875, -3.064788818359375, -2.94525146484375, -2.825714111328125, -2.7061767578125, -2.586639404296875, -2.46710205078125, -2.347564697265625, -2.22802734375, -2.108489990234375, -1.98895263671875, -1.869415283203125, -1.7498779296875, -1.630340576171875, -1.51080322265625, -1.391265869140625, -1.271728515625, -1.152191162109375, -1.03265380859375, -0.913116455078125, -0.7935791015625, -0.674041748046875, -0.55450439453125, -0.434967041015625, -0.3154296875, -0.195892333984375, -0.07635498046875, 0.043182373046875, 0.1627197265625, 0.282257080078125, 0.40179443359375, 0.521331787109375, 0.640869140625, 0.760406494140625, 0.87994384765625, 0.999481201171875, 1.1190185546875, 1.238555908203125, 1.35809326171875, 1.477630615234375, 1.59716796875, 1.716705322265625, 1.83624267578125, 1.955780029296875, 2.0753173828125, 2.194854736328125, 2.31439208984375, 2.433929443359375, 2.553466796875, 2.673004150390625, 2.79254150390625, 2.912078857421875, 3.0316162109375, 3.151153564453125, 3.27069091796875, 3.390228271484375, 3.509765625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 8.0, 13.0, 11.0, 11.0, 24.0, 42.0, 55.0, 91.0, 147.0, 190.0, 298.0, 419.0, 592.0, 951.0, 1467.0, 2134.0, 3223.0, 4615.0, 6981.0, 10335.0, 15839.0, 24434.0, 37499.0, 57957.0, 89813.0, 139460.0, 1247682.0, 159945.0, 102280.0, 66171.0, 43212.0, 27602.0, 17958.0, 11736.0, 7930.0, 5350.0, 3445.0, 2356.0, 1576.0, 1069.0, 741.0, 485.0, 319.0, 216.0, 173.0, 99.0, 70.0, 34.0, 31.0, 23.0, 13.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.77490234375, -0.7504196166992188, -0.7259368896484375, -0.7014541625976562, -0.676971435546875, -0.6524887084960938, -0.6280059814453125, -0.6035232543945312, -0.57904052734375, -0.5545578002929688, -0.5300750732421875, -0.5055923461914062, -0.481109619140625, -0.45662689208984375, -0.4321441650390625, -0.40766143798828125, -0.3831787109375, -0.35869598388671875, -0.3342132568359375, -0.30973052978515625, -0.285247802734375, -0.26076507568359375, -0.2362823486328125, -0.21179962158203125, -0.18731689453125, -0.16283416748046875, -0.1383514404296875, -0.11386871337890625, -0.089385986328125, -0.06490325927734375, -0.0404205322265625, -0.01593780517578125, 0.008544921875, 0.03302764892578125, 0.0575103759765625, 0.08199310302734375, 0.106475830078125, 0.13095855712890625, 0.1554412841796875, 0.17992401123046875, 0.20440673828125, 0.22888946533203125, 0.2533721923828125, 0.27785491943359375, 0.302337646484375, 0.32682037353515625, 0.3513031005859375, 0.37578582763671875, 0.4002685546875, 0.42475128173828125, 0.4492340087890625, 0.47371673583984375, 0.498199462890625, 0.5226821899414062, 0.5471649169921875, 0.5716476440429688, 0.59613037109375, 0.6206130981445312, 0.6450958251953125, 0.6695785522460938, 0.694061279296875, 0.7185440063476562, 0.7430267333984375, 0.7675094604492188, 0.7919921875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 7.0, 9.0, 7.0, 8.0, 12.0, 12.0, 11.0, 15.0, 20.0, 20.0, 27.0, 34.0, 42.0, 47.0, 61.0, 63.0, 68.0, 93.0, 74.0, 62.0, 59.0, 42.0, 27.0, 36.0, 24.0, 28.0, 25.0, 17.0, 14.0, 6.0, 8.0, 9.0, 3.0, 0.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.0018682479858398438, -0.0018110424280166626, -0.0017538368701934814, -0.0016966313123703003, -0.0016394257545471191, -0.001582220196723938, -0.0015250146389007568, -0.0014678090810775757, -0.0014106035232543945, -0.0013533979654312134, -0.0012961924076080322, -0.001238986849784851, -0.00118178129196167, -0.0011245757341384888, -0.0010673701763153076, -0.0010101646184921265, -0.0009529590606689453, -0.0008957535028457642, -0.000838547945022583, -0.0007813423871994019, -0.0007241368293762207, -0.0006669312715530396, -0.0006097257137298584, -0.0005525201559066772, -0.0004953145980834961, -0.00043810904026031494, -0.0003809034824371338, -0.00032369792461395264, -0.0002664923667907715, -0.00020928680896759033, -0.00015208125114440918, -9.487569332122803e-05, -3.7670135498046875e-05, 1.9535422325134277e-05, 7.674098014831543e-05, 0.00013394653797149658, 0.00019115209579467773, 0.0002483576536178589, 0.00030556321144104004, 0.0003627687692642212, 0.00041997432708740234, 0.0004771798849105835, 0.0005343854427337646, 0.0005915910005569458, 0.000648796558380127, 0.0007060021162033081, 0.0007632076740264893, 0.0008204132318496704, 0.0008776187896728516, 0.0009348243474960327, 0.0009920299053192139, 0.001049235463142395, 0.0011064410209655762, 0.0011636465787887573, 0.0012208521366119385, 0.0012780576944351196, 0.0013352632522583008, 0.001392468810081482, 0.001449674367904663, 0.0015068799257278442, 0.0015640854835510254, 0.0016212910413742065, 0.0016784965991973877, 0.0017357021570205688, 0.00179290771484375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 11.0, 4.0, 13.0, 9.0, 23.0, 18.0, 32.0, 45.0, 60.0, 95.0, 160.0, 281.0, 647.0, 28193.0, 1016093.0, 1786.0, 430.0, 205.0, 125.0, 74.0, 43.0, 32.0, 30.0, 23.0, 21.0, 19.0, 12.0, 9.0, 8.0, 10.0, 6.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0372314453125, -0.035913944244384766, -0.03459644317626953, -0.0332789421081543, -0.03196144104003906, -0.030643939971923828, -0.029326438903808594, -0.02800893783569336, -0.026691436767578125, -0.02537393569946289, -0.024056434631347656, -0.022738933563232422, -0.021421432495117188, -0.020103931427001953, -0.01878643035888672, -0.017468929290771484, -0.01615142822265625, -0.014833927154541016, -0.013516426086425781, -0.012198925018310547, -0.010881423950195312, -0.009563922882080078, -0.008246421813964844, -0.006928920745849609, -0.005611419677734375, -0.004293918609619141, -0.0029764175415039062, -0.0016589164733886719, -0.0003414154052734375, 0.0009760856628417969, 0.0022935867309570312, 0.0036110877990722656, 0.0049285888671875, 0.006246089935302734, 0.007563591003417969, 0.008881092071533203, 0.010198593139648438, 0.011516094207763672, 0.012833595275878906, 0.01415109634399414, 0.015468597412109375, 0.01678609848022461, 0.018103599548339844, 0.019421100616455078, 0.020738601684570312, 0.022056102752685547, 0.02337360382080078, 0.024691104888916016, 0.02600860595703125, 0.027326107025146484, 0.02864360809326172, 0.029961109161376953, 0.03127861022949219, 0.03259611129760742, 0.033913612365722656, 0.03523111343383789, 0.036548614501953125, 0.03786611557006836, 0.039183616638183594, 0.04050111770629883, 0.04181861877441406, 0.0431361198425293, 0.04445362091064453, 0.045771121978759766, 0.047088623046875]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 53.0, 427.0, 449.0, 75.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0084548844024539, -0.008292448706924915, -0.008130013011395931, -0.007967577315866947, -0.00780514208599925, -0.007642706390470266, -0.007480270694941282, -0.0073178354650735855, -0.0071553997695446014, -0.006992964074015617, -0.006830528378486633, -0.0066680931486189365, -0.0065056574530899525, -0.006343221757560968, -0.006180786062031984, -0.006018350832164288, -0.0058559151366353035, -0.005693479441106319, -0.005531043745577335, -0.005368608515709639, -0.0052061728201806545, -0.0050437371246516705, -0.004881301429122686, -0.00471886619925499, -0.004556430038064718, -0.004393994342535734, -0.00423155864700675, -0.004069123417139053, -0.003906687721610069, -0.003744252026081085, -0.003581816330552101, -0.0034193808678537607, -0.003256945637986064, -0.00309450994245708, -0.0029320744797587395, -0.0027696387842297554, -0.002607203321531415, -0.002444767626002431, -0.0022823321633040905, -0.0021198964677751064, -0.0019574607722461224, -0.0017950251931324601, -0.0016325896140187979, -0.0014701539184898138, -0.0013077184557914734, -0.0011452827602624893, -0.000982847181148827, -0.0008204116020351648, -0.0006579761393368244, -0.0004955405602231622, -0.0003331049520056695, -0.00017066934378817677, -8.233764674514532e-06, 0.0001542018144391477, 0.00031663745176047087, 0.0004790730308741331, 0.0006415086099877954, 0.0008039441891014576, 0.0009663797682151198, 0.001128815347328782, 0.0012912510428577662, 0.0014536865055561066, 0.0016161222010850906, 0.0017785577801987529, 0.0019409933593124151]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 9.0, 6.0, 1.0, 5.0, 9.0, 5.0, 10.0, 22.0, 19.0, 24.0, 21.0, 25.0, 32.0, 31.0, 30.0, 30.0, 34.0, 30.0, 41.0, 36.0, 45.0, 43.0, 47.0, 28.0, 29.0, 46.0, 47.0, 35.0, 33.0, 31.0, 20.0, 23.0, 29.0, 21.0, 28.0, 17.0, 14.0, 11.0, 8.0, 11.0, 7.0, 1.0, 2.0, 6.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0009077787399291992, -0.0008791247382760048, -0.0008504707366228104, -0.0008218167349696159, -0.0007931627333164215, -0.0007645087316632271, -0.0007358547300100327, -0.0007072007283568382, -0.0006785467267036438, -0.0006498927250504494, -0.0006212387233972549, -0.0005925847217440605, -0.0005639307200908661, -0.0005352767184376717, -0.0005066227167844772, -0.0004779687151312828, -0.0004493147134780884, -0.00042066071182489395, -0.0003920067101716995, -0.0003633527085185051, -0.00033469870686531067, -0.00030604470521211624, -0.0002773907035589218, -0.0002487367019057274, -0.00022008270025253296, -0.00019142869859933853, -0.0001627746969461441, -0.00013412069529294968, -0.00010546669363975525, -7.681269198656082e-05, -4.8158690333366394e-05, -1.9504688680171967e-05, 9.149312973022461e-06, 3.780331462621689e-05, 6.645731627941132e-05, 9.511131793260574e-05, 0.00012376531958580017, 0.0001524193212389946, 0.00018107332289218903, 0.00020972732454538345, 0.00023838132619857788, 0.0002670353278517723, 0.00029568932950496674, 0.00032434333115816116, 0.0003529973328113556, 0.00038165133446455, 0.00041030533611774445, 0.0004389593377709389, 0.0004676133394241333, 0.0004962673410773277, 0.0005249213427305222, 0.0005535753443837166, 0.000582229346036911, 0.0006108833476901054, 0.0006395373493432999, 0.0006681913509964943, 0.0006968453526496887, 0.0007254993543028831, 0.0007541533559560776, 0.000782807357609272, 0.0008114613592624664, 0.0008401153609156609, 0.0008687693625688553, 0.0008974233642220497, 0.0009260773658752441]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 9.0, 14.0, 10.0, 7.0, 17.0, 20.0, 16.0, 21.0, 19.0, 30.0, 25.0, 34.0, 29.0, 31.0, 39.0, 41.0, 36.0, 35.0, 46.0, 43.0, 48.0, 39.0, 37.0, 40.0, 32.0, 29.0, 37.0, 29.0, 35.0, 21.0, 23.0, 11.0, 15.0, 21.0, 9.0, 9.0, 13.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.68359375, -6.48138427734375, -6.2791748046875, -6.07696533203125, -5.874755859375, -5.67254638671875, -5.4703369140625, -5.26812744140625, -5.06591796875, -4.86370849609375, -4.6614990234375, -4.45928955078125, -4.257080078125, -4.05487060546875, -3.8526611328125, -3.65045166015625, -3.4482421875, -3.24603271484375, -3.0438232421875, -2.84161376953125, -2.639404296875, -2.43719482421875, -2.2349853515625, -2.03277587890625, -1.83056640625, -1.62835693359375, -1.4261474609375, -1.22393798828125, -1.021728515625, -0.81951904296875, -0.6173095703125, -0.41510009765625, -0.212890625, -0.01068115234375, 0.1915283203125, 0.39373779296875, 0.595947265625, 0.79815673828125, 1.0003662109375, 1.20257568359375, 1.40478515625, 1.60699462890625, 1.8092041015625, 2.01141357421875, 2.213623046875, 2.41583251953125, 2.6180419921875, 2.82025146484375, 3.0224609375, 3.22467041015625, 3.4268798828125, 3.62908935546875, 3.831298828125, 4.03350830078125, 4.2357177734375, 4.43792724609375, 4.64013671875, 4.84234619140625, 5.0445556640625, 5.24676513671875, 5.448974609375, 5.65118408203125, 5.8533935546875, 6.05560302734375, 6.2578125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 9.0, 11.0, 17.0, 33.0, 39.0, 67.0, 84.0, 111.0, 182.0, 260.0, 384.0, 609.0, 851.0, 1277.0, 1856.0, 2898.0, 4496.0, 7324.0, 12885.0, 26989.0, 73030.0, 301512.0, 442315.0, 99486.0, 33646.0, 15385.0, 8154.0, 5000.0, 3213.0, 2102.0, 1374.0, 934.0, 647.0, 424.0, 313.0, 183.0, 137.0, 92.0, 77.0, 42.0, 35.0, 18.0, 18.0, 10.0, 3.0, 10.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.23046875, -5.07257080078125, -4.9146728515625, -4.75677490234375, -4.598876953125, -4.44097900390625, -4.2830810546875, -4.12518310546875, -3.96728515625, -3.80938720703125, -3.6514892578125, -3.49359130859375, -3.335693359375, -3.17779541015625, -3.0198974609375, -2.86199951171875, -2.7041015625, -2.54620361328125, -2.3883056640625, -2.23040771484375, -2.072509765625, -1.91461181640625, -1.7567138671875, -1.59881591796875, -1.44091796875, -1.28302001953125, -1.1251220703125, -0.96722412109375, -0.809326171875, -0.65142822265625, -0.4935302734375, -0.33563232421875, -0.177734375, -0.01983642578125, 0.1380615234375, 0.29595947265625, 0.453857421875, 0.61175537109375, 0.7696533203125, 0.92755126953125, 1.08544921875, 1.24334716796875, 1.4012451171875, 1.55914306640625, 1.717041015625, 1.87493896484375, 2.0328369140625, 2.19073486328125, 2.3486328125, 2.50653076171875, 2.6644287109375, 2.82232666015625, 2.980224609375, 3.13812255859375, 3.2960205078125, 3.45391845703125, 3.61181640625, 3.76971435546875, 3.9276123046875, 4.08551025390625, 4.243408203125, 4.40130615234375, 4.5592041015625, 4.71710205078125, 4.875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 11.0, 3.0, 5.0, 6.0, 13.0, 10.0, 20.0, 15.0, 17.0, 22.0, 25.0, 38.0, 30.0, 38.0, 33.0, 35.0, 47.0, 52.0, 76.0, 222.0, 1708.0, 160.0, 65.0, 38.0, 37.0, 47.0, 36.0, 34.0, 34.0, 24.0, 28.0, 26.0, 20.0, 15.0, 13.0, 20.0, 4.0, 7.0, 4.0, 8.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-27.734375, -26.991455078125, -26.24853515625, -25.505615234375, -24.7626953125, -24.019775390625, -23.27685546875, -22.533935546875, -21.791015625, -21.048095703125, -20.30517578125, -19.562255859375, -18.8193359375, -18.076416015625, -17.33349609375, -16.590576171875, -15.84765625, -15.104736328125, -14.36181640625, -13.618896484375, -12.8759765625, -12.133056640625, -11.39013671875, -10.647216796875, -9.904296875, -9.161376953125, -8.41845703125, -7.675537109375, -6.9326171875, -6.189697265625, -5.44677734375, -4.703857421875, -3.9609375, -3.218017578125, -2.47509765625, -1.732177734375, -0.9892578125, -0.246337890625, 0.49658203125, 1.239501953125, 1.982421875, 2.725341796875, 3.46826171875, 4.211181640625, 4.9541015625, 5.697021484375, 6.43994140625, 7.182861328125, 7.92578125, 8.668701171875, 9.41162109375, 10.154541015625, 10.8974609375, 11.640380859375, 12.38330078125, 13.126220703125, 13.869140625, 14.612060546875, 15.35498046875, 16.097900390625, 16.8408203125, 17.583740234375, 18.32666015625, 19.069580078125, 19.8125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 9.0, 6.0, 8.0, 14.0, 19.0, 21.0, 39.0, 35.0, 37.0, 54.0, 90.0, 136.0, 211.0, 309.0, 880.0, 7277.0, 2919289.0, 212619.0, 3169.0, 592.0, 271.0, 181.0, 115.0, 71.0, 66.0, 46.0, 25.0, 29.0, 21.0, 17.0, 13.0, 7.0, 4.0, 10.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.375, -45.7880859375, -44.201171875, -42.6142578125, -41.02734375, -39.4404296875, -37.853515625, -36.2666015625, -34.6796875, -33.0927734375, -31.505859375, -29.9189453125, -28.33203125, -26.7451171875, -25.158203125, -23.5712890625, -21.984375, -20.3974609375, -18.810546875, -17.2236328125, -15.63671875, -14.0498046875, -12.462890625, -10.8759765625, -9.2890625, -7.7021484375, -6.115234375, -4.5283203125, -2.94140625, -1.3544921875, 0.232421875, 1.8193359375, 3.40625, 4.9931640625, 6.580078125, 8.1669921875, 9.75390625, 11.3408203125, 12.927734375, 14.5146484375, 16.1015625, 17.6884765625, 19.275390625, 20.8623046875, 22.44921875, 24.0361328125, 25.623046875, 27.2099609375, 28.796875, 30.3837890625, 31.970703125, 33.5576171875, 35.14453125, 36.7314453125, 38.318359375, 39.9052734375, 41.4921875, 43.0791015625, 44.666015625, 46.2529296875, 47.83984375, 49.4267578125, 51.013671875, 52.6005859375, 54.1875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 111.0, 324.0, 400.0, 127.0, 30.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.56564712524414, -19.198305130004883, -16.830963134765625, -14.463619232177734, -12.096277236938477, -9.728935241699219, -7.3615922927856445, -4.99424934387207, -2.6269073486328125, -0.2595648765563965, 2.1077775955200195, 4.4751200675964355, 6.842462539672852, 9.20980453491211, 11.577147483825684, 13.944490432739258, 16.311832427978516, 18.679174423217773, 21.04651641845703, 23.413860321044922, 25.78120231628418, 28.148544311523438, 30.515888214111328, 32.88323211669922, 35.250572204589844, 37.617916107177734, 39.98525619506836, 42.35260009765625, 44.719940185546875, 47.087284088134766, 49.454627990722656, 51.82196807861328, 54.18931579589844, 56.55665969848633, 58.92399978637695, 61.291343688964844, 63.65868377685547, 66.02603149414062, 68.39337158203125, 70.76071166992188, 73.1280517578125, 75.49539184570312, 77.86273956298828, 80.2300796508789, 82.59741973876953, 84.96476745605469, 87.33210754394531, 89.69944763183594, 92.0667953491211, 94.43413543701172, 96.80148315429688, 99.1688232421875, 101.53616333007812, 103.90350341796875, 106.2708511352539, 108.63819122314453, 111.00553894042969, 113.37287902832031, 115.74022674560547, 118.1075668334961, 120.47490692138672, 122.84225463867188, 125.2095947265625, 127.57693481445312, 129.94427490234375]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 3.0, 5.0, 5.0, 6.0, 7.0, 17.0, 21.0, 20.0, 19.0, 28.0, 18.0, 34.0, 25.0, 27.0, 35.0, 35.0, 28.0, 37.0, 49.0, 44.0, 41.0, 32.0, 34.0, 39.0, 34.0, 36.0, 31.0, 32.0, 35.0, 31.0, 28.0, 25.0, 19.0, 11.0, 24.0, 14.0, 8.0, 9.0, 8.0, 11.0, 11.0, 7.0, 2.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0], "bins": [-73.367431640625, -71.26718139648438, -69.16693115234375, -67.06668090820312, -64.9664306640625, -62.866180419921875, -60.765933990478516, -58.66568374633789, -56.565433502197266, -54.46518325805664, -52.364933013916016, -50.26468276977539, -48.16443634033203, -46.064186096191406, -43.96393585205078, -41.863685607910156, -39.76343536376953, -37.663185119628906, -35.56293487548828, -33.462684631347656, -31.362436294555664, -29.26218605041504, -27.161937713623047, -25.061687469482422, -22.961437225341797, -20.861186981201172, -18.760936737060547, -16.660688400268555, -14.56043815612793, -12.460187911987305, -10.359938621520996, -8.259689331054688, -6.159431457519531, -4.0591816902160645, -1.9589319229125977, 0.14131784439086914, 2.241567611694336, 4.341817855834961, 6.4420671463012695, 8.542316436767578, 10.642566680908203, 12.742816925048828, 14.843066215515137, 16.943315505981445, 19.04356575012207, 21.143815994262695, 23.244064331054688, 25.344314575195312, 27.444564819335938, 29.544815063476562, 31.645065307617188, 33.74531555175781, 35.84556579589844, 37.94581604003906, 40.04606246948242, 42.14631271362305, 44.24656295776367, 46.3468132019043, 48.44706344604492, 50.54731369018555, 52.647560119628906, 54.74781036376953, 56.848060607910156, 58.94831085205078, 61.048561096191406]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 7.0, 8.0, 14.0, 9.0, 20.0, 13.0, 10.0, 20.0, 12.0, 28.0, 28.0, 33.0, 30.0, 31.0, 32.0, 38.0, 33.0, 41.0, 32.0, 41.0, 54.0, 37.0, 34.0, 41.0, 36.0, 32.0, 29.0, 30.0, 28.0, 35.0, 21.0, 17.0, 23.0, 16.0, 14.0, 16.0, 9.0, 10.0, 8.0, 9.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0], "bins": [-6.7421875, -6.54388427734375, -6.3455810546875, -6.14727783203125, -5.948974609375, -5.75067138671875, -5.5523681640625, -5.35406494140625, -5.15576171875, -4.95745849609375, -4.7591552734375, -4.56085205078125, -4.362548828125, -4.16424560546875, -3.9659423828125, -3.76763916015625, -3.5693359375, -3.37103271484375, -3.1727294921875, -2.97442626953125, -2.776123046875, -2.57781982421875, -2.3795166015625, -2.18121337890625, -1.98291015625, -1.78460693359375, -1.5863037109375, -1.38800048828125, -1.189697265625, -0.99139404296875, -0.7930908203125, -0.59478759765625, -0.396484375, -0.19818115234375, 0.0001220703125, 0.19842529296875, 0.396728515625, 0.59503173828125, 0.7933349609375, 0.99163818359375, 1.18994140625, 1.38824462890625, 1.5865478515625, 1.78485107421875, 1.983154296875, 2.18145751953125, 2.3797607421875, 2.57806396484375, 2.7763671875, 2.97467041015625, 3.1729736328125, 3.37127685546875, 3.569580078125, 3.76788330078125, 3.9661865234375, 4.16448974609375, 4.36279296875, 4.56109619140625, 4.7593994140625, 4.95770263671875, 5.156005859375, 5.35430908203125, 5.5526123046875, 5.75091552734375, 5.94921875]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 6.0, 1.0, 4.0, 12.0, 17.0, 18.0, 22.0, 39.0, 55.0, 72.0, 100.0, 145.0, 258.0, 425.0, 739.0, 1381.0, 2491.0, 5022.0, 10919.0, 27431.0, 81999.0, 297956.0, 943012.0, 1503351.0, 904241.0, 289908.0, 77680.0, 26095.0, 10496.0, 4789.0, 2444.0, 1284.0, 709.0, 446.0, 245.0, 144.0, 90.0, 64.0, 38.0, 46.0, 30.0, 21.0, 13.0, 12.0, 6.0, 4.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.83526611328125, -7.6080322265625, -7.38079833984375, -7.153564453125, -6.92633056640625, -6.6990966796875, -6.47186279296875, -6.24462890625, -6.01739501953125, -5.7901611328125, -5.56292724609375, -5.335693359375, -5.10845947265625, -4.8812255859375, -4.65399169921875, -4.4267578125, -4.19952392578125, -3.9722900390625, -3.74505615234375, -3.517822265625, -3.29058837890625, -3.0633544921875, -2.83612060546875, -2.60888671875, -2.38165283203125, -2.1544189453125, -1.92718505859375, -1.699951171875, -1.47271728515625, -1.2454833984375, -1.01824951171875, -0.791015625, -0.56378173828125, -0.3365478515625, -0.10931396484375, 0.117919921875, 0.34515380859375, 0.5723876953125, 0.79962158203125, 1.02685546875, 1.25408935546875, 1.4813232421875, 1.70855712890625, 1.935791015625, 2.16302490234375, 2.3902587890625, 2.61749267578125, 2.8447265625, 3.07196044921875, 3.2991943359375, 3.52642822265625, 3.753662109375, 3.98089599609375, 4.2081298828125, 4.43536376953125, 4.66259765625, 4.88983154296875, 5.1170654296875, 5.34429931640625, 5.571533203125, 5.79876708984375, 6.0260009765625, 6.25323486328125, 6.48046875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 4.0, 2.0, 5.0, 11.0, 17.0, 17.0, 25.0, 41.0, 43.0, 50.0, 54.0, 82.0, 78.0, 122.0, 146.0, 209.0, 253.0, 281.0, 379.0, 396.0, 364.0, 312.0, 267.0, 202.0, 160.0, 118.0, 87.0, 75.0, 41.0, 61.0, 39.0, 31.0, 26.0, 21.0, 14.0, 6.0, 6.0, 12.0, 3.0, 2.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.015625, -14.5924072265625, -14.169189453125, -13.7459716796875, -13.32275390625, -12.8995361328125, -12.476318359375, -12.0531005859375, -11.6298828125, -11.2066650390625, -10.783447265625, -10.3602294921875, -9.93701171875, -9.5137939453125, -9.090576171875, -8.6673583984375, -8.244140625, -7.8209228515625, -7.397705078125, -6.9744873046875, -6.55126953125, -6.1280517578125, -5.704833984375, -5.2816162109375, -4.8583984375, -4.4351806640625, -4.011962890625, -3.5887451171875, -3.16552734375, -2.7423095703125, -2.319091796875, -1.8958740234375, -1.47265625, -1.0494384765625, -0.626220703125, -0.2030029296875, 0.22021484375, 0.6434326171875, 1.066650390625, 1.4898681640625, 1.9130859375, 2.3363037109375, 2.759521484375, 3.1827392578125, 3.60595703125, 4.0291748046875, 4.452392578125, 4.8756103515625, 5.298828125, 5.7220458984375, 6.145263671875, 6.5684814453125, 6.99169921875, 7.4149169921875, 7.838134765625, 8.2613525390625, 8.6845703125, 9.1077880859375, 9.531005859375, 9.9542236328125, 10.37744140625, 10.8006591796875, 11.223876953125, 11.6470947265625, 12.0703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 9.0, 13.0, 11.0, 29.0, 29.0, 32.0, 49.0, 66.0, 101.0, 138.0, 211.0, 388.0, 1128.0, 23521.0, 4022601.0, 142538.0, 2150.0, 490.0, 262.0, 154.0, 101.0, 52.0, 49.0, 46.0, 33.0, 20.0, 16.0, 13.0, 9.0, 10.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.34375, -56.06982421875, -53.7958984375, -51.52197265625, -49.248046875, -46.97412109375, -44.7001953125, -42.42626953125, -40.15234375, -37.87841796875, -35.6044921875, -33.33056640625, -31.056640625, -28.78271484375, -26.5087890625, -24.23486328125, -21.9609375, -19.68701171875, -17.4130859375, -15.13916015625, -12.865234375, -10.59130859375, -8.3173828125, -6.04345703125, -3.76953125, -1.49560546875, 0.7783203125, 3.05224609375, 5.326171875, 7.60009765625, 9.8740234375, 12.14794921875, 14.421875, 16.69580078125, 18.9697265625, 21.24365234375, 23.517578125, 25.79150390625, 28.0654296875, 30.33935546875, 32.61328125, 34.88720703125, 37.1611328125, 39.43505859375, 41.708984375, 43.98291015625, 46.2568359375, 48.53076171875, 50.8046875, 53.07861328125, 55.3525390625, 57.62646484375, 59.900390625, 62.17431640625, 64.4482421875, 66.72216796875, 68.99609375, 71.27001953125, 73.5439453125, 75.81787109375, 78.091796875, 80.36572265625, 82.6396484375, 84.91357421875, 87.1875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 19.0, 30.0, 66.0, 103.0, 140.0, 195.0, 163.0, 125.0, 83.0, 47.0, 17.0, 11.0, 3.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-136.95057678222656, -133.8875274658203, -130.824462890625, -127.76141357421875, -124.69835662841797, -121.63529968261719, -118.5722427368164, -115.50918579101562, -112.44612884521484, -109.38307189941406, -106.32001495361328, -103.2569580078125, -100.19390869140625, -97.13085174560547, -94.06779479980469, -91.0047378540039, -87.94168090820312, -84.87862396240234, -81.81556701660156, -78.75251770019531, -75.68946075439453, -72.62640380859375, -69.56334686279297, -66.50028991699219, -63.43724060058594, -60.374183654785156, -57.31113052368164, -54.24807357788086, -51.18501663208008, -48.12196350097656, -45.05890655517578, -41.995849609375, -38.932796478271484, -35.8697395324707, -32.80668640136719, -29.743629455566406, -26.680572509765625, -23.617517471313477, -20.554462432861328, -17.491405487060547, -14.428350448608398, -11.365294456481934, -8.302238464355469, -5.23918342590332, -2.1761274337768555, 0.8869285583496094, 3.949983596801758, 7.013040542602539, 10.076095581054688, 13.139151573181152, 16.202207565307617, 19.265262603759766, 22.328319549560547, 25.391374588012695, 28.454429626464844, 31.517486572265625, 34.580543518066406, 37.64360046386719, 40.7066535949707, 43.769710540771484, 46.832767486572266, 49.89582061767578, 52.95887756347656, 56.021934509277344, 59.08498764038086]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 8.0, 5.0, 12.0, 8.0, 12.0, 17.0, 17.0, 14.0, 14.0, 19.0, 32.0, 25.0, 27.0, 21.0, 29.0, 30.0, 30.0, 32.0, 42.0, 40.0, 33.0, 38.0, 35.0, 42.0, 42.0, 37.0, 29.0, 32.0, 29.0, 31.0, 25.0, 16.0, 21.0, 15.0, 18.0, 19.0, 14.0, 15.0, 5.0, 11.0, 12.0, 14.0, 2.0, 5.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0], "bins": [-51.87261962890625, -50.37895202636719, -48.88528823852539, -47.391624450683594, -45.89795684814453, -44.40428924560547, -42.91062545776367, -41.416961669921875, -39.92329406738281, -38.42962646484375, -36.93596267700195, -35.442298889160156, -33.948631286621094, -32.45496368408203, -30.961299896240234, -29.467634201049805, -27.973968505859375, -26.480302810668945, -24.986637115478516, -23.492971420288086, -21.999305725097656, -20.505640029907227, -19.011974334716797, -17.518308639526367, -16.024642944335938, -14.530977249145508, -13.037311553955078, -11.543645858764648, -10.049980163574219, -8.556314468383789, -7.062648773193359, -5.56898307800293, -4.0753173828125, -2.5816516876220703, -1.0879859924316406, 0.40567970275878906, 1.8993453979492188, 3.3930110931396484, 4.886676788330078, 6.380342483520508, 7.8740081787109375, 9.367673873901367, 10.861339569091797, 12.355005264282227, 13.848670959472656, 15.342336654663086, 16.836002349853516, 18.329668045043945, 19.823333740234375, 21.316999435424805, 22.810665130615234, 24.304330825805664, 25.797996520996094, 27.291662216186523, 28.785327911376953, 30.278993606567383, 31.772659301757812, 33.266326904296875, 34.75999069213867, 36.25365447998047, 37.74732208251953, 39.240989685058594, 40.73465347290039, 42.22831726074219, 43.72198486328125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 15.0, 12.0, 13.0, 11.0, 11.0, 16.0, 19.0, 27.0, 33.0, 30.0, 39.0, 29.0, 32.0, 37.0, 49.0, 36.0, 32.0, 28.0, 39.0, 47.0, 37.0, 36.0, 35.0, 40.0, 33.0, 35.0, 29.0, 22.0, 19.0, 27.0, 18.0, 17.0, 14.0, 9.0, 12.0, 12.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.70703125, -6.5042724609375, -6.301513671875, -6.0987548828125, -5.89599609375, -5.6932373046875, -5.490478515625, -5.2877197265625, -5.0849609375, -4.8822021484375, -4.679443359375, -4.4766845703125, -4.27392578125, -4.0711669921875, -3.868408203125, -3.6656494140625, -3.462890625, -3.2601318359375, -3.057373046875, -2.8546142578125, -2.65185546875, -2.4490966796875, -2.246337890625, -2.0435791015625, -1.8408203125, -1.6380615234375, -1.435302734375, -1.2325439453125, -1.02978515625, -0.8270263671875, -0.624267578125, -0.4215087890625, -0.21875, -0.0159912109375, 0.186767578125, 0.3895263671875, 0.59228515625, 0.7950439453125, 0.997802734375, 1.2005615234375, 1.4033203125, 1.6060791015625, 1.808837890625, 2.0115966796875, 2.21435546875, 2.4171142578125, 2.619873046875, 2.8226318359375, 3.025390625, 3.2281494140625, 3.430908203125, 3.6336669921875, 3.83642578125, 4.0391845703125, 4.241943359375, 4.4447021484375, 4.6474609375, 4.8502197265625, 5.052978515625, 5.2557373046875, 5.45849609375, 5.6612548828125, 5.864013671875, 6.0667724609375, 6.26953125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 11.0, 4.0, 20.0, 40.0, 37.0, 48.0, 77.0, 101.0, 153.0, 233.0, 341.0, 466.0, 654.0, 1014.0, 1497.0, 2048.0, 3012.0, 4218.0, 6172.0, 8682.0, 12628.0, 17771.0, 26541.0, 38487.0, 56806.0, 83962.0, 124107.0, 173788.0, 155264.0, 104948.0, 71257.0, 47931.0, 33047.0, 22203.0, 15215.0, 10780.0, 7659.0, 5198.0, 3748.0, 2582.0, 1738.0, 1191.0, 855.0, 616.0, 447.0, 328.0, 188.0, 148.0, 110.0, 75.0, 39.0, 29.0, 20.0, 7.0, 8.0, 8.0, 5.0, 3.0, 4.0], "bins": [-0.80078125, -0.7763595581054688, -0.7519378662109375, -0.7275161743164062, -0.703094482421875, -0.6786727905273438, -0.6542510986328125, -0.6298294067382812, -0.60540771484375, -0.5809860229492188, -0.5565643310546875, -0.5321426391601562, -0.507720947265625, -0.48329925537109375, -0.4588775634765625, -0.43445587158203125, -0.4100341796875, -0.38561248779296875, -0.3611907958984375, -0.33676910400390625, -0.312347412109375, -0.28792572021484375, -0.2635040283203125, -0.23908233642578125, -0.21466064453125, -0.19023895263671875, -0.1658172607421875, -0.14139556884765625, -0.116973876953125, -0.09255218505859375, -0.0681304931640625, -0.04370880126953125, -0.019287109375, 0.00513458251953125, 0.0295562744140625, 0.05397796630859375, 0.078399658203125, 0.10282135009765625, 0.1272430419921875, 0.15166473388671875, 0.17608642578125, 0.20050811767578125, 0.2249298095703125, 0.24935150146484375, 0.273773193359375, 0.29819488525390625, 0.3226165771484375, 0.34703826904296875, 0.3714599609375, 0.39588165283203125, 0.4203033447265625, 0.44472503662109375, 0.469146728515625, 0.49356842041015625, 0.5179901123046875, 0.5424118041992188, 0.56683349609375, 0.5912551879882812, 0.6156768798828125, 0.6400985717773438, 0.664520263671875, 0.6889419555664062, 0.7133636474609375, 0.7377853393554688, 0.76220703125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 4.0, 5.0, 6.0, 8.0, 5.0, 9.0, 14.0, 11.0, 13.0, 16.0, 15.0, 18.0, 20.0, 33.0, 32.0, 30.0, 33.0, 44.0, 35.0, 31.0, 39.0, 30.0, 1067.0, 44.0, 43.0, 40.0, 42.0, 32.0, 28.0, 29.0, 29.0, 29.0, 29.0, 22.0, 27.0, 24.0, 18.0, 11.0, 12.0, 10.0, 10.0, 11.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.21875, -4.09466552734375, -3.9705810546875, -3.84649658203125, -3.722412109375, -3.59832763671875, -3.4742431640625, -3.35015869140625, -3.22607421875, -3.10198974609375, -2.9779052734375, -2.85382080078125, -2.729736328125, -2.60565185546875, -2.4815673828125, -2.35748291015625, -2.2333984375, -2.10931396484375, -1.9852294921875, -1.86114501953125, -1.737060546875, -1.61297607421875, -1.4888916015625, -1.36480712890625, -1.24072265625, -1.11663818359375, -0.9925537109375, -0.86846923828125, -0.744384765625, -0.62030029296875, -0.4962158203125, -0.37213134765625, -0.248046875, -0.12396240234375, 0.0001220703125, 0.12420654296875, 0.248291015625, 0.37237548828125, 0.4964599609375, 0.62054443359375, 0.74462890625, 0.86871337890625, 0.9927978515625, 1.11688232421875, 1.240966796875, 1.36505126953125, 1.4891357421875, 1.61322021484375, 1.7373046875, 1.86138916015625, 1.9854736328125, 2.10955810546875, 2.233642578125, 2.35772705078125, 2.4818115234375, 2.60589599609375, 2.72998046875, 2.85406494140625, 2.9781494140625, 3.10223388671875, 3.226318359375, 3.35040283203125, 3.4744873046875, 3.59857177734375, 3.72265625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 2.0, 11.0, 13.0, 18.0, 31.0, 29.0, 43.0, 67.0, 120.0, 159.0, 289.0, 413.0, 707.0, 987.0, 1595.0, 2362.0, 3672.0, 6031.0, 9601.0, 15319.0, 24954.0, 40471.0, 66298.0, 107691.0, 173559.0, 1263729.0, 144575.0, 89822.0, 55249.0, 34149.0, 20543.0, 12711.0, 7922.0, 5064.0, 3121.0, 2055.0, 1247.0, 884.0, 574.0, 372.0, 204.0, 156.0, 114.0, 71.0, 52.0, 25.0, 20.0, 14.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.8642578125, -0.8375091552734375, -0.810760498046875, -0.7840118408203125, -0.75726318359375, -0.7305145263671875, -0.703765869140625, -0.6770172119140625, -0.6502685546875, -0.6235198974609375, -0.596771240234375, -0.5700225830078125, -0.54327392578125, -0.5165252685546875, -0.489776611328125, -0.4630279541015625, -0.436279296875, -0.4095306396484375, -0.382781982421875, -0.3560333251953125, -0.32928466796875, -0.3025360107421875, -0.275787353515625, -0.2490386962890625, -0.2222900390625, -0.1955413818359375, -0.168792724609375, -0.1420440673828125, -0.11529541015625, -0.0885467529296875, -0.061798095703125, -0.0350494384765625, -0.00830078125, 0.0184478759765625, 0.045196533203125, 0.0719451904296875, 0.09869384765625, 0.1254425048828125, 0.152191162109375, 0.1789398193359375, 0.2056884765625, 0.2324371337890625, 0.259185791015625, 0.2859344482421875, 0.31268310546875, 0.3394317626953125, 0.366180419921875, 0.3929290771484375, 0.419677734375, 0.4464263916015625, 0.473175048828125, 0.4999237060546875, 0.52667236328125, 0.5534210205078125, 0.580169677734375, 0.6069183349609375, 0.6336669921875, 0.6604156494140625, 0.687164306640625, 0.7139129638671875, 0.74066162109375, 0.7674102783203125, 0.794158935546875, 0.8209075927734375, 0.84765625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 6.0, 8.0, 11.0, 14.0, 7.0, 10.0, 16.0, 18.0, 19.0, 30.0, 34.0, 41.0, 38.0, 49.0, 50.0, 45.0, 58.0, 53.0, 55.0, 41.0, 32.0, 50.0, 51.0, 33.0, 32.0, 33.0, 27.0, 16.0, 30.0, 20.0, 14.0, 15.0, 12.0, 5.0, 3.0, 3.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015764236450195312, -0.0015301108360290527, -0.0014837980270385742, -0.0014374852180480957, -0.0013911724090576172, -0.0013448596000671387, -0.0012985467910766602, -0.0012522339820861816, -0.0012059211730957031, -0.0011596083641052246, -0.001113295555114746, -0.0010669827461242676, -0.001020669937133789, -0.0009743571281433105, -0.000928044319152832, -0.0008817315101623535, -0.000835418701171875, -0.0007891058921813965, -0.000742793083190918, -0.0006964802742004395, -0.0006501674652099609, -0.0006038546562194824, -0.0005575418472290039, -0.0005112290382385254, -0.0004649162292480469, -0.00041860342025756836, -0.00037229061126708984, -0.00032597780227661133, -0.0002796649932861328, -0.0002333521842956543, -0.00018703937530517578, -0.00014072656631469727, -9.441375732421875e-05, -4.8100948333740234e-05, -1.7881393432617188e-06, 4.45246696472168e-05, 9.083747863769531e-05, 0.00013715028762817383, 0.00018346309661865234, 0.00022977590560913086, 0.0002760887145996094, 0.0003224015235900879, 0.0003687143325805664, 0.0004150271415710449, 0.00046133995056152344, 0.000507652759552002, 0.0005539655685424805, 0.000600278377532959, 0.0006465911865234375, 0.000692903995513916, 0.0007392168045043945, 0.000785529613494873, 0.0008318424224853516, 0.0008781552314758301, 0.0009244680404663086, 0.0009707808494567871, 0.0010170936584472656, 0.0010634064674377441, 0.0011097192764282227, 0.0011560320854187012, 0.0012023448944091797, 0.0012486577033996582, 0.0012949705123901367, 0.0013412833213806152, 0.0013875961303710938]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 6.0, 2.0, 8.0, 2.0, 11.0, 6.0, 5.0, 12.0, 20.0, 25.0, 18.0, 22.0, 24.0, 46.0, 55.0, 74.0, 139.0, 258.0, 485.0, 1601.0, 974583.0, 69334.0, 835.0, 370.0, 201.0, 121.0, 71.0, 45.0, 39.0, 23.0, 23.0, 23.0, 11.0, 11.0, 9.0, 9.0, 9.0, 4.0, 4.0, 6.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033905029296875, -0.03272819519042969, -0.031551361083984375, -0.030374526977539062, -0.02919769287109375, -0.028020858764648438, -0.026844024658203125, -0.025667190551757812, -0.0244903564453125, -0.023313522338867188, -0.022136688232421875, -0.020959854125976562, -0.01978302001953125, -0.018606185913085938, -0.017429351806640625, -0.016252517700195312, -0.01507568359375, -0.013898849487304688, -0.012722015380859375, -0.011545181274414062, -0.01036834716796875, -0.009191513061523438, -0.008014678955078125, -0.0068378448486328125, -0.0056610107421875, -0.0044841766357421875, -0.003307342529296875, -0.0021305084228515625, -0.00095367431640625, 0.0002231597900390625, 0.001399993896484375, 0.0025768280029296875, 0.003753662109375, 0.0049304962158203125, 0.006107330322265625, 0.0072841644287109375, 0.00846099853515625, 0.009637832641601562, 0.010814666748046875, 0.011991500854492188, 0.0131683349609375, 0.014345169067382812, 0.015522003173828125, 0.016698837280273438, 0.01787567138671875, 0.019052505493164062, 0.020229339599609375, 0.021406173706054688, 0.0225830078125, 0.023759841918945312, 0.024936676025390625, 0.026113510131835938, 0.02729034423828125, 0.028467178344726562, 0.029644012451171875, 0.030820846557617188, 0.0319976806640625, 0.03317451477050781, 0.034351348876953125, 0.03552818298339844, 0.03670501708984375, 0.03788185119628906, 0.039058685302734375, 0.04023551940917969, 0.041412353515625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 21.0, 145.0, 488.0, 298.0, 55.0, 8.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024785022251307964, -0.0023590559139847755, -0.0022396096028387547, -0.0021201632916927338, -0.002000716980546713, -0.001881270669400692, -0.001761824358254671, -0.0016423780471086502, -0.0015229317359626293, -0.0014034854248166084, -0.0012840391136705875, -0.0011645928025245667, -0.0010451464913785458, -0.0009257001802325249, -0.000806253869086504, -0.0006868075579404831, -0.0005673612467944622, -0.0004479149356484413, -0.0003284686245024204, -0.00020902231335639954, -8.957600221037865e-05, 2.9870308935642242e-05, 0.00014931662008166313, 0.000268762931227684, 0.0003882092423737049, 0.0005076555535197258, 0.0006271018646657467, 0.0007465481758117676, 0.0008659944869577885, 0.0009854407981038094, 0.0011048871092498302, 0.0012243334203958511, 0.001343779731541872, 0.001463226042687893, 0.0015826723538339138, 0.0017021186649799347, 0.0018215649761259556, 0.0019410112872719765, 0.0020604575984179974, 0.0021799039095640182, 0.002299350220710039, 0.00241879653185606, 0.002538242843002081, 0.002657689154148102, 0.0027771354652941227, 0.0028965817764401436, 0.0030160280875861645, 0.0031354743987321854, 0.0032549207098782063, 0.003374367021024227, 0.003493813332170248, 0.003613259643316269, 0.00373270595446229, 0.0038521522656083107, 0.003971598576754332, 0.0040910448879003525, 0.004210491199046373, 0.004329937510192394, 0.004449383821338415, 0.004568830132484436, 0.004688276443630457, 0.004807722754776478, 0.004927169065922499, 0.00504661537706852, 0.0051660616882145405]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 8.0, 5.0, 13.0, 11.0, 14.0, 19.0, 18.0, 16.0, 23.0, 26.0, 18.0, 25.0, 33.0, 30.0, 27.0, 39.0, 26.0, 34.0, 34.0, 32.0, 45.0, 36.0, 46.0, 33.0, 35.0, 33.0, 26.0, 32.0, 23.0, 25.0, 26.0, 26.0, 21.0, 20.0, 14.0, 10.0, 14.0, 9.0, 12.0, 6.0, 9.0, 3.0, 10.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.0006586909294128418, -0.0006370516493916512, -0.0006154123693704605, -0.0005937730893492699, -0.0005721338093280792, -0.0005504945293068886, -0.0005288552492856979, -0.0005072159692645073, -0.00048557668924331665, -0.000463937409222126, -0.00044229812920093536, -0.0004206588491797447, -0.0003990195691585541, -0.00037738028913736343, -0.0003557410091161728, -0.00033410172909498215, -0.0003124624490737915, -0.00029082316905260086, -0.0002691838890314102, -0.0002475446090102196, -0.00022590532898902893, -0.0002042660489678383, -0.00018262676894664764, -0.000160987488925457, -0.00013934820890426636, -0.00011770892888307571, -9.606964886188507e-05, -7.443036884069443e-05, -5.2791088819503784e-05, -3.115180879831314e-05, -9.512528777122498e-06, 1.2126751244068146e-05, 3.376603126525879e-05, 5.540531128644943e-05, 7.704459130764008e-05, 9.868387132883072e-05, 0.00012032315135002136, 0.000141962431371212, 0.00016360171139240265, 0.0001852409914135933, 0.00020688027143478394, 0.00022851955145597458, 0.0002501588314771652, 0.00027179811149835587, 0.0002934373915195465, 0.00031507667154073715, 0.0003367159515619278, 0.00035835523158311844, 0.0003799945116043091, 0.0004016337916254997, 0.00042327307164669037, 0.000444912351667881, 0.00046655163168907166, 0.0004881909117102623, 0.0005098301917314529, 0.0005314694717526436, 0.0005531087517738342, 0.0005747480317950249, 0.0005963873118162155, 0.0006180265918374062, 0.0006396658718585968, 0.0006613051518797874, 0.0006829444319009781, 0.0007045837119221687, 0.0007262229919433594]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 6.0, 8.0, 15.0, 12.0, 13.0, 11.0, 11.0, 16.0, 19.0, 27.0, 33.0, 30.0, 39.0, 29.0, 32.0, 37.0, 49.0, 36.0, 32.0, 28.0, 39.0, 47.0, 37.0, 36.0, 35.0, 40.0, 33.0, 35.0, 29.0, 22.0, 19.0, 27.0, 18.0, 17.0, 14.0, 9.0, 12.0, 12.0, 7.0, 7.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.70703125, -6.5042724609375, -6.301513671875, -6.0987548828125, -5.89599609375, -5.6932373046875, -5.490478515625, -5.2877197265625, -5.0849609375, -4.8822021484375, -4.679443359375, -4.4766845703125, -4.27392578125, -4.0711669921875, -3.868408203125, -3.6656494140625, -3.462890625, -3.2601318359375, -3.057373046875, -2.8546142578125, -2.65185546875, -2.4490966796875, -2.246337890625, -2.0435791015625, -1.8408203125, -1.6380615234375, -1.435302734375, -1.2325439453125, -1.02978515625, -0.8270263671875, -0.624267578125, -0.4215087890625, -0.21875, -0.0159912109375, 0.186767578125, 0.3895263671875, 0.59228515625, 0.7950439453125, 0.997802734375, 1.2005615234375, 1.4033203125, 1.6060791015625, 1.808837890625, 2.0115966796875, 2.21435546875, 2.4171142578125, 2.619873046875, 2.8226318359375, 3.025390625, 3.2281494140625, 3.430908203125, 3.6336669921875, 3.83642578125, 4.0391845703125, 4.241943359375, 4.4447021484375, 4.6474609375, 4.8502197265625, 5.052978515625, 5.2557373046875, 5.45849609375, 5.6612548828125, 5.864013671875, 6.0667724609375, 6.26953125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 2.0, 8.0, 2.0, 15.0, 8.0, 28.0, 27.0, 36.0, 47.0, 62.0, 105.0, 158.0, 262.0, 386.0, 556.0, 848.0, 1326.0, 2264.0, 4325.0, 8776.0, 20464.0, 54509.0, 180705.0, 461629.0, 207498.0, 61177.0, 22498.0, 9685.0, 4663.0, 2459.0, 1408.0, 871.0, 571.0, 388.0, 229.0, 180.0, 104.0, 83.0, 52.0, 36.0, 28.0, 23.0, 11.0, 10.0, 9.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.66015625, -4.50762939453125, -4.3551025390625, -4.20257568359375, -4.050048828125, -3.89752197265625, -3.7449951171875, -3.59246826171875, -3.43994140625, -3.28741455078125, -3.1348876953125, -2.98236083984375, -2.829833984375, -2.67730712890625, -2.5247802734375, -2.37225341796875, -2.2197265625, -2.06719970703125, -1.9146728515625, -1.76214599609375, -1.609619140625, -1.45709228515625, -1.3045654296875, -1.15203857421875, -0.99951171875, -0.84698486328125, -0.6944580078125, -0.54193115234375, -0.389404296875, -0.23687744140625, -0.0843505859375, 0.06817626953125, 0.220703125, 0.37322998046875, 0.5257568359375, 0.67828369140625, 0.830810546875, 0.98333740234375, 1.1358642578125, 1.28839111328125, 1.44091796875, 1.59344482421875, 1.7459716796875, 1.89849853515625, 2.051025390625, 2.20355224609375, 2.3560791015625, 2.50860595703125, 2.6611328125, 2.81365966796875, 2.9661865234375, 3.11871337890625, 3.271240234375, 3.42376708984375, 3.5762939453125, 3.72882080078125, 3.88134765625, 4.03387451171875, 4.1864013671875, 4.33892822265625, 4.491455078125, 4.64398193359375, 4.7965087890625, 4.94903564453125, 5.1015625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 3.0, 5.0, 5.0, 3.0, 5.0, 5.0, 5.0, 9.0, 20.0, 22.0, 20.0, 18.0, 23.0, 34.0, 31.0, 47.0, 42.0, 43.0, 57.0, 69.0, 175.0, 1774.0, 157.0, 70.0, 65.0, 48.0, 45.0, 31.0, 40.0, 22.0, 32.0, 21.0, 20.0, 16.0, 14.0, 11.0, 11.0, 11.0, 5.0, 5.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.375, -25.562744140625, -24.75048828125, -23.938232421875, -23.1259765625, -22.313720703125, -21.50146484375, -20.689208984375, -19.876953125, -19.064697265625, -18.25244140625, -17.440185546875, -16.6279296875, -15.815673828125, -15.00341796875, -14.191162109375, -13.37890625, -12.566650390625, -11.75439453125, -10.942138671875, -10.1298828125, -9.317626953125, -8.50537109375, -7.693115234375, -6.880859375, -6.068603515625, -5.25634765625, -4.444091796875, -3.6318359375, -2.819580078125, -2.00732421875, -1.195068359375, -0.3828125, 0.429443359375, 1.24169921875, 2.053955078125, 2.8662109375, 3.678466796875, 4.49072265625, 5.302978515625, 6.115234375, 6.927490234375, 7.73974609375, 8.552001953125, 9.3642578125, 10.176513671875, 10.98876953125, 11.801025390625, 12.61328125, 13.425537109375, 14.23779296875, 15.050048828125, 15.8623046875, 16.674560546875, 17.48681640625, 18.299072265625, 19.111328125, 19.923583984375, 20.73583984375, 21.548095703125, 22.3603515625, 23.172607421875, 23.98486328125, 24.797119140625, 25.609375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 6.0, 7.0, 12.0, 9.0, 14.0, 16.0, 16.0, 33.0, 23.0, 49.0, 47.0, 77.0, 92.0, 151.0, 173.0, 278.0, 569.0, 3793.0, 2950023.0, 187259.0, 1693.0, 448.0, 249.0, 190.0, 110.0, 73.0, 79.0, 40.0, 36.0, 31.0, 29.0, 20.0, 13.0, 9.0, 5.0, 10.0, 5.0, 7.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.15625, -49.49853515625, -47.8408203125, -46.18310546875, -44.525390625, -42.86767578125, -41.2099609375, -39.55224609375, -37.89453125, -36.23681640625, -34.5791015625, -32.92138671875, -31.263671875, -29.60595703125, -27.9482421875, -26.29052734375, -24.6328125, -22.97509765625, -21.3173828125, -19.65966796875, -18.001953125, -16.34423828125, -14.6865234375, -13.02880859375, -11.37109375, -9.71337890625, -8.0556640625, -6.39794921875, -4.740234375, -3.08251953125, -1.4248046875, 0.23291015625, 1.890625, 3.54833984375, 5.2060546875, 6.86376953125, 8.521484375, 10.17919921875, 11.8369140625, 13.49462890625, 15.15234375, 16.81005859375, 18.4677734375, 20.12548828125, 21.783203125, 23.44091796875, 25.0986328125, 26.75634765625, 28.4140625, 30.07177734375, 31.7294921875, 33.38720703125, 35.044921875, 36.70263671875, 38.3603515625, 40.01806640625, 41.67578125, 43.33349609375, 44.9912109375, 46.64892578125, 48.306640625, 49.96435546875, 51.6220703125, 53.27978515625, 54.9375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [344.0, 666.0, 6.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9185028076171875, -0.8384151458740234, 5.241672515869141, 11.321760177612305, 17.40184783935547, 23.481935501098633, 29.562023162841797, 35.642112731933594, 41.722198486328125, 47.802284240722656, 53.88237380981445, 59.96246337890625, 66.04254913330078, 72.12263488769531, 78.20272827148438, 84.2828140258789, 90.36289978027344, 96.44298553466797, 102.5230712890625, 108.60316467285156, 114.6832504272461, 120.76333618164062, 126.84342956542969, 132.92352294921875, 139.00360107421875, 145.0836944580078, 151.1637725830078, 157.24386596679688, 163.32394409179688, 169.40403747558594, 175.484130859375, 181.564208984375, 187.64431762695312, 193.7244110107422, 199.8044891357422, 205.88458251953125, 211.96466064453125, 218.0447540283203, 224.12484741210938, 230.20492553710938, 236.28501892089844, 242.3651123046875, 248.4451904296875, 254.52528381347656, 260.6053771972656, 266.6854553222656, 272.7655334472656, 278.84564208984375, 284.92572021484375, 291.00579833984375, 297.0859069824219, 303.1659851074219, 309.2460632324219, 315.326171875, 321.40625, 327.486328125, 333.56640625, 339.646484375, 345.7265930175781, 351.8066711425781, 357.8867492675781, 363.96685791015625, 370.04693603515625, 376.12701416015625, 382.2071228027344]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 14.0, 5.0, 10.0, 11.0, 8.0, 8.0, 12.0, 13.0, 16.0, 21.0, 32.0, 35.0, 20.0, 27.0, 35.0, 24.0, 34.0, 24.0, 39.0, 39.0, 40.0, 33.0, 33.0, 36.0, 34.0, 38.0, 35.0, 30.0, 34.0, 31.0, 39.0, 19.0, 22.0, 19.0, 18.0, 17.0, 20.0, 9.0, 13.0, 9.0, 8.0, 6.0, 1.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 3.0], "bins": [-59.544830322265625, -57.8148307800293, -56.08483123779297, -54.35483169555664, -52.62483215332031, -50.894832611083984, -49.164833068847656, -47.43482971191406, -45.704833984375, -43.97483444213867, -42.244834899902344, -40.514835357666016, -38.78483581542969, -37.05483627319336, -35.32483673095703, -33.59483337402344, -31.86483383178711, -30.13483428955078, -28.404834747314453, -26.674835205078125, -24.944835662841797, -23.21483612060547, -21.484834671020508, -19.75483512878418, -18.02483558654785, -16.294836044311523, -14.564836502075195, -12.83483600616455, -11.104836463928223, -9.374836921691895, -7.64483642578125, -5.914836883544922, -4.184833526611328, -2.454833745956421, -0.7248339653015137, 1.0051660537719727, 2.735165596008301, 4.465165138244629, 6.195165634155273, 7.925165176391602, 9.65516471862793, 11.385164260864258, 13.115163803100586, 14.84516429901123, 16.575164794921875, 18.305164337158203, 20.03516387939453, 21.76516342163086, 23.495162963867188, 25.225162506103516, 26.955162048339844, 28.685161590576172, 30.4151611328125, 32.14516067504883, 33.875160217285156, 35.60516357421875, 37.33515930175781, 39.06515884399414, 40.79515838623047, 42.5251579284668, 44.255157470703125, 45.98515701293945, 47.71515655517578, 49.445159912109375, 51.1751594543457]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 3.0, 14.0, 9.0, 10.0, 14.0, 15.0, 12.0, 19.0, 19.0, 22.0, 37.0, 34.0, 26.0, 23.0, 58.0, 37.0, 38.0, 36.0, 36.0, 42.0, 28.0, 43.0, 44.0, 32.0, 41.0, 30.0, 36.0, 27.0, 29.0, 24.0, 21.0, 28.0, 15.0, 19.0, 13.0, 9.0, 13.0, 6.0, 8.0, 11.0, 2.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.0390625, -6.831298828125, -6.62353515625, -6.415771484375, -6.2080078125, -6.000244140625, -5.79248046875, -5.584716796875, -5.376953125, -5.169189453125, -4.96142578125, -4.753662109375, -4.5458984375, -4.338134765625, -4.13037109375, -3.922607421875, -3.71484375, -3.507080078125, -3.29931640625, -3.091552734375, -2.8837890625, -2.676025390625, -2.46826171875, -2.260498046875, -2.052734375, -1.844970703125, -1.63720703125, -1.429443359375, -1.2216796875, -1.013916015625, -0.80615234375, -0.598388671875, -0.390625, -0.182861328125, 0.02490234375, 0.232666015625, 0.4404296875, 0.648193359375, 0.85595703125, 1.063720703125, 1.271484375, 1.479248046875, 1.68701171875, 1.894775390625, 2.1025390625, 2.310302734375, 2.51806640625, 2.725830078125, 2.93359375, 3.141357421875, 3.34912109375, 3.556884765625, 3.7646484375, 3.972412109375, 4.18017578125, 4.387939453125, 4.595703125, 4.803466796875, 5.01123046875, 5.218994140625, 5.4267578125, 5.634521484375, 5.84228515625, 6.050048828125, 6.2578125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 4.0, 8.0, 14.0, 13.0, 15.0, 23.0, 8.0, 14.0, 29.0, 36.0, 20.0, 41.0, 56.0, 61.0, 102.0, 139.0, 493.0, 4409.0, 328102.0, 3801132.0, 56746.0, 1938.0, 327.0, 124.0, 70.0, 58.0, 57.0, 37.0, 25.0, 26.0, 31.0, 20.0, 12.0, 15.0, 13.0, 13.0, 8.0, 11.0, 3.0, 7.0, 3.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-40.4375, -39.29345703125, -38.1494140625, -37.00537109375, -35.861328125, -34.71728515625, -33.5732421875, -32.42919921875, -31.28515625, -30.14111328125, -28.9970703125, -27.85302734375, -26.708984375, -25.56494140625, -24.4208984375, -23.27685546875, -22.1328125, -20.98876953125, -19.8447265625, -18.70068359375, -17.556640625, -16.41259765625, -15.2685546875, -14.12451171875, -12.98046875, -11.83642578125, -10.6923828125, -9.54833984375, -8.404296875, -7.26025390625, -6.1162109375, -4.97216796875, -3.828125, -2.68408203125, -1.5400390625, -0.39599609375, 0.748046875, 1.89208984375, 3.0361328125, 4.18017578125, 5.32421875, 6.46826171875, 7.6123046875, 8.75634765625, 9.900390625, 11.04443359375, 12.1884765625, 13.33251953125, 14.4765625, 15.62060546875, 16.7646484375, 17.90869140625, 19.052734375, 20.19677734375, 21.3408203125, 22.48486328125, 23.62890625, 24.77294921875, 25.9169921875, 27.06103515625, 28.205078125, 29.34912109375, 30.4931640625, 31.63720703125, 32.78125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 4.0, 7.0, 12.0, 14.0, 12.0, 20.0, 30.0, 48.0, 49.0, 60.0, 88.0, 113.0, 179.0, 225.0, 290.0, 397.0, 413.0, 427.0, 390.0, 331.0, 245.0, 214.0, 131.0, 99.0, 78.0, 46.0, 29.0, 31.0, 21.0, 17.0, 15.0, 12.0, 9.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.59375, -11.13134765625, -10.6689453125, -10.20654296875, -9.744140625, -9.28173828125, -8.8193359375, -8.35693359375, -7.89453125, -7.43212890625, -6.9697265625, -6.50732421875, -6.044921875, -5.58251953125, -5.1201171875, -4.65771484375, -4.1953125, -3.73291015625, -3.2705078125, -2.80810546875, -2.345703125, -1.88330078125, -1.4208984375, -0.95849609375, -0.49609375, -0.03369140625, 0.4287109375, 0.89111328125, 1.353515625, 1.81591796875, 2.2783203125, 2.74072265625, 3.203125, 3.66552734375, 4.1279296875, 4.59033203125, 5.052734375, 5.51513671875, 5.9775390625, 6.43994140625, 6.90234375, 7.36474609375, 7.8271484375, 8.28955078125, 8.751953125, 9.21435546875, 9.6767578125, 10.13916015625, 10.6015625, 11.06396484375, 11.5263671875, 11.98876953125, 12.451171875, 12.91357421875, 13.3759765625, 13.83837890625, 14.30078125, 14.76318359375, 15.2255859375, 15.68798828125, 16.150390625, 16.61279296875, 17.0751953125, 17.53759765625, 18.0]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 5.0, 11.0, 6.0, 18.0, 22.0, 26.0, 32.0, 43.0, 68.0, 80.0, 87.0, 151.0, 203.0, 304.0, 528.0, 1497.0, 43787.0, 4030168.0, 113346.0, 2149.0, 614.0, 340.0, 206.0, 134.0, 105.0, 75.0, 75.0, 42.0, 28.0, 29.0, 25.0, 13.0, 15.0, 11.0, 4.0, 6.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-55.78125, -53.75927734375, -51.7373046875, -49.71533203125, -47.693359375, -45.67138671875, -43.6494140625, -41.62744140625, -39.60546875, -37.58349609375, -35.5615234375, -33.53955078125, -31.517578125, -29.49560546875, -27.4736328125, -25.45166015625, -23.4296875, -21.40771484375, -19.3857421875, -17.36376953125, -15.341796875, -13.31982421875, -11.2978515625, -9.27587890625, -7.25390625, -5.23193359375, -3.2099609375, -1.18798828125, 0.833984375, 2.85595703125, 4.8779296875, 6.89990234375, 8.921875, 10.94384765625, 12.9658203125, 14.98779296875, 17.009765625, 19.03173828125, 21.0537109375, 23.07568359375, 25.09765625, 27.11962890625, 29.1416015625, 31.16357421875, 33.185546875, 35.20751953125, 37.2294921875, 39.25146484375, 41.2734375, 43.29541015625, 45.3173828125, 47.33935546875, 49.361328125, 51.38330078125, 53.4052734375, 55.42724609375, 57.44921875, 59.47119140625, 61.4931640625, 63.51513671875, 65.537109375, 67.55908203125, 69.5810546875, 71.60302734375, 73.625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 50.0, 146.0, 259.0, 297.0, 161.0, 70.0, 18.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-262.4325866699219, -257.2919006347656, -252.15122985839844, -247.01055908203125, -241.869873046875, -236.72918701171875, -231.58851623535156, -226.44784545898438, -221.30715942382812, -216.16647338867188, -211.0258026123047, -205.8851318359375, -200.74444580078125, -195.603759765625, -190.4630889892578, -185.32241821289062, -180.18173217773438, -175.04104614257812, -169.90037536621094, -164.75970458984375, -159.6190185546875, -154.47833251953125, -149.33766174316406, -144.19699096679688, -139.05630493164062, -133.91561889648438, -128.7749481201172, -123.63426971435547, -118.49359130859375, -113.35291290283203, -108.21223449707031, -103.0715560913086, -97.9308853149414, -92.79020690917969, -87.64952850341797, -82.50885009765625, -77.36817169189453, -72.22749328613281, -67.0868148803711, -61.946136474609375, -56.805458068847656, -51.66477966308594, -46.52410125732422, -41.3834228515625, -36.24274444580078, -31.102066040039062, -25.961387634277344, -20.820709228515625, -15.680030822753906, -10.539352416992188, -5.398674011230469, -0.25799560546875, 4.882682800292969, 10.023361206054688, 15.164039611816406, 20.304718017578125, 25.445396423339844, 30.586074829101562, 35.72675323486328, 40.867431640625, 46.00811004638672, 51.14878845214844, 56.289466857910156, 61.430145263671875, 66.5708236694336]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 5.0, 6.0, 9.0, 11.0, 12.0, 15.0, 11.0, 18.0, 15.0, 26.0, 17.0, 18.0, 23.0, 23.0, 29.0, 40.0, 41.0, 29.0, 49.0, 34.0, 36.0, 35.0, 39.0, 34.0, 26.0, 41.0, 39.0, 35.0, 32.0, 24.0, 26.0, 25.0, 25.0, 21.0, 16.0, 23.0, 19.0, 12.0, 16.0, 5.0, 7.0, 12.0, 5.0, 5.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-43.546993255615234, -42.135963439941406, -40.724937438964844, -39.313907623291016, -37.90287780761719, -36.49184799194336, -35.08081817626953, -33.66979217529297, -32.25876235961914, -30.847732543945312, -29.436704635620117, -28.025676727294922, -26.614646911621094, -25.203617095947266, -23.79258918762207, -22.381561279296875, -20.970531463623047, -19.55950164794922, -18.148473739624023, -16.737445831298828, -15.326416015625, -13.915387153625488, -12.504358291625977, -11.093329429626465, -9.682300567626953, -8.271271705627441, -6.86024284362793, -5.449213981628418, -4.038185119628906, -2.6271562576293945, -1.2161273956298828, 0.1949014663696289, 1.605926513671875, 3.0169553756713867, 4.427984237670898, 5.83901309967041, 7.250041961669922, 8.661070823669434, 10.072099685668945, 11.483128547668457, 12.894157409667969, 14.30518627166748, 15.716215133666992, 17.127243041992188, 18.538272857666016, 19.949302673339844, 21.36033058166504, 22.771358489990234, 24.182388305664062, 25.59341812133789, 27.004446029663086, 28.41547393798828, 29.82650375366211, 31.237533569335938, 32.6485595703125, 34.05958938598633, 35.470619201660156, 36.881649017333984, 38.29267883300781, 39.703704833984375, 41.1147346496582, 42.52576446533203, 43.936790466308594, 45.34782028198242, 46.75885009765625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 11.0, 7.0, 7.0, 13.0, 9.0, 9.0, 16.0, 17.0, 21.0, 25.0, 21.0, 28.0, 33.0, 27.0, 33.0, 38.0, 39.0, 35.0, 44.0, 28.0, 33.0, 35.0, 40.0, 34.0, 31.0, 33.0, 34.0, 30.0, 29.0, 18.0, 28.0, 24.0, 25.0, 21.0, 16.0, 19.0, 15.0, 14.0, 16.0, 3.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.26171875, -6.06634521484375, -5.8709716796875, -5.67559814453125, -5.480224609375, -5.28485107421875, -5.0894775390625, -4.89410400390625, -4.69873046875, -4.50335693359375, -4.3079833984375, -4.11260986328125, -3.917236328125, -3.72186279296875, -3.5264892578125, -3.33111572265625, -3.1357421875, -2.94036865234375, -2.7449951171875, -2.54962158203125, -2.354248046875, -2.15887451171875, -1.9635009765625, -1.76812744140625, -1.57275390625, -1.37738037109375, -1.1820068359375, -0.98663330078125, -0.791259765625, -0.59588623046875, -0.4005126953125, -0.20513916015625, -0.009765625, 0.18560791015625, 0.3809814453125, 0.57635498046875, 0.771728515625, 0.96710205078125, 1.1624755859375, 1.35784912109375, 1.55322265625, 1.74859619140625, 1.9439697265625, 2.13934326171875, 2.334716796875, 2.53009033203125, 2.7254638671875, 2.92083740234375, 3.1162109375, 3.31158447265625, 3.5069580078125, 3.70233154296875, 3.897705078125, 4.09307861328125, 4.2884521484375, 4.48382568359375, 4.67919921875, 4.87457275390625, 5.0699462890625, 5.26531982421875, 5.460693359375, 5.65606689453125, 5.8514404296875, 6.04681396484375, 6.2421875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 16.0, 21.0, 25.0, 34.0, 71.0, 86.0, 158.0, 234.0, 265.0, 438.0, 621.0, 952.0, 1322.0, 2068.0, 2981.0, 4435.0, 6624.0, 9956.0, 14815.0, 22238.0, 34247.0, 52210.0, 80934.0, 125483.0, 186072.0, 173130.0, 114869.0, 73524.0, 47701.0, 31196.0, 20445.0, 13579.0, 8929.0, 6116.0, 4165.0, 2720.0, 1880.0, 1231.0, 883.0, 612.0, 419.0, 275.0, 187.0, 134.0, 84.0, 68.0, 32.0, 30.0, 14.0, 11.0, 5.0, 3.0, 6.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.87939453125, -0.8509292602539062, -0.8224639892578125, -0.7939987182617188, -0.765533447265625, -0.7370681762695312, -0.7086029052734375, -0.6801376342773438, -0.65167236328125, -0.6232070922851562, -0.5947418212890625, -0.5662765502929688, -0.537811279296875, -0.5093460083007812, -0.4808807373046875, -0.45241546630859375, -0.4239501953125, -0.39548492431640625, -0.3670196533203125, -0.33855438232421875, -0.310089111328125, -0.28162384033203125, -0.2531585693359375, -0.22469329833984375, -0.19622802734375, -0.16776275634765625, -0.1392974853515625, -0.11083221435546875, -0.082366943359375, -0.05390167236328125, -0.0254364013671875, 0.00302886962890625, 0.031494140625, 0.05995941162109375, 0.0884246826171875, 0.11688995361328125, 0.145355224609375, 0.17382049560546875, 0.2022857666015625, 0.23075103759765625, 0.25921630859375, 0.28768157958984375, 0.3161468505859375, 0.34461212158203125, 0.373077392578125, 0.40154266357421875, 0.4300079345703125, 0.45847320556640625, 0.4869384765625, 0.5154037475585938, 0.5438690185546875, 0.5723342895507812, 0.600799560546875, 0.6292648315429688, 0.6577301025390625, 0.6861953735351562, 0.71466064453125, 0.7431259155273438, 0.7715911865234375, 0.8000564575195312, 0.828521728515625, 0.8569869995117188, 0.8854522705078125, 0.9139175415039062, 0.9423828125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 7.0, 10.0, 8.0, 13.0, 12.0, 12.0, 14.0, 22.0, 21.0, 28.0, 29.0, 30.0, 21.0, 34.0, 32.0, 39.0, 46.0, 44.0, 45.0, 1055.0, 49.0, 51.0, 39.0, 45.0, 36.0, 36.0, 36.0, 32.0, 31.0, 20.0, 19.0, 19.0, 16.0, 15.0, 10.0, 10.0, 9.0, 6.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.5625, -4.41912841796875, -4.2757568359375, -4.13238525390625, -3.989013671875, -3.84564208984375, -3.7022705078125, -3.55889892578125, -3.41552734375, -3.27215576171875, -3.1287841796875, -2.98541259765625, -2.842041015625, -2.69866943359375, -2.5552978515625, -2.41192626953125, -2.2685546875, -2.12518310546875, -1.9818115234375, -1.83843994140625, -1.695068359375, -1.55169677734375, -1.4083251953125, -1.26495361328125, -1.12158203125, -0.97821044921875, -0.8348388671875, -0.69146728515625, -0.548095703125, -0.40472412109375, -0.2613525390625, -0.11798095703125, 0.025390625, 0.16876220703125, 0.3121337890625, 0.45550537109375, 0.598876953125, 0.74224853515625, 0.8856201171875, 1.02899169921875, 1.17236328125, 1.31573486328125, 1.4591064453125, 1.60247802734375, 1.745849609375, 1.88922119140625, 2.0325927734375, 2.17596435546875, 2.3193359375, 2.46270751953125, 2.6060791015625, 2.74945068359375, 2.892822265625, 3.03619384765625, 3.1795654296875, 3.32293701171875, 3.46630859375, 3.60968017578125, 3.7530517578125, 3.89642333984375, 4.039794921875, 4.18316650390625, 4.3265380859375, 4.46990966796875, 4.61328125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 16.0, 17.0, 22.0, 41.0, 44.0, 73.0, 112.0, 197.0, 272.0, 383.0, 587.0, 954.0, 1421.0, 2154.0, 3202.0, 5005.0, 7637.0, 11823.0, 18295.0, 28566.0, 45317.0, 71421.0, 113664.0, 182420.0, 1248983.0, 130481.0, 81607.0, 51209.0, 32301.0, 20482.0, 13379.0, 8519.0, 5644.0, 3660.0, 2477.0, 1594.0, 1040.0, 727.0, 480.0, 286.0, 233.0, 110.0, 94.0, 68.0, 39.0, 29.0, 19.0, 11.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.8896484375, -0.861968994140625, -0.83428955078125, -0.806610107421875, -0.7789306640625, -0.751251220703125, -0.72357177734375, -0.695892333984375, -0.668212890625, -0.640533447265625, -0.61285400390625, -0.585174560546875, -0.5574951171875, -0.529815673828125, -0.50213623046875, -0.474456787109375, -0.44677734375, -0.419097900390625, -0.39141845703125, -0.363739013671875, -0.3360595703125, -0.308380126953125, -0.28070068359375, -0.253021240234375, -0.225341796875, -0.197662353515625, -0.16998291015625, -0.142303466796875, -0.1146240234375, -0.086944580078125, -0.05926513671875, -0.031585693359375, -0.00390625, 0.023773193359375, 0.05145263671875, 0.079132080078125, 0.1068115234375, 0.134490966796875, 0.16217041015625, 0.189849853515625, 0.217529296875, 0.245208740234375, 0.27288818359375, 0.300567626953125, 0.3282470703125, 0.355926513671875, 0.38360595703125, 0.411285400390625, 0.43896484375, 0.466644287109375, 0.49432373046875, 0.522003173828125, 0.5496826171875, 0.577362060546875, 0.60504150390625, 0.632720947265625, 0.660400390625, 0.688079833984375, 0.71575927734375, 0.743438720703125, 0.7711181640625, 0.798797607421875, 0.82647705078125, 0.854156494140625, 0.8818359375]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 6.0, 16.0, 10.0, 10.0, 23.0, 24.0, 24.0, 30.0, 39.0, 38.0, 41.0, 54.0, 56.0, 68.0, 70.0, 67.0, 42.0, 59.0, 55.0, 41.0, 45.0, 32.0, 29.0, 18.0, 17.0, 24.0, 11.0, 8.0, 8.0, 12.0, 7.0, 6.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00154876708984375, -0.0014983564615249634, -0.0014479458332061768, -0.0013975352048873901, -0.0013471245765686035, -0.001296713948249817, -0.0012463033199310303, -0.0011958926916122437, -0.001145482063293457, -0.0010950714349746704, -0.0010446608066558838, -0.0009942501783370972, -0.0009438395500183105, -0.0008934289216995239, -0.0008430182933807373, -0.0007926076650619507, -0.0007421970367431641, -0.0006917864084243774, -0.0006413757801055908, -0.0005909651517868042, -0.0005405545234680176, -0.000490143895149231, -0.00043973326683044434, -0.0003893226385116577, -0.0003389120101928711, -0.00028850138187408447, -0.00023809075355529785, -0.00018768012523651123, -0.0001372694969177246, -8.685886859893799e-05, -3.644824028015137e-05, 1.3962388038635254e-05, 6.437301635742188e-05, 0.0001147836446762085, 0.00016519427299499512, 0.00021560490131378174, 0.00026601552963256836, 0.000316426157951355, 0.0003668367862701416, 0.0004172474145889282, 0.00046765804290771484, 0.0005180686712265015, 0.0005684792995452881, 0.0006188899278640747, 0.0006693005561828613, 0.000719711184501648, 0.0007701218128204346, 0.0008205324411392212, 0.0008709430694580078, 0.0009213536977767944, 0.0009717643260955811, 0.0010221749544143677, 0.0010725855827331543, 0.001122996211051941, 0.0011734068393707275, 0.0012238174676895142, 0.0012742280960083008, 0.0013246387243270874, 0.001375049352645874, 0.0014254599809646606, 0.0014758706092834473, 0.0015262812376022339, 0.0015766918659210205, 0.0016271024942398071, 0.0016775131225585938]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 9.0, 11.0, 8.0, 14.0, 20.0, 15.0, 22.0, 37.0, 44.0, 59.0, 87.0, 126.0, 208.0, 517.0, 2968.0, 1025286.0, 17589.0, 743.0, 291.0, 153.0, 95.0, 60.0, 47.0, 33.0, 28.0, 23.0, 15.0, 11.0, 6.0, 6.0, 1.0, 8.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039093017578125, -0.03789567947387695, -0.036698341369628906, -0.03550100326538086, -0.03430366516113281, -0.033106327056884766, -0.03190898895263672, -0.030711650848388672, -0.029514312744140625, -0.028316974639892578, -0.02711963653564453, -0.025922298431396484, -0.024724960327148438, -0.02352762222290039, -0.022330284118652344, -0.021132946014404297, -0.01993560791015625, -0.018738269805908203, -0.017540931701660156, -0.01634359359741211, -0.015146255493164062, -0.013948917388916016, -0.012751579284667969, -0.011554241180419922, -0.010356903076171875, -0.009159564971923828, -0.007962226867675781, -0.006764888763427734, -0.0055675506591796875, -0.004370212554931641, -0.0031728744506835938, -0.001975536346435547, -0.0007781982421875, 0.0004191398620605469, 0.0016164779663085938, 0.0028138160705566406, 0.0040111541748046875, 0.005208492279052734, 0.006405830383300781, 0.007603168487548828, 0.008800506591796875, 0.009997844696044922, 0.011195182800292969, 0.012392520904541016, 0.013589859008789062, 0.01478719711303711, 0.015984535217285156, 0.017181873321533203, 0.01837921142578125, 0.019576549530029297, 0.020773887634277344, 0.02197122573852539, 0.023168563842773438, 0.024365901947021484, 0.02556324005126953, 0.026760578155517578, 0.027957916259765625, 0.029155254364013672, 0.03035259246826172, 0.031549930572509766, 0.03274726867675781, 0.03394460678100586, 0.035141944885253906, 0.03633928298950195, 0.03753662109375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 16.0, 42.0, 106.0, 184.0, 210.0, 199.0, 127.0, 69.0, 29.0, 17.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0020032308530062437, -0.0019485864322632551, -0.0018939421279355884, -0.0018392977071925998, -0.0017846532864496112, -0.0017300089821219444, -0.0016753645613789558, -0.0016207201406359673, -0.0015660757198929787, -0.00151143129914999, -0.0014567869948223233, -0.0014021425740793347, -0.0013474981533363461, -0.0012928538490086794, -0.0012382094282656908, -0.0011835650075227022, -0.0011289207031950355, -0.0010742762824520469, -0.0010196319781243801, -0.0009649875573813915, -0.0009103431366384029, -0.0008556987741030753, -0.0008010544115677476, -0.000746409990824759, -0.0006917656282894313, -0.0006371212657541037, -0.0005824768450111151, -0.0005278324824757874, -0.00047318809083662927, -0.00041854369919747114, -0.00036389933666214347, -0.00030925494502298534, -0.0002546104369685054, -0.00019996604532934725, -0.00014532166824210435, -9.067729115486145e-05, -3.603289951570332e-05, 1.861149212345481e-05, 7.325585465878248e-05, 0.0001279002462979406, 0.00018254463793709874, 0.00023718902957625687, 0.000291833421215415, 0.0003464777837507427, 0.0004011221753899008, 0.00045576656702905893, 0.0005104109295643866, 0.0005650552920997143, 0.0006196997128427029, 0.0006743440753780305, 0.0007289884961210191, 0.0007836328586563468, 0.0008382772793993354, 0.0008929216419346631, 0.0009475660044699907, 0.0010022104252129793, 0.001056854845955968, 0.0011114992666989565, 0.0011661435710266232, 0.0012207879917696118, 0.0012754324125126004, 0.0013300767168402672, 0.0013847211375832558, 0.0014393655583262444, 0.0014940098626539111]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 6.0, 1.0, 3.0, 9.0, 4.0, 6.0, 13.0, 14.0, 22.0, 11.0, 18.0, 26.0, 23.0, 32.0, 28.0, 29.0, 29.0, 42.0, 32.0, 34.0, 37.0, 41.0, 41.0, 43.0, 40.0, 40.0, 35.0, 32.0, 28.0, 32.0, 29.0, 28.0, 26.0, 31.0, 19.0, 14.0, 13.0, 19.0, 18.0, 11.0, 13.0, 9.0, 7.0, 4.0, 1.0, 6.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.0007635951042175293, -0.0007400056347250938, -0.0007164161652326584, -0.0006928266957402229, -0.0006692372262477875, -0.000645647756755352, -0.0006220582872629166, -0.0005984688177704811, -0.0005748793482780457, -0.0005512898787856102, -0.0005277004092931747, -0.0005041109398007393, -0.00048052147030830383, -0.0004569320008158684, -0.0004333425313234329, -0.00040975306183099747, -0.000386163592338562, -0.00036257412284612656, -0.0003389846533536911, -0.00031539518386125565, -0.0002918057143688202, -0.00026821624487638474, -0.0002446267753839493, -0.00022103730589151382, -0.00019744783639907837, -0.00017385836690664291, -0.00015026889741420746, -0.000126679427921772, -0.00010308995842933655, -7.950048893690109e-05, -5.591101944446564e-05, -3.232154995203018e-05, -8.732080459594727e-06, 1.4857389032840729e-05, 3.8446858525276184e-05, 6.203632801771164e-05, 8.56257975101471e-05, 0.00010921526700258255, 0.000132804736495018, 0.00015639420598745346, 0.00017998367547988892, 0.00020357314497232437, 0.00022716261446475983, 0.0002507520839571953, 0.00027434155344963074, 0.0002979310229420662, 0.00032152049243450165, 0.0003451099619269371, 0.00036869943141937256, 0.000392288900911808, 0.00041587837040424347, 0.0004394678398966789, 0.0004630573093891144, 0.00048664677888154984, 0.0005102362483739853, 0.0005338257178664207, 0.0005574151873588562, 0.0005810046568512917, 0.0006045941263437271, 0.0006281835958361626, 0.000651773065328598, 0.0006753625348210335, 0.0006989520043134689, 0.0007225414738059044, 0.0007461309432983398]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 11.0, 7.0, 7.0, 13.0, 9.0, 9.0, 15.0, 18.0, 21.0, 25.0, 21.0, 28.0, 32.0, 28.0, 33.0, 37.0, 39.0, 34.0, 46.0, 28.0, 32.0, 36.0, 39.0, 34.0, 32.0, 32.0, 34.0, 31.0, 29.0, 17.0, 29.0, 24.0, 23.0, 23.0, 16.0, 18.0, 16.0, 13.0, 17.0, 3.0, 6.0, 5.0, 5.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 2.0], "bins": [-6.26171875, -6.06640625, -5.87109375, -5.67578125, -5.48046875, -5.28515625, -5.08984375, -4.89453125, -4.69921875, -4.50390625, -4.30859375, -4.11328125, -3.91796875, -3.72265625, -3.52734375, -3.33203125, -3.13671875, -2.94140625, -2.74609375, -2.55078125, -2.35546875, -2.16015625, -1.96484375, -1.76953125, -1.57421875, -1.37890625, -1.18359375, -0.98828125, -0.79296875, -0.59765625, -0.40234375, -0.20703125, -0.01171875, 0.18359375, 0.37890625, 0.57421875, 0.76953125, 0.96484375, 1.16015625, 1.35546875, 1.55078125, 1.74609375, 1.94140625, 2.13671875, 2.33203125, 2.52734375, 2.72265625, 2.91796875, 3.11328125, 3.30859375, 3.50390625, 3.69921875, 3.89453125, 4.08984375, 4.28515625, 4.48046875, 4.67578125, 4.87109375, 5.06640625, 5.26171875, 5.45703125, 5.65234375, 5.84765625, 6.04296875, 6.23828125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 5.0, 2.0, 7.0, 11.0, 17.0, 25.0, 35.0, 52.0, 80.0, 113.0, 178.0, 248.0, 381.0, 577.0, 864.0, 1256.0, 1840.0, 2951.0, 4765.0, 7662.0, 12692.0, 22361.0, 43130.0, 93370.0, 236044.0, 347861.0, 139205.0, 60609.0, 29932.0, 16184.0, 9658.0, 5766.0, 3681.0, 2399.0, 1565.0, 1006.0, 654.0, 417.0, 297.0, 191.0, 145.0, 95.0, 65.0, 46.0, 37.0, 23.0, 20.0, 10.0, 7.0, 8.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.3828125, -3.281005859375, -3.17919921875, -3.077392578125, -2.9755859375, -2.873779296875, -2.77197265625, -2.670166015625, -2.568359375, -2.466552734375, -2.36474609375, -2.262939453125, -2.1611328125, -2.059326171875, -1.95751953125, -1.855712890625, -1.75390625, -1.652099609375, -1.55029296875, -1.448486328125, -1.3466796875, -1.244873046875, -1.14306640625, -1.041259765625, -0.939453125, -0.837646484375, -0.73583984375, -0.634033203125, -0.5322265625, -0.430419921875, -0.32861328125, -0.226806640625, -0.125, -0.023193359375, 0.07861328125, 0.180419921875, 0.2822265625, 0.384033203125, 0.48583984375, 0.587646484375, 0.689453125, 0.791259765625, 0.89306640625, 0.994873046875, 1.0966796875, 1.198486328125, 1.30029296875, 1.402099609375, 1.50390625, 1.605712890625, 1.70751953125, 1.809326171875, 1.9111328125, 2.012939453125, 2.11474609375, 2.216552734375, 2.318359375, 2.420166015625, 2.52197265625, 2.623779296875, 2.7255859375, 2.827392578125, 2.92919921875, 3.031005859375, 3.1328125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 6.0, 7.0, 15.0, 14.0, 10.0, 8.0, 20.0, 15.0, 23.0, 27.0, 39.0, 53.0, 46.0, 33.0, 44.0, 62.0, 149.0, 1739.0, 219.0, 72.0, 53.0, 52.0, 42.0, 43.0, 24.0, 34.0, 30.0, 21.0, 28.0, 27.0, 13.0, 13.0, 9.0, 15.0, 9.0, 8.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.328125, -21.51904296875, -20.7099609375, -19.90087890625, -19.091796875, -18.28271484375, -17.4736328125, -16.66455078125, -15.85546875, -15.04638671875, -14.2373046875, -13.42822265625, -12.619140625, -11.81005859375, -11.0009765625, -10.19189453125, -9.3828125, -8.57373046875, -7.7646484375, -6.95556640625, -6.146484375, -5.33740234375, -4.5283203125, -3.71923828125, -2.91015625, -2.10107421875, -1.2919921875, -0.48291015625, 0.326171875, 1.13525390625, 1.9443359375, 2.75341796875, 3.5625, 4.37158203125, 5.1806640625, 5.98974609375, 6.798828125, 7.60791015625, 8.4169921875, 9.22607421875, 10.03515625, 10.84423828125, 11.6533203125, 12.46240234375, 13.271484375, 14.08056640625, 14.8896484375, 15.69873046875, 16.5078125, 17.31689453125, 18.1259765625, 18.93505859375, 19.744140625, 20.55322265625, 21.3623046875, 22.17138671875, 22.98046875, 23.78955078125, 24.5986328125, 25.40771484375, 26.216796875, 27.02587890625, 27.8349609375, 28.64404296875, 29.453125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 5.0, 8.0, 6.0, 9.0, 16.0, 35.0, 23.0, 34.0, 58.0, 55.0, 88.0, 116.0, 182.0, 354.0, 681.0, 4077.0, 3034288.0, 102925.0, 1499.0, 464.0, 260.0, 180.0, 109.0, 60.0, 39.0, 20.0, 29.0, 25.0, 17.0, 11.0, 12.0, 7.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-78.5625, -76.484375, -74.40625, -72.328125, -70.25, -68.171875, -66.09375, -64.015625, -61.9375, -59.859375, -57.78125, -55.703125, -53.625, -51.546875, -49.46875, -47.390625, -45.3125, -43.234375, -41.15625, -39.078125, -37.0, -34.921875, -32.84375, -30.765625, -28.6875, -26.609375, -24.53125, -22.453125, -20.375, -18.296875, -16.21875, -14.140625, -12.0625, -9.984375, -7.90625, -5.828125, -3.75, -1.671875, 0.40625, 2.484375, 4.5625, 6.640625, 8.71875, 10.796875, 12.875, 14.953125, 17.03125, 19.109375, 21.1875, 23.265625, 25.34375, 27.421875, 29.5, 31.578125, 33.65625, 35.734375, 37.8125, 39.890625, 41.96875, 44.046875, 46.125, 48.203125, 50.28125, 52.359375, 54.4375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 8.0, 13.0, 33.0, 93.0, 176.0, 213.0, 219.0, 140.0, 76.0, 27.0, 7.0, 3.0, 1.0, 1.0, 2.0], "bins": [-77.00790405273438, -75.60250854492188, -74.1971206665039, -72.79173278808594, -71.38633728027344, -69.98094177246094, -68.57555389404297, -67.170166015625, -65.7647705078125, -64.359375, -62.95398712158203, -61.5485954284668, -60.14320373535156, -58.73781204223633, -57.332420349121094, -55.92702865600586, -54.521636962890625, -53.11624526977539, -51.710853576660156, -50.30546188354492, -48.90007019042969, -47.49467849731445, -46.08928680419922, -44.683895111083984, -43.27850341796875, -41.873111724853516, -40.46772003173828, -39.06232833862305, -37.65693664550781, -36.25154495239258, -34.846153259277344, -33.44076156616211, -32.035369873046875, -30.62997817993164, -29.224586486816406, -27.819194793701172, -26.413803100585938, -25.008411407470703, -23.60301971435547, -22.197628021240234, -20.792236328125, -19.386844635009766, -17.98145294189453, -16.576061248779297, -15.170669555664062, -13.765277862548828, -12.359886169433594, -10.95449447631836, -9.549103736877441, -8.143712043762207, -6.738320350646973, -5.332928657531738, -3.927536964416504, -2.5221452713012695, -1.1167535781860352, 0.2886381149291992, 1.6940298080444336, 3.099421501159668, 4.504813194274902, 5.910204887390137, 7.315596580505371, 8.720988273620605, 10.12637996673584, 11.531771659851074, 12.937163352966309]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 4.0, 2.0, 7.0, 7.0, 9.0, 7.0, 13.0, 10.0, 22.0, 29.0, 24.0, 29.0, 20.0, 33.0, 29.0, 39.0, 26.0, 32.0, 51.0, 52.0, 35.0, 43.0, 43.0, 38.0, 39.0, 41.0, 32.0, 31.0, 31.0, 34.0, 24.0, 24.0, 26.0, 22.0, 8.0, 18.0, 21.0, 8.0, 6.0, 12.0, 2.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.31575012207031, -61.22175598144531, -59.12776184082031, -57.03377151489258, -54.93977737426758, -52.84578323364258, -50.751792907714844, -48.657798767089844, -46.563804626464844, -44.469810485839844, -42.375816345214844, -40.28182601928711, -38.18783187866211, -36.09383773803711, -33.999847412109375, -31.905853271484375, -29.811859130859375, -27.717864990234375, -25.623872756958008, -23.52988052368164, -21.43588638305664, -19.34189224243164, -17.247900009155273, -15.15390682220459, -13.059913635253906, -10.965920448303223, -8.871927261352539, -6.7779340744018555, -4.683940887451172, -2.5899477005004883, -0.4959545135498047, 1.598038673400879, 3.6920394897460938, 5.786032676696777, 7.880025863647461, 9.974019050598145, 12.068012237548828, 14.162005424499512, 16.255998611450195, 18.349990844726562, 20.443984985351562, 22.537979125976562, 24.63197135925293, 26.725963592529297, 28.819957733154297, 30.913951873779297, 33.00794219970703, 35.10193634033203, 37.19593048095703, 39.28992462158203, 41.38391876220703, 43.477909088134766, 45.571903228759766, 47.665897369384766, 49.7598876953125, 51.8538818359375, 53.9478759765625, 56.0418701171875, 58.1358642578125, 60.229854583740234, 62.323848724365234, 64.41783905029297, 66.51183319091797, 68.60582733154297, 70.69982147216797]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 8.0, 9.0, 5.0, 10.0, 12.0, 5.0, 16.0, 9.0, 22.0, 13.0, 22.0, 19.0, 30.0, 32.0, 27.0, 25.0, 23.0, 44.0, 33.0, 34.0, 34.0, 30.0, 35.0, 32.0, 33.0, 33.0, 33.0, 36.0, 32.0, 35.0, 21.0, 23.0, 28.0, 18.0, 22.0, 20.0, 16.0, 19.0, 16.0, 21.0, 9.0, 13.0, 6.0, 7.0, 6.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 3.0], "bins": [-5.97265625, -5.781494140625, -5.59033203125, -5.399169921875, -5.2080078125, -5.016845703125, -4.82568359375, -4.634521484375, -4.443359375, -4.252197265625, -4.06103515625, -3.869873046875, -3.6787109375, -3.487548828125, -3.29638671875, -3.105224609375, -2.9140625, -2.722900390625, -2.53173828125, -2.340576171875, -2.1494140625, -1.958251953125, -1.76708984375, -1.575927734375, -1.384765625, -1.193603515625, -1.00244140625, -0.811279296875, -0.6201171875, -0.428955078125, -0.23779296875, -0.046630859375, 0.14453125, 0.335693359375, 0.52685546875, 0.718017578125, 0.9091796875, 1.100341796875, 1.29150390625, 1.482666015625, 1.673828125, 1.864990234375, 2.05615234375, 2.247314453125, 2.4384765625, 2.629638671875, 2.82080078125, 3.011962890625, 3.203125, 3.394287109375, 3.58544921875, 3.776611328125, 3.9677734375, 4.158935546875, 4.35009765625, 4.541259765625, 4.732421875, 4.923583984375, 5.11474609375, 5.305908203125, 5.4970703125, 5.688232421875, 5.87939453125, 6.070556640625, 6.26171875]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 13.0, 15.0, 18.0, 28.0, 43.0, 53.0, 73.0, 104.0, 136.0, 231.0, 347.0, 610.0, 1163.0, 2351.0, 5673.0, 16109.0, 66709.0, 369911.0, 1421316.0, 1677084.0, 513443.0, 86435.0, 19875.0, 6569.0, 2761.0, 1344.0, 662.0, 398.0, 234.0, 165.0, 96.0, 74.0, 64.0, 49.0, 40.0, 26.0, 16.0, 12.0, 13.0, 10.0, 4.0, 2.0, 2.0, 3.0], "bins": [-12.4375, -12.119384765625, -11.80126953125, -11.483154296875, -11.1650390625, -10.846923828125, -10.52880859375, -10.210693359375, -9.892578125, -9.574462890625, -9.25634765625, -8.938232421875, -8.6201171875, -8.302001953125, -7.98388671875, -7.665771484375, -7.34765625, -7.029541015625, -6.71142578125, -6.393310546875, -6.0751953125, -5.757080078125, -5.43896484375, -5.120849609375, -4.802734375, -4.484619140625, -4.16650390625, -3.848388671875, -3.5302734375, -3.212158203125, -2.89404296875, -2.575927734375, -2.2578125, -1.939697265625, -1.62158203125, -1.303466796875, -0.9853515625, -0.667236328125, -0.34912109375, -0.031005859375, 0.287109375, 0.605224609375, 0.92333984375, 1.241455078125, 1.5595703125, 1.877685546875, 2.19580078125, 2.513916015625, 2.83203125, 3.150146484375, 3.46826171875, 3.786376953125, 4.1044921875, 4.422607421875, 4.74072265625, 5.058837890625, 5.376953125, 5.695068359375, 6.01318359375, 6.331298828125, 6.6494140625, 6.967529296875, 7.28564453125, 7.603759765625, 7.921875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 1.0, 9.0, 9.0, 8.0, 9.0, 10.0, 12.0, 13.0, 18.0, 20.0, 29.0, 42.0, 57.0, 69.0, 85.0, 102.0, 161.0, 176.0, 241.0, 291.0, 335.0, 366.0, 383.0, 319.0, 281.0, 227.0, 176.0, 123.0, 113.0, 78.0, 76.0, 58.0, 39.0, 37.0, 22.0, 23.0, 19.0, 19.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.4375, -10.0361328125, -9.634765625, -9.2333984375, -8.83203125, -8.4306640625, -8.029296875, -7.6279296875, -7.2265625, -6.8251953125, -6.423828125, -6.0224609375, -5.62109375, -5.2197265625, -4.818359375, -4.4169921875, -4.015625, -3.6142578125, -3.212890625, -2.8115234375, -2.41015625, -2.0087890625, -1.607421875, -1.2060546875, -0.8046875, -0.4033203125, -0.001953125, 0.3994140625, 0.80078125, 1.2021484375, 1.603515625, 2.0048828125, 2.40625, 2.8076171875, 3.208984375, 3.6103515625, 4.01171875, 4.4130859375, 4.814453125, 5.2158203125, 5.6171875, 6.0185546875, 6.419921875, 6.8212890625, 7.22265625, 7.6240234375, 8.025390625, 8.4267578125, 8.828125, 9.2294921875, 9.630859375, 10.0322265625, 10.43359375, 10.8349609375, 11.236328125, 11.6376953125, 12.0390625, 12.4404296875, 12.841796875, 13.2431640625, 13.64453125, 14.0458984375, 14.447265625, 14.8486328125, 15.25]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 0.0, 4.0, 5.0, 10.0, 14.0, 12.0, 23.0, 20.0, 15.0, 40.0, 27.0, 54.0, 73.0, 80.0, 108.0, 152.0, 245.0, 389.0, 1067.0, 14258.0, 3378750.0, 791433.0, 5569.0, 775.0, 321.0, 221.0, 149.0, 100.0, 70.0, 59.0, 46.0, 50.0, 29.0, 24.0, 17.0, 20.0, 8.0, 6.0, 13.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-65.9375, -64.04638671875, -62.1552734375, -60.26416015625, -58.373046875, -56.48193359375, -54.5908203125, -52.69970703125, -50.80859375, -48.91748046875, -47.0263671875, -45.13525390625, -43.244140625, -41.35302734375, -39.4619140625, -37.57080078125, -35.6796875, -33.78857421875, -31.8974609375, -30.00634765625, -28.115234375, -26.22412109375, -24.3330078125, -22.44189453125, -20.55078125, -18.65966796875, -16.7685546875, -14.87744140625, -12.986328125, -11.09521484375, -9.2041015625, -7.31298828125, -5.421875, -3.53076171875, -1.6396484375, 0.25146484375, 2.142578125, 4.03369140625, 5.9248046875, 7.81591796875, 9.70703125, 11.59814453125, 13.4892578125, 15.38037109375, 17.271484375, 19.16259765625, 21.0537109375, 22.94482421875, 24.8359375, 26.72705078125, 28.6181640625, 30.50927734375, 32.400390625, 34.29150390625, 36.1826171875, 38.07373046875, 39.96484375, 41.85595703125, 43.7470703125, 45.63818359375, 47.529296875, 49.42041015625, 51.3115234375, 53.20263671875, 55.09375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 7.0, 11.0, 10.0, 14.0, 16.0, 19.0, 26.0, 50.0, 42.0, 58.0, 63.0, 74.0, 82.0, 82.0, 89.0, 91.0, 58.0, 59.0, 38.0, 33.0, 28.0, 19.0, 14.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-22.831884384155273, -21.42334747314453, -20.014812469482422, -18.60627555847168, -17.19774055480957, -15.789203643798828, -14.380667686462402, -12.972131729125977, -11.56359577178955, -10.155059814453125, -8.7465238571167, -7.337987422943115, -5.9294514656066895, -4.520915508270264, -3.1123790740966797, -1.703843116760254, -0.2953071594238281, 1.1132289171218872, 2.5217649936676025, 3.9303011894226074, 5.338837146759033, 6.747373104095459, 8.155909538269043, 9.564445495605469, 10.972981452941895, 12.38151741027832, 13.790053367614746, 15.198589324951172, 16.607126235961914, 18.015661239624023, 19.424198150634766, 20.832733154296875, 22.241268157958984, 23.649805068969727, 25.058340072631836, 26.466876983642578, 27.875411987304688, 29.28394889831543, 30.692485809326172, 32.10102081298828, 33.50955581665039, 34.9180908203125, 36.326629638671875, 37.735164642333984, 39.143699645996094, 40.5522346496582, 41.96077346801758, 43.36930847167969, 44.77784729003906, 46.18638229370117, 47.59492111206055, 49.003456115722656, 50.411991119384766, 51.820526123046875, 53.22906494140625, 54.63759994506836, 56.04613494873047, 57.45466995239258, 58.86320877075195, 60.27174377441406, 61.68027877807617, 63.08881378173828, 64.49735260009766, 65.9058837890625, 67.31442260742188]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 12.0, 7.0, 7.0, 6.0, 12.0, 16.0, 19.0, 27.0, 22.0, 27.0, 31.0, 35.0, 39.0, 44.0, 39.0, 30.0, 36.0, 49.0, 46.0, 37.0, 39.0, 33.0, 43.0, 35.0, 31.0, 30.0, 29.0, 26.0, 24.0, 29.0, 27.0, 20.0, 15.0, 13.0, 9.0, 15.0, 11.0, 6.0, 8.0, 2.0, 8.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 1.0], "bins": [-53.66212463378906, -52.12750244140625, -50.59288024902344, -49.058258056640625, -47.52363204956055, -45.989009857177734, -44.45438766479492, -42.91976547241211, -41.3851432800293, -39.850521087646484, -38.31589889526367, -36.781272888183594, -35.24665069580078, -33.71202850341797, -32.177406311035156, -30.642784118652344, -29.1081600189209, -27.573537826538086, -26.03891372680664, -24.504291534423828, -22.969669342041016, -21.435047149658203, -19.900423049926758, -18.365800857543945, -16.8311767578125, -15.296553611755371, -13.761931419372559, -12.22730827331543, -10.692686080932617, -9.158062934875488, -7.623439788818359, -6.088817596435547, -4.554195404052734, -3.0195727348327637, -1.4849498271942139, 0.04967308044433594, 1.5842957496643066, 3.1189184188842773, 4.653541564941406, 6.188163757324219, 7.722786903381348, 9.257410049438477, 10.792032241821289, 12.326655387878418, 13.861278533935547, 15.39590072631836, 16.930522918701172, 18.465145111083984, 19.99976921081543, 21.534391403198242, 23.069015502929688, 24.6036376953125, 26.138259887695312, 27.672882080078125, 29.20750617980957, 30.742128372192383, 32.27675247192383, 33.81137466430664, 35.34599685668945, 36.88062286376953, 38.415245056152344, 39.949867248535156, 41.48448944091797, 43.01911163330078, 44.553733825683594]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 13.0, 10.0, 11.0, 19.0, 12.0, 18.0, 16.0, 20.0, 18.0, 21.0, 14.0, 39.0, 41.0, 32.0, 40.0, 40.0, 21.0, 29.0, 44.0, 41.0, 34.0, 33.0, 38.0, 34.0, 27.0, 29.0, 30.0, 32.0, 28.0, 23.0, 23.0, 21.0, 21.0, 20.0, 24.0, 6.0, 8.0, 15.0, 7.0, 8.0, 1.0, 6.0, 8.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0], "bins": [-6.0703125, -5.87359619140625, -5.6768798828125, -5.48016357421875, -5.283447265625, -5.08673095703125, -4.8900146484375, -4.69329833984375, -4.49658203125, -4.29986572265625, -4.1031494140625, -3.90643310546875, -3.709716796875, -3.51300048828125, -3.3162841796875, -3.11956787109375, -2.9228515625, -2.72613525390625, -2.5294189453125, -2.33270263671875, -2.135986328125, -1.93927001953125, -1.7425537109375, -1.54583740234375, -1.34912109375, -1.15240478515625, -0.9556884765625, -0.75897216796875, -0.562255859375, -0.36553955078125, -0.1688232421875, 0.02789306640625, 0.224609375, 0.42132568359375, 0.6180419921875, 0.81475830078125, 1.011474609375, 1.20819091796875, 1.4049072265625, 1.60162353515625, 1.79833984375, 1.99505615234375, 2.1917724609375, 2.38848876953125, 2.585205078125, 2.78192138671875, 2.9786376953125, 3.17535400390625, 3.3720703125, 3.56878662109375, 3.7655029296875, 3.96221923828125, 4.158935546875, 4.35565185546875, 4.5523681640625, 4.74908447265625, 4.94580078125, 5.14251708984375, 5.3392333984375, 5.53594970703125, 5.732666015625, 5.92938232421875, 6.1260986328125, 6.32281494140625, 6.51953125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 3.0, 7.0, 8.0, 10.0, 30.0, 32.0, 39.0, 70.0, 98.0, 123.0, 213.0, 329.0, 491.0, 771.0, 1147.0, 1708.0, 2510.0, 3928.0, 5996.0, 8971.0, 13847.0, 20933.0, 32373.0, 50135.0, 77998.0, 125635.0, 199954.0, 184197.0, 113842.0, 71252.0, 45859.0, 29566.0, 19456.0, 12794.0, 8237.0, 5389.0, 3506.0, 2369.0, 1569.0, 982.0, 745.0, 490.0, 296.0, 227.0, 156.0, 96.0, 52.0, 47.0, 27.0, 12.0, 10.0, 11.0, 10.0, 2.0, 4.0, 1.0, 1.0, 3.0], "bins": [-1.0263671875, -0.9951705932617188, -0.9639739990234375, -0.9327774047851562, -0.901580810546875, -0.8703842163085938, -0.8391876220703125, -0.8079910278320312, -0.77679443359375, -0.7455978393554688, -0.7144012451171875, -0.6832046508789062, -0.652008056640625, -0.6208114624023438, -0.5896148681640625, -0.5584182739257812, -0.5272216796875, -0.49602508544921875, -0.4648284912109375, -0.43363189697265625, -0.402435302734375, -0.37123870849609375, -0.3400421142578125, -0.30884552001953125, -0.27764892578125, -0.24645233154296875, -0.2152557373046875, -0.18405914306640625, -0.152862548828125, -0.12166595458984375, -0.0904693603515625, -0.05927276611328125, -0.028076171875, 0.00312042236328125, 0.0343170166015625, 0.06551361083984375, 0.096710205078125, 0.12790679931640625, 0.1591033935546875, 0.19029998779296875, 0.22149658203125, 0.25269317626953125, 0.2838897705078125, 0.31508636474609375, 0.346282958984375, 0.37747955322265625, 0.4086761474609375, 0.43987274169921875, 0.4710693359375, 0.5022659301757812, 0.5334625244140625, 0.5646591186523438, 0.595855712890625, 0.6270523071289062, 0.6582489013671875, 0.6894454956054688, 0.72064208984375, 0.7518386840820312, 0.7830352783203125, 0.8142318725585938, 0.845428466796875, 0.8766250610351562, 0.9078216552734375, 0.9390182495117188, 0.97021484375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 4.0, 6.0, 4.0, 4.0, 4.0, 6.0, 10.0, 8.0, 15.0, 8.0, 13.0, 17.0, 20.0, 20.0, 20.0, 32.0, 31.0, 33.0, 29.0, 39.0, 47.0, 52.0, 45.0, 1064.0, 42.0, 35.0, 40.0, 41.0, 37.0, 39.0, 33.0, 39.0, 28.0, 25.0, 23.0, 26.0, 21.0, 16.0, 10.0, 10.0, 10.0, 9.0, 6.0, 8.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.860107421875, -3.71630859375, -3.572509765625, -3.4287109375, -3.284912109375, -3.14111328125, -2.997314453125, -2.853515625, -2.709716796875, -2.56591796875, -2.422119140625, -2.2783203125, -2.134521484375, -1.99072265625, -1.846923828125, -1.703125, -1.559326171875, -1.41552734375, -1.271728515625, -1.1279296875, -0.984130859375, -0.84033203125, -0.696533203125, -0.552734375, -0.408935546875, -0.26513671875, -0.121337890625, 0.0224609375, 0.166259765625, 0.31005859375, 0.453857421875, 0.59765625, 0.741455078125, 0.88525390625, 1.029052734375, 1.1728515625, 1.316650390625, 1.46044921875, 1.604248046875, 1.748046875, 1.891845703125, 2.03564453125, 2.179443359375, 2.3232421875, 2.467041015625, 2.61083984375, 2.754638671875, 2.8984375, 3.042236328125, 3.18603515625, 3.329833984375, 3.4736328125, 3.617431640625, 3.76123046875, 3.905029296875, 4.048828125, 4.192626953125, 4.33642578125, 4.480224609375, 4.6240234375, 4.767822265625, 4.91162109375, 5.055419921875, 5.19921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 3.0, 12.0, 16.0, 17.0, 26.0, 45.0, 61.0, 94.0, 116.0, 184.0, 288.0, 442.0, 630.0, 995.0, 1431.0, 2174.0, 3116.0, 4750.0, 7234.0, 10626.0, 15837.0, 24025.0, 35958.0, 54169.0, 81564.0, 124827.0, 1231444.0, 167791.0, 111383.0, 72680.0, 48415.0, 32446.0, 21393.0, 14114.0, 9551.0, 6264.0, 4183.0, 2925.0, 1925.0, 1298.0, 848.0, 635.0, 383.0, 273.0, 189.0, 122.0, 86.0, 58.0, 36.0, 27.0, 10.0, 7.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.78857421875, -0.7630233764648438, -0.7374725341796875, -0.7119216918945312, -0.686370849609375, -0.6608200073242188, -0.6352691650390625, -0.6097183227539062, -0.58416748046875, -0.5586166381835938, -0.5330657958984375, -0.5075149536132812, -0.481964111328125, -0.45641326904296875, -0.4308624267578125, -0.40531158447265625, -0.3797607421875, -0.35420989990234375, -0.3286590576171875, -0.30310821533203125, -0.277557373046875, -0.25200653076171875, -0.2264556884765625, -0.20090484619140625, -0.17535400390625, -0.14980316162109375, -0.1242523193359375, -0.09870147705078125, -0.073150634765625, -0.04759979248046875, -0.0220489501953125, 0.00350189208984375, 0.029052734375, 0.05460357666015625, 0.0801544189453125, 0.10570526123046875, 0.131256103515625, 0.15680694580078125, 0.1823577880859375, 0.20790863037109375, 0.23345947265625, 0.25901031494140625, 0.2845611572265625, 0.31011199951171875, 0.335662841796875, 0.36121368408203125, 0.3867645263671875, 0.41231536865234375, 0.4378662109375, 0.46341705322265625, 0.4889678955078125, 0.5145187377929688, 0.540069580078125, 0.5656204223632812, 0.5911712646484375, 0.6167221069335938, 0.64227294921875, 0.6678237915039062, 0.6933746337890625, 0.7189254760742188, 0.744476318359375, 0.7700271606445312, 0.7955780029296875, 0.8211288452148438, 0.8466796875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 5.0, 7.0, 7.0, 10.0, 7.0, 16.0, 20.0, 31.0, 41.0, 36.0, 42.0, 67.0, 98.0, 82.0, 72.0, 59.0, 52.0, 71.0, 53.0, 39.0, 30.0, 31.0, 32.0, 20.0, 15.0, 4.0, 7.0, 9.0, 7.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019407272338867188, -0.0018734186887741089, -0.001806110143661499, -0.0017388015985488892, -0.0016714930534362793, -0.0016041845083236694, -0.0015368759632110596, -0.0014695674180984497, -0.0014022588729858398, -0.00133495032787323, -0.0012676417827606201, -0.0012003332376480103, -0.0011330246925354004, -0.0010657161474227905, -0.0009984076023101807, -0.0009310990571975708, -0.0008637905120849609, -0.0007964819669723511, -0.0007291734218597412, -0.0006618648767471313, -0.0005945563316345215, -0.0005272477865219116, -0.00045993924140930176, -0.0003926306962966919, -0.00032532215118408203, -0.00025801360607147217, -0.0001907050609588623, -0.00012339651584625244, -5.608797073364258e-05, 1.1220574378967285e-05, 7.852911949157715e-05, 0.000145837664604187, 0.00021314620971679688, 0.00028045475482940674, 0.0003477632999420166, 0.00041507184505462646, 0.00048238039016723633, 0.0005496889352798462, 0.0006169974803924561, 0.0006843060255050659, 0.0007516145706176758, 0.0008189231157302856, 0.0008862316608428955, 0.0009535402059555054, 0.0010208487510681152, 0.001088157296180725, 0.001155465841293335, 0.0012227743864059448, 0.0012900829315185547, 0.0013573914766311646, 0.0014247000217437744, 0.0014920085668563843, 0.0015593171119689941, 0.001626625657081604, 0.0016939342021942139, 0.0017612427473068237, 0.0018285512924194336, 0.0018958598375320435, 0.0019631683826446533, 0.002030476927757263, 0.002097785472869873, 0.002165094017982483, 0.0022324025630950928, 0.0022997111082077026, 0.0023670196533203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 5.0, 8.0, 8.0, 12.0, 9.0, 15.0, 23.0, 30.0, 41.0, 51.0, 70.0, 91.0, 201.0, 578.0, 3636.0, 1034777.0, 7668.0, 626.0, 253.0, 136.0, 81.0, 53.0, 37.0, 25.0, 36.0, 13.0, 8.0, 8.0, 11.0, 10.0, 5.0, 3.0, 4.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.05267333984375, -0.051192283630371094, -0.04971122741699219, -0.04823017120361328, -0.046749114990234375, -0.04526805877685547, -0.04378700256347656, -0.042305946350097656, -0.04082489013671875, -0.039343833923339844, -0.03786277770996094, -0.03638172149658203, -0.034900665283203125, -0.03341960906982422, -0.03193855285644531, -0.030457496643066406, -0.0289764404296875, -0.027495384216308594, -0.026014328002929688, -0.02453327178955078, -0.023052215576171875, -0.02157115936279297, -0.020090103149414062, -0.018609046936035156, -0.01712799072265625, -0.015646934509277344, -0.014165878295898438, -0.012684822082519531, -0.011203765869140625, -0.009722709655761719, -0.008241653442382812, -0.006760597229003906, -0.005279541015625, -0.0037984848022460938, -0.0023174285888671875, -0.0008363723754882812, 0.000644683837890625, 0.0021257400512695312, 0.0036067962646484375, 0.005087852478027344, 0.00656890869140625, 0.008049964904785156, 0.009531021118164062, 0.011012077331542969, 0.012493133544921875, 0.013974189758300781, 0.015455245971679688, 0.016936302185058594, 0.0184173583984375, 0.019898414611816406, 0.021379470825195312, 0.02286052703857422, 0.024341583251953125, 0.02582263946533203, 0.027303695678710938, 0.028784751892089844, 0.03026580810546875, 0.031746864318847656, 0.03322792053222656, 0.03470897674560547, 0.036190032958984375, 0.03767108917236328, 0.03915214538574219, 0.040633201599121094, 0.0421142578125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 9.0, 94.0, 419.0, 408.0, 77.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002539523644372821, -0.002380147809162736, -0.0022207722067832947, -0.0020613963715732098, -0.0019020205363631248, -0.00174264470115304, -0.0015832689823582768, -0.0014238932635635138, -0.0012645174283534288, -0.001105141593143344, -0.0009457658743485808, -0.0007863900973461568, -0.0006270143203437328, -0.00046763854334130883, -0.00030826276633888483, -0.00014888704754412174, 1.0488787665963173e-05, 0.00016986456466838717, 0.0003292403416708112, 0.0004886161186732352, 0.0006479918956756592, 0.0008073676726780832, 0.0009667434496805072, 0.0011261191684752703, 0.0012854950036853552, 0.00144487083889544, 0.0016042465576902032, 0.0017636222764849663, 0.0019229981116950512, 0.002082373946905136, 0.002241749782115221, 0.0024011253844946623, 0.002560501452535391, 0.0027198772877454758, 0.0028792531229555607, 0.003038628725335002, 0.003198004560545087, 0.0033573803957551718, 0.003516755998134613, 0.003676131833344698, 0.003835507668554783, 0.003994883503764868, 0.004154259338974953, 0.004313635174185038, 0.0044730110093951225, 0.00463238637894392, 0.004791762214154005, 0.00495113804936409, 0.005110513884574175, 0.00526988971978426, 0.005429265554994345, 0.00558864139020443, 0.005748016759753227, 0.005907392594963312, 0.006066768430173397, 0.006226144265383482, 0.006385520100593567, 0.006544895935803652, 0.006704271771013737, 0.006863647606223822, 0.0070230234414339066, 0.007182398810982704, 0.007341774646192789, 0.007501150481402874, 0.007660526316612959]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 3.0, 1.0, 7.0, 5.0, 6.0, 11.0, 13.0, 16.0, 15.0, 16.0, 25.0, 20.0, 22.0, 36.0, 25.0, 25.0, 39.0, 29.0, 26.0, 33.0, 30.0, 37.0, 33.0, 44.0, 46.0, 32.0, 36.0, 34.0, 38.0, 29.0, 26.0, 18.0, 27.0, 23.0, 26.0, 26.0, 18.0, 13.0, 19.0, 17.0, 9.0, 10.0, 6.0, 6.0, 5.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009249448776245117, -0.0008970508351922035, -0.0008691567927598953, -0.0008412627503275871, -0.0008133687078952789, -0.0007854746654629707, -0.0007575806230306625, -0.0007296865805983543, -0.0007017925381660461, -0.0006738984957337379, -0.0006460044533014297, -0.0006181104108691216, -0.0005902163684368134, -0.0005623223260045052, -0.000534428283572197, -0.0005065342411398888, -0.00047864019870758057, -0.00045074615627527237, -0.00042285211384296417, -0.000394958071410656, -0.0003670640289783478, -0.0003391699865460396, -0.0003112759441137314, -0.0002833819016814232, -0.000255487859249115, -0.0002275938168168068, -0.0001996997743844986, -0.0001718057319521904, -0.0001439116895198822, -0.000116017647087574, -8.812360465526581e-05, -6.022956222295761e-05, -3.2335519790649414e-05, -4.441477358341217e-06, 2.345256507396698e-05, 5.134660750627518e-05, 7.924064993858337e-05, 0.00010713469237089157, 0.00013502873480319977, 0.00016292277723550797, 0.00019081681966781616, 0.00021871086210012436, 0.00024660490453243256, 0.00027449894696474075, 0.00030239298939704895, 0.00033028703182935715, 0.00035818107426166534, 0.00038607511669397354, 0.00041396915912628174, 0.00044186320155858994, 0.00046975724399089813, 0.0004976512864232063, 0.0005255453288555145, 0.0005534393712878227, 0.0005813334137201309, 0.0006092274561524391, 0.0006371214985847473, 0.0006650155410170555, 0.0006929095834493637, 0.0007208036258816719, 0.0007486976683139801, 0.0007765917107462883, 0.0008044857531785965, 0.0008323797956109047, 0.0008602738380432129]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 9.0, 13.0, 10.0, 11.0, 19.0, 12.0, 18.0, 16.0, 20.0, 18.0, 21.0, 14.0, 39.0, 41.0, 32.0, 40.0, 40.0, 21.0, 29.0, 44.0, 41.0, 34.0, 33.0, 38.0, 34.0, 27.0, 29.0, 30.0, 32.0, 28.0, 23.0, 23.0, 21.0, 21.0, 20.0, 24.0, 6.0, 8.0, 15.0, 7.0, 8.0, 1.0, 6.0, 8.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 1.0], "bins": [-6.0703125, -5.87359619140625, -5.6768798828125, -5.48016357421875, -5.283447265625, -5.08673095703125, -4.8900146484375, -4.69329833984375, -4.49658203125, -4.29986572265625, -4.1031494140625, -3.90643310546875, -3.709716796875, -3.51300048828125, -3.3162841796875, -3.11956787109375, -2.9228515625, -2.72613525390625, -2.5294189453125, -2.33270263671875, -2.135986328125, -1.93927001953125, -1.7425537109375, -1.54583740234375, -1.34912109375, -1.15240478515625, -0.9556884765625, -0.75897216796875, -0.562255859375, -0.36553955078125, -0.1688232421875, 0.02789306640625, 0.224609375, 0.42132568359375, 0.6180419921875, 0.81475830078125, 1.011474609375, 1.20819091796875, 1.4049072265625, 1.60162353515625, 1.79833984375, 1.99505615234375, 2.1917724609375, 2.38848876953125, 2.585205078125, 2.78192138671875, 2.9786376953125, 3.17535400390625, 3.3720703125, 3.56878662109375, 3.7655029296875, 3.96221923828125, 4.158935546875, 4.35565185546875, 4.5523681640625, 4.74908447265625, 4.94580078125, 5.14251708984375, 5.3392333984375, 5.53594970703125, 5.732666015625, 5.92938232421875, 6.1260986328125, 6.32281494140625, 6.51953125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 8.0, 3.0, 5.0, 5.0, 23.0, 18.0, 27.0, 48.0, 79.0, 91.0, 148.0, 187.0, 300.0, 422.0, 739.0, 1142.0, 2050.0, 3930.0, 7369.0, 15137.0, 31468.0, 68924.0, 164716.0, 380561.0, 211066.0, 84144.0, 38463.0, 17927.0, 8831.0, 4436.0, 2449.0, 1406.0, 859.0, 499.0, 334.0, 223.0, 152.0, 105.0, 92.0, 48.0, 30.0, 24.0, 19.0, 16.0, 8.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.39453125, -4.25103759765625, -4.1075439453125, -3.96405029296875, -3.820556640625, -3.67706298828125, -3.5335693359375, -3.39007568359375, -3.24658203125, -3.10308837890625, -2.9595947265625, -2.81610107421875, -2.672607421875, -2.52911376953125, -2.3856201171875, -2.24212646484375, -2.0986328125, -1.95513916015625, -1.8116455078125, -1.66815185546875, -1.524658203125, -1.38116455078125, -1.2376708984375, -1.09417724609375, -0.95068359375, -0.80718994140625, -0.6636962890625, -0.52020263671875, -0.376708984375, -0.23321533203125, -0.0897216796875, 0.05377197265625, 0.197265625, 0.34075927734375, 0.4842529296875, 0.62774658203125, 0.771240234375, 0.91473388671875, 1.0582275390625, 1.20172119140625, 1.34521484375, 1.48870849609375, 1.6322021484375, 1.77569580078125, 1.919189453125, 2.06268310546875, 2.2061767578125, 2.34967041015625, 2.4931640625, 2.63665771484375, 2.7801513671875, 2.92364501953125, 3.067138671875, 3.21063232421875, 3.3541259765625, 3.49761962890625, 3.64111328125, 3.78460693359375, 3.9281005859375, 4.07159423828125, 4.215087890625, 4.35858154296875, 4.5020751953125, 4.64556884765625, 4.7890625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 7.0, 6.0, 3.0, 7.0, 14.0, 16.0, 17.0, 23.0, 27.0, 26.0, 35.0, 39.0, 32.0, 59.0, 57.0, 80.0, 151.0, 1691.0, 277.0, 82.0, 59.0, 55.0, 44.0, 38.0, 28.0, 22.0, 25.0, 24.0, 29.0, 16.0, 15.0, 11.0, 7.0, 9.0, 9.0, 0.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-34.4375, -33.50048828125, -32.5634765625, -31.62646484375, -30.689453125, -29.75244140625, -28.8154296875, -27.87841796875, -26.94140625, -26.00439453125, -25.0673828125, -24.13037109375, -23.193359375, -22.25634765625, -21.3193359375, -20.38232421875, -19.4453125, -18.50830078125, -17.5712890625, -16.63427734375, -15.697265625, -14.76025390625, -13.8232421875, -12.88623046875, -11.94921875, -11.01220703125, -10.0751953125, -9.13818359375, -8.201171875, -7.26416015625, -6.3271484375, -5.39013671875, -4.453125, -3.51611328125, -2.5791015625, -1.64208984375, -0.705078125, 0.23193359375, 1.1689453125, 2.10595703125, 3.04296875, 3.97998046875, 4.9169921875, 5.85400390625, 6.791015625, 7.72802734375, 8.6650390625, 9.60205078125, 10.5390625, 11.47607421875, 12.4130859375, 13.35009765625, 14.287109375, 15.22412109375, 16.1611328125, 17.09814453125, 18.03515625, 18.97216796875, 19.9091796875, 20.84619140625, 21.783203125, 22.72021484375, 23.6572265625, 24.59423828125, 25.53125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 12.0, 4.0, 13.0, 22.0, 19.0, 20.0, 38.0, 40.0, 55.0, 63.0, 105.0, 126.0, 175.0, 247.0, 450.0, 1498.0, 171382.0, 2966596.0, 3136.0, 596.0, 332.0, 233.0, 138.0, 97.0, 74.0, 50.0, 51.0, 31.0, 30.0, 16.0, 14.0, 8.0, 5.0, 12.0, 3.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.46875, -55.35205078125, -53.2353515625, -51.11865234375, -49.001953125, -46.88525390625, -44.7685546875, -42.65185546875, -40.53515625, -38.41845703125, -36.3017578125, -34.18505859375, -32.068359375, -29.95166015625, -27.8349609375, -25.71826171875, -23.6015625, -21.48486328125, -19.3681640625, -17.25146484375, -15.134765625, -13.01806640625, -10.9013671875, -8.78466796875, -6.66796875, -4.55126953125, -2.4345703125, -0.31787109375, 1.798828125, 3.91552734375, 6.0322265625, 8.14892578125, 10.265625, 12.38232421875, 14.4990234375, 16.61572265625, 18.732421875, 20.84912109375, 22.9658203125, 25.08251953125, 27.19921875, 29.31591796875, 31.4326171875, 33.54931640625, 35.666015625, 37.78271484375, 39.8994140625, 42.01611328125, 44.1328125, 46.24951171875, 48.3662109375, 50.48291015625, 52.599609375, 54.71630859375, 56.8330078125, 58.94970703125, 61.06640625, 63.18310546875, 65.2998046875, 67.41650390625, 69.533203125, 71.64990234375, 73.7666015625, 75.88330078125, 78.0]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 15.0, 166.0, 460.0, 319.0, 48.0, 3.0, 4.0, 2.0], "bins": [-185.8696746826172, -182.70724487304688, -179.5447998046875, -176.3823699951172, -173.21994018554688, -170.0574951171875, -166.8950653076172, -163.73263549804688, -160.5701904296875, -157.4077606201172, -154.2453155517578, -151.0828857421875, -147.9204559326172, -144.7580108642578, -141.5955810546875, -138.43313598632812, -135.2707061767578, -132.1082763671875, -128.94583129882812, -125.78340148925781, -122.62096405029297, -119.45852661132812, -116.29609680175781, -113.13365936279297, -109.97122955322266, -106.80879211425781, -103.6463623046875, -100.48392486572266, -97.32148742675781, -94.15904998779297, -90.99662017822266, -87.83418273925781, -84.67174530029297, -81.50930786132812, -78.34687805175781, -75.18444061279297, -72.02200317382812, -68.85956573486328, -65.69713592529297, -62.534698486328125, -59.37226104736328, -56.2098274230957, -53.04738998413086, -49.88495635986328, -46.72251892089844, -43.56008529663086, -40.39765167236328, -37.23521423339844, -34.07278060913086, -30.91034507751465, -27.747909545898438, -24.58547592163086, -21.423038482666016, -18.260604858398438, -15.098169326782227, -11.935733795166016, -8.773298263549805, -5.610862731933594, -2.448427677154541, 0.7140073776245117, 3.8764429092407227, 7.038878440856934, 10.201313018798828, 13.363748550415039, 16.52618408203125]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 7.0, 3.0, 3.0, 3.0, 6.0, 4.0, 5.0, 17.0, 8.0, 11.0, 19.0, 17.0, 24.0, 17.0, 33.0, 31.0, 26.0, 35.0, 37.0, 38.0, 41.0, 37.0, 34.0, 36.0, 34.0, 49.0, 41.0, 35.0, 47.0, 39.0, 33.0, 23.0, 30.0, 27.0, 34.0, 17.0, 18.0, 16.0, 9.0, 12.0, 17.0, 2.0, 6.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-54.16265869140625, -52.25460433959961, -50.34654998779297, -48.43849563598633, -46.53044128417969, -44.62238693237305, -42.714332580566406, -40.806278228759766, -38.898223876953125, -36.990169525146484, -35.082115173339844, -33.1740608215332, -31.266006469726562, -29.357952117919922, -27.44989776611328, -25.54184341430664, -23.6337890625, -21.72573471069336, -19.81768035888672, -17.909626007080078, -16.001571655273438, -14.093517303466797, -12.185462951660156, -10.277408599853516, -8.369354248046875, -6.461299896240234, -4.553245544433594, -2.645191192626953, -0.7371368408203125, 1.1709175109863281, 3.0789718627929688, 4.987026214599609, 6.89508056640625, 8.80313491821289, 10.711189270019531, 12.619243621826172, 14.527297973632812, 16.435352325439453, 18.343406677246094, 20.251461029052734, 22.159515380859375, 24.067569732666016, 25.975624084472656, 27.883678436279297, 29.791732788085938, 31.699787139892578, 33.60784149169922, 35.51589584350586, 37.4239501953125, 39.33200454711914, 41.24005889892578, 43.14811325073242, 45.05616760253906, 46.9642219543457, 48.872276306152344, 50.780330657958984, 52.688385009765625, 54.596439361572266, 56.504493713378906, 58.41254806518555, 60.32060241699219, 62.22865676879883, 64.13671112060547, 66.04476928710938, 67.95281982421875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 7.0, 8.0, 9.0, 11.0, 18.0, 12.0, 13.0, 15.0, 18.0, 19.0, 22.0, 14.0, 31.0, 30.0, 35.0, 53.0, 34.0, 33.0, 23.0, 37.0, 44.0, 33.0, 36.0, 31.0, 31.0, 35.0, 41.0, 33.0, 25.0, 26.0, 25.0, 16.0, 25.0, 19.0, 26.0, 14.0, 18.0, 12.0, 12.0, 6.0, 11.0, 6.0, 4.0, 3.0, 6.0, 4.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 3.0], "bins": [-6.3984375, -6.19512939453125, -5.9918212890625, -5.78851318359375, -5.585205078125, -5.38189697265625, -5.1785888671875, -4.97528076171875, -4.77197265625, -4.56866455078125, -4.3653564453125, -4.16204833984375, -3.958740234375, -3.75543212890625, -3.5521240234375, -3.34881591796875, -3.1455078125, -2.94219970703125, -2.7388916015625, -2.53558349609375, -2.332275390625, -2.12896728515625, -1.9256591796875, -1.72235107421875, -1.51904296875, -1.31573486328125, -1.1124267578125, -0.90911865234375, -0.705810546875, -0.50250244140625, -0.2991943359375, -0.09588623046875, 0.107421875, 0.31072998046875, 0.5140380859375, 0.71734619140625, 0.920654296875, 1.12396240234375, 1.3272705078125, 1.53057861328125, 1.73388671875, 1.93719482421875, 2.1405029296875, 2.34381103515625, 2.547119140625, 2.75042724609375, 2.9537353515625, 3.15704345703125, 3.3603515625, 3.56365966796875, 3.7669677734375, 3.97027587890625, 4.173583984375, 4.37689208984375, 4.5802001953125, 4.78350830078125, 4.98681640625, 5.19012451171875, 5.3934326171875, 5.59674072265625, 5.800048828125, 6.00335693359375, 6.2066650390625, 6.40997314453125, 6.61328125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 7.0, 13.0, 10.0, 17.0, 9.0, 17.0, 20.0, 18.0, 15.0, 19.0, 24.0, 22.0, 44.0, 36.0, 73.0, 162.0, 548.0, 2917.0, 31630.0, 1675492.0, 2428421.0, 49747.0, 3740.0, 677.0, 201.0, 76.0, 47.0, 39.0, 25.0, 24.0, 24.0, 13.0, 16.0, 25.0, 20.0, 15.0, 14.0, 9.0, 6.0, 3.0, 9.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0], "bins": [-26.140625, -25.29931640625, -24.4580078125, -23.61669921875, -22.775390625, -21.93408203125, -21.0927734375, -20.25146484375, -19.41015625, -18.56884765625, -17.7275390625, -16.88623046875, -16.044921875, -15.20361328125, -14.3623046875, -13.52099609375, -12.6796875, -11.83837890625, -10.9970703125, -10.15576171875, -9.314453125, -8.47314453125, -7.6318359375, -6.79052734375, -5.94921875, -5.10791015625, -4.2666015625, -3.42529296875, -2.583984375, -1.74267578125, -0.9013671875, -0.06005859375, 0.78125, 1.62255859375, 2.4638671875, 3.30517578125, 4.146484375, 4.98779296875, 5.8291015625, 6.67041015625, 7.51171875, 8.35302734375, 9.1943359375, 10.03564453125, 10.876953125, 11.71826171875, 12.5595703125, 13.40087890625, 14.2421875, 15.08349609375, 15.9248046875, 16.76611328125, 17.607421875, 18.44873046875, 19.2900390625, 20.13134765625, 20.97265625, 21.81396484375, 22.6552734375, 23.49658203125, 24.337890625, 25.17919921875, 26.0205078125, 26.86181640625, 27.703125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 8.0, 11.0, 14.0, 17.0, 34.0, 25.0, 25.0, 49.0, 67.0, 60.0, 85.0, 120.0, 148.0, 194.0, 244.0, 338.0, 379.0, 388.0, 384.0, 315.0, 269.0, 209.0, 162.0, 128.0, 86.0, 81.0, 57.0, 40.0, 27.0, 25.0, 17.0, 14.0, 12.0, 11.0, 4.0, 10.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 3.0], "bins": [-15.65625, -15.2490234375, -14.841796875, -14.4345703125, -14.02734375, -13.6201171875, -13.212890625, -12.8056640625, -12.3984375, -11.9912109375, -11.583984375, -11.1767578125, -10.76953125, -10.3623046875, -9.955078125, -9.5478515625, -9.140625, -8.7333984375, -8.326171875, -7.9189453125, -7.51171875, -7.1044921875, -6.697265625, -6.2900390625, -5.8828125, -5.4755859375, -5.068359375, -4.6611328125, -4.25390625, -3.8466796875, -3.439453125, -3.0322265625, -2.625, -2.2177734375, -1.810546875, -1.4033203125, -0.99609375, -0.5888671875, -0.181640625, 0.2255859375, 0.6328125, 1.0400390625, 1.447265625, 1.8544921875, 2.26171875, 2.6689453125, 3.076171875, 3.4833984375, 3.890625, 4.2978515625, 4.705078125, 5.1123046875, 5.51953125, 5.9267578125, 6.333984375, 6.7412109375, 7.1484375, 7.5556640625, 7.962890625, 8.3701171875, 8.77734375, 9.1845703125, 9.591796875, 9.9990234375, 10.40625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 7.0, 6.0, 8.0, 16.0, 16.0, 29.0, 33.0, 35.0, 49.0, 97.0, 99.0, 169.0, 256.0, 461.0, 1560.0, 175870.0, 4002877.0, 10867.0, 777.0, 347.0, 202.0, 141.0, 82.0, 69.0, 54.0, 25.0, 30.0, 19.0, 19.0, 13.0, 11.0, 8.0, 7.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.25, -63.8212890625, -61.392578125, -58.9638671875, -56.53515625, -54.1064453125, -51.677734375, -49.2490234375, -46.8203125, -44.3916015625, -41.962890625, -39.5341796875, -37.10546875, -34.6767578125, -32.248046875, -29.8193359375, -27.390625, -24.9619140625, -22.533203125, -20.1044921875, -17.67578125, -15.2470703125, -12.818359375, -10.3896484375, -7.9609375, -5.5322265625, -3.103515625, -0.6748046875, 1.75390625, 4.1826171875, 6.611328125, 9.0400390625, 11.46875, 13.8974609375, 16.326171875, 18.7548828125, 21.18359375, 23.6123046875, 26.041015625, 28.4697265625, 30.8984375, 33.3271484375, 35.755859375, 38.1845703125, 40.61328125, 43.0419921875, 45.470703125, 47.8994140625, 50.328125, 52.7568359375, 55.185546875, 57.6142578125, 60.04296875, 62.4716796875, 64.900390625, 67.3291015625, 69.7578125, 72.1865234375, 74.615234375, 77.0439453125, 79.47265625, 81.9013671875, 84.330078125, 86.7587890625, 89.1875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 10.0, 96.0, 292.0, 409.0, 176.0, 29.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.19850158691406, -240.38058471679688, -233.56268310546875, -226.74476623535156, -219.92684936523438, -213.1089324951172, -206.291015625, -199.47311401367188, -192.6551971435547, -185.8372802734375, -179.01937866210938, -172.2014617919922, -165.383544921875, -158.5656280517578, -151.74771118164062, -144.9298095703125, -138.1118927001953, -131.29397583007812, -124.47606658935547, -117.65815734863281, -110.84024047851562, -104.02232360839844, -97.20441436767578, -90.38650512695312, -83.56858825683594, -76.75067138671875, -69.9327621459961, -63.11484909057617, -56.29693603515625, -49.47902297973633, -42.661109924316406, -35.843196868896484, -29.025299072265625, -22.207386016845703, -15.389472961425781, -8.57155990600586, -1.7536468505859375, 5.064266204833984, 11.882179260253906, 18.700092315673828, 25.51800537109375, 32.33591842651367, 39.153831481933594, 45.971744537353516, 52.78965759277344, 59.60757064819336, 66.42548370361328, 73.24339294433594, 80.06130981445312, 86.87922668457031, 93.69713592529297, 100.51504516601562, 107.33296203613281, 114.15087890625, 120.96878814697266, 127.78669738769531, 134.6046142578125, 141.4225311279297, 148.24044799804688, 155.058349609375, 161.8762664794922, 168.69418334960938, 175.5120849609375, 182.3300018310547, 189.14791870117188]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 8.0, 6.0, 8.0, 14.0, 20.0, 17.0, 19.0, 19.0, 25.0, 32.0, 30.0, 36.0, 35.0, 39.0, 44.0, 49.0, 48.0, 40.0, 34.0, 31.0, 49.0, 39.0, 39.0, 35.0, 21.0, 36.0, 29.0, 28.0, 24.0, 27.0, 20.0, 18.0, 11.0, 19.0, 9.0, 6.0, 9.0, 4.0, 3.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-51.380706787109375, -49.83909606933594, -48.297489166259766, -46.75587844848633, -45.21426773071289, -43.67266082763672, -42.13105010986328, -40.589439392089844, -39.047828674316406, -37.50621795654297, -35.9646110534668, -34.42300033569336, -32.88138961791992, -31.339780807495117, -29.798171997070312, -28.256561279296875, -26.714954376220703, -25.1733455657959, -23.63173484802246, -22.090126037597656, -20.54851531982422, -19.006906509399414, -17.46529769897461, -15.923687934875488, -14.382078170776367, -12.840468406677246, -11.298858642578125, -9.75724983215332, -8.2156400680542, -6.674030303955078, -5.132421493530273, -3.5908117294311523, -2.0492019653320312, -0.5075924396514893, 1.0340170860290527, 2.5756263732910156, 4.117236137390137, 5.658845901489258, 7.2004547119140625, 8.742064476013184, 10.283674240112305, 11.825284004211426, 13.366893768310547, 14.908502578735352, 16.450111389160156, 17.991722106933594, 19.5333309173584, 21.074939727783203, 22.61655044555664, 24.158159255981445, 25.699769973754883, 27.241378784179688, 28.782989501953125, 30.32459831237793, 31.866207122802734, 33.40781784057617, 34.949424743652344, 36.49103546142578, 38.03264236450195, 39.57425308227539, 41.11586380004883, 42.657470703125, 44.19908142089844, 45.740692138671875, 47.28230285644531]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 10.0, 14.0, 16.0, 16.0, 17.0, 23.0, 13.0, 21.0, 25.0, 23.0, 42.0, 29.0, 38.0, 38.0, 43.0, 37.0, 36.0, 39.0, 44.0, 30.0, 47.0, 40.0, 25.0, 41.0, 34.0, 30.0, 24.0, 26.0, 20.0, 22.0, 22.0, 22.0, 12.0, 11.0, 7.0, 16.0, 7.0, 5.0, 4.0, 1.0, 2.0, 5.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.30364990234375, -6.0799560546875, -5.85626220703125, -5.632568359375, -5.40887451171875, -5.1851806640625, -4.96148681640625, -4.73779296875, -4.51409912109375, -4.2904052734375, -4.06671142578125, -3.843017578125, -3.61932373046875, -3.3956298828125, -3.17193603515625, -2.9482421875, -2.72454833984375, -2.5008544921875, -2.27716064453125, -2.053466796875, -1.82977294921875, -1.6060791015625, -1.38238525390625, -1.15869140625, -0.93499755859375, -0.7113037109375, -0.48760986328125, -0.263916015625, -0.04022216796875, 0.1834716796875, 0.40716552734375, 0.630859375, 0.85455322265625, 1.0782470703125, 1.30194091796875, 1.525634765625, 1.74932861328125, 1.9730224609375, 2.19671630859375, 2.42041015625, 2.64410400390625, 2.8677978515625, 3.09149169921875, 3.315185546875, 3.53887939453125, 3.7625732421875, 3.98626708984375, 4.2099609375, 4.43365478515625, 4.6573486328125, 4.88104248046875, 5.104736328125, 5.32843017578125, 5.5521240234375, 5.77581787109375, 5.99951171875, 6.22320556640625, 6.4468994140625, 6.67059326171875, 6.894287109375, 7.11798095703125, 7.3416748046875, 7.56536865234375, 7.7890625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 20.0, 23.0, 38.0, 62.0, 82.0, 114.0, 199.0, 249.0, 375.0, 547.0, 771.0, 1169.0, 1695.0, 2435.0, 3682.0, 5495.0, 8040.0, 12034.0, 18359.0, 26891.0, 40721.0, 61028.0, 94501.0, 148852.0, 200418.0, 146404.0, 92568.0, 60323.0, 39958.0, 26946.0, 17963.0, 11907.0, 7997.0, 5404.0, 3589.0, 2480.0, 1681.0, 1089.0, 799.0, 508.0, 360.0, 247.0, 187.0, 117.0, 71.0, 51.0, 39.0, 18.0, 22.0, 5.0, 7.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.94140625, -0.9105224609375, -0.879638671875, -0.8487548828125, -0.81787109375, -0.7869873046875, -0.756103515625, -0.7252197265625, -0.6943359375, -0.6634521484375, -0.632568359375, -0.6016845703125, -0.57080078125, -0.5399169921875, -0.509033203125, -0.4781494140625, -0.447265625, -0.4163818359375, -0.385498046875, -0.3546142578125, -0.32373046875, -0.2928466796875, -0.261962890625, -0.2310791015625, -0.2001953125, -0.1693115234375, -0.138427734375, -0.1075439453125, -0.07666015625, -0.0457763671875, -0.014892578125, 0.0159912109375, 0.046875, 0.0777587890625, 0.108642578125, 0.1395263671875, 0.17041015625, 0.2012939453125, 0.232177734375, 0.2630615234375, 0.2939453125, 0.3248291015625, 0.355712890625, 0.3865966796875, 0.41748046875, 0.4483642578125, 0.479248046875, 0.5101318359375, 0.541015625, 0.5718994140625, 0.602783203125, 0.6336669921875, 0.66455078125, 0.6954345703125, 0.726318359375, 0.7572021484375, 0.7880859375, 0.8189697265625, 0.849853515625, 0.8807373046875, 0.91162109375, 0.9425048828125, 0.973388671875, 1.0042724609375, 1.03515625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 7.0, 11.0, 10.0, 9.0, 10.0, 12.0, 11.0, 15.0, 17.0, 17.0, 23.0, 19.0, 18.0, 25.0, 38.0, 40.0, 40.0, 49.0, 47.0, 40.0, 1070.0, 42.0, 38.0, 38.0, 41.0, 32.0, 52.0, 38.0, 31.0, 21.0, 21.0, 28.0, 20.0, 17.0, 19.0, 17.0, 6.0, 7.0, 5.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.078125, -4.9241943359375, -4.770263671875, -4.6163330078125, -4.46240234375, -4.3084716796875, -4.154541015625, -4.0006103515625, -3.8466796875, -3.6927490234375, -3.538818359375, -3.3848876953125, -3.23095703125, -3.0770263671875, -2.923095703125, -2.7691650390625, -2.615234375, -2.4613037109375, -2.307373046875, -2.1534423828125, -1.99951171875, -1.8455810546875, -1.691650390625, -1.5377197265625, -1.3837890625, -1.2298583984375, -1.075927734375, -0.9219970703125, -0.76806640625, -0.6141357421875, -0.460205078125, -0.3062744140625, -0.15234375, 0.0015869140625, 0.155517578125, 0.3094482421875, 0.46337890625, 0.6173095703125, 0.771240234375, 0.9251708984375, 1.0791015625, 1.2330322265625, 1.386962890625, 1.5408935546875, 1.69482421875, 1.8487548828125, 2.002685546875, 2.1566162109375, 2.310546875, 2.4644775390625, 2.618408203125, 2.7723388671875, 2.92626953125, 3.0802001953125, 3.234130859375, 3.3880615234375, 3.5419921875, 3.6959228515625, 3.849853515625, 4.0037841796875, 4.15771484375, 4.3116455078125, 4.465576171875, 4.6195068359375, 4.7734375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 7.0, 9.0, 9.0, 19.0, 22.0, 35.0, 59.0, 82.0, 142.0, 253.0, 379.0, 538.0, 954.0, 1358.0, 2200.0, 3480.0, 5607.0, 8729.0, 13539.0, 21325.0, 33152.0, 53236.0, 88243.0, 149082.0, 1271338.0, 174569.0, 102753.0, 61545.0, 37790.0, 24353.0, 15070.0, 9953.0, 6226.0, 4059.0, 2515.0, 1637.0, 1091.0, 650.0, 426.0, 239.0, 156.0, 113.0, 68.0, 55.0, 26.0, 25.0, 10.0, 7.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96630859375, -0.9347763061523438, -0.9032440185546875, -0.8717117309570312, -0.840179443359375, -0.8086471557617188, -0.7771148681640625, -0.7455825805664062, -0.71405029296875, -0.6825180053710938, -0.6509857177734375, -0.6194534301757812, -0.587921142578125, -0.5563888549804688, -0.5248565673828125, -0.49332427978515625, -0.4617919921875, -0.43025970458984375, -0.3987274169921875, -0.36719512939453125, -0.335662841796875, -0.30413055419921875, -0.2725982666015625, -0.24106597900390625, -0.20953369140625, -0.17800140380859375, -0.1464691162109375, -0.11493682861328125, -0.083404541015625, -0.05187225341796875, -0.0203399658203125, 0.01119232177734375, 0.042724609375, 0.07425689697265625, 0.1057891845703125, 0.13732147216796875, 0.168853759765625, 0.20038604736328125, 0.2319183349609375, 0.26345062255859375, 0.29498291015625, 0.32651519775390625, 0.3580474853515625, 0.38957977294921875, 0.421112060546875, 0.45264434814453125, 0.4841766357421875, 0.5157089233398438, 0.5472412109375, 0.5787734985351562, 0.6103057861328125, 0.6418380737304688, 0.673370361328125, 0.7049026489257812, 0.7364349365234375, 0.7679672241210938, 0.79949951171875, 0.8310317993164062, 0.8625640869140625, 0.8940963745117188, 0.925628662109375, 0.9571609497070312, 0.9886932373046875, 1.0202255249023438, 1.0517578125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 9.0, 10.0, 7.0, 11.0, 19.0, 19.0, 32.0, 56.0, 53.0, 73.0, 77.0, 88.0, 116.0, 93.0, 60.0, 51.0, 50.0, 39.0, 28.0, 27.0, 22.0, 14.0, 15.0, 4.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0025882720947265625, -0.002512216567993164, -0.0024361610412597656, -0.002360105514526367, -0.0022840499877929688, -0.0022079944610595703, -0.002131938934326172, -0.0020558834075927734, -0.001979827880859375, -0.0019037723541259766, -0.0018277168273925781, -0.0017516613006591797, -0.0016756057739257812, -0.0015995502471923828, -0.0015234947204589844, -0.001447439193725586, -0.0013713836669921875, -0.001295328140258789, -0.0012192726135253906, -0.0011432170867919922, -0.0010671615600585938, -0.0009911060333251953, -0.0009150505065917969, -0.0008389949798583984, -0.000762939453125, -0.0006868839263916016, -0.0006108283996582031, -0.0005347728729248047, -0.00045871734619140625, -0.0003826618194580078, -0.0003066062927246094, -0.00023055076599121094, -0.0001544952392578125, -7.843971252441406e-05, -2.384185791015625e-06, 7.367134094238281e-05, 0.00014972686767578125, 0.0002257823944091797, 0.0003018379211425781, 0.00037789344787597656, 0.000453948974609375, 0.0005300045013427734, 0.0006060600280761719, 0.0006821155548095703, 0.0007581710815429688, 0.0008342266082763672, 0.0009102821350097656, 0.000986337661743164, 0.0010623931884765625, 0.001138448715209961, 0.0012145042419433594, 0.0012905597686767578, 0.0013666152954101562, 0.0014426708221435547, 0.0015187263488769531, 0.0015947818756103516, 0.00167083740234375, 0.0017468929290771484, 0.0018229484558105469, 0.0018990039825439453, 0.0019750595092773438, 0.002051115036010742, 0.0021271705627441406, 0.002203226089477539, 0.0022792816162109375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 6.0, 14.0, 16.0, 11.0, 33.0, 37.0, 42.0, 55.0, 104.0, 225.0, 611.0, 28148.0, 1017358.0, 1222.0, 285.0, 144.0, 74.0, 44.0, 29.0, 23.0, 14.0, 7.0, 6.0, 9.0, 7.0, 11.0, 0.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.054473876953125, -0.05267000198364258, -0.050866127014160156, -0.049062252044677734, -0.04725837707519531, -0.04545450210571289, -0.04365062713623047, -0.04184675216674805, -0.040042877197265625, -0.0382390022277832, -0.03643512725830078, -0.03463125228881836, -0.03282737731933594, -0.031023502349853516, -0.029219627380371094, -0.027415752410888672, -0.02561187744140625, -0.023808002471923828, -0.022004127502441406, -0.020200252532958984, -0.018396377563476562, -0.01659250259399414, -0.014788627624511719, -0.012984752655029297, -0.011180877685546875, -0.009377002716064453, -0.007573127746582031, -0.005769252777099609, -0.0039653778076171875, -0.0021615028381347656, -0.00035762786865234375, 0.0014462471008300781, 0.0032501220703125, 0.005053997039794922, 0.006857872009277344, 0.008661746978759766, 0.010465621948242188, 0.01226949691772461, 0.014073371887207031, 0.015877246856689453, 0.017681121826171875, 0.019484996795654297, 0.02128887176513672, 0.02309274673461914, 0.024896621704101562, 0.026700496673583984, 0.028504371643066406, 0.030308246612548828, 0.03211212158203125, 0.03391599655151367, 0.035719871520996094, 0.037523746490478516, 0.03932762145996094, 0.04113149642944336, 0.04293537139892578, 0.0447392463684082, 0.046543121337890625, 0.04834699630737305, 0.05015087127685547, 0.05195474624633789, 0.05375862121582031, 0.055562496185302734, 0.057366371154785156, 0.05917024612426758, 0.06097412109375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 14.0, 161.0, 499.0, 291.0, 41.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025693662464618683, -0.0024316562339663506, -0.002293946221470833, -0.0021562364418059587, -0.002018526429310441, -0.0018808164168149233, -0.0017431065207347274, -0.0016053966246545315, -0.0014676866121590137, -0.001329976599663496, -0.0011922667035833001, -0.0010545568075031042, -0.0009168467950075865, -0.0007791368407197297, -0.0006414268864318728, -0.000503716932144016, -0.0003660069778561592, -0.0002282970235683024, -9.058706928044558e-05, 4.712288500741124e-05, 0.00018483283929526806, 0.0003225427935831249, 0.0004602527478709817, 0.0005979627021588385, 0.0007356726564466953, 0.0008733826107345521, 0.001011092565022409, 0.0011488024611026049, 0.0012865124735981226, 0.0014242224860936403, 0.0015619323821738362, 0.0016996422782540321, 0.0018373527564108372, 0.001975062768906355, 0.0021127727814018726, 0.0022504825610667467, 0.0023881925735622644, 0.002525902586057782, 0.0026636123657226562, 0.002801322378218174, 0.0029390323907136917, 0.0030767424032092094, 0.003214452415704727, 0.0033521621953696012, 0.003489872207865119, 0.0036275822203606367, 0.003765292000025511, 0.0039030020125210285, 0.004040712025016546, 0.004178422037512064, 0.004316132050007582, 0.0044538420625030994, 0.00459155160933733, 0.004729261621832848, 0.004866971634328365, 0.005004681646823883, 0.005142391659319401, 0.0052801016718149185, 0.005417811684310436, 0.005555521696805954, 0.005693231709301472, 0.005830941256135702, 0.00596865126863122, 0.006106361281126738, 0.006244071293622255]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 7.0, 7.0, 11.0, 10.0, 15.0, 24.0, 16.0, 28.0, 19.0, 18.0, 23.0, 27.0, 32.0, 26.0, 39.0, 32.0, 41.0, 30.0, 36.0, 40.0, 46.0, 30.0, 47.0, 38.0, 39.0, 34.0, 25.0, 26.0, 18.0, 29.0, 27.0, 29.0, 19.0, 19.0, 19.0, 14.0, 12.0, 7.0, 13.0, 8.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008105039596557617, -0.000783972442150116, -0.0007574409246444702, -0.0007309094071388245, -0.0007043778896331787, -0.000677846372127533, -0.0006513148546218872, -0.0006247833371162415, -0.0005982518196105957, -0.00057172030210495, -0.0005451887845993042, -0.0005186572670936584, -0.0004921257495880127, -0.00046559423208236694, -0.0004390627145767212, -0.00041253119707107544, -0.0003859996795654297, -0.00035946816205978394, -0.0003329366445541382, -0.00030640512704849243, -0.0002798736095428467, -0.00025334209203720093, -0.00022681057453155518, -0.00020027905702590942, -0.00017374753952026367, -0.00014721602201461792, -0.00012068450450897217, -9.415298700332642e-05, -6.762146949768066e-05, -4.108995199203491e-05, -1.455843448638916e-05, 1.1973083019256592e-05, 3.8504600524902344e-05, 6.50361180305481e-05, 9.156763553619385e-05, 0.0001180991530418396, 0.00014463067054748535, 0.0001711621880531311, 0.00019769370555877686, 0.0002242252230644226, 0.00025075674057006836, 0.0002772882580757141, 0.00030381977558135986, 0.0003303512930870056, 0.00035688281059265137, 0.0003834143280982971, 0.00040994584560394287, 0.0004364773631095886, 0.0004630088806152344, 0.0004895403981208801, 0.0005160719156265259, 0.0005426034331321716, 0.0005691349506378174, 0.0005956664681434631, 0.0006221979856491089, 0.0006487295031547546, 0.0006752610206604004, 0.0007017925381660461, 0.0007283240556716919, 0.0007548555731773376, 0.0007813870906829834, 0.0008079186081886292, 0.0008344501256942749, 0.0008609816431999207, 0.0008875131607055664]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 10.0, 14.0, 16.0, 16.0, 17.0, 23.0, 13.0, 21.0, 25.0, 23.0, 42.0, 29.0, 38.0, 38.0, 43.0, 37.0, 36.0, 39.0, 44.0, 30.0, 47.0, 40.0, 25.0, 41.0, 34.0, 30.0, 24.0, 26.0, 20.0, 22.0, 22.0, 22.0, 12.0, 11.0, 7.0, 16.0, 7.0, 5.0, 4.0, 1.0, 2.0, 5.0, 5.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.52734375, -6.30364990234375, -6.0799560546875, -5.85626220703125, -5.632568359375, -5.40887451171875, -5.1851806640625, -4.96148681640625, -4.73779296875, -4.51409912109375, -4.2904052734375, -4.06671142578125, -3.843017578125, -3.61932373046875, -3.3956298828125, -3.17193603515625, -2.9482421875, -2.72454833984375, -2.5008544921875, -2.27716064453125, -2.053466796875, -1.82977294921875, -1.6060791015625, -1.38238525390625, -1.15869140625, -0.93499755859375, -0.7113037109375, -0.48760986328125, -0.263916015625, -0.04022216796875, 0.1834716796875, 0.40716552734375, 0.630859375, 0.85455322265625, 1.0782470703125, 1.30194091796875, 1.525634765625, 1.74932861328125, 1.9730224609375, 2.19671630859375, 2.42041015625, 2.64410400390625, 2.8677978515625, 3.09149169921875, 3.315185546875, 3.53887939453125, 3.7625732421875, 3.98626708984375, 4.2099609375, 4.43365478515625, 4.6573486328125, 4.88104248046875, 5.104736328125, 5.32843017578125, 5.5521240234375, 5.77581787109375, 5.99951171875, 6.22320556640625, 6.4468994140625, 6.67059326171875, 6.894287109375, 7.11798095703125, 7.3416748046875, 7.56536865234375, 7.7890625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 8.0, 29.0, 20.0, 38.0, 51.0, 78.0, 112.0, 149.0, 202.0, 328.0, 466.0, 885.0, 1562.0, 2837.0, 5641.0, 12122.0, 29697.0, 81469.0, 252799.0, 439947.0, 137187.0, 47649.0, 18381.0, 8036.0, 3850.0, 2084.0, 1100.0, 654.0, 386.0, 242.0, 144.0, 112.0, 76.0, 57.0, 51.0, 22.0, 21.0, 23.0, 11.0, 8.0, 8.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.59375, -4.4117431640625, -4.229736328125, -4.0477294921875, -3.86572265625, -3.6837158203125, -3.501708984375, -3.3197021484375, -3.1376953125, -2.9556884765625, -2.773681640625, -2.5916748046875, -2.40966796875, -2.2276611328125, -2.045654296875, -1.8636474609375, -1.681640625, -1.4996337890625, -1.317626953125, -1.1356201171875, -0.95361328125, -0.7716064453125, -0.589599609375, -0.4075927734375, -0.2255859375, -0.0435791015625, 0.138427734375, 0.3204345703125, 0.50244140625, 0.6844482421875, 0.866455078125, 1.0484619140625, 1.23046875, 1.4124755859375, 1.594482421875, 1.7764892578125, 1.95849609375, 2.1405029296875, 2.322509765625, 2.5045166015625, 2.6865234375, 2.8685302734375, 3.050537109375, 3.2325439453125, 3.41455078125, 3.5965576171875, 3.778564453125, 3.9605712890625, 4.142578125, 4.3245849609375, 4.506591796875, 4.6885986328125, 4.87060546875, 5.0526123046875, 5.234619140625, 5.4166259765625, 5.5986328125, 5.7806396484375, 5.962646484375, 6.1446533203125, 6.32666015625, 6.5086669921875, 6.690673828125, 6.8726806640625, 7.0546875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 0.0, 5.0, 2.0, 6.0, 8.0, 4.0, 9.0, 23.0, 11.0, 20.0, 32.0, 15.0, 30.0, 28.0, 39.0, 39.0, 42.0, 59.0, 59.0, 66.0, 121.0, 1463.0, 404.0, 129.0, 63.0, 50.0, 45.0, 40.0, 30.0, 35.0, 33.0, 20.0, 23.0, 26.0, 23.0, 11.0, 9.0, 6.0, 5.0, 8.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.171875, -22.34375, -21.515625, -20.6875, -19.859375, -19.03125, -18.203125, -17.375, -16.546875, -15.71875, -14.890625, -14.0625, -13.234375, -12.40625, -11.578125, -10.75, -9.921875, -9.09375, -8.265625, -7.4375, -6.609375, -5.78125, -4.953125, -4.125, -3.296875, -2.46875, -1.640625, -0.8125, 0.015625, 0.84375, 1.671875, 2.5, 3.328125, 4.15625, 4.984375, 5.8125, 6.640625, 7.46875, 8.296875, 9.125, 9.953125, 10.78125, 11.609375, 12.4375, 13.265625, 14.09375, 14.921875, 15.75, 16.578125, 17.40625, 18.234375, 19.0625, 19.890625, 20.71875, 21.546875, 22.375, 23.203125, 24.03125, 24.859375, 25.6875, 26.515625, 27.34375, 28.171875, 29.0, 29.828125]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 10.0, 15.0, 23.0, 38.0, 50.0, 68.0, 108.0, 161.0, 310.0, 581.0, 3460.0, 3129814.0, 9328.0, 791.0, 376.0, 191.0, 129.0, 76.0, 66.0, 41.0, 26.0, 16.0, 9.0, 7.0, 8.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.625, -115.3837890625, -112.142578125, -108.9013671875, -105.66015625, -102.4189453125, -99.177734375, -95.9365234375, -92.6953125, -89.4541015625, -86.212890625, -82.9716796875, -79.73046875, -76.4892578125, -73.248046875, -70.0068359375, -66.765625, -63.5244140625, -60.283203125, -57.0419921875, -53.80078125, -50.5595703125, -47.318359375, -44.0771484375, -40.8359375, -37.5947265625, -34.353515625, -31.1123046875, -27.87109375, -24.6298828125, -21.388671875, -18.1474609375, -14.90625, -11.6650390625, -8.423828125, -5.1826171875, -1.94140625, 1.2998046875, 4.541015625, 7.7822265625, 11.0234375, 14.2646484375, 17.505859375, 20.7470703125, 23.98828125, 27.2294921875, 30.470703125, 33.7119140625, 36.953125, 40.1943359375, 43.435546875, 46.6767578125, 49.91796875, 53.1591796875, 56.400390625, 59.6416015625, 62.8828125, 66.1240234375, 69.365234375, 72.6064453125, 75.84765625, 79.0888671875, 82.330078125, 85.5712890625, 88.8125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 608.0, 400.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-446.26690673828125, -437.6774597167969, -429.0880126953125, -420.49859619140625, -411.9091491699219, -403.3197021484375, -394.7302551269531, -386.14080810546875, -377.5513916015625, -368.9619445800781, -360.37249755859375, -351.7830810546875, -343.1936340332031, -334.60418701171875, -326.0147399902344, -317.42529296875, -308.83587646484375, -300.2464294433594, -291.656982421875, -283.06756591796875, -274.4781188964844, -265.888671875, -257.2992248535156, -248.7097930908203, -240.12033081054688, -231.5308837890625, -222.9414520263672, -214.3520050048828, -205.7625732421875, -197.17312622070312, -188.58367919921875, -179.99424743652344, -171.40481567382812, -162.81536865234375, -154.22593688964844, -145.63648986816406, -137.04705810546875, -128.45761108398438, -119.86817169189453, -111.27873229980469, -102.68930053710938, -94.09986114501953, -85.51042175292969, -76.92097473144531, -68.33154296875, -59.74209976196289, -51.15265655517578, -42.56321716308594, -33.973777770996094, -25.38433837890625, -16.794897079467773, -8.205455780029297, 0.3839836120605469, 8.97342300415039, 17.5628662109375, 26.152305603027344, 34.74174499511719, 43.33118438720703, 51.920623779296875, 60.510066986083984, 69.09950256347656, 77.68894958496094, 86.27838897705078, 94.86782836914062, 103.45726776123047]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 6.0, 7.0, 10.0, 16.0, 17.0, 13.0, 21.0, 29.0, 25.0, 35.0, 37.0, 29.0, 36.0, 43.0, 33.0, 30.0, 51.0, 53.0, 45.0, 47.0, 41.0, 45.0, 33.0, 30.0, 39.0, 26.0, 31.0, 20.0, 29.0, 23.0, 14.0, 14.0, 6.0, 17.0, 8.0, 12.0, 5.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.63656616210938, -71.29840087890625, -68.96024322509766, -66.62207794189453, -64.2839126586914, -61.94575500488281, -59.60758972167969, -57.26942825317383, -54.93126678466797, -52.59310531616211, -50.254940032958984, -47.916778564453125, -45.578617095947266, -43.240455627441406, -40.90229034423828, -38.56412887573242, -36.2259635925293, -33.88780212402344, -31.549638748168945, -29.211475372314453, -26.873313903808594, -24.5351505279541, -22.19698715209961, -19.85882568359375, -17.520662307739258, -15.182499885559082, -12.844337463378906, -10.506174087524414, -8.168011665344238, -5.8298492431640625, -3.4916858673095703, -1.153524398803711, 1.1846389770507812, 3.522801637649536, 5.860964298248291, 8.199127197265625, 10.5372896194458, 12.875452041625977, 15.213615417480469, 17.551776885986328, 19.88994026184082, 22.228103637695312, 24.566265106201172, 26.904428482055664, 29.242591857910156, 31.580753326416016, 33.918914794921875, 36.257080078125, 38.59524154663086, 40.93340301513672, 43.271568298339844, 45.6097297668457, 47.94789123535156, 50.28605651855469, 52.62421798706055, 54.962379455566406, 57.30054473876953, 59.63870620727539, 61.976871490478516, 64.31503295898438, 66.6531982421875, 68.9913558959961, 71.32952117919922, 73.66767883300781, 76.00584411621094]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 8.0, 9.0, 13.0, 17.0, 18.0, 17.0, 19.0, 16.0, 24.0, 33.0, 39.0, 24.0, 45.0, 38.0, 32.0, 30.0, 42.0, 43.0, 41.0, 26.0, 39.0, 32.0, 27.0, 44.0, 31.0, 27.0, 34.0, 25.0, 21.0, 27.0, 16.0, 30.0, 14.0, 15.0, 15.0, 14.0, 12.0, 4.0, 3.0, 1.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.91796875, -6.6854248046875, -6.452880859375, -6.2203369140625, -5.98779296875, -5.7552490234375, -5.522705078125, -5.2901611328125, -5.0576171875, -4.8250732421875, -4.592529296875, -4.3599853515625, -4.12744140625, -3.8948974609375, -3.662353515625, -3.4298095703125, -3.197265625, -2.9647216796875, -2.732177734375, -2.4996337890625, -2.26708984375, -2.0345458984375, -1.802001953125, -1.5694580078125, -1.3369140625, -1.1043701171875, -0.871826171875, -0.6392822265625, -0.40673828125, -0.1741943359375, 0.058349609375, 0.2908935546875, 0.5234375, 0.7559814453125, 0.988525390625, 1.2210693359375, 1.45361328125, 1.6861572265625, 1.918701171875, 2.1512451171875, 2.3837890625, 2.6163330078125, 2.848876953125, 3.0814208984375, 3.31396484375, 3.5465087890625, 3.779052734375, 4.0115966796875, 4.244140625, 4.4766845703125, 4.709228515625, 4.9417724609375, 5.17431640625, 5.4068603515625, 5.639404296875, 5.8719482421875, 6.1044921875, 6.3370361328125, 6.569580078125, 6.8021240234375, 7.03466796875, 7.2672119140625, 7.499755859375, 7.7322998046875, 7.96484375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 9.0, 12.0, 5.0, 7.0, 8.0, 13.0, 15.0, 17.0, 25.0, 11.0, 27.0, 31.0, 38.0, 25.0, 33.0, 57.0, 91.0, 301.0, 1151.0, 6002.0, 100222.0, 2837205.0, 1218902.0, 25788.0, 2915.0, 740.0, 223.0, 87.0, 51.0, 33.0, 34.0, 20.0, 33.0, 16.0, 19.0, 23.0, 14.0, 21.0, 9.0, 12.0, 10.0, 6.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-25.734375, -24.899169921875, -24.06396484375, -23.228759765625, -22.3935546875, -21.558349609375, -20.72314453125, -19.887939453125, -19.052734375, -18.217529296875, -17.38232421875, -16.547119140625, -15.7119140625, -14.876708984375, -14.04150390625, -13.206298828125, -12.37109375, -11.535888671875, -10.70068359375, -9.865478515625, -9.0302734375, -8.195068359375, -7.35986328125, -6.524658203125, -5.689453125, -4.854248046875, -4.01904296875, -3.183837890625, -2.3486328125, -1.513427734375, -0.67822265625, 0.156982421875, 0.9921875, 1.827392578125, 2.66259765625, 3.497802734375, 4.3330078125, 5.168212890625, 6.00341796875, 6.838623046875, 7.673828125, 8.509033203125, 9.34423828125, 10.179443359375, 11.0146484375, 11.849853515625, 12.68505859375, 13.520263671875, 14.35546875, 15.190673828125, 16.02587890625, 16.861083984375, 17.6962890625, 18.531494140625, 19.36669921875, 20.201904296875, 21.037109375, 21.872314453125, 22.70751953125, 23.542724609375, 24.3779296875, 25.213134765625, 26.04833984375, 26.883544921875, 27.71875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 1.0, 6.0, 14.0, 11.0, 15.0, 9.0, 28.0, 34.0, 43.0, 46.0, 68.0, 94.0, 107.0, 182.0, 228.0, 336.0, 396.0, 493.0, 483.0, 384.0, 298.0, 217.0, 150.0, 105.0, 85.0, 83.0, 53.0, 38.0, 16.0, 18.0, 14.0, 5.0, 7.0, 5.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.53125, -12.026123046875, -11.52099609375, -11.015869140625, -10.5107421875, -10.005615234375, -9.50048828125, -8.995361328125, -8.490234375, -7.985107421875, -7.47998046875, -6.974853515625, -6.4697265625, -5.964599609375, -5.45947265625, -4.954345703125, -4.44921875, -3.944091796875, -3.43896484375, -2.933837890625, -2.4287109375, -1.923583984375, -1.41845703125, -0.913330078125, -0.408203125, 0.096923828125, 0.60205078125, 1.107177734375, 1.6123046875, 2.117431640625, 2.62255859375, 3.127685546875, 3.6328125, 4.137939453125, 4.64306640625, 5.148193359375, 5.6533203125, 6.158447265625, 6.66357421875, 7.168701171875, 7.673828125, 8.178955078125, 8.68408203125, 9.189208984375, 9.6943359375, 10.199462890625, 10.70458984375, 11.209716796875, 11.71484375, 12.219970703125, 12.72509765625, 13.230224609375, 13.7353515625, 14.240478515625, 14.74560546875, 15.250732421875, 15.755859375, 16.260986328125, 16.76611328125, 17.271240234375, 17.7763671875, 18.281494140625, 18.78662109375, 19.291748046875, 19.796875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 8.0, 3.0, 7.0, 7.0, 13.0, 18.0, 21.0, 31.0, 46.0, 64.0, 70.0, 105.0, 134.0, 175.0, 233.0, 334.0, 614.0, 2358.0, 482984.0, 3697316.0, 7537.0, 829.0, 377.0, 249.0, 166.0, 131.0, 89.0, 86.0, 57.0, 53.0, 37.0, 26.0, 25.0, 32.0, 9.0, 9.0, 15.0, 4.0, 8.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.875, -66.591796875, -64.30859375, -62.025390625, -59.7421875, -57.458984375, -55.17578125, -52.892578125, -50.609375, -48.326171875, -46.04296875, -43.759765625, -41.4765625, -39.193359375, -36.91015625, -34.626953125, -32.34375, -30.060546875, -27.77734375, -25.494140625, -23.2109375, -20.927734375, -18.64453125, -16.361328125, -14.078125, -11.794921875, -9.51171875, -7.228515625, -4.9453125, -2.662109375, -0.37890625, 1.904296875, 4.1875, 6.470703125, 8.75390625, 11.037109375, 13.3203125, 15.603515625, 17.88671875, 20.169921875, 22.453125, 24.736328125, 27.01953125, 29.302734375, 31.5859375, 33.869140625, 36.15234375, 38.435546875, 40.71875, 43.001953125, 45.28515625, 47.568359375, 49.8515625, 52.134765625, 54.41796875, 56.701171875, 58.984375, 61.267578125, 63.55078125, 65.833984375, 68.1171875, 70.400390625, 72.68359375, 74.966796875, 77.25]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 8.0, 10.0, 47.0, 84.0, 179.0, 228.0, 195.0, 146.0, 70.0, 24.0, 12.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.67079162597656, -94.01847076416016, -90.36614990234375, -86.71383666992188, -83.06151580810547, -79.40919494628906, -75.75687408447266, -72.10455322265625, -68.45223236083984, -64.79991149902344, -61.1475944519043, -57.49527359008789, -53.842952728271484, -50.190635681152344, -46.53831481933594, -42.88599395751953, -39.23367691040039, -35.581356048583984, -31.92903709411621, -28.276718139648438, -24.62439727783203, -20.972078323364258, -17.319759368896484, -13.667438507080078, -10.015119552612305, -6.362799644470215, -2.710480213165283, 0.9418392181396484, 4.594159126281738, 8.246479034423828, 11.898797988891602, 15.551118850708008, 19.20343780517578, 22.855756759643555, 26.50807762145996, 30.160396575927734, 33.81271743774414, 37.46503448486328, 41.11735534667969, 44.769676208496094, 48.4219970703125, 52.074317932128906, 55.72663497924805, 59.37895584106445, 63.03127670288086, 66.68359375, 70.3359146118164, 73.98823547363281, 77.64054870605469, 81.2928695678711, 84.9451904296875, 88.59750366210938, 92.24982452392578, 95.90214538574219, 99.5544662475586, 103.206787109375, 106.8591079711914, 110.51142883300781, 114.16374969482422, 117.81607055664062, 121.4683837890625, 125.1207046508789, 128.7730255126953, 132.42535400390625, 136.07766723632812]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 2.0, 7.0, 8.0, 6.0, 9.0, 8.0, 14.0, 14.0, 19.0, 25.0, 18.0, 22.0, 19.0, 27.0, 21.0, 30.0, 25.0, 32.0, 21.0, 41.0, 40.0, 38.0, 46.0, 34.0, 39.0, 35.0, 37.0, 30.0, 28.0, 31.0, 29.0, 25.0, 27.0, 26.0, 23.0, 16.0, 27.0, 15.0, 10.0, 11.0, 11.0, 14.0, 6.0, 5.0, 6.0, 5.0, 3.0, 4.0, 4.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-44.66520309448242, -43.26557159423828, -41.865936279296875, -40.466304779052734, -39.066673278808594, -37.66703796386719, -36.26740646362305, -34.867774963378906, -33.4681396484375, -32.06850814819336, -30.668874740600586, -29.269241333007812, -27.869609832763672, -26.4699764251709, -25.070343017578125, -23.670711517333984, -22.271080017089844, -20.87144660949707, -19.47181510925293, -18.072181701660156, -16.672550201416016, -15.272916793823242, -13.873283386230469, -12.473650932312012, -11.074018478393555, -9.674386024475098, -8.27475357055664, -6.875120162963867, -5.47548770904541, -4.075855255126953, -2.6762218475341797, -1.2765893936157227, 0.12303924560546875, 1.5226719379425049, 2.922304630279541, 4.321937561035156, 5.721570014953613, 7.12120246887207, 8.520835876464844, 9.9204683303833, 11.320100784301758, 12.719733238220215, 14.119365692138672, 15.518999099731445, 16.91863250732422, 18.31826400756836, 19.717897415161133, 21.117530822753906, 22.517162322998047, 23.91679573059082, 25.31642723083496, 26.716060638427734, 28.115692138671875, 29.51532554626465, 30.914958953857422, 32.31459045410156, 33.71422576904297, 35.11385726928711, 36.513492584228516, 37.913124084472656, 39.3127555847168, 40.71238708496094, 42.112022399902344, 43.511653900146484, 44.911285400390625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 6.0, 5.0, 8.0, 9.0, 11.0, 12.0, 17.0, 12.0, 13.0, 14.0, 30.0, 21.0, 34.0, 40.0, 17.0, 37.0, 39.0, 43.0, 36.0, 42.0, 37.0, 35.0, 44.0, 33.0, 31.0, 30.0, 29.0, 31.0, 37.0, 29.0, 22.0, 22.0, 26.0, 21.0, 16.0, 17.0, 19.0, 17.0, 15.0, 8.0, 8.0, 7.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.73046875, -6.5057373046875, -6.281005859375, -6.0562744140625, -5.83154296875, -5.6068115234375, -5.382080078125, -5.1573486328125, -4.9326171875, -4.7078857421875, -4.483154296875, -4.2584228515625, -4.03369140625, -3.8089599609375, -3.584228515625, -3.3594970703125, -3.134765625, -2.9100341796875, -2.685302734375, -2.4605712890625, -2.23583984375, -2.0111083984375, -1.786376953125, -1.5616455078125, -1.3369140625, -1.1121826171875, -0.887451171875, -0.6627197265625, -0.43798828125, -0.2132568359375, 0.011474609375, 0.2362060546875, 0.4609375, 0.6856689453125, 0.910400390625, 1.1351318359375, 1.35986328125, 1.5845947265625, 1.809326171875, 2.0340576171875, 2.2587890625, 2.4835205078125, 2.708251953125, 2.9329833984375, 3.15771484375, 3.3824462890625, 3.607177734375, 3.8319091796875, 4.056640625, 4.2813720703125, 4.506103515625, 4.7308349609375, 4.95556640625, 5.1802978515625, 5.405029296875, 5.6297607421875, 5.8544921875, 6.0792236328125, 6.303955078125, 6.5286865234375, 6.75341796875, 6.9781494140625, 7.202880859375, 7.4276123046875, 7.65234375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 6.0, 13.0, 13.0, 31.0, 63.0, 80.0, 135.0, 196.0, 282.0, 530.0, 719.0, 1143.0, 1699.0, 2689.0, 3944.0, 5913.0, 8764.0, 13254.0, 20579.0, 31210.0, 47709.0, 72824.0, 111570.0, 180168.0, 194906.0, 121791.0, 78296.0, 51532.0, 33485.0, 21991.0, 14623.0, 9597.0, 6306.0, 4238.0, 2816.0, 1886.0, 1227.0, 822.0, 505.0, 352.0, 235.0, 160.0, 84.0, 56.0, 49.0, 24.0, 14.0, 12.0, 5.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0028076171875, -0.969482421875, -0.9361572265625, -0.90283203125, -0.8695068359375, -0.836181640625, -0.8028564453125, -0.76953125, -0.7362060546875, -0.702880859375, -0.6695556640625, -0.63623046875, -0.6029052734375, -0.569580078125, -0.5362548828125, -0.5029296875, -0.4696044921875, -0.436279296875, -0.4029541015625, -0.36962890625, -0.3363037109375, -0.302978515625, -0.2696533203125, -0.236328125, -0.2030029296875, -0.169677734375, -0.1363525390625, -0.10302734375, -0.0697021484375, -0.036376953125, -0.0030517578125, 0.0302734375, 0.0635986328125, 0.096923828125, 0.1302490234375, 0.16357421875, 0.1968994140625, 0.230224609375, 0.2635498046875, 0.296875, 0.3302001953125, 0.363525390625, 0.3968505859375, 0.43017578125, 0.4635009765625, 0.496826171875, 0.5301513671875, 0.5634765625, 0.5968017578125, 0.630126953125, 0.6634521484375, 0.69677734375, 0.7301025390625, 0.763427734375, 0.7967529296875, 0.830078125, 0.8634033203125, 0.896728515625, 0.9300537109375, 0.96337890625, 0.9967041015625, 1.030029296875, 1.0633544921875, 1.0966796875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 1.0, 7.0, 9.0, 13.0, 7.0, 7.0, 15.0, 15.0, 17.0, 22.0, 23.0, 34.0, 31.0, 28.0, 31.0, 34.0, 41.0, 39.0, 40.0, 40.0, 45.0, 1068.0, 39.0, 49.0, 32.0, 42.0, 39.0, 34.0, 27.0, 33.0, 21.0, 19.0, 15.0, 18.0, 23.0, 16.0, 13.0, 11.0, 8.0, 11.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1484375, -4.98284912109375, -4.8172607421875, -4.65167236328125, -4.486083984375, -4.32049560546875, -4.1549072265625, -3.98931884765625, -3.82373046875, -3.65814208984375, -3.4925537109375, -3.32696533203125, -3.161376953125, -2.99578857421875, -2.8302001953125, -2.66461181640625, -2.4990234375, -2.33343505859375, -2.1678466796875, -2.00225830078125, -1.836669921875, -1.67108154296875, -1.5054931640625, -1.33990478515625, -1.17431640625, -1.00872802734375, -0.8431396484375, -0.67755126953125, -0.511962890625, -0.34637451171875, -0.1807861328125, -0.01519775390625, 0.150390625, 0.31597900390625, 0.4815673828125, 0.64715576171875, 0.812744140625, 0.97833251953125, 1.1439208984375, 1.30950927734375, 1.47509765625, 1.64068603515625, 1.8062744140625, 1.97186279296875, 2.137451171875, 2.30303955078125, 2.4686279296875, 2.63421630859375, 2.7998046875, 2.96539306640625, 3.1309814453125, 3.29656982421875, 3.462158203125, 3.62774658203125, 3.7933349609375, 3.95892333984375, 4.12451171875, 4.29010009765625, 4.4556884765625, 4.62127685546875, 4.786865234375, 4.95245361328125, 5.1180419921875, 5.28363037109375, 5.44921875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 11.0, 14.0, 31.0, 38.0, 58.0, 74.0, 125.0, 173.0, 250.0, 349.0, 576.0, 900.0, 1331.0, 2092.0, 3159.0, 4913.0, 7306.0, 11623.0, 17846.0, 27776.0, 44486.0, 70525.0, 111512.0, 176367.0, 1251410.0, 133307.0, 84631.0, 52667.0, 33453.0, 21090.0, 13559.0, 8772.0, 5691.0, 3759.0, 2401.0, 1646.0, 1064.0, 725.0, 463.0, 335.0, 207.0, 138.0, 94.0, 49.0, 45.0, 28.0, 26.0, 9.0, 15.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.048828125, -1.0162506103515625, -0.983673095703125, -0.9510955810546875, -0.91851806640625, -0.8859405517578125, -0.853363037109375, -0.8207855224609375, -0.7882080078125, -0.7556304931640625, -0.723052978515625, -0.6904754638671875, -0.65789794921875, -0.6253204345703125, -0.592742919921875, -0.5601654052734375, -0.527587890625, -0.4950103759765625, -0.462432861328125, -0.4298553466796875, -0.39727783203125, -0.3647003173828125, -0.332122802734375, -0.2995452880859375, -0.2669677734375, -0.2343902587890625, -0.201812744140625, -0.1692352294921875, -0.13665771484375, -0.1040802001953125, -0.071502685546875, -0.0389251708984375, -0.00634765625, 0.0262298583984375, 0.058807373046875, 0.0913848876953125, 0.12396240234375, 0.1565399169921875, 0.189117431640625, 0.2216949462890625, 0.2542724609375, 0.2868499755859375, 0.319427490234375, 0.3520050048828125, 0.38458251953125, 0.4171600341796875, 0.449737548828125, 0.4823150634765625, 0.514892578125, 0.5474700927734375, 0.580047607421875, 0.6126251220703125, 0.64520263671875, 0.6777801513671875, 0.710357666015625, 0.7429351806640625, 0.7755126953125, 0.8080902099609375, 0.840667724609375, 0.8732452392578125, 0.90582275390625, 0.9384002685546875, 0.970977783203125, 1.0035552978515625, 1.0361328125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 7.0, 2.0, 5.0, 7.0, 12.0, 12.0, 18.0, 26.0, 23.0, 25.0, 30.0, 50.0, 39.0, 41.0, 59.0, 70.0, 67.0, 80.0, 70.0, 58.0, 58.0, 46.0, 40.0, 34.0, 28.0, 12.0, 15.0, 16.0, 16.0, 13.0, 3.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002178192138671875, -0.0021116137504577637, -0.0020450353622436523, -0.001978456974029541, -0.0019118785858154297, -0.0018453001976013184, -0.001778721809387207, -0.0017121434211730957, -0.0016455650329589844, -0.001578986644744873, -0.0015124082565307617, -0.0014458298683166504, -0.001379251480102539, -0.0013126730918884277, -0.0012460947036743164, -0.001179516315460205, -0.0011129379272460938, -0.0010463595390319824, -0.000979781150817871, -0.0009132027626037598, -0.0008466243743896484, -0.0007800459861755371, -0.0007134675979614258, -0.0006468892097473145, -0.0005803108215332031, -0.0005137324333190918, -0.00044715404510498047, -0.00038057565689086914, -0.0003139972686767578, -0.0002474188804626465, -0.00018084049224853516, -0.00011426210403442383, -4.76837158203125e-05, 1.8894672393798828e-05, 8.547306060791016e-05, 0.00015205144882202148, 0.0002186298370361328, 0.00028520822525024414, 0.00035178661346435547, 0.0004183650016784668, 0.0004849433898925781, 0.0005515217781066895, 0.0006181001663208008, 0.0006846785545349121, 0.0007512569427490234, 0.0008178353309631348, 0.0008844137191772461, 0.0009509921073913574, 0.0010175704956054688, 0.00108414888381958, 0.0011507272720336914, 0.0012173056602478027, 0.001283884048461914, 0.0013504624366760254, 0.0014170408248901367, 0.001483619213104248, 0.0015501976013183594, 0.0016167759895324707, 0.001683354377746582, 0.0017499327659606934, 0.0018165111541748047, 0.001883089542388916, 0.0019496679306030273, 0.0020162463188171387, 0.00208282470703125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 4.0, 8.0, 10.0, 7.0, 14.0, 14.0, 12.0, 22.0, 30.0, 36.0, 45.0, 66.0, 99.0, 184.0, 419.0, 3466.0, 1039629.0, 3568.0, 390.0, 169.0, 88.0, 66.0, 43.0, 34.0, 35.0, 28.0, 17.0, 14.0, 10.0, 6.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045257568359375, -0.043612003326416016, -0.04196643829345703, -0.04032087326049805, -0.03867530822753906, -0.03702974319458008, -0.035384178161621094, -0.03373861312866211, -0.032093048095703125, -0.03044748306274414, -0.028801918029785156, -0.027156352996826172, -0.025510787963867188, -0.023865222930908203, -0.02221965789794922, -0.020574092864990234, -0.01892852783203125, -0.017282962799072266, -0.01563739776611328, -0.013991832733154297, -0.012346267700195312, -0.010700702667236328, -0.009055137634277344, -0.007409572601318359, -0.005764007568359375, -0.004118442535400391, -0.0024728775024414062, -0.0008273124694824219, 0.0008182525634765625, 0.002463817596435547, 0.004109382629394531, 0.005754947662353516, 0.0074005126953125, 0.009046077728271484, 0.010691642761230469, 0.012337207794189453, 0.013982772827148438, 0.015628337860107422, 0.017273902893066406, 0.01891946792602539, 0.020565032958984375, 0.02221059799194336, 0.023856163024902344, 0.025501728057861328, 0.027147293090820312, 0.028792858123779297, 0.03043842315673828, 0.032083988189697266, 0.03372955322265625, 0.035375118255615234, 0.03702068328857422, 0.0386662483215332, 0.04031181335449219, 0.04195737838745117, 0.043602943420410156, 0.04524850845336914, 0.046894073486328125, 0.04853963851928711, 0.050185203552246094, 0.05183076858520508, 0.05347633361816406, 0.05512189865112305, 0.05676746368408203, 0.058413028717041016, 0.06005859375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 14.0, 35.0, 103.0, 228.0, 309.0, 198.0, 84.0, 33.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004105939995497465, -0.004026070237159729, -0.003946200478821993, -0.0038663307204842567, -0.0037864609621465206, -0.0037065912038087845, -0.0036267214454710484, -0.0035468516871333122, -0.003466981928795576, -0.00338711217045784, -0.003307242412120104, -0.0032273726537823677, -0.0031475028954446316, -0.0030676331371068954, -0.0029877633787691593, -0.002907893620431423, -0.0028280240949243307, -0.0027481543365865946, -0.0026682845782488585, -0.0025884148199111223, -0.002508545061573386, -0.00242867530323565, -0.002348805544897914, -0.0022689360193908215, -0.0021890662610530853, -0.002109196502715349, -0.002029326744377613, -0.001949456986039877, -0.0018695872277021408, -0.0017897174693644047, -0.0017098478274419904, -0.0016299780691042542, -0.0015501080779358745, -0.0014702383195981383, -0.0013903685612604022, -0.001310498802922666, -0.0012306291610002518, -0.0011507594026625156, -0.0010708896443247795, -0.0009910198859870434, -0.0009111501276493073, -0.0008312803693115711, -0.000751410610973835, -0.0006715409108437598, -0.0005916711525060236, -0.0005118013941682875, -0.00043193166493438184, -0.00035206193570047617, -0.00027219217736274004, -0.00019232243357691914, -0.00011245268979109824, -3.2582946005277336e-05, 4.7286797780543566e-05, 0.0001271565561182797, 0.00020702628535218537, 0.00028689601458609104, 0.00036676577292382717, 0.0004466355312615633, 0.0005265052895992994, 0.0006063749897293746, 0.0006862447480671108, 0.0007661145064048469, 0.0008459842065349221, 0.0009258539648726583, 0.0010057237232103944]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 6.0, 7.0, 4.0, 8.0, 7.0, 16.0, 9.0, 15.0, 17.0, 11.0, 25.0, 20.0, 21.0, 37.0, 32.0, 26.0, 46.0, 32.0, 33.0, 38.0, 49.0, 37.0, 31.0, 36.0, 36.0, 34.0, 35.0, 41.0, 37.0, 29.0, 31.0, 24.0, 27.0, 19.0, 20.0, 16.0, 12.0, 11.0, 12.0, 11.0, 13.0, 6.0, 9.0, 4.0, 4.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008845329284667969, -0.0008559860289096832, -0.0008274391293525696, -0.0007988922297954559, -0.0007703453302383423, -0.0007417984306812286, -0.000713251531124115, -0.0006847046315670013, -0.0006561577320098877, -0.000627610832452774, -0.0005990639328956604, -0.0005705170333385468, -0.0005419701337814331, -0.0005134232342243195, -0.0004848763346672058, -0.00045632943511009216, -0.0004277825355529785, -0.00039923563599586487, -0.0003706887364387512, -0.0003421418368816376, -0.0003135949373245239, -0.0002850480377674103, -0.00025650113821029663, -0.00022795423865318298, -0.00019940733909606934, -0.0001708604395389557, -0.00014231353998184204, -0.0001137666404247284, -8.521974086761475e-05, -5.66728413105011e-05, -2.812594175338745e-05, 4.209578037261963e-07, 2.8967857360839844e-05, 5.751475691795349e-05, 8.606165647506714e-05, 0.00011460855603218079, 0.00014315545558929443, 0.00017170235514640808, 0.00020024925470352173, 0.00022879615426063538, 0.000257343053817749, 0.00028588995337486267, 0.0003144368529319763, 0.00034298375248908997, 0.0003715306520462036, 0.00040007755160331726, 0.0004286244511604309, 0.00045717135071754456, 0.0004857182502746582, 0.0005142651498317719, 0.0005428120493888855, 0.0005713589489459991, 0.0005999058485031128, 0.0006284527480602264, 0.0006569996476173401, 0.0006855465471744537, 0.0007140934467315674, 0.000742640346288681, 0.0007711872458457947, 0.0007997341454029083, 0.000828281044960022, 0.0008568279445171356, 0.0008853748440742493, 0.0009139217436313629, 0.0009424686431884766]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 6.0, 5.0, 8.0, 9.0, 11.0, 12.0, 17.0, 12.0, 13.0, 14.0, 30.0, 21.0, 34.0, 40.0, 17.0, 37.0, 39.0, 43.0, 36.0, 42.0, 37.0, 35.0, 44.0, 33.0, 31.0, 30.0, 29.0, 31.0, 37.0, 29.0, 22.0, 22.0, 26.0, 21.0, 17.0, 16.0, 19.0, 17.0, 15.0, 8.0, 7.0, 8.0, 7.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.73046875, -6.5057373046875, -6.281005859375, -6.0562744140625, -5.83154296875, -5.6068115234375, -5.382080078125, -5.1573486328125, -4.9326171875, -4.7078857421875, -4.483154296875, -4.2584228515625, -4.03369140625, -3.8089599609375, -3.584228515625, -3.3594970703125, -3.134765625, -2.9100341796875, -2.685302734375, -2.4605712890625, -2.23583984375, -2.0111083984375, -1.786376953125, -1.5616455078125, -1.3369140625, -1.1121826171875, -0.887451171875, -0.6627197265625, -0.43798828125, -0.2132568359375, 0.011474609375, 0.2362060546875, 0.4609375, 0.6856689453125, 0.910400390625, 1.1351318359375, 1.35986328125, 1.5845947265625, 1.809326171875, 2.0340576171875, 2.2587890625, 2.4835205078125, 2.708251953125, 2.9329833984375, 3.15771484375, 3.3824462890625, 3.607177734375, 3.8319091796875, 4.056640625, 4.2813720703125, 4.506103515625, 4.7308349609375, 4.95556640625, 5.1802978515625, 5.405029296875, 5.6297607421875, 5.8544921875, 6.0792236328125, 6.303955078125, 6.5286865234375, 6.75341796875, 6.9781494140625, 7.202880859375, 7.4276123046875, 7.65234375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 16.0, 15.0, 17.0, 40.0, 45.0, 61.0, 81.0, 109.0, 135.0, 193.0, 284.0, 427.0, 632.0, 997.0, 1807.0, 3298.0, 6005.0, 12248.0, 26092.0, 61734.0, 165667.0, 399695.0, 223175.0, 80697.0, 33321.0, 14836.0, 7340.0, 3862.0, 2121.0, 1256.0, 732.0, 469.0, 347.0, 208.0, 163.0, 104.0, 80.0, 68.0, 38.0, 32.0, 24.0, 22.0, 13.0, 14.0, 12.0, 4.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.45599365234375, -4.2947998046875, -4.13360595703125, -3.972412109375, -3.81121826171875, -3.6500244140625, -3.48883056640625, -3.32763671875, -3.16644287109375, -3.0052490234375, -2.84405517578125, -2.682861328125, -2.52166748046875, -2.3604736328125, -2.19927978515625, -2.0380859375, -1.87689208984375, -1.7156982421875, -1.55450439453125, -1.393310546875, -1.23211669921875, -1.0709228515625, -0.90972900390625, -0.74853515625, -0.58734130859375, -0.4261474609375, -0.26495361328125, -0.103759765625, 0.05743408203125, 0.2186279296875, 0.37982177734375, 0.541015625, 0.70220947265625, 0.8634033203125, 1.02459716796875, 1.185791015625, 1.34698486328125, 1.5081787109375, 1.66937255859375, 1.83056640625, 1.99176025390625, 2.1529541015625, 2.31414794921875, 2.475341796875, 2.63653564453125, 2.7977294921875, 2.95892333984375, 3.1201171875, 3.28131103515625, 3.4425048828125, 3.60369873046875, 3.764892578125, 3.92608642578125, 4.0872802734375, 4.24847412109375, 4.40966796875, 4.57086181640625, 4.7320556640625, 4.89324951171875, 5.054443359375, 5.21563720703125, 5.3768310546875, 5.53802490234375, 5.69921875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 6.0, 6.0, 11.0, 9.0, 15.0, 13.0, 18.0, 16.0, 19.0, 21.0, 16.0, 25.0, 30.0, 28.0, 35.0, 37.0, 49.0, 67.0, 75.0, 242.0, 1632.0, 147.0, 70.0, 60.0, 42.0, 37.0, 38.0, 29.0, 40.0, 29.0, 30.0, 19.0, 12.0, 18.0, 23.0, 13.0, 9.0, 7.0, 9.0, 13.0, 6.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.84375, -21.146484375, -20.44921875, -19.751953125, -19.0546875, -18.357421875, -17.66015625, -16.962890625, -16.265625, -15.568359375, -14.87109375, -14.173828125, -13.4765625, -12.779296875, -12.08203125, -11.384765625, -10.6875, -9.990234375, -9.29296875, -8.595703125, -7.8984375, -7.201171875, -6.50390625, -5.806640625, -5.109375, -4.412109375, -3.71484375, -3.017578125, -2.3203125, -1.623046875, -0.92578125, -0.228515625, 0.46875, 1.166015625, 1.86328125, 2.560546875, 3.2578125, 3.955078125, 4.65234375, 5.349609375, 6.046875, 6.744140625, 7.44140625, 8.138671875, 8.8359375, 9.533203125, 10.23046875, 10.927734375, 11.625, 12.322265625, 13.01953125, 13.716796875, 14.4140625, 15.111328125, 15.80859375, 16.505859375, 17.203125, 17.900390625, 18.59765625, 19.294921875, 19.9921875, 20.689453125, 21.38671875, 22.083984375, 22.78125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 0.0, 4.0, 2.0, 2.0, 9.0, 3.0, 0.0, 10.0, 15.0, 7.0, 17.0, 30.0, 39.0, 45.0, 70.0, 70.0, 136.0, 173.0, 236.0, 366.0, 676.0, 7416.0, 3113837.0, 20469.0, 821.0, 376.0, 246.0, 164.0, 108.0, 89.0, 78.0, 48.0, 39.0, 26.0, 19.0, 16.0, 14.0, 8.0, 8.0, 8.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.875, -64.5361328125, -62.197265625, -59.8583984375, -57.51953125, -55.1806640625, -52.841796875, -50.5029296875, -48.1640625, -45.8251953125, -43.486328125, -41.1474609375, -38.80859375, -36.4697265625, -34.130859375, -31.7919921875, -29.453125, -27.1142578125, -24.775390625, -22.4365234375, -20.09765625, -17.7587890625, -15.419921875, -13.0810546875, -10.7421875, -8.4033203125, -6.064453125, -3.7255859375, -1.38671875, 0.9521484375, 3.291015625, 5.6298828125, 7.96875, 10.3076171875, 12.646484375, 14.9853515625, 17.32421875, 19.6630859375, 22.001953125, 24.3408203125, 26.6796875, 29.0185546875, 31.357421875, 33.6962890625, 36.03515625, 38.3740234375, 40.712890625, 43.0517578125, 45.390625, 47.7294921875, 50.068359375, 52.4072265625, 54.74609375, 57.0849609375, 59.423828125, 61.7626953125, 64.1015625, 66.4404296875, 68.779296875, 71.1181640625, 73.45703125, 75.7958984375, 78.134765625, 80.4736328125, 82.8125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 29.0, 815.0, 172.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.58217430114746, -12.40479850769043, -5.227422714233398, 1.9499530792236328, 9.127328872680664, 16.304704666137695, 23.482080459594727, 30.659456253051758, 37.836830139160156, 45.01420593261719, 52.19158172607422, 59.36895751953125, 66.54633331298828, 73.72370910644531, 80.90108489990234, 88.07846069335938, 95.2558364868164, 102.43321228027344, 109.61058807373047, 116.7879638671875, 123.96533966064453, 131.14271545410156, 138.32009887695312, 145.49746704101562, 152.6748504638672, 159.85223388671875, 167.02960205078125, 174.20697021484375, 181.3843536376953, 188.56173706054688, 195.73910522460938, 202.91647338867188, 210.09384155273438, 217.27120971679688, 224.44859313964844, 231.6259765625, 238.8033447265625, 245.980712890625, 253.15809631347656, 260.3354797363281, 267.5128479003906, 274.6902160644531, 281.86761474609375, 289.04498291015625, 296.22235107421875, 303.39971923828125, 310.57708740234375, 317.7544860839844, 324.9318542480469, 332.1092224121094, 339.28662109375, 346.4639892578125, 353.641357421875, 360.8187255859375, 367.99609375, 375.1734924316406, 382.3508605957031, 389.5282287597656, 396.70562744140625, 403.88299560546875, 411.06036376953125, 418.23773193359375, 425.41510009765625, 432.5924987792969, 439.7698669433594]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 9.0, 7.0, 9.0, 8.0, 13.0, 13.0, 14.0, 21.0, 16.0, 25.0, 25.0, 35.0, 35.0, 43.0, 39.0, 55.0, 44.0, 42.0, 51.0, 57.0, 36.0, 47.0, 34.0, 40.0, 37.0, 34.0, 42.0, 29.0, 31.0, 17.0, 19.0, 13.0, 20.0, 10.0, 5.0, 4.0, 10.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-76.5431900024414, -74.22920989990234, -71.91523742675781, -69.60125732421875, -67.28728485107422, -64.97330474853516, -62.659332275390625, -60.34535217285156, -58.03137969970703, -55.717403411865234, -53.40342712402344, -51.08945083618164, -48.775474548339844, -46.46149826049805, -44.14752197265625, -41.83354187011719, -39.51956558227539, -37.205589294433594, -34.8916130065918, -32.57763671875, -30.263660430908203, -27.949684143066406, -25.635705947875977, -23.32172966003418, -21.007753372192383, -18.693777084350586, -16.37980079650879, -14.065823554992676, -11.751847267150879, -9.437870979309082, -7.123893737792969, -4.809917449951172, -2.495941162109375, -0.18196463584899902, 2.132011890411377, 4.445988655090332, 6.759964942932129, 9.073941230773926, 11.387918472290039, 13.701894760131836, 16.015871047973633, 18.32984733581543, 20.643823623657227, 22.957801818847656, 25.271778106689453, 27.58575439453125, 29.899730682373047, 32.213706970214844, 34.52768325805664, 36.84165954589844, 39.155635833740234, 41.46961212158203, 43.78358840942383, 46.097564697265625, 48.41154479980469, 50.72551727294922, 53.03949737548828, 55.35347366333008, 57.667449951171875, 59.98142623901367, 62.29540252685547, 64.60938262939453, 66.92335510253906, 69.23733520507812, 71.55130767822266]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 11.0, 8.0, 9.0, 11.0, 13.0, 8.0, 15.0, 16.0, 13.0, 20.0, 20.0, 37.0, 25.0, 39.0, 32.0, 29.0, 41.0, 35.0, 51.0, 29.0, 43.0, 38.0, 34.0, 35.0, 33.0, 29.0, 30.0, 26.0, 27.0, 35.0, 23.0, 23.0, 16.0, 15.0, 18.0, 21.0, 14.0, 11.0, 11.0, 16.0, 6.0, 5.0, 7.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.92578125, -6.697021484375, -6.46826171875, -6.239501953125, -6.0107421875, -5.781982421875, -5.55322265625, -5.324462890625, -5.095703125, -4.866943359375, -4.63818359375, -4.409423828125, -4.1806640625, -3.951904296875, -3.72314453125, -3.494384765625, -3.265625, -3.036865234375, -2.80810546875, -2.579345703125, -2.3505859375, -2.121826171875, -1.89306640625, -1.664306640625, -1.435546875, -1.206787109375, -0.97802734375, -0.749267578125, -0.5205078125, -0.291748046875, -0.06298828125, 0.165771484375, 0.39453125, 0.623291015625, 0.85205078125, 1.080810546875, 1.3095703125, 1.538330078125, 1.76708984375, 1.995849609375, 2.224609375, 2.453369140625, 2.68212890625, 2.910888671875, 3.1396484375, 3.368408203125, 3.59716796875, 3.825927734375, 4.0546875, 4.283447265625, 4.51220703125, 4.740966796875, 4.9697265625, 5.198486328125, 5.42724609375, 5.656005859375, 5.884765625, 6.113525390625, 6.34228515625, 6.571044921875, 6.7998046875, 7.028564453125, 7.25732421875, 7.486083984375, 7.71484375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 9.0, 9.0, 16.0, 7.0, 11.0, 12.0, 17.0, 13.0, 22.0, 23.0, 32.0, 46.0, 67.0, 115.0, 186.0, 369.0, 882.0, 2690.0, 11395.0, 134189.0, 2009562.0, 1911760.0, 108268.0, 10255.0, 2486.0, 841.0, 355.0, 197.0, 115.0, 65.0, 40.0, 36.0, 31.0, 23.0, 17.0, 17.0, 10.0, 16.0, 17.0, 9.0, 9.0, 12.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.75, -18.12451171875, -17.4990234375, -16.87353515625, -16.248046875, -15.62255859375, -14.9970703125, -14.37158203125, -13.74609375, -13.12060546875, -12.4951171875, -11.86962890625, -11.244140625, -10.61865234375, -9.9931640625, -9.36767578125, -8.7421875, -8.11669921875, -7.4912109375, -6.86572265625, -6.240234375, -5.61474609375, -4.9892578125, -4.36376953125, -3.73828125, -3.11279296875, -2.4873046875, -1.86181640625, -1.236328125, -0.61083984375, 0.0146484375, 0.64013671875, 1.265625, 1.89111328125, 2.5166015625, 3.14208984375, 3.767578125, 4.39306640625, 5.0185546875, 5.64404296875, 6.26953125, 6.89501953125, 7.5205078125, 8.14599609375, 8.771484375, 9.39697265625, 10.0224609375, 10.64794921875, 11.2734375, 11.89892578125, 12.5244140625, 13.14990234375, 13.775390625, 14.40087890625, 15.0263671875, 15.65185546875, 16.27734375, 16.90283203125, 17.5283203125, 18.15380859375, 18.779296875, 19.40478515625, 20.0302734375, 20.65576171875, 21.28125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 2.0, 7.0, 16.0, 5.0, 17.0, 24.0, 23.0, 35.0, 37.0, 44.0, 68.0, 80.0, 115.0, 133.0, 176.0, 215.0, 257.0, 344.0, 402.0, 358.0, 372.0, 304.0, 226.0, 187.0, 137.0, 92.0, 81.0, 62.0, 50.0, 54.0, 32.0, 28.0, 22.0, 17.0, 16.0, 8.0, 7.0, 9.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.2791748046875, -9.870849609375, -9.4625244140625, -9.05419921875, -8.6458740234375, -8.237548828125, -7.8292236328125, -7.4208984375, -7.0125732421875, -6.604248046875, -6.1959228515625, -5.78759765625, -5.3792724609375, -4.970947265625, -4.5626220703125, -4.154296875, -3.7459716796875, -3.337646484375, -2.9293212890625, -2.52099609375, -2.1126708984375, -1.704345703125, -1.2960205078125, -0.8876953125, -0.4793701171875, -0.071044921875, 0.3372802734375, 0.74560546875, 1.1539306640625, 1.562255859375, 1.9705810546875, 2.37890625, 2.7872314453125, 3.195556640625, 3.6038818359375, 4.01220703125, 4.4205322265625, 4.828857421875, 5.2371826171875, 5.6455078125, 6.0538330078125, 6.462158203125, 6.8704833984375, 7.27880859375, 7.6871337890625, 8.095458984375, 8.5037841796875, 8.912109375, 9.3204345703125, 9.728759765625, 10.1370849609375, 10.54541015625, 10.9537353515625, 11.362060546875, 11.7703857421875, 12.1787109375, 12.5870361328125, 12.995361328125, 13.4036865234375, 13.81201171875, 14.2203369140625, 14.628662109375, 15.0369873046875, 15.4453125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 11.0, 10.0, 9.0, 10.0, 28.0, 27.0, 34.0, 41.0, 52.0, 70.0, 80.0, 128.0, 121.0, 190.0, 260.0, 416.0, 923.0, 46247.0, 4109348.0, 33803.0, 820.0, 475.0, 288.0, 218.0, 155.0, 115.0, 83.0, 61.0, 62.0, 50.0, 20.0, 34.0, 28.0, 9.0, 15.0, 7.0, 8.0, 6.0, 5.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-74.625, -72.3271484375, -70.029296875, -67.7314453125, -65.43359375, -63.1357421875, -60.837890625, -58.5400390625, -56.2421875, -53.9443359375, -51.646484375, -49.3486328125, -47.05078125, -44.7529296875, -42.455078125, -40.1572265625, -37.859375, -35.5615234375, -33.263671875, -30.9658203125, -28.66796875, -26.3701171875, -24.072265625, -21.7744140625, -19.4765625, -17.1787109375, -14.880859375, -12.5830078125, -10.28515625, -7.9873046875, -5.689453125, -3.3916015625, -1.09375, 1.2041015625, 3.501953125, 5.7998046875, 8.09765625, 10.3955078125, 12.693359375, 14.9912109375, 17.2890625, 19.5869140625, 21.884765625, 24.1826171875, 26.48046875, 28.7783203125, 31.076171875, 33.3740234375, 35.671875, 37.9697265625, 40.267578125, 42.5654296875, 44.86328125, 47.1611328125, 49.458984375, 51.7568359375, 54.0546875, 56.3525390625, 58.650390625, 60.9482421875, 63.24609375, 65.5439453125, 67.841796875, 70.1396484375, 72.4375]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 9.0, 31.0, 89.0, 213.0, 249.0, 214.0, 121.0, 64.0, 12.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.55559539794922, -95.68846893310547, -91.82134246826172, -87.95421600341797, -84.08708190917969, -80.21995544433594, -76.35282897949219, -72.48570251464844, -68.61857604980469, -64.75144958496094, -60.88432312011719, -57.01719284057617, -53.15006637573242, -49.28293991088867, -45.415809631347656, -41.548683166503906, -37.681556701660156, -33.814430236816406, -29.947301864624023, -26.08017349243164, -22.21304702758789, -18.34592056274414, -14.478792190551758, -10.611663818359375, -6.744537353515625, -2.8774099349975586, 0.9897174835205078, 4.856844902038574, 8.72397232055664, 12.59109878540039, 16.458227157592773, 20.325355529785156, 24.192489624023438, 28.059616088867188, 31.92674446105957, 35.79387283325195, 39.6609992980957, 43.52812576293945, 47.39525604248047, 51.26238250732422, 55.12950897216797, 58.99663543701172, 62.86376190185547, 66.73088836669922, 70.5980224609375, 74.46514892578125, 78.332275390625, 82.19940185546875, 86.0665283203125, 89.93365478515625, 93.80078125, 97.66790771484375, 101.5350341796875, 105.40216064453125, 109.26929473876953, 113.13642120361328, 117.00354766845703, 120.87067413330078, 124.73780059814453, 128.6049346923828, 132.47206115722656, 136.3391876220703, 140.20631408691406, 144.0734405517578, 147.94056701660156]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 4.0, 6.0, 11.0, 11.0, 11.0, 22.0, 28.0, 20.0, 24.0, 25.0, 33.0, 42.0, 46.0, 45.0, 39.0, 49.0, 49.0, 47.0, 49.0, 46.0, 35.0, 64.0, 41.0, 45.0, 31.0, 34.0, 23.0, 20.0, 15.0, 17.0, 16.0, 13.0, 11.0, 9.0, 9.0, 5.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-62.331787109375, -60.52672576904297, -58.7216682434082, -56.91661071777344, -55.111549377441406, -53.306488037109375, -51.50143051147461, -49.696372985839844, -47.89131164550781, -46.08625030517578, -44.281192779541016, -42.47613525390625, -40.67107391357422, -38.86601257324219, -37.06095504760742, -35.255897521972656, -33.450836181640625, -31.645776748657227, -29.840717315673828, -28.03565788269043, -26.23059844970703, -24.425539016723633, -22.620479583740234, -20.815420150756836, -19.010360717773438, -17.20530128479004, -15.40024185180664, -13.595182418823242, -11.790122985839844, -9.985063552856445, -8.180004119873047, -6.374944686889648, -4.56988525390625, -2.7648258209228516, -0.9597663879394531, 0.8452930450439453, 2.6503524780273438, 4.455411911010742, 6.260471343994141, 8.065530776977539, 9.870590209960938, 11.675649642944336, 13.480709075927734, 15.285768508911133, 17.09082794189453, 18.89588737487793, 20.700946807861328, 22.506006240844727, 24.311065673828125, 26.116125106811523, 27.921184539794922, 29.72624397277832, 31.53130340576172, 33.33636474609375, 35.141422271728516, 36.94647979736328, 38.75154113769531, 40.556602478027344, 42.36166000366211, 44.166717529296875, 45.971778869628906, 47.77684020996094, 49.5818977355957, 51.38695526123047, 53.1920166015625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 9.0, 6.0, 17.0, 6.0, 13.0, 18.0, 19.0, 22.0, 19.0, 29.0, 29.0, 22.0, 37.0, 32.0, 36.0, 50.0, 37.0, 40.0, 33.0, 55.0, 32.0, 39.0, 31.0, 24.0, 38.0, 33.0, 20.0, 32.0, 19.0, 29.0, 18.0, 16.0, 19.0, 16.0, 15.0, 14.0, 6.0, 8.0, 13.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.70703125, -6.47802734375, -6.2490234375, -6.02001953125, -5.791015625, -5.56201171875, -5.3330078125, -5.10400390625, -4.875, -4.64599609375, -4.4169921875, -4.18798828125, -3.958984375, -3.72998046875, -3.5009765625, -3.27197265625, -3.04296875, -2.81396484375, -2.5849609375, -2.35595703125, -2.126953125, -1.89794921875, -1.6689453125, -1.43994140625, -1.2109375, -0.98193359375, -0.7529296875, -0.52392578125, -0.294921875, -0.06591796875, 0.1630859375, 0.39208984375, 0.62109375, 0.85009765625, 1.0791015625, 1.30810546875, 1.537109375, 1.76611328125, 1.9951171875, 2.22412109375, 2.453125, 2.68212890625, 2.9111328125, 3.14013671875, 3.369140625, 3.59814453125, 3.8271484375, 4.05615234375, 4.28515625, 4.51416015625, 4.7431640625, 4.97216796875, 5.201171875, 5.43017578125, 5.6591796875, 5.88818359375, 6.1171875, 6.34619140625, 6.5751953125, 6.80419921875, 7.033203125, 7.26220703125, 7.4912109375, 7.72021484375, 7.94921875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 6.0, 7.0, 14.0, 9.0, 14.0, 21.0, 41.0, 68.0, 90.0, 145.0, 238.0, 353.0, 475.0, 775.0, 1168.0, 1686.0, 2556.0, 3947.0, 5795.0, 8764.0, 12952.0, 19375.0, 29528.0, 44489.0, 67979.0, 104105.0, 161181.0, 195636.0, 133743.0, 86192.0, 56937.0, 37061.0, 24332.0, 16238.0, 11006.0, 7146.0, 4808.0, 3272.0, 2169.0, 1418.0, 917.0, 665.0, 462.0, 245.0, 165.0, 123.0, 87.0, 49.0, 34.0, 29.0, 22.0, 10.0, 9.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.98486328125, -0.9523391723632812, -0.9198150634765625, -0.8872909545898438, -0.854766845703125, -0.8222427368164062, -0.7897186279296875, -0.7571945190429688, -0.72467041015625, -0.6921463012695312, -0.6596221923828125, -0.6270980834960938, -0.594573974609375, -0.5620498657226562, -0.5295257568359375, -0.49700164794921875, -0.4644775390625, -0.43195343017578125, -0.3994293212890625, -0.36690521240234375, -0.334381103515625, -0.30185699462890625, -0.2693328857421875, -0.23680877685546875, -0.20428466796875, -0.17176055908203125, -0.1392364501953125, -0.10671234130859375, -0.074188232421875, -0.04166412353515625, -0.0091400146484375, 0.02338409423828125, 0.055908203125, 0.08843231201171875, 0.1209564208984375, 0.15348052978515625, 0.186004638671875, 0.21852874755859375, 0.2510528564453125, 0.28357696533203125, 0.31610107421875, 0.34862518310546875, 0.3811492919921875, 0.41367340087890625, 0.446197509765625, 0.47872161865234375, 0.5112457275390625, 0.5437698364257812, 0.5762939453125, 0.6088180541992188, 0.6413421630859375, 0.6738662719726562, 0.706390380859375, 0.7389144897460938, 0.7714385986328125, 0.8039627075195312, 0.83648681640625, 0.8690109252929688, 0.9015350341796875, 0.9340591430664062, 0.966583251953125, 0.9991073608398438, 1.0316314697265625, 1.0641555786132812, 1.0966796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 6.0, 5.0, 8.0, 7.0, 15.0, 3.0, 14.0, 8.0, 9.0, 11.0, 16.0, 12.0, 13.0, 27.0, 22.0, 27.0, 25.0, 30.0, 22.0, 29.0, 33.0, 43.0, 40.0, 40.0, 36.0, 1050.0, 41.0, 39.0, 43.0, 45.0, 22.0, 37.0, 30.0, 27.0, 24.0, 25.0, 20.0, 18.0, 12.0, 24.0, 10.0, 17.0, 8.0, 6.0, 9.0, 4.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.08984375, -3.95098876953125, -3.8121337890625, -3.67327880859375, -3.534423828125, -3.39556884765625, -3.2567138671875, -3.11785888671875, -2.97900390625, -2.84014892578125, -2.7012939453125, -2.56243896484375, -2.423583984375, -2.28472900390625, -2.1458740234375, -2.00701904296875, -1.8681640625, -1.72930908203125, -1.5904541015625, -1.45159912109375, -1.312744140625, -1.17388916015625, -1.0350341796875, -0.89617919921875, -0.75732421875, -0.61846923828125, -0.4796142578125, -0.34075927734375, -0.201904296875, -0.06304931640625, 0.0758056640625, 0.21466064453125, 0.353515625, 0.49237060546875, 0.6312255859375, 0.77008056640625, 0.908935546875, 1.04779052734375, 1.1866455078125, 1.32550048828125, 1.46435546875, 1.60321044921875, 1.7420654296875, 1.88092041015625, 2.019775390625, 2.15863037109375, 2.2974853515625, 2.43634033203125, 2.5751953125, 2.71405029296875, 2.8529052734375, 2.99176025390625, 3.130615234375, 3.26947021484375, 3.4083251953125, 3.54718017578125, 3.68603515625, 3.82489013671875, 3.9637451171875, 4.10260009765625, 4.241455078125, 4.38031005859375, 4.5191650390625, 4.65802001953125, 4.796875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 10.0, 14.0, 25.0, 35.0, 52.0, 77.0, 110.0, 187.0, 281.0, 436.0, 680.0, 1050.0, 1578.0, 2398.0, 3724.0, 5751.0, 8921.0, 13597.0, 20887.0, 32869.0, 51438.0, 81986.0, 130514.0, 1245213.0, 180424.0, 115427.0, 72368.0, 45296.0, 28742.0, 18470.0, 12003.0, 7745.0, 5146.0, 3389.0, 2179.0, 1432.0, 929.0, 638.0, 387.0, 277.0, 162.0, 109.0, 63.0, 37.0, 23.0, 19.0, 17.0, 7.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.041015625, -1.00933837890625, -0.9776611328125, -0.94598388671875, -0.914306640625, -0.88262939453125, -0.8509521484375, -0.81927490234375, -0.78759765625, -0.75592041015625, -0.7242431640625, -0.69256591796875, -0.660888671875, -0.62921142578125, -0.5975341796875, -0.56585693359375, -0.5341796875, -0.50250244140625, -0.4708251953125, -0.43914794921875, -0.407470703125, -0.37579345703125, -0.3441162109375, -0.31243896484375, -0.28076171875, -0.24908447265625, -0.2174072265625, -0.18572998046875, -0.154052734375, -0.12237548828125, -0.0906982421875, -0.05902099609375, -0.02734375, 0.00433349609375, 0.0360107421875, 0.06768798828125, 0.099365234375, 0.13104248046875, 0.1627197265625, 0.19439697265625, 0.22607421875, 0.25775146484375, 0.2894287109375, 0.32110595703125, 0.352783203125, 0.38446044921875, 0.4161376953125, 0.44781494140625, 0.4794921875, 0.51116943359375, 0.5428466796875, 0.57452392578125, 0.606201171875, 0.63787841796875, 0.6695556640625, 0.70123291015625, 0.73291015625, 0.76458740234375, 0.7962646484375, 0.82794189453125, 0.859619140625, 0.89129638671875, 0.9229736328125, 0.95465087890625, 0.986328125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 3.0, 11.0, 2.0, 5.0, 4.0, 12.0, 8.0, 15.0, 8.0, 16.0, 21.0, 23.0, 27.0, 34.0, 42.0, 44.0, 40.0, 61.0, 43.0, 54.0, 48.0, 54.0, 43.0, 37.0, 49.0, 48.0, 36.0, 41.0, 34.0, 28.0, 25.0, 17.0, 16.0, 14.0, 7.0, 8.0, 4.0, 3.0, 5.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0017833709716796875, -0.0017272084951400757, -0.0016710460186004639, -0.001614883542060852, -0.0015587210655212402, -0.0015025585889816284, -0.0014463961124420166, -0.0013902336359024048, -0.001334071159362793, -0.0012779086828231812, -0.0012217462062835693, -0.0011655837297439575, -0.0011094212532043457, -0.0010532587766647339, -0.000997096300125122, -0.0009409338235855103, -0.0008847713470458984, -0.0008286088705062866, -0.0007724463939666748, -0.000716283917427063, -0.0006601214408874512, -0.0006039589643478394, -0.0005477964878082275, -0.0004916340112686157, -0.0004354715347290039, -0.0003793090581893921, -0.0003231465816497803, -0.00026698410511016846, -0.00021082162857055664, -0.00015465915203094482, -9.849667549133301e-05, -4.233419895172119e-05, 1.3828277587890625e-05, 6.999075412750244e-05, 0.00012615323066711426, 0.00018231570720672607, 0.0002384781837463379, 0.0002946406602859497, 0.0003508031368255615, 0.00040696561336517334, 0.00046312808990478516, 0.000519290566444397, 0.0005754530429840088, 0.0006316155195236206, 0.0006877779960632324, 0.0007439404726028442, 0.0008001029491424561, 0.0008562654256820679, 0.0009124279022216797, 0.0009685903787612915, 0.0010247528553009033, 0.0010809153318405151, 0.001137077808380127, 0.0011932402849197388, 0.0012494027614593506, 0.0013055652379989624, 0.0013617277145385742, 0.001417890191078186, 0.0014740526676177979, 0.0015302151441574097, 0.0015863776206970215, 0.0016425400972366333, 0.0016987025737762451, 0.001754865050315857, 0.0018110275268554688]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 2.0, 5.0, 7.0, 5.0, 6.0, 12.0, 17.0, 26.0, 13.0, 27.0, 47.0, 49.0, 54.0, 64.0, 74.0, 119.0, 278.0, 696.0, 7042.0, 1034554.0, 4049.0, 626.0, 239.0, 119.0, 71.0, 72.0, 50.0, 44.0, 33.0, 17.0, 28.0, 17.0, 15.0, 18.0, 7.0, 6.0, 11.0, 6.0, 2.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04229736328125, -0.040993690490722656, -0.03969001770019531, -0.03838634490966797, -0.037082672119140625, -0.03577899932861328, -0.03447532653808594, -0.033171653747558594, -0.03186798095703125, -0.030564308166503906, -0.029260635375976562, -0.02795696258544922, -0.026653289794921875, -0.02534961700439453, -0.024045944213867188, -0.022742271423339844, -0.0214385986328125, -0.020134925842285156, -0.018831253051757812, -0.01752758026123047, -0.016223907470703125, -0.014920234680175781, -0.013616561889648438, -0.012312889099121094, -0.01100921630859375, -0.009705543518066406, -0.008401870727539062, -0.007098197937011719, -0.005794525146484375, -0.004490852355957031, -0.0031871795654296875, -0.0018835067749023438, -0.000579833984375, 0.0007238388061523438, 0.0020275115966796875, 0.0033311843872070312, 0.004634857177734375, 0.005938529968261719, 0.0072422027587890625, 0.008545875549316406, 0.00984954833984375, 0.011153221130371094, 0.012456893920898438, 0.013760566711425781, 0.015064239501953125, 0.01636791229248047, 0.017671585083007812, 0.018975257873535156, 0.0202789306640625, 0.021582603454589844, 0.022886276245117188, 0.02418994903564453, 0.025493621826171875, 0.02679729461669922, 0.028100967407226562, 0.029404640197753906, 0.03070831298828125, 0.032011985778808594, 0.03331565856933594, 0.03461933135986328, 0.035923004150390625, 0.03722667694091797, 0.03853034973144531, 0.039834022521972656, 0.0411376953125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 82.0, 609.0, 306.0, 14.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010601067915558815, -0.010411077179014683, -0.010221085511147976, -0.010031094774603844, -0.009841103106737137, -0.009651112370193005, -0.009461120702326298, -0.009271129965782166, -0.009081138297915459, -0.008891147561371326, -0.00870115589350462, -0.008511165156960487, -0.00832117348909378, -0.008131182752549648, -0.007941191084682941, -0.007751200348138809, -0.00756120914593339, -0.00737121794372797, -0.007181226741522551, -0.006991235539317131, -0.0068012443371117115, -0.006611253134906292, -0.00642126239836216, -0.006231270730495453, -0.006041279993951321, -0.005851288791745901, -0.005661297589540482, -0.005471306387335062, -0.0052813151851296425, -0.005091323982924223, -0.004901332780718803, -0.004711342044174671, -0.004521349910646677, -0.0043313587084412575, -0.004141367506235838, -0.003951376304030418, -0.003761385101824999, -0.0035713938996195793, -0.0033814029302448034, -0.003191411728039384, -0.003001420758664608, -0.0028114295564591885, -0.002621438354253769, -0.0024314471520483494, -0.00224145594984293, -0.0020514647476375103, -0.0018614737782627344, -0.0016714825760573149, -0.0014814912574365735, -0.001291500055231154, -0.0011015089694410563, -0.0009115177672356367, -0.0007215265650302172, -0.0005315353628247976, -0.0003415442770346999, -0.00015155307482928038, 3.8438127376139164e-05, 0.00022842930047772825, 0.00041842047357931733, 0.000608411617577076, 0.0007984028197824955, 0.000988394021987915, 0.0011783851077780128, 0.0013683763099834323, 0.0015583675121888518]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 11.0, 11.0, 11.0, 15.0, 20.0, 26.0, 28.0, 21.0, 17.0, 30.0, 29.0, 41.0, 37.0, 41.0, 32.0, 43.0, 37.0, 30.0, 56.0, 39.0, 44.0, 30.0, 49.0, 41.0, 33.0, 29.0, 32.0, 26.0, 20.0, 19.0, 17.0, 16.0, 13.0, 7.0, 13.0, 9.0, 2.0, 3.0, 1.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010439157485961914, -0.0010119974613189697, -0.000980079174041748, -0.0009481608867645264, -0.0009162425994873047, -0.000884324312210083, -0.0008524060249328613, -0.0008204877376556396, -0.000788569450378418, -0.0007566511631011963, -0.0007247328758239746, -0.0006928145885467529, -0.0006608963012695312, -0.0006289780139923096, -0.0005970597267150879, -0.0005651414394378662, -0.0005332231521606445, -0.0005013048648834229, -0.00046938657760620117, -0.0004374682903289795, -0.0004055500030517578, -0.00037363171577453613, -0.00034171342849731445, -0.0003097951412200928, -0.0002778768539428711, -0.0002459585666656494, -0.00021404027938842773, -0.00018212199211120605, -0.00015020370483398438, -0.0001182854175567627, -8.636713027954102e-05, -5.4448843002319336e-05, -2.2530555725097656e-05, 9.387731552124023e-06, 4.13060188293457e-05, 7.322430610656738e-05, 0.00010514259338378906, 0.00013706088066101074, 0.00016897916793823242, 0.0002008974552154541, 0.00023281574249267578, 0.00026473402976989746, 0.00029665231704711914, 0.0003285706043243408, 0.0003604888916015625, 0.0003924071788787842, 0.00042432546615600586, 0.00045624375343322754, 0.0004881620407104492, 0.0005200803279876709, 0.0005519986152648926, 0.0005839169025421143, 0.0006158351898193359, 0.0006477534770965576, 0.0006796717643737793, 0.000711590051651001, 0.0007435083389282227, 0.0007754266262054443, 0.000807344913482666, 0.0008392632007598877, 0.0008711814880371094, 0.0009030997753143311, 0.0009350180625915527, 0.0009669363498687744, 0.000998854637145996]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 7.0, 11.0, 9.0, 6.0, 17.0, 6.0, 13.0, 18.0, 19.0, 22.0, 19.0, 29.0, 29.0, 22.0, 37.0, 32.0, 36.0, 50.0, 37.0, 40.0, 34.0, 54.0, 32.0, 39.0, 31.0, 24.0, 38.0, 33.0, 20.0, 32.0, 19.0, 29.0, 18.0, 16.0, 19.0, 16.0, 15.0, 14.0, 6.0, 8.0, 13.0, 5.0, 6.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.70703125, -6.47802734375, -6.2490234375, -6.02001953125, -5.791015625, -5.56201171875, -5.3330078125, -5.10400390625, -4.875, -4.64599609375, -4.4169921875, -4.18798828125, -3.958984375, -3.72998046875, -3.5009765625, -3.27197265625, -3.04296875, -2.81396484375, -2.5849609375, -2.35595703125, -2.126953125, -1.89794921875, -1.6689453125, -1.43994140625, -1.2109375, -0.98193359375, -0.7529296875, -0.52392578125, -0.294921875, -0.06591796875, 0.1630859375, 0.39208984375, 0.62109375, 0.85009765625, 1.0791015625, 1.30810546875, 1.537109375, 1.76611328125, 1.9951171875, 2.22412109375, 2.453125, 2.68212890625, 2.9111328125, 3.14013671875, 3.369140625, 3.59814453125, 3.8271484375, 4.05615234375, 4.28515625, 4.51416015625, 4.7431640625, 4.97216796875, 5.201171875, 5.43017578125, 5.6591796875, 5.88818359375, 6.1171875, 6.34619140625, 6.5751953125, 6.80419921875, 7.033203125, 7.26220703125, 7.4912109375, 7.72021484375, 7.94921875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 11.0, 10.0, 14.0, 11.0, 22.0, 15.0, 29.0, 42.0, 51.0, 71.0, 97.0, 129.0, 199.0, 352.0, 583.0, 1165.0, 2466.0, 6013.0, 16936.0, 58012.0, 246051.0, 526306.0, 136032.0, 34655.0, 11072.0, 4110.0, 1844.0, 875.0, 475.0, 280.0, 165.0, 127.0, 85.0, 62.0, 37.0, 26.0, 29.0, 20.0, 11.0, 14.0, 14.0, 6.0, 8.0, 5.0, 4.0, 2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.51171875, -6.28948974609375, -6.0672607421875, -5.84503173828125, -5.622802734375, -5.40057373046875, -5.1783447265625, -4.95611572265625, -4.73388671875, -4.51165771484375, -4.2894287109375, -4.06719970703125, -3.844970703125, -3.62274169921875, -3.4005126953125, -3.17828369140625, -2.9560546875, -2.73382568359375, -2.5115966796875, -2.28936767578125, -2.067138671875, -1.84490966796875, -1.6226806640625, -1.40045166015625, -1.17822265625, -0.95599365234375, -0.7337646484375, -0.51153564453125, -0.289306640625, -0.06707763671875, 0.1551513671875, 0.37738037109375, 0.599609375, 0.82183837890625, 1.0440673828125, 1.26629638671875, 1.488525390625, 1.71075439453125, 1.9329833984375, 2.15521240234375, 2.37744140625, 2.59967041015625, 2.8218994140625, 3.04412841796875, 3.266357421875, 3.48858642578125, 3.7108154296875, 3.93304443359375, 4.1552734375, 4.37750244140625, 4.5997314453125, 4.82196044921875, 5.044189453125, 5.26641845703125, 5.4886474609375, 5.71087646484375, 5.93310546875, 6.15533447265625, 6.3775634765625, 6.59979248046875, 6.822021484375, 7.04425048828125, 7.2664794921875, 7.48870849609375, 7.7109375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 9.0, 11.0, 13.0, 9.0, 10.0, 17.0, 12.0, 28.0, 21.0, 20.0, 33.0, 31.0, 39.0, 33.0, 34.0, 41.0, 45.0, 89.0, 223.0, 1712.0, 145.0, 63.0, 40.0, 48.0, 30.0, 34.0, 37.0, 28.0, 20.0, 35.0, 19.0, 21.0, 21.0, 14.0, 10.0, 10.0, 8.0, 4.0, 5.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.59375, -23.78271484375, -22.9716796875, -22.16064453125, -21.349609375, -20.53857421875, -19.7275390625, -18.91650390625, -18.10546875, -17.29443359375, -16.4833984375, -15.67236328125, -14.861328125, -14.05029296875, -13.2392578125, -12.42822265625, -11.6171875, -10.80615234375, -9.9951171875, -9.18408203125, -8.373046875, -7.56201171875, -6.7509765625, -5.93994140625, -5.12890625, -4.31787109375, -3.5068359375, -2.69580078125, -1.884765625, -1.07373046875, -0.2626953125, 0.54833984375, 1.359375, 2.17041015625, 2.9814453125, 3.79248046875, 4.603515625, 5.41455078125, 6.2255859375, 7.03662109375, 7.84765625, 8.65869140625, 9.4697265625, 10.28076171875, 11.091796875, 11.90283203125, 12.7138671875, 13.52490234375, 14.3359375, 15.14697265625, 15.9580078125, 16.76904296875, 17.580078125, 18.39111328125, 19.2021484375, 20.01318359375, 20.82421875, 21.63525390625, 22.4462890625, 23.25732421875, 24.068359375, 24.87939453125, 25.6904296875, 26.50146484375, 27.3125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 14.0, 21.0, 35.0, 55.0, 114.0, 217.0, 408.0, 1358.0, 3123436.0, 18615.0, 721.0, 340.0, 156.0, 87.0, 46.0, 33.0, 18.0, 9.0, 5.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.0, -133.37109375, -128.7421875, -124.11328125, -119.484375, -114.85546875, -110.2265625, -105.59765625, -100.96875, -96.33984375, -91.7109375, -87.08203125, -82.453125, -77.82421875, -73.1953125, -68.56640625, -63.9375, -59.30859375, -54.6796875, -50.05078125, -45.421875, -40.79296875, -36.1640625, -31.53515625, -26.90625, -22.27734375, -17.6484375, -13.01953125, -8.390625, -3.76171875, 0.8671875, 5.49609375, 10.125, 14.75390625, 19.3828125, 24.01171875, 28.640625, 33.26953125, 37.8984375, 42.52734375, 47.15625, 51.78515625, 56.4140625, 61.04296875, 65.671875, 70.30078125, 74.9296875, 79.55859375, 84.1875, 88.81640625, 93.4453125, 98.07421875, 102.703125, 107.33203125, 111.9609375, 116.58984375, 121.21875, 125.84765625, 130.4765625, 135.10546875, 139.734375, 144.36328125, 148.9921875, 153.62109375, 158.25]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 11.0, 429.0, 560.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.37947845458984, -62.586734771728516, -57.79398727416992, -53.001243591308594, -48.20849609375, -43.41575241088867, -38.623008728027344, -33.83026123046875, -29.037517547607422, -24.24477195739746, -19.4520263671875, -14.659282684326172, -9.866537094116211, -5.07379150390625, -0.2810478210449219, 4.511699676513672, 9.304443359375, 14.097188949584961, 18.889934539794922, 23.68267822265625, 28.47542381286621, 33.26816940307617, 38.0609130859375, 42.853660583496094, 47.64640426635742, 52.43914794921875, 57.231895446777344, 62.02463912963867, 66.8173828125, 71.6101303100586, 76.40287780761719, 81.19561767578125, 85.98835754394531, 90.7811050415039, 95.57384490966797, 100.36659240722656, 105.15933990478516, 109.95208740234375, 114.74482727050781, 119.5375747680664, 124.330322265625, 129.12306213378906, 133.9158172607422, 138.70855712890625, 143.5012969970703, 148.29405212402344, 153.0867919921875, 157.87954711914062, 162.67227172851562, 167.4650115966797, 172.2577667236328, 177.05050659179688, 181.84324645996094, 186.63600158691406, 191.42874145507812, 196.22149658203125, 201.0142364501953, 205.80697631835938, 210.5997314453125, 215.39247131347656, 220.18521118164062, 224.97796630859375, 229.7707061767578, 234.56344604492188, 239.356201171875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 10.0, 9.0, 15.0, 19.0, 23.0, 29.0, 23.0, 25.0, 30.0, 29.0, 41.0, 41.0, 45.0, 36.0, 47.0, 41.0, 46.0, 46.0, 54.0, 53.0, 34.0, 45.0, 30.0, 21.0, 26.0, 22.0, 22.0, 26.0, 17.0, 15.0, 15.0, 12.0, 13.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.66453552246094, -73.23259735107422, -70.80065155029297, -68.36871337890625, -65.936767578125, -63.504825592041016, -61.07288360595703, -58.64094543457031, -56.20899963378906, -53.77705764770508, -51.345115661621094, -48.91317367553711, -46.481231689453125, -44.04928970336914, -41.617347717285156, -39.18540954589844, -36.75346755981445, -34.32152557373047, -31.889583587646484, -29.4576416015625, -27.025699615478516, -24.59375762939453, -22.16181755065918, -19.729875564575195, -17.29793357849121, -14.865991592407227, -12.434049606323242, -10.002108573913574, -7.57016658782959, -5.1382246017456055, -2.7062835693359375, -0.2743415832519531, 2.1576004028320312, 4.589542388916016, 7.021483898162842, 9.453425407409668, 11.885367393493652, 14.317309379577637, 16.749250411987305, 19.18119239807129, 21.613134384155273, 24.045076370239258, 26.477018356323242, 28.908958435058594, 31.340900421142578, 33.77284240722656, 36.20478439331055, 38.63672637939453, 41.068668365478516, 43.5006103515625, 45.932552337646484, 48.36449432373047, 50.79643630981445, 53.22837829589844, 55.660316467285156, 58.092262268066406, 60.524200439453125, 62.95614242553711, 65.3880844116211, 67.82002258300781, 70.25196838378906, 72.68390655517578, 75.11585235595703, 77.54779052734375, 79.979736328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 11.0, 6.0, 11.0, 10.0, 12.0, 11.0, 14.0, 19.0, 20.0, 23.0, 24.0, 18.0, 34.0, 42.0, 35.0, 34.0, 44.0, 52.0, 29.0, 45.0, 37.0, 37.0, 36.0, 37.0, 38.0, 36.0, 23.0, 26.0, 37.0, 24.0, 16.0, 21.0, 22.0, 19.0, 11.0, 11.0, 14.0, 11.0, 11.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.05859375, -6.81732177734375, -6.5760498046875, -6.33477783203125, -6.093505859375, -5.85223388671875, -5.6109619140625, -5.36968994140625, -5.12841796875, -4.88714599609375, -4.6458740234375, -4.40460205078125, -4.163330078125, -3.92205810546875, -3.6807861328125, -3.43951416015625, -3.1982421875, -2.95697021484375, -2.7156982421875, -2.47442626953125, -2.233154296875, -1.99188232421875, -1.7506103515625, -1.50933837890625, -1.26806640625, -1.02679443359375, -0.7855224609375, -0.54425048828125, -0.302978515625, -0.06170654296875, 0.1795654296875, 0.42083740234375, 0.662109375, 0.90338134765625, 1.1446533203125, 1.38592529296875, 1.627197265625, 1.86846923828125, 2.1097412109375, 2.35101318359375, 2.59228515625, 2.83355712890625, 3.0748291015625, 3.31610107421875, 3.557373046875, 3.79864501953125, 4.0399169921875, 4.28118896484375, 4.5224609375, 4.76373291015625, 5.0050048828125, 5.24627685546875, 5.487548828125, 5.72882080078125, 5.9700927734375, 6.21136474609375, 6.45263671875, 6.69390869140625, 6.9351806640625, 7.17645263671875, 7.417724609375, 7.65899658203125, 7.9002685546875, 8.14154052734375, 8.3828125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 10.0, 5.0, 15.0, 13.0, 12.0, 10.0, 18.0, 25.0, 26.0, 28.0, 34.0, 30.0, 42.0, 54.0, 63.0, 76.0, 110.0, 127.0, 240.0, 545.0, 1398.0, 5784.0, 50551.0, 897838.0, 2761164.0, 444690.0, 25146.0, 3832.0, 1080.0, 410.0, 201.0, 162.0, 115.0, 67.0, 62.0, 41.0, 39.0, 45.0, 28.0, 35.0, 21.0, 20.0, 19.0, 15.0, 6.0, 7.0, 8.0, 4.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0], "bins": [-18.0625, -17.4677734375, -16.873046875, -16.2783203125, -15.68359375, -15.0888671875, -14.494140625, -13.8994140625, -13.3046875, -12.7099609375, -12.115234375, -11.5205078125, -10.92578125, -10.3310546875, -9.736328125, -9.1416015625, -8.546875, -7.9521484375, -7.357421875, -6.7626953125, -6.16796875, -5.5732421875, -4.978515625, -4.3837890625, -3.7890625, -3.1943359375, -2.599609375, -2.0048828125, -1.41015625, -0.8154296875, -0.220703125, 0.3740234375, 0.96875, 1.5634765625, 2.158203125, 2.7529296875, 3.34765625, 3.9423828125, 4.537109375, 5.1318359375, 5.7265625, 6.3212890625, 6.916015625, 7.5107421875, 8.10546875, 8.7001953125, 9.294921875, 9.8896484375, 10.484375, 11.0791015625, 11.673828125, 12.2685546875, 12.86328125, 13.4580078125, 14.052734375, 14.6474609375, 15.2421875, 15.8369140625, 16.431640625, 17.0263671875, 17.62109375, 18.2158203125, 18.810546875, 19.4052734375, 20.0]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 2.0, 3.0, 7.0, 8.0, 14.0, 18.0, 17.0, 27.0, 34.0, 36.0, 57.0, 84.0, 75.0, 89.0, 132.0, 150.0, 195.0, 264.0, 315.0, 387.0, 425.0, 397.0, 315.0, 236.0, 156.0, 145.0, 107.0, 81.0, 76.0, 40.0, 43.0, 39.0, 17.0, 22.0, 16.0, 17.0, 9.0, 4.0, 5.0, 5.0, 2.0, 0.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.375, -12.97314453125, -12.5712890625, -12.16943359375, -11.767578125, -11.36572265625, -10.9638671875, -10.56201171875, -10.16015625, -9.75830078125, -9.3564453125, -8.95458984375, -8.552734375, -8.15087890625, -7.7490234375, -7.34716796875, -6.9453125, -6.54345703125, -6.1416015625, -5.73974609375, -5.337890625, -4.93603515625, -4.5341796875, -4.13232421875, -3.73046875, -3.32861328125, -2.9267578125, -2.52490234375, -2.123046875, -1.72119140625, -1.3193359375, -0.91748046875, -0.515625, -0.11376953125, 0.2880859375, 0.68994140625, 1.091796875, 1.49365234375, 1.8955078125, 2.29736328125, 2.69921875, 3.10107421875, 3.5029296875, 3.90478515625, 4.306640625, 4.70849609375, 5.1103515625, 5.51220703125, 5.9140625, 6.31591796875, 6.7177734375, 7.11962890625, 7.521484375, 7.92333984375, 8.3251953125, 8.72705078125, 9.12890625, 9.53076171875, 9.9326171875, 10.33447265625, 10.736328125, 11.13818359375, 11.5400390625, 11.94189453125, 12.34375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 6.0, 5.0, 3.0, 7.0, 12.0, 16.0, 16.0, 10.0, 25.0, 25.0, 38.0, 38.0, 52.0, 67.0, 89.0, 119.0, 137.0, 158.0, 180.0, 227.0, 375.0, 702.0, 6966.0, 3331977.0, 847734.0, 3061.0, 581.0, 372.0, 225.0, 195.0, 160.0, 135.0, 109.0, 97.0, 75.0, 69.0, 41.0, 35.0, 37.0, 25.0, 23.0, 13.0, 10.0, 6.0, 6.0, 8.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-64.6875, -62.6591796875, -60.630859375, -58.6025390625, -56.57421875, -54.5458984375, -52.517578125, -50.4892578125, -48.4609375, -46.4326171875, -44.404296875, -42.3759765625, -40.34765625, -38.3193359375, -36.291015625, -34.2626953125, -32.234375, -30.2060546875, -28.177734375, -26.1494140625, -24.12109375, -22.0927734375, -20.064453125, -18.0361328125, -16.0078125, -13.9794921875, -11.951171875, -9.9228515625, -7.89453125, -5.8662109375, -3.837890625, -1.8095703125, 0.21875, 2.2470703125, 4.275390625, 6.3037109375, 8.33203125, 10.3603515625, 12.388671875, 14.4169921875, 16.4453125, 18.4736328125, 20.501953125, 22.5302734375, 24.55859375, 26.5869140625, 28.615234375, 30.6435546875, 32.671875, 34.7001953125, 36.728515625, 38.7568359375, 40.78515625, 42.8134765625, 44.841796875, 46.8701171875, 48.8984375, 50.9267578125, 52.955078125, 54.9833984375, 57.01171875, 59.0400390625, 61.068359375, 63.0966796875, 65.125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 21.0, 126.0, 411.0, 346.0, 92.0, 18.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.4569854736328, -141.6826171875, -134.90823364257812, -128.13385009765625, -121.35948181152344, -114.5851058959961, -107.81072998046875, -101.0363540649414, -94.26197814941406, -87.48760223388672, -80.71322631835938, -73.93885040283203, -67.16447448730469, -60.390098571777344, -53.61572265625, -46.841346740722656, -40.06697082519531, -33.29259490966797, -26.518218994140625, -19.74384307861328, -12.969467163085938, -6.195091247558594, 0.57928466796875, 7.353660583496094, 14.128036499023438, 20.90241241455078, 27.676788330078125, 34.45116424560547, 41.22554016113281, 47.999916076660156, 54.7742919921875, 61.548667907714844, 68.32302856445312, 75.09740447998047, 81.87178039550781, 88.64615631103516, 95.4205322265625, 102.19490814208984, 108.96928405761719, 115.74365997314453, 122.51803588867188, 129.29241943359375, 136.06678771972656, 142.84115600585938, 149.61553955078125, 156.38992309570312, 163.16429138183594, 169.93865966796875, 176.71304321289062, 183.4874267578125, 190.2617950439453, 197.03616333007812, 203.810546875, 210.58493041992188, 217.3592987060547, 224.1336669921875, 230.90805053710938, 237.68243408203125, 244.45680236816406, 251.23117065429688, 258.00555419921875, 264.7799377441406, 271.5543212890625, 278.32867431640625, 285.1030578613281]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 8.0, 7.0, 9.0, 15.0, 17.0, 15.0, 22.0, 9.0, 17.0, 28.0, 26.0, 28.0, 40.0, 50.0, 40.0, 43.0, 59.0, 47.0, 33.0, 58.0, 34.0, 39.0, 53.0, 39.0, 35.0, 32.0, 35.0, 21.0, 26.0, 21.0, 27.0, 14.0, 13.0, 3.0, 11.0, 3.0, 9.0, 5.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.80086135864258, -54.11524963378906, -52.42964172363281, -50.7440299987793, -49.05842208862305, -47.37281036376953, -45.68720245361328, -44.001590728759766, -42.31597900390625, -40.630367279052734, -38.944759368896484, -37.25914764404297, -35.57353973388672, -33.8879280090332, -32.20231628417969, -30.516708374023438, -28.831100463867188, -27.145490646362305, -25.459880828857422, -23.774269104003906, -22.088661193847656, -20.40304946899414, -18.717439651489258, -17.031829833984375, -15.346220016479492, -13.66061019897461, -11.975000381469727, -10.289389610290527, -8.603779792785645, -6.918169975280762, -5.2325592041015625, -3.5469493865966797, -1.8613357543945312, -0.17572569847106934, 1.5098843574523926, 3.1954946517944336, 4.881104469299316, 6.566714286804199, 8.252325057983398, 9.937934875488281, 11.623544692993164, 13.309154510498047, 14.99476432800293, 16.680374145507812, 18.365985870361328, 20.051593780517578, 21.737205505371094, 23.422815322875977, 25.10842514038086, 26.794034957885742, 28.479644775390625, 30.16525650024414, 31.85086441040039, 33.536476135253906, 35.222084045410156, 36.90769577026367, 38.59330749511719, 40.2789192199707, 41.96452713012695, 43.65013885498047, 45.33574676513672, 47.021358489990234, 48.70697021484375, 50.392578125, 52.07818603515625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 4.0, 8.0, 14.0, 9.0, 8.0, 9.0, 20.0, 16.0, 14.0, 23.0, 30.0, 14.0, 23.0, 44.0, 30.0, 30.0, 43.0, 28.0, 40.0, 46.0, 48.0, 38.0, 33.0, 39.0, 31.0, 37.0, 32.0, 26.0, 26.0, 29.0, 31.0, 16.0, 17.0, 21.0, 12.0, 11.0, 21.0, 14.0, 8.0, 13.0, 16.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.4453125, -7.21331787109375, -6.9813232421875, -6.74932861328125, -6.517333984375, -6.28533935546875, -6.0533447265625, -5.82135009765625, -5.58935546875, -5.35736083984375, -5.1253662109375, -4.89337158203125, -4.661376953125, -4.42938232421875, -4.1973876953125, -3.96539306640625, -3.7333984375, -3.50140380859375, -3.2694091796875, -3.03741455078125, -2.805419921875, -2.57342529296875, -2.3414306640625, -2.10943603515625, -1.87744140625, -1.64544677734375, -1.4134521484375, -1.18145751953125, -0.949462890625, -0.71746826171875, -0.4854736328125, -0.25347900390625, -0.021484375, 0.21051025390625, 0.4425048828125, 0.67449951171875, 0.906494140625, 1.13848876953125, 1.3704833984375, 1.60247802734375, 1.83447265625, 2.06646728515625, 2.2984619140625, 2.53045654296875, 2.762451171875, 2.99444580078125, 3.2264404296875, 3.45843505859375, 3.6904296875, 3.92242431640625, 4.1544189453125, 4.38641357421875, 4.618408203125, 4.85040283203125, 5.0823974609375, 5.31439208984375, 5.54638671875, 5.77838134765625, 6.0103759765625, 6.24237060546875, 6.474365234375, 6.70635986328125, 6.9383544921875, 7.17034912109375, 7.40234375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 9.0, 8.0, 12.0, 19.0, 24.0, 40.0, 62.0, 86.0, 130.0, 192.0, 234.0, 381.0, 444.0, 710.0, 1041.0, 1468.0, 2302.0, 3366.0, 4906.0, 7489.0, 11277.0, 16981.0, 25510.0, 39470.0, 60386.0, 92045.0, 139230.0, 195465.0, 151911.0, 100225.0, 66293.0, 42503.0, 28327.0, 18428.0, 12328.0, 8161.0, 5554.0, 3648.0, 2480.0, 1691.0, 1111.0, 797.0, 571.0, 386.0, 262.0, 188.0, 118.0, 83.0, 63.0, 46.0, 43.0, 19.0, 18.0, 9.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.0634765625, -1.0298309326171875, -0.996185302734375, -0.9625396728515625, -0.92889404296875, -0.8952484130859375, -0.861602783203125, -0.8279571533203125, -0.7943115234375, -0.7606658935546875, -0.727020263671875, -0.6933746337890625, -0.65972900390625, -0.6260833740234375, -0.592437744140625, -0.5587921142578125, -0.525146484375, -0.4915008544921875, -0.457855224609375, -0.4242095947265625, -0.39056396484375, -0.3569183349609375, -0.323272705078125, -0.2896270751953125, -0.2559814453125, -0.2223358154296875, -0.188690185546875, -0.1550445556640625, -0.12139892578125, -0.0877532958984375, -0.054107666015625, -0.0204620361328125, 0.01318359375, 0.0468292236328125, 0.080474853515625, 0.1141204833984375, 0.14776611328125, 0.1814117431640625, 0.215057373046875, 0.2487030029296875, 0.2823486328125, 0.3159942626953125, 0.349639892578125, 0.3832855224609375, 0.41693115234375, 0.4505767822265625, 0.484222412109375, 0.5178680419921875, 0.551513671875, 0.5851593017578125, 0.618804931640625, 0.6524505615234375, 0.68609619140625, 0.7197418212890625, 0.753387451171875, 0.7870330810546875, 0.8206787109375, 0.8543243408203125, 0.887969970703125, 0.9216156005859375, 0.95526123046875, 0.9889068603515625, 1.022552490234375, 1.0561981201171875, 1.08984375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 12.0, 2.0, 8.0, 11.0, 14.0, 13.0, 16.0, 20.0, 20.0, 30.0, 36.0, 33.0, 37.0, 33.0, 31.0, 33.0, 45.0, 34.0, 39.0, 1064.0, 35.0, 48.0, 37.0, 45.0, 44.0, 32.0, 35.0, 40.0, 25.0, 22.0, 25.0, 14.0, 16.0, 17.0, 15.0, 8.0, 7.0, 5.0, 8.0, 1.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.26171875, -5.09674072265625, -4.9317626953125, -4.76678466796875, -4.601806640625, -4.43682861328125, -4.2718505859375, -4.10687255859375, -3.94189453125, -3.77691650390625, -3.6119384765625, -3.44696044921875, -3.281982421875, -3.11700439453125, -2.9520263671875, -2.78704833984375, -2.6220703125, -2.45709228515625, -2.2921142578125, -2.12713623046875, -1.962158203125, -1.79718017578125, -1.6322021484375, -1.46722412109375, -1.30224609375, -1.13726806640625, -0.9722900390625, -0.80731201171875, -0.642333984375, -0.47735595703125, -0.3123779296875, -0.14739990234375, 0.017578125, 0.18255615234375, 0.3475341796875, 0.51251220703125, 0.677490234375, 0.84246826171875, 1.0074462890625, 1.17242431640625, 1.33740234375, 1.50238037109375, 1.6673583984375, 1.83233642578125, 1.997314453125, 2.16229248046875, 2.3272705078125, 2.49224853515625, 2.6572265625, 2.82220458984375, 2.9871826171875, 3.15216064453125, 3.317138671875, 3.48211669921875, 3.6470947265625, 3.81207275390625, 3.97705078125, 4.14202880859375, 4.3070068359375, 4.47198486328125, 4.636962890625, 4.80194091796875, 4.9669189453125, 5.13189697265625, 5.296875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 12.0, 17.0, 11.0, 25.0, 22.0, 46.0, 67.0, 96.0, 118.0, 172.0, 281.0, 386.0, 549.0, 876.0, 1228.0, 1842.0, 2721.0, 3916.0, 5924.0, 8790.0, 13717.0, 20413.0, 31658.0, 48940.0, 76555.0, 118493.0, 184608.0, 1225779.0, 123189.0, 79653.0, 50835.0, 32636.0, 21406.0, 13997.0, 9264.0, 5967.0, 4159.0, 2756.0, 1897.0, 1333.0, 830.0, 622.0, 424.0, 272.0, 211.0, 137.0, 99.0, 61.0, 48.0, 29.0, 17.0, 15.0, 10.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0], "bins": [-0.9521484375, -0.921478271484375, -0.89080810546875, -0.860137939453125, -0.8294677734375, -0.798797607421875, -0.76812744140625, -0.737457275390625, -0.706787109375, -0.676116943359375, -0.64544677734375, -0.614776611328125, -0.5841064453125, -0.553436279296875, -0.52276611328125, -0.492095947265625, -0.46142578125, -0.430755615234375, -0.40008544921875, -0.369415283203125, -0.3387451171875, -0.308074951171875, -0.27740478515625, -0.246734619140625, -0.216064453125, -0.185394287109375, -0.15472412109375, -0.124053955078125, -0.0933837890625, -0.062713623046875, -0.03204345703125, -0.001373291015625, 0.029296875, 0.059967041015625, 0.09063720703125, 0.121307373046875, 0.1519775390625, 0.182647705078125, 0.21331787109375, 0.243988037109375, 0.274658203125, 0.305328369140625, 0.33599853515625, 0.366668701171875, 0.3973388671875, 0.428009033203125, 0.45867919921875, 0.489349365234375, 0.52001953125, 0.550689697265625, 0.58135986328125, 0.612030029296875, 0.6427001953125, 0.673370361328125, 0.70404052734375, 0.734710693359375, 0.765380859375, 0.796051025390625, 0.82672119140625, 0.857391357421875, 0.8880615234375, 0.918731689453125, 0.94940185546875, 0.980072021484375, 1.0107421875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 3.0, 5.0, 6.0, 7.0, 9.0, 10.0, 16.0, 25.0, 25.0, 32.0, 27.0, 49.0, 49.0, 48.0, 48.0, 49.0, 63.0, 60.0, 63.0, 40.0, 56.0, 44.0, 48.0, 27.0, 38.0, 35.0, 19.0, 26.0, 12.0, 9.0, 12.0, 9.0, 3.0, 2.0, 7.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0017633438110351562, -0.0017117857933044434, -0.0016602277755737305, -0.0016086697578430176, -0.0015571117401123047, -0.0015055537223815918, -0.001453995704650879, -0.001402437686920166, -0.0013508796691894531, -0.0012993216514587402, -0.0012477636337280273, -0.0011962056159973145, -0.0011446475982666016, -0.0010930895805358887, -0.0010415315628051758, -0.0009899735450744629, -0.00093841552734375, -0.0008868575096130371, -0.0008352994918823242, -0.0007837414741516113, -0.0007321834564208984, -0.0006806254386901855, -0.0006290674209594727, -0.0005775094032287598, -0.0005259513854980469, -0.000474393367767334, -0.0004228353500366211, -0.0003712773323059082, -0.0003197193145751953, -0.0002681612968444824, -0.00021660327911376953, -0.00016504526138305664, -0.00011348724365234375, -6.192922592163086e-05, -1.0371208190917969e-05, 4.118680953979492e-05, 9.274482727050781e-05, 0.0001443028450012207, 0.0001958608627319336, 0.0002474188804626465, 0.0002989768981933594, 0.00035053491592407227, 0.00040209293365478516, 0.00045365095138549805, 0.0005052089691162109, 0.0005567669868469238, 0.0006083250045776367, 0.0006598830223083496, 0.0007114410400390625, 0.0007629990577697754, 0.0008145570755004883, 0.0008661150932312012, 0.0009176731109619141, 0.000969231128692627, 0.0010207891464233398, 0.0010723471641540527, 0.0011239051818847656, 0.0011754631996154785, 0.0012270212173461914, 0.0012785792350769043, 0.0013301372528076172, 0.00138169527053833, 0.001433253288269043, 0.0014848113059997559, 0.0015363693237304688]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 8.0, 0.0, 6.0, 3.0, 8.0, 5.0, 7.0, 8.0, 24.0, 24.0, 21.0, 31.0, 42.0, 39.0, 73.0, 82.0, 115.0, 178.0, 455.0, 2586.0, 1013602.0, 29722.0, 714.0, 263.0, 152.0, 87.0, 65.0, 51.0, 31.0, 28.0, 21.0, 23.0, 23.0, 10.0, 10.0, 9.0, 6.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.036411285400390625, -0.03522491455078125, -0.034038543701171875, -0.0328521728515625, -0.031665802001953125, -0.03047943115234375, -0.029293060302734375, -0.028106689453125, -0.026920318603515625, -0.02573394775390625, -0.024547576904296875, -0.0233612060546875, -0.022174835205078125, -0.02098846435546875, -0.019802093505859375, -0.01861572265625, -0.017429351806640625, -0.01624298095703125, -0.015056610107421875, -0.0138702392578125, -0.012683868408203125, -0.01149749755859375, -0.010311126708984375, -0.009124755859375, -0.007938385009765625, -0.00675201416015625, -0.005565643310546875, -0.0043792724609375, -0.003192901611328125, -0.00200653076171875, -0.000820159912109375, 0.0003662109375, 0.001552581787109375, 0.00273895263671875, 0.003925323486328125, 0.0051116943359375, 0.006298065185546875, 0.00748443603515625, 0.008670806884765625, 0.009857177734375, 0.011043548583984375, 0.01222991943359375, 0.013416290283203125, 0.0146026611328125, 0.015789031982421875, 0.01697540283203125, 0.018161773681640625, 0.01934814453125, 0.020534515380859375, 0.02172088623046875, 0.022907257080078125, 0.0240936279296875, 0.025279998779296875, 0.02646636962890625, 0.027652740478515625, 0.028839111328125, 0.030025482177734375, 0.03121185302734375, 0.032398223876953125, 0.0335845947265625, 0.034770965576171875, 0.03595733642578125, 0.037143707275390625, 0.038330078125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 12.0, 22.0, 29.0, 52.0, 92.0, 110.0, 144.0, 153.0, 156.0, 86.0, 69.0, 37.0, 24.0, 9.0, 6.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.002105479361489415, -0.002065099310129881, -0.0020247192587703466, -0.0019843392074108124, -0.0019439592724666, -0.0019035792211070657, -0.0018631991697475314, -0.0018228191183879972, -0.0017824391834437847, -0.0017420591320842505, -0.0017016790807247162, -0.0016612991457805037, -0.0016209190944209695, -0.0015805390430614352, -0.001540158991701901, -0.0014997789403423667, -0.0014593988889828324, -0.0014190188376232982, -0.001378638786263764, -0.0013382588513195515, -0.0012978787999600172, -0.001257498748600483, -0.0012171186972409487, -0.0011767386458814144, -0.0011363585945218801, -0.0010959785431623459, -0.0010555984918028116, -0.0010152185568585992, -0.0009748385054990649, -0.0009344584541395307, -0.0008940784027799964, -0.0008536983514204621, -0.0008133184164762497, -0.0007729383651167154, -0.0007325583719648421, -0.0006921783206053078, -0.0006517983274534345, -0.0006114182760939002, -0.0005710382247343659, -0.0005306581733748317, -0.0004902781220152974, -0.0004498980997595936, -0.0004095180775038898, -0.00036913802614435554, -0.00032875800388865173, -0.0002883779816329479, -0.00024799793027341366, -0.00020761790801770985, -0.0001672379148658365, -0.0001268578926101327, -8.647785580251366e-05, -4.609782627085224e-05, -5.717796739190817e-06, 3.466222551651299e-05, 7.504226232413203e-05, 0.00011542229913175106, 0.00015580232138745487, 0.00019618234364315867, 0.0002365623804507777, 0.00027694241725839674, 0.00031732243951410055, 0.00035770246176980436, 0.00039808248402550817, 0.00043846253538504243, 0.00047884255764074624]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 4.0, 6.0, 6.0, 4.0, 15.0, 15.0, 8.0, 14.0, 17.0, 25.0, 20.0, 30.0, 21.0, 32.0, 25.0, 32.0, 39.0, 28.0, 36.0, 43.0, 36.0, 33.0, 34.0, 42.0, 39.0, 37.0, 37.0, 38.0, 31.0, 32.0, 30.0, 26.0, 24.0, 19.0, 20.0, 14.0, 10.0, 15.0, 10.0, 13.0, 8.0, 8.0, 7.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007726550102233887, -0.0007470259442925453, -0.000721396878361702, -0.0006957678124308586, -0.0006701387465000153, -0.0006445096805691719, -0.0006188806146383286, -0.0005932515487074852, -0.0005676224827766418, -0.0005419934168457985, -0.0005163643509149551, -0.0004907352849841118, -0.00046510621905326843, -0.0004394771531224251, -0.0004138480871915817, -0.00038821902126073837, -0.000362589955329895, -0.00033696088939905167, -0.0003113318234682083, -0.00028570275753736496, -0.0002600736916065216, -0.00023444462567567825, -0.0002088155597448349, -0.00018318649381399155, -0.0001575574278831482, -0.00013192836195230484, -0.00010629929602146149, -8.067023009061813e-05, -5.504116415977478e-05, -2.9412098228931427e-05, -3.7830322980880737e-06, 2.184603363275528e-05, 4.747509956359863e-05, 7.310416549444199e-05, 9.873323142528534e-05, 0.0001243622973561287, 0.00014999136328697205, 0.0001756204292178154, 0.00020124949514865875, 0.0002268785610795021, 0.00025250762701034546, 0.0002781366929411888, 0.00030376575887203217, 0.0003293948248028755, 0.00035502389073371887, 0.0003806529566645622, 0.0004062820225954056, 0.00043191108852624893, 0.0004575401544570923, 0.00048316922038793564, 0.000508798286318779, 0.0005344273522496223, 0.0005600564181804657, 0.000585685484111309, 0.0006113145500421524, 0.0006369436159729958, 0.0006625726819038391, 0.0006882017478346825, 0.0007138308137655258, 0.0007394598796963692, 0.0007650889456272125, 0.0007907180115580559, 0.0008163470774888992, 0.0008419761434197426, 0.0008676052093505859]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 4.0, 8.0, 14.0, 9.0, 8.0, 9.0, 20.0, 16.0, 14.0, 23.0, 30.0, 14.0, 23.0, 44.0, 30.0, 30.0, 43.0, 28.0, 40.0, 46.0, 48.0, 38.0, 33.0, 39.0, 31.0, 37.0, 32.0, 26.0, 26.0, 29.0, 31.0, 16.0, 17.0, 21.0, 12.0, 11.0, 21.0, 14.0, 8.0, 13.0, 16.0, 6.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.4453125, -7.21331787109375, -6.9813232421875, -6.74932861328125, -6.517333984375, -6.28533935546875, -6.0533447265625, -5.82135009765625, -5.58935546875, -5.35736083984375, -5.1253662109375, -4.89337158203125, -4.661376953125, -4.42938232421875, -4.1973876953125, -3.96539306640625, -3.7333984375, -3.50140380859375, -3.2694091796875, -3.03741455078125, -2.805419921875, -2.57342529296875, -2.3414306640625, -2.10943603515625, -1.87744140625, -1.64544677734375, -1.4134521484375, -1.18145751953125, -0.949462890625, -0.71746826171875, -0.4854736328125, -0.25347900390625, -0.021484375, 0.21051025390625, 0.4425048828125, 0.67449951171875, 0.906494140625, 1.13848876953125, 1.3704833984375, 1.60247802734375, 1.83447265625, 2.06646728515625, 2.2984619140625, 2.53045654296875, 2.762451171875, 2.99444580078125, 3.2264404296875, 3.45843505859375, 3.6904296875, 3.92242431640625, 4.1544189453125, 4.38641357421875, 4.618408203125, 4.85040283203125, 5.0823974609375, 5.31439208984375, 5.54638671875, 5.77838134765625, 6.0103759765625, 6.24237060546875, 6.474365234375, 6.70635986328125, 6.9383544921875, 7.17034912109375, 7.40234375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 5.0, 2.0, 7.0, 11.0, 5.0, 8.0, 16.0, 24.0, 25.0, 49.0, 61.0, 107.0, 175.0, 296.0, 493.0, 905.0, 1616.0, 2939.0, 5550.0, 10590.0, 22013.0, 53815.0, 155357.0, 431130.0, 229212.0, 76272.0, 29136.0, 13569.0, 6691.0, 3751.0, 2046.0, 1085.0, 611.0, 377.0, 237.0, 128.0, 73.0, 46.0, 30.0, 23.0, 23.0, 15.0, 9.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.45703125, -5.28472900390625, -5.1124267578125, -4.94012451171875, -4.767822265625, -4.59552001953125, -4.4232177734375, -4.25091552734375, -4.07861328125, -3.90631103515625, -3.7340087890625, -3.56170654296875, -3.389404296875, -3.21710205078125, -3.0447998046875, -2.87249755859375, -2.7001953125, -2.52789306640625, -2.3555908203125, -2.18328857421875, -2.010986328125, -1.83868408203125, -1.6663818359375, -1.49407958984375, -1.32177734375, -1.14947509765625, -0.9771728515625, -0.80487060546875, -0.632568359375, -0.46026611328125, -0.2879638671875, -0.11566162109375, 0.056640625, 0.22894287109375, 0.4012451171875, 0.57354736328125, 0.745849609375, 0.91815185546875, 1.0904541015625, 1.26275634765625, 1.43505859375, 1.60736083984375, 1.7796630859375, 1.95196533203125, 2.124267578125, 2.29656982421875, 2.4688720703125, 2.64117431640625, 2.8134765625, 2.98577880859375, 3.1580810546875, 3.33038330078125, 3.502685546875, 3.67498779296875, 3.8472900390625, 4.01959228515625, 4.19189453125, 4.36419677734375, 4.5364990234375, 4.70880126953125, 4.881103515625, 5.05340576171875, 5.2257080078125, 5.39801025390625, 5.5703125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 3.0, 5.0, 5.0, 9.0, 14.0, 11.0, 7.0, 30.0, 19.0, 24.0, 26.0, 29.0, 34.0, 42.0, 41.0, 63.0, 63.0, 89.0, 337.0, 1687.0, 102.0, 50.0, 56.0, 50.0, 30.0, 28.0, 43.0, 34.0, 29.0, 14.0, 19.0, 12.0, 11.0, 9.0, 13.0, 4.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.4375, -25.462890625, -24.48828125, -23.513671875, -22.5390625, -21.564453125, -20.58984375, -19.615234375, -18.640625, -17.666015625, -16.69140625, -15.716796875, -14.7421875, -13.767578125, -12.79296875, -11.818359375, -10.84375, -9.869140625, -8.89453125, -7.919921875, -6.9453125, -5.970703125, -4.99609375, -4.021484375, -3.046875, -2.072265625, -1.09765625, -0.123046875, 0.8515625, 1.826171875, 2.80078125, 3.775390625, 4.75, 5.724609375, 6.69921875, 7.673828125, 8.6484375, 9.623046875, 10.59765625, 11.572265625, 12.546875, 13.521484375, 14.49609375, 15.470703125, 16.4453125, 17.419921875, 18.39453125, 19.369140625, 20.34375, 21.318359375, 22.29296875, 23.267578125, 24.2421875, 25.216796875, 26.19140625, 27.166015625, 28.140625, 29.115234375, 30.08984375, 31.064453125, 32.0390625, 33.013671875, 33.98828125, 34.962890625, 35.9375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 4.0, 3.0, 5.0, 8.0, 13.0, 14.0, 21.0, 13.0, 22.0, 30.0, 55.0, 46.0, 87.0, 110.0, 156.0, 215.0, 336.0, 724.0, 10956.0, 3119198.0, 11748.0, 698.0, 362.0, 227.0, 179.0, 114.0, 72.0, 65.0, 45.0, 42.0, 37.0, 26.0, 11.0, 22.0, 12.0, 8.0, 5.0, 7.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-85.0625, -82.732421875, -80.40234375, -78.072265625, -75.7421875, -73.412109375, -71.08203125, -68.751953125, -66.421875, -64.091796875, -61.76171875, -59.431640625, -57.1015625, -54.771484375, -52.44140625, -50.111328125, -47.78125, -45.451171875, -43.12109375, -40.791015625, -38.4609375, -36.130859375, -33.80078125, -31.470703125, -29.140625, -26.810546875, -24.48046875, -22.150390625, -19.8203125, -17.490234375, -15.16015625, -12.830078125, -10.5, -8.169921875, -5.83984375, -3.509765625, -1.1796875, 1.150390625, 3.48046875, 5.810546875, 8.140625, 10.470703125, 12.80078125, 15.130859375, 17.4609375, 19.791015625, 22.12109375, 24.451171875, 26.78125, 29.111328125, 31.44140625, 33.771484375, 36.1015625, 38.431640625, 40.76171875, 43.091796875, 45.421875, 47.751953125, 50.08203125, 52.412109375, 54.7421875, 57.072265625, 59.40234375, 61.732421875, 64.0625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [3.0, 80.0, 740.0, 190.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.543399810791016, -7.847620487213135, -3.151841163635254, 1.5439376831054688, 6.239717483520508, 10.935497283935547, 15.631275177001953, 20.327056884765625, 25.02283477783203, 29.71861457824707, 34.41439437866211, 39.110172271728516, 43.80595397949219, 48.501731872558594, 53.197509765625, 57.89329147338867, 62.58906936645508, 67.28485107421875, 71.98062896728516, 76.67640686035156, 81.37218475341797, 86.06796264648438, 90.76374816894531, 95.45952606201172, 100.15530395507812, 104.85108184814453, 109.54685974121094, 114.24264526367188, 118.93842315673828, 123.63420104980469, 128.32998657226562, 133.0257568359375, 137.72154235839844, 142.41732788085938, 147.11309814453125, 151.8088836669922, 156.50465393066406, 161.200439453125, 165.89620971679688, 170.5919952392578, 175.28778076171875, 179.9835662841797, 184.67933654785156, 189.3751220703125, 194.07089233398438, 198.7666778564453, 203.46246337890625, 208.15823364257812, 212.85400390625, 217.54978942871094, 222.2455596923828, 226.94134521484375, 231.63711547851562, 236.33290100097656, 241.0286865234375, 245.72445678710938, 250.4202423095703, 255.11602783203125, 259.8117980957031, 264.507568359375, 269.203369140625, 273.8991394042969, 278.59490966796875, 283.29071044921875, 287.9864807128906]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 7.0, 2.0, 4.0, 3.0, 7.0, 7.0, 6.0, 7.0, 11.0, 13.0, 14.0, 11.0, 20.0, 27.0, 22.0, 28.0, 25.0, 37.0, 21.0, 45.0, 52.0, 44.0, 40.0, 36.0, 41.0, 44.0, 42.0, 44.0, 32.0, 45.0, 38.0, 26.0, 23.0, 20.0, 26.0, 15.0, 19.0, 9.0, 17.0, 4.0, 16.0, 5.0, 14.0, 6.0, 7.0, 6.0, 6.0, 3.0, 6.0, 4.0, 0.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.086910247802734, -57.02975082397461, -54.97259521484375, -52.915435791015625, -50.8582763671875, -48.801116943359375, -46.74395751953125, -44.68680191040039, -42.629642486572266, -40.57248306274414, -38.51532745361328, -36.458168029785156, -34.40100860595703, -32.343849182128906, -30.286691665649414, -28.229534149169922, -26.172374725341797, -24.115215301513672, -22.05805778503418, -20.000900268554688, -17.943740844726562, -15.886582374572754, -13.829423904418945, -11.772265434265137, -9.715106964111328, -7.6579484939575195, -5.600790023803711, -3.5436315536499023, -1.4864730834960938, 0.5706853866577148, 2.6278438568115234, 4.685002326965332, 6.742156982421875, 8.799315452575684, 10.856473922729492, 12.9136323928833, 14.97079086303711, 17.027950286865234, 19.085107803344727, 21.14226531982422, 23.199424743652344, 25.25658416748047, 27.31374168395996, 29.370899200439453, 31.428058624267578, 33.4852180480957, 35.54237365722656, 37.59953308105469, 39.65669250488281, 41.71385192871094, 43.77101135253906, 45.82816696166992, 47.88532638549805, 49.94248580932617, 51.99964141845703, 54.056800842285156, 56.11396026611328, 58.171119689941406, 60.22827911376953, 62.28543472290039, 64.34259033203125, 66.39974975585938, 68.4569091796875, 70.51406860351562, 72.57122802734375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 6.0, 6.0, 7.0, 11.0, 13.0, 11.0, 17.0, 19.0, 11.0, 17.0, 20.0, 23.0, 33.0, 33.0, 30.0, 34.0, 34.0, 36.0, 34.0, 38.0, 45.0, 35.0, 38.0, 38.0, 44.0, 37.0, 21.0, 31.0, 29.0, 26.0, 22.0, 22.0, 13.0, 25.0, 17.0, 15.0, 16.0, 17.0, 10.0, 14.0, 12.0, 4.0, 12.0, 3.0, 5.0, 1.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-7.1875, -6.9527587890625, -6.718017578125, -6.4832763671875, -6.24853515625, -6.0137939453125, -5.779052734375, -5.5443115234375, -5.3095703125, -5.0748291015625, -4.840087890625, -4.6053466796875, -4.37060546875, -4.1358642578125, -3.901123046875, -3.6663818359375, -3.431640625, -3.1968994140625, -2.962158203125, -2.7274169921875, -2.49267578125, -2.2579345703125, -2.023193359375, -1.7884521484375, -1.5537109375, -1.3189697265625, -1.084228515625, -0.8494873046875, -0.61474609375, -0.3800048828125, -0.145263671875, 0.0894775390625, 0.32421875, 0.5589599609375, 0.793701171875, 1.0284423828125, 1.26318359375, 1.4979248046875, 1.732666015625, 1.9674072265625, 2.2021484375, 2.4368896484375, 2.671630859375, 2.9063720703125, 3.14111328125, 3.3758544921875, 3.610595703125, 3.8453369140625, 4.080078125, 4.3148193359375, 4.549560546875, 4.7843017578125, 5.01904296875, 5.2537841796875, 5.488525390625, 5.7232666015625, 5.9580078125, 6.1927490234375, 6.427490234375, 6.6622314453125, 6.89697265625, 7.1317138671875, 7.366455078125, 7.6011962890625, 7.8359375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 4.0, 3.0, 4.0, 9.0, 7.0, 4.0, 8.0, 9.0, 18.0, 11.0, 15.0, 13.0, 13.0, 22.0, 23.0, 33.0, 35.0, 49.0, 89.0, 125.0, 225.0, 493.0, 1116.0, 3793.0, 23033.0, 526528.0, 3106704.0, 503074.0, 22602.0, 3756.0, 1207.0, 507.0, 254.0, 133.0, 67.0, 59.0, 39.0, 24.0, 26.0, 21.0, 12.0, 13.0, 15.0, 15.0, 17.0, 13.0, 11.0, 11.0, 9.0, 2.0, 5.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0], "bins": [-20.328125, -19.638916015625, -18.94970703125, -18.260498046875, -17.5712890625, -16.882080078125, -16.19287109375, -15.503662109375, -14.814453125, -14.125244140625, -13.43603515625, -12.746826171875, -12.0576171875, -11.368408203125, -10.67919921875, -9.989990234375, -9.30078125, -8.611572265625, -7.92236328125, -7.233154296875, -6.5439453125, -5.854736328125, -5.16552734375, -4.476318359375, -3.787109375, -3.097900390625, -2.40869140625, -1.719482421875, -1.0302734375, -0.341064453125, 0.34814453125, 1.037353515625, 1.7265625, 2.415771484375, 3.10498046875, 3.794189453125, 4.4833984375, 5.172607421875, 5.86181640625, 6.551025390625, 7.240234375, 7.929443359375, 8.61865234375, 9.307861328125, 9.9970703125, 10.686279296875, 11.37548828125, 12.064697265625, 12.75390625, 13.443115234375, 14.13232421875, 14.821533203125, 15.5107421875, 16.199951171875, 16.88916015625, 17.578369140625, 18.267578125, 18.956787109375, 19.64599609375, 20.335205078125, 21.0244140625, 21.713623046875, 22.40283203125, 23.092041015625, 23.78125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 5.0, 4.0, 8.0, 12.0, 22.0, 17.0, 11.0, 16.0, 22.0, 27.0, 36.0, 41.0, 70.0, 75.0, 66.0, 77.0, 112.0, 136.0, 172.0, 233.0, 243.0, 313.0, 346.0, 361.0, 318.0, 256.0, 195.0, 157.0, 129.0, 120.0, 88.0, 74.0, 57.0, 49.0, 35.0, 32.0, 28.0, 18.0, 9.0, 15.0, 19.0, 7.0, 10.0, 6.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 4.0, 4.0], "bins": [-11.515625, -11.175537109375, -10.83544921875, -10.495361328125, -10.1552734375, -9.815185546875, -9.47509765625, -9.135009765625, -8.794921875, -8.454833984375, -8.11474609375, -7.774658203125, -7.4345703125, -7.094482421875, -6.75439453125, -6.414306640625, -6.07421875, -5.734130859375, -5.39404296875, -5.053955078125, -4.7138671875, -4.373779296875, -4.03369140625, -3.693603515625, -3.353515625, -3.013427734375, -2.67333984375, -2.333251953125, -1.9931640625, -1.653076171875, -1.31298828125, -0.972900390625, -0.6328125, -0.292724609375, 0.04736328125, 0.387451171875, 0.7275390625, 1.067626953125, 1.40771484375, 1.747802734375, 2.087890625, 2.427978515625, 2.76806640625, 3.108154296875, 3.4482421875, 3.788330078125, 4.12841796875, 4.468505859375, 4.80859375, 5.148681640625, 5.48876953125, 5.828857421875, 6.1689453125, 6.509033203125, 6.84912109375, 7.189208984375, 7.529296875, 7.869384765625, 8.20947265625, 8.549560546875, 8.8896484375, 9.229736328125, 9.56982421875, 9.909912109375, 10.25]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 5.0, 5.0, 6.0, 6.0, 16.0, 19.0, 19.0, 24.0, 25.0, 22.0, 42.0, 51.0, 49.0, 51.0, 86.0, 98.0, 134.0, 161.0, 157.0, 217.0, 304.0, 466.0, 2008.0, 217158.0, 3949513.0, 21029.0, 800.0, 377.0, 273.0, 202.0, 142.0, 148.0, 124.0, 87.0, 79.0, 75.0, 50.0, 46.0, 43.0, 35.0, 35.0, 27.0, 22.0, 8.0, 12.0, 10.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.84375, -58.83544921875, -56.8271484375, -54.81884765625, -52.810546875, -50.80224609375, -48.7939453125, -46.78564453125, -44.77734375, -42.76904296875, -40.7607421875, -38.75244140625, -36.744140625, -34.73583984375, -32.7275390625, -30.71923828125, -28.7109375, -26.70263671875, -24.6943359375, -22.68603515625, -20.677734375, -18.66943359375, -16.6611328125, -14.65283203125, -12.64453125, -10.63623046875, -8.6279296875, -6.61962890625, -4.611328125, -2.60302734375, -0.5947265625, 1.41357421875, 3.421875, 5.43017578125, 7.4384765625, 9.44677734375, 11.455078125, 13.46337890625, 15.4716796875, 17.47998046875, 19.48828125, 21.49658203125, 23.5048828125, 25.51318359375, 27.521484375, 29.52978515625, 31.5380859375, 33.54638671875, 35.5546875, 37.56298828125, 39.5712890625, 41.57958984375, 43.587890625, 45.59619140625, 47.6044921875, 49.61279296875, 51.62109375, 53.62939453125, 55.6376953125, 57.64599609375, 59.654296875, 61.66259765625, 63.6708984375, 65.67919921875, 67.6875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 7.0, 13.0, 29.0, 41.0, 64.0, 95.0, 113.0, 134.0, 123.0, 112.0, 78.0, 85.0, 51.0, 32.0, 13.0, 9.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.03321838378906, -68.19615936279297, -66.35910034179688, -64.52204132080078, -62.68497848510742, -60.84791946411133, -59.010860443115234, -57.17380142211914, -55.33673858642578, -53.49967956542969, -51.662620544433594, -49.8255615234375, -47.98849868774414, -46.15143966674805, -44.31438064575195, -42.47732162475586, -40.640262603759766, -38.80320358276367, -36.96614456176758, -35.12908172607422, -33.292022705078125, -31.45496368408203, -29.617904663085938, -27.780845642089844, -25.943784713745117, -24.106725692749023, -22.269664764404297, -20.432605743408203, -18.59554672241211, -16.758485794067383, -14.921426773071289, -13.084366798400879, -11.247306823730469, -9.410246849060059, -7.573187351226807, -5.736127853393555, -3.8990678787231445, -2.0620079040527344, -0.22494888305664062, 1.6121110916137695, 3.4491710662841797, 5.28623104095459, 7.123290538787842, 8.960350036621094, 10.797410011291504, 12.634469985961914, 14.471529006958008, 16.308589935302734, 18.145648956298828, 19.982707977294922, 21.81976890563965, 23.656827926635742, 25.49388885498047, 27.330947875976562, 29.168006896972656, 31.00506591796875, 32.842124938964844, 34.67918395996094, 36.51624298095703, 38.353302001953125, 40.190364837646484, 42.02742385864258, 43.86448287963867, 45.701541900634766, 47.538604736328125]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 1.0, 7.0, 4.0, 10.0, 14.0, 3.0, 20.0, 16.0, 14.0, 21.0, 27.0, 25.0, 35.0, 37.0, 38.0, 33.0, 38.0, 46.0, 39.0, 43.0, 36.0, 49.0, 32.0, 32.0, 34.0, 38.0, 38.0, 31.0, 32.0, 26.0, 30.0, 24.0, 18.0, 22.0, 24.0, 17.0, 14.0, 7.0, 6.0, 11.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.86654281616211, -48.255897521972656, -46.6452522277832, -45.03460693359375, -43.42396545410156, -41.81332015991211, -40.202674865722656, -38.5920295715332, -36.98138427734375, -35.3707389831543, -33.760093688964844, -32.149452209472656, -30.538806915283203, -28.92816162109375, -27.317516326904297, -25.706871032714844, -24.096229553222656, -22.485584259033203, -20.874940872192383, -19.26429557800293, -17.65365219116211, -16.043006896972656, -14.432361602783203, -12.821717262268066, -11.21107292175293, -9.600428581237793, -7.989783763885498, -6.379138946533203, -4.768494606018066, -3.1578502655029297, -1.5472049713134766, 0.06343936920166016, 1.6740798950195312, 3.284724473953247, 4.895369052886963, 6.506013870239258, 8.116658210754395, 9.727302551269531, 11.337947845458984, 12.948592185974121, 14.559236526489258, 16.16988182067871, 17.78052520751953, 19.391170501708984, 21.001815795898438, 22.612459182739258, 24.22310447692871, 25.83374786376953, 27.444393157958984, 29.055038452148438, 30.665681838989258, 32.276329040527344, 33.88697052001953, 35.497615814208984, 37.10826110839844, 38.71890640258789, 40.329551696777344, 41.9401969909668, 43.55084228515625, 45.16148376464844, 46.77212905883789, 48.382774353027344, 49.9934196472168, 51.60406494140625, 53.21470642089844]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 10.0, 7.0, 11.0, 8.0, 14.0, 13.0, 16.0, 12.0, 15.0, 21.0, 20.0, 31.0, 14.0, 22.0, 25.0, 31.0, 26.0, 27.0, 49.0, 36.0, 44.0, 35.0, 34.0, 38.0, 36.0, 37.0, 53.0, 33.0, 24.0, 26.0, 22.0, 26.0, 25.0, 31.0, 16.0, 21.0, 10.0, 15.0, 16.0, 8.0, 9.0, 5.0, 7.0, 7.0, 2.0, 3.0, 2.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.1328125, -6.90472412109375, -6.6766357421875, -6.44854736328125, -6.220458984375, -5.99237060546875, -5.7642822265625, -5.53619384765625, -5.30810546875, -5.08001708984375, -4.8519287109375, -4.62384033203125, -4.395751953125, -4.16766357421875, -3.9395751953125, -3.71148681640625, -3.4833984375, -3.25531005859375, -3.0272216796875, -2.79913330078125, -2.571044921875, -2.34295654296875, -2.1148681640625, -1.88677978515625, -1.65869140625, -1.43060302734375, -1.2025146484375, -0.97442626953125, -0.746337890625, -0.51824951171875, -0.2901611328125, -0.06207275390625, 0.166015625, 0.39410400390625, 0.6221923828125, 0.85028076171875, 1.078369140625, 1.30645751953125, 1.5345458984375, 1.76263427734375, 1.99072265625, 2.21881103515625, 2.4468994140625, 2.67498779296875, 2.903076171875, 3.13116455078125, 3.3592529296875, 3.58734130859375, 3.8154296875, 4.04351806640625, 4.2716064453125, 4.49969482421875, 4.727783203125, 4.95587158203125, 5.1839599609375, 5.41204833984375, 5.64013671875, 5.86822509765625, 6.0963134765625, 6.32440185546875, 6.552490234375, 6.78057861328125, 7.0086669921875, 7.23675537109375, 7.46484375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 5.0, 6.0, 13.0, 23.0, 32.0, 42.0, 86.0, 137.0, 189.0, 354.0, 583.0, 912.0, 1400.0, 2046.0, 3268.0, 4979.0, 7319.0, 11651.0, 18109.0, 28930.0, 46520.0, 76119.0, 128777.0, 216045.0, 198711.0, 116524.0, 69437.0, 42427.0, 26546.0, 16667.0, 10708.0, 7053.0, 4737.0, 2914.0, 1954.0, 1221.0, 780.0, 499.0, 291.0, 202.0, 127.0, 79.0, 52.0, 35.0, 16.0, 17.0, 7.0, 4.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.2578125, -1.2207183837890625, -1.183624267578125, -1.1465301513671875, -1.10943603515625, -1.0723419189453125, -1.035247802734375, -0.9981536865234375, -0.9610595703125, -0.9239654541015625, -0.886871337890625, -0.8497772216796875, -0.81268310546875, -0.7755889892578125, -0.738494873046875, -0.7014007568359375, -0.664306640625, -0.6272125244140625, -0.590118408203125, -0.5530242919921875, -0.51593017578125, -0.4788360595703125, -0.441741943359375, -0.4046478271484375, -0.3675537109375, -0.3304595947265625, -0.293365478515625, -0.2562713623046875, -0.21917724609375, -0.1820831298828125, -0.144989013671875, -0.1078948974609375, -0.07080078125, -0.0337066650390625, 0.003387451171875, 0.0404815673828125, 0.07757568359375, 0.1146697998046875, 0.151763916015625, 0.1888580322265625, 0.2259521484375, 0.2630462646484375, 0.300140380859375, 0.3372344970703125, 0.37432861328125, 0.4114227294921875, 0.448516845703125, 0.4856109619140625, 0.522705078125, 0.5597991943359375, 0.596893310546875, 0.6339874267578125, 0.67108154296875, 0.7081756591796875, 0.745269775390625, 0.7823638916015625, 0.8194580078125, 0.8565521240234375, 0.893646240234375, 0.9307403564453125, 0.96783447265625, 1.0049285888671875, 1.042022705078125, 1.0791168212890625, 1.1162109375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 13.0, 17.0, 15.0, 20.0, 21.0, 23.0, 20.0, 33.0, 34.0, 38.0, 46.0, 48.0, 40.0, 42.0, 43.0, 40.0, 1066.0, 56.0, 45.0, 42.0, 34.0, 30.0, 42.0, 29.0, 32.0, 23.0, 24.0, 20.0, 10.0, 21.0, 5.0, 11.0, 6.0, 8.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.640625, -5.46484375, -5.2890625, -5.11328125, -4.9375, -4.76171875, -4.5859375, -4.41015625, -4.234375, -4.05859375, -3.8828125, -3.70703125, -3.53125, -3.35546875, -3.1796875, -3.00390625, -2.828125, -2.65234375, -2.4765625, -2.30078125, -2.125, -1.94921875, -1.7734375, -1.59765625, -1.421875, -1.24609375, -1.0703125, -0.89453125, -0.71875, -0.54296875, -0.3671875, -0.19140625, -0.015625, 0.16015625, 0.3359375, 0.51171875, 0.6875, 0.86328125, 1.0390625, 1.21484375, 1.390625, 1.56640625, 1.7421875, 1.91796875, 2.09375, 2.26953125, 2.4453125, 2.62109375, 2.796875, 2.97265625, 3.1484375, 3.32421875, 3.5, 3.67578125, 3.8515625, 4.02734375, 4.203125, 4.37890625, 4.5546875, 4.73046875, 4.90625, 5.08203125, 5.2578125, 5.43359375, 5.609375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 10.0, 12.0, 8.0, 20.0, 39.0, 39.0, 76.0, 111.0, 153.0, 216.0, 326.0, 516.0, 819.0, 1269.0, 2003.0, 3180.0, 4893.0, 7964.0, 12811.0, 20387.0, 32579.0, 53967.0, 89005.0, 146293.0, 1264745.0, 176899.0, 107427.0, 65455.0, 39849.0, 24527.0, 15296.0, 9637.0, 6050.0, 3790.0, 2446.0, 1513.0, 963.0, 616.0, 450.0, 271.0, 171.0, 129.0, 71.0, 50.0, 28.0, 23.0, 15.0, 7.0, 7.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1279296875, -1.09234619140625, -1.0567626953125, -1.02117919921875, -0.985595703125, -0.95001220703125, -0.9144287109375, -0.87884521484375, -0.84326171875, -0.80767822265625, -0.7720947265625, -0.73651123046875, -0.700927734375, -0.66534423828125, -0.6297607421875, -0.59417724609375, -0.55859375, -0.52301025390625, -0.4874267578125, -0.45184326171875, -0.416259765625, -0.38067626953125, -0.3450927734375, -0.30950927734375, -0.27392578125, -0.23834228515625, -0.2027587890625, -0.16717529296875, -0.131591796875, -0.09600830078125, -0.0604248046875, -0.02484130859375, 0.0107421875, 0.04632568359375, 0.0819091796875, 0.11749267578125, 0.153076171875, 0.18865966796875, 0.2242431640625, 0.25982666015625, 0.29541015625, 0.33099365234375, 0.3665771484375, 0.40216064453125, 0.437744140625, 0.47332763671875, 0.5089111328125, 0.54449462890625, 0.580078125, 0.61566162109375, 0.6512451171875, 0.68682861328125, 0.722412109375, 0.75799560546875, 0.7935791015625, 0.82916259765625, 0.86474609375, 0.90032958984375, 0.9359130859375, 0.97149658203125, 1.007080078125, 1.04266357421875, 1.0782470703125, 1.11383056640625, 1.1494140625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 4.0, 5.0, 11.0, 9.0, 15.0, 15.0, 14.0, 30.0, 30.0, 33.0, 52.0, 43.0, 37.0, 50.0, 49.0, 63.0, 51.0, 52.0, 56.0, 44.0, 52.0, 31.0, 41.0, 31.0, 21.0, 26.0, 20.0, 29.0, 15.0, 14.0, 7.0, 12.0, 8.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0], "bins": [-0.001979827880859375, -0.0019268542528152466, -0.0018738806247711182, -0.0018209069967269897, -0.0017679333686828613, -0.001714959740638733, -0.0016619861125946045, -0.001609012484550476, -0.0015560388565063477, -0.0015030652284622192, -0.0014500916004180908, -0.0013971179723739624, -0.001344144344329834, -0.0012911707162857056, -0.0012381970882415771, -0.0011852234601974487, -0.0011322498321533203, -0.001079276204109192, -0.0010263025760650635, -0.0009733289480209351, -0.0009203553199768066, -0.0008673816919326782, -0.0008144080638885498, -0.0007614344358444214, -0.000708460807800293, -0.0006554871797561646, -0.0006025135517120361, -0.0005495399236679077, -0.0004965662956237793, -0.0004435926675796509, -0.00039061903953552246, -0.00033764541149139404, -0.0002846717834472656, -0.0002316981554031372, -0.0001787245273590088, -0.00012575089931488037, -7.277727127075195e-05, -1.9803643226623535e-05, 3.316998481750488e-05, 8.61436128616333e-05, 0.00013911724090576172, 0.00019209086894989014, 0.00024506449699401855, 0.00029803812503814697, 0.0003510117530822754, 0.0004039853811264038, 0.0004569590091705322, 0.0005099326372146606, 0.0005629062652587891, 0.0006158798933029175, 0.0006688535213470459, 0.0007218271493911743, 0.0007748007774353027, 0.0008277744054794312, 0.0008807480335235596, 0.000933721661567688, 0.0009866952896118164, 0.0010396689176559448, 0.0010926425457000732, 0.0011456161737442017, 0.00119858980178833, 0.0012515634298324585, 0.001304537057876587, 0.0013575106859207153, 0.0014104843139648438]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 5.0, 2.0, 6.0, 8.0, 8.0, 12.0, 10.0, 14.0, 23.0, 27.0, 25.0, 32.0, 39.0, 49.0, 82.0, 113.0, 153.0, 411.0, 1812.0, 1029906.0, 14499.0, 617.0, 211.0, 126.0, 90.0, 61.0, 47.0, 29.0, 34.0, 19.0, 18.0, 15.0, 8.0, 8.0, 9.0, 5.0, 1.0, 6.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.03765869140625, -0.03629875183105469, -0.034938812255859375, -0.03357887268066406, -0.03221893310546875, -0.030858993530273438, -0.029499053955078125, -0.028139114379882812, -0.0267791748046875, -0.025419235229492188, -0.024059295654296875, -0.022699356079101562, -0.02133941650390625, -0.019979476928710938, -0.018619537353515625, -0.017259597778320312, -0.015899658203125, -0.014539718627929688, -0.013179779052734375, -0.011819839477539062, -0.01045989990234375, -0.009099960327148438, -0.007740020751953125, -0.0063800811767578125, -0.0050201416015625, -0.0036602020263671875, -0.002300262451171875, -0.0009403228759765625, 0.00041961669921875, 0.0017795562744140625, 0.003139495849609375, 0.0044994354248046875, 0.005859375, 0.0072193145751953125, 0.008579254150390625, 0.009939193725585938, 0.01129913330078125, 0.012659072875976562, 0.014019012451171875, 0.015378952026367188, 0.0167388916015625, 0.018098831176757812, 0.019458770751953125, 0.020818710327148438, 0.02217864990234375, 0.023538589477539062, 0.024898529052734375, 0.026258468627929688, 0.027618408203125, 0.028978347778320312, 0.030338287353515625, 0.03169822692871094, 0.03305816650390625, 0.03441810607910156, 0.035778045654296875, 0.03713798522949219, 0.0384979248046875, 0.03985786437988281, 0.041217803955078125, 0.04257774353027344, 0.04393768310546875, 0.04529762268066406, 0.046657562255859375, 0.04801750183105469, 0.04937744140625]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 5.0, 62.0, 463.0, 423.0, 62.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006158868200145662, -0.00046125007793307304, -0.00030661336495541036, -0.00015197665197774768, 2.6600901037454605e-06, 0.0001572968321852386, 0.0003119335160590708, 0.0004665703163482249, 0.0006212070002220571, 0.0007758437423035502, 0.0009304804261773825, 0.0010851172264665365, 0.0012397539103403687, 0.001394390594214201, 0.001549027394503355, 0.001703664194792509, 0.0018583007622510195, 0.0020129375625401735, 0.002167574129998684, 0.002322210930287838, 0.002476847730576992, 0.002631484530866146, 0.0027861210983246565, 0.0029407578986138105, 0.0030953946989029646, 0.0032500314991921186, 0.003404668066650629, 0.003559304866939783, 0.003713941667228937, 0.003868578467518091, 0.004023214802145958, 0.004177851602435112, 0.004332488868385553, 0.004487125668674707, 0.0046417624689638615, 0.004796398803591728, 0.004951035603880882, 0.005105672404170036, 0.00526030920445919, 0.005414946004748344, 0.0055695828050374985, 0.0057242196053266525, 0.005878856405615807, 0.006033493205904961, 0.006188129540532827, 0.006342766340821981, 0.0064974031411111355, 0.0066520399414002895, 0.006806676276028156, 0.00696131307631731, 0.007115949876606464, 0.0072705866768956184, 0.007425223011523485, 0.007579859811812639, 0.007734496612101793, 0.00788913294672966, 0.008043770678341389, 0.008198407478630543, 0.008353044278919697, 0.00850768107920885, 0.008662317879498005, 0.008816954679787159, 0.008971590548753738, 0.009126227349042892, 0.009280864149332047]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 11.0, 10.0, 8.0, 8.0, 13.0, 13.0, 12.0, 21.0, 19.0, 25.0, 23.0, 34.0, 27.0, 35.0, 37.0, 39.0, 45.0, 44.0, 50.0, 41.0, 38.0, 32.0, 39.0, 32.0, 32.0, 36.0, 27.0, 32.0, 33.0, 36.0, 21.0, 31.0, 17.0, 16.0, 12.0, 14.0, 12.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00106126070022583, -0.0010304655879735947, -0.0009996704757213593, -0.0009688753634691238, -0.0009380802512168884, -0.000907285138964653, -0.0008764900267124176, -0.0008456949144601822, -0.0008148998022079468, -0.0007841046899557114, -0.000753309577703476, -0.0007225144654512405, -0.0006917193531990051, -0.0006609242409467697, -0.0006301291286945343, -0.0005993340164422989, -0.0005685389041900635, -0.0005377437919378281, -0.0005069486796855927, -0.00047615356743335724, -0.0004453584551811218, -0.0004145633429288864, -0.000383768230676651, -0.0003529731184244156, -0.0003221780061721802, -0.00029138289391994476, -0.00026058778166770935, -0.00022979266941547394, -0.00019899755716323853, -0.0001682024449110031, -0.0001374073326587677, -0.00010661222040653229, -7.581710815429688e-05, -4.502199590206146e-05, -1.422688364982605e-05, 1.6568228602409363e-05, 4.7363340854644775e-05, 7.815845310688019e-05, 0.0001089535653591156, 0.000139748677611351, 0.00017054378986358643, 0.00020133890211582184, 0.00023213401436805725, 0.00026292912662029266, 0.0002937242388725281, 0.0003245193511247635, 0.0003553144633769989, 0.0003861095756292343, 0.0004169046878814697, 0.00044769980013370514, 0.00047849491238594055, 0.000509290024638176, 0.0005400851368904114, 0.0005708802491426468, 0.0006016753613948822, 0.0006324704736471176, 0.000663265585899353, 0.0006940606981515884, 0.0007248558104038239, 0.0007556509226560593, 0.0007864460349082947, 0.0008172411471605301, 0.0008480362594127655, 0.0008788313716650009, 0.0009096264839172363]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 1.0, 10.0, 7.0, 11.0, 8.0, 14.0, 13.0, 16.0, 12.0, 15.0, 21.0, 20.0, 31.0, 14.0, 23.0, 24.0, 31.0, 26.0, 27.0, 49.0, 36.0, 44.0, 35.0, 34.0, 38.0, 36.0, 37.0, 53.0, 33.0, 24.0, 26.0, 22.0, 26.0, 25.0, 31.0, 16.0, 21.0, 10.0, 15.0, 16.0, 8.0, 9.0, 5.0, 7.0, 7.0, 2.0, 3.0, 2.0, 7.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.1328125, -6.90472412109375, -6.6766357421875, -6.44854736328125, -6.220458984375, -5.99237060546875, -5.7642822265625, -5.53619384765625, -5.30810546875, -5.08001708984375, -4.8519287109375, -4.62384033203125, -4.395751953125, -4.16766357421875, -3.9395751953125, -3.71148681640625, -3.4833984375, -3.25531005859375, -3.0272216796875, -2.79913330078125, -2.571044921875, -2.34295654296875, -2.1148681640625, -1.88677978515625, -1.65869140625, -1.43060302734375, -1.2025146484375, -0.97442626953125, -0.746337890625, -0.51824951171875, -0.2901611328125, -0.06207275390625, 0.166015625, 0.39410400390625, 0.6221923828125, 0.85028076171875, 1.078369140625, 1.30645751953125, 1.5345458984375, 1.76263427734375, 1.99072265625, 2.21881103515625, 2.4468994140625, 2.67498779296875, 2.903076171875, 3.13116455078125, 3.3592529296875, 3.58734130859375, 3.8154296875, 4.04351806640625, 4.2716064453125, 4.49969482421875, 4.727783203125, 4.95587158203125, 5.1839599609375, 5.41204833984375, 5.64013671875, 5.86822509765625, 6.0963134765625, 6.32440185546875, 6.552490234375, 6.78057861328125, 7.0086669921875, 7.23675537109375, 7.46484375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 4.0, 8.0, 9.0, 11.0, 9.0, 22.0, 25.0, 39.0, 46.0, 69.0, 74.0, 91.0, 109.0, 172.0, 248.0, 421.0, 791.0, 1592.0, 3644.0, 8697.0, 23064.0, 61624.0, 180445.0, 477799.0, 186153.0, 63537.0, 23431.0, 8879.0, 3679.0, 1649.0, 831.0, 435.0, 290.0, 151.0, 133.0, 90.0, 50.0, 53.0, 35.0, 28.0, 19.0, 22.0, 17.0, 12.0, 16.0, 10.0, 8.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.953125, -6.717529296875, -6.48193359375, -6.246337890625, -6.0107421875, -5.775146484375, -5.53955078125, -5.303955078125, -5.068359375, -4.832763671875, -4.59716796875, -4.361572265625, -4.1259765625, -3.890380859375, -3.65478515625, -3.419189453125, -3.18359375, -2.947998046875, -2.71240234375, -2.476806640625, -2.2412109375, -2.005615234375, -1.77001953125, -1.534423828125, -1.298828125, -1.063232421875, -0.82763671875, -0.592041015625, -0.3564453125, -0.120849609375, 0.11474609375, 0.350341796875, 0.5859375, 0.821533203125, 1.05712890625, 1.292724609375, 1.5283203125, 1.763916015625, 1.99951171875, 2.235107421875, 2.470703125, 2.706298828125, 2.94189453125, 3.177490234375, 3.4130859375, 3.648681640625, 3.88427734375, 4.119873046875, 4.35546875, 4.591064453125, 4.82666015625, 5.062255859375, 5.2978515625, 5.533447265625, 5.76904296875, 6.004638671875, 6.240234375, 6.475830078125, 6.71142578125, 6.947021484375, 7.1826171875, 7.418212890625, 7.65380859375, 7.889404296875, 8.125]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 2.0, 7.0, 9.0, 13.0, 9.0, 11.0, 20.0, 18.0, 23.0, 23.0, 36.0, 27.0, 30.0, 42.0, 52.0, 53.0, 54.0, 136.0, 1710.0, 260.0, 79.0, 61.0, 50.0, 33.0, 44.0, 38.0, 26.0, 27.0, 22.0, 19.0, 17.0, 16.0, 12.0, 15.0, 10.0, 12.0, 6.0, 8.0, 5.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-27.390625, -26.57861328125, -25.7666015625, -24.95458984375, -24.142578125, -23.33056640625, -22.5185546875, -21.70654296875, -20.89453125, -20.08251953125, -19.2705078125, -18.45849609375, -17.646484375, -16.83447265625, -16.0224609375, -15.21044921875, -14.3984375, -13.58642578125, -12.7744140625, -11.96240234375, -11.150390625, -10.33837890625, -9.5263671875, -8.71435546875, -7.90234375, -7.09033203125, -6.2783203125, -5.46630859375, -4.654296875, -3.84228515625, -3.0302734375, -2.21826171875, -1.40625, -0.59423828125, 0.2177734375, 1.02978515625, 1.841796875, 2.65380859375, 3.4658203125, 4.27783203125, 5.08984375, 5.90185546875, 6.7138671875, 7.52587890625, 8.337890625, 9.14990234375, 9.9619140625, 10.77392578125, 11.5859375, 12.39794921875, 13.2099609375, 14.02197265625, 14.833984375, 15.64599609375, 16.4580078125, 17.27001953125, 18.08203125, 18.89404296875, 19.7060546875, 20.51806640625, 21.330078125, 22.14208984375, 22.9541015625, 23.76611328125, 24.578125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 11.0, 8.0, 12.0, 12.0, 25.0, 25.0, 35.0, 37.0, 31.0, 46.0, 57.0, 107.0, 94.0, 183.0, 251.0, 472.0, 801.0, 2646.0, 459542.0, 2674891.0, 3939.0, 1030.0, 488.0, 254.0, 167.0, 108.0, 89.0, 58.0, 57.0, 42.0, 38.0, 19.0, 33.0, 13.0, 11.0, 10.0, 11.0, 8.0, 9.0, 8.0, 4.0, 1.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-61.40625, -59.5498046875, -57.693359375, -55.8369140625, -53.98046875, -52.1240234375, -50.267578125, -48.4111328125, -46.5546875, -44.6982421875, -42.841796875, -40.9853515625, -39.12890625, -37.2724609375, -35.416015625, -33.5595703125, -31.703125, -29.8466796875, -27.990234375, -26.1337890625, -24.27734375, -22.4208984375, -20.564453125, -18.7080078125, -16.8515625, -14.9951171875, -13.138671875, -11.2822265625, -9.42578125, -7.5693359375, -5.712890625, -3.8564453125, -2.0, -0.1435546875, 1.712890625, 3.5693359375, 5.42578125, 7.2822265625, 9.138671875, 10.9951171875, 12.8515625, 14.7080078125, 16.564453125, 18.4208984375, 20.27734375, 22.1337890625, 23.990234375, 25.8466796875, 27.703125, 29.5595703125, 31.416015625, 33.2724609375, 35.12890625, 36.9853515625, 38.841796875, 40.6982421875, 42.5546875, 44.4111328125, 46.267578125, 48.1240234375, 49.98046875, 51.8369140625, 53.693359375, 55.5498046875, 57.40625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 68.0, 672.0, 260.0, 13.0, 1.0, 2.0], "bins": [-266.497802734375, -262.031005859375, -257.5642395019531, -253.09744262695312, -248.6306610107422, -244.16387939453125, -239.69708251953125, -235.2303009033203, -230.76351928710938, -226.29673767089844, -221.8299560546875, -217.3631591796875, -212.89637756347656, -208.42959594726562, -203.96279907226562, -199.4960174560547, -195.02923583984375, -190.5624542236328, -186.09567260742188, -181.62887573242188, -177.16209411621094, -172.6953125, -168.228515625, -163.76173400878906, -159.29495239257812, -154.8281707763672, -150.36138916015625, -145.89459228515625, -141.4278106689453, -136.96102905273438, -132.49423217773438, -128.02745056152344, -123.56065368652344, -119.0938720703125, -114.62708282470703, -110.16029357910156, -105.69351196289062, -101.22673034667969, -96.75994110107422, -92.29315185546875, -87.82637023925781, -83.35958862304688, -78.8927993774414, -74.42601013183594, -69.959228515625, -65.49244689941406, -61.025657653808594, -56.55887222290039, -52.09208679199219, -47.625301361083984, -43.15851593017578, -38.69173049926758, -34.224945068359375, -29.758159637451172, -25.29137420654297, -20.824588775634766, -16.357803344726562, -11.89101791381836, -7.424232482910156, -2.957447052001953, 1.50933837890625, 5.976123809814453, 10.442909240722656, 14.90969467163086, 19.376480102539062]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 7.0, 8.0, 12.0, 8.0, 13.0, 16.0, 17.0, 12.0, 13.0, 22.0, 23.0, 34.0, 32.0, 34.0, 42.0, 28.0, 44.0, 39.0, 35.0, 38.0, 27.0, 41.0, 36.0, 40.0, 38.0, 36.0, 32.0, 37.0, 28.0, 29.0, 23.0, 16.0, 15.0, 22.0, 16.0, 14.0, 15.0, 13.0, 7.0, 10.0, 8.0, 8.0, 0.0, 1.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-67.62173461914062, -65.60232543945312, -63.582908630371094, -61.56349563598633, -59.54408264160156, -57.5246696472168, -55.50525665283203, -53.485843658447266, -51.4664306640625, -49.447017669677734, -47.42760467529297, -45.4081916809082, -43.38877868652344, -41.36936569213867, -39.349952697753906, -37.33053970336914, -35.311126708984375, -33.29171371459961, -31.272300720214844, -29.252887725830078, -27.233474731445312, -25.214061737060547, -23.19464874267578, -21.175235748291016, -19.15582275390625, -17.136409759521484, -15.116996765136719, -13.097583770751953, -11.078170776367188, -9.058757781982422, -7.039344787597656, -5.019931793212891, -3.0005264282226562, -0.9811134338378906, 1.038299560546875, 3.0577125549316406, 5.077125549316406, 7.096538543701172, 9.115951538085938, 11.135364532470703, 13.154777526855469, 15.174190521240234, 17.193603515625, 19.213016510009766, 21.23242950439453, 23.251842498779297, 25.271255493164062, 27.290668487548828, 29.310081481933594, 31.32949447631836, 33.348907470703125, 35.36832046508789, 37.387733459472656, 39.40714645385742, 41.42655944824219, 43.44597244262695, 45.46538543701172, 47.484798431396484, 49.50421142578125, 51.523624420166016, 53.54303741455078, 55.56245040893555, 57.58186340332031, 59.60127639770508, 61.620689392089844]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 7.0, 8.0, 11.0, 7.0, 10.0, 16.0, 15.0, 15.0, 20.0, 26.0, 20.0, 28.0, 19.0, 30.0, 28.0, 31.0, 32.0, 38.0, 57.0, 49.0, 40.0, 37.0, 36.0, 37.0, 27.0, 41.0, 38.0, 29.0, 23.0, 28.0, 25.0, 29.0, 17.0, 18.0, 18.0, 14.0, 12.0, 9.0, 12.0, 9.0, 6.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-8.015625, -7.764892578125, -7.51416015625, -7.263427734375, -7.0126953125, -6.761962890625, -6.51123046875, -6.260498046875, -6.009765625, -5.759033203125, -5.50830078125, -5.257568359375, -5.0068359375, -4.756103515625, -4.50537109375, -4.254638671875, -4.00390625, -3.753173828125, -3.50244140625, -3.251708984375, -3.0009765625, -2.750244140625, -2.49951171875, -2.248779296875, -1.998046875, -1.747314453125, -1.49658203125, -1.245849609375, -0.9951171875, -0.744384765625, -0.49365234375, -0.242919921875, 0.0078125, 0.258544921875, 0.50927734375, 0.760009765625, 1.0107421875, 1.261474609375, 1.51220703125, 1.762939453125, 2.013671875, 2.264404296875, 2.51513671875, 2.765869140625, 3.0166015625, 3.267333984375, 3.51806640625, 3.768798828125, 4.01953125, 4.270263671875, 4.52099609375, 4.771728515625, 5.0224609375, 5.273193359375, 5.52392578125, 5.774658203125, 6.025390625, 6.276123046875, 6.52685546875, 6.777587890625, 7.0283203125, 7.279052734375, 7.52978515625, 7.780517578125, 8.03125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 3.0, 2.0, 7.0, 4.0, 10.0, 9.0, 12.0, 10.0, 21.0, 18.0, 31.0, 24.0, 44.0, 49.0, 68.0, 58.0, 120.0, 180.0, 311.0, 768.0, 2952.0, 25932.0, 1128912.0, 2921941.0, 103854.0, 6368.0, 1316.0, 465.0, 227.0, 136.0, 92.0, 59.0, 57.0, 38.0, 32.0, 33.0, 20.0, 21.0, 13.0, 14.0, 9.0, 7.0, 10.0, 6.0, 5.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-26.0, -25.166748046875, -24.33349609375, -23.500244140625, -22.6669921875, -21.833740234375, -21.00048828125, -20.167236328125, -19.333984375, -18.500732421875, -17.66748046875, -16.834228515625, -16.0009765625, -15.167724609375, -14.33447265625, -13.501220703125, -12.66796875, -11.834716796875, -11.00146484375, -10.168212890625, -9.3349609375, -8.501708984375, -7.66845703125, -6.835205078125, -6.001953125, -5.168701171875, -4.33544921875, -3.502197265625, -2.6689453125, -1.835693359375, -1.00244140625, -0.169189453125, 0.6640625, 1.497314453125, 2.33056640625, 3.163818359375, 3.9970703125, 4.830322265625, 5.66357421875, 6.496826171875, 7.330078125, 8.163330078125, 8.99658203125, 9.829833984375, 10.6630859375, 11.496337890625, 12.32958984375, 13.162841796875, 13.99609375, 14.829345703125, 15.66259765625, 16.495849609375, 17.3291015625, 18.162353515625, 18.99560546875, 19.828857421875, 20.662109375, 21.495361328125, 22.32861328125, 23.161865234375, 23.9951171875, 24.828369140625, 25.66162109375, 26.494873046875, 27.328125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 10.0, 9.0, 5.0, 15.0, 23.0, 26.0, 45.0, 62.0, 98.0, 146.0, 172.0, 280.0, 433.0, 586.0, 653.0, 511.0, 344.0, 230.0, 137.0, 95.0, 58.0, 48.0, 34.0, 19.0, 12.0, 6.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-19.34375, -18.72314453125, -18.1025390625, -17.48193359375, -16.861328125, -16.24072265625, -15.6201171875, -14.99951171875, -14.37890625, -13.75830078125, -13.1376953125, -12.51708984375, -11.896484375, -11.27587890625, -10.6552734375, -10.03466796875, -9.4140625, -8.79345703125, -8.1728515625, -7.55224609375, -6.931640625, -6.31103515625, -5.6904296875, -5.06982421875, -4.44921875, -3.82861328125, -3.2080078125, -2.58740234375, -1.966796875, -1.34619140625, -0.7255859375, -0.10498046875, 0.515625, 1.13623046875, 1.7568359375, 2.37744140625, 2.998046875, 3.61865234375, 4.2392578125, 4.85986328125, 5.48046875, 6.10107421875, 6.7216796875, 7.34228515625, 7.962890625, 8.58349609375, 9.2041015625, 9.82470703125, 10.4453125, 11.06591796875, 11.6865234375, 12.30712890625, 12.927734375, 13.54833984375, 14.1689453125, 14.78955078125, 15.41015625, 16.03076171875, 16.6513671875, 17.27197265625, 17.892578125, 18.51318359375, 19.1337890625, 19.75439453125, 20.375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 6.0, 14.0, 4.0, 19.0, 40.0, 43.0, 68.0, 91.0, 125.0, 201.0, 224.0, 370.0, 638.0, 5900.0, 4141783.0, 42478.0, 881.0, 359.0, 241.0, 190.0, 140.0, 122.0, 114.0, 64.0, 50.0, 42.0, 22.0, 8.0, 9.0, 17.0, 5.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-111.6875, -108.2666015625, -104.845703125, -101.4248046875, -98.00390625, -94.5830078125, -91.162109375, -87.7412109375, -84.3203125, -80.8994140625, -77.478515625, -74.0576171875, -70.63671875, -67.2158203125, -63.794921875, -60.3740234375, -56.953125, -53.5322265625, -50.111328125, -46.6904296875, -43.26953125, -39.8486328125, -36.427734375, -33.0068359375, -29.5859375, -26.1650390625, -22.744140625, -19.3232421875, -15.90234375, -12.4814453125, -9.060546875, -5.6396484375, -2.21875, 1.2021484375, 4.623046875, 8.0439453125, 11.46484375, 14.8857421875, 18.306640625, 21.7275390625, 25.1484375, 28.5693359375, 31.990234375, 35.4111328125, 38.83203125, 42.2529296875, 45.673828125, 49.0947265625, 52.515625, 55.9365234375, 59.357421875, 62.7783203125, 66.19921875, 69.6201171875, 73.041015625, 76.4619140625, 79.8828125, 83.3037109375, 86.724609375, 90.1455078125, 93.56640625, 96.9873046875, 100.408203125, 103.8291015625, 107.25]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 27.0, 186.0, 464.0, 275.0, 48.0, 11.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-360.4863586425781, -353.8907470703125, -347.2951354980469, -340.69952392578125, -334.1039123535156, -327.50830078125, -320.9126892089844, -314.31707763671875, -307.72149658203125, -301.1258850097656, -294.5302734375, -287.9346618652344, -281.33905029296875, -274.7434387207031, -268.1478271484375, -261.55224609375, -254.95660400390625, -248.36099243164062, -241.765380859375, -235.16976928710938, -228.57415771484375, -221.97854614257812, -215.38294982910156, -208.78733825683594, -202.1917266845703, -195.5961151123047, -189.00050354003906, -182.40489196777344, -175.80929565429688, -169.21368408203125, -162.61807250976562, -156.0224609375, -149.42684936523438, -142.83123779296875, -136.23562622070312, -129.6400146484375, -123.0444107055664, -116.44879913330078, -109.85319519042969, -103.25758361816406, -96.66197204589844, -90.06636047363281, -83.47074890136719, -76.8751449584961, -70.27953338623047, -63.683921813964844, -57.088314056396484, -50.492706298828125, -43.897090911865234, -37.301483154296875, -30.70587158203125, -24.110261917114258, -17.514652252197266, -10.91904067993164, -4.323432922363281, 2.272174835205078, 8.867786407470703, 15.463396072387695, 22.059005737304688, 28.65461540222168, 35.25022506713867, 41.8458366394043, 48.441444396972656, 55.037052154541016, 61.63266372680664]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 6.0, 8.0, 11.0, 8.0, 10.0, 12.0, 13.0, 16.0, 26.0, 25.0, 33.0, 28.0, 28.0, 32.0, 37.0, 50.0, 35.0, 39.0, 36.0, 40.0, 53.0, 36.0, 54.0, 36.0, 30.0, 33.0, 34.0, 26.0, 34.0, 25.0, 16.0, 18.0, 16.0, 21.0, 12.0, 15.0, 5.0, 15.0, 7.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-49.81153106689453, -48.25680923461914, -46.70208740234375, -45.147361755371094, -43.5926399230957, -42.03791809082031, -40.48319625854492, -38.92847442626953, -37.37375259399414, -35.81903076171875, -34.26430892944336, -32.70958709716797, -31.154863357543945, -29.600139617919922, -28.04541778564453, -26.49069595336914, -24.935972213745117, -23.381250381469727, -21.826526641845703, -20.271804809570312, -18.717082977294922, -17.16236114501953, -15.607637405395508, -14.052915573120117, -12.49819278717041, -10.943470001220703, -9.388748168945312, -7.8340253829956055, -6.279303073883057, -4.724580764770508, -3.169857978820801, -1.6151361465454102, -0.060413360595703125, 1.4943090677261353, 3.0490314960479736, 4.603754043579102, 6.15847635269165, 7.713198661804199, 9.267921447753906, 10.822643280029297, 12.377366065979004, 13.932088851928711, 15.486810684204102, 17.041534423828125, 18.596256256103516, 20.150978088378906, 21.705699920654297, 23.260421752929688, 24.81514549255371, 26.3698673248291, 27.924591064453125, 29.479312896728516, 31.034034729003906, 32.5887565612793, 34.14347839355469, 35.698204040527344, 37.252925872802734, 38.807647705078125, 40.362369537353516, 41.917091369628906, 43.47181701660156, 45.02653884887695, 46.581260681152344, 48.135982513427734, 49.690704345703125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 8.0, 17.0, 5.0, 11.0, 11.0, 14.0, 19.0, 22.0, 22.0, 23.0, 20.0, 16.0, 28.0, 27.0, 44.0, 30.0, 51.0, 40.0, 39.0, 49.0, 38.0, 37.0, 51.0, 41.0, 23.0, 33.0, 37.0, 28.0, 27.0, 22.0, 19.0, 25.0, 15.0, 20.0, 15.0, 14.0, 13.0, 5.0, 3.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.55859375, -7.30609130859375, -7.0535888671875, -6.80108642578125, -6.548583984375, -6.29608154296875, -6.0435791015625, -5.79107666015625, -5.53857421875, -5.28607177734375, -5.0335693359375, -4.78106689453125, -4.528564453125, -4.27606201171875, -4.0235595703125, -3.77105712890625, -3.5185546875, -3.26605224609375, -3.0135498046875, -2.76104736328125, -2.508544921875, -2.25604248046875, -2.0035400390625, -1.75103759765625, -1.49853515625, -1.24603271484375, -0.9935302734375, -0.74102783203125, -0.488525390625, -0.23602294921875, 0.0164794921875, 0.26898193359375, 0.521484375, 0.77398681640625, 1.0264892578125, 1.27899169921875, 1.531494140625, 1.78399658203125, 2.0364990234375, 2.28900146484375, 2.54150390625, 2.79400634765625, 3.0465087890625, 3.29901123046875, 3.551513671875, 3.80401611328125, 4.0565185546875, 4.30902099609375, 4.5615234375, 4.81402587890625, 5.0665283203125, 5.31903076171875, 5.571533203125, 5.82403564453125, 6.0765380859375, 6.32904052734375, 6.58154296875, 6.83404541015625, 7.0865478515625, 7.33905029296875, 7.591552734375, 7.84405517578125, 8.0965576171875, 8.34906005859375, 8.6015625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 8.0, 6.0, 10.0, 16.0, 39.0, 49.0, 71.0, 126.0, 187.0, 268.0, 437.0, 655.0, 1101.0, 1552.0, 2450.0, 3772.0, 5810.0, 9110.0, 14171.0, 22815.0, 35903.0, 59225.0, 97962.0, 166807.0, 228347.0, 156867.0, 91926.0, 55897.0, 33845.0, 21248.0, 13515.0, 8735.0, 5437.0, 3464.0, 2368.0, 1555.0, 1053.0, 609.0, 400.0, 281.0, 140.0, 115.0, 76.0, 51.0, 26.0, 23.0, 13.0, 11.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.141876220703125, -1.10308837890625, -1.064300537109375, -1.0255126953125, -0.986724853515625, -0.94793701171875, -0.909149169921875, -0.870361328125, -0.831573486328125, -0.79278564453125, -0.753997802734375, -0.7152099609375, -0.676422119140625, -0.63763427734375, -0.598846435546875, -0.56005859375, -0.521270751953125, -0.48248291015625, -0.443695068359375, -0.4049072265625, -0.366119384765625, -0.32733154296875, -0.288543701171875, -0.249755859375, -0.210968017578125, -0.17218017578125, -0.133392333984375, -0.0946044921875, -0.055816650390625, -0.01702880859375, 0.021759033203125, 0.060546875, 0.099334716796875, 0.13812255859375, 0.176910400390625, 0.2156982421875, 0.254486083984375, 0.29327392578125, 0.332061767578125, 0.370849609375, 0.409637451171875, 0.44842529296875, 0.487213134765625, 0.5260009765625, 0.564788818359375, 0.60357666015625, 0.642364501953125, 0.68115234375, 0.719940185546875, 0.75872802734375, 0.797515869140625, 0.8363037109375, 0.875091552734375, 0.91387939453125, 0.952667236328125, 0.991455078125, 1.030242919921875, 1.06903076171875, 1.107818603515625, 1.1466064453125, 1.185394287109375, 1.22418212890625, 1.262969970703125, 1.3017578125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 2.0, 6.0, 5.0, 5.0, 15.0, 12.0, 11.0, 19.0, 25.0, 19.0, 30.0, 33.0, 31.0, 40.0, 34.0, 42.0, 49.0, 39.0, 34.0, 1058.0, 38.0, 51.0, 36.0, 39.0, 35.0, 41.0, 28.0, 34.0, 35.0, 28.0, 27.0, 13.0, 14.0, 19.0, 15.0, 11.0, 12.0, 7.0, 5.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0], "bins": [-5.69921875, -5.528564453125, -5.35791015625, -5.187255859375, -5.0166015625, -4.845947265625, -4.67529296875, -4.504638671875, -4.333984375, -4.163330078125, -3.99267578125, -3.822021484375, -3.6513671875, -3.480712890625, -3.31005859375, -3.139404296875, -2.96875, -2.798095703125, -2.62744140625, -2.456787109375, -2.2861328125, -2.115478515625, -1.94482421875, -1.774169921875, -1.603515625, -1.432861328125, -1.26220703125, -1.091552734375, -0.9208984375, -0.750244140625, -0.57958984375, -0.408935546875, -0.23828125, -0.067626953125, 0.10302734375, 0.273681640625, 0.4443359375, 0.614990234375, 0.78564453125, 0.956298828125, 1.126953125, 1.297607421875, 1.46826171875, 1.638916015625, 1.8095703125, 1.980224609375, 2.15087890625, 2.321533203125, 2.4921875, 2.662841796875, 2.83349609375, 3.004150390625, 3.1748046875, 3.345458984375, 3.51611328125, 3.686767578125, 3.857421875, 4.028076171875, 4.19873046875, 4.369384765625, 4.5400390625, 4.710693359375, 4.88134765625, 5.052001953125, 5.22265625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 4.0, 14.0, 22.0, 39.0, 58.0, 84.0, 130.0, 221.0, 334.0, 547.0, 824.0, 1359.0, 2305.0, 3755.0, 6182.0, 10427.0, 17941.0, 30189.0, 52425.0, 90520.0, 160765.0, 1297047.0, 179307.0, 101854.0, 58141.0, 33698.0, 19725.0, 11744.0, 6865.0, 4118.0, 2455.0, 1469.0, 933.0, 608.0, 348.0, 234.0, 162.0, 88.0, 65.0, 42.0, 26.0, 19.0, 14.0, 6.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.267578125, -1.2261505126953125, -1.184722900390625, -1.1432952880859375, -1.10186767578125, -1.0604400634765625, -1.019012451171875, -0.9775848388671875, -0.9361572265625, -0.8947296142578125, -0.853302001953125, -0.8118743896484375, -0.77044677734375, -0.7290191650390625, -0.687591552734375, -0.6461639404296875, -0.604736328125, -0.5633087158203125, -0.521881103515625, -0.4804534912109375, -0.43902587890625, -0.3975982666015625, -0.356170654296875, -0.3147430419921875, -0.2733154296875, -0.2318878173828125, -0.190460205078125, -0.1490325927734375, -0.10760498046875, -0.0661773681640625, -0.024749755859375, 0.0166778564453125, 0.05810546875, 0.0995330810546875, 0.140960693359375, 0.1823883056640625, 0.22381591796875, 0.2652435302734375, 0.306671142578125, 0.3480987548828125, 0.3895263671875, 0.4309539794921875, 0.472381591796875, 0.5138092041015625, 0.55523681640625, 0.5966644287109375, 0.638092041015625, 0.6795196533203125, 0.720947265625, 0.7623748779296875, 0.803802490234375, 0.8452301025390625, 0.88665771484375, 0.9280853271484375, 0.969512939453125, 1.0109405517578125, 1.0523681640625, 1.0937957763671875, 1.135223388671875, 1.1766510009765625, 1.21807861328125, 1.2595062255859375, 1.300933837890625, 1.3423614501953125, 1.3837890625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 5.0, 8.0, 15.0, 17.0, 17.0, 20.0, 25.0, 40.0, 35.0, 34.0, 43.0, 52.0, 50.0, 62.0, 51.0, 62.0, 54.0, 63.0, 41.0, 42.0, 36.0, 35.0, 19.0, 28.0, 17.0, 17.0, 12.0, 11.0, 21.0, 11.0, 9.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016422271728515625, -0.0015890896320343018, -0.001535952091217041, -0.0014828145503997803, -0.0014296770095825195, -0.0013765394687652588, -0.001323401927947998, -0.0012702643871307373, -0.0012171268463134766, -0.0011639893054962158, -0.001110851764678955, -0.0010577142238616943, -0.0010045766830444336, -0.0009514391422271729, -0.0008983016014099121, -0.0008451640605926514, -0.0007920265197753906, -0.0007388889789581299, -0.0006857514381408691, -0.0006326138973236084, -0.0005794763565063477, -0.0005263388156890869, -0.00047320127487182617, -0.00042006373405456543, -0.0003669261932373047, -0.00031378865242004395, -0.0002606511116027832, -0.00020751357078552246, -0.00015437602996826172, -0.00010123848915100098, -4.8100948333740234e-05, 5.036592483520508e-06, 5.817413330078125e-05, 0.00011131167411804199, 0.00016444921493530273, 0.00021758675575256348, 0.0002707242965698242, 0.00032386183738708496, 0.0003769993782043457, 0.00043013691902160645, 0.0004832744598388672, 0.0005364120006561279, 0.0005895495414733887, 0.0006426870822906494, 0.0006958246231079102, 0.0007489621639251709, 0.0008020997047424316, 0.0008552372455596924, 0.0009083747863769531, 0.0009615123271942139, 0.0010146498680114746, 0.0010677874088287354, 0.001120924949645996, 0.0011740624904632568, 0.0012272000312805176, 0.0012803375720977783, 0.001333475112915039, 0.0013866126537322998, 0.0014397501945495605, 0.0014928877353668213, 0.001546025276184082, 0.0015991628170013428, 0.0016523003578186035, 0.0017054378986358643, 0.001758575439453125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 4.0, 6.0, 9.0, 9.0, 18.0, 17.0, 17.0, 15.0, 31.0, 44.0, 44.0, 50.0, 77.0, 115.0, 177.0, 452.0, 2042.0, 1024301.0, 19655.0, 685.0, 263.0, 136.0, 81.0, 55.0, 55.0, 32.0, 33.0, 30.0, 13.0, 19.0, 13.0, 10.0, 14.0, 3.0, 8.0, 3.0, 3.0, 0.0, 6.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.045623779296875, -0.04427003860473633, -0.042916297912597656, -0.041562557220458984, -0.04020881652832031, -0.03885507583618164, -0.03750133514404297, -0.0361475944519043, -0.034793853759765625, -0.03344011306762695, -0.03208637237548828, -0.03073263168334961, -0.029378890991210938, -0.028025150299072266, -0.026671409606933594, -0.025317668914794922, -0.02396392822265625, -0.022610187530517578, -0.021256446838378906, -0.019902706146240234, -0.018548965454101562, -0.01719522476196289, -0.01584148406982422, -0.014487743377685547, -0.013134002685546875, -0.011780261993408203, -0.010426521301269531, -0.00907278060913086, -0.0077190399169921875, -0.006365299224853516, -0.005011558532714844, -0.003657817840576172, -0.0023040771484375, -0.0009503364562988281, 0.00040340423583984375, 0.0017571449279785156, 0.0031108856201171875, 0.004464626312255859, 0.005818367004394531, 0.007172107696533203, 0.008525848388671875, 0.009879589080810547, 0.011233329772949219, 0.01258707046508789, 0.013940811157226562, 0.015294551849365234, 0.016648292541503906, 0.018002033233642578, 0.01935577392578125, 0.020709514617919922, 0.022063255310058594, 0.023416996002197266, 0.024770736694335938, 0.02612447738647461, 0.02747821807861328, 0.028831958770751953, 0.030185699462890625, 0.0315394401550293, 0.03289318084716797, 0.03424692153930664, 0.03560066223144531, 0.036954402923583984, 0.038308143615722656, 0.03966188430786133, 0.041015625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 17.0, 32.0, 69.0, 126.0, 188.0, 196.0, 173.0, 98.0, 54.0, 34.0, 8.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022862080950289965, -0.002235752996057272, -0.0021852978970855474, -0.002134842798113823, -0.0020843876991420984, -0.002033932600170374, -0.0019834775011986494, -0.001933022285811603, -0.0018825671868398786, -0.001832112087868154, -0.0017816569888964295, -0.001731201889924705, -0.0016807467909529805, -0.0016302915755659342, -0.0015798364765942097, -0.0015293813776224852, -0.0014789262786507607, -0.0014284711796790361, -0.0013780160807073116, -0.0013275609817355871, -0.0012771058827638626, -0.001226650783792138, -0.0011761956848204136, -0.0011257404694333673, -0.0010752854868769646, -0.00102483038790524, -0.0009743752889335155, -0.000923920189961791, -0.0008734650327824056, -0.0008230099338106811, -0.0007725548348389566, -0.0007220996776595712, -0.0006716445786878467, -0.0006211894797161222, -0.0005707343807443976, -0.0005202792817726731, -0.0004698241245932877, -0.0004193690256215632, -0.0003689139266498387, -0.0003184587985742837, -0.0002680036996025592, -0.00021754858607891947, -0.00016709347255527973, -0.00011663837358355522, -6.618326005991548e-05, -1.5728146536275744e-05, 3.4726952435448766e-05, 8.518208051100373e-05, 0.00013563717948272824, 0.00018609229300636798, 0.00023654740653000772, 0.00028700250550173223, 0.0003374576335772872, 0.0003879127325490117, 0.0004383678315207362, 0.0004888229304924607, 0.0005392780294641852, 0.0005897331284359097, 0.0006401882274076343, 0.0006906433263793588, 0.0007410984835587442, 0.0007915535825304687, 0.0008420086815021932, 0.0008924638386815786, 0.0009429189376533031]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 6.0, 13.0, 7.0, 6.0, 10.0, 17.0, 5.0, 19.0, 21.0, 22.0, 28.0, 25.0, 28.0, 40.0, 29.0, 34.0, 30.0, 26.0, 45.0, 36.0, 40.0, 40.0, 42.0, 39.0, 35.0, 35.0, 36.0, 35.0, 26.0, 31.0, 23.0, 26.0, 22.0, 22.0, 23.0, 15.0, 11.0, 11.0, 7.0, 6.0, 10.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0009571313858032227, -0.0009287148714065552, -0.0009002983570098877, -0.0008718818426132202, -0.0008434653282165527, -0.0008150488138198853, -0.0007866322994232178, -0.0007582157850265503, -0.0007297992706298828, -0.0007013827562332153, -0.0006729662418365479, -0.0006445497274398804, -0.0006161332130432129, -0.0005877166986465454, -0.0005593001842498779, -0.0005308836698532104, -0.000502467155456543, -0.0004740506410598755, -0.000445634126663208, -0.00041721761226654053, -0.00038880109786987305, -0.00036038458347320557, -0.0003319680690765381, -0.0003035515546798706, -0.0002751350402832031, -0.00024671852588653564, -0.00021830201148986816, -0.00018988549709320068, -0.0001614689826965332, -0.00013305246829986572, -0.00010463595390319824, -7.621943950653076e-05, -4.780292510986328e-05, -1.93864107131958e-05, 9.03010368347168e-06, 3.744661808013916e-05, 6.586313247680664e-05, 9.427964687347412e-05, 0.0001226961612701416, 0.00015111267566680908, 0.00017952919006347656, 0.00020794570446014404, 0.00023636221885681152, 0.000264778733253479, 0.0002931952476501465, 0.00032161176204681396, 0.00035002827644348145, 0.0003784447908401489, 0.0004068613052368164, 0.0004352778196334839, 0.00046369433403015137, 0.0004921108484268188, 0.0005205273628234863, 0.0005489438772201538, 0.0005773603916168213, 0.0006057769060134888, 0.0006341934204101562, 0.0006626099348068237, 0.0006910264492034912, 0.0007194429636001587, 0.0007478594779968262, 0.0007762759923934937, 0.0008046925067901611, 0.0008331090211868286, 0.0008615255355834961]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 1.0, 5.0, 7.0, 18.0, 5.0, 11.0, 11.0, 14.0, 19.0, 22.0, 21.0, 24.0, 20.0, 16.0, 27.0, 28.0, 44.0, 30.0, 51.0, 40.0, 38.0, 50.0, 38.0, 37.0, 51.0, 40.0, 24.0, 33.0, 35.0, 29.0, 28.0, 22.0, 19.0, 25.0, 15.0, 20.0, 15.0, 14.0, 13.0, 5.0, 3.0, 6.0, 5.0, 5.0, 3.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.5625, -7.3099365234375, -7.057373046875, -6.8048095703125, -6.55224609375, -6.2996826171875, -6.047119140625, -5.7945556640625, -5.5419921875, -5.2894287109375, -5.036865234375, -4.7843017578125, -4.53173828125, -4.2791748046875, -4.026611328125, -3.7740478515625, -3.521484375, -3.2689208984375, -3.016357421875, -2.7637939453125, -2.51123046875, -2.2586669921875, -2.006103515625, -1.7535400390625, -1.5009765625, -1.2484130859375, -0.995849609375, -0.7432861328125, -0.49072265625, -0.2381591796875, 0.014404296875, 0.2669677734375, 0.51953125, 0.7720947265625, 1.024658203125, 1.2772216796875, 1.52978515625, 1.7823486328125, 2.034912109375, 2.2874755859375, 2.5400390625, 2.7926025390625, 3.045166015625, 3.2977294921875, 3.55029296875, 3.8028564453125, 4.055419921875, 4.3079833984375, 4.560546875, 4.8131103515625, 5.065673828125, 5.3182373046875, 5.57080078125, 5.8233642578125, 6.075927734375, 6.3284912109375, 6.5810546875, 6.8336181640625, 7.086181640625, 7.3387451171875, 7.59130859375, 7.8438720703125, 8.096435546875, 8.3489990234375, 8.6015625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 4.0, 0.0, 6.0, 2.0, 6.0, 3.0, 6.0, 25.0, 12.0, 17.0, 22.0, 23.0, 35.0, 59.0, 45.0, 69.0, 92.0, 148.0, 172.0, 287.0, 453.0, 918.0, 2205.0, 7583.0, 40485.0, 569883.0, 382884.0, 32543.0, 6457.0, 1848.0, 827.0, 413.0, 283.0, 214.0, 121.0, 92.0, 75.0, 56.0, 37.0, 25.0, 29.0, 27.0, 21.0, 10.0, 5.0, 6.0, 8.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-13.921875, -13.4569091796875, -12.991943359375, -12.5269775390625, -12.06201171875, -11.5970458984375, -11.132080078125, -10.6671142578125, -10.2021484375, -9.7371826171875, -9.272216796875, -8.8072509765625, -8.34228515625, -7.8773193359375, -7.412353515625, -6.9473876953125, -6.482421875, -6.0174560546875, -5.552490234375, -5.0875244140625, -4.62255859375, -4.1575927734375, -3.692626953125, -3.2276611328125, -2.7626953125, -2.2977294921875, -1.832763671875, -1.3677978515625, -0.90283203125, -0.4378662109375, 0.027099609375, 0.4920654296875, 0.95703125, 1.4219970703125, 1.886962890625, 2.3519287109375, 2.81689453125, 3.2818603515625, 3.746826171875, 4.2117919921875, 4.6767578125, 5.1417236328125, 5.606689453125, 6.0716552734375, 6.53662109375, 7.0015869140625, 7.466552734375, 7.9315185546875, 8.396484375, 8.8614501953125, 9.326416015625, 9.7913818359375, 10.25634765625, 10.7213134765625, 11.186279296875, 11.6512451171875, 12.1162109375, 12.5811767578125, 13.046142578125, 13.5111083984375, 13.97607421875, 14.4410400390625, 14.906005859375, 15.3709716796875, 15.8359375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 4.0, 3.0, 5.0, 11.0, 9.0, 7.0, 11.0, 9.0, 14.0, 14.0, 11.0, 15.0, 20.0, 15.0, 24.0, 25.0, 26.0, 26.0, 44.0, 32.0, 36.0, 56.0, 83.0, 406.0, 1564.0, 87.0, 73.0, 46.0, 43.0, 44.0, 34.0, 34.0, 29.0, 32.0, 25.0, 26.0, 14.0, 12.0, 15.0, 12.0, 10.0, 3.0, 6.0, 7.0, 9.0, 7.0, 7.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-22.953125, -22.21337890625, -21.4736328125, -20.73388671875, -19.994140625, -19.25439453125, -18.5146484375, -17.77490234375, -17.03515625, -16.29541015625, -15.5556640625, -14.81591796875, -14.076171875, -13.33642578125, -12.5966796875, -11.85693359375, -11.1171875, -10.37744140625, -9.6376953125, -8.89794921875, -8.158203125, -7.41845703125, -6.6787109375, -5.93896484375, -5.19921875, -4.45947265625, -3.7197265625, -2.97998046875, -2.240234375, -1.50048828125, -0.7607421875, -0.02099609375, 0.71875, 1.45849609375, 2.1982421875, 2.93798828125, 3.677734375, 4.41748046875, 5.1572265625, 5.89697265625, 6.63671875, 7.37646484375, 8.1162109375, 8.85595703125, 9.595703125, 10.33544921875, 11.0751953125, 11.81494140625, 12.5546875, 13.29443359375, 14.0341796875, 14.77392578125, 15.513671875, 16.25341796875, 16.9931640625, 17.73291015625, 18.47265625, 19.21240234375, 19.9521484375, 20.69189453125, 21.431640625, 22.17138671875, 22.9111328125, 23.65087890625, 24.390625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 6.0, 7.0, 5.0, 9.0, 7.0, 7.0, 9.0, 20.0, 15.0, 20.0, 21.0, 24.0, 24.0, 46.0, 48.0, 60.0, 73.0, 101.0, 176.0, 251.0, 557.0, 2233.0, 2909123.0, 230236.0, 1357.0, 424.0, 242.0, 151.0, 100.0, 71.0, 50.0, 29.0, 30.0, 14.0, 23.0, 18.0, 15.0, 15.0, 12.0, 19.0, 6.0, 9.0, 7.0, 15.0, 7.0, 3.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-72.9375, -70.720703125, -68.50390625, -66.287109375, -64.0703125, -61.853515625, -59.63671875, -57.419921875, -55.203125, -52.986328125, -50.76953125, -48.552734375, -46.3359375, -44.119140625, -41.90234375, -39.685546875, -37.46875, -35.251953125, -33.03515625, -30.818359375, -28.6015625, -26.384765625, -24.16796875, -21.951171875, -19.734375, -17.517578125, -15.30078125, -13.083984375, -10.8671875, -8.650390625, -6.43359375, -4.216796875, -2.0, 0.216796875, 2.43359375, 4.650390625, 6.8671875, 9.083984375, 11.30078125, 13.517578125, 15.734375, 17.951171875, 20.16796875, 22.384765625, 24.6015625, 26.818359375, 29.03515625, 31.251953125, 33.46875, 35.685546875, 37.90234375, 40.119140625, 42.3359375, 44.552734375, 46.76953125, 48.986328125, 51.203125, 53.419921875, 55.63671875, 57.853515625, 60.0703125, 62.287109375, 64.50390625, 66.720703125, 68.9375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 238.0, 708.0, 70.0], "bins": [-266.7608947753906, -262.4787902832031, -258.19671630859375, -253.91461181640625, -249.63250732421875, -245.35040283203125, -241.0683135986328, -236.78622436523438, -232.50411987304688, -228.22201538085938, -223.93992614746094, -219.6578369140625, -215.375732421875, -211.0936279296875, -206.81153869628906, -202.52944946289062, -198.24734497070312, -193.96524047851562, -189.6831512451172, -185.40106201171875, -181.11895751953125, -176.83685302734375, -172.5547637939453, -168.27267456054688, -163.99057006835938, -159.70846557617188, -155.42637634277344, -151.144287109375, -146.8621826171875, -142.580078125, -138.29798889160156, -134.01589965820312, -129.73377990722656, -125.4516830444336, -121.16958618164062, -116.88748931884766, -112.60539245605469, -108.32329559326172, -104.04119873046875, -99.75910186767578, -95.47700500488281, -91.19490814208984, -86.91281127929688, -82.6307144165039, -78.34861755371094, -74.06652069091797, -69.784423828125, -65.50232696533203, -61.22023391723633, -56.93813705444336, -52.65604019165039, -48.37394332885742, -44.09184646606445, -39.809749603271484, -35.527652740478516, -31.245555877685547, -26.963457107543945, -22.681360244750977, -18.399263381958008, -14.117166519165039, -9.83506965637207, -5.552972793579102, -1.2708759307861328, 3.011220932006836, 7.2933173179626465]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 7.0, 4.0, 10.0, 18.0, 10.0, 15.0, 11.0, 23.0, 22.0, 20.0, 20.0, 32.0, 28.0, 45.0, 28.0, 50.0, 47.0, 49.0, 29.0, 40.0, 34.0, 37.0, 46.0, 39.0, 36.0, 31.0, 37.0, 33.0, 24.0, 19.0, 21.0, 20.0, 23.0, 8.0, 16.0, 11.0, 11.0, 7.0, 6.0, 10.0, 2.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-80.03221130371094, -77.61380767822266, -75.19539642333984, -72.77699279785156, -70.35858154296875, -67.94017791748047, -65.52176666259766, -63.103363037109375, -60.68495559692383, -58.26654815673828, -55.848140716552734, -53.42973327636719, -51.011329650878906, -48.592918395996094, -46.17451477050781, -43.756107330322266, -41.33769989013672, -38.91929244995117, -36.500885009765625, -34.08247756958008, -31.664072036743164, -29.245664596557617, -26.827259063720703, -24.408851623535156, -21.99044418334961, -19.572036743164062, -17.153629302978516, -14.735223770141602, -12.316816329956055, -9.898408889770508, -7.480002403259277, -5.061595916748047, -2.6431808471679688, -0.22477388381958008, 2.1936330795288086, 4.612040042877197, 7.030447006225586, 9.448854446411133, 11.867260932922363, 14.285667419433594, 16.70407485961914, 19.122482299804688, 21.540889739990234, 23.95929527282715, 26.377702713012695, 28.796110153198242, 31.214515686035156, 33.6329231262207, 36.05133056640625, 38.4697380065918, 40.888145446777344, 43.30655288696289, 45.72496032714844, 48.14336395263672, 50.561771392822266, 52.98017883300781, 55.39858627319336, 57.816993713378906, 60.23540115356445, 62.65380859375, 65.07221221923828, 67.4906234741211, 69.90902709960938, 72.32743835449219, 74.74584197998047]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 2.0, 9.0, 4.0, 7.0, 10.0, 11.0, 13.0, 16.0, 18.0, 18.0, 16.0, 17.0, 23.0, 28.0, 30.0, 28.0, 36.0, 38.0, 38.0, 41.0, 49.0, 44.0, 52.0, 53.0, 39.0, 35.0, 40.0, 38.0, 21.0, 36.0, 19.0, 32.0, 23.0, 17.0, 16.0, 15.0, 14.0, 16.0, 7.0, 4.0, 10.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0625, -7.7835693359375, -7.504638671875, -7.2257080078125, -6.94677734375, -6.6678466796875, -6.388916015625, -6.1099853515625, -5.8310546875, -5.5521240234375, -5.273193359375, -4.9942626953125, -4.71533203125, -4.4364013671875, -4.157470703125, -3.8785400390625, -3.599609375, -3.3206787109375, -3.041748046875, -2.7628173828125, -2.48388671875, -2.2049560546875, -1.926025390625, -1.6470947265625, -1.3681640625, -1.0892333984375, -0.810302734375, -0.5313720703125, -0.25244140625, 0.0264892578125, 0.305419921875, 0.5843505859375, 0.86328125, 1.1422119140625, 1.421142578125, 1.7000732421875, 1.97900390625, 2.2579345703125, 2.536865234375, 2.8157958984375, 3.0947265625, 3.3736572265625, 3.652587890625, 3.9315185546875, 4.21044921875, 4.4893798828125, 4.768310546875, 5.0472412109375, 5.326171875, 5.6051025390625, 5.884033203125, 6.1629638671875, 6.44189453125, 6.7208251953125, 6.999755859375, 7.2786865234375, 7.5576171875, 7.8365478515625, 8.115478515625, 8.3944091796875, 8.67333984375, 8.9522705078125, 9.231201171875, 9.5101318359375, 9.7890625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 9.0, 5.0, 9.0, 6.0, 16.0, 20.0, 17.0, 24.0, 33.0, 39.0, 62.0, 90.0, 89.0, 194.0, 263.0, 440.0, 747.0, 1409.0, 2518.0, 5546.0, 13621.0, 41992.0, 168976.0, 641277.0, 1450368.0, 1243760.0, 455921.0, 115826.0, 30216.0, 10752.0, 4595.0, 2291.0, 1189.0, 699.0, 408.0, 248.0, 159.0, 113.0, 91.0, 60.0, 42.0, 34.0, 24.0, 19.0, 15.0, 11.0, 10.0, 3.0, 6.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.96875, -9.6558837890625, -9.343017578125, -9.0301513671875, -8.71728515625, -8.4044189453125, -8.091552734375, -7.7786865234375, -7.4658203125, -7.1529541015625, -6.840087890625, -6.5272216796875, -6.21435546875, -5.9014892578125, -5.588623046875, -5.2757568359375, -4.962890625, -4.6500244140625, -4.337158203125, -4.0242919921875, -3.71142578125, -3.3985595703125, -3.085693359375, -2.7728271484375, -2.4599609375, -2.1470947265625, -1.834228515625, -1.5213623046875, -1.20849609375, -0.8956298828125, -0.582763671875, -0.2698974609375, 0.04296875, 0.3558349609375, 0.668701171875, 0.9815673828125, 1.29443359375, 1.6072998046875, 1.920166015625, 2.2330322265625, 2.5458984375, 2.8587646484375, 3.171630859375, 3.4844970703125, 3.79736328125, 4.1102294921875, 4.423095703125, 4.7359619140625, 5.048828125, 5.3616943359375, 5.674560546875, 5.9874267578125, 6.30029296875, 6.6131591796875, 6.926025390625, 7.2388916015625, 7.5517578125, 7.8646240234375, 8.177490234375, 8.4903564453125, 8.80322265625, 9.1160888671875, 9.428955078125, 9.7418212890625, 10.0546875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 4.0, 3.0, 10.0, 9.0, 17.0, 23.0, 32.0, 61.0, 89.0, 128.0, 177.0, 263.0, 391.0, 543.0, 653.0, 524.0, 396.0, 269.0, 153.0, 119.0, 79.0, 58.0, 33.0, 18.0, 12.0, 9.0, 8.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-33.25, -32.519287109375, -31.78857421875, -31.057861328125, -30.3271484375, -29.596435546875, -28.86572265625, -28.135009765625, -27.404296875, -26.673583984375, -25.94287109375, -25.212158203125, -24.4814453125, -23.750732421875, -23.02001953125, -22.289306640625, -21.55859375, -20.827880859375, -20.09716796875, -19.366455078125, -18.6357421875, -17.905029296875, -17.17431640625, -16.443603515625, -15.712890625, -14.982177734375, -14.25146484375, -13.520751953125, -12.7900390625, -12.059326171875, -11.32861328125, -10.597900390625, -9.8671875, -9.136474609375, -8.40576171875, -7.675048828125, -6.9443359375, -6.213623046875, -5.48291015625, -4.752197265625, -4.021484375, -3.290771484375, -2.56005859375, -1.829345703125, -1.0986328125, -0.367919921875, 0.36279296875, 1.093505859375, 1.82421875, 2.554931640625, 3.28564453125, 4.016357421875, 4.7470703125, 5.477783203125, 6.20849609375, 6.939208984375, 7.669921875, 8.400634765625, 9.13134765625, 9.862060546875, 10.5927734375, 11.323486328125, 12.05419921875, 12.784912109375, 13.515625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 11.0, 16.0, 23.0, 46.0, 66.0, 101.0, 157.0, 223.0, 335.0, 570.0, 1504.0, 111574.0, 4073539.0, 4061.0, 773.0, 443.0, 276.0, 192.0, 148.0, 73.0, 62.0, 39.0, 25.0, 11.0, 10.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.6875, -104.1259765625, -100.564453125, -97.0029296875, -93.44140625, -89.8798828125, -86.318359375, -82.7568359375, -79.1953125, -75.6337890625, -72.072265625, -68.5107421875, -64.94921875, -61.3876953125, -57.826171875, -54.2646484375, -50.703125, -47.1416015625, -43.580078125, -40.0185546875, -36.45703125, -32.8955078125, -29.333984375, -25.7724609375, -22.2109375, -18.6494140625, -15.087890625, -11.5263671875, -7.96484375, -4.4033203125, -0.841796875, 2.7197265625, 6.28125, 9.8427734375, 13.404296875, 16.9658203125, 20.52734375, 24.0888671875, 27.650390625, 31.2119140625, 34.7734375, 38.3349609375, 41.896484375, 45.4580078125, 49.01953125, 52.5810546875, 56.142578125, 59.7041015625, 63.265625, 66.8271484375, 70.388671875, 73.9501953125, 77.51171875, 81.0732421875, 84.634765625, 88.1962890625, 91.7578125, 95.3193359375, 98.880859375, 102.4423828125, 106.00390625, 109.5654296875, 113.126953125, 116.6884765625, 120.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 582.0, 435.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1828.9698486328125, -1795.708251953125, -1762.4466552734375, -1729.1851806640625, -1695.923583984375, -1662.6619873046875, -1629.400390625, -1596.138916015625, -1562.8773193359375, -1529.61572265625, -1496.3541259765625, -1463.0926513671875, -1429.8310546875, -1396.5694580078125, -1363.307861328125, -1330.04638671875, -1296.78466796875, -1263.5230712890625, -1230.261474609375, -1197.0, -1163.7384033203125, -1130.476806640625, -1097.2152099609375, -1063.95361328125, -1030.692138671875, -997.4305419921875, -964.1690063476562, -930.9074096679688, -897.6458740234375, -864.38427734375, -831.1226806640625, -797.8611450195312, -764.599609375, -731.3380126953125, -698.0764770507812, -664.8148803710938, -631.5533447265625, -598.291748046875, -565.0301513671875, -531.7686157226562, -498.507080078125, -465.2455139160156, -431.98394775390625, -398.72235107421875, -365.4608154296875, -332.19921875, -298.9376525878906, -265.67608642578125, -232.41452026367188, -199.1529541015625, -165.89138793945312, -132.6298065185547, -99.36824035644531, -66.10667419433594, -32.8450927734375, 0.416473388671875, 33.67803955078125, 66.93960571289062, 100.20117950439453, 133.46275329589844, 166.7243194580078, 199.9858856201172, 233.24746704101562, 266.509033203125, 299.7705993652344]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 10.0, 8.0, 12.0, 17.0, 26.0, 33.0, 39.0, 33.0, 37.0, 45.0, 43.0, 52.0, 65.0, 52.0, 60.0, 68.0, 67.0, 52.0, 48.0, 50.0, 36.0, 42.0, 31.0, 17.0, 12.0, 10.0, 14.0, 11.0, 11.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.33647155761719, -55.7484130859375, -53.16035079956055, -50.57229232788086, -47.984230041503906, -45.39617156982422, -42.80811309814453, -40.22005081176758, -37.631988525390625, -35.04393005371094, -32.455867767333984, -29.867809295654297, -27.279747009277344, -24.691688537597656, -22.103628158569336, -19.515567779541016, -16.927509307861328, -14.339448928833008, -11.751388549804688, -9.163329124450684, -6.575268745422363, -3.987208366394043, -1.399148941040039, 1.1889114379882812, 3.7769718170166016, 6.365032196044922, 8.953092575073242, 11.541152000427246, 14.129212379455566, 16.717273712158203, 19.30533218383789, 21.89339256286621, 24.48145294189453, 27.06951332092285, 29.657573699951172, 32.24563217163086, 34.83369445800781, 37.4217529296875, 40.00981140136719, 42.59787368774414, 45.185935974121094, 47.77399444580078, 50.362056732177734, 52.95011520385742, 55.538177490234375, 58.12623596191406, 60.71429443359375, 63.3023567199707, 65.89041137695312, 68.47846984863281, 71.0665283203125, 73.65459442138672, 76.2426528930664, 78.8307113647461, 81.41876983642578, 84.0068359375, 86.59489440917969, 89.18295288085938, 91.77101135253906, 94.35907745361328, 96.94713592529297, 99.53519439697266, 102.12325286865234, 104.71131896972656, 107.29937744140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 12.0, 15.0, 18.0, 21.0, 22.0, 17.0, 27.0, 32.0, 28.0, 44.0, 44.0, 36.0, 50.0, 43.0, 50.0, 45.0, 50.0, 46.0, 45.0, 40.0, 48.0, 34.0, 26.0, 20.0, 24.0, 18.0, 20.0, 20.0, 14.0, 14.0, 11.0, 4.0, 7.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.55126953125, -8.2666015625, -7.98193359375, -7.697265625, -7.41259765625, -7.1279296875, -6.84326171875, -6.55859375, -6.27392578125, -5.9892578125, -5.70458984375, -5.419921875, -5.13525390625, -4.8505859375, -4.56591796875, -4.28125, -3.99658203125, -3.7119140625, -3.42724609375, -3.142578125, -2.85791015625, -2.5732421875, -2.28857421875, -2.00390625, -1.71923828125, -1.4345703125, -1.14990234375, -0.865234375, -0.58056640625, -0.2958984375, -0.01123046875, 0.2734375, 0.55810546875, 0.8427734375, 1.12744140625, 1.412109375, 1.69677734375, 1.9814453125, 2.26611328125, 2.55078125, 2.83544921875, 3.1201171875, 3.40478515625, 3.689453125, 3.97412109375, 4.2587890625, 4.54345703125, 4.828125, 5.11279296875, 5.3974609375, 5.68212890625, 5.966796875, 6.25146484375, 6.5361328125, 6.82080078125, 7.10546875, 7.39013671875, 7.6748046875, 7.95947265625, 8.244140625, 8.52880859375, 8.8134765625, 9.09814453125, 9.3828125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 3.0, 7.0, 2.0, 14.0, 24.0, 21.0, 36.0, 49.0, 80.0, 109.0, 163.0, 199.0, 354.0, 477.0, 679.0, 938.0, 1443.0, 2059.0, 3033.0, 4424.0, 6366.0, 9271.0, 13525.0, 19563.0, 28001.0, 41595.0, 62630.0, 99367.0, 160021.0, 202115.0, 136025.0, 84958.0, 54647.0, 36148.0, 24741.0, 17215.0, 11899.0, 8301.0, 5606.0, 3869.0, 2712.0, 1882.0, 1213.0, 864.0, 590.0, 420.0, 278.0, 199.0, 140.0, 79.0, 63.0, 57.0, 31.0, 22.0, 12.0, 12.0, 8.0, 5.0, 2.0, 1.0, 2.0], "bins": [-1.0927734375, -1.0589752197265625, -1.025177001953125, -0.9913787841796875, -0.95758056640625, -0.9237823486328125, -0.889984130859375, -0.8561859130859375, -0.8223876953125, -0.7885894775390625, -0.754791259765625, -0.7209930419921875, -0.68719482421875, -0.6533966064453125, -0.619598388671875, -0.5858001708984375, -0.552001953125, -0.5182037353515625, -0.484405517578125, -0.4506072998046875, -0.41680908203125, -0.3830108642578125, -0.349212646484375, -0.3154144287109375, -0.2816162109375, -0.2478179931640625, -0.214019775390625, -0.1802215576171875, -0.14642333984375, -0.1126251220703125, -0.078826904296875, -0.0450286865234375, -0.01123046875, 0.0225677490234375, 0.056365966796875, 0.0901641845703125, 0.12396240234375, 0.1577606201171875, 0.191558837890625, 0.2253570556640625, 0.2591552734375, 0.2929534912109375, 0.326751708984375, 0.3605499267578125, 0.39434814453125, 0.4281463623046875, 0.461944580078125, 0.4957427978515625, 0.529541015625, 0.5633392333984375, 0.597137451171875, 0.6309356689453125, 0.66473388671875, 0.6985321044921875, 0.732330322265625, 0.7661285400390625, 0.7999267578125, 0.8337249755859375, 0.867523193359375, 0.9013214111328125, 0.93511962890625, 0.9689178466796875, 1.002716064453125, 1.0365142822265625, 1.0703125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 5.0, 5.0, 6.0, 8.0, 6.0, 20.0, 10.0, 15.0, 14.0, 18.0, 14.0, 23.0, 18.0, 28.0, 28.0, 26.0, 33.0, 24.0, 26.0, 30.0, 43.0, 44.0, 36.0, 1060.0, 43.0, 35.0, 33.0, 30.0, 32.0, 20.0, 27.0, 29.0, 32.0, 23.0, 29.0, 21.0, 18.0, 14.0, 16.0, 11.0, 11.0, 12.0, 9.0, 4.0, 7.0, 5.0, 6.0, 4.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-4.578125, -4.4312744140625, -4.284423828125, -4.1375732421875, -3.99072265625, -3.8438720703125, -3.697021484375, -3.5501708984375, -3.4033203125, -3.2564697265625, -3.109619140625, -2.9627685546875, -2.81591796875, -2.6690673828125, -2.522216796875, -2.3753662109375, -2.228515625, -2.0816650390625, -1.934814453125, -1.7879638671875, -1.64111328125, -1.4942626953125, -1.347412109375, -1.2005615234375, -1.0537109375, -0.9068603515625, -0.760009765625, -0.6131591796875, -0.46630859375, -0.3194580078125, -0.172607421875, -0.0257568359375, 0.12109375, 0.2679443359375, 0.414794921875, 0.5616455078125, 0.70849609375, 0.8553466796875, 1.002197265625, 1.1490478515625, 1.2958984375, 1.4427490234375, 1.589599609375, 1.7364501953125, 1.88330078125, 2.0301513671875, 2.177001953125, 2.3238525390625, 2.470703125, 2.6175537109375, 2.764404296875, 2.9112548828125, 3.05810546875, 3.2049560546875, 3.351806640625, 3.4986572265625, 3.6455078125, 3.7923583984375, 3.939208984375, 4.0860595703125, 4.23291015625, 4.3797607421875, 4.526611328125, 4.6734619140625, 4.8203125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 10.0, 10.0, 10.0, 25.0, 50.0, 57.0, 66.0, 120.0, 197.0, 291.0, 432.0, 701.0, 1091.0, 1595.0, 2353.0, 3533.0, 5483.0, 8487.0, 12847.0, 20010.0, 31411.0, 48849.0, 77319.0, 120659.0, 486522.0, 937513.0, 121485.0, 77358.0, 49474.0, 31526.0, 20028.0, 12889.0, 8466.0, 5580.0, 3707.0, 2379.0, 1619.0, 973.0, 686.0, 455.0, 309.0, 204.0, 133.0, 84.0, 42.0, 41.0, 16.0, 8.0, 9.0, 15.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.138671875, -1.1041717529296875, -1.069671630859375, -1.0351715087890625, -1.00067138671875, -0.9661712646484375, -0.931671142578125, -0.8971710205078125, -0.8626708984375, -0.8281707763671875, -0.793670654296875, -0.7591705322265625, -0.72467041015625, -0.6901702880859375, -0.655670166015625, -0.6211700439453125, -0.586669921875, -0.5521697998046875, -0.517669677734375, -0.4831695556640625, -0.44866943359375, -0.4141693115234375, -0.379669189453125, -0.3451690673828125, -0.3106689453125, -0.2761688232421875, -0.241668701171875, -0.2071685791015625, -0.17266845703125, -0.1381683349609375, -0.103668212890625, -0.0691680908203125, -0.03466796875, -0.0001678466796875, 0.034332275390625, 0.0688323974609375, 0.10333251953125, 0.1378326416015625, 0.172332763671875, 0.2068328857421875, 0.2413330078125, 0.2758331298828125, 0.310333251953125, 0.3448333740234375, 0.37933349609375, 0.4138336181640625, 0.448333740234375, 0.4828338623046875, 0.517333984375, 0.5518341064453125, 0.586334228515625, 0.6208343505859375, 0.65533447265625, 0.6898345947265625, 0.724334716796875, 0.7588348388671875, 0.7933349609375, 0.8278350830078125, 0.862335205078125, 0.8968353271484375, 0.93133544921875, 0.9658355712890625, 1.000335693359375, 1.0348358154296875, 1.0693359375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 6.0, 10.0, 11.0, 13.0, 17.0, 17.0, 26.0, 32.0, 35.0, 30.0, 42.0, 40.0, 50.0, 52.0, 54.0, 52.0, 58.0, 58.0, 53.0, 56.0, 50.0, 41.0, 37.0, 32.0, 16.0, 25.0, 19.0, 14.0, 11.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0018224716186523438, -0.0017687678337097168, -0.0017150640487670898, -0.0016613602638244629, -0.001607656478881836, -0.001553952693939209, -0.001500248908996582, -0.001446545124053955, -0.0013928413391113281, -0.0013391375541687012, -0.0012854337692260742, -0.0012317299842834473, -0.0011780261993408203, -0.0011243224143981934, -0.0010706186294555664, -0.0010169148445129395, -0.0009632110595703125, -0.0009095072746276855, -0.0008558034896850586, -0.0008020997047424316, -0.0007483959197998047, -0.0006946921348571777, -0.0006409883499145508, -0.0005872845649719238, -0.0005335807800292969, -0.0004798769950866699, -0.00042617321014404297, -0.000372469425201416, -0.00031876564025878906, -0.0002650618553161621, -0.00021135807037353516, -0.0001576542854309082, -0.00010395050048828125, -5.02467155456543e-05, 3.4570693969726562e-06, 5.716085433959961e-05, 0.00011086463928222656, 0.00016456842422485352, 0.00021827220916748047, 0.0002719759941101074, 0.0003256797790527344, 0.00037938356399536133, 0.0004330873489379883, 0.00048679113388061523, 0.0005404949188232422, 0.0005941987037658691, 0.0006479024887084961, 0.000701606273651123, 0.00075531005859375, 0.000809013843536377, 0.0008627176284790039, 0.0009164214134216309, 0.0009701251983642578, 0.0010238289833068848, 0.0010775327682495117, 0.0011312365531921387, 0.0011849403381347656, 0.0012386441230773926, 0.0012923479080200195, 0.0013460516929626465, 0.0013997554779052734, 0.0014534592628479004, 0.0015071630477905273, 0.0015608668327331543, 0.0016145706176757812]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 10.0, 20.0, 25.0, 22.0, 27.0, 36.0, 67.0, 69.0, 96.0, 142.0, 224.0, 524.0, 2062.0, 1000731.0, 42458.0, 976.0, 369.0, 181.0, 102.0, 80.0, 80.0, 57.0, 45.0, 28.0, 27.0, 15.0, 9.0, 14.0, 9.0, 12.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.040313720703125, -0.03900289535522461, -0.03769207000732422, -0.03638124465942383, -0.03507041931152344, -0.03375959396362305, -0.032448768615722656, -0.031137943267822266, -0.029827117919921875, -0.028516292572021484, -0.027205467224121094, -0.025894641876220703, -0.024583816528320312, -0.023272991180419922, -0.02196216583251953, -0.02065134048461914, -0.01934051513671875, -0.01802968978881836, -0.01671886444091797, -0.015408039093017578, -0.014097213745117188, -0.012786388397216797, -0.011475563049316406, -0.010164737701416016, -0.008853912353515625, -0.007543087005615234, -0.006232261657714844, -0.004921436309814453, -0.0036106109619140625, -0.002299785614013672, -0.0009889602661132812, 0.0003218650817871094, 0.0016326904296875, 0.0029435157775878906, 0.004254341125488281, 0.005565166473388672, 0.0068759918212890625, 0.008186817169189453, 0.009497642517089844, 0.010808467864990234, 0.012119293212890625, 0.013430118560791016, 0.014740943908691406, 0.016051769256591797, 0.017362594604492188, 0.018673419952392578, 0.01998424530029297, 0.02129507064819336, 0.02260589599609375, 0.02391672134399414, 0.02522754669189453, 0.026538372039794922, 0.027849197387695312, 0.029160022735595703, 0.030470848083496094, 0.031781673431396484, 0.033092498779296875, 0.034403324127197266, 0.035714149475097656, 0.03702497482299805, 0.03833580017089844, 0.03964662551879883, 0.04095745086669922, 0.04226827621459961, 0.0435791015625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 19.0, 61.0, 151.0, 269.0, 270.0, 159.0, 59.0, 17.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0031445971690118313, -0.0030660019256174564, -0.0029874066822230816, -0.002908811205998063, -0.0028302159626036882, -0.0027516207192093134, -0.0026730254758149385, -0.00259442999958992, -0.002515834756195545, -0.0024372395128011703, -0.0023586442694067955, -0.002280048793181777, -0.002201453549787402, -0.0021228583063930273, -0.0020442630629986525, -0.001965667586773634, -0.001887072459794581, -0.001808477216400206, -0.0017298818565905094, -0.0016512866131961346, -0.001572691253386438, -0.001494096009992063, -0.0014155006501823664, -0.0013369054067879915, -0.0012583101633936167, -0.0011797149199992418, -0.0011011195601895452, -0.0010225243167951703, -0.0009439289569854736, -0.0008653337135910988, -0.000786738411989063, -0.0007081431103870273, -0.0006295477505773306, -0.0005509524489752948, -0.00047235714737325907, -0.00039376187487505376, -0.000315166573273018, -0.00023657127167098224, -0.00015797599917277694, -7.938069757074118e-05, -7.853959687054157e-07, 7.780989835737273e-05, 0.00015640519268345088, 0.0002350004797335714, 0.00031359578133560717, 0.00039219108293764293, 0.00047078635543584824, 0.000549381657037884, 0.0006279769586399198, 0.0007065722602419555, 0.0007851675618439913, 0.0008637628052383661, 0.0009423581650480628, 0.0010209534084424376, 0.0010995487682521343, 0.0011781440116465092, 0.001256739255040884, 0.0013353344984352589, 0.0014139298582449555, 0.0014925251016393304, 0.001571120461449027, 0.001649715704843402, 0.0017283109482377768, 0.0018069063080474734, 0.00188550166785717]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 10.0, 13.0, 14.0, 14.0, 15.0, 16.0, 30.0, 27.0, 24.0, 30.0, 36.0, 27.0, 24.0, 51.0, 49.0, 52.0, 52.0, 51.0, 37.0, 38.0, 44.0, 48.0, 34.0, 35.0, 34.0, 28.0, 26.0, 20.0, 14.0, 22.0, 16.0, 14.0, 6.0, 8.0, 6.0, 9.0, 5.0, 5.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009677410125732422, -0.000937717966735363, -0.0009076949208974838, -0.0008776718750596046, -0.0008476488292217255, -0.0008176257833838463, -0.0007876027375459671, -0.0007575796917080879, -0.0007275566458702087, -0.0006975336000323296, -0.0006675105541944504, -0.0006374875083565712, -0.000607464462518692, -0.0005774414166808128, -0.0005474183708429337, -0.0005173953250050545, -0.0004873722791671753, -0.0004573492333292961, -0.00042732618749141693, -0.00039730314165353775, -0.00036728009581565857, -0.0003372570499777794, -0.0003072340041399002, -0.000277210958302021, -0.00024718791246414185, -0.00021716486662626266, -0.00018714182078838348, -0.0001571187749505043, -0.00012709572911262512, -9.707268327474594e-05, -6.704963743686676e-05, -3.702659159898758e-05, -7.0035457611083984e-06, 2.3019500076770782e-05, 5.304254591464996e-05, 8.306559175252914e-05, 0.00011308863759040833, 0.0001431116834282875, 0.0001731347292661667, 0.00020315777510404587, 0.00023318082094192505, 0.00026320386677980423, 0.0002932269126176834, 0.0003232499584555626, 0.00035327300429344177, 0.00038329605013132095, 0.00041331909596920013, 0.0004433421418070793, 0.0004733651876449585, 0.0005033882334828377, 0.0005334112793207169, 0.000563434325158596, 0.0005934573709964752, 0.0006234804168343544, 0.0006535034626722336, 0.0006835265085101128, 0.0007135495543479919, 0.0007435726001858711, 0.0007735956460237503, 0.0008036186918616295, 0.0008336417376995087, 0.0008636647835373878, 0.000893687829375267, 0.0009237108752131462, 0.0009537339210510254]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 3.0, 4.0, 5.0, 6.0, 5.0, 11.0, 12.0, 15.0, 18.0, 21.0, 22.0, 17.0, 27.0, 32.0, 28.0, 44.0, 44.0, 36.0, 50.0, 43.0, 50.0, 45.0, 50.0, 46.0, 45.0, 40.0, 48.0, 34.0, 26.0, 20.0, 24.0, 18.0, 20.0, 20.0, 14.0, 14.0, 11.0, 4.0, 7.0, 3.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8359375, -8.55126953125, -8.2666015625, -7.98193359375, -7.697265625, -7.41259765625, -7.1279296875, -6.84326171875, -6.55859375, -6.27392578125, -5.9892578125, -5.70458984375, -5.419921875, -5.13525390625, -4.8505859375, -4.56591796875, -4.28125, -3.99658203125, -3.7119140625, -3.42724609375, -3.142578125, -2.85791015625, -2.5732421875, -2.28857421875, -2.00390625, -1.71923828125, -1.4345703125, -1.14990234375, -0.865234375, -0.58056640625, -0.2958984375, -0.01123046875, 0.2734375, 0.55810546875, 0.8427734375, 1.12744140625, 1.412109375, 1.69677734375, 1.9814453125, 2.26611328125, 2.55078125, 2.83544921875, 3.1201171875, 3.40478515625, 3.689453125, 3.97412109375, 4.2587890625, 4.54345703125, 4.828125, 5.11279296875, 5.3974609375, 5.68212890625, 5.966796875, 6.25146484375, 6.5361328125, 6.82080078125, 7.10546875, 7.39013671875, 7.6748046875, 7.95947265625, 8.244140625, 8.52880859375, 8.8134765625, 9.09814453125, 9.3828125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 11.0, 23.0, 17.0, 32.0, 36.0, 48.0, 84.0, 108.0, 170.0, 395.0, 743.0, 1650.0, 3526.0, 8626.0, 21335.0, 54551.0, 156613.0, 439405.0, 234982.0, 76305.0, 29234.0, 11636.0, 4835.0, 2097.0, 940.0, 434.0, 246.0, 138.0, 90.0, 61.0, 41.0, 30.0, 23.0, 15.0, 11.0, 11.0, 5.0, 6.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8359375, -7.5885009765625, -7.341064453125, -7.0936279296875, -6.84619140625, -6.5987548828125, -6.351318359375, -6.1038818359375, -5.8564453125, -5.6090087890625, -5.361572265625, -5.1141357421875, -4.86669921875, -4.6192626953125, -4.371826171875, -4.1243896484375, -3.876953125, -3.6295166015625, -3.382080078125, -3.1346435546875, -2.88720703125, -2.6397705078125, -2.392333984375, -2.1448974609375, -1.8974609375, -1.6500244140625, -1.402587890625, -1.1551513671875, -0.90771484375, -0.6602783203125, -0.412841796875, -0.1654052734375, 0.08203125, 0.3294677734375, 0.576904296875, 0.8243408203125, 1.07177734375, 1.3192138671875, 1.566650390625, 1.8140869140625, 2.0615234375, 2.3089599609375, 2.556396484375, 2.8038330078125, 3.05126953125, 3.2987060546875, 3.546142578125, 3.7935791015625, 4.041015625, 4.2884521484375, 4.535888671875, 4.7833251953125, 5.03076171875, 5.2781982421875, 5.525634765625, 5.7730712890625, 6.0205078125, 6.2679443359375, 6.515380859375, 6.7628173828125, 7.01025390625, 7.2576904296875, 7.505126953125, 7.7525634765625, 8.0]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 2.0, 5.0, 4.0, 5.0, 9.0, 12.0, 14.0, 12.0, 14.0, 18.0, 18.0, 26.0, 25.0, 25.0, 41.0, 39.0, 36.0, 55.0, 48.0, 76.0, 199.0, 1563.0, 279.0, 77.0, 55.0, 40.0, 46.0, 42.0, 40.0, 32.0, 28.0, 31.0, 19.0, 23.0, 16.0, 14.0, 17.0, 9.0, 4.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-26.421875, -25.5859375, -24.75, -23.9140625, -23.078125, -22.2421875, -21.40625, -20.5703125, -19.734375, -18.8984375, -18.0625, -17.2265625, -16.390625, -15.5546875, -14.71875, -13.8828125, -13.046875, -12.2109375, -11.375, -10.5390625, -9.703125, -8.8671875, -8.03125, -7.1953125, -6.359375, -5.5234375, -4.6875, -3.8515625, -3.015625, -2.1796875, -1.34375, -0.5078125, 0.328125, 1.1640625, 2.0, 2.8359375, 3.671875, 4.5078125, 5.34375, 6.1796875, 7.015625, 7.8515625, 8.6875, 9.5234375, 10.359375, 11.1953125, 12.03125, 12.8671875, 13.703125, 14.5390625, 15.375, 16.2109375, 17.046875, 17.8828125, 18.71875, 19.5546875, 20.390625, 21.2265625, 22.0625, 22.8984375, 23.734375, 24.5703125, 25.40625, 26.2421875, 27.078125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 5.0, 1.0, 4.0, 3.0, 8.0, 7.0, 13.0, 13.0, 16.0, 32.0, 28.0, 28.0, 45.0, 62.0, 95.0, 115.0, 161.0, 187.0, 337.0, 609.0, 2074.0, 98432.0, 3023566.0, 17195.0, 1212.0, 479.0, 284.0, 213.0, 120.0, 77.0, 71.0, 36.0, 47.0, 33.0, 31.0, 18.0, 20.0, 7.0, 3.0, 3.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-54.4375, -52.8515625, -51.265625, -49.6796875, -48.09375, -46.5078125, -44.921875, -43.3359375, -41.75, -40.1640625, -38.578125, -36.9921875, -35.40625, -33.8203125, -32.234375, -30.6484375, -29.0625, -27.4765625, -25.890625, -24.3046875, -22.71875, -21.1328125, -19.546875, -17.9609375, -16.375, -14.7890625, -13.203125, -11.6171875, -10.03125, -8.4453125, -6.859375, -5.2734375, -3.6875, -2.1015625, -0.515625, 1.0703125, 2.65625, 4.2421875, 5.828125, 7.4140625, 9.0, 10.5859375, 12.171875, 13.7578125, 15.34375, 16.9296875, 18.515625, 20.1015625, 21.6875, 23.2734375, 24.859375, 26.4453125, 28.03125, 29.6171875, 31.203125, 32.7890625, 34.375, 35.9609375, 37.546875, 39.1328125, 40.71875, 42.3046875, 43.890625, 45.4765625, 47.0625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 141.0, 845.0, 28.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-445.35626220703125, -437.0059814453125, -428.6556701660156, -420.3053894042969, -411.9551086425781, -403.60479736328125, -395.2545166015625, -386.90423583984375, -378.5539245605469, -370.2036437988281, -361.85333251953125, -353.5030517578125, -345.15277099609375, -336.8024597167969, -328.4521789550781, -320.1018981933594, -311.7515869140625, -303.40130615234375, -295.0509948730469, -286.7007141113281, -278.3504333496094, -270.0001220703125, -261.64984130859375, -253.29954528808594, -244.94927978515625, -236.59898376464844, -228.2487030029297, -219.89840698242188, -211.54811096191406, -203.19781494140625, -194.8475341796875, -186.4972381591797, -178.14697265625, -169.7966766357422, -161.44639587402344, -153.09609985351562, -144.7458038330078, -136.3955078125, -128.04522705078125, -119.69493103027344, -111.34463500976562, -102.99434661865234, -94.64405059814453, -86.29376220703125, -77.94346618652344, -69.59317779541016, -61.242889404296875, -52.89259719848633, -44.54230499267578, -36.192012786865234, -27.84172248840332, -19.491432189941406, -11.14113998413086, -2.7908477783203125, 5.559440612792969, 13.909732818603516, 22.260025024414062, 30.61031723022461, 38.960609436035156, 47.31089782714844, 55.661190032958984, 64.01148223876953, 72.36177062988281, 80.71206665039062, 89.0623550415039]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 6.0, 9.0, 8.0, 14.0, 4.0, 16.0, 10.0, 26.0, 22.0, 27.0, 24.0, 23.0, 25.0, 38.0, 41.0, 31.0, 33.0, 38.0, 49.0, 43.0, 41.0, 45.0, 34.0, 34.0, 33.0, 34.0, 38.0, 26.0, 18.0, 33.0, 20.0, 25.0, 21.0, 14.0, 17.0, 9.0, 16.0, 11.0, 9.0, 9.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-63.102821350097656, -61.157371520996094, -59.211917877197266, -57.2664680480957, -55.321014404296875, -53.37556457519531, -51.430110931396484, -49.48466110229492, -47.539207458496094, -45.59375762939453, -43.6483039855957, -41.70285415649414, -39.75740051269531, -37.81195068359375, -35.86649703979492, -33.92104721069336, -31.975595474243164, -30.03014373779297, -28.084692001342773, -26.139240264892578, -24.193788528442383, -22.248336791992188, -20.302886962890625, -18.357433319091797, -16.411983489990234, -14.466531753540039, -12.521080017089844, -10.575628280639648, -8.630176544189453, -6.684725761413574, -4.739274024963379, -2.7938222885131836, -0.8483695983886719, 1.0970820188522339, 3.0425336360931396, 4.987985134124756, 6.933436870574951, 8.878888130187988, 10.824339866638184, 12.769791603088379, 14.715243339538574, 16.660694122314453, 18.60614585876465, 20.551597595214844, 22.49704933166504, 24.442501068115234, 26.38795280456543, 28.333404541015625, 30.27885627746582, 32.224308013916016, 34.16975784301758, 36.115211486816406, 38.06066131591797, 40.0061149597168, 41.95156478881836, 43.89701843261719, 45.84246826171875, 47.78791809082031, 49.73337173461914, 51.6788215637207, 53.62427520751953, 55.569725036621094, 57.51517868041992, 59.460628509521484, 61.40608215332031]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 6.0, 5.0, 7.0, 15.0, 18.0, 15.0, 19.0, 21.0, 31.0, 36.0, 34.0, 30.0, 36.0, 50.0, 51.0, 43.0, 64.0, 37.0, 52.0, 66.0, 41.0, 44.0, 46.0, 28.0, 33.0, 22.0, 22.0, 19.0, 25.0, 19.0, 13.0, 11.0, 4.0, 9.0, 5.0, 2.0, 7.0, 3.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8984375, -9.5826416015625, -9.266845703125, -8.9510498046875, -8.63525390625, -8.3194580078125, -8.003662109375, -7.6878662109375, -7.3720703125, -7.0562744140625, -6.740478515625, -6.4246826171875, -6.10888671875, -5.7930908203125, -5.477294921875, -5.1614990234375, -4.845703125, -4.5299072265625, -4.214111328125, -3.8983154296875, -3.58251953125, -3.2667236328125, -2.950927734375, -2.6351318359375, -2.3193359375, -2.0035400390625, -1.687744140625, -1.3719482421875, -1.05615234375, -0.7403564453125, -0.424560546875, -0.1087646484375, 0.20703125, 0.5228271484375, 0.838623046875, 1.1544189453125, 1.47021484375, 1.7860107421875, 2.101806640625, 2.4176025390625, 2.7333984375, 3.0491943359375, 3.364990234375, 3.6807861328125, 3.99658203125, 4.3123779296875, 4.628173828125, 4.9439697265625, 5.259765625, 5.5755615234375, 5.891357421875, 6.2071533203125, 6.52294921875, 6.8387451171875, 7.154541015625, 7.4703369140625, 7.7861328125, 8.1019287109375, 8.417724609375, 8.7335205078125, 9.04931640625, 9.3651123046875, 9.680908203125, 9.9967041015625, 10.3125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 3.0, 12.0, 4.0, 13.0, 13.0, 16.0, 21.0, 27.0, 22.0, 32.0, 44.0, 56.0, 79.0, 105.0, 201.0, 515.0, 1993.0, 14759.0, 415658.0, 3486065.0, 260233.0, 11623.0, 1709.0, 476.0, 171.0, 89.0, 70.0, 47.0, 43.0, 39.0, 32.0, 22.0, 16.0, 15.0, 13.0, 11.0, 8.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.203125, -28.2744140625, -27.345703125, -26.4169921875, -25.48828125, -24.5595703125, -23.630859375, -22.7021484375, -21.7734375, -20.8447265625, -19.916015625, -18.9873046875, -18.05859375, -17.1298828125, -16.201171875, -15.2724609375, -14.34375, -13.4150390625, -12.486328125, -11.5576171875, -10.62890625, -9.7001953125, -8.771484375, -7.8427734375, -6.9140625, -5.9853515625, -5.056640625, -4.1279296875, -3.19921875, -2.2705078125, -1.341796875, -0.4130859375, 0.515625, 1.4443359375, 2.373046875, 3.3017578125, 4.23046875, 5.1591796875, 6.087890625, 7.0166015625, 7.9453125, 8.8740234375, 9.802734375, 10.7314453125, 11.66015625, 12.5888671875, 13.517578125, 14.4462890625, 15.375, 16.3037109375, 17.232421875, 18.1611328125, 19.08984375, 20.0185546875, 20.947265625, 21.8759765625, 22.8046875, 23.7333984375, 24.662109375, 25.5908203125, 26.51953125, 27.4482421875, 28.376953125, 29.3056640625, 30.234375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 3.0, 4.0, 4.0, 8.0, 13.0, 8.0, 16.0, 21.0, 22.0, 30.0, 33.0, 39.0, 72.0, 80.0, 101.0, 131.0, 145.0, 210.0, 290.0, 323.0, 365.0, 402.0, 394.0, 299.0, 236.0, 169.0, 156.0, 97.0, 86.0, 60.0, 53.0, 44.0, 40.0, 24.0, 22.0, 23.0, 4.0, 15.0, 13.0, 4.0, 7.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.613037109375, -12.21044921875, -11.807861328125, -11.4052734375, -11.002685546875, -10.60009765625, -10.197509765625, -9.794921875, -9.392333984375, -8.98974609375, -8.587158203125, -8.1845703125, -7.781982421875, -7.37939453125, -6.976806640625, -6.57421875, -6.171630859375, -5.76904296875, -5.366455078125, -4.9638671875, -4.561279296875, -4.15869140625, -3.756103515625, -3.353515625, -2.950927734375, -2.54833984375, -2.145751953125, -1.7431640625, -1.340576171875, -0.93798828125, -0.535400390625, -0.1328125, 0.269775390625, 0.67236328125, 1.074951171875, 1.4775390625, 1.880126953125, 2.28271484375, 2.685302734375, 3.087890625, 3.490478515625, 3.89306640625, 4.295654296875, 4.6982421875, 5.100830078125, 5.50341796875, 5.906005859375, 6.30859375, 6.711181640625, 7.11376953125, 7.516357421875, 7.9189453125, 8.321533203125, 8.72412109375, 9.126708984375, 9.529296875, 9.931884765625, 10.33447265625, 10.737060546875, 11.1396484375, 11.542236328125, 11.94482421875, 12.347412109375, 12.75]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 4.0, 7.0, 11.0, 13.0, 18.0, 30.0, 28.0, 62.0, 82.0, 110.0, 122.0, 209.0, 308.0, 498.0, 1761.0, 679453.0, 3506693.0, 3191.0, 585.0, 330.0, 212.0, 149.0, 129.0, 73.0, 59.0, 54.0, 32.0, 16.0, 14.0, 13.0, 6.0, 8.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-114.4375, -111.2666015625, -108.095703125, -104.9248046875, -101.75390625, -98.5830078125, -95.412109375, -92.2412109375, -89.0703125, -85.8994140625, -82.728515625, -79.5576171875, -76.38671875, -73.2158203125, -70.044921875, -66.8740234375, -63.703125, -60.5322265625, -57.361328125, -54.1904296875, -51.01953125, -47.8486328125, -44.677734375, -41.5068359375, -38.3359375, -35.1650390625, -31.994140625, -28.8232421875, -25.65234375, -22.4814453125, -19.310546875, -16.1396484375, -12.96875, -9.7978515625, -6.626953125, -3.4560546875, -0.28515625, 2.8857421875, 6.056640625, 9.2275390625, 12.3984375, 15.5693359375, 18.740234375, 21.9111328125, 25.08203125, 28.2529296875, 31.423828125, 34.5947265625, 37.765625, 40.9365234375, 44.107421875, 47.2783203125, 50.44921875, 53.6201171875, 56.791015625, 59.9619140625, 63.1328125, 66.3037109375, 69.474609375, 72.6455078125, 75.81640625, 78.9873046875, 82.158203125, 85.3291015625, 88.5]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 59.0, 459.0, 438.0, 55.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-451.9886169433594, -442.93896484375, -433.8892822265625, -424.8396301269531, -415.78997802734375, -406.74029541015625, -397.6906433105469, -388.6409912109375, -379.59130859375, -370.5416564941406, -361.4919738769531, -352.44232177734375, -343.3926696777344, -334.343017578125, -325.2933349609375, -316.2436828613281, -307.19403076171875, -298.1443786621094, -289.0946960449219, -280.0450439453125, -270.9953918457031, -261.94573974609375, -252.89605712890625, -243.84640502929688, -234.79673767089844, -225.7470703125, -216.69741821289062, -207.6477508544922, -198.59808349609375, -189.54843139648438, -180.49876403808594, -171.4490966796875, -162.39944458007812, -153.3497772216797, -144.3001251220703, -135.25045776367188, -126.20079803466797, -117.15113830566406, -108.10147094726562, -99.05181121826172, -90.00215148925781, -80.9524917602539, -71.90283203125, -62.85316467285156, -53.803504943847656, -44.75384521484375, -35.70418167114258, -26.654518127441406, -17.6048583984375, -8.555196762084961, 0.4944648742675781, 9.544126510620117, 18.593788146972656, 27.643447875976562, 36.693111419677734, 45.742774963378906, 54.79243469238281, 63.84209442138672, 72.89175415039062, 81.94142150878906, 90.99108123779297, 100.04074096679688, 109.09040832519531, 118.14006805419922, 127.18972778320312]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 6.0, 3.0, 4.0, 10.0, 9.0, 12.0, 12.0, 12.0, 14.0, 10.0, 23.0, 20.0, 31.0, 38.0, 33.0, 32.0, 35.0, 28.0, 40.0, 34.0, 35.0, 44.0, 32.0, 36.0, 50.0, 38.0, 31.0, 40.0, 45.0, 30.0, 33.0, 22.0, 28.0, 27.0, 20.0, 13.0, 19.0, 15.0, 12.0, 6.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.2247314453125, -50.460514068603516, -48.69629669189453, -46.93207931518555, -45.16786193847656, -43.40364456176758, -41.639427185058594, -39.87520980834961, -38.110992431640625, -36.34677505493164, -34.582557678222656, -32.81834030151367, -31.054122924804688, -29.289905548095703, -27.52568817138672, -25.761470794677734, -23.99725341796875, -22.233036041259766, -20.46881866455078, -18.704601287841797, -16.940383911132812, -15.176166534423828, -13.411949157714844, -11.64773178100586, -9.883514404296875, -8.11929702758789, -6.355079650878906, -4.590862274169922, -2.8266448974609375, -1.0624275207519531, 0.7017898559570312, 2.4660072326660156, 4.230224609375, 5.994441986083984, 7.758659362792969, 9.522876739501953, 11.287094116210938, 13.051311492919922, 14.815528869628906, 16.57974624633789, 18.343963623046875, 20.10818099975586, 21.872398376464844, 23.636615753173828, 25.400833129882812, 27.165050506591797, 28.92926788330078, 30.693485260009766, 32.45770263671875, 34.221920013427734, 35.98613739013672, 37.7503547668457, 39.51457214355469, 41.27878952026367, 43.043006896972656, 44.80722427368164, 46.571441650390625, 48.33565902709961, 50.099876403808594, 51.86409378051758, 53.62831115722656, 55.39252853393555, 57.15674591064453, 58.920963287353516, 60.6851806640625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 8.0, 10.0, 11.0, 11.0, 15.0, 13.0, 27.0, 17.0, 25.0, 24.0, 34.0, 28.0, 34.0, 38.0, 38.0, 52.0, 44.0, 48.0, 51.0, 35.0, 35.0, 43.0, 32.0, 39.0, 41.0, 28.0, 34.0, 24.0, 24.0, 22.0, 13.0, 15.0, 18.0, 10.0, 5.0, 7.0, 4.0, 6.0, 8.0, 2.0, 3.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.680419921875, -8.39208984375, -8.103759765625, -7.8154296875, -7.527099609375, -7.23876953125, -6.950439453125, -6.662109375, -6.373779296875, -6.08544921875, -5.797119140625, -5.5087890625, -5.220458984375, -4.93212890625, -4.643798828125, -4.35546875, -4.067138671875, -3.77880859375, -3.490478515625, -3.2021484375, -2.913818359375, -2.62548828125, -2.337158203125, -2.048828125, -1.760498046875, -1.47216796875, -1.183837890625, -0.8955078125, -0.607177734375, -0.31884765625, -0.030517578125, 0.2578125, 0.546142578125, 0.83447265625, 1.122802734375, 1.4111328125, 1.699462890625, 1.98779296875, 2.276123046875, 2.564453125, 2.852783203125, 3.14111328125, 3.429443359375, 3.7177734375, 4.006103515625, 4.29443359375, 4.582763671875, 4.87109375, 5.159423828125, 5.44775390625, 5.736083984375, 6.0244140625, 6.312744140625, 6.60107421875, 6.889404296875, 7.177734375, 7.466064453125, 7.75439453125, 8.042724609375, 8.3310546875, 8.619384765625, 8.90771484375, 9.196044921875, 9.484375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 4.0, 10.0, 7.0, 12.0, 28.0, 51.0, 70.0, 95.0, 128.0, 176.0, 270.0, 406.0, 580.0, 811.0, 1172.0, 1700.0, 2486.0, 3588.0, 5080.0, 7388.0, 10870.0, 15664.0, 22916.0, 33509.0, 50646.0, 77827.0, 122904.0, 185820.0, 173623.0, 112405.0, 71793.0, 46814.0, 31608.0, 21249.0, 14335.0, 10050.0, 6839.0, 4801.0, 3344.0, 2232.0, 1660.0, 1135.0, 775.0, 534.0, 350.0, 249.0, 178.0, 110.0, 86.0, 64.0, 35.0, 32.0, 21.0, 9.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.1494140625, -1.1133880615234375, -1.077362060546875, -1.0413360595703125, -1.00531005859375, -0.9692840576171875, -0.933258056640625, -0.8972320556640625, -0.8612060546875, -0.8251800537109375, -0.789154052734375, -0.7531280517578125, -0.71710205078125, -0.6810760498046875, -0.645050048828125, -0.6090240478515625, -0.572998046875, -0.5369720458984375, -0.500946044921875, -0.4649200439453125, -0.42889404296875, -0.3928680419921875, -0.356842041015625, -0.3208160400390625, -0.2847900390625, -0.2487640380859375, -0.212738037109375, -0.1767120361328125, -0.14068603515625, -0.1046600341796875, -0.068634033203125, -0.0326080322265625, 0.00341796875, 0.0394439697265625, 0.075469970703125, 0.1114959716796875, 0.14752197265625, 0.1835479736328125, 0.219573974609375, 0.2555999755859375, 0.2916259765625, 0.3276519775390625, 0.363677978515625, 0.3997039794921875, 0.43572998046875, 0.4717559814453125, 0.507781982421875, 0.5438079833984375, 0.579833984375, 0.6158599853515625, 0.651885986328125, 0.6879119873046875, 0.72393798828125, 0.7599639892578125, 0.795989990234375, 0.8320159912109375, 0.8680419921875, 0.9040679931640625, 0.940093994140625, 0.9761199951171875, 1.01214599609375, 1.0481719970703125, 1.084197998046875, 1.1202239990234375, 1.15625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 10.0, 13.0, 10.0, 8.0, 17.0, 28.0, 24.0, 25.0, 15.0, 26.0, 42.0, 48.0, 36.0, 24.0, 39.0, 43.0, 1072.0, 47.0, 45.0, 44.0, 45.0, 47.0, 42.0, 36.0, 36.0, 26.0, 26.0, 19.0, 25.0, 16.0, 16.0, 20.0, 13.0, 8.0, 9.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.040771484375, -5.83935546875, -5.637939453125, -5.4365234375, -5.235107421875, -5.03369140625, -4.832275390625, -4.630859375, -4.429443359375, -4.22802734375, -4.026611328125, -3.8251953125, -3.623779296875, -3.42236328125, -3.220947265625, -3.01953125, -2.818115234375, -2.61669921875, -2.415283203125, -2.2138671875, -2.012451171875, -1.81103515625, -1.609619140625, -1.408203125, -1.206787109375, -1.00537109375, -0.803955078125, -0.6025390625, -0.401123046875, -0.19970703125, 0.001708984375, 0.203125, 0.404541015625, 0.60595703125, 0.807373046875, 1.0087890625, 1.210205078125, 1.41162109375, 1.613037109375, 1.814453125, 2.015869140625, 2.21728515625, 2.418701171875, 2.6201171875, 2.821533203125, 3.02294921875, 3.224365234375, 3.42578125, 3.627197265625, 3.82861328125, 4.030029296875, 4.2314453125, 4.432861328125, 4.63427734375, 4.835693359375, 5.037109375, 5.238525390625, 5.43994140625, 5.641357421875, 5.8427734375, 6.044189453125, 6.24560546875, 6.447021484375, 6.6484375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 12.0, 6.0, 20.0, 16.0, 29.0, 36.0, 73.0, 126.0, 182.0, 288.0, 468.0, 734.0, 1217.0, 2053.0, 3413.0, 5709.0, 9746.0, 15985.0, 27145.0, 47282.0, 83181.0, 146196.0, 1293279.0, 196277.0, 111710.0, 63051.0, 36132.0, 21382.0, 12450.0, 7497.0, 4601.0, 2617.0, 1635.0, 967.0, 612.0, 396.0, 212.0, 152.0, 74.0, 63.0, 47.0, 23.0, 17.0, 14.0, 3.0, 5.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.533203125, -1.4864044189453125, -1.439605712890625, -1.3928070068359375, -1.34600830078125, -1.2992095947265625, -1.252410888671875, -1.2056121826171875, -1.1588134765625, -1.1120147705078125, -1.065216064453125, -1.0184173583984375, -0.97161865234375, -0.9248199462890625, -0.878021240234375, -0.8312225341796875, -0.784423828125, -0.7376251220703125, -0.690826416015625, -0.6440277099609375, -0.59722900390625, -0.5504302978515625, -0.503631591796875, -0.4568328857421875, -0.4100341796875, -0.3632354736328125, -0.316436767578125, -0.2696380615234375, -0.22283935546875, -0.1760406494140625, -0.129241943359375, -0.0824432373046875, -0.03564453125, 0.0111541748046875, 0.057952880859375, 0.1047515869140625, 0.15155029296875, 0.1983489990234375, 0.245147705078125, 0.2919464111328125, 0.3387451171875, 0.3855438232421875, 0.432342529296875, 0.4791412353515625, 0.52593994140625, 0.5727386474609375, 0.619537353515625, 0.6663360595703125, 0.713134765625, 0.7599334716796875, 0.806732177734375, 0.8535308837890625, 0.90032958984375, 0.9471282958984375, 0.993927001953125, 1.0407257080078125, 1.0875244140625, 1.1343231201171875, 1.181121826171875, 1.2279205322265625, 1.27471923828125, 1.3215179443359375, 1.368316650390625, 1.4151153564453125, 1.4619140625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 8.0, 6.0, 10.0, 11.0, 22.0, 19.0, 21.0, 34.0, 47.0, 58.0, 57.0, 72.0, 69.0, 96.0, 77.0, 59.0, 69.0, 51.0, 44.0, 37.0, 25.0, 21.0, 16.0, 9.0, 13.0, 4.0, 4.0, 7.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002986907958984375, -0.002899855375289917, -0.002812802791595459, -0.002725750207901001, -0.002638697624206543, -0.002551645040512085, -0.002464592456817627, -0.002377539873123169, -0.002290487289428711, -0.002203434705734253, -0.002116382122039795, -0.002029329538345337, -0.001942276954650879, -0.001855224370956421, -0.0017681717872619629, -0.0016811192035675049, -0.0015940666198730469, -0.0015070140361785889, -0.0014199614524841309, -0.0013329088687896729, -0.0012458562850952148, -0.0011588037014007568, -0.0010717511177062988, -0.0009846985340118408, -0.0008976459503173828, -0.0008105933666229248, -0.0007235407829284668, -0.0006364881992340088, -0.0005494356155395508, -0.0004623830318450928, -0.00037533044815063477, -0.00028827786445617676, -0.00020122528076171875, -0.00011417269706726074, -2.7120113372802734e-05, 5.9932470321655273e-05, 0.00014698505401611328, 0.0002340376377105713, 0.0003210902214050293, 0.0004081428050994873, 0.0004951953887939453, 0.0005822479724884033, 0.0006693005561828613, 0.0007563531398773193, 0.0008434057235717773, 0.0009304583072662354, 0.0010175108909606934, 0.0011045634746551514, 0.0011916160583496094, 0.0012786686420440674, 0.0013657212257385254, 0.0014527738094329834, 0.0015398263931274414, 0.0016268789768218994, 0.0017139315605163574, 0.0018009841442108154, 0.0018880367279052734, 0.0019750893115997314, 0.0020621418952941895, 0.0021491944789886475, 0.0022362470626831055, 0.0023232996463775635, 0.0024103522300720215, 0.0024974048137664795, 0.0025844573974609375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 1.0, 5.0, 6.0, 12.0, 8.0, 11.0, 7.0, 20.0, 40.0, 21.0, 60.0, 92.0, 127.0, 158.0, 346.0, 911.0, 299970.0, 744794.0, 1038.0, 339.0, 176.0, 115.0, 76.0, 55.0, 35.0, 27.0, 22.0, 19.0, 8.0, 12.0, 5.0, 10.0, 6.0, 1.0, 4.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.056793212890625, -0.054837703704833984, -0.05288219451904297, -0.05092668533325195, -0.04897117614746094, -0.04701566696166992, -0.045060157775878906, -0.04310464859008789, -0.041149139404296875, -0.03919363021850586, -0.037238121032714844, -0.03528261184692383, -0.03332710266113281, -0.0313715934753418, -0.02941608428955078, -0.027460575103759766, -0.02550506591796875, -0.023549556732177734, -0.02159404754638672, -0.019638538360595703, -0.017683029174804688, -0.015727519989013672, -0.013772010803222656, -0.01181650161743164, -0.009860992431640625, -0.00790548324584961, -0.005949974060058594, -0.003994464874267578, -0.0020389556884765625, -8.344650268554688e-05, 0.0018720626831054688, 0.0038275718688964844, 0.0057830810546875, 0.007738590240478516, 0.009694099426269531, 0.011649608612060547, 0.013605117797851562, 0.015560626983642578, 0.017516136169433594, 0.01947164535522461, 0.021427154541015625, 0.02338266372680664, 0.025338172912597656, 0.027293682098388672, 0.029249191284179688, 0.031204700469970703, 0.03316020965576172, 0.035115718841552734, 0.03707122802734375, 0.039026737213134766, 0.04098224639892578, 0.0429377555847168, 0.04489326477050781, 0.04684877395629883, 0.048804283142089844, 0.05075979232788086, 0.052715301513671875, 0.05467081069946289, 0.056626319885253906, 0.05858182907104492, 0.06053733825683594, 0.06249284744262695, 0.06444835662841797, 0.06640386581420898, 0.068359375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 7.0, 7.0, 23.0, 79.0, 169.0, 276.0, 230.0, 142.0, 59.0, 20.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006881483714096248, -0.0006108620436862111, -0.0005335757159627974, -0.0004562893882393837, -0.00037900306051597, -0.0003017167327925563, -0.00022443040506914258, -0.00014714407734572887, -6.985774962231517e-05, 7.4285781010985374e-06, 8.471490582451224e-05, 0.00016200123354792595, 0.00023928756127133965, 0.00031657388899475336, 0.00039386021671816707, 0.00047114654444158077, 0.0005484328721649945, 0.0006257191998884082, 0.0007030055276118219, 0.0007802918553352356, 0.0008575781830586493, 0.000934864510782063, 0.0010121508967131376, 0.0010894371662288904, 0.0011667234357446432, 0.001244009705260396, 0.0013212960911914706, 0.0013985824771225452, 0.001475868746638298, 0.0015531550161540508, 0.0016304414020851254, 0.0017077277880162, 0.0017850142903625965, 0.0018623005598783493, 0.001939586945809424, 0.0020168733317404985, 0.0020941596012562513, 0.002171445870772004, 0.0022487323731184006, 0.0023260186426341534, 0.002403304912149906, 0.002480591181665659, 0.0025578774511814117, 0.002635163953527808, 0.002712450223043561, 0.0027897364925593138, 0.0028670229949057102, 0.002944309264421463, 0.003021595533937216, 0.0030988818034529686, 0.0031761680729687214, 0.003253454575315118, 0.0033307408448308706, 0.0034080271143466234, 0.00348531361669302, 0.0035625998862087727, 0.0036398861557245255, 0.0037171724252402782, 0.003794458694756031, 0.0038717451971024275, 0.003949031233787537, 0.004026317968964577, 0.0041036042384803295, 0.004180890507996082, 0.004258176777511835]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 6.0, 11.0, 8.0, 11.0, 10.0, 15.0, 9.0, 18.0, 21.0, 27.0, 27.0, 36.0, 39.0, 40.0, 37.0, 40.0, 46.0, 36.0, 44.0, 32.0, 42.0, 56.0, 29.0, 46.0, 36.0, 37.0, 28.0, 29.0, 36.0, 29.0, 28.0, 14.0, 14.0, 11.0, 14.0, 11.0, 7.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.001127481460571289, -0.0010868236422538757, -0.0010461658239364624, -0.001005508005619049, -0.0009648501873016357, -0.0009241923689842224, -0.0008835345506668091, -0.0008428767323493958, -0.0008022189140319824, -0.0007615610957145691, -0.0007209032773971558, -0.0006802454590797424, -0.0006395876407623291, -0.0005989298224449158, -0.0005582720041275024, -0.0005176141858100891, -0.0004769563674926758, -0.00043629854917526245, -0.0003956407308578491, -0.0003549829125404358, -0.00031432509422302246, -0.00027366727590560913, -0.0002330094575881958, -0.00019235163927078247, -0.00015169382095336914, -0.00011103600263595581, -7.037818431854248e-05, -2.972036600112915e-05, 1.093745231628418e-05, 5.159527063369751e-05, 9.225308895111084e-05, 0.00013291090726852417, 0.0001735687255859375, 0.00021422654390335083, 0.00025488436222076416, 0.0002955421805381775, 0.0003361999988555908, 0.00037685781717300415, 0.0004175156354904175, 0.0004581734538078308, 0.0004988312721252441, 0.0005394890904426575, 0.0005801469087600708, 0.0006208047270774841, 0.0006614625453948975, 0.0007021203637123108, 0.0007427781820297241, 0.0007834360003471375, 0.0008240938186645508, 0.0008647516369819641, 0.0009054094552993774, 0.0009460672736167908, 0.000986725091934204, 0.0010273829102516174, 0.0010680407285690308, 0.001108698546886444, 0.0011493563652038574, 0.0011900141835212708, 0.001230672001838684, 0.0012713298201560974, 0.0013119876384735107, 0.001352645456790924, 0.0013933032751083374, 0.0014339610934257507, 0.001474618911743164]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 8.0, 10.0, 11.0, 11.0, 15.0, 13.0, 27.0, 17.0, 25.0, 24.0, 34.0, 28.0, 34.0, 38.0, 38.0, 52.0, 44.0, 48.0, 51.0, 35.0, 35.0, 43.0, 32.0, 39.0, 41.0, 28.0, 34.0, 24.0, 24.0, 22.0, 13.0, 15.0, 18.0, 10.0, 5.0, 7.0, 4.0, 6.0, 8.0, 3.0, 2.0, 0.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.680419921875, -8.39208984375, -8.103759765625, -7.8154296875, -7.527099609375, -7.23876953125, -6.950439453125, -6.662109375, -6.373779296875, -6.08544921875, -5.797119140625, -5.5087890625, -5.220458984375, -4.93212890625, -4.643798828125, -4.35546875, -4.067138671875, -3.77880859375, -3.490478515625, -3.2021484375, -2.913818359375, -2.62548828125, -2.337158203125, -2.048828125, -1.760498046875, -1.47216796875, -1.183837890625, -0.8955078125, -0.607177734375, -0.31884765625, -0.030517578125, 0.2578125, 0.546142578125, 0.83447265625, 1.122802734375, 1.4111328125, 1.699462890625, 1.98779296875, 2.276123046875, 2.564453125, 2.852783203125, 3.14111328125, 3.429443359375, 3.7177734375, 4.006103515625, 4.29443359375, 4.582763671875, 4.87109375, 5.159423828125, 5.44775390625, 5.736083984375, 6.0244140625, 6.312744140625, 6.60107421875, 6.889404296875, 7.177734375, 7.466064453125, 7.75439453125, 8.042724609375, 8.3310546875, 8.619384765625, 8.90771484375, 9.196044921875, 9.484375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 15.0, 11.0, 16.0, 10.0, 18.0, 22.0, 30.0, 31.0, 55.0, 62.0, 101.0, 138.0, 166.0, 314.0, 585.0, 1560.0, 5686.0, 31413.0, 314460.0, 630879.0, 50619.0, 8535.0, 1991.0, 704.0, 327.0, 228.0, 160.0, 98.0, 74.0, 52.0, 51.0, 29.0, 29.0, 19.0, 7.0, 13.0, 7.0, 7.0, 4.0, 9.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.75, -17.1796875, -16.609375, -16.0390625, -15.46875, -14.8984375, -14.328125, -13.7578125, -13.1875, -12.6171875, -12.046875, -11.4765625, -10.90625, -10.3359375, -9.765625, -9.1953125, -8.625, -8.0546875, -7.484375, -6.9140625, -6.34375, -5.7734375, -5.203125, -4.6328125, -4.0625, -3.4921875, -2.921875, -2.3515625, -1.78125, -1.2109375, -0.640625, -0.0703125, 0.5, 1.0703125, 1.640625, 2.2109375, 2.78125, 3.3515625, 3.921875, 4.4921875, 5.0625, 5.6328125, 6.203125, 6.7734375, 7.34375, 7.9140625, 8.484375, 9.0546875, 9.625, 10.1953125, 10.765625, 11.3359375, 11.90625, 12.4765625, 13.046875, 13.6171875, 14.1875, 14.7578125, 15.328125, 15.8984375, 16.46875, 17.0390625, 17.609375, 18.1796875, 18.75]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 6.0, 5.0, 6.0, 10.0, 6.0, 10.0, 13.0, 17.0, 21.0, 21.0, 27.0, 18.0, 38.0, 25.0, 33.0, 35.0, 54.0, 51.0, 82.0, 145.0, 1569.0, 334.0, 89.0, 65.0, 37.0, 48.0, 44.0, 33.0, 28.0, 25.0, 19.0, 22.0, 25.0, 15.0, 16.0, 13.0, 10.0, 4.0, 6.0, 4.0, 3.0, 3.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.6875, -26.819580078125, -25.95166015625, -25.083740234375, -24.2158203125, -23.347900390625, -22.47998046875, -21.612060546875, -20.744140625, -19.876220703125, -19.00830078125, -18.140380859375, -17.2724609375, -16.404541015625, -15.53662109375, -14.668701171875, -13.80078125, -12.932861328125, -12.06494140625, -11.197021484375, -10.3291015625, -9.461181640625, -8.59326171875, -7.725341796875, -6.857421875, -5.989501953125, -5.12158203125, -4.253662109375, -3.3857421875, -2.517822265625, -1.64990234375, -0.781982421875, 0.0859375, 0.953857421875, 1.82177734375, 2.689697265625, 3.5576171875, 4.425537109375, 5.29345703125, 6.161376953125, 7.029296875, 7.897216796875, 8.76513671875, 9.633056640625, 10.5009765625, 11.368896484375, 12.23681640625, 13.104736328125, 13.97265625, 14.840576171875, 15.70849609375, 16.576416015625, 17.4443359375, 18.312255859375, 19.18017578125, 20.048095703125, 20.916015625, 21.783935546875, 22.65185546875, 23.519775390625, 24.3876953125, 25.255615234375, 26.12353515625, 26.991455078125, 27.859375]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 4.0, 5.0, 3.0, 4.0, 9.0, 8.0, 8.0, 13.0, 18.0, 30.0, 32.0, 29.0, 41.0, 43.0, 48.0, 92.0, 108.0, 160.0, 329.0, 759.0, 5474.0, 2742113.0, 391317.0, 3439.0, 640.0, 316.0, 189.0, 97.0, 67.0, 64.0, 47.0, 29.0, 38.0, 28.0, 28.0, 15.0, 13.0, 11.0, 9.0, 5.0, 7.0, 7.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-64.5625, -62.5390625, -60.515625, -58.4921875, -56.46875, -54.4453125, -52.421875, -50.3984375, -48.375, -46.3515625, -44.328125, -42.3046875, -40.28125, -38.2578125, -36.234375, -34.2109375, -32.1875, -30.1640625, -28.140625, -26.1171875, -24.09375, -22.0703125, -20.046875, -18.0234375, -16.0, -13.9765625, -11.953125, -9.9296875, -7.90625, -5.8828125, -3.859375, -1.8359375, 0.1875, 2.2109375, 4.234375, 6.2578125, 8.28125, 10.3046875, 12.328125, 14.3515625, 16.375, 18.3984375, 20.421875, 22.4453125, 24.46875, 26.4921875, 28.515625, 30.5390625, 32.5625, 34.5859375, 36.609375, 38.6328125, 40.65625, 42.6796875, 44.703125, 46.7265625, 48.75, 50.7734375, 52.796875, 54.8203125, 56.84375, 58.8671875, 60.890625, 62.9140625, 64.9375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 42.0, 471.0, 454.0, 44.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.8292999267578, -123.87491607666016, -118.9205322265625, -113.96614837646484, -109.01176452636719, -104.05738067626953, -99.10299682617188, -94.14860534667969, -89.19422912597656, -84.2398452758789, -79.28546142578125, -74.3310775756836, -69.37669372558594, -64.42230987548828, -59.46792221069336, -54.5135383605957, -49.55915069580078, -44.604766845703125, -39.65038299560547, -34.69599914550781, -29.741613388061523, -24.787229537963867, -19.832843780517578, -14.878459930419922, -9.924076080322266, -4.969691753387451, -0.015307426452636719, 4.939077377319336, 9.893461227416992, 14.847845077514648, 19.802230834960938, 24.756614685058594, 29.71099853515625, 34.665382385253906, 39.61976623535156, 44.57415008544922, 49.528533935546875, 54.48291778564453, 59.43730545043945, 64.39169311523438, 69.3460693359375, 74.30045318603516, 79.25483703613281, 84.20922088623047, 89.16360473632812, 94.11798858642578, 99.07237243652344, 104.02676391601562, 108.98114776611328, 113.93553161621094, 118.8899154663086, 123.84429931640625, 128.79869079589844, 133.75306701660156, 138.70745849609375, 143.66183471679688, 148.61622619628906, 153.57061767578125, 158.52499389648438, 163.47938537597656, 168.4337615966797, 173.38815307617188, 178.342529296875, 183.2969207763672, 188.2512969970703]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 1.0, 5.0, 8.0, 7.0, 8.0, 10.0, 11.0, 19.0, 10.0, 13.0, 13.0, 18.0, 21.0, 26.0, 27.0, 29.0, 22.0, 35.0, 28.0, 27.0, 31.0, 32.0, 38.0, 36.0, 29.0, 37.0, 32.0, 30.0, 46.0, 29.0, 37.0, 25.0, 21.0, 28.0, 21.0, 17.0, 25.0, 20.0, 12.0, 17.0, 20.0, 12.0, 14.0, 11.0, 7.0, 4.0, 7.0, 7.0, 4.0, 3.0, 4.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-59.55815124511719, -57.63398742675781, -55.70982360839844, -53.78565979003906, -51.86149978637695, -49.93733596801758, -48.0131721496582, -46.08900833129883, -44.16484832763672, -42.240684509277344, -40.31652069091797, -38.392356872558594, -36.468196868896484, -34.54403305053711, -32.619869232177734, -30.69570541381836, -28.771541595458984, -26.84737777709961, -24.923215866088867, -22.999052047729492, -21.07489013671875, -19.150726318359375, -17.2265625, -15.302399635314941, -13.378236770629883, -11.454073905944824, -9.529911041259766, -7.605747222900391, -5.681584358215332, -3.7574214935302734, -1.8332576751708984, 0.09090518951416016, 2.0150680541992188, 3.9392311573028564, 5.863394260406494, 7.787557601928711, 9.71172046661377, 11.635883331298828, 13.560047149658203, 15.484210014343262, 17.40837287902832, 19.332536697387695, 21.256698608398438, 23.180862426757812, 25.105026245117188, 27.02918815612793, 28.953351974487305, 30.877513885498047, 32.80167770385742, 34.7258415222168, 36.65000534057617, 38.57416534423828, 40.498329162597656, 42.42249298095703, 44.346656799316406, 46.27082061767578, 48.194984436035156, 50.11914825439453, 52.043312072753906, 53.96747589111328, 55.89163589477539, 57.815799713134766, 59.73996353149414, 61.664127349853516, 63.588287353515625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 9.0, 7.0, 4.0, 7.0, 6.0, 12.0, 9.0, 11.0, 18.0, 20.0, 27.0, 27.0, 26.0, 28.0, 35.0, 32.0, 36.0, 43.0, 43.0, 52.0, 39.0, 37.0, 37.0, 62.0, 34.0, 38.0, 31.0, 39.0, 34.0, 29.0, 33.0, 20.0, 20.0, 17.0, 18.0, 14.0, 9.0, 12.0, 6.0, 4.0, 5.0, 1.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.046875, -8.7479248046875, -8.448974609375, -8.1500244140625, -7.85107421875, -7.5521240234375, -7.253173828125, -6.9542236328125, -6.6552734375, -6.3563232421875, -6.057373046875, -5.7584228515625, -5.45947265625, -5.1605224609375, -4.861572265625, -4.5626220703125, -4.263671875, -3.9647216796875, -3.665771484375, -3.3668212890625, -3.06787109375, -2.7689208984375, -2.469970703125, -2.1710205078125, -1.8720703125, -1.5731201171875, -1.274169921875, -0.9752197265625, -0.67626953125, -0.3773193359375, -0.078369140625, 0.2205810546875, 0.51953125, 0.8184814453125, 1.117431640625, 1.4163818359375, 1.71533203125, 2.0142822265625, 2.313232421875, 2.6121826171875, 2.9111328125, 3.2100830078125, 3.509033203125, 3.8079833984375, 4.10693359375, 4.4058837890625, 4.704833984375, 5.0037841796875, 5.302734375, 5.6016845703125, 5.900634765625, 6.1995849609375, 6.49853515625, 6.7974853515625, 7.096435546875, 7.3953857421875, 7.6943359375, 7.9932861328125, 8.292236328125, 8.5911865234375, 8.89013671875, 9.1890869140625, 9.488037109375, 9.7869873046875, 10.0859375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 0.0, 1.0, 6.0, 11.0, 8.0, 10.0, 13.0, 11.0, 18.0, 20.0, 18.0, 25.0, 50.0, 46.0, 66.0, 162.0, 318.0, 685.0, 2039.0, 7001.0, 36784.0, 612072.0, 3101198.0, 395110.0, 29288.0, 6170.0, 1808.0, 657.0, 256.0, 106.0, 67.0, 51.0, 42.0, 30.0, 33.0, 17.0, 16.0, 11.0, 9.0, 9.0, 5.0, 6.0, 5.0, 10.0, 0.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-25.6875, -24.8955078125, -24.103515625, -23.3115234375, -22.51953125, -21.7275390625, -20.935546875, -20.1435546875, -19.3515625, -18.5595703125, -17.767578125, -16.9755859375, -16.18359375, -15.3916015625, -14.599609375, -13.8076171875, -13.015625, -12.2236328125, -11.431640625, -10.6396484375, -9.84765625, -9.0556640625, -8.263671875, -7.4716796875, -6.6796875, -5.8876953125, -5.095703125, -4.3037109375, -3.51171875, -2.7197265625, -1.927734375, -1.1357421875, -0.34375, 0.4482421875, 1.240234375, 2.0322265625, 2.82421875, 3.6162109375, 4.408203125, 5.2001953125, 5.9921875, 6.7841796875, 7.576171875, 8.3681640625, 9.16015625, 9.9521484375, 10.744140625, 11.5361328125, 12.328125, 13.1201171875, 13.912109375, 14.7041015625, 15.49609375, 16.2880859375, 17.080078125, 17.8720703125, 18.6640625, 19.4560546875, 20.248046875, 21.0400390625, 21.83203125, 22.6240234375, 23.416015625, 24.2080078125, 25.0]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 11.0, 18.0, 11.0, 17.0, 23.0, 40.0, 59.0, 95.0, 131.0, 168.0, 272.0, 395.0, 559.0, 620.0, 531.0, 362.0, 254.0, 153.0, 128.0, 78.0, 44.0, 37.0, 24.0, 12.0, 11.0, 10.0, 6.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.65625, -21.02685546875, -20.3974609375, -19.76806640625, -19.138671875, -18.50927734375, -17.8798828125, -17.25048828125, -16.62109375, -15.99169921875, -15.3623046875, -14.73291015625, -14.103515625, -13.47412109375, -12.8447265625, -12.21533203125, -11.5859375, -10.95654296875, -10.3271484375, -9.69775390625, -9.068359375, -8.43896484375, -7.8095703125, -7.18017578125, -6.55078125, -5.92138671875, -5.2919921875, -4.66259765625, -4.033203125, -3.40380859375, -2.7744140625, -2.14501953125, -1.515625, -0.88623046875, -0.2568359375, 0.37255859375, 1.001953125, 1.63134765625, 2.2607421875, 2.89013671875, 3.51953125, 4.14892578125, 4.7783203125, 5.40771484375, 6.037109375, 6.66650390625, 7.2958984375, 7.92529296875, 8.5546875, 9.18408203125, 9.8134765625, 10.44287109375, 11.072265625, 11.70166015625, 12.3310546875, 12.96044921875, 13.58984375, 14.21923828125, 14.8486328125, 15.47802734375, 16.107421875, 16.73681640625, 17.3662109375, 17.99560546875, 18.625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 11.0, 9.0, 27.0, 36.0, 39.0, 66.0, 78.0, 102.0, 141.0, 240.0, 354.0, 942.0, 6287.0, 773787.0, 3397200.0, 12376.0, 1244.0, 471.0, 247.0, 170.0, 111.0, 85.0, 51.0, 48.0, 42.0, 23.0, 19.0, 14.0, 10.0, 9.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-90.5625, -88.18603515625, -85.8095703125, -83.43310546875, -81.056640625, -78.68017578125, -76.3037109375, -73.92724609375, -71.55078125, -69.17431640625, -66.7978515625, -64.42138671875, -62.044921875, -59.66845703125, -57.2919921875, -54.91552734375, -52.5390625, -50.16259765625, -47.7861328125, -45.40966796875, -43.033203125, -40.65673828125, -38.2802734375, -35.90380859375, -33.52734375, -31.15087890625, -28.7744140625, -26.39794921875, -24.021484375, -21.64501953125, -19.2685546875, -16.89208984375, -14.515625, -12.13916015625, -9.7626953125, -7.38623046875, -5.009765625, -2.63330078125, -0.2568359375, 2.11962890625, 4.49609375, 6.87255859375, 9.2490234375, 11.62548828125, 14.001953125, 16.37841796875, 18.7548828125, 21.13134765625, 23.5078125, 25.88427734375, 28.2607421875, 30.63720703125, 33.013671875, 35.39013671875, 37.7666015625, 40.14306640625, 42.51953125, 44.89599609375, 47.2724609375, 49.64892578125, 52.025390625, 54.40185546875, 56.7783203125, 59.15478515625, 61.53125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 11.0, 31.0, 74.0, 155.0, 248.0, 251.0, 146.0, 64.0, 16.0, 10.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.1055450439453, -158.2458953857422, -154.38623046875, -150.52658081054688, -146.6669158935547, -142.80726623535156, -138.94760131835938, -135.08795166015625, -131.22830200195312, -127.36864471435547, -123.50898742675781, -119.64933776855469, -115.78968048095703, -111.93002319335938, -108.07036590576172, -104.21070861816406, -100.3510513305664, -96.49139404296875, -92.6317367553711, -88.77207946777344, -84.91242980957031, -81.05277252197266, -77.193115234375, -73.33345794677734, -69.47380065917969, -65.61414337158203, -61.75448989868164, -57.894832611083984, -54.035179138183594, -50.17552185058594, -46.31586456298828, -42.456207275390625, -38.5965576171875, -34.736900329589844, -30.877246856689453, -27.017589569091797, -23.157934188842773, -19.29827880859375, -15.438621520996094, -11.57896614074707, -7.719310760498047, -3.8596549034118652, 9.5367431640625e-07, 3.8596572875976562, 7.71931266784668, 11.578968048095703, 15.43862533569336, 19.298280715942383, 23.157936096191406, 27.01759147644043, 30.877246856689453, 34.73690414428711, 38.5965576171875, 42.456214904785156, 46.31587219238281, 50.17552947998047, 54.03518295288086, 57.894840240478516, 61.754493713378906, 65.61415100097656, 69.47380828857422, 73.33346557617188, 77.193115234375, 81.05277252197266, 84.91242980957031]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 11.0, 4.0, 6.0, 9.0, 11.0, 9.0, 23.0, 16.0, 22.0, 25.0, 26.0, 37.0, 32.0, 27.0, 38.0, 39.0, 40.0, 43.0, 30.0, 43.0, 46.0, 47.0, 55.0, 47.0, 43.0, 37.0, 40.0, 31.0, 25.0, 23.0, 12.0, 17.0, 13.0, 11.0, 11.0, 18.0, 12.0, 4.0, 3.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.865867614746094, -52.09005355834961, -50.31423568725586, -48.538421630859375, -46.76260757446289, -44.98678970336914, -43.210975646972656, -41.435157775878906, -39.65934371948242, -37.88352966308594, -36.10771179199219, -34.3318977355957, -32.55608367919922, -30.78026580810547, -29.004451751708984, -27.228635787963867, -25.452821731567383, -23.677005767822266, -21.90119171142578, -20.125375747680664, -18.349559783935547, -16.573745727539062, -14.797929763793945, -13.022113800048828, -11.246298789978027, -9.470483779907227, -7.694667816162109, -5.918852806091309, -4.14303731918335, -2.3672218322753906, -0.5914068222045898, 1.1844091415405273, 2.960224151611328, 4.736039638519287, 6.511855125427246, 8.287670135498047, 10.063486099243164, 11.839301109313965, 13.615116119384766, 15.390932083129883, 17.166748046875, 18.942564010620117, 20.7183780670166, 22.49419403076172, 24.270009994506836, 26.045825958251953, 27.821640014648438, 29.597455978393555, 31.37327003479004, 33.149085998535156, 34.92490005493164, 36.700714111328125, 38.476531982421875, 40.25234603881836, 42.028160095214844, 43.803977966308594, 45.57979202270508, 47.35560607910156, 49.13142395019531, 50.9072380065918, 52.68305206298828, 54.45886993408203, 56.234683990478516, 58.010498046875, 59.78631591796875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 6.0, 15.0, 10.0, 15.0, 9.0, 15.0, 20.0, 17.0, 24.0, 27.0, 19.0, 21.0, 30.0, 31.0, 35.0, 31.0, 33.0, 47.0, 40.0, 38.0, 35.0, 42.0, 41.0, 47.0, 33.0, 37.0, 40.0, 38.0, 23.0, 23.0, 29.0, 13.0, 13.0, 18.0, 13.0, 14.0, 9.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.921875, -9.634521484375, -9.34716796875, -9.059814453125, -8.7724609375, -8.485107421875, -8.19775390625, -7.910400390625, -7.623046875, -7.335693359375, -7.04833984375, -6.760986328125, -6.4736328125, -6.186279296875, -5.89892578125, -5.611572265625, -5.32421875, -5.036865234375, -4.74951171875, -4.462158203125, -4.1748046875, -3.887451171875, -3.60009765625, -3.312744140625, -3.025390625, -2.738037109375, -2.45068359375, -2.163330078125, -1.8759765625, -1.588623046875, -1.30126953125, -1.013916015625, -0.7265625, -0.439208984375, -0.15185546875, 0.135498046875, 0.4228515625, 0.710205078125, 0.99755859375, 1.284912109375, 1.572265625, 1.859619140625, 2.14697265625, 2.434326171875, 2.7216796875, 3.009033203125, 3.29638671875, 3.583740234375, 3.87109375, 4.158447265625, 4.44580078125, 4.733154296875, 5.0205078125, 5.307861328125, 5.59521484375, 5.882568359375, 6.169921875, 6.457275390625, 6.74462890625, 7.031982421875, 7.3193359375, 7.606689453125, 7.89404296875, 8.181396484375, 8.46875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 0.0, 6.0, 9.0, 11.0, 12.0, 26.0, 33.0, 55.0, 80.0, 122.0, 198.0, 299.0, 437.0, 652.0, 980.0, 1390.0, 2107.0, 3334.0, 4769.0, 7394.0, 11065.0, 17093.0, 26534.0, 41011.0, 64601.0, 103356.0, 165459.0, 212187.0, 140626.0, 88323.0, 55046.0, 35440.0, 22600.0, 14491.0, 9617.0, 6478.0, 4192.0, 2797.0, 1917.0, 1267.0, 830.0, 544.0, 359.0, 279.0, 182.0, 122.0, 68.0, 54.0, 49.0, 23.0, 19.0, 10.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2763671875, -1.234283447265625, -1.19219970703125, -1.150115966796875, -1.1080322265625, -1.065948486328125, -1.02386474609375, -0.981781005859375, -0.939697265625, -0.897613525390625, -0.85552978515625, -0.813446044921875, -0.7713623046875, -0.729278564453125, -0.68719482421875, -0.645111083984375, -0.60302734375, -0.560943603515625, -0.51885986328125, -0.476776123046875, -0.4346923828125, -0.392608642578125, -0.35052490234375, -0.308441162109375, -0.266357421875, -0.224273681640625, -0.18218994140625, -0.140106201171875, -0.0980224609375, -0.055938720703125, -0.01385498046875, 0.028228759765625, 0.0703125, 0.112396240234375, 0.15447998046875, 0.196563720703125, 0.2386474609375, 0.280731201171875, 0.32281494140625, 0.364898681640625, 0.406982421875, 0.449066162109375, 0.49114990234375, 0.533233642578125, 0.5753173828125, 0.617401123046875, 0.65948486328125, 0.701568603515625, 0.74365234375, 0.785736083984375, 0.82781982421875, 0.869903564453125, 0.9119873046875, 0.954071044921875, 0.99615478515625, 1.038238525390625, 1.080322265625, 1.122406005859375, 1.16448974609375, 1.206573486328125, 1.2486572265625, 1.290740966796875, 1.33282470703125, 1.374908447265625, 1.4169921875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 9.0, 9.0, 4.0, 10.0, 14.0, 16.0, 22.0, 13.0, 20.0, 19.0, 26.0, 38.0, 31.0, 36.0, 48.0, 45.0, 42.0, 52.0, 40.0, 1079.0, 43.0, 41.0, 32.0, 35.0, 24.0, 36.0, 28.0, 27.0, 25.0, 31.0, 29.0, 17.0, 13.0, 14.0, 8.0, 10.0, 8.0, 11.0, 4.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96484375, -5.765380859375, -5.56591796875, -5.366455078125, -5.1669921875, -4.967529296875, -4.76806640625, -4.568603515625, -4.369140625, -4.169677734375, -3.97021484375, -3.770751953125, -3.5712890625, -3.371826171875, -3.17236328125, -2.972900390625, -2.7734375, -2.573974609375, -2.37451171875, -2.175048828125, -1.9755859375, -1.776123046875, -1.57666015625, -1.377197265625, -1.177734375, -0.978271484375, -0.77880859375, -0.579345703125, -0.3798828125, -0.180419921875, 0.01904296875, 0.218505859375, 0.41796875, 0.617431640625, 0.81689453125, 1.016357421875, 1.2158203125, 1.415283203125, 1.61474609375, 1.814208984375, 2.013671875, 2.213134765625, 2.41259765625, 2.612060546875, 2.8115234375, 3.010986328125, 3.21044921875, 3.409912109375, 3.609375, 3.808837890625, 4.00830078125, 4.207763671875, 4.4072265625, 4.606689453125, 4.80615234375, 5.005615234375, 5.205078125, 5.404541015625, 5.60400390625, 5.803466796875, 6.0029296875, 6.202392578125, 6.40185546875, 6.601318359375, 6.80078125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 17.0, 23.0, 45.0, 55.0, 79.0, 108.0, 213.0, 284.0, 517.0, 747.0, 1124.0, 1723.0, 2702.0, 4272.0, 6803.0, 10780.0, 16974.0, 26766.0, 42282.0, 68353.0, 108503.0, 171609.0, 1256187.0, 139284.0, 88107.0, 55507.0, 34449.0, 21652.0, 13749.0, 8725.0, 5563.0, 3518.0, 2296.0, 1520.0, 886.0, 588.0, 365.0, 242.0, 196.0, 102.0, 69.0, 56.0, 27.0, 16.0, 15.0, 9.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2880859375, -1.2469024658203125, -1.205718994140625, -1.1645355224609375, -1.12335205078125, -1.0821685791015625, -1.040985107421875, -0.9998016357421875, -0.9586181640625, -0.9174346923828125, -0.876251220703125, -0.8350677490234375, -0.79388427734375, -0.7527008056640625, -0.711517333984375, -0.6703338623046875, -0.629150390625, -0.5879669189453125, -0.546783447265625, -0.5055999755859375, -0.46441650390625, -0.4232330322265625, -0.382049560546875, -0.3408660888671875, -0.2996826171875, -0.2584991455078125, -0.217315673828125, -0.1761322021484375, -0.13494873046875, -0.0937652587890625, -0.052581787109375, -0.0113983154296875, 0.02978515625, 0.0709686279296875, 0.112152099609375, 0.1533355712890625, 0.19451904296875, 0.2357025146484375, 0.276885986328125, 0.3180694580078125, 0.3592529296875, 0.4004364013671875, 0.441619873046875, 0.4828033447265625, 0.52398681640625, 0.5651702880859375, 0.606353759765625, 0.6475372314453125, 0.688720703125, 0.7299041748046875, 0.771087646484375, 0.8122711181640625, 0.85345458984375, 0.8946380615234375, 0.935821533203125, 0.9770050048828125, 1.0181884765625, 1.0593719482421875, 1.100555419921875, 1.1417388916015625, 1.18292236328125, 1.2241058349609375, 1.265289306640625, 1.3064727783203125, 1.34765625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 4.0, 9.0, 7.0, 8.0, 10.0, 15.0, 31.0, 29.0, 41.0, 65.0, 65.0, 73.0, 80.0, 85.0, 100.0, 70.0, 67.0, 52.0, 41.0, 38.0, 24.0, 18.0, 9.0, 14.0, 15.0, 7.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036334991455078125, -0.003529101610183716, -0.003424704074859619, -0.0033203065395355225, -0.0032159090042114258, -0.003111511468887329, -0.0030071139335632324, -0.0029027163982391357, -0.002798318862915039, -0.0026939213275909424, -0.0025895237922668457, -0.002485126256942749, -0.0023807287216186523, -0.0022763311862945557, -0.002171933650970459, -0.0020675361156463623, -0.0019631385803222656, -0.001858741044998169, -0.0017543435096740723, -0.0016499459743499756, -0.001545548439025879, -0.0014411509037017822, -0.0013367533683776855, -0.0012323558330535889, -0.0011279582977294922, -0.0010235607624053955, -0.0009191632270812988, -0.0008147656917572021, -0.0007103681564331055, -0.0006059706211090088, -0.0005015730857849121, -0.00039717555046081543, -0.00029277801513671875, -0.00018838047981262207, -8.398294448852539e-05, 2.041459083557129e-05, 0.00012481212615966797, 0.00022920966148376465, 0.00033360719680786133, 0.000438004732131958, 0.0005424022674560547, 0.0006467998027801514, 0.000751197338104248, 0.0008555948734283447, 0.0009599924087524414, 0.001064389944076538, 0.0011687874794006348, 0.0012731850147247314, 0.0013775825500488281, 0.0014819800853729248, 0.0015863776206970215, 0.0016907751560211182, 0.0017951726913452148, 0.0018995702266693115, 0.002003967761993408, 0.002108365297317505, 0.0022127628326416016, 0.0023171603679656982, 0.002421557903289795, 0.0025259554386138916, 0.0026303529739379883, 0.002734750509262085, 0.0028391480445861816, 0.0029435455799102783, 0.003047943115234375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 2.0, 8.0, 14.0, 20.0, 14.0, 23.0, 28.0, 43.0, 54.0, 96.0, 147.0, 252.0, 687.0, 48673.0, 996295.0, 1241.0, 337.0, 190.0, 122.0, 75.0, 56.0, 39.0, 29.0, 20.0, 22.0, 10.0, 4.0, 11.0, 6.0, 6.0, 9.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059783935546875, -0.057584285736083984, -0.05538463592529297, -0.05318498611450195, -0.05098533630371094, -0.04878568649291992, -0.046586036682128906, -0.04438638687133789, -0.042186737060546875, -0.03998708724975586, -0.037787437438964844, -0.03558778762817383, -0.03338813781738281, -0.031188488006591797, -0.02898883819580078, -0.026789188385009766, -0.02458953857421875, -0.022389888763427734, -0.02019023895263672, -0.017990589141845703, -0.015790939331054688, -0.013591289520263672, -0.011391639709472656, -0.00919198989868164, -0.006992340087890625, -0.004792690277099609, -0.0025930404663085938, -0.0003933906555175781, 0.0018062591552734375, 0.004005908966064453, 0.006205558776855469, 0.008405208587646484, 0.0106048583984375, 0.012804508209228516, 0.015004158020019531, 0.017203807830810547, 0.019403457641601562, 0.021603107452392578, 0.023802757263183594, 0.02600240707397461, 0.028202056884765625, 0.03040170669555664, 0.032601356506347656, 0.03480100631713867, 0.03700065612792969, 0.0392003059387207, 0.04139995574951172, 0.043599605560302734, 0.04579925537109375, 0.047998905181884766, 0.05019855499267578, 0.0523982048034668, 0.05459785461425781, 0.05679750442504883, 0.058997154235839844, 0.06119680404663086, 0.06339645385742188, 0.06559610366821289, 0.0677957534790039, 0.06999540328979492, 0.07219505310058594, 0.07439470291137695, 0.07659435272216797, 0.07879400253295898, 0.08099365234375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 13.0, 503.0, 488.0, 15.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011714515276253223, -0.0007818718440830708, -0.00039229216054081917, -2.712476998567581e-06, 0.000386867206543684, 0.0007764468900859356, 0.0011660265736281872, 0.0015556062571704388, 0.0019451859407126904, 0.002334765624254942, 0.0027243453077971935, 0.003113924991339445, 0.0035035046748816967, 0.0038930843584239483, 0.0042826640419662, 0.0046722437255084515, 0.005061823409050703, 0.005451403092592955, 0.005840982776135206, 0.006230562459677458, 0.006620142143219709, 0.007009721826761961, 0.007399301510304213, 0.007788881193846464, 0.008178461343050003, 0.008568041026592255, 0.008957620710134506, 0.009347200393676758, 0.00973678007721901, 0.010126359760761261, 0.010515939444303513, 0.010905519127845764, 0.011295098811388016, 0.011684678494930267, 0.012074258178472519, 0.01246383786201477, 0.012853417545557022, 0.013242997229099274, 0.013632576912641525, 0.014022156596183777, 0.014411736279726028, 0.01480131596326828, 0.015190895646810532, 0.015580475330352783, 0.015970055013895035, 0.016359634697437286, 0.016749214380979538, 0.01713879406452179, 0.01752837374806404, 0.017917953431606293, 0.018307533115148544, 0.018697112798690796, 0.019086692482233047, 0.0194762721657753, 0.01986585184931755, 0.020255431532859802, 0.020645011216402054, 0.021034590899944305, 0.021424170583486557, 0.02181375026702881, 0.02220332995057106, 0.022592909634113312, 0.022982489317655563, 0.023372069001197815, 0.023761648684740067]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 0.0, 3.0, 5.0, 4.0, 4.0, 6.0, 9.0, 10.0, 4.0, 8.0, 9.0, 9.0, 16.0, 17.0, 24.0, 19.0, 17.0, 30.0, 25.0, 30.0, 25.0, 30.0, 45.0, 45.0, 42.0, 40.0, 42.0, 40.0, 41.0, 38.0, 37.0, 32.0, 43.0, 31.0, 35.0, 28.0, 24.0, 18.0, 13.0, 22.0, 10.0, 13.0, 9.0, 9.0, 12.0, 11.0, 6.0, 5.0, 2.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012637972831726074, -0.001223200000822544, -0.0011826027184724808, -0.0011420054361224174, -0.0011014081537723541, -0.0010608108714222908, -0.0010202135890722275, -0.0009796163067221642, -0.0009390190243721008, -0.0008984217420220375, -0.0008578244596719742, -0.0008172271773219109, -0.0007766298949718475, -0.0007360326126217842, -0.0006954353302717209, -0.0006548380479216576, -0.0006142407655715942, -0.0005736434832215309, -0.0005330462008714676, -0.0004924489185214043, -0.00045185163617134094, -0.0004112543538212776, -0.0003706570714712143, -0.00033005978912115097, -0.00028946250677108765, -0.0002488652244210243, -0.000208267942070961, -0.00016767065972089767, -0.00012707337737083435, -8.647609502077103e-05, -4.58788126707077e-05, -5.281530320644379e-06, 3.5315752029418945e-05, 7.591303437948227e-05, 0.0001165103167295456, 0.00015710759907960892, 0.00019770488142967224, 0.00023830216377973557, 0.0002788994461297989, 0.0003194967284798622, 0.00036009401082992554, 0.00040069129317998886, 0.0004412885755300522, 0.0004818858578801155, 0.0005224831402301788, 0.0005630804225802422, 0.0006036777049303055, 0.0006442749872803688, 0.0006848722696304321, 0.0007254695519804955, 0.0007660668343305588, 0.0008066641166806221, 0.0008472613990306854, 0.0008878586813807487, 0.0009284559637308121, 0.0009690532460808754, 0.0010096505284309387, 0.001050247810781002, 0.0010908450931310654, 0.0011314423754811287, 0.001172039657831192, 0.0012126369401812553, 0.0012532342225313187, 0.001293831504881382, 0.0013344287872314453]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 10.0, 6.0, 15.0, 10.0, 15.0, 9.0, 15.0, 20.0, 17.0, 24.0, 27.0, 19.0, 21.0, 30.0, 31.0, 35.0, 31.0, 33.0, 47.0, 40.0, 38.0, 35.0, 42.0, 41.0, 47.0, 33.0, 37.0, 40.0, 38.0, 23.0, 23.0, 29.0, 13.0, 13.0, 18.0, 13.0, 14.0, 9.0, 10.0, 6.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.921875, -9.634521484375, -9.34716796875, -9.059814453125, -8.7724609375, -8.485107421875, -8.19775390625, -7.910400390625, -7.623046875, -7.335693359375, -7.04833984375, -6.760986328125, -6.4736328125, -6.186279296875, -5.89892578125, -5.611572265625, -5.32421875, -5.036865234375, -4.74951171875, -4.462158203125, -4.1748046875, -3.887451171875, -3.60009765625, -3.312744140625, -3.025390625, -2.738037109375, -2.45068359375, -2.163330078125, -1.8759765625, -1.588623046875, -1.30126953125, -1.013916015625, -0.7265625, -0.439208984375, -0.15185546875, 0.135498046875, 0.4228515625, 0.710205078125, 0.99755859375, 1.284912109375, 1.572265625, 1.859619140625, 2.14697265625, 2.434326171875, 2.7216796875, 3.009033203125, 3.29638671875, 3.583740234375, 3.87109375, 4.158447265625, 4.44580078125, 4.733154296875, 5.0205078125, 5.307861328125, 5.59521484375, 5.882568359375, 6.169921875, 6.457275390625, 6.74462890625, 7.031982421875, 7.3193359375, 7.606689453125, 7.89404296875, 8.181396484375, 8.46875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 11.0, 8.0, 13.0, 30.0, 28.0, 31.0, 29.0, 48.0, 52.0, 72.0, 89.0, 142.0, 193.0, 249.0, 304.0, 434.0, 636.0, 1263.0, 3553.0, 14187.0, 80078.0, 832710.0, 91245.0, 15553.0, 3854.0, 1238.0, 667.0, 441.0, 350.0, 262.0, 178.0, 162.0, 104.0, 74.0, 52.0, 49.0, 38.0, 23.0, 27.0, 18.0, 10.0, 14.0, 10.0, 4.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-25.078125, -24.351806640625, -23.62548828125, -22.899169921875, -22.1728515625, -21.446533203125, -20.72021484375, -19.993896484375, -19.267578125, -18.541259765625, -17.81494140625, -17.088623046875, -16.3623046875, -15.635986328125, -14.90966796875, -14.183349609375, -13.45703125, -12.730712890625, -12.00439453125, -11.278076171875, -10.5517578125, -9.825439453125, -9.09912109375, -8.372802734375, -7.646484375, -6.920166015625, -6.19384765625, -5.467529296875, -4.7412109375, -4.014892578125, -3.28857421875, -2.562255859375, -1.8359375, -1.109619140625, -0.38330078125, 0.343017578125, 1.0693359375, 1.795654296875, 2.52197265625, 3.248291015625, 3.974609375, 4.700927734375, 5.42724609375, 6.153564453125, 6.8798828125, 7.606201171875, 8.33251953125, 9.058837890625, 9.78515625, 10.511474609375, 11.23779296875, 11.964111328125, 12.6904296875, 13.416748046875, 14.14306640625, 14.869384765625, 15.595703125, 16.322021484375, 17.04833984375, 17.774658203125, 18.5009765625, 19.227294921875, 19.95361328125, 20.679931640625, 21.40625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 7.0, 5.0, 8.0, 6.0, 11.0, 10.0, 20.0, 17.0, 20.0, 21.0, 22.0, 34.0, 41.0, 26.0, 41.0, 50.0, 54.0, 61.0, 180.0, 1741.0, 192.0, 71.0, 57.0, 50.0, 39.0, 37.0, 35.0, 32.0, 26.0, 22.0, 22.0, 10.0, 14.0, 20.0, 10.0, 9.0, 8.0, 5.0, 1.0, 5.0, 1.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.875, -28.984375, -28.09375, -27.203125, -26.3125, -25.421875, -24.53125, -23.640625, -22.75, -21.859375, -20.96875, -20.078125, -19.1875, -18.296875, -17.40625, -16.515625, -15.625, -14.734375, -13.84375, -12.953125, -12.0625, -11.171875, -10.28125, -9.390625, -8.5, -7.609375, -6.71875, -5.828125, -4.9375, -4.046875, -3.15625, -2.265625, -1.375, -0.484375, 0.40625, 1.296875, 2.1875, 3.078125, 3.96875, 4.859375, 5.75, 6.640625, 7.53125, 8.421875, 9.3125, 10.203125, 11.09375, 11.984375, 12.875, 13.765625, 14.65625, 15.546875, 16.4375, 17.328125, 18.21875, 19.109375, 20.0, 20.890625, 21.78125, 22.671875, 23.5625, 24.453125, 25.34375, 26.234375, 27.125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 2.0, 9.0, 13.0, 14.0, 20.0, 16.0, 19.0, 20.0, 32.0, 43.0, 41.0, 46.0, 89.0, 102.0, 192.0, 356.0, 1327.0, 31649.0, 3090045.0, 19573.0, 1078.0, 345.0, 185.0, 116.0, 66.0, 57.0, 36.0, 32.0, 33.0, 30.0, 16.0, 25.0, 12.0, 10.0, 13.0, 4.0, 5.0, 10.0, 5.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.1875, -72.7177734375, -70.248046875, -67.7783203125, -65.30859375, -62.8388671875, -60.369140625, -57.8994140625, -55.4296875, -52.9599609375, -50.490234375, -48.0205078125, -45.55078125, -43.0810546875, -40.611328125, -38.1416015625, -35.671875, -33.2021484375, -30.732421875, -28.2626953125, -25.79296875, -23.3232421875, -20.853515625, -18.3837890625, -15.9140625, -13.4443359375, -10.974609375, -8.5048828125, -6.03515625, -3.5654296875, -1.095703125, 1.3740234375, 3.84375, 6.3134765625, 8.783203125, 11.2529296875, 13.72265625, 16.1923828125, 18.662109375, 21.1318359375, 23.6015625, 26.0712890625, 28.541015625, 31.0107421875, 33.48046875, 35.9501953125, 38.419921875, 40.8896484375, 43.359375, 45.8291015625, 48.298828125, 50.7685546875, 53.23828125, 55.7080078125, 58.177734375, 60.6474609375, 63.1171875, 65.5869140625, 68.056640625, 70.5263671875, 72.99609375, 75.4658203125, 77.935546875, 80.4052734375, 82.875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 19.0, 121.0, 321.0, 377.0, 129.0, 32.0, 9.0, 4.0, 1.0, 1.0], "bins": [-157.57447814941406, -154.81683349609375, -152.05917358398438, -149.30152893066406, -146.54388427734375, -143.78622436523438, -141.02857971191406, -138.27093505859375, -135.51327514648438, -132.75563049316406, -129.9979705810547, -127.24032592773438, -124.48267364501953, -121.72502136230469, -118.96737670898438, -116.20972442626953, -113.45207977294922, -110.69442749023438, -107.93678283691406, -105.17913055419922, -102.42147827148438, -99.66383361816406, -96.90618133544922, -94.14852905273438, -91.39088439941406, -88.63323211669922, -85.8755874633789, -83.11793518066406, -80.36028289794922, -77.60263061523438, -74.84498596191406, -72.08733367919922, -69.3296890258789, -66.57203674316406, -63.814388275146484, -61.056739807128906, -58.29908752441406, -55.541439056396484, -52.783790588378906, -50.02613830566406, -47.268489837646484, -44.510841369628906, -41.75318908691406, -38.995540618896484, -36.237892150878906, -33.48023986816406, -30.722591400146484, -27.964941024780273, -25.207290649414062, -22.44964027404785, -19.69198989868164, -16.934341430664062, -14.176691055297852, -11.41904067993164, -8.661392211914062, -5.903741836547852, -3.1460914611816406, -0.3884415626525879, 2.369208335876465, 5.126857757568359, 7.88450813293457, 10.642158508300781, 13.39980697631836, 16.15745735168457, 18.91510772705078]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 6.0, 10.0, 5.0, 17.0, 20.0, 15.0, 14.0, 31.0, 34.0, 29.0, 36.0, 36.0, 46.0, 55.0, 36.0, 42.0, 48.0, 47.0, 58.0, 46.0, 34.0, 47.0, 33.0, 32.0, 34.0, 32.0, 24.0, 22.0, 28.0, 19.0, 14.0, 12.0, 12.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-83.14183807373047, -80.67510986328125, -78.2083740234375, -75.74164581298828, -73.27491760253906, -70.80818176269531, -68.3414535522461, -65.87472534179688, -63.407989501953125, -60.94125747680664, -58.47452926635742, -56.00779724121094, -53.54106521606445, -51.07433319091797, -48.60760498046875, -46.140872955322266, -43.67414474487305, -41.20741271972656, -38.740684509277344, -36.27395248413086, -33.807220458984375, -31.340490341186523, -28.873760223388672, -26.407028198242188, -23.940298080444336, -21.473567962646484, -19.0068359375, -16.54010581970215, -14.07337474822998, -11.606643676757812, -9.139913558959961, -6.673181533813477, -4.206451416015625, -1.7397205829620361, 0.7270102500915527, 3.1937408447265625, 5.6604719161987305, 8.127202987670898, 10.59393310546875, 13.060665130615234, 15.527395248413086, 17.994125366210938, 20.460857391357422, 22.927587509155273, 25.394317626953125, 27.86104965209961, 30.32777976989746, 32.79450988769531, 35.2612419128418, 37.72797393798828, 40.1947021484375, 42.661434173583984, 45.12816619873047, 47.59489440917969, 50.06162643432617, 52.528358459472656, 54.995086669921875, 57.46181869506836, 59.92854690551758, 62.39527893066406, 64.86200714111328, 67.32874298095703, 69.79547119140625, 72.26220703125, 74.72893524169922]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 9.0, 8.0, 14.0, 19.0, 14.0, 16.0, 17.0, 18.0, 23.0, 32.0, 25.0, 29.0, 27.0, 34.0, 29.0, 24.0, 51.0, 49.0, 47.0, 53.0, 60.0, 50.0, 41.0, 44.0, 37.0, 26.0, 29.0, 32.0, 20.0, 20.0, 15.0, 10.0, 20.0, 10.0, 10.0, 5.0, 10.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.015625, -10.695068359375, -10.37451171875, -10.053955078125, -9.7333984375, -9.412841796875, -9.09228515625, -8.771728515625, -8.451171875, -8.130615234375, -7.81005859375, -7.489501953125, -7.1689453125, -6.848388671875, -6.52783203125, -6.207275390625, -5.88671875, -5.566162109375, -5.24560546875, -4.925048828125, -4.6044921875, -4.283935546875, -3.96337890625, -3.642822265625, -3.322265625, -3.001708984375, -2.68115234375, -2.360595703125, -2.0400390625, -1.719482421875, -1.39892578125, -1.078369140625, -0.7578125, -0.437255859375, -0.11669921875, 0.203857421875, 0.5244140625, 0.844970703125, 1.16552734375, 1.486083984375, 1.806640625, 2.127197265625, 2.44775390625, 2.768310546875, 3.0888671875, 3.409423828125, 3.72998046875, 4.050537109375, 4.37109375, 4.691650390625, 5.01220703125, 5.332763671875, 5.6533203125, 5.973876953125, 6.29443359375, 6.614990234375, 6.935546875, 7.256103515625, 7.57666015625, 7.897216796875, 8.2177734375, 8.538330078125, 8.85888671875, 9.179443359375, 9.5]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 5.0, 11.0, 12.0, 7.0, 17.0, 22.0, 19.0, 40.0, 48.0, 75.0, 94.0, 130.0, 176.0, 301.0, 493.0, 1083.0, 2876.0, 9142.0, 44582.0, 702334.0, 2995714.0, 393973.0, 31358.0, 7145.0, 2367.0, 918.0, 470.0, 280.0, 164.0, 114.0, 87.0, 49.0, 51.0, 32.0, 19.0, 19.0, 11.0, 15.0, 8.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-27.296875, -26.50341796875, -25.7099609375, -24.91650390625, -24.123046875, -23.32958984375, -22.5361328125, -21.74267578125, -20.94921875, -20.15576171875, -19.3623046875, -18.56884765625, -17.775390625, -16.98193359375, -16.1884765625, -15.39501953125, -14.6015625, -13.80810546875, -13.0146484375, -12.22119140625, -11.427734375, -10.63427734375, -9.8408203125, -9.04736328125, -8.25390625, -7.46044921875, -6.6669921875, -5.87353515625, -5.080078125, -4.28662109375, -3.4931640625, -2.69970703125, -1.90625, -1.11279296875, -0.3193359375, 0.47412109375, 1.267578125, 2.06103515625, 2.8544921875, 3.64794921875, 4.44140625, 5.23486328125, 6.0283203125, 6.82177734375, 7.615234375, 8.40869140625, 9.2021484375, 9.99560546875, 10.7890625, 11.58251953125, 12.3759765625, 13.16943359375, 13.962890625, 14.75634765625, 15.5498046875, 16.34326171875, 17.13671875, 17.93017578125, 18.7236328125, 19.51708984375, 20.310546875, 21.10400390625, 21.8974609375, 22.69091796875, 23.484375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 16.0, 17.0, 34.0, 64.0, 105.0, 204.0, 316.0, 551.0, 787.0, 767.0, 530.0, 259.0, 170.0, 92.0, 62.0, 33.0, 30.0, 19.0, 9.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.015625, -23.154052734375, -22.29248046875, -21.430908203125, -20.5693359375, -19.707763671875, -18.84619140625, -17.984619140625, -17.123046875, -16.261474609375, -15.39990234375, -14.538330078125, -13.6767578125, -12.815185546875, -11.95361328125, -11.092041015625, -10.23046875, -9.368896484375, -8.50732421875, -7.645751953125, -6.7841796875, -5.922607421875, -5.06103515625, -4.199462890625, -3.337890625, -2.476318359375, -1.61474609375, -0.753173828125, 0.1083984375, 0.969970703125, 1.83154296875, 2.693115234375, 3.5546875, 4.416259765625, 5.27783203125, 6.139404296875, 7.0009765625, 7.862548828125, 8.72412109375, 9.585693359375, 10.447265625, 11.308837890625, 12.17041015625, 13.031982421875, 13.8935546875, 14.755126953125, 15.61669921875, 16.478271484375, 17.33984375, 18.201416015625, 19.06298828125, 19.924560546875, 20.7861328125, 21.647705078125, 22.50927734375, 23.370849609375, 24.232421875, 25.093994140625, 25.95556640625, 26.817138671875, 27.6787109375, 28.540283203125, 29.40185546875, 30.263427734375, 31.125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 7.0, 14.0, 19.0, 19.0, 22.0, 38.0, 38.0, 79.0, 101.0, 133.0, 203.0, 339.0, 734.0, 2516.0, 28444.0, 3683215.0, 467066.0, 8506.0, 1403.0, 553.0, 282.0, 162.0, 114.0, 84.0, 45.0, 39.0, 31.0, 19.0, 20.0, 10.0, 7.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-73.75, -71.630859375, -69.51171875, -67.392578125, -65.2734375, -63.154296875, -61.03515625, -58.916015625, -56.796875, -54.677734375, -52.55859375, -50.439453125, -48.3203125, -46.201171875, -44.08203125, -41.962890625, -39.84375, -37.724609375, -35.60546875, -33.486328125, -31.3671875, -29.248046875, -27.12890625, -25.009765625, -22.890625, -20.771484375, -18.65234375, -16.533203125, -14.4140625, -12.294921875, -10.17578125, -8.056640625, -5.9375, -3.818359375, -1.69921875, 0.419921875, 2.5390625, 4.658203125, 6.77734375, 8.896484375, 11.015625, 13.134765625, 15.25390625, 17.373046875, 19.4921875, 21.611328125, 23.73046875, 25.849609375, 27.96875, 30.087890625, 32.20703125, 34.326171875, 36.4453125, 38.564453125, 40.68359375, 42.802734375, 44.921875, 47.041015625, 49.16015625, 51.279296875, 53.3984375, 55.517578125, 57.63671875, 59.755859375, 61.875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 10.0, 347.0, 639.0, 20.0, 0.0, 0.0, 1.0], "bins": [-955.713134765625, -939.5426025390625, -923.3720703125, -907.2015380859375, -891.031005859375, -874.8604736328125, -858.68994140625, -842.5194091796875, -826.348876953125, -810.1783447265625, -794.0078125, -777.8372802734375, -761.666748046875, -745.4962158203125, -729.32568359375, -713.1551513671875, -696.984619140625, -680.8140869140625, -664.6435546875, -648.4730224609375, -632.302490234375, -616.1319580078125, -599.96142578125, -583.7908935546875, -567.6203002929688, -551.4497680664062, -535.2792358398438, -519.1087036132812, -502.93817138671875, -486.76763916015625, -470.59710693359375, -454.42657470703125, -438.2560119628906, -422.0854797363281, -405.9149475097656, -389.7444152832031, -373.5738830566406, -357.4033508300781, -341.2327880859375, -325.062255859375, -308.8917236328125, -292.72119140625, -276.5506591796875, -260.380126953125, -244.2095947265625, -228.0390625, -211.86851501464844, -195.69798278808594, -179.5274658203125, -163.35693359375, -147.1864013671875, -131.015869140625, -114.84532928466797, -98.67479705810547, -82.50425720214844, -66.33372497558594, -50.163185119628906, -33.992652893066406, -17.82211685180664, -1.651580810546875, 14.518951416015625, 30.689483642578125, 46.860023498535156, 63.030555725097656, 79.20108795166016]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 8.0, 16.0, 17.0, 7.0, 13.0, 17.0, 29.0, 22.0, 21.0, 25.0, 31.0, 29.0, 30.0, 41.0, 45.0, 43.0, 40.0, 45.0, 34.0, 42.0, 41.0, 41.0, 34.0, 45.0, 31.0, 32.0, 19.0, 31.0, 19.0, 19.0, 21.0, 18.0, 16.0, 15.0, 12.0, 8.0, 6.0, 6.0, 4.0, 5.0, 5.0, 9.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.43505859375, -46.72454071044922, -45.0140266418457, -43.30350875854492, -41.59299087524414, -39.882476806640625, -38.171958923339844, -36.46144104003906, -34.75092315673828, -33.0404052734375, -31.32988929748535, -29.619373321533203, -27.908855438232422, -26.198339462280273, -24.487823486328125, -22.777305603027344, -21.066791534423828, -19.35627555847168, -17.6457576751709, -15.93524169921875, -14.224724769592285, -12.51420783996582, -10.803691864013672, -9.093174934387207, -7.382658004760742, -5.672141075134277, -3.9616246223449707, -2.251108169555664, -0.5405912399291992, 1.1699256896972656, 2.880441665649414, 4.590958595275879, 6.301475524902344, 8.011992454528809, 9.722509384155273, 11.433025360107422, 13.143542289733887, 14.854059219360352, 16.5645751953125, 18.27509307861328, 19.98560905456543, 21.696125030517578, 23.40664291381836, 25.117158889770508, 26.827674865722656, 28.538192749023438, 30.248708724975586, 31.959224700927734, 33.669742584228516, 35.3802604675293, 37.09077453613281, 38.801292419433594, 40.511810302734375, 42.222328186035156, 43.93284225463867, 45.64336013793945, 47.35387420654297, 49.06439208984375, 50.774906158447266, 52.48542404174805, 54.19594192504883, 55.906455993652344, 57.616973876953125, 59.327491760253906, 61.03800964355469]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 4.0, 7.0, 9.0, 17.0, 13.0, 16.0, 22.0, 17.0, 25.0, 38.0, 29.0, 36.0, 37.0, 38.0, 43.0, 58.0, 47.0, 44.0, 47.0, 55.0, 51.0, 50.0, 38.0, 38.0, 33.0, 27.0, 26.0, 24.0, 19.0, 27.0, 16.0, 12.0, 9.0, 5.0, 9.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.171875, -12.781982421875, -12.39208984375, -12.002197265625, -11.6123046875, -11.222412109375, -10.83251953125, -10.442626953125, -10.052734375, -9.662841796875, -9.27294921875, -8.883056640625, -8.4931640625, -8.103271484375, -7.71337890625, -7.323486328125, -6.93359375, -6.543701171875, -6.15380859375, -5.763916015625, -5.3740234375, -4.984130859375, -4.59423828125, -4.204345703125, -3.814453125, -3.424560546875, -3.03466796875, -2.644775390625, -2.2548828125, -1.864990234375, -1.47509765625, -1.085205078125, -0.6953125, -0.305419921875, 0.08447265625, 0.474365234375, 0.8642578125, 1.254150390625, 1.64404296875, 2.033935546875, 2.423828125, 2.813720703125, 3.20361328125, 3.593505859375, 3.9833984375, 4.373291015625, 4.76318359375, 5.153076171875, 5.54296875, 5.932861328125, 6.32275390625, 6.712646484375, 7.1025390625, 7.492431640625, 7.88232421875, 8.272216796875, 8.662109375, 9.052001953125, 9.44189453125, 9.831787109375, 10.2216796875, 10.611572265625, 11.00146484375, 11.391357421875, 11.78125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 12.0, 16.0, 16.0, 18.0, 34.0, 49.0, 74.0, 114.0, 161.0, 250.0, 294.0, 474.0, 667.0, 883.0, 1306.0, 1933.0, 2638.0, 4054.0, 6149.0, 9040.0, 13995.0, 20733.0, 32112.0, 49117.0, 76438.0, 122291.0, 194058.0, 185837.0, 115655.0, 72732.0, 46896.0, 30442.0, 19860.0, 13222.0, 8711.0, 5776.0, 3817.0, 2733.0, 1792.0, 1255.0, 894.0, 608.0, 397.0, 296.0, 237.0, 138.0, 112.0, 69.0, 50.0, 41.0, 37.0, 20.0, 10.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.501953125, -1.45635986328125, -1.4107666015625, -1.36517333984375, -1.319580078125, -1.27398681640625, -1.2283935546875, -1.18280029296875, -1.13720703125, -1.09161376953125, -1.0460205078125, -1.00042724609375, -0.954833984375, -0.90924072265625, -0.8636474609375, -0.81805419921875, -0.7724609375, -0.72686767578125, -0.6812744140625, -0.63568115234375, -0.590087890625, -0.54449462890625, -0.4989013671875, -0.45330810546875, -0.40771484375, -0.36212158203125, -0.3165283203125, -0.27093505859375, -0.225341796875, -0.17974853515625, -0.1341552734375, -0.08856201171875, -0.04296875, 0.00262451171875, 0.0482177734375, 0.09381103515625, 0.139404296875, 0.18499755859375, 0.2305908203125, 0.27618408203125, 0.32177734375, 0.36737060546875, 0.4129638671875, 0.45855712890625, 0.504150390625, 0.54974365234375, 0.5953369140625, 0.64093017578125, 0.6865234375, 0.73211669921875, 0.7777099609375, 0.82330322265625, 0.868896484375, 0.91448974609375, 0.9600830078125, 1.00567626953125, 1.05126953125, 1.09686279296875, 1.1424560546875, 1.18804931640625, 1.233642578125, 1.27923583984375, 1.3248291015625, 1.37042236328125, 1.416015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 8.0, 5.0, 10.0, 10.0, 11.0, 19.0, 13.0, 18.0, 21.0, 21.0, 26.0, 30.0, 30.0, 31.0, 35.0, 42.0, 36.0, 40.0, 33.0, 1065.0, 38.0, 40.0, 39.0, 41.0, 36.0, 50.0, 28.0, 37.0, 27.0, 24.0, 27.0, 10.0, 17.0, 15.0, 14.0, 10.0, 10.0, 14.0, 16.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.9140625, -5.71533203125, -5.5166015625, -5.31787109375, -5.119140625, -4.92041015625, -4.7216796875, -4.52294921875, -4.32421875, -4.12548828125, -3.9267578125, -3.72802734375, -3.529296875, -3.33056640625, -3.1318359375, -2.93310546875, -2.734375, -2.53564453125, -2.3369140625, -2.13818359375, -1.939453125, -1.74072265625, -1.5419921875, -1.34326171875, -1.14453125, -0.94580078125, -0.7470703125, -0.54833984375, -0.349609375, -0.15087890625, 0.0478515625, 0.24658203125, 0.4453125, 0.64404296875, 0.8427734375, 1.04150390625, 1.240234375, 1.43896484375, 1.6376953125, 1.83642578125, 2.03515625, 2.23388671875, 2.4326171875, 2.63134765625, 2.830078125, 3.02880859375, 3.2275390625, 3.42626953125, 3.625, 3.82373046875, 4.0224609375, 4.22119140625, 4.419921875, 4.61865234375, 4.8173828125, 5.01611328125, 5.21484375, 5.41357421875, 5.6123046875, 5.81103515625, 6.009765625, 6.20849609375, 6.4072265625, 6.60595703125, 6.8046875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 6.0, 3.0, 7.0, 8.0, 15.0, 23.0, 26.0, 51.0, 69.0, 99.0, 160.0, 233.0, 336.0, 477.0, 648.0, 1033.0, 1635.0, 2292.0, 3556.0, 5312.0, 8088.0, 12724.0, 19916.0, 31327.0, 49623.0, 79181.0, 123660.0, 1154455.0, 266695.0, 122198.0, 77339.0, 48870.0, 30911.0, 19822.0, 12677.0, 7944.0, 5230.0, 3567.0, 2269.0, 1517.0, 1024.0, 688.0, 446.0, 324.0, 203.0, 152.0, 86.0, 75.0, 52.0, 32.0, 25.0, 10.0, 14.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3095703125, -1.267303466796875, -1.22503662109375, -1.182769775390625, -1.1405029296875, -1.098236083984375, -1.05596923828125, -1.013702392578125, -0.971435546875, -0.929168701171875, -0.88690185546875, -0.844635009765625, -0.8023681640625, -0.760101318359375, -0.71783447265625, -0.675567626953125, -0.63330078125, -0.591033935546875, -0.54876708984375, -0.506500244140625, -0.4642333984375, -0.421966552734375, -0.37969970703125, -0.337432861328125, -0.295166015625, -0.252899169921875, -0.21063232421875, -0.168365478515625, -0.1260986328125, -0.083831787109375, -0.04156494140625, 0.000701904296875, 0.04296875, 0.085235595703125, 0.12750244140625, 0.169769287109375, 0.2120361328125, 0.254302978515625, 0.29656982421875, 0.338836669921875, 0.381103515625, 0.423370361328125, 0.46563720703125, 0.507904052734375, 0.5501708984375, 0.592437744140625, 0.63470458984375, 0.676971435546875, 0.71923828125, 0.761505126953125, 0.80377197265625, 0.846038818359375, 0.8883056640625, 0.930572509765625, 0.97283935546875, 1.015106201171875, 1.057373046875, 1.099639892578125, 1.14190673828125, 1.184173583984375, 1.2264404296875, 1.268707275390625, 1.31097412109375, 1.353240966796875, 1.3955078125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 5.0, 6.0, 9.0, 9.0, 10.0, 30.0, 25.0, 27.0, 35.0, 27.0, 42.0, 38.0, 60.0, 63.0, 66.0, 72.0, 70.0, 57.0, 58.0, 53.0, 35.0, 33.0, 28.0, 29.0, 18.0, 24.0, 12.0, 14.0, 8.0, 9.0, 6.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00247955322265625, -0.0024029910564422607, -0.0023264288902282715, -0.0022498667240142822, -0.002173304557800293, -0.0020967423915863037, -0.0020201802253723145, -0.0019436180591583252, -0.001867055892944336, -0.0017904937267303467, -0.0017139315605163574, -0.0016373693943023682, -0.001560807228088379, -0.0014842450618743896, -0.0014076828956604004, -0.0013311207294464111, -0.0012545585632324219, -0.0011779963970184326, -0.0011014342308044434, -0.001024872064590454, -0.0009483098983764648, -0.0008717477321624756, -0.0007951855659484863, -0.0007186233997344971, -0.0006420612335205078, -0.0005654990673065186, -0.0004889369010925293, -0.00041237473487854004, -0.0003358125686645508, -0.0002592504024505615, -0.00018268823623657227, -0.00010612607002258301, -2.956390380859375e-05, 4.699826240539551e-05, 0.00012356042861938477, 0.00020012259483337402, 0.0002766847610473633, 0.00035324692726135254, 0.0004298090934753418, 0.0005063712596893311, 0.0005829334259033203, 0.0006594955921173096, 0.0007360577583312988, 0.0008126199245452881, 0.0008891820907592773, 0.0009657442569732666, 0.0010423064231872559, 0.0011188685894012451, 0.0011954307556152344, 0.0012719929218292236, 0.0013485550880432129, 0.0014251172542572021, 0.0015016794204711914, 0.0015782415866851807, 0.00165480375289917, 0.0017313659191131592, 0.0018079280853271484, 0.0018844902515411377, 0.001961052417755127, 0.002037614583969116, 0.0021141767501831055, 0.0021907389163970947, 0.002267301082611084, 0.0023438632488250732, 0.0024204254150390625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 8.0, 8.0, 10.0, 14.0, 14.0, 22.0, 21.0, 28.0, 42.0, 54.0, 71.0, 102.0, 158.0, 253.0, 531.0, 1812.0, 982875.0, 60642.0, 856.0, 380.0, 181.0, 128.0, 77.0, 63.0, 54.0, 32.0, 25.0, 27.0, 10.0, 10.0, 11.0, 10.0, 5.0, 7.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.060272216796875, -0.05853986740112305, -0.056807518005371094, -0.05507516860961914, -0.05334281921386719, -0.051610469818115234, -0.04987812042236328, -0.04814577102661133, -0.046413421630859375, -0.04468107223510742, -0.04294872283935547, -0.041216373443603516, -0.03948402404785156, -0.03775167465209961, -0.036019325256347656, -0.0342869758605957, -0.03255462646484375, -0.030822277069091797, -0.029089927673339844, -0.02735757827758789, -0.025625228881835938, -0.023892879486083984, -0.02216053009033203, -0.020428180694580078, -0.018695831298828125, -0.016963481903076172, -0.015231132507324219, -0.013498783111572266, -0.011766433715820312, -0.01003408432006836, -0.008301734924316406, -0.006569385528564453, -0.0048370361328125, -0.003104686737060547, -0.0013723373413085938, 0.0003600120544433594, 0.0020923614501953125, 0.0038247108459472656, 0.005557060241699219, 0.007289409637451172, 0.009021759033203125, 0.010754108428955078, 0.012486457824707031, 0.014218807220458984, 0.015951156616210938, 0.01768350601196289, 0.019415855407714844, 0.021148204803466797, 0.02288055419921875, 0.024612903594970703, 0.026345252990722656, 0.02807760238647461, 0.029809951782226562, 0.031542301177978516, 0.03327465057373047, 0.03500699996948242, 0.036739349365234375, 0.03847169876098633, 0.04020404815673828, 0.041936397552490234, 0.04366874694824219, 0.04540109634399414, 0.047133445739746094, 0.04886579513549805, 0.05059814453125]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 38.0, 244.0, 482.0, 209.0, 38.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028597526252269745, -0.002674409653991461, -0.002489066682755947, -0.0023037237115204334, -0.0021183807402849197, -0.0019330378854647279, -0.001747695030644536, -0.0015623520594090223, -0.0013770090881735086, -0.001191666116937995, -0.0010063231457024813, -0.0008209802908822894, -0.0006356373196467757, -0.00045029434841126204, -0.0002649514935910702, -7.960852235555649e-05, 0.0001057344488799572, 0.00029107739101164043, 0.00047642033314332366, 0.0006617632461711764, 0.0008471062174066901, 0.0010324491886422038, 0.0012177920434623957, 0.0014031350146979094, 0.001588477985933423, 0.0017738209571689367, 0.0019591639284044504, 0.0021445066668093204, 0.002329849638044834, 0.002515192609280348, 0.0027005355805158615, 0.002885878551751375, 0.003071221522986889, 0.0032565644942224026, 0.0034419074654579163, 0.00362725043669343, 0.0038125934079289436, 0.003997936379164457, 0.004183279350399971, 0.004368621855974197, 0.004553965292870998, 0.004739308264106512, 0.004924651235342026, 0.0051099942065775394, 0.005295337177813053, 0.005480680149048567, 0.0056660231202840805, 0.005851365625858307, 0.006036708597093821, 0.006222051568329334, 0.006407394539564848, 0.006592737510800362, 0.006778080482035875, 0.006963423453271389, 0.007148765958845615, 0.007334109395742416, 0.007519451901316643, 0.0077047948725521564, 0.00789013784378767, 0.008075480349361897, 0.008260823786258698, 0.008446166291832924, 0.008631509728729725, 0.008816852234303951, 0.009002195671200752]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 3.0, 7.0, 6.0, 8.0, 8.0, 13.0, 13.0, 7.0, 16.0, 17.0, 24.0, 24.0, 30.0, 32.0, 22.0, 35.0, 42.0, 33.0, 28.0, 34.0, 48.0, 38.0, 48.0, 41.0, 33.0, 39.0, 37.0, 37.0, 32.0, 32.0, 25.0, 24.0, 20.0, 22.0, 24.0, 11.0, 15.0, 16.0, 15.0, 8.0, 4.0, 5.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.0012595653533935547, -0.0012222090736031532, -0.0011848527938127518, -0.0011474965140223503, -0.0011101402342319489, -0.0010727839544415474, -0.001035427674651146, -0.0009980713948607445, -0.000960715115070343, -0.0009233588352799416, -0.0008860025554895401, -0.0008486462756991386, -0.0008112899959087372, -0.0007739337161183357, -0.0007365774363279343, -0.0006992211565375328, -0.0006618648767471313, -0.0006245085969567299, -0.0005871523171663284, -0.000549796037375927, -0.0005124397575855255, -0.00047508347779512405, -0.0004377271980047226, -0.00040037091821432114, -0.0003630146384239197, -0.0003256583586335182, -0.00028830207884311676, -0.0002509457990527153, -0.00021358951926231384, -0.00017623323947191238, -0.00013887695968151093, -0.00010152067989110947, -6.416440010070801e-05, -2.680812031030655e-05, 1.054815948009491e-05, 4.790443927049637e-05, 8.526071906089783e-05, 0.00012261699885129929, 0.00015997327864170074, 0.0001973295584321022, 0.00023468583822250366, 0.0002720421180129051, 0.0003093983978033066, 0.00034675467759370804, 0.0003841109573841095, 0.00042146723717451096, 0.0004588235169649124, 0.0004961797967553139, 0.0005335360765457153, 0.0005708923563361168, 0.0006082486361265182, 0.0006456049159169197, 0.0006829611957073212, 0.0007203174754977226, 0.0007576737552881241, 0.0007950300350785255, 0.000832386314868927, 0.0008697425946593285, 0.0009070988744497299, 0.0009444551542401314, 0.0009818114340305328, 0.0010191677138209343, 0.0010565239936113358, 0.0010938802734017372, 0.0011312365531921387]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 2.0, 4.0, 7.0, 9.0, 17.0, 13.0, 16.0, 22.0, 17.0, 25.0, 38.0, 29.0, 36.0, 37.0, 38.0, 43.0, 58.0, 47.0, 44.0, 47.0, 55.0, 51.0, 50.0, 38.0, 38.0, 33.0, 27.0, 26.0, 24.0, 19.0, 27.0, 16.0, 12.0, 9.0, 5.0, 9.0, 2.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.171875, -12.781982421875, -12.39208984375, -12.002197265625, -11.6123046875, -11.222412109375, -10.83251953125, -10.442626953125, -10.052734375, -9.662841796875, -9.27294921875, -8.883056640625, -8.4931640625, -8.103271484375, -7.71337890625, -7.323486328125, -6.93359375, -6.543701171875, -6.15380859375, -5.763916015625, -5.3740234375, -4.984130859375, -4.59423828125, -4.204345703125, -3.814453125, -3.424560546875, -3.03466796875, -2.644775390625, -2.2548828125, -1.864990234375, -1.47509765625, -1.085205078125, -0.6953125, -0.305419921875, 0.08447265625, 0.474365234375, 0.8642578125, 1.254150390625, 1.64404296875, 2.033935546875, 2.423828125, 2.813720703125, 3.20361328125, 3.593505859375, 3.9833984375, 4.373291015625, 4.76318359375, 5.153076171875, 5.54296875, 5.932861328125, 6.32275390625, 6.712646484375, 7.1025390625, 7.492431640625, 7.88232421875, 8.272216796875, 8.662109375, 9.052001953125, 9.44189453125, 9.831787109375, 10.2216796875, 10.611572265625, 11.00146484375, 11.391357421875, 11.78125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 3.0, 5.0, 10.0, 16.0, 18.0, 23.0, 29.0, 52.0, 61.0, 75.0, 123.0, 154.0, 324.0, 636.0, 1221.0, 3184.0, 8592.0, 25904.0, 86328.0, 400235.0, 395655.0, 85708.0, 25699.0, 8614.0, 3117.0, 1293.0, 583.0, 299.0, 173.0, 128.0, 78.0, 53.0, 41.0, 38.0, 17.0, 23.0, 6.0, 14.0, 6.0, 4.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-17.09375, -16.5909423828125, -16.088134765625, -15.5853271484375, -15.08251953125, -14.5797119140625, -14.076904296875, -13.5740966796875, -13.0712890625, -12.5684814453125, -12.065673828125, -11.5628662109375, -11.06005859375, -10.5572509765625, -10.054443359375, -9.5516357421875, -9.048828125, -8.5460205078125, -8.043212890625, -7.5404052734375, -7.03759765625, -6.5347900390625, -6.031982421875, -5.5291748046875, -5.0263671875, -4.5235595703125, -4.020751953125, -3.5179443359375, -3.01513671875, -2.5123291015625, -2.009521484375, -1.5067138671875, -1.00390625, -0.5010986328125, 0.001708984375, 0.5045166015625, 1.00732421875, 1.5101318359375, 2.012939453125, 2.5157470703125, 3.0185546875, 3.5213623046875, 4.024169921875, 4.5269775390625, 5.02978515625, 5.5325927734375, 6.035400390625, 6.5382080078125, 7.041015625, 7.5438232421875, 8.046630859375, 8.5494384765625, 9.05224609375, 9.5550537109375, 10.057861328125, 10.5606689453125, 11.0634765625, 11.5662841796875, 12.069091796875, 12.5718994140625, 13.07470703125, 13.5775146484375, 14.080322265625, 14.5831298828125, 15.0859375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 10.0, 5.0, 2.0, 9.0, 10.0, 8.0, 8.0, 15.0, 18.0, 17.0, 19.0, 18.0, 22.0, 23.0, 33.0, 28.0, 32.0, 49.0, 47.0, 53.0, 92.0, 178.0, 1580.0, 244.0, 103.0, 69.0, 42.0, 36.0, 28.0, 20.0, 26.0, 24.0, 24.0, 28.0, 16.0, 22.0, 15.0, 18.0, 6.0, 7.0, 10.0, 13.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.59375, -24.7294921875, -23.865234375, -23.0009765625, -22.13671875, -21.2724609375, -20.408203125, -19.5439453125, -18.6796875, -17.8154296875, -16.951171875, -16.0869140625, -15.22265625, -14.3583984375, -13.494140625, -12.6298828125, -11.765625, -10.9013671875, -10.037109375, -9.1728515625, -8.30859375, -7.4443359375, -6.580078125, -5.7158203125, -4.8515625, -3.9873046875, -3.123046875, -2.2587890625, -1.39453125, -0.5302734375, 0.333984375, 1.1982421875, 2.0625, 2.9267578125, 3.791015625, 4.6552734375, 5.51953125, 6.3837890625, 7.248046875, 8.1123046875, 8.9765625, 9.8408203125, 10.705078125, 11.5693359375, 12.43359375, 13.2978515625, 14.162109375, 15.0263671875, 15.890625, 16.7548828125, 17.619140625, 18.4833984375, 19.34765625, 20.2119140625, 21.076171875, 21.9404296875, 22.8046875, 23.6689453125, 24.533203125, 25.3974609375, 26.26171875, 27.1259765625, 27.990234375, 28.8544921875, 29.71875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 9.0, 2.0, 11.0, 18.0, 30.0, 20.0, 36.0, 34.0, 73.0, 64.0, 112.0, 146.0, 198.0, 320.0, 628.0, 2268.0, 26725.0, 2303653.0, 790290.0, 17700.0, 1741.0, 544.0, 283.0, 197.0, 137.0, 107.0, 86.0, 54.0, 43.0, 30.0, 28.0, 19.0, 13.0, 22.0, 10.0, 9.0, 4.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.0, -40.5966796875, -39.193359375, -37.7900390625, -36.38671875, -34.9833984375, -33.580078125, -32.1767578125, -30.7734375, -29.3701171875, -27.966796875, -26.5634765625, -25.16015625, -23.7568359375, -22.353515625, -20.9501953125, -19.546875, -18.1435546875, -16.740234375, -15.3369140625, -13.93359375, -12.5302734375, -11.126953125, -9.7236328125, -8.3203125, -6.9169921875, -5.513671875, -4.1103515625, -2.70703125, -1.3037109375, 0.099609375, 1.5029296875, 2.90625, 4.3095703125, 5.712890625, 7.1162109375, 8.51953125, 9.9228515625, 11.326171875, 12.7294921875, 14.1328125, 15.5361328125, 16.939453125, 18.3427734375, 19.74609375, 21.1494140625, 22.552734375, 23.9560546875, 25.359375, 26.7626953125, 28.166015625, 29.5693359375, 30.97265625, 32.3759765625, 33.779296875, 35.1826171875, 36.5859375, 37.9892578125, 39.392578125, 40.7958984375, 42.19921875, 43.6025390625, 45.005859375, 46.4091796875, 47.8125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 212.0, 785.0, 19.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-571.7947387695312, -561.2528076171875, -550.7108154296875, -540.1688842773438, -529.6268920898438, -519.0849609375, -508.54296875, -498.00103759765625, -487.4590759277344, -476.9171142578125, -466.3751525878906, -455.83319091796875, -445.2912292480469, -434.749267578125, -424.20733642578125, -413.6653747558594, -403.1234130859375, -392.5814514160156, -382.03948974609375, -371.4975280761719, -360.95556640625, -350.41363525390625, -339.87164306640625, -329.3297119140625, -318.7877197265625, -308.2457580566406, -297.70379638671875, -287.1618347167969, -276.619873046875, -266.07794189453125, -255.5359649658203, -244.9940185546875, -234.45208740234375, -223.91012573242188, -213.3681640625, -202.82620239257812, -192.2842559814453, -181.74229431152344, -171.20033264160156, -160.65838623046875, -150.1164093017578, -139.57444763183594, -129.03248596191406, -118.49053192138672, -107.94857788085938, -97.4066162109375, -86.86465454101562, -76.32270050048828, -65.7807388305664, -55.2387809753418, -44.69682312011719, -34.15486145019531, -23.612903594970703, -13.070945739746094, -2.5289840698242188, 8.012969970703125, 18.554931640625, 29.09688949584961, 39.63884735107422, 50.180809020996094, 60.7227668762207, 71.26472473144531, 81.80668640136719, 92.34864044189453, 102.8906021118164]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 8.0, 12.0, 7.0, 18.0, 10.0, 12.0, 14.0, 17.0, 19.0, 18.0, 29.0, 27.0, 21.0, 39.0, 29.0, 52.0, 28.0, 45.0, 49.0, 42.0, 41.0, 34.0, 36.0, 40.0, 43.0, 39.0, 26.0, 27.0, 31.0, 24.0, 31.0, 17.0, 15.0, 14.0, 14.0, 16.0, 12.0, 10.0, 5.0, 4.0, 4.0, 3.0, 2.0, 8.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-67.27494812011719, -65.1795883178711, -63.084232330322266, -60.98887634277344, -58.89352035522461, -56.79816436767578, -54.70280456542969, -52.60744857788086, -50.51209259033203, -48.4167366027832, -46.32137680053711, -44.22602081298828, -42.13066482543945, -40.035308837890625, -37.93994903564453, -35.8445930480957, -33.74923324584961, -31.65387535095215, -29.55851936340332, -27.46316146850586, -25.36780548095703, -23.27244758605957, -21.17708969116211, -19.08173370361328, -16.98637580871582, -14.891018867492676, -12.795661926269531, -10.70030403137207, -8.604947090148926, -6.509590148925781, -4.41423225402832, -2.318875312805176, -0.22351837158203125, 1.8718388080596924, 3.967195987701416, 6.062553405761719, 8.157910346984863, 10.253267288208008, 12.348625183105469, 14.443982124328613, 16.539339065551758, 18.63469696044922, 20.730052947998047, 22.825410842895508, 24.92076873779297, 27.016124725341797, 29.111482620239258, 31.20684051513672, 33.30219650268555, 35.397552490234375, 37.49291229248047, 39.5882682800293, 41.683624267578125, 43.77898406982422, 45.87434005737305, 47.969696044921875, 50.06505584716797, 52.1604118347168, 54.25577163696289, 56.35112762451172, 58.44648361206055, 60.541839599609375, 62.63719940185547, 64.73255920410156, 66.82791137695312]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 4.0, 12.0, 12.0, 11.0, 21.0, 8.0, 34.0, 18.0, 20.0, 30.0, 41.0, 38.0, 35.0, 46.0, 48.0, 39.0, 36.0, 59.0, 50.0, 49.0, 54.0, 47.0, 34.0, 30.0, 34.0, 16.0, 28.0, 28.0, 24.0, 23.0, 9.0, 13.0, 13.0, 5.0, 10.0, 5.0, 4.0, 1.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.3046875, -12.91943359375, -12.5341796875, -12.14892578125, -11.763671875, -11.37841796875, -10.9931640625, -10.60791015625, -10.22265625, -9.83740234375, -9.4521484375, -9.06689453125, -8.681640625, -8.29638671875, -7.9111328125, -7.52587890625, -7.140625, -6.75537109375, -6.3701171875, -5.98486328125, -5.599609375, -5.21435546875, -4.8291015625, -4.44384765625, -4.05859375, -3.67333984375, -3.2880859375, -2.90283203125, -2.517578125, -2.13232421875, -1.7470703125, -1.36181640625, -0.9765625, -0.59130859375, -0.2060546875, 0.17919921875, 0.564453125, 0.94970703125, 1.3349609375, 1.72021484375, 2.10546875, 2.49072265625, 2.8759765625, 3.26123046875, 3.646484375, 4.03173828125, 4.4169921875, 4.80224609375, 5.1875, 5.57275390625, 5.9580078125, 6.34326171875, 6.728515625, 7.11376953125, 7.4990234375, 7.88427734375, 8.26953125, 8.65478515625, 9.0400390625, 9.42529296875, 9.810546875, 10.19580078125, 10.5810546875, 10.96630859375, 11.3515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 7.0, 4.0, 10.0, 9.0, 15.0, 12.0, 24.0, 17.0, 21.0, 33.0, 50.0, 72.0, 132.0, 350.0, 1223.0, 4552.0, 26972.0, 791875.0, 3219900.0, 134142.0, 11212.0, 2456.0, 612.0, 245.0, 108.0, 63.0, 37.0, 31.0, 20.0, 15.0, 9.0, 13.0, 13.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.96875, -33.81396484375, -32.6591796875, -31.50439453125, -30.349609375, -29.19482421875, -28.0400390625, -26.88525390625, -25.73046875, -24.57568359375, -23.4208984375, -22.26611328125, -21.111328125, -19.95654296875, -18.8017578125, -17.64697265625, -16.4921875, -15.33740234375, -14.1826171875, -13.02783203125, -11.873046875, -10.71826171875, -9.5634765625, -8.40869140625, -7.25390625, -6.09912109375, -4.9443359375, -3.78955078125, -2.634765625, -1.47998046875, -0.3251953125, 0.82958984375, 1.984375, 3.13916015625, 4.2939453125, 5.44873046875, 6.603515625, 7.75830078125, 8.9130859375, 10.06787109375, 11.22265625, 12.37744140625, 13.5322265625, 14.68701171875, 15.841796875, 16.99658203125, 18.1513671875, 19.30615234375, 20.4609375, 21.61572265625, 22.7705078125, 23.92529296875, 25.080078125, 26.23486328125, 27.3896484375, 28.54443359375, 29.69921875, 30.85400390625, 32.0087890625, 33.16357421875, 34.318359375, 35.47314453125, 36.6279296875, 37.78271484375, 38.9375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 8.0, 9.0, 18.0, 9.0, 15.0, 17.0, 26.0, 37.0, 45.0, 82.0, 101.0, 152.0, 233.0, 394.0, 591.0, 609.0, 611.0, 408.0, 253.0, 144.0, 97.0, 69.0, 42.0, 36.0, 21.0, 16.0, 10.0, 8.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -24.09326171875, -23.4677734375, -22.84228515625, -22.216796875, -21.59130859375, -20.9658203125, -20.34033203125, -19.71484375, -19.08935546875, -18.4638671875, -17.83837890625, -17.212890625, -16.58740234375, -15.9619140625, -15.33642578125, -14.7109375, -14.08544921875, -13.4599609375, -12.83447265625, -12.208984375, -11.58349609375, -10.9580078125, -10.33251953125, -9.70703125, -9.08154296875, -8.4560546875, -7.83056640625, -7.205078125, -6.57958984375, -5.9541015625, -5.32861328125, -4.703125, -4.07763671875, -3.4521484375, -2.82666015625, -2.201171875, -1.57568359375, -0.9501953125, -0.32470703125, 0.30078125, 0.92626953125, 1.5517578125, 2.17724609375, 2.802734375, 3.42822265625, 4.0537109375, 4.67919921875, 5.3046875, 5.93017578125, 6.5556640625, 7.18115234375, 7.806640625, 8.43212890625, 9.0576171875, 9.68310546875, 10.30859375, 10.93408203125, 11.5595703125, 12.18505859375, 12.810546875, 13.43603515625, 14.0615234375, 14.68701171875, 15.3125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 1.0, 1.0, 11.0, 6.0, 9.0, 8.0, 14.0, 17.0, 23.0, 35.0, 54.0, 111.0, 151.0, 279.0, 588.0, 1420.0, 5363.0, 29450.0, 318200.0, 3553644.0, 252934.0, 24811.0, 4632.0, 1308.0, 481.0, 275.0, 153.0, 68.0, 66.0, 44.0, 33.0, 22.0, 16.0, 8.0, 11.0, 14.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-34.84375, -33.736328125, -32.62890625, -31.521484375, -30.4140625, -29.306640625, -28.19921875, -27.091796875, -25.984375, -24.876953125, -23.76953125, -22.662109375, -21.5546875, -20.447265625, -19.33984375, -18.232421875, -17.125, -16.017578125, -14.91015625, -13.802734375, -12.6953125, -11.587890625, -10.48046875, -9.373046875, -8.265625, -7.158203125, -6.05078125, -4.943359375, -3.8359375, -2.728515625, -1.62109375, -0.513671875, 0.59375, 1.701171875, 2.80859375, 3.916015625, 5.0234375, 6.130859375, 7.23828125, 8.345703125, 9.453125, 10.560546875, 11.66796875, 12.775390625, 13.8828125, 14.990234375, 16.09765625, 17.205078125, 18.3125, 19.419921875, 20.52734375, 21.634765625, 22.7421875, 23.849609375, 24.95703125, 26.064453125, 27.171875, 28.279296875, 29.38671875, 30.494140625, 31.6015625, 32.708984375, 33.81640625, 34.923828125, 36.03125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 22.0, 50.0, 130.0, 226.0, 231.0, 179.0, 103.0, 28.0, 19.0, 8.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-173.52529907226562, -170.01736450195312, -166.50941467285156, -163.00148010253906, -159.4935302734375, -155.985595703125, -152.47764587402344, -148.96971130371094, -145.46176147460938, -141.95382690429688, -138.4458770751953, -134.9379425048828, -131.42999267578125, -127.92205047607422, -124.41410827636719, -120.90617370605469, -117.39823150634766, -113.89028930664062, -110.3823471069336, -106.87440490722656, -103.36646270751953, -99.8585205078125, -96.3505859375, -92.84263610839844, -89.33470153808594, -85.8267593383789, -82.31881713867188, -78.81087493896484, -75.30293273925781, -71.79499053955078, -68.28704833984375, -64.77911376953125, -61.27117156982422, -57.76322937011719, -54.255287170410156, -50.747344970703125, -47.239402770996094, -43.73146057128906, -40.2235221862793, -36.715579986572266, -33.207637786865234, -29.699695587158203, -26.191753387451172, -22.683813095092773, -19.175870895385742, -15.667928695678711, -12.159988403320312, -8.652046203613281, -5.14410400390625, -1.636162281036377, 1.871779441833496, 5.379720687866211, 8.887662887573242, 12.395605087280273, 15.903545379638672, 19.411487579345703, 22.919429779052734, 26.427371978759766, 29.935314178466797, 33.44325256347656, 36.951194763183594, 40.459136962890625, 43.967079162597656, 47.47502136230469, 50.98296356201172]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 8.0, 4.0, 7.0, 14.0, 12.0, 13.0, 27.0, 26.0, 22.0, 32.0, 30.0, 36.0, 35.0, 43.0, 50.0, 43.0, 47.0, 41.0, 39.0, 44.0, 56.0, 40.0, 40.0, 40.0, 28.0, 32.0, 32.0, 26.0, 21.0, 16.0, 15.0, 17.0, 14.0, 12.0, 10.0, 11.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.31184005737305, -55.43180847167969, -53.551780700683594, -51.671749114990234, -49.79172134399414, -47.91168975830078, -46.03166198730469, -44.15163040161133, -42.27159881591797, -40.39156723022461, -38.511539459228516, -36.631507873535156, -34.75148010253906, -32.8714485168457, -30.991418838500977, -29.11138916015625, -27.231361389160156, -25.35133171081543, -23.471302032470703, -21.591270446777344, -19.71124267578125, -17.83121109008789, -15.951181411743164, -14.071151733398438, -12.191122055053711, -10.311092376708984, -8.431062698364258, -6.551032066345215, -4.671002388000488, -2.7909727096557617, -0.9109420776367188, 0.9690876007080078, 2.8491134643554688, 4.729143142700195, 6.60917329788208, 8.489203453063965, 10.369233131408691, 12.249262809753418, 14.129293441772461, 16.009323120117188, 17.889352798461914, 19.76938247680664, 21.649412155151367, 23.529441833496094, 25.409473419189453, 27.289501190185547, 29.169532775878906, 31.049562454223633, 32.92959213256836, 34.80962371826172, 36.68965148925781, 38.56968307495117, 40.449710845947266, 42.329742431640625, 44.20977020263672, 46.08980178833008, 47.96983337402344, 49.8498649597168, 51.72989273071289, 53.60992431640625, 55.489952087402344, 57.3699836730957, 59.25001525878906, 61.130043029785156, 63.01007080078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 11.0, 4.0, 10.0, 15.0, 13.0, 12.0, 19.0, 28.0, 21.0, 21.0, 33.0, 22.0, 29.0, 32.0, 35.0, 48.0, 44.0, 41.0, 38.0, 48.0, 44.0, 41.0, 44.0, 39.0, 40.0, 28.0, 25.0, 22.0, 29.0, 24.0, 24.0, 19.0, 16.0, 16.0, 12.0, 4.0, 17.0, 6.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.2109375, -10.8543701171875, -10.497802734375, -10.1412353515625, -9.78466796875, -9.4281005859375, -9.071533203125, -8.7149658203125, -8.3583984375, -8.0018310546875, -7.645263671875, -7.2886962890625, -6.93212890625, -6.5755615234375, -6.218994140625, -5.8624267578125, -5.505859375, -5.1492919921875, -4.792724609375, -4.4361572265625, -4.07958984375, -3.7230224609375, -3.366455078125, -3.0098876953125, -2.6533203125, -2.2967529296875, -1.940185546875, -1.5836181640625, -1.22705078125, -0.8704833984375, -0.513916015625, -0.1573486328125, 0.19921875, 0.5557861328125, 0.912353515625, 1.2689208984375, 1.62548828125, 1.9820556640625, 2.338623046875, 2.6951904296875, 3.0517578125, 3.4083251953125, 3.764892578125, 4.1214599609375, 4.47802734375, 4.8345947265625, 5.191162109375, 5.5477294921875, 5.904296875, 6.2608642578125, 6.617431640625, 6.9739990234375, 7.33056640625, 7.6871337890625, 8.043701171875, 8.4002685546875, 8.7568359375, 9.1134033203125, 9.469970703125, 9.8265380859375, 10.18310546875, 10.5396728515625, 10.896240234375, 11.2528076171875, 11.609375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 6.0, 2.0, 11.0, 11.0, 17.0, 23.0, 35.0, 55.0, 69.0, 113.0, 153.0, 201.0, 298.0, 464.0, 645.0, 1004.0, 1456.0, 2164.0, 3401.0, 5241.0, 8283.0, 13221.0, 20938.0, 34417.0, 56590.0, 96935.0, 167362.0, 232381.0, 163245.0, 94146.0, 55419.0, 33699.0, 20545.0, 12833.0, 8004.0, 5205.0, 3329.0, 2176.0, 1456.0, 952.0, 658.0, 397.0, 314.0, 237.0, 133.0, 95.0, 75.0, 43.0, 33.0, 26.0, 10.0, 13.0, 10.0, 9.0, 3.0, 2.0, 1.0, 3.0], "bins": [-1.8154296875, -1.761199951171875, -1.70697021484375, -1.652740478515625, -1.5985107421875, -1.544281005859375, -1.49005126953125, -1.435821533203125, -1.381591796875, -1.327362060546875, -1.27313232421875, -1.218902587890625, -1.1646728515625, -1.110443115234375, -1.05621337890625, -1.001983642578125, -0.94775390625, -0.893524169921875, -0.83929443359375, -0.785064697265625, -0.7308349609375, -0.676605224609375, -0.62237548828125, -0.568145751953125, -0.513916015625, -0.459686279296875, -0.40545654296875, -0.351226806640625, -0.2969970703125, -0.242767333984375, -0.18853759765625, -0.134307861328125, -0.080078125, -0.025848388671875, 0.02838134765625, 0.082611083984375, 0.1368408203125, 0.191070556640625, 0.24530029296875, 0.299530029296875, 0.353759765625, 0.407989501953125, 0.46221923828125, 0.516448974609375, 0.5706787109375, 0.624908447265625, 0.67913818359375, 0.733367919921875, 0.78759765625, 0.841827392578125, 0.89605712890625, 0.950286865234375, 1.0045166015625, 1.058746337890625, 1.11297607421875, 1.167205810546875, 1.221435546875, 1.275665283203125, 1.32989501953125, 1.384124755859375, 1.4383544921875, 1.492584228515625, 1.54681396484375, 1.601043701171875, 1.6552734375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 5.0, 8.0, 1.0, 7.0, 17.0, 5.0, 7.0, 7.0, 19.0, 26.0, 24.0, 35.0, 28.0, 34.0, 28.0, 25.0, 35.0, 38.0, 50.0, 43.0, 42.0, 1072.0, 33.0, 53.0, 60.0, 49.0, 33.0, 35.0, 24.0, 30.0, 29.0, 15.0, 23.0, 17.0, 13.0, 16.0, 10.0, 8.0, 11.0, 3.0, 3.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.578125, -8.3406982421875, -8.103271484375, -7.8658447265625, -7.62841796875, -7.3909912109375, -7.153564453125, -6.9161376953125, -6.6787109375, -6.4412841796875, -6.203857421875, -5.9664306640625, -5.72900390625, -5.4915771484375, -5.254150390625, -5.0167236328125, -4.779296875, -4.5418701171875, -4.304443359375, -4.0670166015625, -3.82958984375, -3.5921630859375, -3.354736328125, -3.1173095703125, -2.8798828125, -2.6424560546875, -2.405029296875, -2.1676025390625, -1.93017578125, -1.6927490234375, -1.455322265625, -1.2178955078125, -0.98046875, -0.7430419921875, -0.505615234375, -0.2681884765625, -0.03076171875, 0.2066650390625, 0.444091796875, 0.6815185546875, 0.9189453125, 1.1563720703125, 1.393798828125, 1.6312255859375, 1.86865234375, 2.1060791015625, 2.343505859375, 2.5809326171875, 2.818359375, 3.0557861328125, 3.293212890625, 3.5306396484375, 3.76806640625, 4.0054931640625, 4.242919921875, 4.4803466796875, 4.7177734375, 4.9552001953125, 5.192626953125, 5.4300537109375, 5.66748046875, 5.9049072265625, 6.142333984375, 6.3797607421875, 6.6171875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 2.0, 3.0, 8.0, 11.0, 12.0, 28.0, 37.0, 48.0, 63.0, 109.0, 160.0, 241.0, 343.0, 548.0, 782.0, 1261.0, 1837.0, 2833.0, 4263.0, 6344.0, 9724.0, 14726.0, 23056.0, 36298.0, 57566.0, 92299.0, 150842.0, 1258960.0, 162509.0, 99884.0, 62108.0, 38855.0, 24959.0, 15996.0, 10350.0, 6841.0, 4432.0, 2888.0, 1942.0, 1294.0, 926.0, 578.0, 361.0, 292.0, 171.0, 121.0, 79.0, 54.0, 35.0, 22.0, 15.0, 8.0, 15.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4296875, -1.3829345703125, -1.336181640625, -1.2894287109375, -1.24267578125, -1.1959228515625, -1.149169921875, -1.1024169921875, -1.0556640625, -1.0089111328125, -0.962158203125, -0.9154052734375, -0.86865234375, -0.8218994140625, -0.775146484375, -0.7283935546875, -0.681640625, -0.6348876953125, -0.588134765625, -0.5413818359375, -0.49462890625, -0.4478759765625, -0.401123046875, -0.3543701171875, -0.3076171875, -0.2608642578125, -0.214111328125, -0.1673583984375, -0.12060546875, -0.0738525390625, -0.027099609375, 0.0196533203125, 0.06640625, 0.1131591796875, 0.159912109375, 0.2066650390625, 0.25341796875, 0.3001708984375, 0.346923828125, 0.3936767578125, 0.4404296875, 0.4871826171875, 0.533935546875, 0.5806884765625, 0.62744140625, 0.6741943359375, 0.720947265625, 0.7677001953125, 0.814453125, 0.8612060546875, 0.907958984375, 0.9547119140625, 1.00146484375, 1.0482177734375, 1.094970703125, 1.1417236328125, 1.1884765625, 1.2352294921875, 1.281982421875, 1.3287353515625, 1.37548828125, 1.4222412109375, 1.468994140625, 1.5157470703125, 1.5625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 3.0, 7.0, 3.0, 9.0, 12.0, 9.0, 15.0, 19.0, 31.0, 39.0, 39.0, 60.0, 49.0, 65.0, 54.0, 59.0, 67.0, 63.0, 52.0, 44.0, 54.0, 51.0, 36.0, 27.0, 24.0, 24.0, 12.0, 19.0, 13.0, 6.0, 8.0, 5.0, 3.0, 5.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003002166748046875, -0.002920866012573242, -0.0028395652770996094, -0.0027582645416259766, -0.0026769638061523438, -0.002595663070678711, -0.002514362335205078, -0.0024330615997314453, -0.0023517608642578125, -0.0022704601287841797, -0.002189159393310547, -0.002107858657836914, -0.0020265579223632812, -0.0019452571868896484, -0.0018639564514160156, -0.0017826557159423828, -0.00170135498046875, -0.0016200542449951172, -0.0015387535095214844, -0.0014574527740478516, -0.0013761520385742188, -0.001294851303100586, -0.0012135505676269531, -0.0011322498321533203, -0.0010509490966796875, -0.0009696483612060547, -0.0008883476257324219, -0.0008070468902587891, -0.0007257461547851562, -0.0006444454193115234, -0.0005631446838378906, -0.0004818439483642578, -0.000400543212890625, -0.0003192424774169922, -0.00023794174194335938, -0.00015664100646972656, -7.534027099609375e-05, 5.9604644775390625e-06, 8.726119995117188e-05, 0.0001685619354248047, 0.0002498626708984375, 0.0003311634063720703, 0.0004124641418457031, 0.0004937648773193359, 0.0005750656127929688, 0.0006563663482666016, 0.0007376670837402344, 0.0008189678192138672, 0.0009002685546875, 0.0009815692901611328, 0.0010628700256347656, 0.0011441707611083984, 0.0012254714965820312, 0.001306772232055664, 0.0013880729675292969, 0.0014693737030029297, 0.0015506744384765625, 0.0016319751739501953, 0.0017132759094238281, 0.001794576644897461, 0.0018758773803710938, 0.0019571781158447266, 0.0020384788513183594, 0.002119779586791992, 0.002201080322265625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 8.0, 6.0, 7.0, 22.0, 14.0, 22.0, 23.0, 30.0, 40.0, 51.0, 74.0, 100.0, 119.0, 186.0, 286.0, 551.0, 2066.0, 929521.0, 113110.0, 1043.0, 450.0, 227.0, 152.0, 116.0, 78.0, 70.0, 38.0, 31.0, 15.0, 16.0, 13.0, 12.0, 10.0, 11.0, 5.0, 5.0, 9.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045013427734375, -0.0433964729309082, -0.041779518127441406, -0.04016256332397461, -0.03854560852050781, -0.036928653717041016, -0.03531169891357422, -0.03369474411010742, -0.032077789306640625, -0.030460834503173828, -0.02884387969970703, -0.027226924896240234, -0.025609970092773438, -0.02399301528930664, -0.022376060485839844, -0.020759105682373047, -0.01914215087890625, -0.017525196075439453, -0.015908241271972656, -0.01429128646850586, -0.012674331665039062, -0.011057376861572266, -0.009440422058105469, -0.007823467254638672, -0.006206512451171875, -0.004589557647705078, -0.0029726028442382812, -0.0013556480407714844, 0.0002613067626953125, 0.0018782615661621094, 0.0034952163696289062, 0.005112171173095703, 0.0067291259765625, 0.008346080780029297, 0.009963035583496094, 0.01157999038696289, 0.013196945190429688, 0.014813899993896484, 0.01643085479736328, 0.018047809600830078, 0.019664764404296875, 0.021281719207763672, 0.02289867401123047, 0.024515628814697266, 0.026132583618164062, 0.02774953842163086, 0.029366493225097656, 0.030983448028564453, 0.03260040283203125, 0.03421735763549805, 0.035834312438964844, 0.03745126724243164, 0.03906822204589844, 0.040685176849365234, 0.04230213165283203, 0.04391908645629883, 0.045536041259765625, 0.04715299606323242, 0.04876995086669922, 0.050386905670166016, 0.05200386047363281, 0.05362081527709961, 0.055237770080566406, 0.0568547248840332, 0.0584716796875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 23.0, 159.0, 567.0, 231.0, 31.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01107342541217804, -0.010858663357794285, -0.010643900372087955, -0.0104291383177042, -0.010214376263320446, -0.009999613277614117, -0.009784851223230362, -0.009570089168846607, -0.009355326183140278, -0.009140564128756523, -0.008925801143050194, -0.008711039088666439, -0.008496277034282684, -0.008281514048576355, -0.0080667519941926, -0.007851989939808846, -0.0076372274197638035, -0.0074224648997187614, -0.007207702845335007, -0.006992940325289965, -0.006778177805244923, -0.006563415750861168, -0.006348653230816126, -0.006133890710771084, -0.005919128656387329, -0.005704366136342287, -0.005489604081958532, -0.00527484156191349, -0.005060079041868448, -0.004845316521823406, -0.0046305544674396515, -0.0044157919473946095, -0.004201029427349567, -0.003986266907304525, -0.003771504620090127, -0.0035567423328757286, -0.0033419798128306866, -0.003127217525616288, -0.00291245523840189, -0.0026976927183568478, -0.002482930663973093, -0.0022681683767586946, -0.0020534058567136526, -0.0018386435694992542, -0.001623881165869534, -0.0014091187622398138, -0.0011943564750254154, -0.0009795940713956952, -0.000764831667765975, -0.0005500692641362548, -0.0003353069187141955, -0.00012054457329213619, 9.421783033758402e-05, 0.00030898023396730423, 0.0005237425211817026, 0.0007385049248114228, 0.000953267328441143, 0.0011680297320708632, 0.0013827921357005835, 0.0015975544229149818, 0.001812316826544702, 0.0020270792301744223, 0.0022418415173888206, 0.0024566040374338627, 0.002671366324648261]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 4.0, 12.0, 7.0, 10.0, 11.0, 10.0, 19.0, 20.0, 20.0, 19.0, 23.0, 30.0, 39.0, 32.0, 31.0, 38.0, 37.0, 33.0, 39.0, 44.0, 28.0, 29.0, 35.0, 43.0, 34.0, 36.0, 24.0, 34.0, 36.0, 26.0, 35.0, 15.0, 20.0, 18.0, 7.0, 17.0, 14.0, 20.0, 6.0, 5.0, 6.0, 11.0, 4.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.00114518404006958, -0.0011092368513345718, -0.0010732896625995636, -0.0010373424738645554, -0.0010013952851295471, -0.0009654480963945389, -0.0009295009076595306, -0.0008935537189245224, -0.0008576065301895142, -0.0008216593414545059, -0.0007857121527194977, -0.0007497649639844894, -0.0007138177752494812, -0.000677870586514473, -0.0006419233977794647, -0.0006059762090444565, -0.0005700290203094482, -0.00053408183157444, -0.0004981346428394318, -0.0004621874541044235, -0.0004262402653694153, -0.00039029307663440704, -0.0003543458878993988, -0.00031839869916439056, -0.0002824515104293823, -0.0002465043216943741, -0.00021055713295936584, -0.0001746099442243576, -0.00013866275548934937, -0.00010271556675434113, -6.676837801933289e-05, -3.0821189284324646e-05, 5.125999450683594e-06, 4.1073188185691833e-05, 7.702037692070007e-05, 0.00011296756565570831, 0.00014891475439071655, 0.0001848619431257248, 0.00022080913186073303, 0.00025675632059574127, 0.0002927035093307495, 0.00032865069806575775, 0.000364597886800766, 0.00040054507553577423, 0.00043649226427078247, 0.0004724394530057907, 0.000508386641740799, 0.0005443338304758072, 0.0005802810192108154, 0.0006162282079458237, 0.0006521753966808319, 0.0006881225854158401, 0.0007240697741508484, 0.0007600169628858566, 0.0007959641516208649, 0.0008319113403558731, 0.0008678585290908813, 0.0009038057178258896, 0.0009397529065608978, 0.0009757000952959061, 0.0010116472840309143, 0.0010475944727659225, 0.0010835416615009308, 0.001119488850235939, 0.0011554360389709473]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 11.0, 4.0, 10.0, 15.0, 13.0, 12.0, 19.0, 28.0, 21.0, 21.0, 33.0, 22.0, 29.0, 32.0, 35.0, 48.0, 44.0, 41.0, 38.0, 48.0, 44.0, 41.0, 44.0, 39.0, 40.0, 28.0, 25.0, 22.0, 29.0, 24.0, 24.0, 19.0, 16.0, 16.0, 12.0, 4.0, 17.0, 6.0, 7.0, 7.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-11.2109375, -10.8543701171875, -10.497802734375, -10.1412353515625, -9.78466796875, -9.4281005859375, -9.071533203125, -8.7149658203125, -8.3583984375, -8.0018310546875, -7.645263671875, -7.2886962890625, -6.93212890625, -6.5755615234375, -6.218994140625, -5.8624267578125, -5.505859375, -5.1492919921875, -4.792724609375, -4.4361572265625, -4.07958984375, -3.7230224609375, -3.366455078125, -3.0098876953125, -2.6533203125, -2.2967529296875, -1.940185546875, -1.5836181640625, -1.22705078125, -0.8704833984375, -0.513916015625, -0.1573486328125, 0.19921875, 0.5557861328125, 0.912353515625, 1.2689208984375, 1.62548828125, 1.9820556640625, 2.338623046875, 2.6951904296875, 3.0517578125, 3.4083251953125, 3.764892578125, 4.1214599609375, 4.47802734375, 4.8345947265625, 5.191162109375, 5.5477294921875, 5.904296875, 6.2608642578125, 6.617431640625, 6.9739990234375, 7.33056640625, 7.6871337890625, 8.043701171875, 8.4002685546875, 8.7568359375, 9.1134033203125, 9.469970703125, 9.8265380859375, 10.18310546875, 10.5396728515625, 10.896240234375, 11.2528076171875, 11.609375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 6.0, 3.0, 22.0, 10.0, 24.0, 23.0, 46.0, 54.0, 80.0, 98.0, 145.0, 241.0, 318.0, 429.0, 620.0, 989.0, 1715.0, 3290.0, 7053.0, 17460.0, 46330.0, 138051.0, 459733.0, 250180.0, 73824.0, 26794.0, 10538.0, 4539.0, 2288.0, 1174.0, 749.0, 487.0, 337.0, 266.0, 191.0, 143.0, 79.0, 70.0, 45.0, 46.0, 19.0, 18.0, 8.0, 4.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.015625, -12.6053466796875, -12.195068359375, -11.7847900390625, -11.37451171875, -10.9642333984375, -10.553955078125, -10.1436767578125, -9.7333984375, -9.3231201171875, -8.912841796875, -8.5025634765625, -8.09228515625, -7.6820068359375, -7.271728515625, -6.8614501953125, -6.451171875, -6.0408935546875, -5.630615234375, -5.2203369140625, -4.81005859375, -4.3997802734375, -3.989501953125, -3.5792236328125, -3.1689453125, -2.7586669921875, -2.348388671875, -1.9381103515625, -1.52783203125, -1.1175537109375, -0.707275390625, -0.2969970703125, 0.11328125, 0.5235595703125, 0.933837890625, 1.3441162109375, 1.75439453125, 2.1646728515625, 2.574951171875, 2.9852294921875, 3.3955078125, 3.8057861328125, 4.216064453125, 4.6263427734375, 5.03662109375, 5.4468994140625, 5.857177734375, 6.2674560546875, 6.677734375, 7.0880126953125, 7.498291015625, 7.9085693359375, 8.31884765625, 8.7291259765625, 9.139404296875, 9.5496826171875, 9.9599609375, 10.3702392578125, 10.780517578125, 11.1907958984375, 11.60107421875, 12.0113525390625, 12.421630859375, 12.8319091796875, 13.2421875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 2.0, 6.0, 3.0, 5.0, 9.0, 11.0, 18.0, 13.0, 15.0, 15.0, 20.0, 24.0, 24.0, 35.0, 23.0, 27.0, 41.0, 36.0, 50.0, 65.0, 120.0, 310.0, 1564.0, 148.0, 73.0, 53.0, 45.0, 35.0, 29.0, 26.0, 20.0, 31.0, 22.0, 27.0, 20.0, 17.0, 14.0, 9.0, 7.0, 7.0, 9.0, 8.0, 5.0, 4.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-27.4375, -26.634765625, -25.83203125, -25.029296875, -24.2265625, -23.423828125, -22.62109375, -21.818359375, -21.015625, -20.212890625, -19.41015625, -18.607421875, -17.8046875, -17.001953125, -16.19921875, -15.396484375, -14.59375, -13.791015625, -12.98828125, -12.185546875, -11.3828125, -10.580078125, -9.77734375, -8.974609375, -8.171875, -7.369140625, -6.56640625, -5.763671875, -4.9609375, -4.158203125, -3.35546875, -2.552734375, -1.75, -0.947265625, -0.14453125, 0.658203125, 1.4609375, 2.263671875, 3.06640625, 3.869140625, 4.671875, 5.474609375, 6.27734375, 7.080078125, 7.8828125, 8.685546875, 9.48828125, 10.291015625, 11.09375, 11.896484375, 12.69921875, 13.501953125, 14.3046875, 15.107421875, 15.91015625, 16.712890625, 17.515625, 18.318359375, 19.12109375, 19.923828125, 20.7265625, 21.529296875, 22.33203125, 23.134765625, 23.9375]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 10.0, 14.0, 14.0, 20.0, 38.0, 27.0, 53.0, 73.0, 96.0, 163.0, 231.0, 369.0, 801.0, 5957.0, 326591.0, 2791882.0, 16797.0, 1247.0, 429.0, 271.0, 176.0, 115.0, 93.0, 60.0, 39.0, 31.0, 25.0, 15.0, 16.0, 9.0, 12.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-61.84375, -60.0849609375, -58.326171875, -56.5673828125, -54.80859375, -53.0498046875, -51.291015625, -49.5322265625, -47.7734375, -46.0146484375, -44.255859375, -42.4970703125, -40.73828125, -38.9794921875, -37.220703125, -35.4619140625, -33.703125, -31.9443359375, -30.185546875, -28.4267578125, -26.66796875, -24.9091796875, -23.150390625, -21.3916015625, -19.6328125, -17.8740234375, -16.115234375, -14.3564453125, -12.59765625, -10.8388671875, -9.080078125, -7.3212890625, -5.5625, -3.8037109375, -2.044921875, -0.2861328125, 1.47265625, 3.2314453125, 4.990234375, 6.7490234375, 8.5078125, 10.2666015625, 12.025390625, 13.7841796875, 15.54296875, 17.3017578125, 19.060546875, 20.8193359375, 22.578125, 24.3369140625, 26.095703125, 27.8544921875, 29.61328125, 31.3720703125, 33.130859375, 34.8896484375, 36.6484375, 38.4072265625, 40.166015625, 41.9248046875, 43.68359375, 45.4423828125, 47.201171875, 48.9599609375, 50.71875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 30.0, 221.0, 497.0, 244.0, 24.0, 1.0, 1.0], "bins": [-249.39454650878906, -245.20701599121094, -241.01947021484375, -236.83193969726562, -232.6444091796875, -228.4568634033203, -224.2693328857422, -220.08180236816406, -215.89425659179688, -211.70672607421875, -207.51918029785156, -203.33164978027344, -199.1441192626953, -194.95657348632812, -190.76904296875, -186.58151245117188, -182.39398193359375, -178.20645141601562, -174.01890563964844, -169.8313751220703, -165.6438446044922, -161.456298828125, -157.26876831054688, -153.08123779296875, -148.89369201660156, -144.70616149902344, -140.51861572265625, -136.33108520507812, -132.1435546875, -127.95600891113281, -123.76847839355469, -119.58094024658203, -115.39338684082031, -111.20584869384766, -107.01831817626953, -102.83078002929688, -98.64324188232422, -94.45570373535156, -90.26817321777344, -86.08063507080078, -81.89310455322266, -77.70556640625, -73.51803588867188, -69.33049774169922, -65.14295959472656, -60.95542526245117, -56.76789093017578, -52.580352783203125, -48.392818450927734, -44.205284118652344, -40.01774597167969, -35.8302116394043, -31.642675399780273, -27.45513916015625, -23.26760482788086, -19.080068588256836, -14.892532348632812, -10.704996109008789, -6.517460823059082, -2.329925537109375, 1.8576107025146484, 6.045146942138672, 10.232681274414062, 14.420217514038086, 18.60775375366211]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 6.0, 10.0, 9.0, 12.0, 15.0, 18.0, 19.0, 34.0, 32.0, 27.0, 36.0, 33.0, 30.0, 32.0, 33.0, 34.0, 33.0, 40.0, 45.0, 41.0, 41.0, 44.0, 34.0, 42.0, 40.0, 30.0, 26.0, 25.0, 20.0, 22.0, 14.0, 14.0, 18.0, 15.0, 12.0, 9.0, 9.0, 7.0, 5.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-62.89476013183594, -61.11080551147461, -59.32685089111328, -57.54289245605469, -55.75893783569336, -53.97498321533203, -52.1910285949707, -50.407073974609375, -48.62311935424805, -46.83916473388672, -45.05521011352539, -43.27125549316406, -41.48729705810547, -39.70334243774414, -37.91938781738281, -36.135433197021484, -34.351478576660156, -32.56752395629883, -30.783567428588867, -28.99961280822754, -27.21565818786621, -25.43170166015625, -23.647747039794922, -21.863792419433594, -20.079833984375, -18.295879364013672, -16.51192283630371, -14.727968215942383, -12.944013595581055, -11.16005802154541, -9.376102447509766, -7.5921478271484375, -5.808193206787109, -4.024238109588623, -2.2402827739715576, -0.4563274383544922, 1.3276276588439941, 3.1115827560424805, 4.895538330078125, 6.679492950439453, 8.463448524475098, 10.247404098510742, 12.03135871887207, 13.815314292907715, 15.59926986694336, 17.383224487304688, 19.167179107666016, 20.951133728027344, 22.735090255737305, 24.519044876098633, 26.303001403808594, 28.086956024169922, 29.87091064453125, 31.654865264892578, 33.438819885253906, 35.2227783203125, 37.00673294067383, 38.790687561035156, 40.574642181396484, 42.35859680175781, 44.142555236816406, 45.926509857177734, 47.71046447753906, 49.49441909790039, 51.27837371826172]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 6.0, 7.0, 13.0, 14.0, 15.0, 21.0, 23.0, 17.0, 21.0, 29.0, 30.0, 32.0, 37.0, 34.0, 40.0, 35.0, 48.0, 58.0, 55.0, 37.0, 36.0, 46.0, 45.0, 34.0, 33.0, 23.0, 34.0, 30.0, 24.0, 18.0, 29.0, 13.0, 9.0, 11.0, 10.0, 7.0, 7.0, 3.0, 7.0, 3.0, 2.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.21875, -11.842529296875, -11.46630859375, -11.090087890625, -10.7138671875, -10.337646484375, -9.96142578125, -9.585205078125, -9.208984375, -8.832763671875, -8.45654296875, -8.080322265625, -7.7041015625, -7.327880859375, -6.95166015625, -6.575439453125, -6.19921875, -5.822998046875, -5.44677734375, -5.070556640625, -4.6943359375, -4.318115234375, -3.94189453125, -3.565673828125, -3.189453125, -2.813232421875, -2.43701171875, -2.060791015625, -1.6845703125, -1.308349609375, -0.93212890625, -0.555908203125, -0.1796875, 0.196533203125, 0.57275390625, 0.948974609375, 1.3251953125, 1.701416015625, 2.07763671875, 2.453857421875, 2.830078125, 3.206298828125, 3.58251953125, 3.958740234375, 4.3349609375, 4.711181640625, 5.08740234375, 5.463623046875, 5.83984375, 6.216064453125, 6.59228515625, 6.968505859375, 7.3447265625, 7.720947265625, 8.09716796875, 8.473388671875, 8.849609375, 9.225830078125, 9.60205078125, 9.978271484375, 10.3544921875, 10.730712890625, 11.10693359375, 11.483154296875, 11.859375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 6.0, 4.0, 4.0, 13.0, 12.0, 13.0, 18.0, 28.0, 27.0, 36.0, 53.0, 62.0, 92.0, 124.0, 188.0, 273.0, 335.0, 461.0, 2908.0, 4186821.0, 1144.0, 477.0, 343.0, 223.0, 165.0, 121.0, 81.0, 62.0, 48.0, 34.0, 28.0, 12.0, 11.0, 22.0, 9.0, 6.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-289.5, -279.96875, -270.4375, -260.90625, -251.375, -241.84375, -232.3125, -222.78125, -213.25, -203.71875, -194.1875, -184.65625, -175.125, -165.59375, -156.0625, -146.53125, -137.0, -127.46875, -117.9375, -108.40625, -98.875, -89.34375, -79.8125, -70.28125, -60.75, -51.21875, -41.6875, -32.15625, -22.625, -13.09375, -3.5625, 5.96875, 15.5, 25.03125, 34.5625, 44.09375, 53.625, 63.15625, 72.6875, 82.21875, 91.75, 101.28125, 110.8125, 120.34375, 129.875, 139.40625, 148.9375, 158.46875, 168.0, 177.53125, 187.0625, 196.59375, 206.125, 215.65625, 225.1875, 234.71875, 244.25, 253.78125, 263.3125, 272.84375, 282.375, 291.90625, 301.4375, 310.96875, 320.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 12.0, 16.0, 37.0, 46.0, 66.0, 144.0, 312.0, 771.0, 1212.0, 801.0, 306.0, 157.0, 82.0, 41.0, 35.0, 16.0, 15.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.0, -29.87353515625, -28.7470703125, -27.62060546875, -26.494140625, -25.36767578125, -24.2412109375, -23.11474609375, -21.98828125, -20.86181640625, -19.7353515625, -18.60888671875, -17.482421875, -16.35595703125, -15.2294921875, -14.10302734375, -12.9765625, -11.85009765625, -10.7236328125, -9.59716796875, -8.470703125, -7.34423828125, -6.2177734375, -5.09130859375, -3.96484375, -2.83837890625, -1.7119140625, -0.58544921875, 0.541015625, 1.66748046875, 2.7939453125, 3.92041015625, 5.046875, 6.17333984375, 7.2998046875, 8.42626953125, 9.552734375, 10.67919921875, 11.8056640625, 12.93212890625, 14.05859375, 15.18505859375, 16.3115234375, 17.43798828125, 18.564453125, 19.69091796875, 20.8173828125, 21.94384765625, 23.0703125, 24.19677734375, 25.3232421875, 26.44970703125, 27.576171875, 28.70263671875, 29.8291015625, 30.95556640625, 32.08203125, 33.20849609375, 34.3349609375, 35.46142578125, 36.587890625, 37.71435546875, 38.8408203125, 39.96728515625, 41.09375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 9.0, 13.0, 12.0, 16.0, 20.0, 20.0, 22.0, 25.0, 34.0, 51.0, 60.0, 70.0, 137.0, 383.0, 5507.0, 4171130.0, 15705.0, 549.0, 156.0, 65.0, 62.0, 40.0, 33.0, 24.0, 22.0, 20.0, 28.0, 17.0, 9.0, 8.0, 7.0, 6.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-170.875, -166.072265625, -161.26953125, -156.466796875, -151.6640625, -146.861328125, -142.05859375, -137.255859375, -132.453125, -127.650390625, -122.84765625, -118.044921875, -113.2421875, -108.439453125, -103.63671875, -98.833984375, -94.03125, -89.228515625, -84.42578125, -79.623046875, -74.8203125, -70.017578125, -65.21484375, -60.412109375, -55.609375, -50.806640625, -46.00390625, -41.201171875, -36.3984375, -31.595703125, -26.79296875, -21.990234375, -17.1875, -12.384765625, -7.58203125, -2.779296875, 2.0234375, 6.826171875, 11.62890625, 16.431640625, 21.234375, 26.037109375, 30.83984375, 35.642578125, 40.4453125, 45.248046875, 50.05078125, 54.853515625, 59.65625, 64.458984375, 69.26171875, 74.064453125, 78.8671875, 83.669921875, 88.47265625, 93.275390625, 98.078125, 102.880859375, 107.68359375, 112.486328125, 117.2890625, 122.091796875, 126.89453125, 131.697265625, 136.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 17.0, 40.0, 180.0, 319.0, 301.0, 118.0, 32.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.09324645996094, -121.01203918457031, -115.93083190917969, -110.84961700439453, -105.7684097290039, -100.68720245361328, -95.60598754882812, -90.5247802734375, -85.44357299804688, -80.36236572265625, -75.28115844726562, -70.19994354248047, -65.11873626708984, -60.03752899169922, -54.95631790161133, -49.87510681152344, -44.79389953613281, -39.71269226074219, -34.6314811706543, -29.55027198791504, -24.46906280517578, -19.387853622436523, -14.306644439697266, -9.225433349609375, -4.14422607421875, 0.9369831085205078, 6.018192291259766, 11.099401473999023, 16.18061065673828, 21.26181983947754, 26.343029022216797, 31.424240112304688, 36.50544738769531, 41.58665466308594, 46.66786575317383, 51.74907684326172, 56.830284118652344, 61.91149139404297, 66.99270629882812, 72.07391357421875, 77.15512084960938, 82.236328125, 87.31753540039062, 92.39875030517578, 97.4799575805664, 102.56116485595703, 107.64237976074219, 112.72358703613281, 117.80479431152344, 122.88600158691406, 127.96720886230469, 133.0484161376953, 138.129638671875, 143.21084594726562, 148.29205322265625, 153.37326049804688, 158.4544677734375, 163.53567504882812, 168.61688232421875, 173.69808959960938, 178.779296875, 183.8605194091797, 188.9417266845703, 194.02293395996094, 199.10414123535156]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 4.0, 10.0, 6.0, 7.0, 13.0, 9.0, 21.0, 24.0, 20.0, 15.0, 35.0, 30.0, 33.0, 44.0, 47.0, 46.0, 34.0, 41.0, 48.0, 51.0, 44.0, 36.0, 37.0, 26.0, 45.0, 39.0, 23.0, 26.0, 28.0, 24.0, 24.0, 24.0, 18.0, 17.0, 10.0, 8.0, 9.0, 8.0, 7.0, 1.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-60.21525573730469, -58.28989028930664, -56.364524841308594, -54.43915939331055, -52.5137939453125, -50.58842468261719, -48.66305923461914, -46.737693786621094, -44.81232833862305, -42.886962890625, -40.96159744262695, -39.036231994628906, -37.110862731933594, -35.18550109863281, -33.2601318359375, -31.334766387939453, -29.409400939941406, -27.48403549194336, -25.558670043945312, -23.633302688598633, -21.707937240600586, -19.78257179260254, -17.85720443725586, -15.931838989257812, -14.006473541259766, -12.081108093261719, -10.155741691589355, -8.230375289916992, -6.305009841918945, -4.379644393920898, -2.454277992248535, -0.5289115905761719, 1.396453857421875, 3.32181978225708, 5.247185707092285, 7.17255163192749, 9.097917556762695, 11.023283004760742, 12.948649406433105, 14.874015808105469, 16.799381256103516, 18.724746704101562, 20.65011215209961, 22.57547950744629, 24.500844955444336, 26.426210403442383, 28.351577758789062, 30.27694320678711, 32.202308654785156, 34.1276741027832, 36.05303955078125, 37.9784049987793, 39.903770446777344, 41.829139709472656, 43.7545051574707, 45.67987060546875, 47.6052360534668, 49.530601501464844, 51.45596694946289, 53.38133239746094, 55.30670166015625, 57.23206329345703, 59.157432556152344, 61.08279800415039, 63.00816345214844]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 4.0, 10.0, 7.0, 15.0, 21.0, 15.0, 18.0, 16.0, 25.0, 18.0, 26.0, 20.0, 27.0, 36.0, 24.0, 42.0, 40.0, 53.0, 32.0, 49.0, 33.0, 49.0, 31.0, 31.0, 39.0, 28.0, 27.0, 34.0, 25.0, 28.0, 23.0, 14.0, 19.0, 11.0, 22.0, 15.0, 12.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-9.3046875, -8.9827880859375, -8.660888671875, -8.3389892578125, -8.01708984375, -7.6951904296875, -7.373291015625, -7.0513916015625, -6.7294921875, -6.4075927734375, -6.085693359375, -5.7637939453125, -5.44189453125, -5.1199951171875, -4.798095703125, -4.4761962890625, -4.154296875, -3.8323974609375, -3.510498046875, -3.1885986328125, -2.86669921875, -2.5447998046875, -2.222900390625, -1.9010009765625, -1.5791015625, -1.2572021484375, -0.935302734375, -0.6134033203125, -0.29150390625, 0.0303955078125, 0.352294921875, 0.6741943359375, 0.99609375, 1.3179931640625, 1.639892578125, 1.9617919921875, 2.28369140625, 2.6055908203125, 2.927490234375, 3.2493896484375, 3.5712890625, 3.8931884765625, 4.215087890625, 4.5369873046875, 4.85888671875, 5.1807861328125, 5.502685546875, 5.8245849609375, 6.146484375, 6.4683837890625, 6.790283203125, 7.1121826171875, 7.43408203125, 7.7559814453125, 8.077880859375, 8.3997802734375, 8.7216796875, 9.0435791015625, 9.365478515625, 9.6873779296875, 10.00927734375, 10.3311767578125, 10.653076171875, 10.9749755859375, 11.296875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 9.0, 10.0, 14.0, 22.0, 30.0, 57.0, 65.0, 120.0, 184.0, 282.0, 457.0, 816.0, 1287.0, 2349.0, 4101.0, 7127.0, 13172.0, 24340.0, 46690.0, 91519.0, 181940.0, 295030.0, 183914.0, 92618.0, 47368.0, 24522.0, 13407.0, 7265.0, 4092.0, 2302.0, 1369.0, 784.0, 479.0, 311.0, 179.0, 104.0, 86.0, 53.0, 28.0, 21.0, 11.0, 7.0, 3.0, 6.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.09765625, -2.028900146484375, -1.96014404296875, -1.891387939453125, -1.8226318359375, -1.753875732421875, -1.68511962890625, -1.616363525390625, -1.547607421875, -1.478851318359375, -1.41009521484375, -1.341339111328125, -1.2725830078125, -1.203826904296875, -1.13507080078125, -1.066314697265625, -0.99755859375, -0.928802490234375, -0.86004638671875, -0.791290283203125, -0.7225341796875, -0.653778076171875, -0.58502197265625, -0.516265869140625, -0.447509765625, -0.378753662109375, -0.30999755859375, -0.241241455078125, -0.1724853515625, -0.103729248046875, -0.03497314453125, 0.033782958984375, 0.1025390625, 0.171295166015625, 0.24005126953125, 0.308807373046875, 0.3775634765625, 0.446319580078125, 0.51507568359375, 0.583831787109375, 0.652587890625, 0.721343994140625, 0.79010009765625, 0.858856201171875, 0.9276123046875, 0.996368408203125, 1.06512451171875, 1.133880615234375, 1.20263671875, 1.271392822265625, 1.34014892578125, 1.408905029296875, 1.4776611328125, 1.546417236328125, 1.61517333984375, 1.683929443359375, 1.752685546875, 1.821441650390625, 1.89019775390625, 1.958953857421875, 2.0277099609375, 2.096466064453125, 2.16522216796875, 2.233978271484375, 2.302734375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 5.0, 6.0, 7.0, 10.0, 16.0, 11.0, 13.0, 15.0, 26.0, 31.0, 35.0, 41.0, 34.0, 33.0, 47.0, 37.0, 45.0, 50.0, 1078.0, 40.0, 48.0, 57.0, 45.0, 22.0, 42.0, 39.0, 38.0, 28.0, 28.0, 29.0, 14.0, 10.0, 10.0, 8.0, 10.0, 8.0, 4.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.641845703125, -7.37744140625, -7.113037109375, -6.8486328125, -6.584228515625, -6.31982421875, -6.055419921875, -5.791015625, -5.526611328125, -5.26220703125, -4.997802734375, -4.7333984375, -4.468994140625, -4.20458984375, -3.940185546875, -3.67578125, -3.411376953125, -3.14697265625, -2.882568359375, -2.6181640625, -2.353759765625, -2.08935546875, -1.824951171875, -1.560546875, -1.296142578125, -1.03173828125, -0.767333984375, -0.5029296875, -0.238525390625, 0.02587890625, 0.290283203125, 0.5546875, 0.819091796875, 1.08349609375, 1.347900390625, 1.6123046875, 1.876708984375, 2.14111328125, 2.405517578125, 2.669921875, 2.934326171875, 3.19873046875, 3.463134765625, 3.7275390625, 3.991943359375, 4.25634765625, 4.520751953125, 4.78515625, 5.049560546875, 5.31396484375, 5.578369140625, 5.8427734375, 6.107177734375, 6.37158203125, 6.635986328125, 6.900390625, 7.164794921875, 7.42919921875, 7.693603515625, 7.9580078125, 8.222412109375, 8.48681640625, 8.751220703125, 9.015625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 6.0, 9.0, 16.0, 20.0, 34.0, 38.0, 68.0, 139.0, 184.0, 341.0, 539.0, 918.0, 1512.0, 2420.0, 4053.0, 6998.0, 11793.0, 19922.0, 34904.0, 60925.0, 109274.0, 197086.0, 1301775.0, 149166.0, 83046.0, 46597.0, 26851.0, 15618.0, 9292.0, 5538.0, 3249.0, 1912.0, 1125.0, 674.0, 443.0, 230.0, 166.0, 94.0, 52.0, 47.0, 29.0, 12.0, 10.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8974609375, -1.838653564453125, -1.77984619140625, -1.721038818359375, -1.6622314453125, -1.603424072265625, -1.54461669921875, -1.485809326171875, -1.427001953125, -1.368194580078125, -1.30938720703125, -1.250579833984375, -1.1917724609375, -1.132965087890625, -1.07415771484375, -1.015350341796875, -0.95654296875, -0.897735595703125, -0.83892822265625, -0.780120849609375, -0.7213134765625, -0.662506103515625, -0.60369873046875, -0.544891357421875, -0.486083984375, -0.427276611328125, -0.36846923828125, -0.309661865234375, -0.2508544921875, -0.192047119140625, -0.13323974609375, -0.074432373046875, -0.015625, 0.043182373046875, 0.10198974609375, 0.160797119140625, 0.2196044921875, 0.278411865234375, 0.33721923828125, 0.396026611328125, 0.454833984375, 0.513641357421875, 0.57244873046875, 0.631256103515625, 0.6900634765625, 0.748870849609375, 0.80767822265625, 0.866485595703125, 0.92529296875, 0.984100341796875, 1.04290771484375, 1.101715087890625, 1.1605224609375, 1.219329833984375, 1.27813720703125, 1.336944580078125, 1.395751953125, 1.454559326171875, 1.51336669921875, 1.572174072265625, 1.6309814453125, 1.689788818359375, 1.74859619140625, 1.807403564453125, 1.8662109375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 9.0, 11.0, 13.0, 17.0, 13.0, 26.0, 18.0, 27.0, 43.0, 50.0, 66.0, 62.0, 78.0, 83.0, 65.0, 76.0, 74.0, 46.0, 40.0, 40.0, 27.0, 29.0, 12.0, 13.0, 10.0, 8.0, 12.0, 8.0, 4.0, 2.0, 2.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.002712249755859375, -0.0026206672191619873, -0.0025290846824645996, -0.002437502145767212, -0.0023459196090698242, -0.0022543370723724365, -0.002162754535675049, -0.002071171998977661, -0.0019795894622802734, -0.0018880069255828857, -0.001796424388885498, -0.0017048418521881104, -0.0016132593154907227, -0.001521676778793335, -0.0014300942420959473, -0.0013385117053985596, -0.0012469291687011719, -0.0011553466320037842, -0.0010637640953063965, -0.0009721815586090088, -0.0008805990219116211, -0.0007890164852142334, -0.0006974339485168457, -0.000605851411819458, -0.0005142688751220703, -0.0004226863384246826, -0.0003311038017272949, -0.00023952126502990723, -0.00014793872833251953, -5.6356191635131836e-05, 3.522634506225586e-05, 0.00012680888175964355, 0.00021839141845703125, 0.00030997395515441895, 0.00040155649185180664, 0.0004931390285491943, 0.000584721565246582, 0.0006763041019439697, 0.0007678866386413574, 0.0008594691753387451, 0.0009510517120361328, 0.0010426342487335205, 0.0011342167854309082, 0.001225799322128296, 0.0013173818588256836, 0.0014089643955230713, 0.001500546932220459, 0.0015921294689178467, 0.0016837120056152344, 0.001775294542312622, 0.0018668770790100098, 0.0019584596157073975, 0.002050042152404785, 0.002141624689102173, 0.0022332072257995605, 0.0023247897624969482, 0.002416372299194336, 0.0025079548358917236, 0.0025995373725891113, 0.002691119909286499, 0.0027827024459838867, 0.0028742849826812744, 0.002965867519378662, 0.00305745005607605, 0.0031490325927734375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 4.0, 7.0, 8.0, 6.0, 5.0, 10.0, 24.0, 14.0, 26.0, 22.0, 41.0, 63.0, 82.0, 102.0, 152.0, 217.0, 376.0, 617.0, 1405.0, 584950.0, 457275.0, 1401.0, 610.0, 358.0, 208.0, 143.0, 98.0, 72.0, 73.0, 46.0, 31.0, 33.0, 15.0, 8.0, 7.0, 5.0, 3.0, 3.0, 5.0, 4.0, 4.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.053497314453125, -0.05196809768676758, -0.050438880920410156, -0.048909664154052734, -0.04738044738769531, -0.04585123062133789, -0.04432201385498047, -0.04279279708862305, -0.041263580322265625, -0.0397343635559082, -0.03820514678955078, -0.03667593002319336, -0.03514671325683594, -0.033617496490478516, -0.032088279724121094, -0.030559062957763672, -0.02902984619140625, -0.027500629425048828, -0.025971412658691406, -0.024442195892333984, -0.022912979125976562, -0.02138376235961914, -0.01985454559326172, -0.018325328826904297, -0.016796112060546875, -0.015266895294189453, -0.013737678527832031, -0.01220846176147461, -0.010679244995117188, -0.009150028228759766, -0.007620811462402344, -0.006091594696044922, -0.0045623779296875, -0.003033161163330078, -0.0015039443969726562, 2.5272369384765625e-05, 0.0015544891357421875, 0.0030837059020996094, 0.004612922668457031, 0.006142139434814453, 0.007671356201171875, 0.009200572967529297, 0.010729789733886719, 0.01225900650024414, 0.013788223266601562, 0.015317440032958984, 0.016846656799316406, 0.018375873565673828, 0.01990509033203125, 0.021434307098388672, 0.022963523864746094, 0.024492740631103516, 0.026021957397460938, 0.02755117416381836, 0.02908039093017578, 0.030609607696533203, 0.032138824462890625, 0.03366804122924805, 0.03519725799560547, 0.03672647476196289, 0.03825569152832031, 0.039784908294677734, 0.041314125061035156, 0.04284334182739258, 0.04437255859375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 12.0, 100.0, 471.0, 371.0, 58.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008021735586225986, -0.007834665477275848, -0.007647596299648285, -0.007460526656359434, -0.007273457013070583, -0.007086386904120445, -0.0068993172608315945, -0.006712247617542744, -0.006525177974253893, -0.006338108330965042, -0.006151038687676191, -0.0059639690443873405, -0.0057768989354372025, -0.005589829292148352, -0.005402759648859501, -0.00521569000557065, -0.005028620362281799, -0.0048415507189929485, -0.004654481075704098, -0.004467411432415247, -0.004280341789126396, -0.004093271680176258, -0.0039062020368874073, -0.0037191323935985565, -0.0035320627503097057, -0.003344993107020855, -0.003157923463732004, -0.0029708535876125097, -0.002783783944323659, -0.002596714301034808, -0.0024096444249153137, -0.002222574781626463, -0.002035504672676325, -0.001848435029387474, -0.0016613652696833014, -0.0014742955099791288, -0.001287225866690278, -0.0011001562234014273, -0.0009130864636972547, -0.000726016703993082, -0.0005389470607042313, -0.00035187735920771956, -0.00016480765771120787, 2.226204378530383e-05, 0.00020933174528181553, 0.0003964014467783272, 0.0005834711482748389, 0.0007705409079790115, 0.0009576105512678623, 0.001144680194556713, 0.0013317499542608857, 0.0015188197139650583, 0.0017058893572539091, 0.00189295900054276, 0.0020800288766622543, 0.002267098519951105, 0.002454168163239956, 0.0026412378065288067, 0.0028283074498176575, 0.003015377325937152, 0.0032024469692260027, 0.0033895166125148535, 0.003576586488634348, 0.0037636561319231987, 0.0039507257752120495]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 6.0, 8.0, 6.0, 10.0, 14.0, 15.0, 8.0, 18.0, 24.0, 19.0, 28.0, 31.0, 36.0, 40.0, 50.0, 36.0, 48.0, 54.0, 52.0, 61.0, 47.0, 42.0, 44.0, 35.0, 35.0, 35.0, 36.0, 26.0, 25.0, 13.0, 22.0, 10.0, 15.0, 14.0, 7.0, 10.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00129777193069458, -0.0012513287365436554, -0.0012048855423927307, -0.001158442348241806, -0.0011119991540908813, -0.0010655559599399567, -0.001019112765789032, -0.0009726695716381073, -0.0009262263774871826, -0.0008797831833362579, -0.0008333399891853333, -0.0007868967950344086, -0.0007404536008834839, -0.0006940104067325592, -0.0006475672125816345, -0.0006011240184307098, -0.0005546808242797852, -0.0005082376301288605, -0.0004617944359779358, -0.0004153512418270111, -0.0003689080476760864, -0.00032246485352516174, -0.00027602165937423706, -0.00022957846522331238, -0.0001831352710723877, -0.000136692076921463, -9.024888277053833e-05, -4.380568861961365e-05, 2.637505531311035e-06, 4.908069968223572e-05, 9.55238938331604e-05, 0.00014196708798408508, 0.00018841028213500977, 0.00023485347628593445, 0.00028129667043685913, 0.0003277398645877838, 0.0003741830587387085, 0.0004206262528896332, 0.00046706944704055786, 0.0005135126411914825, 0.0005599558353424072, 0.0006063990294933319, 0.0006528422236442566, 0.0006992854177951813, 0.000745728611946106, 0.0007921718060970306, 0.0008386150002479553, 0.00088505819439888, 0.0009315013885498047, 0.0009779445827007294, 0.001024387776851654, 0.0010708309710025787, 0.0011172741651535034, 0.001163717359304428, 0.0012101605534553528, 0.0012566037476062775, 0.0013030469417572021, 0.0013494901359081268, 0.0013959333300590515, 0.0014423765242099762, 0.0014888197183609009, 0.0015352629125118256, 0.0015817061066627502, 0.001628149300813675, 0.0016745924949645996]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 2.0, 2.0, 4.0, 3.0, 8.0, 4.0, 4.0, 10.0, 7.0, 15.0, 21.0, 15.0, 18.0, 16.0, 25.0, 18.0, 26.0, 20.0, 27.0, 36.0, 24.0, 42.0, 40.0, 53.0, 32.0, 49.0, 33.0, 49.0, 31.0, 31.0, 39.0, 28.0, 27.0, 34.0, 25.0, 28.0, 23.0, 14.0, 19.0, 11.0, 22.0, 15.0, 12.0, 11.0, 7.0, 9.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-9.3046875, -8.9827880859375, -8.660888671875, -8.3389892578125, -8.01708984375, -7.6951904296875, -7.373291015625, -7.0513916015625, -6.7294921875, -6.4075927734375, -6.085693359375, -5.7637939453125, -5.44189453125, -5.1199951171875, -4.798095703125, -4.4761962890625, -4.154296875, -3.8323974609375, -3.510498046875, -3.1885986328125, -2.86669921875, -2.5447998046875, -2.222900390625, -1.9010009765625, -1.5791015625, -1.2572021484375, -0.935302734375, -0.6134033203125, -0.29150390625, 0.0303955078125, 0.352294921875, 0.6741943359375, 0.99609375, 1.3179931640625, 1.639892578125, 1.9617919921875, 2.28369140625, 2.6055908203125, 2.927490234375, 3.2493896484375, 3.5712890625, 3.8931884765625, 4.215087890625, 4.5369873046875, 4.85888671875, 5.1807861328125, 5.502685546875, 5.8245849609375, 6.146484375, 6.4683837890625, 6.790283203125, 7.1121826171875, 7.43408203125, 7.7559814453125, 8.077880859375, 8.3997802734375, 8.7216796875, 9.0435791015625, 9.365478515625, 9.6873779296875, 10.00927734375, 10.3311767578125, 10.653076171875, 10.9749755859375, 11.296875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 5.0, 1.0, 5.0, 8.0, 7.0, 12.0, 12.0, 19.0, 23.0, 40.0, 44.0, 56.0, 99.0, 94.0, 150.0, 196.0, 298.0, 377.0, 443.0, 612.0, 819.0, 1154.0, 1891.0, 4145.0, 14035.0, 71630.0, 419636.0, 433038.0, 74598.0, 14326.0, 4291.0, 2002.0, 1165.0, 851.0, 598.0, 466.0, 388.0, 266.0, 179.0, 157.0, 106.0, 83.0, 71.0, 46.0, 29.0, 22.0, 17.0, 19.0, 10.0, 10.0, 5.0, 6.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-18.609375, -18.00927734375, -17.4091796875, -16.80908203125, -16.208984375, -15.60888671875, -15.0087890625, -14.40869140625, -13.80859375, -13.20849609375, -12.6083984375, -12.00830078125, -11.408203125, -10.80810546875, -10.2080078125, -9.60791015625, -9.0078125, -8.40771484375, -7.8076171875, -7.20751953125, -6.607421875, -6.00732421875, -5.4072265625, -4.80712890625, -4.20703125, -3.60693359375, -3.0068359375, -2.40673828125, -1.806640625, -1.20654296875, -0.6064453125, -0.00634765625, 0.59375, 1.19384765625, 1.7939453125, 2.39404296875, 2.994140625, 3.59423828125, 4.1943359375, 4.79443359375, 5.39453125, 5.99462890625, 6.5947265625, 7.19482421875, 7.794921875, 8.39501953125, 8.9951171875, 9.59521484375, 10.1953125, 10.79541015625, 11.3955078125, 11.99560546875, 12.595703125, 13.19580078125, 13.7958984375, 14.39599609375, 14.99609375, 15.59619140625, 16.1962890625, 16.79638671875, 17.396484375, 17.99658203125, 18.5966796875, 19.19677734375, 19.796875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 4.0, 6.0, 2.0, 7.0, 11.0, 11.0, 17.0, 19.0, 16.0, 21.0, 26.0, 26.0, 31.0, 38.0, 43.0, 54.0, 80.0, 107.0, 404.0, 1504.0, 126.0, 73.0, 55.0, 58.0, 42.0, 40.0, 32.0, 23.0, 25.0, 35.0, 17.0, 23.0, 11.0, 14.0, 6.0, 10.0, 5.0, 2.0, 7.0, 4.0, 3.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-31.046875, -30.1611328125, -29.275390625, -28.3896484375, -27.50390625, -26.6181640625, -25.732421875, -24.8466796875, -23.9609375, -23.0751953125, -22.189453125, -21.3037109375, -20.41796875, -19.5322265625, -18.646484375, -17.7607421875, -16.875, -15.9892578125, -15.103515625, -14.2177734375, -13.33203125, -12.4462890625, -11.560546875, -10.6748046875, -9.7890625, -8.9033203125, -8.017578125, -7.1318359375, -6.24609375, -5.3603515625, -4.474609375, -3.5888671875, -2.703125, -1.8173828125, -0.931640625, -0.0458984375, 0.83984375, 1.7255859375, 2.611328125, 3.4970703125, 4.3828125, 5.2685546875, 6.154296875, 7.0400390625, 7.92578125, 8.8115234375, 9.697265625, 10.5830078125, 11.46875, 12.3544921875, 13.240234375, 14.1259765625, 15.01171875, 15.8974609375, 16.783203125, 17.6689453125, 18.5546875, 19.4404296875, 20.326171875, 21.2119140625, 22.09765625, 22.9833984375, 23.869140625, 24.7548828125, 25.640625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 3.0, 7.0, 9.0, 7.0, 9.0, 14.0, 13.0, 9.0, 17.0, 23.0, 25.0, 36.0, 42.0, 53.0, 87.0, 140.0, 194.0, 356.0, 585.0, 1367.0, 52055.0, 3085553.0, 3103.0, 830.0, 412.0, 226.0, 151.0, 107.0, 58.0, 43.0, 45.0, 32.0, 15.0, 10.0, 9.0, 10.0, 6.0, 10.0, 6.0, 6.0, 3.0, 9.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0], "bins": [-115.875, -112.7646484375, -109.654296875, -106.5439453125, -103.43359375, -100.3232421875, -97.212890625, -94.1025390625, -90.9921875, -87.8818359375, -84.771484375, -81.6611328125, -78.55078125, -75.4404296875, -72.330078125, -69.2197265625, -66.109375, -62.9990234375, -59.888671875, -56.7783203125, -53.66796875, -50.5576171875, -47.447265625, -44.3369140625, -41.2265625, -38.1162109375, -35.005859375, -31.8955078125, -28.78515625, -25.6748046875, -22.564453125, -19.4541015625, -16.34375, -13.2333984375, -10.123046875, -7.0126953125, -3.90234375, -0.7919921875, 2.318359375, 5.4287109375, 8.5390625, 11.6494140625, 14.759765625, 17.8701171875, 20.98046875, 24.0908203125, 27.201171875, 30.3115234375, 33.421875, 36.5322265625, 39.642578125, 42.7529296875, 45.86328125, 48.9736328125, 52.083984375, 55.1943359375, 58.3046875, 61.4150390625, 64.525390625, 67.6357421875, 70.74609375, 73.8564453125, 76.966796875, 80.0771484375, 83.1875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 50.0, 329.0, 527.0, 104.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.00137329101562, -148.02281188964844, -141.0442352294922, -134.065673828125, -127.08710479736328, -120.10853576660156, -113.12997436523438, -106.15140533447266, -99.17283630371094, -92.19426727294922, -85.21570587158203, -78.23713684082031, -71.2585678100586, -64.27999877929688, -57.30143737792969, -50.32286834716797, -43.34430694580078, -36.36574172973633, -29.38717269897461, -22.408607482910156, -15.43004035949707, -8.451473236083984, -1.4729080200195312, 5.5056610107421875, 12.48422622680664, 19.462793350219727, 26.441360473632812, 33.419925689697266, 40.39849090576172, 47.37705993652344, 54.35562515258789, 61.33419418334961, 68.31275939941406, 75.29132843017578, 82.26988983154297, 89.24845886230469, 96.2270278930664, 103.20559692382812, 110.18415832519531, 117.16272735595703, 124.14129638671875, 131.11985778808594, 138.0984344482422, 145.07699584960938, 152.05555725097656, 159.0341339111328, 166.0126953125, 172.99127197265625, 179.96981811523438, 186.94837951660156, 193.9269561767578, 200.905517578125, 207.8840789794922, 214.86265563964844, 221.84121704101562, 228.81979370117188, 235.79835510253906, 242.77691650390625, 249.7554931640625, 256.73406982421875, 263.7126159667969, 270.6911926269531, 277.66973876953125, 284.6483154296875, 291.62689208984375]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 5.0, 13.0, 13.0, 16.0, 8.0, 18.0, 9.0, 20.0, 28.0, 16.0, 25.0, 21.0, 28.0, 38.0, 26.0, 30.0, 42.0, 48.0, 43.0, 47.0, 36.0, 43.0, 40.0, 34.0, 37.0, 29.0, 40.0, 34.0, 31.0, 29.0, 30.0, 14.0, 18.0, 10.0, 20.0, 15.0, 6.0, 4.0, 4.0, 6.0, 7.0, 10.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0], "bins": [-77.30536651611328, -75.1236343383789, -72.94190979003906, -70.76017761230469, -68.57844543457031, -66.39671325683594, -64.2149887084961, -62.03325653076172, -59.851524353027344, -57.669795989990234, -55.48806381225586, -53.30633544921875, -51.124603271484375, -48.942874908447266, -46.761146545410156, -44.57941436767578, -42.39768600463867, -40.21595764160156, -38.03422546386719, -35.85249710083008, -33.6707649230957, -31.489036560058594, -29.30730628967285, -27.12557601928711, -24.943845748901367, -22.762115478515625, -20.580385208129883, -18.39865493774414, -16.21692657470703, -14.035195350646973, -11.853466033935547, -9.671735763549805, -7.4900054931640625, -5.30827522277832, -3.1265454292297363, -0.9448156356811523, 1.2369146347045898, 3.418644905090332, 5.600374221801758, 7.7821044921875, 9.963834762573242, 12.145565032958984, 14.327295303344727, 16.50902557373047, 18.690753936767578, 20.872486114501953, 23.054214477539062, 25.235944747924805, 27.417675018310547, 29.59940528869629, 31.78113555908203, 33.96286392211914, 36.144596099853516, 38.326324462890625, 40.508056640625, 42.68978500366211, 44.87151336669922, 47.05324172973633, 49.2349739074707, 51.41670227050781, 53.59843444824219, 55.7801628112793, 57.961891174316406, 60.14362335205078, 62.325355529785156]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 6.0, 5.0, 3.0, 8.0, 13.0, 17.0, 17.0, 17.0, 20.0, 19.0, 28.0, 25.0, 42.0, 27.0, 34.0, 40.0, 37.0, 35.0, 47.0, 54.0, 38.0, 36.0, 49.0, 41.0, 34.0, 27.0, 33.0, 33.0, 40.0, 24.0, 20.0, 18.0, 17.0, 15.0, 15.0, 12.0, 12.0, 8.0, 10.0, 3.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.53125, -9.181396484375, -8.83154296875, -8.481689453125, -8.1318359375, -7.781982421875, -7.43212890625, -7.082275390625, -6.732421875, -6.382568359375, -6.03271484375, -5.682861328125, -5.3330078125, -4.983154296875, -4.63330078125, -4.283447265625, -3.93359375, -3.583740234375, -3.23388671875, -2.884033203125, -2.5341796875, -2.184326171875, -1.83447265625, -1.484619140625, -1.134765625, -0.784912109375, -0.43505859375, -0.085205078125, 0.2646484375, 0.614501953125, 0.96435546875, 1.314208984375, 1.6640625, 2.013916015625, 2.36376953125, 2.713623046875, 3.0634765625, 3.413330078125, 3.76318359375, 4.113037109375, 4.462890625, 4.812744140625, 5.16259765625, 5.512451171875, 5.8623046875, 6.212158203125, 6.56201171875, 6.911865234375, 7.26171875, 7.611572265625, 7.96142578125, 8.311279296875, 8.6611328125, 9.010986328125, 9.36083984375, 9.710693359375, 10.060546875, 10.410400390625, 10.76025390625, 11.110107421875, 11.4599609375, 11.809814453125, 12.15966796875, 12.509521484375, 12.859375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 3.0, 8.0, 10.0, 10.0, 17.0, 19.0, 18.0, 36.0, 39.0, 43.0, 68.0, 83.0, 105.0, 172.0, 266.0, 453.0, 1136.0, 3186.0, 15300.0, 227280.0, 2921422.0, 975070.0, 39895.0, 6127.0, 1786.0, 663.0, 333.0, 204.0, 131.0, 93.0, 61.0, 59.0, 43.0, 34.0, 25.0, 18.0, 12.0, 16.0, 10.0, 5.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-32.53125, -31.566650390625, -30.60205078125, -29.637451171875, -28.6728515625, -27.708251953125, -26.74365234375, -25.779052734375, -24.814453125, -23.849853515625, -22.88525390625, -21.920654296875, -20.9560546875, -19.991455078125, -19.02685546875, -18.062255859375, -17.09765625, -16.133056640625, -15.16845703125, -14.203857421875, -13.2392578125, -12.274658203125, -11.31005859375, -10.345458984375, -9.380859375, -8.416259765625, -7.45166015625, -6.487060546875, -5.5224609375, -4.557861328125, -3.59326171875, -2.628662109375, -1.6640625, -0.699462890625, 0.26513671875, 1.229736328125, 2.1943359375, 3.158935546875, 4.12353515625, 5.088134765625, 6.052734375, 7.017333984375, 7.98193359375, 8.946533203125, 9.9111328125, 10.875732421875, 11.84033203125, 12.804931640625, 13.76953125, 14.734130859375, 15.69873046875, 16.663330078125, 17.6279296875, 18.592529296875, 19.55712890625, 20.521728515625, 21.486328125, 22.450927734375, 23.41552734375, 24.380126953125, 25.3447265625, 26.309326171875, 27.27392578125, 28.238525390625, 29.203125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 12.0, 19.0, 21.0, 45.0, 66.0, 73.0, 60.0, 113.0, 145.0, 214.0, 289.0, 481.0, 653.0, 559.0, 401.0, 271.0, 170.0, 118.0, 92.0, 57.0, 55.0, 42.0, 32.0, 16.0, 10.0, 18.0, 9.0, 10.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-25.953125, -25.283203125, -24.61328125, -23.943359375, -23.2734375, -22.603515625, -21.93359375, -21.263671875, -20.59375, -19.923828125, -19.25390625, -18.583984375, -17.9140625, -17.244140625, -16.57421875, -15.904296875, -15.234375, -14.564453125, -13.89453125, -13.224609375, -12.5546875, -11.884765625, -11.21484375, -10.544921875, -9.875, -9.205078125, -8.53515625, -7.865234375, -7.1953125, -6.525390625, -5.85546875, -5.185546875, -4.515625, -3.845703125, -3.17578125, -2.505859375, -1.8359375, -1.166015625, -0.49609375, 0.173828125, 0.84375, 1.513671875, 2.18359375, 2.853515625, 3.5234375, 4.193359375, 4.86328125, 5.533203125, 6.203125, 6.873046875, 7.54296875, 8.212890625, 8.8828125, 9.552734375, 10.22265625, 10.892578125, 11.5625, 12.232421875, 12.90234375, 13.572265625, 14.2421875, 14.912109375, 15.58203125, 16.251953125, 16.921875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 11.0, 23.0, 42.0, 71.0, 114.0, 257.0, 652.0, 2369.0, 32903.0, 4035404.0, 117573.0, 3360.0, 865.0, 293.0, 152.0, 74.0, 48.0, 23.0, 16.0, 10.0, 9.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-89.8125, -87.4248046875, -85.037109375, -82.6494140625, -80.26171875, -77.8740234375, -75.486328125, -73.0986328125, -70.7109375, -68.3232421875, -65.935546875, -63.5478515625, -61.16015625, -58.7724609375, -56.384765625, -53.9970703125, -51.609375, -49.2216796875, -46.833984375, -44.4462890625, -42.05859375, -39.6708984375, -37.283203125, -34.8955078125, -32.5078125, -30.1201171875, -27.732421875, -25.3447265625, -22.95703125, -20.5693359375, -18.181640625, -15.7939453125, -13.40625, -11.0185546875, -8.630859375, -6.2431640625, -3.85546875, -1.4677734375, 0.919921875, 3.3076171875, 5.6953125, 8.0830078125, 10.470703125, 12.8583984375, 15.24609375, 17.6337890625, 20.021484375, 22.4091796875, 24.796875, 27.1845703125, 29.572265625, 31.9599609375, 34.34765625, 36.7353515625, 39.123046875, 41.5107421875, 43.8984375, 46.2861328125, 48.673828125, 51.0615234375, 53.44921875, 55.8369140625, 58.224609375, 60.6123046875, 63.0]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 37.0, 868.0, 110.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1249.329345703125, -1227.6512451171875, -1205.97314453125, -1184.295166015625, -1162.6170654296875, -1140.93896484375, -1119.260986328125, -1097.5828857421875, -1075.90478515625, -1054.2266845703125, -1032.548583984375, -1010.87060546875, -989.1925048828125, -967.514404296875, -945.8363647460938, -924.1583251953125, -902.480224609375, -880.8021240234375, -859.1240844726562, -837.446044921875, -815.7679443359375, -794.08984375, -772.4118041992188, -750.7337646484375, -729.0556640625, -707.3775634765625, -685.6995239257812, -664.021484375, -642.3433837890625, -620.665283203125, -598.9872436523438, -577.3092041015625, -555.631103515625, -533.9530029296875, -512.2749633789062, -490.5968933105469, -468.9188232421875, -447.2407531738281, -425.56268310546875, -403.8846130371094, -382.20654296875, -360.5284729003906, -338.85040283203125, -317.1723327636719, -295.4942626953125, -273.8161926269531, -252.13812255859375, -230.46005249023438, -208.78199768066406, -187.1039276123047, -165.4258575439453, -143.74778747558594, -122.06971740722656, -100.39164733886719, -78.71357727050781, -57.03550720214844, -35.35743713378906, -13.679367065429688, 7.9987030029296875, 29.676773071289062, 51.35484313964844, 73.03291320800781, 94.71098327636719, 116.38905334472656, 138.06712341308594]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 5.0, 7.0, 7.0, 3.0, 8.0, 12.0, 6.0, 15.0, 13.0, 26.0, 28.0, 19.0, 32.0, 34.0, 24.0, 31.0, 35.0, 43.0, 49.0, 39.0, 41.0, 62.0, 53.0, 48.0, 35.0, 35.0, 40.0, 30.0, 22.0, 35.0, 27.0, 19.0, 21.0, 12.0, 20.0, 15.0, 13.0, 8.0, 2.0, 8.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-80.67355346679688, -78.47052764892578, -76.26750946044922, -74.06448364257812, -71.86146545410156, -69.65843963623047, -67.45541381835938, -65.25239562988281, -63.04936981201172, -60.84634780883789, -58.64332580566406, -56.44029998779297, -54.23727798461914, -52.03425598144531, -49.831233978271484, -47.628211975097656, -45.42518997192383, -43.22216796875, -41.01914596557617, -38.816123962402344, -36.61309814453125, -34.41007614135742, -32.207054138183594, -30.004032135009766, -27.801008224487305, -25.597986221313477, -23.394962310791016, -21.191940307617188, -18.98891830444336, -16.7858943939209, -14.58287239074707, -12.379849433898926, -10.176826477050781, -7.973803520202637, -5.77078104019165, -3.567758560180664, -1.3647356033325195, 0.838287353515625, 3.041309356689453, 5.244332313537598, 7.447355270385742, 9.650378227233887, 11.853401184082031, 14.05642318725586, 16.259445190429688, 18.46246910095215, 20.665491104125977, 22.868515014648438, 25.071537017822266, 27.274559020996094, 29.477582931518555, 31.680604934692383, 33.883628845214844, 36.08665084838867, 38.2896728515625, 40.49269485473633, 42.695716857910156, 44.898738861083984, 47.10176086425781, 49.304786682128906, 51.507808685302734, 53.71083068847656, 55.91385269165039, 58.11687469482422, 60.31990051269531]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 6.0, 5.0, 10.0, 12.0, 16.0, 13.0, 13.0, 23.0, 24.0, 29.0, 38.0, 33.0, 43.0, 47.0, 44.0, 48.0, 44.0, 43.0, 34.0, 41.0, 39.0, 46.0, 44.0, 34.0, 39.0, 29.0, 41.0, 26.0, 21.0, 28.0, 15.0, 13.0, 13.0, 10.0, 10.0, 10.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.43310546875, -7.1396484375, -6.84619140625, -6.552734375, -6.25927734375, -5.9658203125, -5.67236328125, -5.37890625, -5.08544921875, -4.7919921875, -4.49853515625, -4.205078125, -3.91162109375, -3.6181640625, -3.32470703125, -3.03125, -2.73779296875, -2.4443359375, -2.15087890625, -1.857421875, -1.56396484375, -1.2705078125, -0.97705078125, -0.68359375, -0.39013671875, -0.0966796875, 0.19677734375, 0.490234375, 0.78369140625, 1.0771484375, 1.37060546875, 1.6640625, 1.95751953125, 2.2509765625, 2.54443359375, 2.837890625, 3.13134765625, 3.4248046875, 3.71826171875, 4.01171875, 4.30517578125, 4.5986328125, 4.89208984375, 5.185546875, 5.47900390625, 5.7724609375, 6.06591796875, 6.359375, 6.65283203125, 6.9462890625, 7.23974609375, 7.533203125, 7.82666015625, 8.1201171875, 8.41357421875, 8.70703125, 9.00048828125, 9.2939453125, 9.58740234375, 9.880859375, 10.17431640625, 10.4677734375, 10.76123046875, 11.0546875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 8.0, 4.0, 9.0, 14.0, 18.0, 24.0, 38.0, 52.0, 76.0, 150.0, 231.0, 384.0, 655.0, 1076.0, 1929.0, 3248.0, 5529.0, 9897.0, 17208.0, 30398.0, 54229.0, 97185.0, 177252.0, 263811.0, 171365.0, 93386.0, 52025.0, 29023.0, 16836.0, 9469.0, 5412.0, 3115.0, 1815.0, 1087.0, 635.0, 367.0, 220.0, 145.0, 81.0, 51.0, 29.0, 19.0, 13.0, 14.0, 6.0, 6.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.5927734375, -1.5437164306640625, -1.494659423828125, -1.4456024169921875, -1.39654541015625, -1.3474884033203125, -1.298431396484375, -1.2493743896484375, -1.2003173828125, -1.1512603759765625, -1.102203369140625, -1.0531463623046875, -1.00408935546875, -0.9550323486328125, -0.905975341796875, -0.8569183349609375, -0.807861328125, -0.7588043212890625, -0.709747314453125, -0.6606903076171875, -0.61163330078125, -0.5625762939453125, -0.513519287109375, -0.4644622802734375, -0.4154052734375, -0.3663482666015625, -0.317291259765625, -0.2682342529296875, -0.21917724609375, -0.1701202392578125, -0.121063232421875, -0.0720062255859375, -0.02294921875, 0.0261077880859375, 0.075164794921875, 0.1242218017578125, 0.17327880859375, 0.2223358154296875, 0.271392822265625, 0.3204498291015625, 0.3695068359375, 0.4185638427734375, 0.467620849609375, 0.5166778564453125, 0.56573486328125, 0.6147918701171875, 0.663848876953125, 0.7129058837890625, 0.761962890625, 0.8110198974609375, 0.860076904296875, 0.9091339111328125, 0.95819091796875, 1.0072479248046875, 1.056304931640625, 1.1053619384765625, 1.1544189453125, 1.2034759521484375, 1.252532958984375, 1.3015899658203125, 1.35064697265625, 1.3997039794921875, 1.448760986328125, 1.4978179931640625, 1.546875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 9.0, 4.0, 12.0, 9.0, 18.0, 22.0, 24.0, 23.0, 17.0, 28.0, 26.0, 37.0, 30.0, 27.0, 32.0, 47.0, 28.0, 41.0, 1064.0, 34.0, 41.0, 47.0, 38.0, 36.0, 43.0, 33.0, 28.0, 30.0, 22.0, 34.0, 25.0, 15.0, 15.0, 13.0, 16.0, 10.0, 10.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6171875, -4.44537353515625, -4.2735595703125, -4.10174560546875, -3.929931640625, -3.75811767578125, -3.5863037109375, -3.41448974609375, -3.24267578125, -3.07086181640625, -2.8990478515625, -2.72723388671875, -2.555419921875, -2.38360595703125, -2.2117919921875, -2.03997802734375, -1.8681640625, -1.69635009765625, -1.5245361328125, -1.35272216796875, -1.180908203125, -1.00909423828125, -0.8372802734375, -0.66546630859375, -0.49365234375, -0.32183837890625, -0.1500244140625, 0.02178955078125, 0.193603515625, 0.36541748046875, 0.5372314453125, 0.70904541015625, 0.880859375, 1.05267333984375, 1.2244873046875, 1.39630126953125, 1.568115234375, 1.73992919921875, 1.9117431640625, 2.08355712890625, 2.25537109375, 2.42718505859375, 2.5989990234375, 2.77081298828125, 2.942626953125, 3.11444091796875, 3.2862548828125, 3.45806884765625, 3.6298828125, 3.80169677734375, 3.9735107421875, 4.14532470703125, 4.317138671875, 4.48895263671875, 4.6607666015625, 4.83258056640625, 5.00439453125, 5.17620849609375, 5.3480224609375, 5.51983642578125, 5.691650390625, 5.86346435546875, 6.0352783203125, 6.20709228515625, 6.37890625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 7.0, 14.0, 20.0, 38.0, 48.0, 73.0, 100.0, 148.0, 216.0, 323.0, 461.0, 684.0, 1037.0, 1492.0, 2314.0, 3425.0, 5283.0, 8004.0, 11987.0, 18794.0, 28827.0, 45585.0, 71928.0, 113044.0, 175366.0, 1243680.0, 131286.0, 83446.0, 52886.0, 33833.0, 21450.0, 14190.0, 9228.0, 6067.0, 3902.0, 2569.0, 1726.0, 1222.0, 797.0, 542.0, 354.0, 235.0, 155.0, 110.0, 63.0, 61.0, 37.0, 15.0, 23.0, 7.0, 10.0, 7.0, 4.0, 2.0, 3.0, 0.0, 3.0], "bins": [-1.1328125, -1.09759521484375, -1.0623779296875, -1.02716064453125, -0.991943359375, -0.95672607421875, -0.9215087890625, -0.88629150390625, -0.85107421875, -0.81585693359375, -0.7806396484375, -0.74542236328125, -0.710205078125, -0.67498779296875, -0.6397705078125, -0.60455322265625, -0.5693359375, -0.53411865234375, -0.4989013671875, -0.46368408203125, -0.428466796875, -0.39324951171875, -0.3580322265625, -0.32281494140625, -0.28759765625, -0.25238037109375, -0.2171630859375, -0.18194580078125, -0.146728515625, -0.11151123046875, -0.0762939453125, -0.04107666015625, -0.005859375, 0.02935791015625, 0.0645751953125, 0.09979248046875, 0.135009765625, 0.17022705078125, 0.2054443359375, 0.24066162109375, 0.27587890625, 0.31109619140625, 0.3463134765625, 0.38153076171875, 0.416748046875, 0.45196533203125, 0.4871826171875, 0.52239990234375, 0.5576171875, 0.59283447265625, 0.6280517578125, 0.66326904296875, 0.698486328125, 0.73370361328125, 0.7689208984375, 0.80413818359375, 0.83935546875, 0.87457275390625, 0.9097900390625, 0.94500732421875, 0.980224609375, 1.01544189453125, 1.0506591796875, 1.08587646484375, 1.12109375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 5.0, 4.0, 11.0, 17.0, 11.0, 14.0, 21.0, 25.0, 19.0, 33.0, 42.0, 40.0, 61.0, 47.0, 55.0, 55.0, 65.0, 61.0, 51.0, 52.0, 52.0, 39.0, 28.0, 35.0, 33.0, 26.0, 16.0, 17.0, 10.0, 10.0, 15.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002025604248046875, -0.0019669532775878906, -0.0019083023071289062, -0.0018496513366699219, -0.0017910003662109375, -0.0017323493957519531, -0.0016736984252929688, -0.0016150474548339844, -0.001556396484375, -0.0014977455139160156, -0.0014390945434570312, -0.0013804435729980469, -0.0013217926025390625, -0.0012631416320800781, -0.0012044906616210938, -0.0011458396911621094, -0.001087188720703125, -0.0010285377502441406, -0.0009698867797851562, -0.0009112358093261719, -0.0008525848388671875, -0.0007939338684082031, -0.0007352828979492188, -0.0006766319274902344, -0.00061798095703125, -0.0005593299865722656, -0.0005006790161132812, -0.0004420280456542969, -0.0003833770751953125, -0.0003247261047363281, -0.00026607513427734375, -0.00020742416381835938, -0.000148773193359375, -9.012222290039062e-05, -3.147125244140625e-05, 2.7179718017578125e-05, 8.58306884765625e-05, 0.00014448165893554688, 0.00020313262939453125, 0.0002617835998535156, 0.0003204345703125, 0.0003790855407714844, 0.00043773651123046875, 0.0004963874816894531, 0.0005550384521484375, 0.0006136894226074219, 0.0006723403930664062, 0.0007309913635253906, 0.000789642333984375, 0.0008482933044433594, 0.0009069442749023438, 0.0009655952453613281, 0.0010242462158203125, 0.0010828971862792969, 0.0011415481567382812, 0.0012001991271972656, 0.00125885009765625, 0.0013175010681152344, 0.0013761520385742188, 0.0014348030090332031, 0.0014934539794921875, 0.0015521049499511719, 0.0016107559204101562, 0.0016694068908691406, 0.001728057861328125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 6.0, 12.0, 14.0, 12.0, 25.0, 24.0, 33.0, 46.0, 72.0, 104.0, 131.0, 174.0, 263.0, 441.0, 773.0, 4489.0, 1029541.0, 10002.0, 913.0, 456.0, 297.0, 202.0, 132.0, 87.0, 67.0, 69.0, 31.0, 42.0, 17.0, 19.0, 10.0, 9.0, 10.0, 7.0, 2.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.038787841796875, -0.03755903244018555, -0.036330223083496094, -0.03510141372680664, -0.03387260437011719, -0.032643795013427734, -0.03141498565673828, -0.030186176300048828, -0.028957366943359375, -0.027728557586669922, -0.02649974822998047, -0.025270938873291016, -0.024042129516601562, -0.02281332015991211, -0.021584510803222656, -0.020355701446533203, -0.01912689208984375, -0.017898082733154297, -0.016669273376464844, -0.01544046401977539, -0.014211654663085938, -0.012982845306396484, -0.011754035949707031, -0.010525226593017578, -0.009296417236328125, -0.008067607879638672, -0.006838798522949219, -0.005609989166259766, -0.0043811798095703125, -0.0031523704528808594, -0.0019235610961914062, -0.0006947517395019531, 0.0005340576171875, 0.0017628669738769531, 0.0029916763305664062, 0.004220485687255859, 0.0054492950439453125, 0.006678104400634766, 0.007906913757324219, 0.009135723114013672, 0.010364532470703125, 0.011593341827392578, 0.012822151184082031, 0.014050960540771484, 0.015279769897460938, 0.01650857925415039, 0.017737388610839844, 0.018966197967529297, 0.02019500732421875, 0.021423816680908203, 0.022652626037597656, 0.02388143539428711, 0.025110244750976562, 0.026339054107666016, 0.02756786346435547, 0.028796672821044922, 0.030025482177734375, 0.03125429153442383, 0.03248310089111328, 0.033711910247802734, 0.03494071960449219, 0.03616952896118164, 0.037398338317871094, 0.03862714767456055, 0.03985595703125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 65.0, 662.0, 278.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074579487554728985, -0.007230037357658148, -0.007002125959843397, -0.0067742145620286465, -0.006546303164213896, -0.006318391766399145, -0.006090480834245682, -0.005862569436430931, -0.00563465803861618, -0.00540674664080143, -0.005178835242986679, -0.004950923845171928, -0.004723012447357178, -0.004495101049542427, -0.004267189651727676, -0.004039278253912926, -0.003811366856098175, -0.0035834554582834244, -0.0033555440604686737, -0.003127632662653923, -0.0028997212648391724, -0.0026718098670244217, -0.0024438987020403147, -0.002215987304225564, -0.0019880759064108133, -0.0017601645085960627, -0.001532253110781312, -0.0013043418293818831, -0.0010764304315671325, -0.0008485190337523818, -0.000620607752352953, -0.0003926963545382023, -0.00016478542238473892, 6.312594632618129e-05, 0.0002910373150371015, 0.0005189486546441913, 0.0007468600524589419, 0.0009747714502736926, 0.0012026827316731215, 0.0014305941294878721, 0.0016585055273026228, 0.0018864169251173735, 0.002114328322932124, 0.002342239487916231, 0.002570150885730982, 0.0027980622835457325, 0.003025973681360483, 0.003253885079175234, 0.0034817964769899845, 0.003709707874804735, 0.003937619272619486, 0.0041655306704342365, 0.004393442068248987, 0.004621353466063738, 0.004849264398217201, 0.005077175796031952, 0.005305087193846703, 0.005532998591661453, 0.005760909989476204, 0.005988821387290955, 0.006216732785105705, 0.006444644182920456, 0.006672555580735207, 0.006900466978549957, 0.007128378376364708]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 2.0, 10.0, 5.0, 16.0, 12.0, 16.0, 20.0, 24.0, 24.0, 29.0, 34.0, 34.0, 48.0, 45.0, 46.0, 53.0, 45.0, 43.0, 40.0, 47.0, 44.0, 45.0, 48.0, 34.0, 37.0, 34.0, 36.0, 23.0, 14.0, 23.0, 17.0, 13.0, 8.0, 7.0, 5.0, 6.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012417435646057129, -0.001206129789352417, -0.001170516014099121, -0.0011349022388458252, -0.0010992884635925293, -0.0010636746883392334, -0.0010280609130859375, -0.0009924471378326416, -0.0009568333625793457, -0.0009212195873260498, -0.0008856058120727539, -0.000849992036819458, -0.0008143782615661621, -0.0007787644863128662, -0.0007431507110595703, -0.0007075369358062744, -0.0006719231605529785, -0.0006363093852996826, -0.0006006956100463867, -0.0005650818347930908, -0.0005294680595397949, -0.000493854284286499, -0.0004582405090332031, -0.0004226267337799072, -0.00038701295852661133, -0.00035139918327331543, -0.00031578540802001953, -0.00028017163276672363, -0.00024455785751342773, -0.00020894408226013184, -0.00017333030700683594, -0.00013771653175354004, -0.00010210275650024414, -6.648898124694824e-05, -3.0875205993652344e-05, 4.738569259643555e-06, 4.035234451293945e-05, 7.596611976623535e-05, 0.00011157989501953125, 0.00014719367027282715, 0.00018280744552612305, 0.00021842122077941895, 0.00025403499603271484, 0.00028964877128601074, 0.00032526254653930664, 0.00036087632179260254, 0.00039649009704589844, 0.00043210387229919434, 0.00046771764755249023, 0.0005033314228057861, 0.000538945198059082, 0.0005745589733123779, 0.0006101727485656738, 0.0006457865238189697, 0.0006814002990722656, 0.0007170140743255615, 0.0007526278495788574, 0.0007882416248321533, 0.0008238554000854492, 0.0008594691753387451, 0.000895082950592041, 0.0009306967258453369, 0.0009663105010986328, 0.0010019242763519287, 0.0010375380516052246]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 3.0, 4.0, 6.0, 5.0, 10.0, 12.0, 17.0, 12.0, 13.0, 23.0, 24.0, 29.0, 38.0, 33.0, 43.0, 47.0, 44.0, 48.0, 44.0, 43.0, 34.0, 41.0, 39.0, 46.0, 44.0, 34.0, 39.0, 29.0, 41.0, 26.0, 21.0, 28.0, 15.0, 13.0, 13.0, 10.0, 10.0, 10.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.7265625, -7.43310546875, -7.1396484375, -6.84619140625, -6.552734375, -6.25927734375, -5.9658203125, -5.67236328125, -5.37890625, -5.08544921875, -4.7919921875, -4.49853515625, -4.205078125, -3.91162109375, -3.6181640625, -3.32470703125, -3.03125, -2.73779296875, -2.4443359375, -2.15087890625, -1.857421875, -1.56396484375, -1.2705078125, -0.97705078125, -0.68359375, -0.39013671875, -0.0966796875, 0.19677734375, 0.490234375, 0.78369140625, 1.0771484375, 1.37060546875, 1.6640625, 1.95751953125, 2.2509765625, 2.54443359375, 2.837890625, 3.13134765625, 3.4248046875, 3.71826171875, 4.01171875, 4.30517578125, 4.5986328125, 4.89208984375, 5.185546875, 5.47900390625, 5.7724609375, 6.06591796875, 6.359375, 6.65283203125, 6.9462890625, 7.23974609375, 7.533203125, 7.82666015625, 8.1201171875, 8.41357421875, 8.70703125, 9.00048828125, 9.2939453125, 9.58740234375, 9.880859375, 10.17431640625, 10.4677734375, 10.76123046875, 11.0546875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 6.0, 5.0, 6.0, 13.0, 17.0, 34.0, 36.0, 67.0, 78.0, 101.0, 188.0, 270.0, 467.0, 664.0, 1045.0, 1604.0, 2959.0, 6359.0, 23034.0, 272233.0, 668350.0, 52175.0, 9500.0, 3847.0, 2021.0, 1236.0, 743.0, 532.0, 307.0, 211.0, 139.0, 110.0, 67.0, 39.0, 38.0, 24.0, 5.0, 4.0, 7.0, 10.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-28.5, -27.690185546875, -26.88037109375, -26.070556640625, -25.2607421875, -24.450927734375, -23.64111328125, -22.831298828125, -22.021484375, -21.211669921875, -20.40185546875, -19.592041015625, -18.7822265625, -17.972412109375, -17.16259765625, -16.352783203125, -15.54296875, -14.733154296875, -13.92333984375, -13.113525390625, -12.3037109375, -11.493896484375, -10.68408203125, -9.874267578125, -9.064453125, -8.254638671875, -7.44482421875, -6.635009765625, -5.8251953125, -5.015380859375, -4.20556640625, -3.395751953125, -2.5859375, -1.776123046875, -0.96630859375, -0.156494140625, 0.6533203125, 1.463134765625, 2.27294921875, 3.082763671875, 3.892578125, 4.702392578125, 5.51220703125, 6.322021484375, 7.1318359375, 7.941650390625, 8.75146484375, 9.561279296875, 10.37109375, 11.180908203125, 11.99072265625, 12.800537109375, 13.6103515625, 14.420166015625, 15.22998046875, 16.039794921875, 16.849609375, 17.659423828125, 18.46923828125, 19.279052734375, 20.0888671875, 20.898681640625, 21.70849609375, 22.518310546875, 23.328125]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 9.0, 11.0, 10.0, 7.0, 10.0, 13.0, 10.0, 13.0, 18.0, 28.0, 26.0, 23.0, 40.0, 60.0, 42.0, 61.0, 87.0, 182.0, 1649.0, 286.0, 94.0, 66.0, 47.0, 50.0, 38.0, 28.0, 37.0, 19.0, 25.0, 14.0, 15.0, 7.0, 5.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.109375, -24.26318359375, -23.4169921875, -22.57080078125, -21.724609375, -20.87841796875, -20.0322265625, -19.18603515625, -18.33984375, -17.49365234375, -16.6474609375, -15.80126953125, -14.955078125, -14.10888671875, -13.2626953125, -12.41650390625, -11.5703125, -10.72412109375, -9.8779296875, -9.03173828125, -8.185546875, -7.33935546875, -6.4931640625, -5.64697265625, -4.80078125, -3.95458984375, -3.1083984375, -2.26220703125, -1.416015625, -0.56982421875, 0.2763671875, 1.12255859375, 1.96875, 2.81494140625, 3.6611328125, 4.50732421875, 5.353515625, 6.19970703125, 7.0458984375, 7.89208984375, 8.73828125, 9.58447265625, 10.4306640625, 11.27685546875, 12.123046875, 12.96923828125, 13.8154296875, 14.66162109375, 15.5078125, 16.35400390625, 17.2001953125, 18.04638671875, 18.892578125, 19.73876953125, 20.5849609375, 21.43115234375, 22.27734375, 23.12353515625, 23.9697265625, 24.81591796875, 25.662109375, 26.50830078125, 27.3544921875, 28.20068359375, 29.046875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 8.0, 11.0, 18.0, 26.0, 30.0, 46.0, 74.0, 93.0, 124.0, 231.0, 359.0, 737.0, 3243.0, 3096460.0, 41438.0, 1393.0, 505.0, 266.0, 191.0, 102.0, 83.0, 75.0, 49.0, 21.0, 32.0, 14.0, 23.0, 9.0, 4.0, 10.0, 6.0, 3.0, 7.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.4375, -94.6337890625, -91.830078125, -89.0263671875, -86.22265625, -83.4189453125, -80.615234375, -77.8115234375, -75.0078125, -72.2041015625, -69.400390625, -66.5966796875, -63.79296875, -60.9892578125, -58.185546875, -55.3818359375, -52.578125, -49.7744140625, -46.970703125, -44.1669921875, -41.36328125, -38.5595703125, -35.755859375, -32.9521484375, -30.1484375, -27.3447265625, -24.541015625, -21.7373046875, -18.93359375, -16.1298828125, -13.326171875, -10.5224609375, -7.71875, -4.9150390625, -2.111328125, 0.6923828125, 3.49609375, 6.2998046875, 9.103515625, 11.9072265625, 14.7109375, 17.5146484375, 20.318359375, 23.1220703125, 25.92578125, 28.7294921875, 31.533203125, 34.3369140625, 37.140625, 39.9443359375, 42.748046875, 45.5517578125, 48.35546875, 51.1591796875, 53.962890625, 56.7666015625, 59.5703125, 62.3740234375, 65.177734375, 67.9814453125, 70.78515625, 73.5888671875, 76.392578125, 79.1962890625, 82.0]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 12.0, 121.0, 427.0, 351.0, 87.0, 10.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.39105224609375, -230.99803161621094, -225.60501098632812, -220.21197509765625, -214.81895446777344, -209.42593383789062, -204.0329132080078, -198.639892578125, -193.24685668945312, -187.8538360595703, -182.4608154296875, -177.06777954101562, -171.6747589111328, -166.28173828125, -160.8887176513672, -155.49569702148438, -150.1026611328125, -144.7096405029297, -139.31661987304688, -133.923583984375, -128.5305633544922, -123.13754272460938, -117.74452209472656, -112.35149383544922, -106.95848083496094, -101.56546020507812, -96.17243194580078, -90.77941131591797, -85.38638305664062, -79.99336242675781, -74.600341796875, -69.20731353759766, -63.814292907714844, -58.421268463134766, -53.02824401855469, -47.635223388671875, -42.24219512939453, -36.84917449951172, -31.45615005493164, -26.063125610351562, -20.670101165771484, -15.277076721191406, -9.884053230285645, -4.491029739379883, 0.9019947052001953, 6.295019149780273, 11.688041687011719, 17.081066131591797, 22.474090576171875, 27.867115020751953, 33.26013946533203, 38.653160095214844, 44.04618835449219, 49.439208984375, 54.83223342895508, 60.225257873535156, 65.6182861328125, 71.01130676269531, 76.40433502197266, 81.79735565185547, 87.19038391113281, 92.58340454101562, 97.97642517089844, 103.36945343017578, 108.7624740600586]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 4.0, 4.0, 8.0, 4.0, 7.0, 12.0, 14.0, 20.0, 19.0, 17.0, 34.0, 33.0, 30.0, 37.0, 35.0, 47.0, 43.0, 48.0, 33.0, 38.0, 52.0, 30.0, 41.0, 31.0, 37.0, 32.0, 39.0, 33.0, 20.0, 33.0, 25.0, 17.0, 17.0, 29.0, 21.0, 12.0, 14.0, 10.0, 4.0, 7.0, 3.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-67.76932525634766, -65.67735290527344, -63.58538055419922, -61.493412017822266, -59.40143966674805, -57.30946731567383, -55.217498779296875, -53.125526428222656, -51.03355407714844, -48.94158172607422, -46.849609375, -44.75764083862305, -42.66566848754883, -40.57369613647461, -38.481727600097656, -36.38975524902344, -34.29778289794922, -32.205810546875, -30.113840103149414, -28.021869659423828, -25.92989730834961, -23.83792495727539, -21.745954513549805, -19.65398406982422, -17.56201171875, -15.470040321350098, -13.378068923950195, -11.286097526550293, -9.19412612915039, -7.102154731750488, -5.010183334350586, -2.9182119369506836, -0.8262481689453125, 1.2657232284545898, 3.357694625854492, 5.4496660232543945, 7.541637420654297, 9.6336088180542, 11.725580215454102, 13.817551612854004, 15.909523010253906, 18.001495361328125, 20.09346580505371, 22.185436248779297, 24.277408599853516, 26.369380950927734, 28.46135139465332, 30.553321838378906, 32.645294189453125, 34.737266540527344, 36.82923889160156, 38.921207427978516, 41.013179779052734, 43.10515213012695, 45.197120666503906, 47.289093017578125, 49.381065368652344, 51.47303771972656, 53.56501007080078, 55.656978607177734, 57.74895095825195, 59.84092330932617, 61.932891845703125, 64.02486419677734, 66.11683654785156]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 1.0, 5.0, 9.0, 4.0, 7.0, 8.0, 11.0, 7.0, 8.0, 11.0, 20.0, 29.0, 22.0, 25.0, 35.0, 31.0, 36.0, 55.0, 40.0, 42.0, 52.0, 40.0, 40.0, 34.0, 41.0, 43.0, 43.0, 32.0, 25.0, 41.0, 27.0, 28.0, 30.0, 24.0, 13.0, 17.0, 17.0, 10.0, 10.0, 3.0, 8.0, 5.0, 6.0, 1.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.109375, -7.823486328125, -7.53759765625, -7.251708984375, -6.9658203125, -6.679931640625, -6.39404296875, -6.108154296875, -5.822265625, -5.536376953125, -5.25048828125, -4.964599609375, -4.6787109375, -4.392822265625, -4.10693359375, -3.821044921875, -3.53515625, -3.249267578125, -2.96337890625, -2.677490234375, -2.3916015625, -2.105712890625, -1.81982421875, -1.533935546875, -1.248046875, -0.962158203125, -0.67626953125, -0.390380859375, -0.1044921875, 0.181396484375, 0.46728515625, 0.753173828125, 1.0390625, 1.324951171875, 1.61083984375, 1.896728515625, 2.1826171875, 2.468505859375, 2.75439453125, 3.040283203125, 3.326171875, 3.612060546875, 3.89794921875, 4.183837890625, 4.4697265625, 4.755615234375, 5.04150390625, 5.327392578125, 5.61328125, 5.899169921875, 6.18505859375, 6.470947265625, 6.7568359375, 7.042724609375, 7.32861328125, 7.614501953125, 7.900390625, 8.186279296875, 8.47216796875, 8.758056640625, 9.0439453125, 9.329833984375, 9.61572265625, 9.901611328125, 10.1875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 8.0, 14.0, 15.0, 21.0, 31.0, 43.0, 62.0, 74.0, 115.0, 152.0, 240.0, 373.0, 604.0, 1120.0, 2107.0, 4673.0, 15259.0, 117386.0, 1514459.0, 2284952.0, 220308.0, 20818.0, 5599.0, 2583.0, 1252.0, 752.0, 441.0, 276.0, 158.0, 104.0, 86.0, 61.0, 31.0, 28.0, 20.0, 15.0, 12.0, 14.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.8984375, -15.2655029296875, -14.632568359375, -13.9996337890625, -13.36669921875, -12.7337646484375, -12.100830078125, -11.4678955078125, -10.8349609375, -10.2020263671875, -9.569091796875, -8.9361572265625, -8.30322265625, -7.6702880859375, -7.037353515625, -6.4044189453125, -5.771484375, -5.1385498046875, -4.505615234375, -3.8726806640625, -3.23974609375, -2.6068115234375, -1.973876953125, -1.3409423828125, -0.7080078125, -0.0750732421875, 0.557861328125, 1.1907958984375, 1.82373046875, 2.4566650390625, 3.089599609375, 3.7225341796875, 4.35546875, 4.9884033203125, 5.621337890625, 6.2542724609375, 6.88720703125, 7.5201416015625, 8.153076171875, 8.7860107421875, 9.4189453125, 10.0518798828125, 10.684814453125, 11.3177490234375, 11.95068359375, 12.5836181640625, 13.216552734375, 13.8494873046875, 14.482421875, 15.1153564453125, 15.748291015625, 16.3812255859375, 17.01416015625, 17.6470947265625, 18.280029296875, 18.9129638671875, 19.5458984375, 20.1788330078125, 20.811767578125, 21.4447021484375, 22.07763671875, 22.7105712890625, 23.343505859375, 23.9764404296875, 24.609375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 2.0, 6.0, 21.0, 31.0, 44.0, 85.0, 196.0, 322.0, 631.0, 1025.0, 785.0, 406.0, 253.0, 125.0, 68.0, 27.0, 24.0, 11.0, 6.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.251220703125, -22.26806640625, -21.284912109375, -20.3017578125, -19.318603515625, -18.33544921875, -17.352294921875, -16.369140625, -15.385986328125, -14.40283203125, -13.419677734375, -12.4365234375, -11.453369140625, -10.47021484375, -9.487060546875, -8.50390625, -7.520751953125, -6.53759765625, -5.554443359375, -4.5712890625, -3.588134765625, -2.60498046875, -1.621826171875, -0.638671875, 0.344482421875, 1.32763671875, 2.310791015625, 3.2939453125, 4.277099609375, 5.26025390625, 6.243408203125, 7.2265625, 8.209716796875, 9.19287109375, 10.176025390625, 11.1591796875, 12.142333984375, 13.12548828125, 14.108642578125, 15.091796875, 16.074951171875, 17.05810546875, 18.041259765625, 19.0244140625, 20.007568359375, 20.99072265625, 21.973876953125, 22.95703125, 23.940185546875, 24.92333984375, 25.906494140625, 26.8896484375, 27.872802734375, 28.85595703125, 29.839111328125, 30.822265625, 31.805419921875, 32.78857421875, 33.771728515625, 34.7548828125, 35.738037109375, 36.72119140625, 37.704345703125, 38.6875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 8.0, 5.0, 11.0, 24.0, 23.0, 36.0, 85.0, 127.0, 262.0, 542.0, 1339.0, 5606.0, 3060638.0, 1118962.0, 4474.0, 1164.0, 477.0, 214.0, 114.0, 69.0, 39.0, 21.0, 8.0, 14.0, 7.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-73.5625, -71.5712890625, -69.580078125, -67.5888671875, -65.59765625, -63.6064453125, -61.615234375, -59.6240234375, -57.6328125, -55.6416015625, -53.650390625, -51.6591796875, -49.66796875, -47.6767578125, -45.685546875, -43.6943359375, -41.703125, -39.7119140625, -37.720703125, -35.7294921875, -33.73828125, -31.7470703125, -29.755859375, -27.7646484375, -25.7734375, -23.7822265625, -21.791015625, -19.7998046875, -17.80859375, -15.8173828125, -13.826171875, -11.8349609375, -9.84375, -7.8525390625, -5.861328125, -3.8701171875, -1.87890625, 0.1123046875, 2.103515625, 4.0947265625, 6.0859375, 8.0771484375, 10.068359375, 12.0595703125, 14.05078125, 16.0419921875, 18.033203125, 20.0244140625, 22.015625, 24.0068359375, 25.998046875, 27.9892578125, 29.98046875, 31.9716796875, 33.962890625, 35.9541015625, 37.9453125, 39.9365234375, 41.927734375, 43.9189453125, 45.91015625, 47.9013671875, 49.892578125, 51.8837890625, 53.875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 36.0, 297.0, 503.0, 163.0, 14.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-347.0843505859375, -339.4287109375, -331.7730407714844, -324.1174011230469, -316.4617614746094, -308.80609130859375, -301.15045166015625, -293.49481201171875, -285.83917236328125, -278.18353271484375, -270.5278625488281, -262.8722229003906, -255.21658325195312, -247.56092834472656, -239.9052734375, -232.2496337890625, -224.59396362304688, -216.9383087158203, -209.2826690673828, -201.62701416015625, -193.97137451171875, -186.3157196044922, -178.66006469726562, -171.00442504882812, -163.34878540039062, -155.69313049316406, -148.03749084472656, -140.3818359375, -132.7261962890625, -125.07054138183594, -117.4148941040039, -109.75924682617188, -102.10359191894531, -94.44794464111328, -86.79229736328125, -79.13664245605469, -71.48099517822266, -63.825347900390625, -56.169700622558594, -48.5140495300293, -40.858402252197266, -33.202754974365234, -25.547103881835938, -17.891456604003906, -10.235807418823242, -2.580158233642578, 5.075489044189453, 12.73114013671875, 20.38678741455078, 28.042436599731445, 35.69808578491211, 43.35373306274414, 51.00938415527344, 58.66503143310547, 66.3206787109375, 73.97633361816406, 81.63197326660156, 89.2876205444336, 96.94326782226562, 104.59892272949219, 112.25457000732422, 119.91021728515625, 127.56586456298828, 135.2215118408203, 142.87716674804688]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 2.0, 6.0, 13.0, 11.0, 16.0, 24.0, 32.0, 36.0, 42.0, 42.0, 54.0, 59.0, 55.0, 55.0, 45.0, 62.0, 58.0, 54.0, 43.0, 33.0, 48.0, 36.0, 43.0, 26.0, 30.0, 17.0, 13.0, 17.0, 4.0, 8.0, 4.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.59625244140625, -82.1253890991211, -79.6545181274414, -77.18365478515625, -74.7127914428711, -72.24192810058594, -69.77105712890625, -67.3001937866211, -64.82933044433594, -62.358463287353516, -59.88759994506836, -57.41673278808594, -54.94586944580078, -52.47500228881836, -50.00413513183594, -47.53327178955078, -45.062400817871094, -42.59153366088867, -40.120670318603516, -37.649803161621094, -35.17893981933594, -32.708072662353516, -30.237205505371094, -27.766340255737305, -25.295475006103516, -22.824609756469727, -20.353744506835938, -17.882877349853516, -15.412012100219727, -12.941146850585938, -10.470280647277832, -7.999414443969727, -5.5285491943359375, -3.0576834678649902, -0.586817741394043, 1.8840479850769043, 4.354913711547852, 6.825778961181641, 9.296645164489746, 11.767511367797852, 14.23837661743164, 16.70924186706543, 19.18010711669922, 21.65097427368164, 24.12183952331543, 26.59270477294922, 29.06357192993164, 31.53443717956543, 34.00530242919922, 36.47616958618164, 38.9470329284668, 41.41790008544922, 43.888763427734375, 46.3596305847168, 48.83049774169922, 51.301361083984375, 53.7722282409668, 56.24309539794922, 58.713958740234375, 61.1848258972168, 63.65569305419922, 66.12655639648438, 68.59741973876953, 71.06829071044922, 73.53915405273438]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 10.0, 11.0, 13.0, 12.0, 13.0, 18.0, 23.0, 31.0, 26.0, 27.0, 29.0, 39.0, 41.0, 46.0, 45.0, 42.0, 54.0, 39.0, 33.0, 45.0, 41.0, 33.0, 38.0, 32.0, 41.0, 30.0, 36.0, 17.0, 27.0, 24.0, 9.0, 15.0, 13.0, 10.0, 8.0, 8.0, 3.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.90966796875, -5.6787109375, -5.44775390625, -5.216796875, -4.98583984375, -4.7548828125, -4.52392578125, -4.29296875, -4.06201171875, -3.8310546875, -3.60009765625, -3.369140625, -3.13818359375, -2.9072265625, -2.67626953125, -2.4453125, -2.21435546875, -1.9833984375, -1.75244140625, -1.521484375, -1.29052734375, -1.0595703125, -0.82861328125, -0.59765625, -0.36669921875, -0.1357421875, 0.09521484375, 0.326171875, 0.55712890625, 0.7880859375, 1.01904296875, 1.25, 1.48095703125, 1.7119140625, 1.94287109375, 2.173828125, 2.40478515625, 2.6357421875, 2.86669921875, 3.09765625, 3.32861328125, 3.5595703125, 3.79052734375, 4.021484375, 4.25244140625, 4.4833984375, 4.71435546875, 4.9453125, 5.17626953125, 5.4072265625, 5.63818359375, 5.869140625, 6.10009765625, 6.3310546875, 6.56201171875, 6.79296875, 7.02392578125, 7.2548828125, 7.48583984375, 7.716796875, 7.94775390625, 8.1787109375, 8.40966796875, 8.640625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 7.0, 17.0, 18.0, 13.0, 35.0, 44.0, 72.0, 115.0, 168.0, 277.0, 413.0, 562.0, 780.0, 1273.0, 1906.0, 2814.0, 4227.0, 6276.0, 9613.0, 14867.0, 22425.0, 35802.0, 57045.0, 93449.0, 151441.0, 215842.0, 160862.0, 98987.0, 61219.0, 38206.0, 24180.0, 15395.0, 10103.0, 6633.0, 4345.0, 2951.0, 2085.0, 1302.0, 923.0, 647.0, 398.0, 258.0, 205.0, 120.0, 84.0, 62.0, 34.0, 20.0, 22.0, 10.0, 1.0, 3.0, 0.0, 5.0, 1.0, 0.0, 3.0], "bins": [-0.98291015625, -0.952728271484375, -0.92254638671875, -0.892364501953125, -0.8621826171875, -0.832000732421875, -0.80181884765625, -0.771636962890625, -0.741455078125, -0.711273193359375, -0.68109130859375, -0.650909423828125, -0.6207275390625, -0.590545654296875, -0.56036376953125, -0.530181884765625, -0.5, -0.469818115234375, -0.43963623046875, -0.409454345703125, -0.3792724609375, -0.349090576171875, -0.31890869140625, -0.288726806640625, -0.258544921875, -0.228363037109375, -0.19818115234375, -0.167999267578125, -0.1378173828125, -0.107635498046875, -0.07745361328125, -0.047271728515625, -0.01708984375, 0.013092041015625, 0.04327392578125, 0.073455810546875, 0.1036376953125, 0.133819580078125, 0.16400146484375, 0.194183349609375, 0.224365234375, 0.254547119140625, 0.28472900390625, 0.314910888671875, 0.3450927734375, 0.375274658203125, 0.40545654296875, 0.435638427734375, 0.4658203125, 0.496002197265625, 0.52618408203125, 0.556365966796875, 0.5865478515625, 0.616729736328125, 0.64691162109375, 0.677093505859375, 0.707275390625, 0.737457275390625, 0.76763916015625, 0.797821044921875, 0.8280029296875, 0.858184814453125, 0.88836669921875, 0.918548583984375, 0.94873046875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 6.0, 8.0, 7.0, 9.0, 10.0, 12.0, 20.0, 21.0, 19.0, 28.0, 28.0, 27.0, 23.0, 43.0, 25.0, 28.0, 36.0, 39.0, 35.0, 41.0, 1057.0, 33.0, 40.0, 38.0, 40.0, 31.0, 29.0, 38.0, 35.0, 32.0, 24.0, 18.0, 16.0, 17.0, 20.0, 11.0, 12.0, 7.0, 9.0, 6.0, 9.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.20703125, -4.0836181640625, -3.960205078125, -3.8367919921875, -3.71337890625, -3.5899658203125, -3.466552734375, -3.3431396484375, -3.2197265625, -3.0963134765625, -2.972900390625, -2.8494873046875, -2.72607421875, -2.6026611328125, -2.479248046875, -2.3558349609375, -2.232421875, -2.1090087890625, -1.985595703125, -1.8621826171875, -1.73876953125, -1.6153564453125, -1.491943359375, -1.3685302734375, -1.2451171875, -1.1217041015625, -0.998291015625, -0.8748779296875, -0.75146484375, -0.6280517578125, -0.504638671875, -0.3812255859375, -0.2578125, -0.1343994140625, -0.010986328125, 0.1124267578125, 0.23583984375, 0.3592529296875, 0.482666015625, 0.6060791015625, 0.7294921875, 0.8529052734375, 0.976318359375, 1.0997314453125, 1.22314453125, 1.3465576171875, 1.469970703125, 1.5933837890625, 1.716796875, 1.8402099609375, 1.963623046875, 2.0870361328125, 2.21044921875, 2.3338623046875, 2.457275390625, 2.5806884765625, 2.7041015625, 2.8275146484375, 2.950927734375, 3.0743408203125, 3.19775390625, 3.3211669921875, 3.444580078125, 3.5679931640625, 3.69140625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 9.0, 21.0, 24.0, 43.0, 56.0, 96.0, 141.0, 204.0, 300.0, 426.0, 650.0, 871.0, 1375.0, 2031.0, 2990.0, 4499.0, 6493.0, 10018.0, 15036.0, 23051.0, 35432.0, 54516.0, 82779.0, 124564.0, 1224610.0, 168380.0, 115294.0, 76776.0, 50091.0, 32862.0, 21541.0, 14002.0, 9062.0, 6181.0, 4099.0, 2843.0, 1850.0, 1275.0, 858.0, 617.0, 352.0, 267.0, 177.0, 114.0, 81.0, 47.0, 41.0, 35.0, 19.0, 12.0, 6.0, 6.0, 3.0, 4.0, 1.0], "bins": [-0.88134765625, -0.8553543090820312, -0.8293609619140625, -0.8033676147460938, -0.777374267578125, -0.7513809204101562, -0.7253875732421875, -0.6993942260742188, -0.67340087890625, -0.6474075317382812, -0.6214141845703125, -0.5954208374023438, -0.569427490234375, -0.5434341430664062, -0.5174407958984375, -0.49144744873046875, -0.4654541015625, -0.43946075439453125, -0.4134674072265625, -0.38747406005859375, -0.361480712890625, -0.33548736572265625, -0.3094940185546875, -0.28350067138671875, -0.25750732421875, -0.23151397705078125, -0.2055206298828125, -0.17952728271484375, -0.153533935546875, -0.12754058837890625, -0.1015472412109375, -0.07555389404296875, -0.049560546875, -0.02356719970703125, 0.0024261474609375, 0.02841949462890625, 0.054412841796875, 0.08040618896484375, 0.1063995361328125, 0.13239288330078125, 0.15838623046875, 0.18437957763671875, 0.2103729248046875, 0.23636627197265625, 0.262359619140625, 0.28835296630859375, 0.3143463134765625, 0.34033966064453125, 0.3663330078125, 0.39232635498046875, 0.4183197021484375, 0.44431304931640625, 0.470306396484375, 0.49629974365234375, 0.5222930908203125, 0.5482864379882812, 0.57427978515625, 0.6002731323242188, 0.6262664794921875, 0.6522598266601562, 0.678253173828125, 0.7042465209960938, 0.7302398681640625, 0.7562332153320312, 0.7822265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 4.0, 5.0, 4.0, 6.0, 6.0, 11.0, 13.0, 24.0, 35.0, 42.0, 33.0, 49.0, 59.0, 56.0, 62.0, 78.0, 73.0, 68.0, 57.0, 54.0, 52.0, 38.0, 31.0, 26.0, 25.0, 16.0, 16.0, 10.0, 16.0, 4.0, 6.0, 2.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017948150634765625, -0.0017390847206115723, -0.001683354377746582, -0.0016276240348815918, -0.0015718936920166016, -0.0015161633491516113, -0.001460433006286621, -0.0014047026634216309, -0.0013489723205566406, -0.0012932419776916504, -0.0012375116348266602, -0.00118178129196167, -0.0011260509490966797, -0.0010703206062316895, -0.0010145902633666992, -0.000958859920501709, -0.0009031295776367188, -0.0008473992347717285, -0.0007916688919067383, -0.000735938549041748, -0.0006802082061767578, -0.0006244778633117676, -0.0005687475204467773, -0.0005130171775817871, -0.0004572868347167969, -0.00040155649185180664, -0.0003458261489868164, -0.00029009580612182617, -0.00023436546325683594, -0.0001786351203918457, -0.00012290477752685547, -6.717443466186523e-05, -1.1444091796875e-05, 4.4286251068115234e-05, 0.00010001659393310547, 0.0001557469367980957, 0.00021147727966308594, 0.00026720762252807617, 0.0003229379653930664, 0.00037866830825805664, 0.0004343986511230469, 0.0004901289939880371, 0.0005458593368530273, 0.0006015896797180176, 0.0006573200225830078, 0.000713050365447998, 0.0007687807083129883, 0.0008245110511779785, 0.0008802413940429688, 0.000935971736907959, 0.0009917020797729492, 0.0010474324226379395, 0.0011031627655029297, 0.00115889310836792, 0.0012146234512329102, 0.0012703537940979004, 0.0013260841369628906, 0.0013818144798278809, 0.001437544822692871, 0.0014932751655578613, 0.0015490055084228516, 0.0016047358512878418, 0.001660466194152832, 0.0017161965370178223, 0.0017719268798828125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 11.0, 7.0, 16.0, 18.0, 16.0, 26.0, 43.0, 62.0, 74.0, 72.0, 118.0, 148.0, 245.0, 343.0, 541.0, 1128.0, 151675.0, 890415.0, 1530.0, 667.0, 400.0, 266.0, 164.0, 118.0, 116.0, 65.0, 68.0, 36.0, 35.0, 15.0, 20.0, 17.0, 11.0, 8.0, 10.0, 9.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.0292510986328125, -0.028340578079223633, -0.027430057525634766, -0.0265195369720459, -0.02560901641845703, -0.024698495864868164, -0.023787975311279297, -0.02287745475769043, -0.021966934204101562, -0.021056413650512695, -0.020145893096923828, -0.01923537254333496, -0.018324851989746094, -0.017414331436157227, -0.01650381088256836, -0.015593290328979492, -0.014682769775390625, -0.013772249221801758, -0.01286172866821289, -0.011951208114624023, -0.011040687561035156, -0.010130167007446289, -0.009219646453857422, -0.008309125900268555, -0.0073986053466796875, -0.00648808479309082, -0.005577564239501953, -0.004667043685913086, -0.0037565231323242188, -0.0028460025787353516, -0.0019354820251464844, -0.0010249614715576172, -0.00011444091796875, 0.0007960796356201172, 0.0017066001892089844, 0.0026171207427978516, 0.0035276412963867188, 0.004438161849975586, 0.005348682403564453, 0.00625920295715332, 0.0071697235107421875, 0.008080244064331055, 0.008990764617919922, 0.009901285171508789, 0.010811805725097656, 0.011722326278686523, 0.01263284683227539, 0.013543367385864258, 0.014453887939453125, 0.015364408493041992, 0.01627492904663086, 0.017185449600219727, 0.018095970153808594, 0.01900649070739746, 0.019917011260986328, 0.020827531814575195, 0.021738052368164062, 0.02264857292175293, 0.023559093475341797, 0.024469614028930664, 0.02538013458251953, 0.0262906551361084, 0.027201175689697266, 0.028111696243286133, 0.029022216796875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 22.0, 310.0, 585.0, 92.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00799393281340599, -0.007854266092181206, -0.0077146003022789955, -0.007574933581054211, -0.007435267325490713, -0.007295601069927216, -0.007155934814363718, -0.0070162685588002205, -0.006876601837575436, -0.006736935582011938, -0.0065972693264484406, -0.006457602605223656, -0.006317936349660158, -0.006178270094096661, -0.006038603838533163, -0.0058989375829696655, -0.005759270861744881, -0.005619604606181383, -0.005479938350617886, -0.005340271629393101, -0.005200605373829603, -0.005060939118266106, -0.004921272862702608, -0.0047816066071391106, -0.004641940351575613, -0.0045022740960121155, -0.004362607840448618, -0.004222941119223833, -0.0040832748636603355, -0.003943608608096838, -0.0038039423525333405, -0.0036642758641391993, -0.003524609375745058, -0.0033849431201815605, -0.0032452766317874193, -0.0031056103762239218, -0.0029659438878297806, -0.002826277632266283, -0.0026866113767027855, -0.0025469448883086443, -0.002407278399914503, -0.0022676121443510056, -0.0021279456559568644, -0.001988279400393367, -0.0018486129119992256, -0.001708946656435728, -0.0015692802844569087, -0.0014296139124780893, -0.0012899476569145918, -0.0011502812849357724, -0.001010614912956953, -0.0008709485991857946, -0.0007312822272069752, -0.0005916158552281559, -0.0004519495414569974, -0.000312283169478178, -0.00017261679749935865, -3.295044007245451e-05, 0.00010671591735444963, 0.00024638226022943854, 0.0003860486322082579, 0.0005257150041870773, 0.0006653813179582357, 0.0008050476899370551, 0.0009447140619158745]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 7.0, 3.0, 4.0, 11.0, 9.0, 10.0, 19.0, 19.0, 17.0, 18.0, 35.0, 39.0, 36.0, 36.0, 35.0, 38.0, 45.0, 51.0, 47.0, 49.0, 50.0, 41.0, 45.0, 47.0, 44.0, 37.0, 30.0, 21.0, 32.0, 25.0, 16.0, 12.0, 8.0, 15.0, 15.0, 9.0, 5.0, 9.0, 3.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008946657180786133, -0.0008666180074214935, -0.0008385702967643738, -0.000810522586107254, -0.0007824748754501343, -0.0007544271647930145, -0.0007263794541358948, -0.000698331743478775, -0.0006702840328216553, -0.0006422363221645355, -0.0006141886115074158, -0.000586140900850296, -0.0005580931901931763, -0.0005300454795360565, -0.0005019977688789368, -0.000473950058221817, -0.00044590234756469727, -0.0004178546369075775, -0.00038980692625045776, -0.000361759215593338, -0.00033371150493621826, -0.0003056637942790985, -0.00027761608362197876, -0.000249568372964859, -0.00022152066230773926, -0.0001934729516506195, -0.00016542524099349976, -0.00013737753033638, -0.00010932981967926025, -8.12821090221405e-05, -5.323439836502075e-05, -2.5186687707901e-05, 2.86102294921875e-06, 3.09087336063385e-05, 5.895644426345825e-05, 8.7004154920578e-05, 0.00011505186557769775, 0.0001430995762348175, 0.00017114728689193726, 0.000199194997549057, 0.00022724270820617676, 0.0002552904188632965, 0.00028333812952041626, 0.000311385840177536, 0.00033943355083465576, 0.0003674812614917755, 0.00039552897214889526, 0.000423576682806015, 0.00045162439346313477, 0.0004796721041202545, 0.0005077198147773743, 0.000535767525434494, 0.0005638152360916138, 0.0005918629467487335, 0.0006199106574058533, 0.000647958368062973, 0.0006760060787200928, 0.0007040537893772125, 0.0007321015000343323, 0.000760149210691452, 0.0007881969213485718, 0.0008162446320056915, 0.0008442923426628113, 0.000872340053319931, 0.0009003877639770508]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 1.0, 1.0, 3.0, 1.0, 7.0, 3.0, 10.0, 11.0, 13.0, 12.0, 13.0, 18.0, 23.0, 31.0, 26.0, 27.0, 29.0, 39.0, 41.0, 46.0, 45.0, 42.0, 54.0, 39.0, 33.0, 45.0, 41.0, 33.0, 38.0, 32.0, 41.0, 30.0, 37.0, 16.0, 27.0, 24.0, 9.0, 15.0, 13.0, 10.0, 8.0, 8.0, 3.0, 2.0, 2.0, 7.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.140625, -5.90966796875, -5.6787109375, -5.44775390625, -5.216796875, -4.98583984375, -4.7548828125, -4.52392578125, -4.29296875, -4.06201171875, -3.8310546875, -3.60009765625, -3.369140625, -3.13818359375, -2.9072265625, -2.67626953125, -2.4453125, -2.21435546875, -1.9833984375, -1.75244140625, -1.521484375, -1.29052734375, -1.0595703125, -0.82861328125, -0.59765625, -0.36669921875, -0.1357421875, 0.09521484375, 0.326171875, 0.55712890625, 0.7880859375, 1.01904296875, 1.25, 1.48095703125, 1.7119140625, 1.94287109375, 2.173828125, 2.40478515625, 2.6357421875, 2.86669921875, 3.09765625, 3.32861328125, 3.5595703125, 3.79052734375, 4.021484375, 4.25244140625, 4.4833984375, 4.71435546875, 4.9453125, 5.17626953125, 5.4072265625, 5.63818359375, 5.869140625, 6.10009765625, 6.3310546875, 6.56201171875, 6.79296875, 7.02392578125, 7.2548828125, 7.48583984375, 7.716796875, 7.94775390625, 8.1787109375, 8.40966796875, 8.640625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 5.0, 8.0, 7.0, 4.0, 10.0, 17.0, 15.0, 23.0, 33.0, 44.0, 59.0, 94.0, 116.0, 180.0, 241.0, 381.0, 553.0, 946.0, 1644.0, 3580.0, 8637.0, 28345.0, 134399.0, 628501.0, 185726.0, 35539.0, 10532.0, 4121.0, 1875.0, 1057.0, 601.0, 388.0, 256.0, 165.0, 130.0, 86.0, 64.0, 52.0, 27.0, 33.0, 14.0, 9.0, 8.0, 13.0, 5.0, 2.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.5185546875, -10.107421875, -9.6962890625, -9.28515625, -8.8740234375, -8.462890625, -8.0517578125, -7.640625, -7.2294921875, -6.818359375, -6.4072265625, -5.99609375, -5.5849609375, -5.173828125, -4.7626953125, -4.3515625, -3.9404296875, -3.529296875, -3.1181640625, -2.70703125, -2.2958984375, -1.884765625, -1.4736328125, -1.0625, -0.6513671875, -0.240234375, 0.1708984375, 0.58203125, 0.9931640625, 1.404296875, 1.8154296875, 2.2265625, 2.6376953125, 3.048828125, 3.4599609375, 3.87109375, 4.2822265625, 4.693359375, 5.1044921875, 5.515625, 5.9267578125, 6.337890625, 6.7490234375, 7.16015625, 7.5712890625, 7.982421875, 8.3935546875, 8.8046875, 9.2158203125, 9.626953125, 10.0380859375, 10.44921875, 10.8603515625, 11.271484375, 11.6826171875, 12.09375, 12.5048828125, 12.916015625, 13.3271484375, 13.73828125, 14.1494140625, 14.560546875, 14.9716796875, 15.3828125]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 5.0, 2.0, 9.0, 10.0, 8.0, 11.0, 20.0, 14.0, 21.0, 34.0, 39.0, 29.0, 56.0, 52.0, 46.0, 78.0, 184.0, 1732.0, 251.0, 81.0, 33.0, 52.0, 44.0, 43.0, 30.0, 31.0, 20.0, 21.0, 20.0, 17.0, 10.0, 7.0, 10.0, 4.0, 6.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.6875, -21.060302734375, -20.43310546875, -19.805908203125, -19.1787109375, -18.551513671875, -17.92431640625, -17.297119140625, -16.669921875, -16.042724609375, -15.41552734375, -14.788330078125, -14.1611328125, -13.533935546875, -12.90673828125, -12.279541015625, -11.65234375, -11.025146484375, -10.39794921875, -9.770751953125, -9.1435546875, -8.516357421875, -7.88916015625, -7.261962890625, -6.634765625, -6.007568359375, -5.38037109375, -4.753173828125, -4.1259765625, -3.498779296875, -2.87158203125, -2.244384765625, -1.6171875, -0.989990234375, -0.36279296875, 0.264404296875, 0.8916015625, 1.518798828125, 2.14599609375, 2.773193359375, 3.400390625, 4.027587890625, 4.65478515625, 5.281982421875, 5.9091796875, 6.536376953125, 7.16357421875, 7.790771484375, 8.41796875, 9.045166015625, 9.67236328125, 10.299560546875, 10.9267578125, 11.553955078125, 12.18115234375, 12.808349609375, 13.435546875, 14.062744140625, 14.68994140625, 15.317138671875, 15.9443359375, 16.571533203125, 17.19873046875, 17.825927734375, 18.453125]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 8.0, 3.0, 0.0, 6.0, 9.0, 10.0, 6.0, 14.0, 17.0, 19.0, 22.0, 38.0, 54.0, 84.0, 102.0, 193.0, 376.0, 796.0, 5138.0, 3129949.0, 6973.0, 870.0, 402.0, 221.0, 123.0, 68.0, 55.0, 31.0, 33.0, 22.0, 8.0, 16.0, 16.0, 6.0, 5.0, 3.0, 6.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.3125, -54.46826171875, -52.6240234375, -50.77978515625, -48.935546875, -47.09130859375, -45.2470703125, -43.40283203125, -41.55859375, -39.71435546875, -37.8701171875, -36.02587890625, -34.181640625, -32.33740234375, -30.4931640625, -28.64892578125, -26.8046875, -24.96044921875, -23.1162109375, -21.27197265625, -19.427734375, -17.58349609375, -15.7392578125, -13.89501953125, -12.05078125, -10.20654296875, -8.3623046875, -6.51806640625, -4.673828125, -2.82958984375, -0.9853515625, 0.85888671875, 2.703125, 4.54736328125, 6.3916015625, 8.23583984375, 10.080078125, 11.92431640625, 13.7685546875, 15.61279296875, 17.45703125, 19.30126953125, 21.1455078125, 22.98974609375, 24.833984375, 26.67822265625, 28.5224609375, 30.36669921875, 32.2109375, 34.05517578125, 35.8994140625, 37.74365234375, 39.587890625, 41.43212890625, 43.2763671875, 45.12060546875, 46.96484375, 48.80908203125, 50.6533203125, 52.49755859375, 54.341796875, 56.18603515625, 58.0302734375, 59.87451171875, 61.71875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 30.0, 190.0, 546.0, 213.0, 27.0, 4.0, 2.0, 2.0], "bins": [-139.81094360351562, -137.4203338623047, -135.0297393798828, -132.63912963867188, -130.24853515625, -127.85792541503906, -125.46732330322266, -123.07672119140625, -120.68611907958984, -118.29551696777344, -115.90491485595703, -113.51431274414062, -111.12370300292969, -108.73310089111328, -106.34249877929688, -103.95189666748047, -101.56129455566406, -99.17069244384766, -96.78009033203125, -94.38948822021484, -91.99888610839844, -89.6082763671875, -87.2176742553711, -84.82707214355469, -82.43647003173828, -80.04586791992188, -77.65526580810547, -75.26466369628906, -72.87405395507812, -70.48345184326172, -68.09284973144531, -65.7022476196289, -63.311649322509766, -60.92104721069336, -58.53044128417969, -56.13983917236328, -53.749237060546875, -51.35863494873047, -48.96803283691406, -46.57742691040039, -44.186824798583984, -41.79622268676758, -39.405616760253906, -37.0150146484375, -34.624412536621094, -32.23381042480469, -29.84320640563965, -27.45260238647461, -25.062000274658203, -22.671398162841797, -20.280794143676758, -17.89019012451172, -15.499588012695312, -13.10898494720459, -10.718381881713867, -8.327777862548828, -5.937176704406738, -3.5465736389160156, -1.155970573425293, 1.2346324920654297, 3.6252355575561523, 6.015838623046875, 8.406441688537598, 10.797045707702637, 13.187647819519043]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 9.0, 3.0, 5.0, 6.0, 15.0, 10.0, 13.0, 16.0, 23.0, 23.0, 23.0, 23.0, 42.0, 24.0, 33.0, 41.0, 33.0, 38.0, 62.0, 45.0, 50.0, 51.0, 38.0, 34.0, 46.0, 28.0, 34.0, 35.0, 27.0, 23.0, 22.0, 23.0, 22.0, 13.0, 15.0, 11.0, 12.0, 11.0, 3.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.942039489746094, -38.56901168823242, -37.19598388671875, -35.822959899902344, -34.44993209838867, -33.076904296875, -31.70387840270996, -30.330852508544922, -28.95782470703125, -27.584796905517578, -26.21177101135254, -24.8387451171875, -23.465717315673828, -22.092689514160156, -20.719663619995117, -19.346637725830078, -17.973609924316406, -16.600582122802734, -15.227556228637695, -13.85452938079834, -12.481502532958984, -11.108475685119629, -9.735448837280273, -8.362421989440918, -6.9893951416015625, -5.616368293762207, -4.243341445922852, -2.870314598083496, -1.4972877502441406, -0.12426090240478516, 1.2487659454345703, 2.621792793273926, 3.9948158264160156, 5.367842674255371, 6.740869522094727, 8.113896369934082, 9.486923217773438, 10.859950065612793, 12.232976913452148, 13.606003761291504, 14.97903060913086, 16.35205841064453, 17.72508430480957, 19.09811019897461, 20.47113800048828, 21.844165802001953, 23.217191696166992, 24.59021759033203, 25.963245391845703, 27.336273193359375, 28.709299087524414, 30.082324981689453, 31.455352783203125, 32.8283805847168, 34.20140838623047, 35.574432373046875, 36.94746017456055, 38.32048797607422, 39.693511962890625, 41.0665397644043, 42.43956756591797, 43.81259536743164, 45.18562316894531, 46.55864715576172, 47.93167495727539]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 3.0, 15.0, 15.0, 8.0, 16.0, 19.0, 24.0, 19.0, 27.0, 19.0, 29.0, 39.0, 42.0, 34.0, 38.0, 44.0, 41.0, 43.0, 45.0, 46.0, 41.0, 41.0, 48.0, 32.0, 30.0, 34.0, 31.0, 28.0, 19.0, 21.0, 20.0, 14.0, 15.0, 12.0, 2.0, 8.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0, -7.734375, -7.46875, -7.203125, -6.9375, -6.671875, -6.40625, -6.140625, -5.875, -5.609375, -5.34375, -5.078125, -4.8125, -4.546875, -4.28125, -4.015625, -3.75, -3.484375, -3.21875, -2.953125, -2.6875, -2.421875, -2.15625, -1.890625, -1.625, -1.359375, -1.09375, -0.828125, -0.5625, -0.296875, -0.03125, 0.234375, 0.5, 0.765625, 1.03125, 1.296875, 1.5625, 1.828125, 2.09375, 2.359375, 2.625, 2.890625, 3.15625, 3.421875, 3.6875, 3.953125, 4.21875, 4.484375, 4.75, 5.015625, 5.28125, 5.546875, 5.8125, 6.078125, 6.34375, 6.609375, 6.875, 7.140625, 7.40625, 7.671875, 7.9375, 8.203125, 8.46875, 8.734375, 9.0]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 6.0, 11.0, 14.0, 14.0, 21.0, 31.0, 22.0, 41.0, 45.0, 61.0, 58.0, 96.0, 107.0, 146.0, 185.0, 235.0, 351.0, 530.0, 919.0, 2252.0, 14219.0, 2560446.0, 1599058.0, 10708.0, 1919.0, 849.0, 537.0, 338.0, 272.0, 169.0, 120.0, 96.0, 82.0, 57.0, 55.0, 43.0, 37.0, 22.0, 27.0, 21.0, 16.0, 16.0, 11.0, 6.0, 5.0, 6.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.3125, -44.765625, -43.21875, -41.671875, -40.125, -38.578125, -37.03125, -35.484375, -33.9375, -32.390625, -30.84375, -29.296875, -27.75, -26.203125, -24.65625, -23.109375, -21.5625, -20.015625, -18.46875, -16.921875, -15.375, -13.828125, -12.28125, -10.734375, -9.1875, -7.640625, -6.09375, -4.546875, -3.0, -1.453125, 0.09375, 1.640625, 3.1875, 4.734375, 6.28125, 7.828125, 9.375, 10.921875, 12.46875, 14.015625, 15.5625, 17.109375, 18.65625, 20.203125, 21.75, 23.296875, 24.84375, 26.390625, 27.9375, 29.484375, 31.03125, 32.578125, 34.125, 35.671875, 37.21875, 38.765625, 40.3125, 41.859375, 43.40625, 44.953125, 46.5, 48.046875, 49.59375, 51.140625, 52.6875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 7.0, 1.0, 10.0, 9.0, 23.0, 60.0, 82.0, 177.0, 335.0, 665.0, 1044.0, 776.0, 447.0, 196.0, 106.0, 67.0, 25.0, 22.0, 7.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-32.71875, -31.9862060546875, -31.253662109375, -30.5211181640625, -29.78857421875, -29.0560302734375, -28.323486328125, -27.5909423828125, -26.8583984375, -26.1258544921875, -25.393310546875, -24.6607666015625, -23.92822265625, -23.1956787109375, -22.463134765625, -21.7305908203125, -20.998046875, -20.2655029296875, -19.532958984375, -18.8004150390625, -18.06787109375, -17.3353271484375, -16.602783203125, -15.8702392578125, -15.1376953125, -14.4051513671875, -13.672607421875, -12.9400634765625, -12.20751953125, -11.4749755859375, -10.742431640625, -10.0098876953125, -9.27734375, -8.5447998046875, -7.812255859375, -7.0797119140625, -6.34716796875, -5.6146240234375, -4.882080078125, -4.1495361328125, -3.4169921875, -2.6844482421875, -1.951904296875, -1.2193603515625, -0.48681640625, 0.2457275390625, 0.978271484375, 1.7108154296875, 2.443359375, 3.1759033203125, 3.908447265625, 4.6409912109375, 5.37353515625, 6.1060791015625, 6.838623046875, 7.5711669921875, 8.3037109375, 9.0362548828125, 9.768798828125, 10.5013427734375, 11.23388671875, 11.9664306640625, 12.698974609375, 13.4315185546875, 14.1640625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 7.0, 10.0, 17.0, 39.0, 88.0, 166.0, 498.0, 2369.0, 40642.0, 3957252.0, 187404.0, 4612.0, 752.0, 219.0, 101.0, 46.0, 25.0, 12.0, 7.0, 8.0, 5.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.34375, -43.10009765625, -41.8564453125, -40.61279296875, -39.369140625, -38.12548828125, -36.8818359375, -35.63818359375, -34.39453125, -33.15087890625, -31.9072265625, -30.66357421875, -29.419921875, -28.17626953125, -26.9326171875, -25.68896484375, -24.4453125, -23.20166015625, -21.9580078125, -20.71435546875, -19.470703125, -18.22705078125, -16.9833984375, -15.73974609375, -14.49609375, -13.25244140625, -12.0087890625, -10.76513671875, -9.521484375, -8.27783203125, -7.0341796875, -5.79052734375, -4.546875, -3.30322265625, -2.0595703125, -0.81591796875, 0.427734375, 1.67138671875, 2.9150390625, 4.15869140625, 5.40234375, 6.64599609375, 7.8896484375, 9.13330078125, 10.376953125, 11.62060546875, 12.8642578125, 14.10791015625, 15.3515625, 16.59521484375, 17.8388671875, 19.08251953125, 20.326171875, 21.56982421875, 22.8134765625, 24.05712890625, 25.30078125, 26.54443359375, 27.7880859375, 29.03173828125, 30.275390625, 31.51904296875, 32.7626953125, 34.00634765625, 35.25]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 11.0, 20.0, 53.0, 61.0, 106.0, 147.0, 176.0, 153.0, 100.0, 67.0, 46.0, 15.0, 14.0, 9.0, 10.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.93859100341797, -87.90706634521484, -83.87554931640625, -79.84402465820312, -75.8125, -71.78097534179688, -67.74945068359375, -63.717933654785156, -59.68640899658203, -55.654884338378906, -51.62336349487305, -47.59184265136719, -43.56031799316406, -39.52879333496094, -35.49727249145508, -31.465749740600586, -27.434226989746094, -23.4027042388916, -19.37118148803711, -15.339658737182617, -11.308135986328125, -7.276613235473633, -3.2450904846191406, 0.7864322662353516, 4.817955017089844, 8.849477767944336, 12.881000518798828, 16.91252326965332, 20.944046020507812, 24.975568771362305, 29.007091522216797, 33.038612365722656, 37.07014465332031, 41.10166931152344, 45.1331901550293, 49.164710998535156, 53.19623565673828, 57.227760314941406, 61.259281158447266, 65.29080200195312, 69.32232666015625, 73.35385131835938, 77.3853759765625, 81.4168930053711, 85.44841766357422, 89.47994232177734, 93.51145935058594, 97.54298400878906, 101.57450866699219, 105.60603332519531, 109.63755798339844, 113.66907501220703, 117.70059967041016, 121.73212432861328, 125.76364135742188, 129.795166015625, 133.82669067382812, 137.85821533203125, 141.88973999023438, 145.9212646484375, 149.95278930664062, 153.9842987060547, 158.0158233642578, 162.04734802246094, 166.07887268066406]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 10.0, 15.0, 13.0, 13.0, 12.0, 21.0, 21.0, 20.0, 24.0, 27.0, 27.0, 31.0, 40.0, 34.0, 37.0, 45.0, 38.0, 30.0, 40.0, 43.0, 45.0, 36.0, 34.0, 39.0, 37.0, 42.0, 22.0, 25.0, 22.0, 24.0, 13.0, 16.0, 18.0, 17.0, 10.0, 6.0, 13.0, 8.0, 7.0, 5.0, 2.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-47.35752487182617, -45.88702392578125, -44.416526794433594, -42.94602584838867, -41.47552490234375, -40.005027770996094, -38.53452682495117, -37.06402587890625, -35.593528747558594, -34.12302780151367, -32.652530670166016, -31.182029724121094, -29.711528778076172, -28.241029739379883, -26.770530700683594, -25.300029754638672, -23.82952880859375, -22.35902976989746, -20.88852882385254, -19.41802978515625, -17.947528839111328, -16.47702980041504, -15.00653076171875, -13.536030769348145, -12.065530776977539, -10.595030784606934, -9.124530792236328, -7.654031753540039, -6.183531761169434, -4.713031768798828, -3.242532730102539, -1.7720327377319336, -0.3015327453613281, 1.1689670085906982, 2.6394667625427246, 4.109966278076172, 5.580466270446777, 7.050966262817383, 8.521465301513672, 9.991965293884277, 11.462465286254883, 12.932965278625488, 14.403465270996094, 15.873964309692383, 17.344463348388672, 18.814964294433594, 20.285463333129883, 21.755962371826172, 23.226463317871094, 24.696962356567383, 26.167463302612305, 27.637962341308594, 29.108463287353516, 30.578962326049805, 32.049461364746094, 33.519962310791016, 34.99046325683594, 36.46096420288086, 37.931461334228516, 39.40196228027344, 40.87246322631836, 42.34296417236328, 43.81346130371094, 45.28396224975586, 46.754459381103516]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 4.0, 11.0, 9.0, 10.0, 14.0, 11.0, 21.0, 14.0, 20.0, 27.0, 29.0, 31.0, 38.0, 40.0, 25.0, 36.0, 51.0, 37.0, 38.0, 32.0, 35.0, 32.0, 44.0, 43.0, 35.0, 39.0, 39.0, 29.0, 26.0, 33.0, 15.0, 20.0, 9.0, 12.0, 13.0, 15.0, 12.0, 11.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-79.5, -77.1416015625, -74.783203125, -72.4248046875, -70.06640625, -67.7080078125, -65.349609375, -62.9912109375, -60.6328125, -58.2744140625, -55.916015625, -53.5576171875, -51.19921875, -48.8408203125, -46.482421875, -44.1240234375, -41.765625, -39.4072265625, -37.048828125, -34.6904296875, -32.33203125, -29.9736328125, -27.615234375, -25.2568359375, -22.8984375, -20.5400390625, -18.181640625, -15.8232421875, -13.46484375, -11.1064453125, -8.748046875, -6.3896484375, -4.03125, -1.6728515625, 0.685546875, 3.0439453125, 5.40234375, 7.7607421875, 10.119140625, 12.4775390625, 14.8359375, 17.1943359375, 19.552734375, 21.9111328125, 24.26953125, 26.6279296875, 28.986328125, 31.3447265625, 33.703125, 36.0615234375, 38.419921875, 40.7783203125, 43.13671875, 45.4951171875, 47.853515625, 50.2119140625, 52.5703125, 54.9287109375, 57.287109375, 59.6455078125, 62.00390625, 64.3623046875, 66.720703125, 69.0791015625, 71.4375]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 7.0, 21.0, 19.0, 44.0, 47.0, 70.0, 112.0, 183.0, 242.0, 383.0, 551.0, 867.0, 1249.0, 1906.0, 2917.0, 4340.0, 6621.0, 10143.0, 15386.0, 23959.0, 36782.0, 56963.0, 87866.0, 139854.0, 200189.0, 163877.0, 103810.0, 66568.0, 42748.0, 27966.0, 18168.0, 11796.0, 7666.0, 5103.0, 3446.0, 2249.0, 1452.0, 998.0, 674.0, 407.0, 302.0, 203.0, 123.0, 90.0, 51.0, 46.0, 28.0, 16.0, 16.0, 5.0, 7.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-9.3046875, -9.010986328125, -8.71728515625, -8.423583984375, -8.1298828125, -7.836181640625, -7.54248046875, -7.248779296875, -6.955078125, -6.661376953125, -6.36767578125, -6.073974609375, -5.7802734375, -5.486572265625, -5.19287109375, -4.899169921875, -4.60546875, -4.311767578125, -4.01806640625, -3.724365234375, -3.4306640625, -3.136962890625, -2.84326171875, -2.549560546875, -2.255859375, -1.962158203125, -1.66845703125, -1.374755859375, -1.0810546875, -0.787353515625, -0.49365234375, -0.199951171875, 0.09375, 0.387451171875, 0.68115234375, 0.974853515625, 1.2685546875, 1.562255859375, 1.85595703125, 2.149658203125, 2.443359375, 2.737060546875, 3.03076171875, 3.324462890625, 3.6181640625, 3.911865234375, 4.20556640625, 4.499267578125, 4.79296875, 5.086669921875, 5.38037109375, 5.674072265625, 5.9677734375, 6.261474609375, 6.55517578125, 6.848876953125, 7.142578125, 7.436279296875, 7.72998046875, 8.023681640625, 8.3173828125, 8.611083984375, 8.90478515625, 9.198486328125, 9.4921875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 6.0, 3.0, 6.0, 6.0, 20.0, 15.0, 14.0, 14.0, 38.0, 28.0, 23.0, 27.0, 45.0, 43.0, 45.0, 34.0, 39.0, 36.0, 1072.0, 31.0, 47.0, 39.0, 40.0, 40.0, 35.0, 45.0, 40.0, 32.0, 34.0, 26.0, 18.0, 22.0, 17.0, 8.0, 13.0, 4.0, 8.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-52.4375, -50.68896484375, -48.9404296875, -47.19189453125, -45.443359375, -43.69482421875, -41.9462890625, -40.19775390625, -38.44921875, -36.70068359375, -34.9521484375, -33.20361328125, -31.455078125, -29.70654296875, -27.9580078125, -26.20947265625, -24.4609375, -22.71240234375, -20.9638671875, -19.21533203125, -17.466796875, -15.71826171875, -13.9697265625, -12.22119140625, -10.47265625, -8.72412109375, -6.9755859375, -5.22705078125, -3.478515625, -1.72998046875, 0.0185546875, 1.76708984375, 3.515625, 5.26416015625, 7.0126953125, 8.76123046875, 10.509765625, 12.25830078125, 14.0068359375, 15.75537109375, 17.50390625, 19.25244140625, 21.0009765625, 22.74951171875, 24.498046875, 26.24658203125, 27.9951171875, 29.74365234375, 31.4921875, 33.24072265625, 34.9892578125, 36.73779296875, 38.486328125, 40.23486328125, 41.9833984375, 43.73193359375, 45.48046875, 47.22900390625, 48.9775390625, 50.72607421875, 52.474609375, 54.22314453125, 55.9716796875, 57.72021484375, 59.46875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 14.0, 13.0, 19.0, 25.0, 27.0, 48.0, 69.0, 114.0, 182.0, 274.0, 449.0, 606.0, 936.0, 1419.0, 2306.0, 3686.0, 5574.0, 8727.0, 13899.0, 21832.0, 34849.0, 55328.0, 87384.0, 137702.0, 1249852.0, 171688.0, 110311.0, 69297.0, 44518.0, 27784.0, 17545.0, 10943.0, 7030.0, 4538.0, 2911.0, 1827.0, 1193.0, 776.0, 471.0, 328.0, 213.0, 154.0, 102.0, 53.0, 44.0, 26.0, 19.0, 12.0, 11.0, 4.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.34375, -9.0399169921875, -8.736083984375, -8.4322509765625, -8.12841796875, -7.8245849609375, -7.520751953125, -7.2169189453125, -6.9130859375, -6.6092529296875, -6.305419921875, -6.0015869140625, -5.69775390625, -5.3939208984375, -5.090087890625, -4.7862548828125, -4.482421875, -4.1785888671875, -3.874755859375, -3.5709228515625, -3.26708984375, -2.9632568359375, -2.659423828125, -2.3555908203125, -2.0517578125, -1.7479248046875, -1.444091796875, -1.1402587890625, -0.83642578125, -0.5325927734375, -0.228759765625, 0.0750732421875, 0.37890625, 0.6827392578125, 0.986572265625, 1.2904052734375, 1.59423828125, 1.8980712890625, 2.201904296875, 2.5057373046875, 2.8095703125, 3.1134033203125, 3.417236328125, 3.7210693359375, 4.02490234375, 4.3287353515625, 4.632568359375, 4.9364013671875, 5.240234375, 5.5440673828125, 5.847900390625, 6.1517333984375, 6.45556640625, 6.7593994140625, 7.063232421875, 7.3670654296875, 7.6708984375, 7.9747314453125, 8.278564453125, 8.5823974609375, 8.88623046875, 9.1900634765625, 9.493896484375, 9.7977294921875, 10.1015625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 12.0, 9.0, 12.0, 20.0, 33.0, 31.0, 30.0, 47.0, 50.0, 56.0, 61.0, 48.0, 54.0, 62.0, 51.0, 46.0, 38.0, 45.0, 45.0, 46.0, 37.0, 23.0, 27.0, 22.0, 14.0, 15.0, 10.0, 10.0, 7.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.022674560546875, -0.02207040786743164, -0.02146625518798828, -0.020862102508544922, -0.020257949829101562, -0.019653797149658203, -0.019049644470214844, -0.018445491790771484, -0.017841339111328125, -0.017237186431884766, -0.016633033752441406, -0.016028881072998047, -0.015424728393554688, -0.014820575714111328, -0.014216423034667969, -0.01361227035522461, -0.01300811767578125, -0.01240396499633789, -0.011799812316894531, -0.011195659637451172, -0.010591506958007812, -0.009987354278564453, -0.009383201599121094, -0.008779048919677734, -0.008174896240234375, -0.007570743560791016, -0.006966590881347656, -0.006362438201904297, -0.0057582855224609375, -0.005154132843017578, -0.004549980163574219, -0.003945827484130859, -0.0033416748046875, -0.0027375221252441406, -0.0021333694458007812, -0.0015292167663574219, -0.0009250640869140625, -0.0003209114074707031, 0.00028324127197265625, 0.0008873939514160156, 0.001491546630859375, 0.0020956993103027344, 0.0026998519897460938, 0.003304004669189453, 0.0039081573486328125, 0.004512310028076172, 0.005116462707519531, 0.005720615386962891, 0.00632476806640625, 0.006928920745849609, 0.007533073425292969, 0.008137226104736328, 0.008741378784179688, 0.009345531463623047, 0.009949684143066406, 0.010553836822509766, 0.011157989501953125, 0.011762142181396484, 0.012366294860839844, 0.012970447540283203, 0.013574600219726562, 0.014178752899169922, 0.014782905578613281, 0.01538705825805664, 0.0159912109375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 7.0, 8.0, 9.0, 16.0, 22.0, 24.0, 55.0, 53.0, 76.0, 104.0, 156.0, 201.0, 305.0, 510.0, 1010.0, 2402.0, 8767.0, 47716.0, 351413.0, 530325.0, 84954.0, 13915.0, 3418.0, 1269.0, 649.0, 385.0, 243.0, 154.0, 116.0, 66.0, 68.0, 32.0, 27.0, 20.0, 12.0, 19.0, 12.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.156005859375, -0.15099716186523438, -0.14598846435546875, -0.14097976684570312, -0.1359710693359375, -0.13096237182617188, -0.12595367431640625, -0.12094497680664062, -0.115936279296875, -0.11092758178710938, -0.10591888427734375, -0.10091018676757812, -0.0959014892578125, -0.09089279174804688, -0.08588409423828125, -0.08087539672851562, -0.07586669921875, -0.07085800170898438, -0.06584930419921875, -0.060840606689453125, -0.0558319091796875, -0.050823211669921875, -0.04581451416015625, -0.040805816650390625, -0.035797119140625, -0.030788421630859375, -0.02577972412109375, -0.020771026611328125, -0.0157623291015625, -0.010753631591796875, -0.00574493408203125, -0.000736236572265625, 0.0042724609375, 0.009281158447265625, 0.01428985595703125, 0.019298553466796875, 0.0243072509765625, 0.029315948486328125, 0.03432464599609375, 0.039333343505859375, 0.044342041015625, 0.049350738525390625, 0.05435943603515625, 0.059368133544921875, 0.0643768310546875, 0.06938552856445312, 0.07439422607421875, 0.07940292358398438, 0.08441162109375, 0.08942031860351562, 0.09442901611328125, 0.09943771362304688, 0.1044464111328125, 0.10945510864257812, 0.11446380615234375, 0.11947250366210938, 0.124481201171875, 0.12948989868164062, 0.13449859619140625, 0.13950729370117188, 0.1445159912109375, 0.14952468872070312, 0.15453338623046875, 0.15954208374023438, 0.16455078125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 11.0, 9.0, 17.0, 30.0, 38.0, 55.0, 83.0, 113.0, 131.0, 128.0, 107.0, 86.0, 68.0, 45.0, 26.0, 18.0, 12.0, 8.0, 5.0, 3.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014692848548293114, -0.014030023477971554, -0.013367198407649994, -0.012704374268651009, -0.012041548267006874, -0.011378724128007889, -0.010715899057686329, -0.010053073987364769, -0.009390248917043209, -0.00872742384672165, -0.00806459877640009, -0.007401774171739817, -0.006738949101418257, -0.006076124031096697, -0.005413299426436424, -0.004750474356114864, -0.0040876492857933044, -0.0034248242154717445, -0.0027619993779808283, -0.002099174540489912, -0.0014363494701683521, -0.0007735243998467922, -0.00011069979518651962, 0.0005521252751350403, 0.0012149503454566002, 0.0018777752993628383, 0.0025406002532690763, 0.0032034250907599926, 0.0038662501610815525, 0.004529075231403112, 0.005191899836063385, 0.005854724906384945, 0.006517549976706505, 0.007180375047028065, 0.007843200117349625, 0.00850602425634861, 0.009168850257992744, 0.00983167439699173, 0.01049449946731329, 0.01115732453763485, 0.01182014960795641, 0.01248297467827797, 0.01314579974859953, 0.01380862481892109, 0.014471448957920074, 0.015134274959564209, 0.015797099098563194, 0.01645992323756218, 0.017122749239206314, 0.0177855733782053, 0.018448399379849434, 0.01911122351884842, 0.019774049520492554, 0.02043687365949154, 0.021099697798490524, 0.02176252380013466, 0.022425349801778793, 0.02308817394077778, 0.023750999942421913, 0.0244138240814209, 0.025076650083065033, 0.025739474222064018, 0.026402298361063004, 0.027065124362707138, 0.027727948501706123]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 11.0, 10.0, 15.0, 10.0, 23.0, 18.0, 23.0, 24.0, 29.0, 25.0, 31.0, 37.0, 37.0, 43.0, 29.0, 45.0, 41.0, 37.0, 38.0, 32.0, 36.0, 39.0, 28.0, 28.0, 25.0, 22.0, 29.0, 25.0, 22.0, 24.0, 25.0, 18.0, 10.0, 11.0, 15.0, 9.0, 7.0, 8.0, 6.0, 3.0, 9.0, 4.0, 10.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.008817911148071289, -0.008537821471691132, -0.008257731795310974, -0.007977642118930817, -0.007697552442550659, -0.007417462766170502, -0.007137373089790344, -0.006857283413410187, -0.006577193737030029, -0.006297104060649872, -0.006017014384269714, -0.005736924707889557, -0.005456835031509399, -0.005176745355129242, -0.0048966556787490845, -0.004616566002368927, -0.0043364763259887695, -0.004056386649608612, -0.0037762969732284546, -0.003496207296848297, -0.0032161176204681396, -0.002936027944087982, -0.0026559382677078247, -0.0023758485913276672, -0.0020957589149475098, -0.0018156692385673523, -0.0015355795621871948, -0.0012554898858070374, -0.0009754002094268799, -0.0006953105330467224, -0.00041522085666656494, -0.00013513118028640747, 0.00014495849609375, 0.00042504817247390747, 0.0007051378488540649, 0.0009852275252342224, 0.0012653172016143799, 0.0015454068779945374, 0.0018254965543746948, 0.0021055862307548523, 0.0023856759071350098, 0.0026657655835151672, 0.0029458552598953247, 0.003225944936275482, 0.0035060346126556396, 0.003786124289035797, 0.004066213965415955, 0.004346303641796112, 0.0046263933181762695, 0.004906482994556427, 0.0051865726709365845, 0.005466662347316742, 0.005746752023696899, 0.006026841700077057, 0.006306931376457214, 0.006587021052837372, 0.006867110729217529, 0.007147200405597687, 0.007427290081977844, 0.007707379758358002, 0.00798746943473816, 0.008267559111118317, 0.008547648787498474, 0.008827738463878632, 0.009107828140258789]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 9.0, 4.0, 11.0, 9.0, 10.0, 14.0, 11.0, 21.0, 14.0, 20.0, 27.0, 29.0, 32.0, 37.0, 40.0, 24.0, 37.0, 50.0, 38.0, 39.0, 31.0, 35.0, 32.0, 44.0, 42.0, 36.0, 39.0, 39.0, 30.0, 25.0, 33.0, 15.0, 20.0, 9.0, 12.0, 13.0, 15.0, 12.0, 11.0, 8.0, 8.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-79.5, -77.1416015625, -74.783203125, -72.4248046875, -70.06640625, -67.7080078125, -65.349609375, -62.9912109375, -60.6328125, -58.2744140625, -55.916015625, -53.5576171875, -51.19921875, -48.8408203125, -46.482421875, -44.1240234375, -41.765625, -39.4072265625, -37.048828125, -34.6904296875, -32.33203125, -29.9736328125, -27.615234375, -25.2568359375, -22.8984375, -20.5400390625, -18.181640625, -15.8232421875, -13.46484375, -11.1064453125, -8.748046875, -6.3896484375, -4.03125, -1.6728515625, 0.685546875, 3.0439453125, 5.40234375, 7.7607421875, 10.119140625, 12.4775390625, 14.8359375, 17.1943359375, 19.552734375, 21.9111328125, 24.26953125, 26.6279296875, 28.986328125, 31.3447265625, 33.703125, 36.0615234375, 38.419921875, 40.7783203125, 43.13671875, 45.4951171875, 47.853515625, 50.2119140625, 52.5703125, 54.9287109375, 57.287109375, 59.6455078125, 62.00390625, 64.3623046875, 66.720703125, 69.0791015625, 71.4375]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 13.0, 7.0, 12.0, 15.0, 16.0, 23.0, 38.0, 39.0, 67.0, 91.0, 132.0, 202.0, 324.0, 580.0, 1063.0, 1980.0, 3812.0, 8782.0, 25291.0, 110499.0, 571110.0, 253422.0, 45993.0, 13569.0, 5454.0, 2632.0, 1353.0, 803.0, 434.0, 255.0, 156.0, 114.0, 76.0, 54.0, 22.0, 25.0, 23.0, 21.0, 14.0, 7.0, 11.0, 4.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-21.390625, -20.75634765625, -20.1220703125, -19.48779296875, -18.853515625, -18.21923828125, -17.5849609375, -16.95068359375, -16.31640625, -15.68212890625, -15.0478515625, -14.41357421875, -13.779296875, -13.14501953125, -12.5107421875, -11.87646484375, -11.2421875, -10.60791015625, -9.9736328125, -9.33935546875, -8.705078125, -8.07080078125, -7.4365234375, -6.80224609375, -6.16796875, -5.53369140625, -4.8994140625, -4.26513671875, -3.630859375, -2.99658203125, -2.3623046875, -1.72802734375, -1.09375, -0.45947265625, 0.1748046875, 0.80908203125, 1.443359375, 2.07763671875, 2.7119140625, 3.34619140625, 3.98046875, 4.61474609375, 5.2490234375, 5.88330078125, 6.517578125, 7.15185546875, 7.7861328125, 8.42041015625, 9.0546875, 9.68896484375, 10.3232421875, 10.95751953125, 11.591796875, 12.22607421875, 12.8603515625, 13.49462890625, 14.12890625, 14.76318359375, 15.3974609375, 16.03173828125, 16.666015625, 17.30029296875, 17.9345703125, 18.56884765625, 19.203125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 8.0, 9.0, 13.0, 18.0, 25.0, 37.0, 36.0, 49.0, 51.0, 80.0, 69.0, 99.0, 2124.0, 74.0, 74.0, 63.0, 47.0, 44.0, 34.0, 20.0, 26.0, 11.0, 12.0, 9.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-213.125, -206.33984375, -199.5546875, -192.76953125, -185.984375, -179.19921875, -172.4140625, -165.62890625, -158.84375, -152.05859375, -145.2734375, -138.48828125, -131.703125, -124.91796875, -118.1328125, -111.34765625, -104.5625, -97.77734375, -90.9921875, -84.20703125, -77.421875, -70.63671875, -63.8515625, -57.06640625, -50.28125, -43.49609375, -36.7109375, -29.92578125, -23.140625, -16.35546875, -9.5703125, -2.78515625, 4.0, 10.78515625, 17.5703125, 24.35546875, 31.140625, 37.92578125, 44.7109375, 51.49609375, 58.28125, 65.06640625, 71.8515625, 78.63671875, 85.421875, 92.20703125, 98.9921875, 105.77734375, 112.5625, 119.34765625, 126.1328125, 132.91796875, 139.703125, 146.48828125, 153.2734375, 160.05859375, 166.84375, 173.62890625, 180.4140625, 187.19921875, 193.984375, 200.76953125, 207.5546875, 214.33984375, 221.125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 10.0, 9.0, 14.0, 16.0, 23.0, 36.0, 59.0, 80.0, 120.0, 190.0, 318.0, 627.0, 1446.0, 4216.0, 43993.0, 2984604.0, 99964.0, 6366.0, 1825.0, 773.0, 365.0, 212.0, 135.0, 99.0, 50.0, 39.0, 24.0, 22.0, 17.0, 8.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.21875, -44.7568359375, -43.294921875, -41.8330078125, -40.37109375, -38.9091796875, -37.447265625, -35.9853515625, -34.5234375, -33.0615234375, -31.599609375, -30.1376953125, -28.67578125, -27.2138671875, -25.751953125, -24.2900390625, -22.828125, -21.3662109375, -19.904296875, -18.4423828125, -16.98046875, -15.5185546875, -14.056640625, -12.5947265625, -11.1328125, -9.6708984375, -8.208984375, -6.7470703125, -5.28515625, -3.8232421875, -2.361328125, -0.8994140625, 0.5625, 2.0244140625, 3.486328125, 4.9482421875, 6.41015625, 7.8720703125, 9.333984375, 10.7958984375, 12.2578125, 13.7197265625, 15.181640625, 16.6435546875, 18.10546875, 19.5673828125, 21.029296875, 22.4912109375, 23.953125, 25.4150390625, 26.876953125, 28.3388671875, 29.80078125, 31.2626953125, 32.724609375, 34.1865234375, 35.6484375, 37.1103515625, 38.572265625, 40.0341796875, 41.49609375, 42.9580078125, 44.419921875, 45.8818359375, 47.34375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 35.0, 179.0, 642.0, 111.0, 18.0, 8.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1493.390869140625, -1466.4288330078125, -1439.466796875, -1412.5047607421875, -1385.542724609375, -1358.580810546875, -1331.6187744140625, -1304.65673828125, -1277.6947021484375, -1250.732666015625, -1223.7706298828125, -1196.80859375, -1169.8466796875, -1142.8846435546875, -1115.922607421875, -1088.9605712890625, -1061.99853515625, -1035.0364990234375, -1008.074462890625, -981.1124877929688, -954.1504516601562, -927.1884155273438, -900.2264404296875, -873.264404296875, -846.3023681640625, -819.34033203125, -792.3782958984375, -765.4163208007812, -738.4542846679688, -711.4922485351562, -684.5302734375, -657.5682373046875, -630.6062622070312, -603.6442260742188, -576.6822509765625, -549.72021484375, -522.7581787109375, -495.796142578125, -468.8341369628906, -441.87213134765625, -414.91009521484375, -387.94805908203125, -360.9860534667969, -334.0240478515625, -307.06201171875, -280.0999755859375, -253.13796997070312, -226.1759490966797, -199.21392822265625, -172.2519073486328, -145.28988647460938, -118.32786560058594, -91.3658447265625, -64.40382385253906, -37.441802978515625, -10.479782104492188, 16.48223876953125, 43.44425964355469, 70.40628051757812, 97.36830139160156, 124.330322265625, 151.29234313964844, 178.25436401367188, 205.2163848876953, 232.17840576171875]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 12.0, 4.0, 10.0, 13.0, 22.0, 18.0, 18.0, 24.0, 19.0, 32.0, 43.0, 44.0, 42.0, 39.0, 52.0, 58.0, 46.0, 54.0, 53.0, 44.0, 44.0, 53.0, 44.0, 24.0, 37.0, 24.0, 21.0, 19.0, 11.0, 20.0, 10.0, 10.0, 6.0, 4.0, 1.0, 7.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-214.85885620117188, -208.4850311279297, -202.11122131347656, -195.73739624023438, -189.3635711669922, -182.98974609375, -176.61593627929688, -170.2421112060547, -163.8682861328125, -157.4944610595703, -151.1206512451172, -144.746826171875, -138.3730010986328, -131.99917602539062, -125.6253662109375, -119.25154113769531, -112.87773132324219, -106.50391387939453, -100.13008880615234, -93.75627136230469, -87.3824462890625, -81.00862884521484, -74.63481140136719, -68.260986328125, -61.887168884277344, -55.51334762573242, -49.1395263671875, -42.765708923339844, -36.39188766479492, -30.01806640625, -23.644248962402344, -17.270427703857422, -10.8966064453125, -4.5227861404418945, 1.851034164428711, 8.224853515625, 14.598674774169922, 20.972496032714844, 27.3463134765625, 33.72013473510742, 40.093955993652344, 46.467777252197266, 52.84159851074219, 59.215415954589844, 65.5892333984375, 71.96305847167969, 78.33687591552734, 84.710693359375, 91.08451843261719, 97.45833587646484, 103.83216094970703, 110.20597839355469, 116.57980346679688, 122.95362091064453, 129.3274383544922, 135.70126342773438, 142.0750732421875, 148.4488983154297, 154.8227081298828, 161.196533203125, 167.5703582763672, 173.94418334960938, 180.3179931640625, 186.6918182373047, 193.06564331054688]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 8.0, 7.0, 17.0, 17.0, 24.0, 25.0, 33.0, 24.0, 46.0, 70.0, 92.0, 120.0, 168.0, 217.0, 295.0, 417.0, 640.0, 793.0, 1382.0, 1040823.0, 868.0, 637.0, 521.0, 339.0, 222.0, 187.0, 118.0, 92.0, 76.0, 57.0, 42.0, 41.0, 30.0, 21.0, 12.0, 13.0, 22.0, 11.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.26725387573242, -44.62516784667969, -42.98308181762695, -41.34099578857422, -39.69891357421875, -38.05682373046875, -36.41474151611328, -34.77265548706055, -33.13056945800781, -31.488483428955078, -29.846397399902344, -28.204313278198242, -26.562227249145508, -24.920141220092773, -23.278057098388672, -21.635971069335938, -19.993885040283203, -18.35179901123047, -16.709712982177734, -15.067628860473633, -13.425542831420898, -11.783456802368164, -10.141371726989746, -8.499286651611328, -6.857200622558594, -5.215115070343018, -3.5730295181274414, -1.9309439659118652, -0.28885841369628906, 1.3532276153564453, 2.9953126907348633, 4.637397766113281, 6.27947998046875, 7.921565532684326, 9.563651084899902, 11.20573616027832, 12.847822189331055, 14.489908218383789, 16.13199234008789, 17.774078369140625, 19.41616439819336, 21.058250427246094, 22.700336456298828, 24.34242057800293, 25.984506607055664, 27.6265926361084, 29.2686767578125, 30.910762786865234, 32.55284881591797, 34.1949348449707, 35.83702087402344, 37.47910690307617, 39.121192932128906, 40.763275146484375, 42.40536117553711, 44.047447204589844, 45.68953323364258, 47.33161926269531, 48.97370529174805, 50.61579132080078, 52.25787353515625, 53.89996337890625, 55.54204559326172, 57.18413162231445, 58.82621765136719]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 12.0, 12.0, 10.0, 11.0, 31.0, 149.0, 51462728.0, 114.0, 36.0, 12.0, 5.0, 5.0, 4.0, 4.0, 6.0, 3.0, 5.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8412.0771484375, -8002.13037109375, -7592.18359375, -7182.2373046875, -6772.2900390625, -6362.34375, -5952.39697265625, -5542.4501953125, -5132.50341796875, -4722.556640625, -4312.60986328125, -3902.663330078125, -3492.716552734375, -3082.769775390625, -2672.8232421875, -2262.87646484375, -1852.9296875, -1442.98291015625, -1033.0362548828125, -623.089599609375, -213.142822265625, 196.803955078125, 606.75048828125, 1016.697265625, 1426.64404296875, 1836.5908203125, 2246.53759765625, 2656.484130859375, 3066.430908203125, 3476.377685546875, 3886.32421875, 4296.27099609375, 4706.216796875, 5116.16357421875, 5526.1103515625, 5936.056640625, 6346.00390625, 6755.9501953125, 7165.89697265625, 7575.84375, 7985.79052734375, 8395.7373046875, 8805.68359375, 9215.630859375, 9625.5771484375, 10035.5244140625, 10445.470703125, 10855.41796875, 11265.3642578125, 11675.310546875, 12085.2578125, 12495.2041015625, 12905.1513671875, 13315.09765625, 13725.044921875, 14134.9912109375, 14544.9375, 14954.8837890625, 15364.8310546875, 15774.77734375, 16184.724609375, 16594.671875, 17004.6171875, 17414.564453125, 17824.51171875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 7.0, 6.0, 18.0, 19.0, 27.0, 25.0, 54.0, 90.0, 114.0, 154.0, 237.0, 296.0, 427.0, 577.0, 944.0, 1491.0, 2099.0, 3120.0, 4744.0, 7354.0, 11174.0, 17590.0, 27807.0, 42489.0, 65475.0, 100597.0, 161749.0, 266913.0, 501835.0, 3710630.0, 589430.0, 292243.0, 175108.0, 109623.0, 69264.0, 44425.0, 28995.0, 18415.0, 12532.0, 7869.0, 5245.0, 3554.0, 2236.0, 1518.0, 987.0, 600.0, 470.0, 281.0, 176.0, 114.0, 87.0, 70.0, 49.0, 29.0, 28.0, 12.0, 7.0, 6.0, 5.0, 6.0, 2.0, 6.0], "bins": [-4.98046875, -4.82275390625, -4.6650390625, -4.50732421875, -4.349609375, -4.19189453125, -4.0341796875, -3.87646484375, -3.71875, -3.56103515625, -3.4033203125, -3.24560546875, -3.087890625, -2.93017578125, -2.7724609375, -2.61474609375, -2.45703125, -2.29931640625, -2.1416015625, -1.98388671875, -1.826171875, -1.66845703125, -1.5107421875, -1.35302734375, -1.1953125, -1.03759765625, -0.8798828125, -0.72216796875, -0.564453125, -0.40673828125, -0.2490234375, -0.09130859375, 0.06640625, 0.22412109375, 0.3818359375, 0.53955078125, 0.697265625, 0.85498046875, 1.0126953125, 1.17041015625, 1.328125, 1.48583984375, 1.6435546875, 1.80126953125, 1.958984375, 2.11669921875, 2.2744140625, 2.43212890625, 2.58984375, 2.74755859375, 2.9052734375, 3.06298828125, 3.220703125, 3.37841796875, 3.5361328125, 3.69384765625, 3.8515625, 4.00927734375, 4.1669921875, 4.32470703125, 4.482421875, 4.64013671875, 4.7978515625, 4.95556640625, 5.11328125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 5.0, 6.0, 7.0, 8.0, 13.0, 9.0, 16.0, 10.0, 15.0, 18.0, 17.0, 22.0, 23.0, 28.0, 26.0, 20.0, 33.0, 39.0, 53.0, 47.0, 74.0, 342.0, 640.0, 120.0, 41.0, 29.0, 36.0, 47.0, 32.0, 46.0, 32.0, 25.0, 20.0, 26.0, 16.0, 15.0, 14.0, 16.0, 11.0, 7.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.500244140625, -15.95361328125, -15.406982421875, -14.8603515625, -14.313720703125, -13.76708984375, -13.220458984375, -12.673828125, -12.127197265625, -11.58056640625, -11.033935546875, -10.4873046875, -9.940673828125, -9.39404296875, -8.847412109375, -8.30078125, -7.754150390625, -7.20751953125, -6.660888671875, -6.1142578125, -5.567626953125, -5.02099609375, -4.474365234375, -3.927734375, -3.381103515625, -2.83447265625, -2.287841796875, -1.7412109375, -1.194580078125, -0.64794921875, -0.101318359375, 0.4453125, 0.991943359375, 1.53857421875, 2.085205078125, 2.6318359375, 3.178466796875, 3.72509765625, 4.271728515625, 4.818359375, 5.364990234375, 5.91162109375, 6.458251953125, 7.0048828125, 7.551513671875, 8.09814453125, 8.644775390625, 9.19140625, 9.738037109375, 10.28466796875, 10.831298828125, 11.3779296875, 11.924560546875, 12.47119140625, 13.017822265625, 13.564453125, 14.111083984375, 14.65771484375, 15.204345703125, 15.7509765625, 16.297607421875, 16.84423828125, 17.390869140625, 17.9375]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 9.0, 17.0, 21.0, 21.0, 31.0, 37.0, 67.0, 118.0, 202.0, 307.0, 399.0, 527.0, 858.0, 1326.0, 2069.0, 2933.0, 4740.0, 7505.0, 11972.0, 19286.0, 33290.0, 58605.0, 107835.0, 215257.0, 488625.0, 3906621.0, 813894.0, 293322.0, 141828.0, 74140.0, 41390.0, 24292.0, 14582.0, 9115.0, 5665.0, 3522.0, 2427.0, 1550.0, 990.0, 642.0, 448.0, 309.0, 238.0, 167.0, 81.0, 53.0, 30.0, 17.0, 24.0, 13.0, 10.0, 17.0, 2.0, 0.0, 3.0], "bins": [-7.75, -7.52667236328125, -7.3033447265625, -7.08001708984375, -6.856689453125, -6.63336181640625, -6.4100341796875, -6.18670654296875, -5.96337890625, -5.74005126953125, -5.5167236328125, -5.29339599609375, -5.070068359375, -4.84674072265625, -4.6234130859375, -4.40008544921875, -4.1767578125, -3.95343017578125, -3.7301025390625, -3.50677490234375, -3.283447265625, -3.06011962890625, -2.8367919921875, -2.61346435546875, -2.39013671875, -2.16680908203125, -1.9434814453125, -1.72015380859375, -1.496826171875, -1.27349853515625, -1.0501708984375, -0.82684326171875, -0.603515625, -0.38018798828125, -0.1568603515625, 0.06646728515625, 0.289794921875, 0.51312255859375, 0.7364501953125, 0.95977783203125, 1.18310546875, 1.40643310546875, 1.6297607421875, 1.85308837890625, 2.076416015625, 2.29974365234375, 2.5230712890625, 2.74639892578125, 2.9697265625, 3.19305419921875, 3.4163818359375, 3.63970947265625, 3.863037109375, 4.08636474609375, 4.3096923828125, 4.53302001953125, 4.75634765625, 4.97967529296875, 5.2030029296875, 5.42633056640625, 5.649658203125, 5.87298583984375, 6.0963134765625, 6.31964111328125, 6.54296875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 6.0, 3.0, 9.0, 9.0, 8.0, 12.0, 7.0, 13.0, 16.0, 14.0, 21.0, 20.0, 22.0, 25.0, 32.0, 38.0, 41.0, 50.0, 60.0, 126.0, 531.0, 391.0, 119.0, 54.0, 35.0, 38.0, 33.0, 42.0, 39.0, 40.0, 28.0, 27.0, 23.0, 20.0, 16.0, 15.0, 8.0, 7.0, 5.0, 4.0, 5.0, 6.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-11.5546875, -11.192138671875, -10.82958984375, -10.467041015625, -10.1044921875, -9.741943359375, -9.37939453125, -9.016845703125, -8.654296875, -8.291748046875, -7.92919921875, -7.566650390625, -7.2041015625, -6.841552734375, -6.47900390625, -6.116455078125, -5.75390625, -5.391357421875, -5.02880859375, -4.666259765625, -4.3037109375, -3.941162109375, -3.57861328125, -3.216064453125, -2.853515625, -2.490966796875, -2.12841796875, -1.765869140625, -1.4033203125, -1.040771484375, -0.67822265625, -0.315673828125, 0.046875, 0.409423828125, 0.77197265625, 1.134521484375, 1.4970703125, 1.859619140625, 2.22216796875, 2.584716796875, 2.947265625, 3.309814453125, 3.67236328125, 4.034912109375, 4.3974609375, 4.760009765625, 5.12255859375, 5.485107421875, 5.84765625, 6.210205078125, 6.57275390625, 6.935302734375, 7.2978515625, 7.660400390625, 8.02294921875, 8.385498046875, 8.748046875, 9.110595703125, 9.47314453125, 9.835693359375, 10.1982421875, 10.560791015625, 10.92333984375, 11.285888671875, 11.6484375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 0.0, 4.0, 0.0, 9.0, 16.0, 10.0, 10.0, 17.0, 33.0, 40.0, 31.0, 42.0, 67.0, 102.0, 145.0, 125.0, 216.0, 237.0, 307.0, 483.0, 613.0, 800.0, 1146.0, 1709.0, 2496.0, 4286.0, 7230.0, 14983.0, 35570.0, 123251.0, 5875749.0, 144795.0, 39224.0, 16203.0, 7901.0, 4494.0, 2732.0, 1709.0, 1230.0, 943.0, 611.0, 434.0, 337.0, 241.0, 220.0, 161.0, 103.0, 77.0, 82.0, 53.0, 32.0, 30.0, 14.0, 18.0, 22.0, 11.0, 10.0, 5.0, 12.0, 9.0, 8.0], "bins": [-19.125, -18.554931640625, -17.98486328125, -17.414794921875, -16.8447265625, -16.274658203125, -15.70458984375, -15.134521484375, -14.564453125, -13.994384765625, -13.42431640625, -12.854248046875, -12.2841796875, -11.714111328125, -11.14404296875, -10.573974609375, -10.00390625, -9.433837890625, -8.86376953125, -8.293701171875, -7.7236328125, -7.153564453125, -6.58349609375, -6.013427734375, -5.443359375, -4.873291015625, -4.30322265625, -3.733154296875, -3.1630859375, -2.593017578125, -2.02294921875, -1.452880859375, -0.8828125, -0.312744140625, 0.25732421875, 0.827392578125, 1.3974609375, 1.967529296875, 2.53759765625, 3.107666015625, 3.677734375, 4.247802734375, 4.81787109375, 5.387939453125, 5.9580078125, 6.528076171875, 7.09814453125, 7.668212890625, 8.23828125, 8.808349609375, 9.37841796875, 9.948486328125, 10.5185546875, 11.088623046875, 11.65869140625, 12.228759765625, 12.798828125, 13.368896484375, 13.93896484375, 14.509033203125, 15.0791015625, 15.649169921875, 16.21923828125, 16.789306640625, 17.359375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 4.0, 6.0, 11.0, 9.0, 7.0, 6.0, 13.0, 22.0, 15.0, 25.0, 17.0, 19.0, 27.0, 28.0, 28.0, 29.0, 45.0, 56.0, 62.0, 108.0, 248.0, 465.0, 209.0, 95.0, 72.0, 41.0, 36.0, 33.0, 48.0, 28.0, 27.0, 30.0, 26.0, 15.0, 21.0, 12.0, 15.0, 10.0, 12.0, 13.0, 10.0, 6.0, 6.0, 4.0, 2.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.69140625, -7.46063232421875, -7.2298583984375, -6.99908447265625, -6.768310546875, -6.53753662109375, -6.3067626953125, -6.07598876953125, -5.84521484375, -5.61444091796875, -5.3836669921875, -5.15289306640625, -4.922119140625, -4.69134521484375, -4.4605712890625, -4.22979736328125, -3.9990234375, -3.76824951171875, -3.5374755859375, -3.30670166015625, -3.075927734375, -2.84515380859375, -2.6143798828125, -2.38360595703125, -2.15283203125, -1.92205810546875, -1.6912841796875, -1.46051025390625, -1.229736328125, -0.99896240234375, -0.7681884765625, -0.53741455078125, -0.306640625, -0.07586669921875, 0.1549072265625, 0.38568115234375, 0.616455078125, 0.84722900390625, 1.0780029296875, 1.30877685546875, 1.53955078125, 1.77032470703125, 2.0010986328125, 2.23187255859375, 2.462646484375, 2.69342041015625, 2.9241943359375, 3.15496826171875, 3.3857421875, 3.61651611328125, 3.8472900390625, 4.07806396484375, 4.308837890625, 4.53961181640625, 4.7703857421875, 5.00115966796875, 5.23193359375, 5.46270751953125, 5.6934814453125, 5.92425537109375, 6.155029296875, 6.38580322265625, 6.6165771484375, 6.84735107421875, 7.078125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 5.0, 10.0, 40.0, 63.0, 115.0, 223.0, 242.0, 121.0, 77.0, 27.0, 23.0, 15.0, 12.0, 9.0, 3.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.559688568115234, -26.752370834350586, -25.945053100585938, -25.137737274169922, -24.330419540405273, -23.523101806640625, -22.715784072875977, -21.908466339111328, -21.10114860534668, -20.29383087158203, -19.486513137817383, -18.679195404052734, -17.87187957763672, -17.06456184387207, -16.257244110107422, -15.449926376342773, -14.642609596252441, -13.835291862487793, -13.027975082397461, -12.220657348632812, -11.413339614868164, -10.606021881103516, -9.798705101013184, -8.991387367248535, -8.184070587158203, -7.376753330230713, -6.5694355964660645, -5.762118339538574, -4.954800605773926, -4.1474833488464355, -3.3401660919189453, -2.532848358154297, -1.7255306243896484, -0.9182131886482239, -0.11089575290679932, 0.6964216232299805, 1.5037391185760498, 2.311056613922119, 3.1183738708496094, 3.925691604614258, 4.733008861541748, 5.540326118469238, 6.347643852233887, 7.154961109161377, 7.962278366088867, 8.769596099853516, 9.576913833618164, 10.384231567382812, 11.191548347473145, 11.998866081237793, 12.806182861328125, 13.613500595092773, 14.420818328857422, 15.22813606262207, 16.03545379638672, 16.842769622802734, 17.650087356567383, 18.45740509033203, 19.26472282409668, 20.072040557861328, 20.879356384277344, 21.686674118041992, 22.49399185180664, 23.30130958557129, 24.108627319335938]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 10.0, 9.0, 10.0, 20.0, 13.0, 17.0, 24.0, 18.0, 29.0, 24.0, 29.0, 30.0, 41.0, 37.0, 43.0, 49.0, 50.0, 31.0, 45.0, 50.0, 41.0, 28.0, 52.0, 39.0, 39.0, 32.0, 36.0, 24.0, 22.0, 20.0, 11.0, 8.0, 15.0, 8.0, 11.0, 6.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-11.969585418701172, -11.603760719299316, -11.237936973571777, -10.872112274169922, -10.506288528442383, -10.140463829040527, -9.774639129638672, -9.408815383911133, -9.042990684509277, -8.677165985107422, -8.311342239379883, -7.945517539978027, -7.57969331741333, -7.213869094848633, -6.8480448722839355, -6.482220649719238, -6.116396427154541, -5.750572204589844, -5.3847479820251465, -5.018923759460449, -4.653099060058594, -4.2872748374938965, -3.921450614929199, -3.555626153945923, -3.1898019313812256, -2.8239777088165283, -2.458153247833252, -2.0923290252685547, -1.7265046834945679, -1.360680341720581, -0.9948561191558838, -0.6290316581726074, -0.26320743560791016, 0.10261687636375427, 0.4684411883354187, 0.8342654705047607, 1.2000898122787476, 1.5659141540527344, 1.9317383766174316, 2.297562837600708, 2.6633870601654053, 3.0292112827301025, 3.395035743713379, 3.760859966278076, 4.126684188842773, 4.492508888244629, 4.858332633972168, 5.224157333374023, 5.589981555938721, 5.955805778503418, 6.321630001068115, 6.6874542236328125, 7.053278923034668, 7.419103145599365, 7.7849273681640625, 8.150752067565918, 8.516575813293457, 8.882400512695312, 9.248224258422852, 9.614048957824707, 9.979872703552246, 10.345697402954102, 10.71152114868164, 11.077345848083496, 11.443170547485352]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 10.0, 19.0, 15.0, 21.0, 38.0, 40.0, 52.0, 73.0, 94.0, 109.0, 146.0, 197.0, 258.0, 315.0, 465.0, 651.0, 985.0, 1494.0, 2396.0, 4032.0, 7534.0, 15390.0, 40752.0, 3577404.0, 473719.0, 36671.0, 13747.0, 6909.0, 3680.0, 2245.0, 1445.0, 1049.0, 650.0, 448.0, 369.0, 248.0, 165.0, 129.0, 87.0, 67.0, 45.0, 30.0, 20.0, 23.0, 6.0, 9.0, 9.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0], "bins": [-0.341796875, -0.3320159912109375, -0.322235107421875, -0.3124542236328125, -0.30267333984375, -0.2928924560546875, -0.283111572265625, -0.2733306884765625, -0.2635498046875, -0.2537689208984375, -0.243988037109375, -0.2342071533203125, -0.22442626953125, -0.2146453857421875, -0.204864501953125, -0.1950836181640625, -0.185302734375, -0.1755218505859375, -0.165740966796875, -0.1559600830078125, -0.14617919921875, -0.1363983154296875, -0.126617431640625, -0.1168365478515625, -0.1070556640625, -0.0972747802734375, -0.087493896484375, -0.0777130126953125, -0.06793212890625, -0.0581512451171875, -0.048370361328125, -0.0385894775390625, -0.02880859375, -0.0190277099609375, -0.009246826171875, 0.0005340576171875, 0.01031494140625, 0.0200958251953125, 0.029876708984375, 0.0396575927734375, 0.0494384765625, 0.0592193603515625, 0.069000244140625, 0.0787811279296875, 0.08856201171875, 0.0983428955078125, 0.108123779296875, 0.1179046630859375, 0.127685546875, 0.1374664306640625, 0.147247314453125, 0.1570281982421875, 0.16680908203125, 0.1765899658203125, 0.186370849609375, 0.1961517333984375, 0.2059326171875, 0.2157135009765625, 0.225494384765625, 0.2352752685546875, 0.24505615234375, 0.2548370361328125, 0.264617919921875, 0.2743988037109375, 0.2841796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 6.0, 9.0, 8.0, 5.0, 16.0, 19.0, 23.0, 510.0, 282.0, 31.0, 20.0, 10.0, 12.0, 10.0, 5.0, 8.0, 1.0, 4.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.038909912109375, -0.0377955436706543, -0.036681175231933594, -0.03556680679321289, -0.03445243835449219, -0.033338069915771484, -0.03222370147705078, -0.031109333038330078, -0.029994964599609375, -0.028880596160888672, -0.02776622772216797, -0.026651859283447266, -0.025537490844726562, -0.02442312240600586, -0.023308753967285156, -0.022194385528564453, -0.02108001708984375, -0.019965648651123047, -0.018851280212402344, -0.01773691177368164, -0.016622543334960938, -0.015508174896240234, -0.014393806457519531, -0.013279438018798828, -0.012165069580078125, -0.011050701141357422, -0.009936332702636719, -0.008821964263916016, -0.0077075958251953125, -0.006593227386474609, -0.005478858947753906, -0.004364490509033203, -0.0032501220703125, -0.002135753631591797, -0.0010213851928710938, 9.298324584960938e-05, 0.0012073516845703125, 0.0023217201232910156, 0.0034360885620117188, 0.004550457000732422, 0.005664825439453125, 0.006779193878173828, 0.007893562316894531, 0.009007930755615234, 0.010122299194335938, 0.01123666763305664, 0.012351036071777344, 0.013465404510498047, 0.01457977294921875, 0.015694141387939453, 0.016808509826660156, 0.01792287826538086, 0.019037246704101562, 0.020151615142822266, 0.02126598358154297, 0.022380352020263672, 0.023494720458984375, 0.024609088897705078, 0.02572345733642578, 0.026837825775146484, 0.027952194213867188, 0.02906656265258789, 0.030180931091308594, 0.0312952995300293, 0.03240966796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 8.0, 13.0, 14.0, 16.0, 21.0, 23.0, 27.0, 51.0, 62.0, 103.0, 139.0, 249.0, 460.0, 1074.0, 3074.0, 12072.0, 60596.0, 848251.0, 3146459.0, 96679.0, 17528.0, 4555.0, 1552.0, 539.0, 255.0, 141.0, 75.0, 65.0, 44.0, 41.0, 22.0, 23.0, 14.0, 10.0, 9.0, 6.0, 1.0, 4.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.51904296875, -0.5046730041503906, -0.49030303955078125, -0.4759330749511719, -0.4615631103515625, -0.4471931457519531, -0.43282318115234375, -0.4184532165527344, -0.404083251953125, -0.3897132873535156, -0.37534332275390625, -0.3609733581542969, -0.3466033935546875, -0.3322334289550781, -0.31786346435546875, -0.3034934997558594, -0.28912353515625, -0.2747535705566406, -0.26038360595703125, -0.24601364135742188, -0.2316436767578125, -0.21727371215820312, -0.20290374755859375, -0.18853378295898438, -0.174163818359375, -0.15979385375976562, -0.14542388916015625, -0.13105392456054688, -0.1166839599609375, -0.10231399536132812, -0.08794403076171875, -0.07357406616210938, -0.0592041015625, -0.044834136962890625, -0.03046417236328125, -0.016094207763671875, -0.0017242431640625, 0.012645721435546875, 0.02701568603515625, 0.041385650634765625, 0.055755615234375, 0.07012557983398438, 0.08449554443359375, 0.09886550903320312, 0.1132354736328125, 0.12760543823242188, 0.14197540283203125, 0.15634536743164062, 0.17071533203125, 0.18508529663085938, 0.19945526123046875, 0.21382522583007812, 0.2281951904296875, 0.24256515502929688, 0.25693511962890625, 0.2713050842285156, 0.285675048828125, 0.3000450134277344, 0.31441497802734375, 0.3287849426269531, 0.3431549072265625, 0.3575248718261719, 0.37189483642578125, 0.3862648010253906, 0.400634765625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 9.0, 5.0, 11.0, 16.0, 14.0, 15.0, 22.0, 29.0, 44.0, 45.0, 73.0, 79.0, 94.0, 111.0, 184.0, 267.0, 573.0, 1177.0, 423.0, 213.0, 150.0, 97.0, 83.0, 76.0, 46.0, 52.0, 30.0, 27.0, 27.0, 17.0, 12.0, 16.0, 11.0, 4.0, 4.0, 5.0, 2.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.08258056640625, -0.0803070068359375, -0.078033447265625, -0.0757598876953125, -0.073486328125, -0.0712127685546875, -0.068939208984375, -0.0666656494140625, -0.06439208984375, -0.0621185302734375, -0.059844970703125, -0.0575714111328125, -0.0552978515625, -0.0530242919921875, -0.050750732421875, -0.0484771728515625, -0.04620361328125, -0.0439300537109375, -0.041656494140625, -0.0393829345703125, -0.037109375, -0.0348358154296875, -0.032562255859375, -0.0302886962890625, -0.02801513671875, -0.0257415771484375, -0.023468017578125, -0.0211944580078125, -0.0189208984375, -0.0166473388671875, -0.014373779296875, -0.0121002197265625, -0.00982666015625, -0.0075531005859375, -0.005279541015625, -0.0030059814453125, -0.000732421875, 0.0015411376953125, 0.003814697265625, 0.0060882568359375, 0.00836181640625, 0.0106353759765625, 0.012908935546875, 0.0151824951171875, 0.0174560546875, 0.0197296142578125, 0.022003173828125, 0.0242767333984375, 0.02655029296875, 0.0288238525390625, 0.031097412109375, 0.0333709716796875, 0.03564453125, 0.0379180908203125, 0.040191650390625, 0.0424652099609375, 0.04473876953125, 0.0470123291015625, 0.049285888671875, 0.0515594482421875, 0.0538330078125, 0.0561065673828125, 0.058380126953125, 0.0606536865234375, 0.06292724609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 5.0, 12.0, 9.0, 14.0, 26.0, 47.0, 116.0, 201.0, 259.0, 121.0, 78.0, 39.0, 25.0, 22.0, 8.0, 9.0, 4.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4893340766429901, -0.4651179313659668, -0.44090181589126587, -0.41668567061424255, -0.39246952533721924, -0.3682534098625183, -0.344037264585495, -0.3198211193084717, -0.29560500383377075, -0.27138885855674744, -0.2471727430820465, -0.2229565978050232, -0.19874046742916107, -0.17452433705329895, -0.15030819177627563, -0.1260920614004135, -0.10187593102455139, -0.07765980064868927, -0.05344366282224655, -0.029227524995803833, -0.005011394619941711, 0.01920473575592041, 0.043420881032943726, 0.06763701140880585, 0.09185314178466797, 0.11606927216053009, 0.1402854025363922, 0.16450154781341553, 0.18871767818927765, 0.21293380856513977, 0.23714995384216309, 0.261366069316864, 0.28558218479156494, 0.30979833006858826, 0.3340144455432892, 0.3582305908203125, 0.3824467062950134, 0.40666285157203674, 0.43087899684906006, 0.455095112323761, 0.4793112576007843, 0.5035274028778076, 0.5277435183525085, 0.5519596338272095, 0.5761758089065552, 0.6003919243812561, 0.624608039855957, 0.6488242149353027, 0.6730403304100037, 0.6972564458847046, 0.7214726209640503, 0.7456887364387512, 0.7699048519134521, 0.7941210269927979, 0.8183371424674988, 0.8425532579421997, 0.8667694330215454, 0.8909855484962463, 0.915201723575592, 0.939417839050293, 0.9636339545249939, 0.9878500699996948, 1.0120662450790405, 1.0362824201583862, 1.0604984760284424]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 3.0, 5.0, 3.0, 11.0, 7.0, 9.0, 20.0, 11.0, 26.0, 23.0, 30.0, 25.0, 33.0, 39.0, 31.0, 51.0, 44.0, 64.0, 45.0, 59.0, 49.0, 42.0, 29.0, 39.0, 39.0, 43.0, 41.0, 32.0, 25.0, 19.0, 17.0, 20.0, 16.0, 13.0, 9.0, 7.0, 3.0, 2.0, 5.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.31900107860565186, -0.3084261119365692, -0.2978511452674866, -0.2872762084007263, -0.2767012417316437, -0.26612627506256104, -0.2555513083934784, -0.24497634172439575, -0.2344013750553131, -0.22382640838623047, -0.21325145661830902, -0.20267648994922638, -0.19210152328014374, -0.1815265715122223, -0.17095160484313965, -0.160376638174057, -0.14980168640613556, -0.13922671973705292, -0.12865176796913147, -0.11807680130004883, -0.10750183463096619, -0.09692687541246414, -0.0863519161939621, -0.07577694952487946, -0.06520199030637741, -0.05462702736258507, -0.044052064418792725, -0.03347710520029068, -0.022902142256498337, -0.012327179312705994, -0.001752220094203949, 0.008822746574878693, 0.019397705793380737, 0.02997266873717308, 0.040547631680965424, 0.05112259089946747, 0.06169755384325981, 0.07227251678705215, 0.0828474760055542, 0.09342244267463684, 0.10399740189313889, 0.11457236111164093, 0.12514732778072357, 0.13572227954864502, 0.14629724621772766, 0.1568722128868103, 0.16744717955589294, 0.17802214622497559, 0.18859709799289703, 0.19917206466197968, 0.20974701642990112, 0.22032198309898376, 0.2308969497680664, 0.24147191643714905, 0.2520468831062317, 0.26262181997299194, 0.2731967866420746, 0.2837717533111572, 0.29434671998023987, 0.3049216866493225, 0.31549662351608276, 0.3260715901851654, 0.33664655685424805, 0.3472215235233307, 0.35779649019241333]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 9.0, 7.0, 11.0, 12.0, 14.0, 24.0, 36.0, 36.0, 56.0, 90.0, 127.0, 230.0, 349.0, 608.0, 1076.0, 2081.0, 4363.0, 11942.0, 78115.0, 886422.0, 45485.0, 9622.0, 3598.0, 1736.0, 943.0, 561.0, 337.0, 212.0, 147.0, 100.0, 66.0, 44.0, 28.0, 16.0, 12.0, 11.0, 6.0, 9.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.33447265625, -0.3244590759277344, -0.31444549560546875, -0.3044319152832031, -0.2944183349609375, -0.2844047546386719, -0.27439117431640625, -0.2643775939941406, -0.254364013671875, -0.24435043334960938, -0.23433685302734375, -0.22432327270507812, -0.2143096923828125, -0.20429611206054688, -0.19428253173828125, -0.18426895141601562, -0.17425537109375, -0.16424179077148438, -0.15422821044921875, -0.14421463012695312, -0.1342010498046875, -0.12418746948242188, -0.11417388916015625, -0.10416030883789062, -0.094146728515625, -0.08413314819335938, -0.07411956787109375, -0.06410598754882812, -0.0540924072265625, -0.044078826904296875, -0.03406524658203125, -0.024051666259765625, -0.0140380859375, -0.004024505615234375, 0.00598907470703125, 0.016002655029296875, 0.0260162353515625, 0.036029815673828125, 0.04604339599609375, 0.056056976318359375, 0.066070556640625, 0.07608413696289062, 0.08609771728515625, 0.09611129760742188, 0.1061248779296875, 0.11613845825195312, 0.12615203857421875, 0.13616561889648438, 0.14617919921875, 0.15619277954101562, 0.16620635986328125, 0.17621994018554688, 0.1862335205078125, 0.19624710083007812, 0.20626068115234375, 0.21627426147460938, 0.226287841796875, 0.23630142211914062, 0.24631500244140625, 0.2563285827636719, 0.2663421630859375, 0.2763557434082031, 0.28636932373046875, 0.2963829040527344, 0.306396484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 11.0, 6.0, 7.0, 12.0, 30.0, 85.0, 161.0, 248.0, 195.0, 118.0, 40.0, 29.0, 11.0, 6.0, 4.0, 2.0, 7.0, 3.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03973388671875, -0.038556575775146484, -0.03737926483154297, -0.03620195388793945, -0.03502464294433594, -0.03384733200073242, -0.032670021057128906, -0.03149271011352539, -0.030315399169921875, -0.02913808822631836, -0.027960777282714844, -0.026783466339111328, -0.025606155395507812, -0.024428844451904297, -0.02325153350830078, -0.022074222564697266, -0.02089691162109375, -0.019719600677490234, -0.01854228973388672, -0.017364978790283203, -0.016187667846679688, -0.015010356903076172, -0.013833045959472656, -0.01265573501586914, -0.011478424072265625, -0.01030111312866211, -0.009123802185058594, -0.007946491241455078, -0.0067691802978515625, -0.005591869354248047, -0.004414558410644531, -0.0032372474670410156, -0.0020599365234375, -0.0008826255798339844, 0.00029468536376953125, 0.0014719963073730469, 0.0026493072509765625, 0.003826618194580078, 0.005003929138183594, 0.006181240081787109, 0.007358551025390625, 0.00853586196899414, 0.009713172912597656, 0.010890483856201172, 0.012067794799804688, 0.013245105743408203, 0.014422416687011719, 0.015599727630615234, 0.01677703857421875, 0.017954349517822266, 0.01913166046142578, 0.020308971405029297, 0.021486282348632812, 0.022663593292236328, 0.023840904235839844, 0.02501821517944336, 0.026195526123046875, 0.02737283706665039, 0.028550148010253906, 0.029727458953857422, 0.030904769897460938, 0.03208208084106445, 0.03325939178466797, 0.034436702728271484, 0.035614013671875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 6.0, 7.0, 7.0, 13.0, 22.0, 30.0, 42.0, 62.0, 118.0, 243.0, 576.0, 1697.0, 7804.0, 76880.0, 886664.0, 64739.0, 6912.0, 1586.0, 554.0, 237.0, 134.0, 73.0, 48.0, 26.0, 19.0, 12.0, 9.0, 7.0, 7.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67236328125, -0.6516571044921875, -0.630950927734375, -0.6102447509765625, -0.58953857421875, -0.5688323974609375, -0.548126220703125, -0.5274200439453125, -0.5067138671875, -0.4860076904296875, -0.465301513671875, -0.4445953369140625, -0.42388916015625, -0.4031829833984375, -0.382476806640625, -0.3617706298828125, -0.341064453125, -0.3203582763671875, -0.299652099609375, -0.2789459228515625, -0.25823974609375, -0.2375335693359375, -0.216827392578125, -0.1961212158203125, -0.1754150390625, -0.1547088623046875, -0.134002685546875, -0.1132965087890625, -0.09259033203125, -0.0718841552734375, -0.051177978515625, -0.0304718017578125, -0.009765625, 0.0109405517578125, 0.031646728515625, 0.0523529052734375, 0.07305908203125, 0.0937652587890625, 0.114471435546875, 0.1351776123046875, 0.1558837890625, 0.1765899658203125, 0.197296142578125, 0.2180023193359375, 0.23870849609375, 0.2594146728515625, 0.280120849609375, 0.3008270263671875, 0.321533203125, 0.3422393798828125, 0.362945556640625, 0.3836517333984375, 0.40435791015625, 0.4250640869140625, 0.445770263671875, 0.4664764404296875, 0.4871826171875, 0.5078887939453125, 0.528594970703125, 0.5493011474609375, 0.57000732421875, 0.5907135009765625, 0.611419677734375, 0.6321258544921875, 0.65283203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 6.0, 4.0, 7.0, 13.0, 12.0, 10.0, 7.0, 12.0, 28.0, 18.0, 27.0, 16.0, 38.0, 30.0, 50.0, 42.0, 51.0, 55.0, 51.0, 36.0, 46.0, 48.0, 47.0, 40.0, 43.0, 33.0, 35.0, 39.0, 29.0, 17.0, 21.0, 17.0, 15.0, 9.0, 11.0, 9.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.2054443359375, -0.20029354095458984, -0.1951427459716797, -0.18999195098876953, -0.18484115600585938, -0.17969036102294922, -0.17453956604003906, -0.1693887710571289, -0.16423797607421875, -0.1590871810913086, -0.15393638610839844, -0.14878559112548828, -0.14363479614257812, -0.13848400115966797, -0.1333332061767578, -0.12818241119384766, -0.1230316162109375, -0.11788082122802734, -0.11273002624511719, -0.10757923126220703, -0.10242843627929688, -0.09727764129638672, -0.09212684631347656, -0.0869760513305664, -0.08182525634765625, -0.0766744613647461, -0.07152366638183594, -0.06637287139892578, -0.061222076416015625, -0.05607128143310547, -0.05092048645019531, -0.045769691467285156, -0.040618896484375, -0.035468101501464844, -0.030317306518554688, -0.02516651153564453, -0.020015716552734375, -0.014864921569824219, -0.009714126586914062, -0.004563331604003906, 0.00058746337890625, 0.005738258361816406, 0.010889053344726562, 0.01603984832763672, 0.021190643310546875, 0.02634143829345703, 0.03149223327636719, 0.036643028259277344, 0.0417938232421875, 0.046944618225097656, 0.05209541320800781, 0.05724620819091797, 0.062397003173828125, 0.06754779815673828, 0.07269859313964844, 0.0778493881225586, 0.08300018310546875, 0.0881509780883789, 0.09330177307128906, 0.09845256805419922, 0.10360336303710938, 0.10875415802001953, 0.11390495300292969, 0.11905574798583984, 0.12420654296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 8.0, 9.0, 13.0, 26.0, 23.0, 60.0, 128.0, 310.0, 1042.0, 11773.0, 1028123.0, 5763.0, 787.0, 257.0, 92.0, 48.0, 30.0, 24.0, 12.0, 4.0, 8.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3623046875, -1.310699462890625, -1.25909423828125, -1.207489013671875, -1.1558837890625, -1.104278564453125, -1.05267333984375, -1.001068115234375, -0.949462890625, -0.897857666015625, -0.84625244140625, -0.794647216796875, -0.7430419921875, -0.691436767578125, -0.63983154296875, -0.588226318359375, -0.53662109375, -0.485015869140625, -0.43341064453125, -0.381805419921875, -0.3302001953125, -0.278594970703125, -0.22698974609375, -0.175384521484375, -0.123779296875, -0.072174072265625, -0.02056884765625, 0.031036376953125, 0.0826416015625, 0.134246826171875, 0.18585205078125, 0.237457275390625, 0.2890625, 0.340667724609375, 0.39227294921875, 0.443878173828125, 0.4954833984375, 0.547088623046875, 0.59869384765625, 0.650299072265625, 0.701904296875, 0.753509521484375, 0.80511474609375, 0.856719970703125, 0.9083251953125, 0.959930419921875, 1.01153564453125, 1.063140869140625, 1.11474609375, 1.166351318359375, 1.21795654296875, 1.269561767578125, 1.3211669921875, 1.372772216796875, 1.42437744140625, 1.475982666015625, 1.527587890625, 1.579193115234375, 1.63079833984375, 1.682403564453125, 1.7340087890625, 1.785614013671875, 1.83721923828125, 1.888824462890625, 1.9404296875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 6.0, 9.0, 7.0, 12.0, 18.0, 19.0, 15.0, 40.0, 43.0, 50.0, 76.0, 88.0, 101.0, 121.0, 79.0, 88.0, 53.0, 50.0, 43.0, 17.0, 18.0, 13.0, 5.0, 11.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-2.390146255493164e-05, -2.3270025849342346e-05, -2.2638589143753052e-05, -2.2007152438163757e-05, -2.1375715732574463e-05, -2.074427902698517e-05, -2.0112842321395874e-05, -1.948140561580658e-05, -1.8849968910217285e-05, -1.821853220462799e-05, -1.7587095499038696e-05, -1.6955658793449402e-05, -1.6324222087860107e-05, -1.5692785382270813e-05, -1.5061348676681519e-05, -1.4429911971092224e-05, -1.379847526550293e-05, -1.3167038559913635e-05, -1.253560185432434e-05, -1.1904165148735046e-05, -1.1272728443145752e-05, -1.0641291737556458e-05, -1.0009855031967163e-05, -9.378418326377869e-06, -8.746981620788574e-06, -8.11554491519928e-06, -7.484108209609985e-06, -6.852671504020691e-06, -6.2212347984313965e-06, -5.589798092842102e-06, -4.958361387252808e-06, -4.326924681663513e-06, -3.6954879760742188e-06, -3.0640512704849243e-06, -2.43261456489563e-06, -1.8011778593063354e-06, -1.169741153717041e-06, -5.383044481277466e-07, 9.313225746154785e-08, 7.245689630508423e-07, 1.3560056686401367e-06, 1.987442374229431e-06, 2.6188790798187256e-06, 3.25031578540802e-06, 3.8817524909973145e-06, 4.513189196586609e-06, 5.144625902175903e-06, 5.776062607765198e-06, 6.407499313354492e-06, 7.038936018943787e-06, 7.670372724533081e-06, 8.301809430122375e-06, 8.93324613571167e-06, 9.564682841300964e-06, 1.0196119546890259e-05, 1.0827556252479553e-05, 1.1458992958068848e-05, 1.2090429663658142e-05, 1.2721866369247437e-05, 1.3353303074836731e-05, 1.3984739780426025e-05, 1.461617648601532e-05, 1.5247613191604614e-05, 1.587904989719391e-05, 1.6510486602783203e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 7.0, 12.0, 14.0, 26.0, 21.0, 34.0, 45.0, 69.0, 79.0, 129.0, 170.0, 274.0, 396.0, 635.0, 944.0, 1561.0, 2854.0, 5747.0, 14440.0, 66956.0, 748509.0, 165300.0, 23671.0, 7775.0, 3479.0, 1902.0, 1212.0, 723.0, 477.0, 331.0, 202.0, 164.0, 97.0, 87.0, 43.0, 38.0, 25.0, 25.0, 15.0, 14.0, 16.0, 9.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.278564453125, -0.27075958251953125, -0.2629547119140625, -0.25514984130859375, -0.247344970703125, -0.23954010009765625, -0.2317352294921875, -0.22393035888671875, -0.21612548828125, -0.20832061767578125, -0.2005157470703125, -0.19271087646484375, -0.184906005859375, -0.17710113525390625, -0.1692962646484375, -0.16149139404296875, -0.1536865234375, -0.14588165283203125, -0.1380767822265625, -0.13027191162109375, -0.122467041015625, -0.11466217041015625, -0.1068572998046875, -0.09905242919921875, -0.09124755859375, -0.08344268798828125, -0.0756378173828125, -0.06783294677734375, -0.060028076171875, -0.05222320556640625, -0.0444183349609375, -0.03661346435546875, -0.02880859375, -0.02100372314453125, -0.0131988525390625, -0.00539398193359375, 0.002410888671875, 0.01021575927734375, 0.0180206298828125, 0.02582550048828125, 0.03363037109375, 0.04143524169921875, 0.0492401123046875, 0.05704498291015625, 0.064849853515625, 0.07265472412109375, 0.0804595947265625, 0.08826446533203125, 0.0960693359375, 0.10387420654296875, 0.1116790771484375, 0.11948394775390625, 0.127288818359375, 0.13509368896484375, 0.1428985595703125, 0.15070343017578125, 0.15850830078125, 0.16631317138671875, 0.1741180419921875, 0.18192291259765625, 0.189727783203125, 0.19753265380859375, 0.2053375244140625, 0.21314239501953125, 0.220947265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 11.0, 30.0, 43.0, 71.0, 122.0, 226.0, 165.0, 110.0, 73.0, 45.0, 20.0, 16.0, 6.0, 11.0, 6.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2047119140625, -0.19680213928222656, -0.18889236450195312, -0.1809825897216797, -0.17307281494140625, -0.1651630401611328, -0.15725326538085938, -0.14934349060058594, -0.1414337158203125, -0.13352394104003906, -0.12561416625976562, -0.11770439147949219, -0.10979461669921875, -0.10188484191894531, -0.09397506713867188, -0.08606529235839844, -0.078155517578125, -0.07024574279785156, -0.062335968017578125, -0.05442619323730469, -0.04651641845703125, -0.03860664367675781, -0.030696868896484375, -0.022787094116210938, -0.0148773193359375, -0.0069675445556640625, 0.000942230224609375, 0.008852005004882812, 0.01676177978515625, 0.024671554565429688, 0.032581329345703125, 0.04049110412597656, 0.04840087890625, 0.05631065368652344, 0.06422042846679688, 0.07213020324707031, 0.08003997802734375, 0.08794975280761719, 0.09585952758789062, 0.10376930236816406, 0.1116790771484375, 0.11958885192871094, 0.12749862670898438, 0.1354084014892578, 0.14331817626953125, 0.1512279510498047, 0.15913772583007812, 0.16704750061035156, 0.174957275390625, 0.18286705017089844, 0.19077682495117188, 0.1986865997314453, 0.20659637451171875, 0.2145061492919922, 0.22241592407226562, 0.23032569885253906, 0.2382354736328125, 0.24614524841308594, 0.2540550231933594, 0.2619647979736328, 0.26987457275390625, 0.2777843475341797, 0.2856941223144531, 0.29360389709472656, 0.301513671875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 11.0, 10.0, 15.0, 59.0, 251.0, 422.0, 131.0, 50.0, 23.0, 13.0, 11.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.01239538192749, -3.870124340057373, -3.727853298187256, -3.5855822563171387, -3.4433112144470215, -3.3010401725769043, -3.158769130706787, -3.01649808883667, -2.8742270469665527, -2.7319560050964355, -2.5896849632263184, -2.447413921356201, -2.305142879486084, -2.162871837615967, -2.0206007957458496, -1.8783297538757324, -1.7360587120056152, -1.593787670135498, -1.4515166282653809, -1.3092455863952637, -1.1669745445251465, -1.0247035026550293, -0.8824324607849121, -0.7401614189147949, -0.5978903770446777, -0.45561933517456055, -0.31334829330444336, -0.17107725143432617, -0.028806209564208984, 0.1134648323059082, 0.2557358741760254, 0.3980069160461426, 0.540278434753418, 0.6825494766235352, 0.8248205184936523, 0.9670915603637695, 1.1093626022338867, 1.251633644104004, 1.393904685974121, 1.5361757278442383, 1.6784467697143555, 1.8207178115844727, 1.9629888534545898, 2.105259895324707, 2.247530937194824, 2.3898019790649414, 2.5320730209350586, 2.674344062805176, 2.816615104675293, 2.95888614654541, 3.1011571884155273, 3.2434282302856445, 3.3856992721557617, 3.527970314025879, 3.670241355895996, 3.8125123977661133, 3.9547834396362305, 4.097054481506348, 4.239325523376465, 4.381596565246582, 4.523867607116699, 4.666138648986816, 4.808409690856934, 4.950680732727051, 5.092951774597168]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 1.0, 3.0, 13.0, 12.0, 20.0, 30.0, 57.0, 101.0, 184.0, 210.0, 140.0, 101.0, 47.0, 20.0, 18.0, 11.0, 6.0, 4.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.699883460998535, -3.581669807434082, -3.463456153869629, -3.345242500305176, -3.2270288467407227, -3.1088151931762695, -2.9906015396118164, -2.8723878860473633, -2.75417423248291, -2.635960578918457, -2.517746925354004, -2.399533271789551, -2.2813196182250977, -2.1631059646606445, -2.0448923110961914, -1.9266787767410278, -1.8084652423858643, -1.6902515888214111, -1.572037935256958, -1.4538242816925049, -1.3356106281280518, -1.2173969745635986, -1.099183440208435, -0.9809697866439819, -0.8627561330795288, -0.7445424795150757, -0.6263288259506226, -0.5081152319908142, -0.3899015784263611, -0.27168792486190796, -0.1534743309020996, -0.035260677337646484, 0.08295297622680664, 0.20116661489009857, 0.3193802535533905, 0.43759387731552124, 0.5558075308799744, 0.6740211844444275, 0.7922347784042358, 0.910448431968689, 1.028662085533142, 1.1468757390975952, 1.2650893926620483, 1.383302927017212, 1.501516580581665, 1.6197302341461182, 1.7379438877105713, 1.8561575412750244, 1.9743711948394775, 2.0925848484039307, 2.210798501968384, 2.329012155532837, 2.44722580909729, 2.565439462661743, 2.683652877807617, 2.8018665313720703, 2.9200801849365234, 3.0382938385009766, 3.1565074920654297, 3.274721145629883, 3.392934799194336, 3.511148452758789, 3.629362106323242, 3.7475757598876953, 3.8657894134521484]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 5.0, 7.0, 12.0, 16.0, 23.0, 64.0, 172.0, 1648.0, 4039815.0, 150873.0, 1316.0, 179.0, 51.0, 28.0, 19.0, 10.0, 11.0, 9.0, 4.0, 2.0, 2.0, 3.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.71221923828125, -2.5885009765625, -2.46478271484375, -2.341064453125, -2.21734619140625, -2.0936279296875, -1.96990966796875, -1.84619140625, -1.72247314453125, -1.5987548828125, -1.47503662109375, -1.351318359375, -1.22760009765625, -1.1038818359375, -0.98016357421875, -0.8564453125, -0.73272705078125, -0.6090087890625, -0.48529052734375, -0.361572265625, -0.23785400390625, -0.1141357421875, 0.00958251953125, 0.13330078125, 0.25701904296875, 0.3807373046875, 0.50445556640625, 0.628173828125, 0.75189208984375, 0.8756103515625, 0.99932861328125, 1.123046875, 1.24676513671875, 1.3704833984375, 1.49420166015625, 1.617919921875, 1.74163818359375, 1.8653564453125, 1.98907470703125, 2.11279296875, 2.23651123046875, 2.3602294921875, 2.48394775390625, 2.607666015625, 2.73138427734375, 2.8551025390625, 2.97882080078125, 3.1025390625, 3.22625732421875, 3.3499755859375, 3.47369384765625, 3.597412109375, 3.72113037109375, 3.8448486328125, 3.96856689453125, 4.09228515625, 4.21600341796875, 4.3397216796875, 4.46343994140625, 4.587158203125, 4.71087646484375, 4.8345947265625, 4.95831298828125, 5.08203125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 0.0, 6.0, 5.0, 8.0, 7.0, 13.0, 13.0, 19.0, 29.0, 60.0, 80.0, 98.0, 127.0, 147.0, 121.0, 86.0, 67.0, 31.0, 17.0, 14.0, 11.0, 6.0, 3.0, 6.0, 2.0, 5.0, 2.0, 1.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0295562744140625, -0.028656959533691406, -0.027757644653320312, -0.02685832977294922, -0.025959014892578125, -0.02505970001220703, -0.024160385131835938, -0.023261070251464844, -0.02236175537109375, -0.021462440490722656, -0.020563125610351562, -0.01966381072998047, -0.018764495849609375, -0.01786518096923828, -0.016965866088867188, -0.016066551208496094, -0.015167236328125, -0.014267921447753906, -0.013368606567382812, -0.012469291687011719, -0.011569976806640625, -0.010670661926269531, -0.009771347045898438, -0.008872032165527344, -0.00797271728515625, -0.007073402404785156, -0.0061740875244140625, -0.005274772644042969, -0.004375457763671875, -0.0034761428833007812, -0.0025768280029296875, -0.0016775131225585938, -0.0007781982421875, 0.00012111663818359375, 0.0010204315185546875, 0.0019197463989257812, 0.002819061279296875, 0.0037183761596679688, 0.0046176910400390625, 0.005517005920410156, 0.00641632080078125, 0.007315635681152344, 0.008214950561523438, 0.009114265441894531, 0.010013580322265625, 0.010912895202636719, 0.011812210083007812, 0.012711524963378906, 0.01361083984375, 0.014510154724121094, 0.015409469604492188, 0.01630878448486328, 0.017208099365234375, 0.01810741424560547, 0.019006729125976562, 0.019906044006347656, 0.02080535888671875, 0.021704673767089844, 0.022603988647460938, 0.02350330352783203, 0.024402618408203125, 0.02530193328857422, 0.026201248168945312, 0.027100563049316406, 0.0279998779296875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 8.0, 26.0, 19.0, 42.0, 54.0, 103.0, 174.0, 408.0, 964.0, 2701.0, 9447.0, 53191.0, 3809455.0, 289487.0, 20720.0, 4973.0, 1563.0, 535.0, 206.0, 82.0, 50.0, 24.0, 12.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.009765625, -0.9866905212402344, -0.9636154174804688, -0.9405403137207031, -0.9174652099609375, -0.8943901062011719, -0.8713150024414062, -0.8482398986816406, -0.825164794921875, -0.8020896911621094, -0.7790145874023438, -0.7559394836425781, -0.7328643798828125, -0.7097892761230469, -0.6867141723632812, -0.6636390686035156, -0.64056396484375, -0.6174888610839844, -0.5944137573242188, -0.5713386535644531, -0.5482635498046875, -0.5251884460449219, -0.5021133422851562, -0.4790382385253906, -0.455963134765625, -0.4328880310058594, -0.40981292724609375, -0.3867378234863281, -0.3636627197265625, -0.3405876159667969, -0.31751251220703125, -0.2944374084472656, -0.2713623046875, -0.24828720092773438, -0.22521209716796875, -0.20213699340820312, -0.1790618896484375, -0.15598678588867188, -0.13291168212890625, -0.10983657836914062, -0.086761474609375, -0.06368637084960938, -0.04061126708984375, -0.017536163330078125, 0.0055389404296875, 0.028614044189453125, 0.05168914794921875, 0.07476425170898438, 0.09783935546875, 0.12091445922851562, 0.14398956298828125, 0.16706466674804688, 0.1901397705078125, 0.21321487426757812, 0.23628997802734375, 0.2593650817871094, 0.282440185546875, 0.3055152893066406, 0.32859039306640625, 0.3516654968261719, 0.3747406005859375, 0.3978157043457031, 0.42089080810546875, 0.4439659118652344, 0.467041015625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 5.0, 4.0, 6.0, 0.0, 8.0, 10.0, 13.0, 17.0, 24.0, 32.0, 46.0, 77.0, 141.0, 392.0, 1618.0, 930.0, 280.0, 148.0, 80.0, 63.0, 33.0, 35.0, 23.0, 8.0, 10.0, 10.0, 7.0, 9.0, 8.0, 8.0, 5.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.056396484375, -0.054781436920166016, -0.05316638946533203, -0.05155134201049805, -0.04993629455566406, -0.04832124710083008, -0.046706199645996094, -0.04509115219116211, -0.043476104736328125, -0.04186105728149414, -0.040246009826660156, -0.03863096237182617, -0.03701591491699219, -0.0354008674621582, -0.03378582000732422, -0.032170772552490234, -0.03055572509765625, -0.028940677642822266, -0.02732563018798828, -0.025710582733154297, -0.024095535278320312, -0.022480487823486328, -0.020865440368652344, -0.01925039291381836, -0.017635345458984375, -0.01602029800415039, -0.014405250549316406, -0.012790203094482422, -0.011175155639648438, -0.009560108184814453, -0.007945060729980469, -0.006330013275146484, -0.0047149658203125, -0.0030999183654785156, -0.0014848709106445312, 0.00013017654418945312, 0.0017452239990234375, 0.003360271453857422, 0.004975318908691406, 0.006590366363525391, 0.008205413818359375, 0.00982046127319336, 0.011435508728027344, 0.013050556182861328, 0.014665603637695312, 0.016280651092529297, 0.01789569854736328, 0.019510746002197266, 0.02112579345703125, 0.022740840911865234, 0.02435588836669922, 0.025970935821533203, 0.027585983276367188, 0.029201030731201172, 0.030816078186035156, 0.03243112564086914, 0.034046173095703125, 0.03566122055053711, 0.037276268005371094, 0.03889131546020508, 0.04050636291503906, 0.04212141036987305, 0.04373645782470703, 0.045351505279541016, 0.046966552734375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 23.0, 582.0, 393.0, 12.0, 4.0], "bins": [-5.504264831542969, -5.414007186889648, -5.323750019073486, -5.233492374420166, -5.143235206604004, -5.052977561950684, -4.9627203941345215, -4.872462749481201, -4.782205581665039, -4.691947937011719, -4.601690769195557, -4.511433124542236, -4.421175956726074, -4.330918312072754, -4.240661144256592, -4.1504034996032715, -4.060146331787109, -3.969888925552368, -3.879631519317627, -3.7893741130828857, -3.6991167068481445, -3.6088593006134033, -3.518601894378662, -3.428344249725342, -3.3380866050720215, -3.2478291988372803, -3.157571792602539, -3.067314386367798, -2.9770569801330566, -2.8867995738983154, -2.796542167663574, -2.706284523010254, -2.6160271167755127, -2.5257697105407715, -2.4355123043060303, -2.345254898071289, -2.254997491836548, -2.1647400856018066, -2.0744824409484863, -1.9842251539230347, -1.893967866897583, -1.8037104606628418, -1.7134530544281006, -1.6231956481933594, -1.5329382419586182, -1.442680835723877, -1.3524233102798462, -1.262165904045105, -1.1719083786010742, -1.081650972366333, -0.9913935661315918, -0.9011361002922058, -0.8108786940574646, -0.7206212878227234, -0.6303638219833374, -0.5401064157485962, -0.44984906911849976, -0.35959166288375854, -0.26933422684669495, -0.17907679080963135, -0.08881938457489014, 0.0014380216598510742, 0.09169548749923706, 0.18195289373397827, 0.2722102999687195]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 7.0, 1.0, 6.0, 10.0, 12.0, 27.0, 45.0, 64.0, 105.0, 128.0, 143.0, 119.0, 104.0, 74.0, 57.0, 34.0, 19.0, 10.0, 8.0, 6.0, 3.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3847852945327759, -0.37370383739471436, -0.36262235045433044, -0.3515408933162689, -0.340459406375885, -0.3293779492378235, -0.31829649209976196, -0.30721500515937805, -0.29613354802131653, -0.285052090883255, -0.2739706039428711, -0.26288914680480957, -0.25180765986442566, -0.24072620272636414, -0.22964473068714142, -0.2185632586479187, -0.20748178660869598, -0.19640031456947327, -0.18531884253025055, -0.17423737049102783, -0.1631559133529663, -0.1520744413137436, -0.14099296927452087, -0.12991151213645935, -0.11883003264665604, -0.10774856060743332, -0.0966670960187912, -0.08558562397956848, -0.07450415194034576, -0.06342268735170364, -0.052341215312480927, -0.041259750723838806, -0.03017827868461609, -0.01909681037068367, -0.008015340194106102, 0.003066129982471466, 0.014147598296403885, 0.025229066610336304, 0.03631053864955902, 0.04739200323820114, 0.05847347527742386, 0.06955494731664658, 0.0806364119052887, 0.09171788394451141, 0.10279935598373413, 0.11388082057237625, 0.12496229261159897, 0.1360437572002411, 0.1471252292394638, 0.15820670127868652, 0.16928817331790924, 0.18036964535713196, 0.19145110249519348, 0.2025325745344162, 0.21361404657363892, 0.22469550371170044, 0.23577699065208435, 0.24685846269130707, 0.2579399347305298, 0.2690213918685913, 0.2801028788089752, 0.29118433594703674, 0.30226582288742065, 0.3133472800254822, 0.3244287371635437]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 7.0, 6.0, 10.0, 8.0, 23.0, 29.0, 44.0, 81.0, 96.0, 158.0, 237.0, 348.0, 539.0, 825.0, 1350.0, 2150.0, 3789.0, 6618.0, 12405.0, 27804.0, 76294.0, 292975.0, 445727.0, 106608.0, 35804.0, 15531.0, 7838.0, 4426.0, 2475.0, 1554.0, 952.0, 630.0, 417.0, 268.0, 185.0, 106.0, 71.0, 57.0, 47.0, 19.0, 19.0, 12.0, 9.0, 7.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1591796875, -0.15437698364257812, -0.14957427978515625, -0.14477157592773438, -0.1399688720703125, -0.13516616821289062, -0.13036346435546875, -0.12556076049804688, -0.120758056640625, -0.11595535278320312, -0.11115264892578125, -0.10634994506835938, -0.1015472412109375, -0.09674453735351562, -0.09194183349609375, -0.08713912963867188, -0.08233642578125, -0.07753372192382812, -0.07273101806640625, -0.06792831420898438, -0.0631256103515625, -0.058322906494140625, -0.05352020263671875, -0.048717498779296875, -0.043914794921875, -0.039112091064453125, -0.03430938720703125, -0.029506683349609375, -0.0247039794921875, -0.019901275634765625, -0.01509857177734375, -0.010295867919921875, -0.0054931640625, -0.000690460205078125, 0.00411224365234375, 0.008914947509765625, 0.0137176513671875, 0.018520355224609375, 0.02332305908203125, 0.028125762939453125, 0.032928466796875, 0.037731170654296875, 0.04253387451171875, 0.047336578369140625, 0.0521392822265625, 0.056941986083984375, 0.06174468994140625, 0.06654739379882812, 0.07135009765625, 0.07615280151367188, 0.08095550537109375, 0.08575820922851562, 0.0905609130859375, 0.09536361694335938, 0.10016632080078125, 0.10496902465820312, 0.109771728515625, 0.11457443237304688, 0.11937713623046875, 0.12417984008789062, 0.1289825439453125, 0.13378524780273438, 0.13858795166015625, 0.14339065551757812, 0.148193359375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 3.0, 5.0, 4.0, 1.0, 6.0, 0.0, 9.0, 8.0, 13.0, 11.0, 13.0, 19.0, 32.0, 46.0, 43.0, 63.0, 74.0, 83.0, 78.0, 80.0, 84.0, 52.0, 48.0, 60.0, 41.0, 32.0, 19.0, 12.0, 10.0, 12.0, 8.0, 9.0, 2.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0170745849609375, -0.01655292510986328, -0.016031265258789062, -0.015509605407714844, -0.014987945556640625, -0.014466285705566406, -0.013944625854492188, -0.013422966003417969, -0.01290130615234375, -0.012379646301269531, -0.011857986450195312, -0.011336326599121094, -0.010814666748046875, -0.010293006896972656, -0.009771347045898438, -0.009249687194824219, -0.00872802734375, -0.008206367492675781, -0.0076847076416015625, -0.007163047790527344, -0.006641387939453125, -0.006119728088378906, -0.0055980682373046875, -0.005076408386230469, -0.00455474853515625, -0.004033088684082031, -0.0035114288330078125, -0.0029897689819335938, -0.002468109130859375, -0.0019464492797851562, -0.0014247894287109375, -0.0009031295776367188, -0.0003814697265625, 0.00014019012451171875, 0.0006618499755859375, 0.0011835098266601562, 0.001705169677734375, 0.0022268295288085938, 0.0027484893798828125, 0.0032701492309570312, 0.00379180908203125, 0.004313468933105469, 0.0048351287841796875, 0.005356788635253906, 0.005878448486328125, 0.006400108337402344, 0.0069217681884765625, 0.007443428039550781, 0.007965087890625, 0.008486747741699219, 0.009008407592773438, 0.009530067443847656, 0.010051727294921875, 0.010573387145996094, 0.011095046997070312, 0.011616706848144531, 0.01213836669921875, 0.012660026550292969, 0.013181686401367188, 0.013703346252441406, 0.014225006103515625, 0.014746665954589844, 0.015268325805664062, 0.01578998565673828, 0.0163116455078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 1.0, 2.0, 6.0, 3.0, 2.0, 3.0, 2.0, 5.0, 7.0, 9.0, 24.0, 86.0, 831.0, 24777.0, 969591.0, 51712.0, 1303.0, 109.0, 34.0, 9.0, 7.0, 3.0, 7.0, 4.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.523406982421875, -0.49798583984375, -0.472564697265625, -0.4471435546875, -0.421722412109375, -0.39630126953125, -0.370880126953125, -0.345458984375, -0.320037841796875, -0.29461669921875, -0.269195556640625, -0.2437744140625, -0.218353271484375, -0.19293212890625, -0.167510986328125, -0.14208984375, -0.116668701171875, -0.09124755859375, -0.065826416015625, -0.0404052734375, -0.014984130859375, 0.01043701171875, 0.035858154296875, 0.061279296875, 0.086700439453125, 0.11212158203125, 0.137542724609375, 0.1629638671875, 0.188385009765625, 0.21380615234375, 0.239227294921875, 0.2646484375, 0.290069580078125, 0.31549072265625, 0.340911865234375, 0.3663330078125, 0.391754150390625, 0.41717529296875, 0.442596435546875, 0.468017578125, 0.493438720703125, 0.51885986328125, 0.544281005859375, 0.5697021484375, 0.595123291015625, 0.62054443359375, 0.645965576171875, 0.67138671875, 0.696807861328125, 0.72222900390625, 0.747650146484375, 0.7730712890625, 0.798492431640625, 0.82391357421875, 0.849334716796875, 0.874755859375, 0.900177001953125, 0.92559814453125, 0.951019287109375, 0.9764404296875, 1.001861572265625, 1.02728271484375, 1.052703857421875, 1.078125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 1.0, 6.0, 7.0, 6.0, 5.0, 11.0, 10.0, 18.0, 15.0, 19.0, 18.0, 29.0, 15.0, 25.0, 37.0, 33.0, 33.0, 42.0, 28.0, 36.0, 46.0, 44.0, 41.0, 45.0, 30.0, 41.0, 43.0, 46.0, 32.0, 40.0, 27.0, 25.0, 26.0, 26.0, 14.0, 13.0, 15.0, 8.0, 11.0, 11.0, 7.0, 7.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.079833984375, -0.07739734649658203, -0.07496070861816406, -0.0725240707397461, -0.07008743286132812, -0.06765079498291016, -0.06521415710449219, -0.06277751922607422, -0.06034088134765625, -0.05790424346923828, -0.05546760559082031, -0.053030967712402344, -0.050594329833984375, -0.048157691955566406, -0.04572105407714844, -0.04328441619873047, -0.0408477783203125, -0.03841114044189453, -0.03597450256347656, -0.033537864685058594, -0.031101226806640625, -0.028664588928222656, -0.026227951049804688, -0.02379131317138672, -0.02135467529296875, -0.01891803741455078, -0.016481399536132812, -0.014044761657714844, -0.011608123779296875, -0.009171485900878906, -0.0067348480224609375, -0.004298210144042969, -0.001861572265625, 0.0005750656127929688, 0.0030117034912109375, 0.005448341369628906, 0.007884979248046875, 0.010321617126464844, 0.012758255004882812, 0.015194892883300781, 0.01763153076171875, 0.02006816864013672, 0.022504806518554688, 0.024941444396972656, 0.027378082275390625, 0.029814720153808594, 0.03225135803222656, 0.03468799591064453, 0.0371246337890625, 0.03956127166748047, 0.04199790954589844, 0.044434547424316406, 0.046871185302734375, 0.049307823181152344, 0.05174446105957031, 0.05418109893798828, 0.05661773681640625, 0.05905437469482422, 0.06149101257324219, 0.06392765045166016, 0.06636428833007812, 0.0688009262084961, 0.07123756408691406, 0.07367420196533203, 0.07611083984375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 5.0, 4.0, 9.0, 12.0, 17.0, 43.0, 175.0, 1856.0, 1031695.0, 14203.0, 382.0, 81.0, 23.0, 17.0, 10.0, 8.0, 8.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.12890625, -2.075286865234375, -2.02166748046875, -1.968048095703125, -1.9144287109375, -1.860809326171875, -1.80718994140625, -1.753570556640625, -1.699951171875, -1.646331787109375, -1.59271240234375, -1.539093017578125, -1.4854736328125, -1.431854248046875, -1.37823486328125, -1.324615478515625, -1.27099609375, -1.217376708984375, -1.16375732421875, -1.110137939453125, -1.0565185546875, -1.002899169921875, -0.94927978515625, -0.895660400390625, -0.842041015625, -0.788421630859375, -0.73480224609375, -0.681182861328125, -0.6275634765625, -0.573944091796875, -0.52032470703125, -0.466705322265625, -0.4130859375, -0.359466552734375, -0.30584716796875, -0.252227783203125, -0.1986083984375, -0.144989013671875, -0.09136962890625, -0.037750244140625, 0.015869140625, 0.069488525390625, 0.12310791015625, 0.176727294921875, 0.2303466796875, 0.283966064453125, 0.33758544921875, 0.391204833984375, 0.44482421875, 0.498443603515625, 0.55206298828125, 0.605682373046875, 0.6593017578125, 0.712921142578125, 0.76654052734375, 0.820159912109375, 0.873779296875, 0.927398681640625, 0.98101806640625, 1.034637451171875, 1.0882568359375, 1.141876220703125, 1.19549560546875, 1.249114990234375, 1.302734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 10.0, 14.0, 20.0, 21.0, 53.0, 142.0, 335.0, 211.0, 78.0, 35.0, 25.0, 10.0, 10.0, 4.0, 7.0, 0.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.679794311523438e-05, -9.392388164997101e-05, -9.104982018470764e-05, -8.817575871944427e-05, -8.530169725418091e-05, -8.242763578891754e-05, -7.955357432365417e-05, -7.667951285839081e-05, -7.380545139312744e-05, -7.093138992786407e-05, -6.805732846260071e-05, -6.518326699733734e-05, -6.230920553207397e-05, -5.943514406681061e-05, -5.656108260154724e-05, -5.3687021136283875e-05, -5.081295967102051e-05, -4.793889820575714e-05, -4.5064836740493774e-05, -4.219077527523041e-05, -3.931671380996704e-05, -3.6442652344703674e-05, -3.356859087944031e-05, -3.069452941417694e-05, -2.7820467948913574e-05, -2.4946406483650208e-05, -2.207234501838684e-05, -1.9198283553123474e-05, -1.6324222087860107e-05, -1.345016062259674e-05, -1.0576099157333374e-05, -7.702037692070007e-06, -4.827976226806641e-06, -1.953914761543274e-06, 9.201467037200928e-07, 3.7942081689834595e-06, 6.668269634246826e-06, 9.542331099510193e-06, 1.241639256477356e-05, 1.5290454030036926e-05, 1.8164515495300293e-05, 2.103857696056366e-05, 2.3912638425827026e-05, 2.6786699891090393e-05, 2.966076135635376e-05, 3.2534822821617126e-05, 3.540888428688049e-05, 3.828294575214386e-05, 4.1157007217407227e-05, 4.403106868267059e-05, 4.690513014793396e-05, 4.977919161319733e-05, 5.265325307846069e-05, 5.552731454372406e-05, 5.840137600898743e-05, 6.12754374742508e-05, 6.414949893951416e-05, 6.702356040477753e-05, 6.98976218700409e-05, 7.277168333530426e-05, 7.564574480056763e-05, 7.8519806265831e-05, 8.139386773109436e-05, 8.426792919635773e-05, 8.71419906616211e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 12.0, 5.0, 14.0, 21.0, 28.0, 36.0, 64.0, 93.0, 166.0, 268.0, 473.0, 883.0, 2018.0, 5160.0, 16673.0, 73675.0, 505068.0, 368448.0, 54522.0, 13125.0, 4251.0, 1725.0, 768.0, 401.0, 255.0, 145.0, 90.0, 55.0, 35.0, 21.0, 15.0, 12.0, 12.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2310791015625, -0.22446060180664062, -0.21784210205078125, -0.21122360229492188, -0.2046051025390625, -0.19798660278320312, -0.19136810302734375, -0.18474960327148438, -0.178131103515625, -0.17151260375976562, -0.16489410400390625, -0.15827560424804688, -0.1516571044921875, -0.14503860473632812, -0.13842010498046875, -0.13180160522460938, -0.12518310546875, -0.11856460571289062, -0.11194610595703125, -0.10532760620117188, -0.0987091064453125, -0.09209060668945312, -0.08547210693359375, -0.07885360717773438, -0.072235107421875, -0.06561660766601562, -0.05899810791015625, -0.052379608154296875, -0.0457611083984375, -0.039142608642578125, -0.03252410888671875, -0.025905609130859375, -0.019287109375, -0.012668609619140625, -0.00605010986328125, 0.000568389892578125, 0.0071868896484375, 0.013805389404296875, 0.02042388916015625, 0.027042388916015625, 0.033660888671875, 0.040279388427734375, 0.04689788818359375, 0.053516387939453125, 0.0601348876953125, 0.06675338745117188, 0.07337188720703125, 0.07999038696289062, 0.08660888671875, 0.09322738647460938, 0.09984588623046875, 0.10646438598632812, 0.1130828857421875, 0.11970138549804688, 0.12631988525390625, 0.13293838500976562, 0.139556884765625, 0.14617538452148438, 0.15279388427734375, 0.15941238403320312, 0.1660308837890625, 0.17264938354492188, 0.17926788330078125, 0.18588638305664062, 0.1925048828125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 5.0, 11.0, 10.0, 19.0, 37.0, 38.0, 42.0, 76.0, 116.0, 132.0, 140.0, 103.0, 78.0, 56.0, 37.0, 39.0, 22.0, 12.0, 7.0, 8.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1575927734375, -0.1531238555908203, -0.14865493774414062, -0.14418601989746094, -0.13971710205078125, -0.13524818420410156, -0.13077926635742188, -0.1263103485107422, -0.1218414306640625, -0.11737251281738281, -0.11290359497070312, -0.10843467712402344, -0.10396575927734375, -0.09949684143066406, -0.09502792358398438, -0.09055900573730469, -0.086090087890625, -0.08162117004394531, -0.07715225219726562, -0.07268333435058594, -0.06821441650390625, -0.06374549865722656, -0.059276580810546875, -0.05480766296386719, -0.0503387451171875, -0.04586982727050781, -0.041400909423828125, -0.03693199157714844, -0.03246307373046875, -0.027994155883789062, -0.023525238037109375, -0.019056320190429688, -0.01458740234375, -0.010118484497070312, -0.005649566650390625, -0.0011806488037109375, 0.00328826904296875, 0.0077571868896484375, 0.012226104736328125, 0.016695022583007812, 0.0211639404296875, 0.025632858276367188, 0.030101776123046875, 0.03457069396972656, 0.03903961181640625, 0.04350852966308594, 0.047977447509765625, 0.05244636535644531, 0.056915283203125, 0.06138420104980469, 0.06585311889648438, 0.07032203674316406, 0.07479095458984375, 0.07925987243652344, 0.08372879028320312, 0.08819770812988281, 0.0926666259765625, 0.09713554382324219, 0.10160446166992188, 0.10607337951660156, 0.11054229736328125, 0.11501121520996094, 0.11948013305664062, 0.12394905090332031, 0.12841796875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 6.0, 15.0, 35.0, 47.0, 158.0, 323.0, 230.0, 105.0, 41.0, 15.0, 8.0, 11.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8318114280700684, -1.7755467891693115, -1.7192820310592651, -1.6630172729492188, -1.606752634048462, -1.550487995147705, -1.4942232370376587, -1.4379584789276123, -1.3816938400268555, -1.3254292011260986, -1.2691644430160522, -1.2128996849060059, -1.156635046005249, -1.1003704071044922, -1.0441056489944458, -0.9878409504890442, -0.9315762519836426, -0.875311553478241, -0.8190468549728394, -0.7627821564674377, -0.7065174579620361, -0.6502527594566345, -0.5939880609512329, -0.5377233624458313, -0.4814586639404297, -0.4251939654350281, -0.36892926692962646, -0.31266456842422485, -0.25639986991882324, -0.20013517141342163, -0.14387047290802002, -0.08760577440261841, -0.03134119510650635, 0.024923503398895264, 0.08118820190429688, 0.1374529004096985, 0.1937175989151001, 0.2499822974205017, 0.3062469959259033, 0.36251169443130493, 0.41877639293670654, 0.47504109144210815, 0.5313057899475098, 0.5875704884529114, 0.643835186958313, 0.7000998854637146, 0.7563645839691162, 0.8126292824745178, 0.8688939809799194, 0.925158679485321, 0.9814233779907227, 1.0376880168914795, 1.0939527750015259, 1.1502175331115723, 1.206482172012329, 1.262746810913086, 1.3190115690231323, 1.3752763271331787, 1.4315409660339355, 1.4878056049346924, 1.5440703630447388, 1.6003351211547852, 1.656599760055542, 1.7128643989562988, 1.7691291570663452]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 5.0, 3.0, 5.0, 5.0, 16.0, 13.0, 18.0, 25.0, 38.0, 47.0, 55.0, 63.0, 75.0, 82.0, 75.0, 74.0, 75.0, 53.0, 56.0, 54.0, 28.0, 25.0, 22.0, 19.0, 11.0, 10.0, 10.0, 7.0, 3.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9033595323562622, -0.8758248686790466, -0.848290205001831, -0.8207556009292603, -0.7932209372520447, -0.7656862735748291, -0.7381516098976135, -0.710616946220398, -0.6830823421478271, -0.6555476784706116, -0.628013014793396, -0.6004784107208252, -0.5729437470436096, -0.545409083366394, -0.5178744196891785, -0.4903397560119629, -0.4628050923347473, -0.43527042865753174, -0.40773579478263855, -0.380201131105423, -0.3526664972305298, -0.3251318335533142, -0.29759716987609863, -0.27006250619888306, -0.24252787232398987, -0.21499322354793549, -0.1874585747718811, -0.15992391109466553, -0.13238926231861115, -0.10485461354255676, -0.07731994986534119, -0.049785301089286804, -0.022250711917877197, 0.0052839405834674835, 0.032818593084812164, 0.060353249311447144, 0.08788789808750153, 0.11542254686355591, 0.14295721054077148, 0.17049185931682587, 0.19802650809288025, 0.22556115686893463, 0.253095805644989, 0.2806304693222046, 0.30816513299942017, 0.33569976687431335, 0.36323443055152893, 0.3907690644264221, 0.4183037281036377, 0.44583839178085327, 0.47337302565574646, 0.5009076595306396, 0.5284423232078552, 0.5559769868850708, 0.5835116505622864, 0.611046314239502, 0.6385809183120728, 0.6661155819892883, 0.6936502456665039, 0.7211848497390747, 0.7487195134162903, 0.7762541770935059, 0.8037888407707214, 0.831323504447937, 0.8588581681251526]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 4.0, 8.0, 16.0, 12.0, 33.0, 49.0, 159.0, 2122.0, 3693807.0, 496830.0, 1054.0, 45.0, 33.0, 14.0, 14.0, 24.0, 16.0, 8.0, 10.0, 4.0, 6.0, 4.0, 6.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1328125, -2.050689697265625, -1.96856689453125, -1.886444091796875, -1.8043212890625, -1.722198486328125, -1.64007568359375, -1.557952880859375, -1.475830078125, -1.393707275390625, -1.31158447265625, -1.229461669921875, -1.1473388671875, -1.065216064453125, -0.98309326171875, -0.900970458984375, -0.81884765625, -0.736724853515625, -0.65460205078125, -0.572479248046875, -0.4903564453125, -0.408233642578125, -0.32611083984375, -0.243988037109375, -0.161865234375, -0.079742431640625, 0.00238037109375, 0.084503173828125, 0.1666259765625, 0.248748779296875, 0.33087158203125, 0.412994384765625, 0.4951171875, 0.577239990234375, 0.65936279296875, 0.741485595703125, 0.8236083984375, 0.905731201171875, 0.98785400390625, 1.069976806640625, 1.152099609375, 1.234222412109375, 1.31634521484375, 1.398468017578125, 1.4805908203125, 1.562713623046875, 1.64483642578125, 1.726959228515625, 1.80908203125, 1.891204833984375, 1.97332763671875, 2.055450439453125, 2.1375732421875, 2.219696044921875, 2.30181884765625, 2.383941650390625, 2.466064453125, 2.548187255859375, 2.63031005859375, 2.712432861328125, 2.7945556640625, 2.876678466796875, 2.95880126953125, 3.040924072265625, 3.123046875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 1.0, 3.0, 8.0, 6.0, 10.0, 12.0, 19.0, 18.0, 31.0, 35.0, 43.0, 44.0, 68.0, 61.0, 60.0, 74.0, 77.0, 65.0, 57.0, 54.0, 52.0, 50.0, 38.0, 24.0, 10.0, 10.0, 14.0, 9.0, 8.0, 10.0, 7.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0186614990234375, -0.01820194721221924, -0.017742395401000977, -0.017282843589782715, -0.016823291778564453, -0.01636373996734619, -0.01590418815612793, -0.015444636344909668, -0.014985084533691406, -0.014525532722473145, -0.014065980911254883, -0.013606429100036621, -0.01314687728881836, -0.012687325477600098, -0.012227773666381836, -0.011768221855163574, -0.011308670043945312, -0.01084911823272705, -0.010389566421508789, -0.009930014610290527, -0.009470462799072266, -0.009010910987854004, -0.008551359176635742, -0.00809180736541748, -0.007632255554199219, -0.007172703742980957, -0.006713151931762695, -0.006253600120544434, -0.005794048309326172, -0.00533449649810791, -0.0048749446868896484, -0.004415392875671387, -0.003955841064453125, -0.0034962892532348633, -0.0030367374420166016, -0.00257718563079834, -0.002117633819580078, -0.0016580820083618164, -0.0011985301971435547, -0.000738978385925293, -0.00027942657470703125, 0.00018012523651123047, 0.0006396770477294922, 0.001099228858947754, 0.0015587806701660156, 0.0020183324813842773, 0.002477884292602539, 0.0029374361038208008, 0.0033969879150390625, 0.0038565397262573242, 0.004316091537475586, 0.004775643348693848, 0.005235195159912109, 0.005694746971130371, 0.006154298782348633, 0.0066138505935668945, 0.007073402404785156, 0.007532954216003418, 0.00799250602722168, 0.008452057838439941, 0.008911609649658203, 0.009371161460876465, 0.009830713272094727, 0.010290265083312988, 0.01074981689453125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 4.0, 6.0, 14.0, 64.0, 125.0, 352.0, 2651.0, 990444.0, 3197039.0, 3020.0, 365.0, 129.0, 56.0, 16.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.445556640625, -0.3961753845214844, -0.34679412841796875, -0.2974128723144531, -0.2480316162109375, -0.19865036010742188, -0.14926910400390625, -0.09988784790039062, -0.050506591796875, -0.001125335693359375, 0.04825592041015625, 0.09763717651367188, 0.1470184326171875, 0.19639968872070312, 0.24578094482421875, 0.2951622009277344, 0.34454345703125, 0.3939247131347656, 0.44330596923828125, 0.4926872253417969, 0.5420684814453125, 0.5914497375488281, 0.6408309936523438, 0.6902122497558594, 0.739593505859375, 0.7889747619628906, 0.8383560180664062, 0.8877372741699219, 0.9371185302734375, 0.9864997863769531, 1.0358810424804688, 1.0852622985839844, 1.1346435546875, 1.1840248107910156, 1.2334060668945312, 1.2827873229980469, 1.3321685791015625, 1.3815498352050781, 1.4309310913085938, 1.4803123474121094, 1.529693603515625, 1.5790748596191406, 1.6284561157226562, 1.6778373718261719, 1.7272186279296875, 1.7765998840332031, 1.8259811401367188, 1.8753623962402344, 1.92474365234375, 1.9741249084472656, 2.0235061645507812, 2.072887420654297, 2.1222686767578125, 2.171649932861328, 2.2210311889648438, 2.2704124450683594, 2.319793701171875, 2.3691749572753906, 2.4185562133789062, 2.467937469482422, 2.5173187255859375, 2.566699981689453, 2.6160812377929688, 2.6654624938964844, 2.71484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 10.0, 14.0, 13.0, 16.0, 17.0, 28.0, 34.0, 39.0, 68.0, 124.0, 201.0, 395.0, 1714.0, 633.0, 249.0, 143.0, 112.0, 65.0, 52.0, 27.0, 28.0, 14.0, 17.0, 11.0, 6.0, 3.0, 8.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.04986572265625, -0.04857921600341797, -0.04729270935058594, -0.046006202697753906, -0.044719696044921875, -0.043433189392089844, -0.04214668273925781, -0.04086017608642578, -0.03957366943359375, -0.03828716278076172, -0.03700065612792969, -0.035714149475097656, -0.034427642822265625, -0.033141136169433594, -0.03185462951660156, -0.03056812286376953, -0.0292816162109375, -0.02799510955810547, -0.026708602905273438, -0.025422096252441406, -0.024135589599609375, -0.022849082946777344, -0.021562576293945312, -0.02027606964111328, -0.01898956298828125, -0.01770305633544922, -0.016416549682617188, -0.015130043029785156, -0.013843536376953125, -0.012557029724121094, -0.011270523071289062, -0.009984016418457031, -0.008697509765625, -0.007411003112792969, -0.0061244964599609375, -0.004837989807128906, -0.003551483154296875, -0.0022649765014648438, -0.0009784698486328125, 0.00030803680419921875, 0.00159454345703125, 0.0028810501098632812, 0.0041675567626953125, 0.005454063415527344, 0.006740570068359375, 0.008027076721191406, 0.009313583374023438, 0.010600090026855469, 0.0118865966796875, 0.013173103332519531, 0.014459609985351562, 0.015746116638183594, 0.017032623291015625, 0.018319129943847656, 0.019605636596679688, 0.02089214324951172, 0.02217864990234375, 0.02346515655517578, 0.024751663208007812, 0.026038169860839844, 0.027324676513671875, 0.028611183166503906, 0.029897689819335938, 0.03118419647216797, 0.032470703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 6.0, 185.0, 765.0, 51.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7070081233978271, -0.5940101146697998, -0.4810120463371277, -0.36801400780677795, -0.2550159692764282, -0.14201796054840088, -0.02901989221572876, 0.08397817611694336, 0.1969761848449707, 0.30997422337532043, 0.42297226190567017, 0.5359703302383423, 0.6489683389663696, 0.761966347694397, 0.8749644160270691, 0.9879624843597412, 1.1009604930877686, 1.213958501815796, 1.3269565105438232, 1.4399546384811401, 1.5529526472091675, 1.6659506559371948, 1.7789487838745117, 1.891946792602539, 2.0049448013305664, 2.1179428100585938, 2.230940818786621, 2.3439388275146484, 2.456936836242676, 2.569934844970703, 2.6829330921173096, 2.795931100845337, 2.908928871154785, 3.0219268798828125, 3.13492488861084, 3.247922897338867, 3.3609209060668945, 3.473918914794922, 3.5869171619415283, 3.6999151706695557, 3.812913179397583, 3.9259111881256104, 4.038909435272217, 4.151907444000244, 4.2649054527282715, 4.377903461456299, 4.490901470184326, 4.6038994789123535, 4.716897487640381, 4.829895496368408, 4.9428935050964355, 5.055891513824463, 5.16888952255249, 5.281887531280518, 5.394885540008545, 5.5078840255737305, 5.620882034301758, 5.733880043029785, 5.8468780517578125, 5.95987606048584, 6.072874069213867, 6.1858720779418945, 6.298870086669922, 6.411868095397949, 6.524866104125977]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 10.0, 14.0, 17.0, 36.0, 45.0, 81.0, 101.0, 120.0, 117.0, 104.0, 95.0, 86.0, 76.0, 51.0, 23.0, 11.0, 8.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.555079460144043, -0.5425467491149902, -0.5300140380859375, -0.5174813270568848, -0.504948616027832, -0.4924158751964569, -0.4798831641674042, -0.46735045313835144, -0.4548177421092987, -0.44228503108024597, -0.42975232005119324, -0.4172195792198181, -0.4046868681907654, -0.39215415716171265, -0.3796214461326599, -0.3670887351036072, -0.35455602407455444, -0.3420233130455017, -0.329490602016449, -0.31695789098739624, -0.3044251501560211, -0.2918924391269684, -0.27935972809791565, -0.2668270170688629, -0.2542942762374878, -0.24176156520843506, -0.22922883927822113, -0.2166961282491684, -0.20416341722011566, -0.19163069128990173, -0.179097980260849, -0.16656526923179626, -0.15403255820274353, -0.1414998471736908, -0.12896712124347687, -0.11643441021442413, -0.1039016991853714, -0.09136898070573807, -0.07883626222610474, -0.066303551197052, -0.05377083271741867, -0.04123811796307564, -0.028705401346087456, -0.016172684729099274, -0.003639969974756241, 0.008892744779586792, 0.021425463259220123, 0.03395817428827286, 0.04649089276790619, 0.05902360752224922, 0.07155632227659225, 0.08408904075622559, 0.09662175178527832, 0.10915447026491165, 0.12168718874454498, 0.13421989977359772, 0.14675262570381165, 0.15928533673286438, 0.1718180626630783, 0.18435077369213104, 0.19688348472118378, 0.2094162106513977, 0.22194892168045044, 0.23448163270950317, 0.2470143437385559]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 3.0, 11.0, 6.0, 8.0, 19.0, 18.0, 23.0, 30.0, 36.0, 29.0, 41.0, 35.0, 51.0, 44.0, 41.0, 34651.0, 1013004.0, 73.0, 62.0, 47.0, 49.0, 44.0, 38.0, 37.0, 39.0, 28.0, 18.0, 12.0, 10.0, 6.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.986328125, -3.869537353515625, -3.75274658203125, -3.635955810546875, -3.5191650390625, -3.402374267578125, -3.28558349609375, -3.168792724609375, -3.052001953125, -2.935211181640625, -2.81842041015625, -2.701629638671875, -2.5848388671875, -2.468048095703125, -2.35125732421875, -2.234466552734375, -2.11767578125, -2.000885009765625, -1.88409423828125, -1.767303466796875, -1.6505126953125, -1.533721923828125, -1.41693115234375, -1.300140380859375, -1.183349609375, -1.066558837890625, -0.94976806640625, -0.832977294921875, -0.7161865234375, -0.599395751953125, -0.48260498046875, -0.365814208984375, -0.2490234375, -0.132232666015625, -0.01544189453125, 0.101348876953125, 0.2181396484375, 0.334930419921875, 0.45172119140625, 0.568511962890625, 0.685302734375, 0.802093505859375, 0.91888427734375, 1.035675048828125, 1.1524658203125, 1.269256591796875, 1.38604736328125, 1.502838134765625, 1.61962890625, 1.736419677734375, 1.85321044921875, 1.970001220703125, 2.0867919921875, 2.203582763671875, 2.32037353515625, 2.437164306640625, 2.553955078125, 2.670745849609375, 2.78753662109375, 2.904327392578125, 3.0211181640625, 3.137908935546875, 3.25469970703125, 3.371490478515625, 3.48828125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 7.0, 28.0, 132.0, 331.0, 348.0, 140.0, 34.0], "bins": [-0.1541748046875, -0.151644766330719, -0.149114727973938, -0.14658468961715698, -0.14405465126037598, -0.14152461290359497, -0.13899457454681396, -0.13646453619003296, -0.13393449783325195, -0.13140445947647095, -0.12887442111968994, -0.12634438276290894, -0.12381434440612793, -0.12128430604934692, -0.11875426769256592, -0.11622422933578491, -0.1136941909790039, -0.1111641526222229, -0.1086341142654419, -0.10610407590866089, -0.10357403755187988, -0.10104399919509888, -0.09851396083831787, -0.09598392248153687, -0.09345388412475586, -0.09092384576797485, -0.08839380741119385, -0.08586376905441284, -0.08333373069763184, -0.08080369234085083, -0.07827365398406982, -0.07574361562728882, -0.07321357727050781, -0.0706835389137268, -0.0681535005569458, -0.0656234622001648, -0.06309342384338379, -0.06056338548660278, -0.05803334712982178, -0.05550330877304077, -0.052973270416259766, -0.05044323205947876, -0.047913193702697754, -0.04538315534591675, -0.04285311698913574, -0.040323078632354736, -0.03779304027557373, -0.035263001918792725, -0.03273296356201172, -0.030202925205230713, -0.027672886848449707, -0.0251428484916687, -0.022612810134887695, -0.02008277177810669, -0.017552733421325684, -0.015022695064544678, -0.012492656707763672, -0.009962618350982666, -0.00743257999420166, -0.004902541637420654, -0.0023725032806396484, 0.00015753507614135742, 0.0026875734329223633, 0.005217611789703369, 0.007747650146484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 10.0, 7.0, 15.0, 19.0, 30.0, 49.0, 76.0, 108.0, 189.0, 334.0, 640.0, 1477.0, 3423.0, 9683.0, 36352.0, 227415.0, 652153.0, 87030.0, 19478.0, 5828.0, 2181.0, 922.0, 446.0, 256.0, 148.0, 90.0, 64.0, 26.0, 26.0, 22.0, 16.0, 9.0, 12.0, 3.0, 2.0, 3.0, 6.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8779296875, -0.8523101806640625, -0.826690673828125, -0.8010711669921875, -0.77545166015625, -0.7498321533203125, -0.724212646484375, -0.6985931396484375, -0.6729736328125, -0.6473541259765625, -0.621734619140625, -0.5961151123046875, -0.57049560546875, -0.5448760986328125, -0.519256591796875, -0.4936370849609375, -0.468017578125, -0.4423980712890625, -0.416778564453125, -0.3911590576171875, -0.36553955078125, -0.3399200439453125, -0.314300537109375, -0.2886810302734375, -0.2630615234375, -0.2374420166015625, -0.211822509765625, -0.1862030029296875, -0.16058349609375, -0.1349639892578125, -0.109344482421875, -0.0837249755859375, -0.05810546875, -0.0324859619140625, -0.006866455078125, 0.0187530517578125, 0.04437255859375, 0.0699920654296875, 0.095611572265625, 0.1212310791015625, 0.1468505859375, 0.1724700927734375, 0.198089599609375, 0.2237091064453125, 0.24932861328125, 0.2749481201171875, 0.300567626953125, 0.3261871337890625, 0.351806640625, 0.3774261474609375, 0.403045654296875, 0.4286651611328125, 0.45428466796875, 0.4799041748046875, 0.505523681640625, 0.5311431884765625, 0.5567626953125, 0.5823822021484375, 0.608001708984375, 0.6336212158203125, 0.65924072265625, 0.6848602294921875, 0.710479736328125, 0.7360992431640625, 0.76171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 1.0, 5.0, 8.0, 10.0, 13.0, 19.0, 16.0, 28.0, 33.0, 33.0, 42.0, 39.0, 60.0, 62.0, 76.0, 65.0, 59.0, 46.0, 57.0, 50.0, 54.0, 41.0, 29.0, 28.0, 20.0, 23.0, 26.0, 11.0, 15.0, 8.0, 6.0, 5.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1160888671875, -0.11192703247070312, -0.10776519775390625, -0.10360336303710938, -0.0994415283203125, -0.09527969360351562, -0.09111785888671875, -0.08695602416992188, -0.082794189453125, -0.07863235473632812, -0.07447052001953125, -0.07030868530273438, -0.0661468505859375, -0.061985015869140625, -0.05782318115234375, -0.053661346435546875, -0.04949951171875, -0.045337677001953125, -0.04117584228515625, -0.037014007568359375, -0.0328521728515625, -0.028690338134765625, -0.02452850341796875, -0.020366668701171875, -0.016204833984375, -0.012042999267578125, -0.00788116455078125, -0.003719329833984375, 0.0004425048828125, 0.004604339599609375, 0.00876617431640625, 0.012928009033203125, 0.01708984375, 0.021251678466796875, 0.02541351318359375, 0.029575347900390625, 0.0337371826171875, 0.037899017333984375, 0.04206085205078125, 0.046222686767578125, 0.050384521484375, 0.054546356201171875, 0.05870819091796875, 0.06287002563476562, 0.0670318603515625, 0.07119369506835938, 0.07535552978515625, 0.07951736450195312, 0.08367919921875, 0.08784103393554688, 0.09200286865234375, 0.09616470336914062, 0.1003265380859375, 0.10448837280273438, 0.10865020751953125, 0.11281204223632812, 0.116973876953125, 0.12113571166992188, 0.12529754638671875, 0.12945938110351562, 0.1336212158203125, 0.13778305053710938, 0.14194488525390625, 0.14610671997070312, 0.1502685546875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 8.0, 14.0, 23.0, 39.0, 72.0, 128.0, 238.0, 546.0, 1646.0, 5240.0, 22004.0, 149174.0, 744350.0, 101350.0, 17058.0, 4225.0, 1392.0, 523.0, 229.0, 100.0, 71.0, 43.0, 28.0, 12.0, 10.0, 10.0, 4.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.81500244140625, -0.7882080078125, -0.76141357421875, -0.734619140625, -0.70782470703125, -0.6810302734375, -0.65423583984375, -0.62744140625, -0.60064697265625, -0.5738525390625, -0.54705810546875, -0.520263671875, -0.49346923828125, -0.4666748046875, -0.43988037109375, -0.4130859375, -0.38629150390625, -0.3594970703125, -0.33270263671875, -0.305908203125, -0.27911376953125, -0.2523193359375, -0.22552490234375, -0.19873046875, -0.17193603515625, -0.1451416015625, -0.11834716796875, -0.091552734375, -0.06475830078125, -0.0379638671875, -0.01116943359375, 0.015625, 0.04241943359375, 0.0692138671875, 0.09600830078125, 0.122802734375, 0.14959716796875, 0.1763916015625, 0.20318603515625, 0.22998046875, 0.25677490234375, 0.2835693359375, 0.31036376953125, 0.337158203125, 0.36395263671875, 0.3907470703125, 0.41754150390625, 0.4443359375, 0.47113037109375, 0.4979248046875, 0.52471923828125, 0.551513671875, 0.57830810546875, 0.6051025390625, 0.63189697265625, 0.65869140625, 0.68548583984375, 0.7122802734375, 0.73907470703125, 0.765869140625, 0.79266357421875, 0.8194580078125, 0.84625244140625, 0.873046875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 7.0, 8.0, 11.0, 18.0, 28.0, 50.0, 49.0, 62.0, 100.0, 100.0, 135.0, 126.0, 85.0, 51.0, 40.0, 33.0, 19.0, 14.0, 13.0, 11.0, 7.0, 5.0, 7.0, 5.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-9.97781753540039e-05, -9.717419743537903e-05, -9.457021951675415e-05, -9.196624159812927e-05, -8.93622636795044e-05, -8.675828576087952e-05, -8.415430784225464e-05, -8.155032992362976e-05, -7.894635200500488e-05, -7.634237408638e-05, -7.373839616775513e-05, -7.113441824913025e-05, -6.853044033050537e-05, -6.592646241188049e-05, -6.332248449325562e-05, -6.071850657463074e-05, -5.811452865600586e-05, -5.551055073738098e-05, -5.2906572818756104e-05, -5.0302594900131226e-05, -4.769861698150635e-05, -4.509463906288147e-05, -4.249066114425659e-05, -3.9886683225631714e-05, -3.7282705307006836e-05, -3.467872738838196e-05, -3.207474946975708e-05, -2.9470771551132202e-05, -2.6866793632507324e-05, -2.4262815713882446e-05, -2.165883779525757e-05, -1.905485987663269e-05, -1.6450881958007812e-05, -1.3846904039382935e-05, -1.1242926120758057e-05, -8.638948202133179e-06, -6.034970283508301e-06, -3.430992364883423e-06, -8.270144462585449e-07, 1.776963472366333e-06, 4.380941390991211e-06, 6.984919309616089e-06, 9.588897228240967e-06, 1.2192875146865845e-05, 1.4796853065490723e-05, 1.74008309841156e-05, 2.000480890274048e-05, 2.2608786821365356e-05, 2.5212764739990234e-05, 2.7816742658615112e-05, 3.042072057723999e-05, 3.302469849586487e-05, 3.5628676414489746e-05, 3.8232654333114624e-05, 4.08366322517395e-05, 4.344061017036438e-05, 4.604458808898926e-05, 4.8648566007614136e-05, 5.1252543926239014e-05, 5.385652184486389e-05, 5.646049976348877e-05, 5.906447768211365e-05, 6.166845560073853e-05, 6.42724335193634e-05, 6.687641143798828e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 4.0, 5.0, 11.0, 11.0, 30.0, 31.0, 49.0, 75.0, 120.0, 239.0, 480.0, 1254.0, 4431.0, 22258.0, 215788.0, 728916.0, 61454.0, 9680.0, 2296.0, 749.0, 315.0, 134.0, 99.0, 58.0, 26.0, 21.0, 11.0, 10.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5582046508789062, -0.5319366455078125, -0.5056686401367188, -0.479400634765625, -0.45313262939453125, -0.4268646240234375, -0.40059661865234375, -0.37432861328125, -0.34806060791015625, -0.3217926025390625, -0.29552459716796875, -0.269256591796875, -0.24298858642578125, -0.2167205810546875, -0.19045257568359375, -0.1641845703125, -0.13791656494140625, -0.1116485595703125, -0.08538055419921875, -0.059112548828125, -0.03284454345703125, -0.0065765380859375, 0.01969146728515625, 0.04595947265625, 0.07222747802734375, 0.0984954833984375, 0.12476348876953125, 0.151031494140625, 0.17729949951171875, 0.2035675048828125, 0.22983551025390625, 0.256103515625, 0.28237152099609375, 0.3086395263671875, 0.33490753173828125, 0.361175537109375, 0.38744354248046875, 0.4137115478515625, 0.43997955322265625, 0.46624755859375, 0.49251556396484375, 0.5187835693359375, 0.5450515747070312, 0.571319580078125, 0.5975875854492188, 0.6238555908203125, 0.6501235961914062, 0.6763916015625, 0.7026596069335938, 0.7289276123046875, 0.7551956176757812, 0.781463623046875, 0.8077316284179688, 0.8339996337890625, 0.8602676391601562, 0.88653564453125, 0.9128036499023438, 0.9390716552734375, 0.9653396606445312, 0.991607666015625, 1.0178756713867188, 1.0441436767578125, 1.0704116821289062, 1.0966796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 13.0, 13.0, 14.0, 22.0, 27.0, 32.0, 43.0, 76.0, 94.0, 105.0, 112.0, 96.0, 73.0, 65.0, 36.0, 37.0, 26.0, 22.0, 17.0, 15.0, 15.0, 8.0, 15.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.34912109375, -0.34107208251953125, -0.3330230712890625, -0.32497406005859375, -0.316925048828125, -0.30887603759765625, -0.3008270263671875, -0.29277801513671875, -0.28472900390625, -0.27667999267578125, -0.2686309814453125, -0.26058197021484375, -0.252532958984375, -0.24448394775390625, -0.2364349365234375, -0.22838592529296875, -0.2203369140625, -0.21228790283203125, -0.2042388916015625, -0.19618988037109375, -0.188140869140625, -0.18009185791015625, -0.1720428466796875, -0.16399383544921875, -0.15594482421875, -0.14789581298828125, -0.1398468017578125, -0.13179779052734375, -0.123748779296875, -0.11569976806640625, -0.1076507568359375, -0.09960174560546875, -0.091552734375, -0.08350372314453125, -0.0754547119140625, -0.06740570068359375, -0.059356689453125, -0.05130767822265625, -0.0432586669921875, -0.03520965576171875, -0.02716064453125, -0.01911163330078125, -0.0110626220703125, -0.00301361083984375, 0.005035400390625, 0.01308441162109375, 0.0211334228515625, 0.02918243408203125, 0.0372314453125, 0.04528045654296875, 0.0533294677734375, 0.06137847900390625, 0.069427490234375, 0.07747650146484375, 0.0855255126953125, 0.09357452392578125, 0.10162353515625, 0.10967254638671875, 0.1177215576171875, 0.12577056884765625, 0.133819580078125, 0.14186859130859375, 0.1499176025390625, 0.15796661376953125, 0.166015625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 7.0, 21.0, 119.0, 625.0, 210.0, 20.0, 8.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.046420097351074, -6.597654342651367, -6.148888111114502, -5.700121879577637, -5.25135612487793, -4.802590370178223, -4.353824138641357, -3.9050581455230713, -3.456292152404785, -3.007526159286499, -2.558760166168213, -2.1099941730499268, -1.6612281799316406, -1.2124621868133545, -0.7636961936950684, -0.3149302005767822, 0.1338357925415039, 0.58260178565979, 1.0313677787780762, 1.4801337718963623, 1.9288997650146484, 2.3776657581329346, 2.8264317512512207, 3.275197744369507, 3.723963737487793, 4.1727294921875, 4.621495723724365, 5.0702619552612305, 5.5190277099609375, 5.9677934646606445, 6.41655969619751, 6.865325927734375, 7.314090728759766, 7.762856483459473, 8.21162223815918, 8.660388946533203, 9.10915470123291, 9.557920455932617, 10.00668716430664, 10.455452919006348, 10.904218673706055, 11.352984428405762, 11.801750183105469, 12.250516891479492, 12.6992826461792, 13.148048400878906, 13.59681510925293, 14.045580863952637, 14.494346618652344, 14.94311237335205, 15.391878128051758, 15.840644836425781, 16.289409637451172, 16.738176345825195, 17.18694305419922, 17.63570785522461, 18.084474563598633, 18.533241271972656, 18.982006072998047, 19.43077278137207, 19.879539489746094, 20.328304290771484, 20.777070999145508, 21.2258358001709, 21.674602508544922]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 9.0, 14.0, 25.0, 26.0, 38.0, 54.0, 39.0, 62.0, 59.0, 74.0, 81.0, 68.0, 82.0, 60.0, 74.0, 43.0, 58.0, 30.0, 29.0, 22.0, 15.0, 9.0, 9.0, 8.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8026463985443115, -0.7644394040107727, -0.7262324094772339, -0.6880253553390503, -0.6498183608055115, -0.6116113662719727, -0.5734043121337891, -0.5351973176002502, -0.4969903230667114, -0.4587833285331726, -0.4205763041973114, -0.3823692798614502, -0.3441622853279114, -0.30595529079437256, -0.26774826645851135, -0.22954124212265015, -0.19133424758911133, -0.15312723815441132, -0.1149202287197113, -0.07671321928501129, -0.03850620985031128, -0.0002992004156112671, 0.037907809019088745, 0.07611483335494995, 0.11432182788848877, 0.15252883732318878, 0.1907358467578888, 0.2289428561925888, 0.2671498656272888, 0.30535686016082764, 0.34356388449668884, 0.38177090883255005, 0.41997790336608887, 0.4581848978996277, 0.4963919222354889, 0.5345989465713501, 0.5728059411048889, 0.6110129356384277, 0.6492199897766113, 0.6874269843101501, 0.725633978843689, 0.7638409733772278, 0.8020479679107666, 0.8402550220489502, 0.878462016582489, 0.9166690111160278, 0.9548760652542114, 0.9930830597877502, 1.031290054321289, 1.0694971084594727, 1.1077040433883667, 1.1459110975265503, 1.1841180324554443, 1.222325086593628, 1.2605321407318115, 1.2987391948699951, 1.3369461297988892, 1.3751531839370728, 1.4133601188659668, 1.4515671730041504, 1.489774227142334, 1.527981162071228, 1.5661882162094116, 1.6043951511383057, 1.6426022052764893]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 1.0, 5.0, 7.0, 7.0, 8.0, 9.0, 13.0, 10.0, 25.0, 20.0, 17.0, 23.0, 34.0, 43.0, 41.0, 61.0, 55.0, 61.0, 120.0, 330.0, 17099.0, 4170215.0, 5442.0, 293.0, 110.0, 55.0, 43.0, 30.0, 19.0, 19.0, 22.0, 11.0, 10.0, 6.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.75, -5.59197998046875, -5.4339599609375, -5.27593994140625, -5.117919921875, -4.95989990234375, -4.8018798828125, -4.64385986328125, -4.48583984375, -4.32781982421875, -4.1697998046875, -4.01177978515625, -3.853759765625, -3.69573974609375, -3.5377197265625, -3.37969970703125, -3.2216796875, -3.06365966796875, -2.9056396484375, -2.74761962890625, -2.589599609375, -2.43157958984375, -2.2735595703125, -2.11553955078125, -1.95751953125, -1.79949951171875, -1.6414794921875, -1.48345947265625, -1.325439453125, -1.16741943359375, -1.0093994140625, -0.85137939453125, -0.693359375, -0.53533935546875, -0.3773193359375, -0.21929931640625, -0.061279296875, 0.09674072265625, 0.2547607421875, 0.41278076171875, 0.57080078125, 0.72882080078125, 0.8868408203125, 1.04486083984375, 1.202880859375, 1.36090087890625, 1.5189208984375, 1.67694091796875, 1.8349609375, 1.99298095703125, 2.1510009765625, 2.30902099609375, 2.467041015625, 2.62506103515625, 2.7830810546875, 2.94110107421875, 3.09912109375, 3.25714111328125, 3.4151611328125, 3.57318115234375, 3.731201171875, 3.88922119140625, 4.0472412109375, 4.20526123046875, 4.36328125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 6.0, 15.0, 41.0, 86.0, 136.0, 179.0, 190.0, 158.0, 103.0, 61.0, 21.0, 10.0, 5.0, 3.0, 1.0], "bins": [-0.125732421875, -0.12345290184020996, -0.12117338180541992, -0.11889386177062988, -0.11661434173583984, -0.1143348217010498, -0.11205530166625977, -0.10977578163146973, -0.10749626159667969, -0.10521674156188965, -0.10293722152709961, -0.10065770149230957, -0.09837818145751953, -0.09609866142272949, -0.09381914138793945, -0.09153962135314941, -0.08926010131835938, -0.08698058128356934, -0.0847010612487793, -0.08242154121398926, -0.08014202117919922, -0.07786250114440918, -0.07558298110961914, -0.0733034610748291, -0.07102394104003906, -0.06874442100524902, -0.06646490097045898, -0.06418538093566895, -0.061905860900878906, -0.05962634086608887, -0.05734682083129883, -0.05506730079650879, -0.05278778076171875, -0.05050826072692871, -0.04822874069213867, -0.04594922065734863, -0.043669700622558594, -0.041390180587768555, -0.039110660552978516, -0.03683114051818848, -0.03455162048339844, -0.0322721004486084, -0.02999258041381836, -0.02771306037902832, -0.02543354034423828, -0.023154020309448242, -0.020874500274658203, -0.018594980239868164, -0.016315460205078125, -0.014035940170288086, -0.011756420135498047, -0.009476900100708008, -0.007197380065917969, -0.00491786003112793, -0.0026383399963378906, -0.00035881996154785156, 0.0019207000732421875, 0.0042002201080322266, 0.006479740142822266, 0.008759260177612305, 0.011038780212402344, 0.013318300247192383, 0.015597820281982422, 0.01787734031677246, 0.0201568603515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 11.0, 13.0, 23.0, 44.0, 104.0, 179.0, 444.0, 2418.0, 3961656.0, 227002.0, 1658.0, 345.0, 189.0, 90.0, 64.0, 26.0, 10.0, 10.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2109375, -3.9287109375, -3.646484375, -3.3642578125, -3.08203125, -2.7998046875, -2.517578125, -2.2353515625, -1.953125, -1.6708984375, -1.388671875, -1.1064453125, -0.82421875, -0.5419921875, -0.259765625, 0.0224609375, 0.3046875, 0.5869140625, 0.869140625, 1.1513671875, 1.43359375, 1.7158203125, 1.998046875, 2.2802734375, 2.5625, 2.8447265625, 3.126953125, 3.4091796875, 3.69140625, 3.9736328125, 4.255859375, 4.5380859375, 4.8203125, 5.1025390625, 5.384765625, 5.6669921875, 5.94921875, 6.2314453125, 6.513671875, 6.7958984375, 7.078125, 7.3603515625, 7.642578125, 7.9248046875, 8.20703125, 8.4892578125, 8.771484375, 9.0537109375, 9.3359375, 9.6181640625, 9.900390625, 10.1826171875, 10.46484375, 10.7470703125, 11.029296875, 11.3115234375, 11.59375, 11.8759765625, 12.158203125, 12.4404296875, 12.72265625, 13.0048828125, 13.287109375, 13.5693359375, 13.8515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 14.0, 72.0, 435.0, 3217.0, 253.0, 59.0, 19.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26904296875, -0.24524688720703125, -0.2214508056640625, -0.19765472412109375, -0.173858642578125, -0.15006256103515625, -0.1262664794921875, -0.10247039794921875, -0.07867431640625, -0.05487823486328125, -0.0310821533203125, -0.00728607177734375, 0.016510009765625, 0.04030609130859375, 0.0641021728515625, 0.08789825439453125, 0.1116943359375, 0.13549041748046875, 0.1592864990234375, 0.18308258056640625, 0.206878662109375, 0.23067474365234375, 0.2544708251953125, 0.27826690673828125, 0.30206298828125, 0.32585906982421875, 0.3496551513671875, 0.37345123291015625, 0.397247314453125, 0.42104339599609375, 0.4448394775390625, 0.46863555908203125, 0.492431640625, 0.5162277221679688, 0.5400238037109375, 0.5638198852539062, 0.587615966796875, 0.6114120483398438, 0.6352081298828125, 0.6590042114257812, 0.68280029296875, 0.7065963745117188, 0.7303924560546875, 0.7541885375976562, 0.777984619140625, 0.8017807006835938, 0.8255767822265625, 0.8493728637695312, 0.8731689453125, 0.8969650268554688, 0.9207611083984375, 0.9445571899414062, 0.968353271484375, 0.9921493530273438, 1.0159454345703125, 1.0397415161132812, 1.06353759765625, 1.0873336791992188, 1.1111297607421875, 1.1349258422851562, 1.158721923828125, 1.1825180053710938, 1.2063140869140625, 1.2301101684570312, 1.25390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 10.0, 35.0, 164.0, 504.0, 222.0, 51.0, 15.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.556102752685547, -3.3115787506103516, -3.0670547485351562, -2.822530746459961, -2.5780067443847656, -2.3334827423095703, -2.088958740234375, -1.8444346189498901, -1.5999106168746948, -1.3553866147994995, -1.1108626127243042, -0.8663385510444641, -0.6218145489692688, -0.3772904872894287, -0.1327664852142334, 0.11175751686096191, 0.3562815189361572, 0.6008055210113525, 0.8453295230865479, 1.0898535251617432, 1.3343775272369385, 1.5789016485214233, 1.8234256505966187, 2.0679497718811035, 2.312473773956299, 2.556997776031494, 2.8015217781066895, 3.0460457801818848, 3.29056978225708, 3.5350937843322754, 3.7796177864074707, 4.024141788482666, 4.268665790557861, 4.513189792633057, 4.757713794708252, 5.002237796783447, 5.246761798858643, 5.491285800933838, 5.735809803009033, 5.9803338050842285, 6.224857807159424, 6.469381809234619, 6.7139058113098145, 6.95842981338501, 7.202953815460205, 7.4474778175354, 7.692001819610596, 7.936525821685791, 8.181050300598145, 8.42557430267334, 8.670098304748535, 8.91462230682373, 9.159146308898926, 9.403670310974121, 9.648194313049316, 9.892718315124512, 10.137242317199707, 10.381766319274902, 10.626290321350098, 10.870814323425293, 11.115338325500488, 11.359862327575684, 11.604386329650879, 11.848910331726074, 12.09343433380127]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 12.0, 14.0, 36.0, 46.0, 57.0, 80.0, 89.0, 115.0, 98.0, 120.0, 100.0, 82.0, 44.0, 46.0, 28.0, 19.0, 5.0, 7.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3043053150177, -2.23893404006958, -2.17356276512146, -2.108191728591919, -2.042820453643799, -1.9774491786956787, -1.9120779037475586, -1.846706748008728, -1.7813355922698975, -1.7159643173217773, -1.6505931615829468, -1.5852218866348267, -1.519850730895996, -1.454479455947876, -1.3891081809997559, -1.3237370252609253, -1.2583657503128052, -1.192994475364685, -1.1276233196258545, -1.0622520446777344, -0.9968808889389038, -0.9315096139907837, -0.8661383986473083, -0.800767183303833, -0.7353959679603577, -0.6700247526168823, -0.604653537273407, -0.5392823219299316, -0.4739110767841339, -0.40853986144065857, -0.34316861629486084, -0.2777974009513855, -0.2124263048171997, -0.14705508947372437, -0.08168385922908783, -0.016312628984451294, 0.04905858635902405, 0.11442980170249939, 0.17980104684829712, 0.24517226219177246, 0.3105434775352478, 0.37591469287872314, 0.4412859082221985, 0.5066571235656738, 0.572028398513794, 0.6373995542526245, 0.7027708292007446, 0.76814204454422, 0.8335132598876953, 0.8988844752311707, 0.964255690574646, 1.0296269655227661, 1.0949981212615967, 1.1603693962097168, 1.225740671157837, 1.2911118268966675, 1.356482982635498, 1.4218542575836182, 1.4872254133224487, 1.5525966882705688, 1.6179678440093994, 1.6833391189575195, 1.7487103939056396, 1.8140815496444702, 1.8794528245925903]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 9.0, 6.0, 8.0, 6.0, 13.0, 9.0, 15.0, 12.0, 20.0, 25.0, 27.0, 32.0, 41.0, 50.0, 75.0, 193.0, 644.0, 4761.0, 197226.0, 827408.0, 15974.0, 1278.0, 291.0, 102.0, 64.0, 58.0, 36.0, 32.0, 24.0, 21.0, 20.0, 14.0, 9.0, 13.0, 7.0, 7.0, 4.0, 4.0, 1.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-3.556640625, -3.455596923828125, -3.35455322265625, -3.253509521484375, -3.1524658203125, -3.051422119140625, -2.95037841796875, -2.849334716796875, -2.748291015625, -2.647247314453125, -2.54620361328125, -2.445159912109375, -2.3441162109375, -2.243072509765625, -2.14202880859375, -2.040985107421875, -1.93994140625, -1.838897705078125, -1.73785400390625, -1.636810302734375, -1.5357666015625, -1.434722900390625, -1.33367919921875, -1.232635498046875, -1.131591796875, -1.030548095703125, -0.92950439453125, -0.828460693359375, -0.7274169921875, -0.626373291015625, -0.52532958984375, -0.424285888671875, -0.3232421875, -0.222198486328125, -0.12115478515625, -0.020111083984375, 0.0809326171875, 0.181976318359375, 0.28302001953125, 0.384063720703125, 0.485107421875, 0.586151123046875, 0.68719482421875, 0.788238525390625, 0.8892822265625, 0.990325927734375, 1.09136962890625, 1.192413330078125, 1.29345703125, 1.394500732421875, 1.49554443359375, 1.596588134765625, 1.6976318359375, 1.798675537109375, 1.89971923828125, 2.000762939453125, 2.101806640625, 2.202850341796875, 2.30389404296875, 2.404937744140625, 2.5059814453125, 2.607025146484375, 2.70806884765625, 2.809112548828125, 2.91015625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 4.0, 4.0, 8.0, 5.0, 20.0, 25.0, 29.0, 33.0, 47.0, 52.0, 44.0, 63.0, 67.0, 79.0, 94.0, 74.0, 58.0, 55.0, 51.0, 39.0, 41.0, 30.0, 21.0, 17.0, 11.0, 9.0, 10.0, 3.0, 6.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07733154296875, -0.07493400573730469, -0.07253646850585938, -0.07013893127441406, -0.06774139404296875, -0.06534385681152344, -0.06294631958007812, -0.06054878234863281, -0.0581512451171875, -0.05575370788574219, -0.053356170654296875, -0.05095863342285156, -0.04856109619140625, -0.04616355895996094, -0.043766021728515625, -0.04136848449707031, -0.038970947265625, -0.03657341003417969, -0.034175872802734375, -0.03177833557128906, -0.02938079833984375, -0.026983261108398438, -0.024585723876953125, -0.022188186645507812, -0.0197906494140625, -0.017393112182617188, -0.014995574951171875, -0.012598037719726562, -0.01020050048828125, -0.0078029632568359375, -0.005405426025390625, -0.0030078887939453125, -0.0006103515625, 0.0017871856689453125, 0.004184722900390625, 0.0065822601318359375, 0.00897979736328125, 0.011377334594726562, 0.013774871826171875, 0.016172409057617188, 0.0185699462890625, 0.020967483520507812, 0.023365020751953125, 0.025762557983398438, 0.02816009521484375, 0.030557632446289062, 0.032955169677734375, 0.03535270690917969, 0.037750244140625, 0.04014778137207031, 0.042545318603515625, 0.04494285583496094, 0.04734039306640625, 0.04973793029785156, 0.052135467529296875, 0.05453300476074219, 0.0569305419921875, 0.05932807922363281, 0.061725616455078125, 0.06412315368652344, 0.06652069091796875, 0.06891822814941406, 0.07131576538085938, 0.07371330261230469, 0.07611083984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 2.0, 9.0, 8.0, 12.0, 16.0, 15.0, 31.0, 42.0, 73.0, 102.0, 157.0, 238.0, 467.0, 891.0, 2072.0, 5699.0, 22023.0, 120938.0, 567262.0, 269340.0, 43576.0, 9747.0, 3070.0, 1243.0, 612.0, 320.0, 193.0, 119.0, 69.0, 62.0, 51.0, 21.0, 21.0, 12.0, 4.0, 7.0, 7.0, 9.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8369140625, -0.808746337890625, -0.78057861328125, -0.752410888671875, -0.7242431640625, -0.696075439453125, -0.66790771484375, -0.639739990234375, -0.611572265625, -0.583404541015625, -0.55523681640625, -0.527069091796875, -0.4989013671875, -0.470733642578125, -0.44256591796875, -0.414398193359375, -0.38623046875, -0.358062744140625, -0.32989501953125, -0.301727294921875, -0.2735595703125, -0.245391845703125, -0.21722412109375, -0.189056396484375, -0.160888671875, -0.132720947265625, -0.10455322265625, -0.076385498046875, -0.0482177734375, -0.020050048828125, 0.00811767578125, 0.036285400390625, 0.064453125, 0.092620849609375, 0.12078857421875, 0.148956298828125, 0.1771240234375, 0.205291748046875, 0.23345947265625, 0.261627197265625, 0.289794921875, 0.317962646484375, 0.34613037109375, 0.374298095703125, 0.4024658203125, 0.430633544921875, 0.45880126953125, 0.486968994140625, 0.51513671875, 0.543304443359375, 0.57147216796875, 0.599639892578125, 0.6278076171875, 0.655975341796875, 0.68414306640625, 0.712310791015625, 0.740478515625, 0.768646240234375, 0.79681396484375, 0.824981689453125, 0.8531494140625, 0.881317138671875, 0.90948486328125, 0.937652587890625, 0.9658203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 7.0, 5.0, 3.0, 6.0, 12.0, 14.0, 17.0, 20.0, 27.0, 20.0, 27.0, 39.0, 57.0, 54.0, 61.0, 46.0, 58.0, 52.0, 62.0, 68.0, 57.0, 50.0, 40.0, 35.0, 36.0, 36.0, 24.0, 21.0, 12.0, 14.0, 11.0, 2.0, 5.0, 3.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.35791015625, -0.34685516357421875, -0.3358001708984375, -0.32474517822265625, -0.313690185546875, -0.30263519287109375, -0.2915802001953125, -0.28052520751953125, -0.26947021484375, -0.25841522216796875, -0.2473602294921875, -0.23630523681640625, -0.225250244140625, -0.21419525146484375, -0.2031402587890625, -0.19208526611328125, -0.1810302734375, -0.16997528076171875, -0.1589202880859375, -0.14786529541015625, -0.136810302734375, -0.12575531005859375, -0.1147003173828125, -0.10364532470703125, -0.09259033203125, -0.08153533935546875, -0.0704803466796875, -0.05942535400390625, -0.048370361328125, -0.03731536865234375, -0.0262603759765625, -0.01520538330078125, -0.004150390625, 0.00690460205078125, 0.0179595947265625, 0.02901458740234375, 0.040069580078125, 0.05112457275390625, 0.0621795654296875, 0.07323455810546875, 0.08428955078125, 0.09534454345703125, 0.1063995361328125, 0.11745452880859375, 0.128509521484375, 0.13956451416015625, 0.1506195068359375, 0.16167449951171875, 0.1727294921875, 0.18378448486328125, 0.1948394775390625, 0.20589447021484375, 0.216949462890625, 0.22800445556640625, 0.2390594482421875, 0.25011444091796875, 0.26116943359375, 0.27222442626953125, 0.2832794189453125, 0.29433441162109375, 0.305389404296875, 0.31644439697265625, 0.3274993896484375, 0.33855438232421875, 0.349609375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 11.0, 8.0, 18.0, 20.0, 29.0, 57.0, 92.0, 113.0, 177.0, 380.0, 897.0, 2652.0, 12056.0, 159283.0, 819719.0, 43818.0, 6189.0, 1719.0, 591.0, 289.0, 147.0, 96.0, 55.0, 37.0, 28.0, 19.0, 16.0, 14.0, 5.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.189453125, -1.1501922607421875, -1.110931396484375, -1.0716705322265625, -1.03240966796875, -0.9931488037109375, -0.953887939453125, -0.9146270751953125, -0.8753662109375, -0.8361053466796875, -0.796844482421875, -0.7575836181640625, -0.71832275390625, -0.6790618896484375, -0.639801025390625, -0.6005401611328125, -0.561279296875, -0.5220184326171875, -0.482757568359375, -0.4434967041015625, -0.40423583984375, -0.3649749755859375, -0.325714111328125, -0.2864532470703125, -0.2471923828125, -0.2079315185546875, -0.168670654296875, -0.1294097900390625, -0.09014892578125, -0.0508880615234375, -0.011627197265625, 0.0276336669921875, 0.06689453125, 0.1061553955078125, 0.145416259765625, 0.1846771240234375, 0.22393798828125, 0.2631988525390625, 0.302459716796875, 0.3417205810546875, 0.3809814453125, 0.4202423095703125, 0.459503173828125, 0.4987640380859375, 0.53802490234375, 0.5772857666015625, 0.616546630859375, 0.6558074951171875, 0.695068359375, 0.7343292236328125, 0.773590087890625, 0.8128509521484375, 0.85211181640625, 0.8913726806640625, 0.930633544921875, 0.9698944091796875, 1.0091552734375, 1.0484161376953125, 1.087677001953125, 1.1269378662109375, 1.16619873046875, 1.2054595947265625, 1.244720458984375, 1.2839813232421875, 1.3232421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 9.0, 13.0, 16.0, 18.0, 26.0, 29.0, 44.0, 82.0, 124.0, 142.0, 132.0, 117.0, 72.0, 61.0, 39.0, 26.0, 10.0, 15.0, 12.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.08970832824707e-05, -8.710380643606186e-05, -8.331052958965302e-05, -7.951725274324417e-05, -7.572397589683533e-05, -7.193069905042648e-05, -6.813742220401764e-05, -6.43441453576088e-05, -6.055086851119995e-05, -5.675759166479111e-05, -5.296431481838226e-05, -4.917103797197342e-05, -4.5377761125564575e-05, -4.158448427915573e-05, -3.779120743274689e-05, -3.399793058633804e-05, -3.02046537399292e-05, -2.6411376893520355e-05, -2.261810004711151e-05, -1.8824823200702667e-05, -1.5031546354293823e-05, -1.123826950788498e-05, -7.444992661476135e-06, -3.6517158150672913e-06, 1.4156103134155273e-07, 3.934837877750397e-06, 7.72811472415924e-06, 1.1521391570568085e-05, 1.531466841697693e-05, 1.9107945263385773e-05, 2.2901222109794617e-05, 2.669449895620346e-05, 3.0487775802612305e-05, 3.428105264902115e-05, 3.807432949542999e-05, 4.186760634183884e-05, 4.566088318824768e-05, 4.9454160034656525e-05, 5.324743688106537e-05, 5.704071372747421e-05, 6.083399057388306e-05, 6.46272674202919e-05, 6.842054426670074e-05, 7.221382111310959e-05, 7.600709795951843e-05, 7.980037480592728e-05, 8.359365165233612e-05, 8.738692849874496e-05, 9.118020534515381e-05, 9.497348219156265e-05, 9.87667590379715e-05, 0.00010256003588438034, 0.00010635331273078918, 0.00011014658957719803, 0.00011393986642360687, 0.00011773314327001572, 0.00012152642011642456, 0.0001253196969628334, 0.00012911297380924225, 0.0001329062506556511, 0.00013669952750205994, 0.00014049280434846878, 0.00014428608119487762, 0.00014807935804128647, 0.0001518726348876953]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 6.0, 5.0, 6.0, 11.0, 12.0, 11.0, 19.0, 23.0, 58.0, 75.0, 150.0, 246.0, 343.0, 713.0, 1486.0, 3869.0, 13118.0, 85473.0, 744060.0, 170582.0, 19627.0, 4909.0, 1887.0, 846.0, 404.0, 222.0, 133.0, 73.0, 56.0, 29.0, 26.0, 24.0, 10.0, 13.0, 9.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69140625, -0.6672592163085938, -0.6431121826171875, -0.6189651489257812, -0.594818115234375, -0.5706710815429688, -0.5465240478515625, -0.5223770141601562, -0.49822998046875, -0.47408294677734375, -0.4499359130859375, -0.42578887939453125, -0.401641845703125, -0.37749481201171875, -0.3533477783203125, -0.32920074462890625, -0.3050537109375, -0.28090667724609375, -0.2567596435546875, -0.23261260986328125, -0.208465576171875, -0.18431854248046875, -0.1601715087890625, -0.13602447509765625, -0.11187744140625, -0.08773040771484375, -0.0635833740234375, -0.03943634033203125, -0.015289306640625, 0.00885772705078125, 0.0330047607421875, 0.05715179443359375, 0.081298828125, 0.10544586181640625, 0.1295928955078125, 0.15373992919921875, 0.177886962890625, 0.20203399658203125, 0.2261810302734375, 0.25032806396484375, 0.27447509765625, 0.29862213134765625, 0.3227691650390625, 0.34691619873046875, 0.371063232421875, 0.39521026611328125, 0.4193572998046875, 0.44350433349609375, 0.4676513671875, 0.49179840087890625, 0.5159454345703125, 0.5400924682617188, 0.564239501953125, 0.5883865356445312, 0.6125335693359375, 0.6366806030273438, 0.66082763671875, 0.6849746704101562, 0.7091217041015625, 0.7332687377929688, 0.757415771484375, 0.7815628051757812, 0.8057098388671875, 0.8298568725585938, 0.85400390625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 7.0, 14.0, 14.0, 14.0, 18.0, 26.0, 33.0, 40.0, 41.0, 59.0, 64.0, 79.0, 91.0, 119.0, 70.0, 62.0, 60.0, 47.0, 22.0, 25.0, 22.0, 9.0, 11.0, 7.0, 8.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.302490234375, -0.29425048828125, -0.2860107421875, -0.27777099609375, -0.26953125, -0.26129150390625, -0.2530517578125, -0.24481201171875, -0.236572265625, -0.22833251953125, -0.2200927734375, -0.21185302734375, -0.20361328125, -0.19537353515625, -0.1871337890625, -0.17889404296875, -0.170654296875, -0.16241455078125, -0.1541748046875, -0.14593505859375, -0.1376953125, -0.12945556640625, -0.1212158203125, -0.11297607421875, -0.104736328125, -0.09649658203125, -0.0882568359375, -0.08001708984375, -0.07177734375, -0.06353759765625, -0.0552978515625, -0.04705810546875, -0.038818359375, -0.03057861328125, -0.0223388671875, -0.01409912109375, -0.005859375, 0.00238037109375, 0.0106201171875, 0.01885986328125, 0.027099609375, 0.03533935546875, 0.0435791015625, 0.05181884765625, 0.06005859375, 0.06829833984375, 0.0765380859375, 0.08477783203125, 0.093017578125, 0.10125732421875, 0.1094970703125, 0.11773681640625, 0.1259765625, 0.13421630859375, 0.1424560546875, 0.15069580078125, 0.158935546875, 0.16717529296875, 0.1754150390625, 0.18365478515625, 0.19189453125, 0.20013427734375, 0.2083740234375, 0.21661376953125, 0.224853515625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 19.0, 83.0, 335.0, 433.0, 110.0, 21.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.385377883911133, -10.91618537902832, -10.446993827819824, -9.977801322937012, -9.5086088180542, -9.039417266845703, -8.57022476196289, -8.101032257080078, -7.631840229034424, -7.1626482009887695, -6.693455696105957, -6.224263668060303, -5.755071640014648, -5.285879135131836, -4.816687107086182, -4.347495079040527, -3.878302574157715, -3.4091103076934814, -2.939918041229248, -2.4707260131835938, -2.0015337467193604, -1.532341480255127, -1.0631494522094727, -0.5939571857452393, -0.12476491928100586, 0.34442728757858276, 0.8136194944381714, 1.2828116416931152, 1.7520039081573486, 2.221196174621582, 2.6903882026672363, 3.1595804691314697, 3.628772735595703, 4.097964763641357, 4.56715726852417, 5.036349296569824, 5.505541801452637, 5.974733829498291, 6.443925857543945, 6.913118362426758, 7.382310390472412, 7.851502418518066, 8.320694923400879, 8.789886474609375, 9.259078979492188, 9.728271484375, 10.197463989257812, 10.666655540466309, 11.135848045349121, 11.605040550231934, 12.07423210144043, 12.543424606323242, 13.012617111206055, 13.481809616088867, 13.951001167297363, 14.420193672180176, 14.889385223388672, 15.358577728271484, 15.82776927947998, 16.29696273803711, 16.76615333557129, 17.2353458404541, 17.704538345336914, 18.173730850219727, 18.64292335510254]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 8.0, 5.0, 7.0, 6.0, 7.0, 10.0, 24.0, 17.0, 16.0, 22.0, 20.0, 27.0, 32.0, 31.0, 38.0, 43.0, 45.0, 36.0, 52.0, 39.0, 50.0, 63.0, 41.0, 37.0, 38.0, 35.0, 38.0, 35.0, 35.0, 21.0, 23.0, 14.0, 15.0, 8.0, 14.0, 14.0, 8.0, 7.0, 3.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.9695837497711182, -1.9022765159606934, -1.8349692821502686, -1.7676621675491333, -1.7003549337387085, -1.6330476999282837, -1.5657405853271484, -1.4984333515167236, -1.4311261177062988, -1.363818883895874, -1.2965116500854492, -1.229204535484314, -1.1618973016738892, -1.0945900678634644, -1.027282953262329, -0.9599757194519043, -0.8926684856414795, -0.8253612518310547, -0.7580540776252747, -0.6907469034194946, -0.6234396696090698, -0.556132435798645, -0.488825261592865, -0.4215180575847626, -0.35421085357666016, -0.28690364956855774, -0.21959644556045532, -0.1522892415523529, -0.08498203754425049, -0.01767483353614807, 0.049632370471954346, 0.11693957448005676, 0.18424701690673828, 0.2515542209148407, 0.3188614249229431, 0.38616862893104553, 0.45347583293914795, 0.5207830667495728, 0.5880902409553528, 0.6553974151611328, 0.7227046489715576, 0.7900118827819824, 0.8573190569877625, 0.9246262311935425, 0.9919334650039673, 1.059240698814392, 1.1265478134155273, 1.1938550472259521, 1.261162281036377, 1.3284695148468018, 1.3957767486572266, 1.4630838632583618, 1.5303910970687866, 1.5976983308792114, 1.6650054454803467, 1.7323126792907715, 1.7996199131011963, 1.866927146911621, 1.934234380722046, 2.0015416145324707, 2.0688486099243164, 2.136155843734741, 2.203463077545166, 2.270770311355591, 2.3380775451660156]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 7.0, 4.0, 9.0, 10.0, 15.0, 9.0, 11.0, 15.0, 20.0, 13.0, 26.0, 19.0, 40.0, 31.0, 53.0, 91.0, 230.0, 1240.0, 21317.0, 4007391.0, 158001.0, 4634.0, 638.0, 185.0, 76.0, 56.0, 40.0, 36.0, 11.0, 16.0, 10.0, 10.0, 4.0, 8.0, 1.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.28125, -4.164703369140625, -4.04815673828125, -3.931610107421875, -3.8150634765625, -3.698516845703125, -3.58197021484375, -3.465423583984375, -3.348876953125, -3.232330322265625, -3.11578369140625, -2.999237060546875, -2.8826904296875, -2.766143798828125, -2.64959716796875, -2.533050537109375, -2.41650390625, -2.299957275390625, -2.18341064453125, -2.066864013671875, -1.9503173828125, -1.833770751953125, -1.71722412109375, -1.600677490234375, -1.484130859375, -1.367584228515625, -1.25103759765625, -1.134490966796875, -1.0179443359375, -0.901397705078125, -0.78485107421875, -0.668304443359375, -0.5517578125, -0.435211181640625, -0.31866455078125, -0.202117919921875, -0.0855712890625, 0.030975341796875, 0.14752197265625, 0.264068603515625, 0.380615234375, 0.497161865234375, 0.61370849609375, 0.730255126953125, 0.8468017578125, 0.963348388671875, 1.07989501953125, 1.196441650390625, 1.31298828125, 1.429534912109375, 1.54608154296875, 1.662628173828125, 1.7791748046875, 1.895721435546875, 2.01226806640625, 2.128814697265625, 2.245361328125, 2.361907958984375, 2.47845458984375, 2.595001220703125, 2.7115478515625, 2.828094482421875, 2.94464111328125, 3.061187744140625, 3.177734375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 5.0, 3.0, 4.0, 7.0, 7.0, 10.0, 24.0, 24.0, 32.0, 36.0, 44.0, 37.0, 53.0, 44.0, 62.0, 65.0, 58.0, 72.0, 68.0, 45.0, 53.0, 44.0, 40.0, 37.0, 26.0, 15.0, 17.0, 17.0, 9.0, 9.0, 9.0, 6.0, 3.0, 1.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.058685302734375, -0.05639028549194336, -0.05409526824951172, -0.05180025100708008, -0.04950523376464844, -0.0472102165222168, -0.044915199279785156, -0.042620182037353516, -0.040325164794921875, -0.038030147552490234, -0.035735130310058594, -0.03344011306762695, -0.031145095825195312, -0.028850078582763672, -0.02655506134033203, -0.02426004409790039, -0.02196502685546875, -0.01967000961303711, -0.01737499237060547, -0.015079975128173828, -0.012784957885742188, -0.010489940643310547, -0.008194923400878906, -0.005899906158447266, -0.003604888916015625, -0.0013098716735839844, 0.0009851455688476562, 0.003280162811279297, 0.0055751800537109375, 0.007870197296142578, 0.010165214538574219, 0.01246023178100586, 0.0147552490234375, 0.01705026626586914, 0.01934528350830078, 0.021640300750732422, 0.023935317993164062, 0.026230335235595703, 0.028525352478027344, 0.030820369720458984, 0.033115386962890625, 0.035410404205322266, 0.037705421447753906, 0.04000043869018555, 0.04229545593261719, 0.04459047317504883, 0.04688549041748047, 0.04918050765991211, 0.05147552490234375, 0.05377054214477539, 0.05606555938720703, 0.05836057662963867, 0.06065559387207031, 0.06295061111450195, 0.0652456283569336, 0.06754064559936523, 0.06983566284179688, 0.07213068008422852, 0.07442569732666016, 0.0767207145690918, 0.07901573181152344, 0.08131074905395508, 0.08360576629638672, 0.08590078353881836, 0.08819580078125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 7.0, 20.0, 111.0, 351.0, 1445.0, 132671.0, 4056925.0, 2124.0, 460.0, 117.0, 25.0, 16.0, 7.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.16009521484375, -6.7850341796875, -6.40997314453125, -6.034912109375, -5.65985107421875, -5.2847900390625, -4.90972900390625, -4.53466796875, -4.15960693359375, -3.7845458984375, -3.40948486328125, -3.034423828125, -2.65936279296875, -2.2843017578125, -1.90924072265625, -1.5341796875, -1.15911865234375, -0.7840576171875, -0.40899658203125, -0.033935546875, 0.34112548828125, 0.7161865234375, 1.09124755859375, 1.46630859375, 1.84136962890625, 2.2164306640625, 2.59149169921875, 2.966552734375, 3.34161376953125, 3.7166748046875, 4.09173583984375, 4.466796875, 4.84185791015625, 5.2169189453125, 5.59197998046875, 5.967041015625, 6.34210205078125, 6.7171630859375, 7.09222412109375, 7.46728515625, 7.84234619140625, 8.2174072265625, 8.59246826171875, 8.967529296875, 9.34259033203125, 9.7176513671875, 10.09271240234375, 10.4677734375, 10.84283447265625, 11.2178955078125, 11.59295654296875, 11.968017578125, 12.34307861328125, 12.7181396484375, 13.09320068359375, 13.46826171875, 13.84332275390625, 14.2183837890625, 14.59344482421875, 14.968505859375, 15.34356689453125, 15.7186279296875, 16.09368896484375, 16.46875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 23.0, 57.0, 445.0, 3196.0, 286.0, 54.0, 16.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81884765625, -0.7852554321289062, -0.7516632080078125, -0.7180709838867188, -0.684478759765625, -0.6508865356445312, -0.6172943115234375, -0.5837020874023438, -0.55010986328125, -0.5165176391601562, -0.4829254150390625, -0.44933319091796875, -0.415740966796875, -0.38214874267578125, -0.3485565185546875, -0.31496429443359375, -0.2813720703125, -0.24777984619140625, -0.2141876220703125, -0.18059539794921875, -0.147003173828125, -0.11341094970703125, -0.0798187255859375, -0.04622650146484375, -0.01263427734375, 0.02095794677734375, 0.0545501708984375, 0.08814239501953125, 0.121734619140625, 0.15532684326171875, 0.1889190673828125, 0.22251129150390625, 0.256103515625, 0.28969573974609375, 0.3232879638671875, 0.35688018798828125, 0.390472412109375, 0.42406463623046875, 0.4576568603515625, 0.49124908447265625, 0.52484130859375, 0.5584335327148438, 0.5920257568359375, 0.6256179809570312, 0.659210205078125, 0.6928024291992188, 0.7263946533203125, 0.7599868774414062, 0.7935791015625, 0.8271713256835938, 0.8607635498046875, 0.8943557739257812, 0.927947998046875, 0.9615402221679688, 0.9951324462890625, 1.0287246704101562, 1.06231689453125, 1.0959091186523438, 1.1295013427734375, 1.1630935668945312, 1.196685791015625, 1.2302780151367188, 1.2638702392578125, 1.2974624633789062, 1.3310546875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 8.0, 19.0, 92.0, 423.0, 367.0, 66.0, 21.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-13.477032661437988, -13.195364952087402, -12.913697242736816, -12.632030487060547, -12.350362777709961, -12.068695068359375, -11.787027359008789, -11.505359649658203, -11.223692893981934, -10.942025184631348, -10.660357475280762, -10.378690719604492, -10.097023010253906, -9.81535530090332, -9.533687591552734, -9.252019882202148, -8.970352172851562, -8.688684463500977, -8.40701675415039, -8.125349998474121, -7.843682289123535, -7.562014579772949, -7.280346870422363, -6.9986796379089355, -6.717012405395508, -6.435344696044922, -6.153677463531494, -5.872009754180908, -5.5903425216674805, -5.3086748123168945, -5.027007102966309, -4.745339870452881, -4.463673114776611, -4.182005405426025, -3.9003381729125977, -3.6186704635620117, -3.337003231048584, -3.055335521697998, -2.773668050765991, -2.4920005798339844, -2.2103331089019775, -1.9286656379699707, -1.6469981670379639, -1.3653305768966675, -1.0836631059646606, -0.8019956350326538, -0.5203280448913574, -0.23866057395935059, 0.04300689697265625, 0.3246743977069855, 0.6063418984413147, 0.8880094289779663, 1.1696768999099731, 1.45134437084198, 1.7330119609832764, 2.014679431915283, 2.29634690284729, 2.578014373779297, 2.8596818447113037, 3.1413493156433105, 3.4230170249938965, 3.704684257507324, 3.98635196685791, 4.268019676208496, 4.549686908721924]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 11.0, 11.0, 35.0, 37.0, 38.0, 47.0, 62.0, 62.0, 69.0, 92.0, 81.0, 88.0, 59.0, 72.0, 56.0, 40.0, 39.0, 23.0, 26.0, 13.0, 10.0, 10.0, 7.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4030470848083496, -1.3432602882385254, -1.2834734916687012, -1.2236865758895874, -1.1638997793197632, -1.104112982749939, -1.0443260669708252, -0.984539270401001, -0.9247524738311768, -0.8649656772613525, -0.8051788210868835, -0.7453919649124146, -0.6856051683425903, -0.6258183717727661, -0.5660315155982971, -0.5062446594238281, -0.4464578628540039, -0.3866710364818573, -0.3268842101097107, -0.2670973837375641, -0.20731055736541748, -0.14752373099327087, -0.08773690462112427, -0.02795007824897766, 0.031836748123168945, 0.09162357449531555, 0.15141040086746216, 0.21119722723960876, 0.27098405361175537, 0.330770879983902, 0.3905577063560486, 0.4503445327281952, 0.5101313591003418, 0.569918155670166, 0.629705011844635, 0.689491868019104, 0.7492786645889282, 0.8090654611587524, 0.8688523173332214, 0.9286391735076904, 0.9884259700775146, 1.0482127666473389, 1.107999563217163, 1.1677864789962769, 1.227573275566101, 1.2873600721359253, 1.347146987915039, 1.4069337844848633, 1.4667205810546875, 1.5265073776245117, 1.586294174194336, 1.6460810899734497, 1.705867886543274, 1.7656546831130981, 1.825441598892212, 1.8852283954620361, 1.9450151920318604, 2.0048019886016846, 2.064588785171509, 2.124375581741333, 2.1841626167297363, 2.2439494132995605, 2.3037362098693848, 2.363523006439209, 2.423309803009033]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 5.0, 3.0, 8.0, 10.0, 9.0, 7.0, 15.0, 19.0, 23.0, 38.0, 56.0, 76.0, 107.0, 182.0, 340.0, 732.0, 1954.0, 9527.0, 121676.0, 813378.0, 89147.0, 7955.0, 1810.0, 594.0, 304.0, 197.0, 122.0, 60.0, 51.0, 38.0, 23.0, 23.0, 10.0, 11.0, 10.0, 8.0, 8.0, 5.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.971160888671875, -1.89935302734375, -1.827545166015625, -1.7557373046875, -1.683929443359375, -1.61212158203125, -1.540313720703125, -1.468505859375, -1.396697998046875, -1.32489013671875, -1.253082275390625, -1.1812744140625, -1.109466552734375, -1.03765869140625, -0.965850830078125, -0.89404296875, -0.822235107421875, -0.75042724609375, -0.678619384765625, -0.6068115234375, -0.535003662109375, -0.46319580078125, -0.391387939453125, -0.319580078125, -0.247772216796875, -0.17596435546875, -0.104156494140625, -0.0323486328125, 0.039459228515625, 0.11126708984375, 0.183074951171875, 0.2548828125, 0.326690673828125, 0.39849853515625, 0.470306396484375, 0.5421142578125, 0.613922119140625, 0.68572998046875, 0.757537841796875, 0.829345703125, 0.901153564453125, 0.97296142578125, 1.044769287109375, 1.1165771484375, 1.188385009765625, 1.26019287109375, 1.332000732421875, 1.40380859375, 1.475616455078125, 1.54742431640625, 1.619232177734375, 1.6910400390625, 1.762847900390625, 1.83465576171875, 1.906463623046875, 1.978271484375, 2.050079345703125, 2.12188720703125, 2.193695068359375, 2.2655029296875, 2.337310791015625, 2.40911865234375, 2.480926513671875, 2.552734375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 6.0, 8.0, 19.0, 19.0, 37.0, 33.0, 49.0, 48.0, 57.0, 74.0, 78.0, 83.0, 87.0, 66.0, 82.0, 60.0, 48.0, 35.0, 34.0, 22.0, 15.0, 15.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10760498046875, -0.10328388214111328, -0.09896278381347656, -0.09464168548583984, -0.09032058715820312, -0.0859994888305664, -0.08167839050292969, -0.07735729217529297, -0.07303619384765625, -0.06871509552001953, -0.06439399719238281, -0.060072898864746094, -0.055751800537109375, -0.051430702209472656, -0.04710960388183594, -0.04278850555419922, -0.0384674072265625, -0.03414630889892578, -0.029825210571289062, -0.025504112243652344, -0.021183013916015625, -0.016861915588378906, -0.012540817260742188, -0.008219718933105469, -0.00389862060546875, 0.00042247772216796875, 0.0047435760498046875, 0.009064674377441406, 0.013385772705078125, 0.017706871032714844, 0.022027969360351562, 0.02634906768798828, 0.030670166015625, 0.03499126434326172, 0.03931236267089844, 0.043633460998535156, 0.047954559326171875, 0.052275657653808594, 0.05659675598144531, 0.06091785430908203, 0.06523895263671875, 0.06956005096435547, 0.07388114929199219, 0.0782022476196289, 0.08252334594726562, 0.08684444427490234, 0.09116554260253906, 0.09548664093017578, 0.0998077392578125, 0.10412883758544922, 0.10844993591308594, 0.11277103424072266, 0.11709213256835938, 0.1214132308959961, 0.1257343292236328, 0.13005542755126953, 0.13437652587890625, 0.13869762420654297, 0.1430187225341797, 0.1473398208618164, 0.15166091918945312, 0.15598201751708984, 0.16030311584472656, 0.16462421417236328, 0.1689453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 7.0, 6.0, 7.0, 7.0, 5.0, 10.0, 8.0, 25.0, 18.0, 33.0, 43.0, 68.0, 103.0, 134.0, 243.0, 394.0, 681.0, 1370.0, 2874.0, 6649.0, 18708.0, 67751.0, 299323.0, 473365.0, 127284.0, 31236.0, 10022.0, 3999.0, 1810.0, 950.0, 544.0, 327.0, 180.0, 130.0, 72.0, 49.0, 36.0, 25.0, 22.0, 13.0, 10.0, 2.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.92578125, -0.8994903564453125, -0.873199462890625, -0.8469085693359375, -0.82061767578125, -0.7943267822265625, -0.768035888671875, -0.7417449951171875, -0.7154541015625, -0.6891632080078125, -0.662872314453125, -0.6365814208984375, -0.61029052734375, -0.5839996337890625, -0.557708740234375, -0.5314178466796875, -0.505126953125, -0.4788360595703125, -0.452545166015625, -0.4262542724609375, -0.39996337890625, -0.3736724853515625, -0.347381591796875, -0.3210906982421875, -0.2947998046875, -0.2685089111328125, -0.242218017578125, -0.2159271240234375, -0.18963623046875, -0.1633453369140625, -0.137054443359375, -0.1107635498046875, -0.08447265625, -0.0581817626953125, -0.031890869140625, -0.0055999755859375, 0.02069091796875, 0.0469818115234375, 0.073272705078125, 0.0995635986328125, 0.1258544921875, 0.1521453857421875, 0.178436279296875, 0.2047271728515625, 0.23101806640625, 0.2573089599609375, 0.283599853515625, 0.3098907470703125, 0.336181640625, 0.3624725341796875, 0.388763427734375, 0.4150543212890625, 0.44134521484375, 0.4676361083984375, 0.493927001953125, 0.5202178955078125, 0.5465087890625, 0.5727996826171875, 0.599090576171875, 0.6253814697265625, 0.65167236328125, 0.6779632568359375, 0.704254150390625, 0.7305450439453125, 0.7568359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 3.0, 11.0, 12.0, 7.0, 15.0, 13.0, 17.0, 21.0, 26.0, 27.0, 35.0, 42.0, 47.0, 47.0, 53.0, 56.0, 56.0, 57.0, 58.0, 51.0, 33.0, 45.0, 42.0, 38.0, 31.0, 26.0, 20.0, 25.0, 15.0, 8.0, 14.0, 16.0, 5.0, 2.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.5205078125, -0.5063667297363281, -0.49222564697265625, -0.4780845642089844, -0.4639434814453125, -0.4498023986816406, -0.43566131591796875, -0.4215202331542969, -0.407379150390625, -0.3932380676269531, -0.37909698486328125, -0.3649559020996094, -0.3508148193359375, -0.3366737365722656, -0.32253265380859375, -0.3083915710449219, -0.29425048828125, -0.2801094055175781, -0.26596832275390625, -0.2518272399902344, -0.2376861572265625, -0.22354507446289062, -0.20940399169921875, -0.19526290893554688, -0.181121826171875, -0.16698074340820312, -0.15283966064453125, -0.13869857788085938, -0.1245574951171875, -0.11041641235351562, -0.09627532958984375, -0.08213424682617188, -0.0679931640625, -0.053852081298828125, -0.03971099853515625, -0.025569915771484375, -0.0114288330078125, 0.002712249755859375, 0.01685333251953125, 0.030994415283203125, 0.045135498046875, 0.059276580810546875, 0.07341766357421875, 0.08755874633789062, 0.1016998291015625, 0.11584091186523438, 0.12998199462890625, 0.14412307739257812, 0.15826416015625, 0.17240524291992188, 0.18654632568359375, 0.20068740844726562, 0.2148284912109375, 0.22896957397460938, 0.24311065673828125, 0.2572517395019531, 0.271392822265625, 0.2855339050292969, 0.29967498779296875, 0.3138160705566406, 0.3279571533203125, 0.3420982360839844, 0.35623931884765625, 0.3703804016113281, 0.384521484375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 2.0, 6.0, 3.0, 7.0, 4.0, 13.0, 17.0, 28.0, 40.0, 61.0, 114.0, 174.0, 485.0, 1438.0, 5390.0, 33847.0, 847142.0, 144494.0, 11270.0, 2563.0, 791.0, 300.0, 142.0, 73.0, 43.0, 24.0, 18.0, 20.0, 16.0, 3.0, 5.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-1.333984375, -1.2966461181640625, -1.259307861328125, -1.2219696044921875, -1.18463134765625, -1.1472930908203125, -1.109954833984375, -1.0726165771484375, -1.0352783203125, -0.9979400634765625, -0.960601806640625, -0.9232635498046875, -0.88592529296875, -0.8485870361328125, -0.811248779296875, -0.7739105224609375, -0.736572265625, -0.6992340087890625, -0.661895751953125, -0.6245574951171875, -0.58721923828125, -0.5498809814453125, -0.512542724609375, -0.4752044677734375, -0.4378662109375, -0.4005279541015625, -0.363189697265625, -0.3258514404296875, -0.28851318359375, -0.2511749267578125, -0.213836669921875, -0.1764984130859375, -0.13916015625, -0.1018218994140625, -0.064483642578125, -0.0271453857421875, 0.01019287109375, 0.0475311279296875, 0.084869384765625, 0.1222076416015625, 0.1595458984375, 0.1968841552734375, 0.234222412109375, 0.2715606689453125, 0.30889892578125, 0.3462371826171875, 0.383575439453125, 0.4209136962890625, 0.458251953125, 0.4955902099609375, 0.532928466796875, 0.5702667236328125, 0.60760498046875, 0.6449432373046875, 0.682281494140625, 0.7196197509765625, 0.7569580078125, 0.7942962646484375, 0.831634521484375, 0.8689727783203125, 0.90631103515625, 0.9436492919921875, 0.980987548828125, 1.0183258056640625, 1.0556640625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 10.0, 6.0, 8.0, 9.0, 9.0, 23.0, 25.0, 34.0, 46.0, 69.0, 118.0, 110.0, 127.0, 121.0, 98.0, 62.0, 34.0, 21.0, 24.0, 11.0, 6.0, 8.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.207559585571289e-05, -7.894355803728104e-05, -7.581152021884918e-05, -7.267948240041733e-05, -6.954744458198547e-05, -6.641540676355362e-05, -6.328336894512177e-05, -6.015133112668991e-05, -5.701929330825806e-05, -5.38872554898262e-05, -5.075521767139435e-05, -4.7623179852962494e-05, -4.449114203453064e-05, -4.1359104216098785e-05, -3.822706639766693e-05, -3.509502857923508e-05, -3.196299076080322e-05, -2.883095294237137e-05, -2.5698915123939514e-05, -2.256687730550766e-05, -1.9434839487075806e-05, -1.630280166864395e-05, -1.3170763850212097e-05, -1.0038726031780243e-05, -6.906688213348389e-06, -3.7746503949165344e-06, -6.426125764846802e-07, 2.489425241947174e-06, 5.621463060379028e-06, 8.753500878810883e-06, 1.1885538697242737e-05, 1.5017576515674591e-05, 1.8149614334106445e-05, 2.12816521525383e-05, 2.4413689970970154e-05, 2.7545727789402008e-05, 3.067776560783386e-05, 3.3809803426265717e-05, 3.694184124469757e-05, 4.0073879063129425e-05, 4.320591688156128e-05, 4.6337954699993134e-05, 4.946999251842499e-05, 5.260203033685684e-05, 5.5734068155288696e-05, 5.886610597372055e-05, 6.19981437921524e-05, 6.513018161058426e-05, 6.826221942901611e-05, 7.139425724744797e-05, 7.452629506587982e-05, 7.765833288431168e-05, 8.079037070274353e-05, 8.392240852117538e-05, 8.705444633960724e-05, 9.018648415803909e-05, 9.331852197647095e-05, 9.64505597949028e-05, 9.958259761333466e-05, 0.00010271463543176651, 0.00010584667325019836, 0.00010897871106863022, 0.00011211074888706207, 0.00011524278670549393, 0.00011837482452392578]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 8.0, 9.0, 10.0, 11.0, 23.0, 28.0, 43.0, 73.0, 81.0, 142.0, 211.0, 443.0, 820.0, 1789.0, 4205.0, 11410.0, 47320.0, 555671.0, 374097.0, 35713.0, 9474.0, 3605.0, 1651.0, 734.0, 399.0, 232.0, 118.0, 75.0, 49.0, 22.0, 21.0, 16.0, 15.0, 10.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.65185546875, -0.6326370239257812, -0.6134185791015625, -0.5942001342773438, -0.574981689453125, -0.5557632446289062, -0.5365447998046875, -0.5173263549804688, -0.49810791015625, -0.47888946533203125, -0.4596710205078125, -0.44045257568359375, -0.421234130859375, -0.40201568603515625, -0.3827972412109375, -0.36357879638671875, -0.3443603515625, -0.32514190673828125, -0.3059234619140625, -0.28670501708984375, -0.267486572265625, -0.24826812744140625, -0.2290496826171875, -0.20983123779296875, -0.19061279296875, -0.17139434814453125, -0.1521759033203125, -0.13295745849609375, -0.113739013671875, -0.09452056884765625, -0.0753021240234375, -0.05608367919921875, -0.036865234375, -0.01764678955078125, 0.0015716552734375, 0.02079010009765625, 0.040008544921875, 0.05922698974609375, 0.0784454345703125, 0.09766387939453125, 0.11688232421875, 0.13610076904296875, 0.1553192138671875, 0.17453765869140625, 0.193756103515625, 0.21297454833984375, 0.2321929931640625, 0.25141143798828125, 0.2706298828125, 0.28984832763671875, 0.3090667724609375, 0.32828521728515625, 0.347503662109375, 0.36672210693359375, 0.3859405517578125, 0.40515899658203125, 0.42437744140625, 0.44359588623046875, 0.4628143310546875, 0.48203277587890625, 0.501251220703125, 0.5204696655273438, 0.5396881103515625, 0.5589065551757812, 0.578125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 3.0, 6.0, 2.0, 5.0, 6.0, 6.0, 9.0, 14.0, 29.0, 42.0, 74.0, 134.0, 177.0, 178.0, 107.0, 80.0, 47.0, 26.0, 16.0, 9.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.486328125, -0.4715843200683594, -0.45684051513671875, -0.4420967102050781, -0.4273529052734375, -0.4126091003417969, -0.39786529541015625, -0.3831214904785156, -0.368377685546875, -0.3536338806152344, -0.33889007568359375, -0.3241462707519531, -0.3094024658203125, -0.2946586608886719, -0.27991485595703125, -0.2651710510253906, -0.25042724609375, -0.23568344116210938, -0.22093963623046875, -0.20619583129882812, -0.1914520263671875, -0.17670822143554688, -0.16196441650390625, -0.14722061157226562, -0.132476806640625, -0.11773300170898438, -0.10298919677734375, -0.08824539184570312, -0.0735015869140625, -0.058757781982421875, -0.04401397705078125, -0.029270172119140625, -0.0145263671875, 0.000217437744140625, 0.01496124267578125, 0.029705047607421875, 0.0444488525390625, 0.059192657470703125, 0.07393646240234375, 0.08868026733398438, 0.103424072265625, 0.11816787719726562, 0.13291168212890625, 0.14765548706054688, 0.1623992919921875, 0.17714309692382812, 0.19188690185546875, 0.20663070678710938, 0.22137451171875, 0.23611831665039062, 0.25086212158203125, 0.2656059265136719, 0.2803497314453125, 0.2950935363769531, 0.30983734130859375, 0.3245811462402344, 0.339324951171875, 0.3540687561035156, 0.36881256103515625, 0.3835563659667969, 0.3983001708984375, 0.4130439758300781, 0.42778778076171875, 0.4425315856933594, 0.457275390625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 7.0, 5.0, 32.0, 113.0, 239.0, 334.0, 171.0, 69.0, 20.0, 12.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.548263549804688, -9.185465812683105, -8.822668075561523, -8.459871292114258, -8.097073554992676, -7.734275817871094, -7.371478080749512, -7.008680820465088, -6.645883560180664, -6.283085823059082, -5.920288562774658, -5.557490825653076, -5.194693565368652, -4.83189582824707, -4.469098091125488, -4.1063008308410645, -3.7435030937194824, -3.3807055950164795, -3.0179080963134766, -2.6551103591918945, -2.2923130989074707, -1.9295154809951782, -1.5667178630828857, -1.2039203643798828, -0.8411228656768799, -0.47832533717155457, -0.11552780866622925, 0.24726974964141846, 0.6100672483444214, 0.9728647470474243, 1.3356623649597168, 1.6984598636627197, 2.0612573623657227, 2.4240548610687256, 2.7868523597717285, 3.1496500968933105, 3.5124473571777344, 3.8752450942993164, 4.238042831420898, 4.600840091705322, 4.963637351989746, 5.326435089111328, 5.689232349395752, 6.052030086517334, 6.414827346801758, 6.77762508392334, 7.140422821044922, 7.503220081329346, 7.866017818450928, 8.228815078735352, 8.591612815856934, 8.954410552978516, 9.317208290100098, 9.680005073547363, 10.042802810668945, 10.405600547790527, 10.76839828491211, 11.131196022033691, 11.493993759155273, 11.856790542602539, 12.219588279724121, 12.582386016845703, 12.945183753967285, 13.307981491088867, 13.670778274536133]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 7.0, 4.0, 7.0, 7.0, 12.0, 17.0, 16.0, 16.0, 25.0, 25.0, 34.0, 30.0, 39.0, 40.0, 39.0, 54.0, 46.0, 47.0, 61.0, 59.0, 43.0, 56.0, 52.0, 37.0, 44.0, 32.0, 31.0, 26.0, 23.0, 13.0, 14.0, 5.0, 14.0, 4.0, 11.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0359015464782715, -2.949129104614258, -2.862356424331665, -2.7755839824676514, -2.6888115406036377, -2.602038860321045, -2.5152664184570312, -2.4284939765930176, -2.341721296310425, -2.254948854446411, -2.1681761741638184, -2.0814037322998047, -1.9946311712265015, -1.9078586101531982, -1.8210861682891846, -1.7343136072158813, -1.6475411653518677, -1.5607686042785645, -1.4739961624145508, -1.3872236013412476, -1.3004510402679443, -1.2136785984039307, -1.1269060373306274, -1.0401334762573242, -0.9533609747886658, -0.8665884733200073, -0.7798159122467041, -0.6930434107780457, -0.6062709093093872, -0.519498348236084, -0.43272584676742554, -0.3459532856941223, -0.25918078422546387, -0.17240825295448303, -0.08563573658466339, 0.00113677978515625, 0.08790931105613708, 0.17468184232711792, 0.26145434379577637, 0.3482269048690796, 0.43499940633773804, 0.5217719078063965, 0.6085444688796997, 0.6953169703483582, 0.7820894718170166, 0.8688620328903198, 0.9556345343589783, 1.0424070358276367, 1.12917959690094, 1.2159521579742432, 1.3027245998382568, 1.38949716091156, 1.4762697219848633, 1.563042163848877, 1.6498147249221802, 1.7365872859954834, 1.823359727859497, 1.9101322889328003, 1.996904730796814, 2.083677291870117, 2.170449733734131, 2.2572224140167236, 2.3439948558807373, 2.43076753616333, 2.5175399780273438]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 6.0, 6.0, 6.0, 5.0, 8.0, 13.0, 7.0, 11.0, 16.0, 22.0, 17.0, 26.0, 38.0, 70.0, 71.0, 128.0, 242.0, 496.0, 1420.0, 6761.0, 71579.0, 3989565.0, 110789.0, 9486.0, 2028.0, 674.0, 309.0, 170.0, 88.0, 78.0, 42.0, 28.0, 19.0, 20.0, 10.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0], "bins": [-3.2578125, -3.17547607421875, -3.0931396484375, -3.01080322265625, -2.928466796875, -2.84613037109375, -2.7637939453125, -2.68145751953125, -2.59912109375, -2.51678466796875, -2.4344482421875, -2.35211181640625, -2.269775390625, -2.18743896484375, -2.1051025390625, -2.02276611328125, -1.9404296875, -1.85809326171875, -1.7757568359375, -1.69342041015625, -1.611083984375, -1.52874755859375, -1.4464111328125, -1.36407470703125, -1.28173828125, -1.19940185546875, -1.1170654296875, -1.03472900390625, -0.952392578125, -0.87005615234375, -0.7877197265625, -0.70538330078125, -0.623046875, -0.54071044921875, -0.4583740234375, -0.37603759765625, -0.293701171875, -0.21136474609375, -0.1290283203125, -0.04669189453125, 0.03564453125, 0.11798095703125, 0.2003173828125, 0.28265380859375, 0.364990234375, 0.44732666015625, 0.5296630859375, 0.61199951171875, 0.6943359375, 0.77667236328125, 0.8590087890625, 0.94134521484375, 1.023681640625, 1.10601806640625, 1.1883544921875, 1.27069091796875, 1.35302734375, 1.43536376953125, 1.5177001953125, 1.60003662109375, 1.682373046875, 1.76470947265625, 1.8470458984375, 1.92938232421875, 2.01171875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 3.0, 10.0, 12.0, 16.0, 18.0, 26.0, 34.0, 41.0, 41.0, 43.0, 45.0, 50.0, 55.0, 80.0, 60.0, 54.0, 69.0, 46.0, 47.0, 47.0, 31.0, 33.0, 27.0, 23.0, 22.0, 19.0, 19.0, 12.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08978271484375, -0.08627033233642578, -0.08275794982910156, -0.07924556732177734, -0.07573318481445312, -0.0722208023071289, -0.06870841979980469, -0.06519603729248047, -0.06168365478515625, -0.05817127227783203, -0.05465888977050781, -0.051146507263183594, -0.047634124755859375, -0.044121742248535156, -0.04060935974121094, -0.03709697723388672, -0.0335845947265625, -0.03007221221923828, -0.026559829711914062, -0.023047447204589844, -0.019535064697265625, -0.016022682189941406, -0.012510299682617188, -0.008997917175292969, -0.00548553466796875, -0.0019731521606445312, 0.0015392303466796875, 0.005051612854003906, 0.008563995361328125, 0.012076377868652344, 0.015588760375976562, 0.01910114288330078, 0.022613525390625, 0.02612590789794922, 0.029638290405273438, 0.033150672912597656, 0.036663055419921875, 0.040175437927246094, 0.04368782043457031, 0.04720020294189453, 0.05071258544921875, 0.05422496795654297, 0.05773735046386719, 0.061249732971191406, 0.06476211547851562, 0.06827449798583984, 0.07178688049316406, 0.07529926300048828, 0.0788116455078125, 0.08232402801513672, 0.08583641052246094, 0.08934879302978516, 0.09286117553710938, 0.0963735580444336, 0.09988594055175781, 0.10339832305908203, 0.10691070556640625, 0.11042308807373047, 0.11393547058105469, 0.1174478530883789, 0.12096023559570312, 0.12447261810302734, 0.12798500061035156, 0.13149738311767578, 0.135009765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 14.0, 22.0, 42.0, 101.0, 177.0, 442.0, 1090.0, 4229.0, 258600.0, 3920113.0, 7162.0, 1283.0, 514.0, 244.0, 106.0, 49.0, 38.0, 23.0, 13.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.69921875, -2.55810546875, -2.4169921875, -2.27587890625, -2.134765625, -1.99365234375, -1.8525390625, -1.71142578125, -1.5703125, -1.42919921875, -1.2880859375, -1.14697265625, -1.005859375, -0.86474609375, -0.7236328125, -0.58251953125, -0.44140625, -0.30029296875, -0.1591796875, -0.01806640625, 0.123046875, 0.26416015625, 0.4052734375, 0.54638671875, 0.6875, 0.82861328125, 0.9697265625, 1.11083984375, 1.251953125, 1.39306640625, 1.5341796875, 1.67529296875, 1.81640625, 1.95751953125, 2.0986328125, 2.23974609375, 2.380859375, 2.52197265625, 2.6630859375, 2.80419921875, 2.9453125, 3.08642578125, 3.2275390625, 3.36865234375, 3.509765625, 3.65087890625, 3.7919921875, 3.93310546875, 4.07421875, 4.21533203125, 4.3564453125, 4.49755859375, 4.638671875, 4.77978515625, 4.9208984375, 5.06201171875, 5.203125, 5.34423828125, 5.4853515625, 5.62646484375, 5.767578125, 5.90869140625, 6.0498046875, 6.19091796875, 6.33203125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 13.0, 34.0, 81.0, 366.0, 2830.0, 558.0, 132.0, 36.0, 12.0, 10.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52294921875, -0.49877166748046875, -0.4745941162109375, -0.45041656494140625, -0.426239013671875, -0.40206146240234375, -0.3778839111328125, -0.35370635986328125, -0.32952880859375, -0.30535125732421875, -0.2811737060546875, -0.25699615478515625, -0.232818603515625, -0.20864105224609375, -0.1844635009765625, -0.16028594970703125, -0.1361083984375, -0.11193084716796875, -0.0877532958984375, -0.06357574462890625, -0.039398193359375, -0.01522064208984375, 0.0089569091796875, 0.03313446044921875, 0.05731201171875, 0.08148956298828125, 0.1056671142578125, 0.12984466552734375, 0.154022216796875, 0.17819976806640625, 0.2023773193359375, 0.22655487060546875, 0.250732421875, 0.27490997314453125, 0.2990875244140625, 0.32326507568359375, 0.347442626953125, 0.37162017822265625, 0.3957977294921875, 0.41997528076171875, 0.44415283203125, 0.46833038330078125, 0.4925079345703125, 0.5166854858398438, 0.540863037109375, 0.5650405883789062, 0.5892181396484375, 0.6133956909179688, 0.6375732421875, 0.6617507934570312, 0.6859283447265625, 0.7101058959960938, 0.734283447265625, 0.7584609985351562, 0.7826385498046875, 0.8068161010742188, 0.83099365234375, 0.8551712036132812, 0.8793487548828125, 0.9035263061523438, 0.927703857421875, 0.9518814086914062, 0.9760589599609375, 1.0002365112304688, 1.0244140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 11.0, 54.0, 303.0, 467.0, 119.0, 33.0, 7.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.450301647186279, -5.225833892822266, -5.00136661529541, -4.776899337768555, -4.552431583404541, -4.327963829040527, -4.103496551513672, -3.8790290355682373, -3.6545615196228027, -3.430094003677368, -3.2056264877319336, -2.981158971786499, -2.7566914558410645, -2.53222393989563, -2.3077564239501953, -2.0832889080047607, -1.8588213920593262, -1.6343538761138916, -1.409886360168457, -1.1854188442230225, -0.9609513282775879, -0.7364838123321533, -0.5120162963867188, -0.2875487804412842, -0.06308126449584961, 0.16138625144958496, 0.38585376739501953, 0.6103212833404541, 0.8347887992858887, 1.0592563152313232, 1.2837238311767578, 1.5081913471221924, 1.7326583862304688, 1.9571259021759033, 2.181593418121338, 2.4060609340667725, 2.630528450012207, 2.8549959659576416, 3.079463481903076, 3.3039309978485107, 3.5283985137939453, 3.75286602973938, 3.9773335456848145, 4.201801300048828, 4.426268577575684, 4.650735855102539, 4.875203609466553, 5.099671363830566, 5.324138641357422, 5.548605918884277, 5.773073673248291, 5.997541427612305, 6.22200870513916, 6.446475982666016, 6.670943737030029, 6.895411491394043, 7.119878768920898, 7.344346046447754, 7.568813800811768, 7.793281555175781, 8.017748832702637, 8.242216110229492, 8.466684341430664, 8.69115161895752, 8.915618896484375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 15.0, 18.0, 13.0, 37.0, 40.0, 43.0, 49.0, 65.0, 74.0, 85.0, 69.0, 73.0, 64.0, 59.0, 60.0, 47.0, 39.0, 45.0, 35.0, 25.0, 11.0, 9.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6858141422271729, -1.6417864561080933, -1.5977587699890137, -1.5537312030792236, -1.509703516960144, -1.4656758308410645, -1.4216482639312744, -1.3776205778121948, -1.3335928916931152, -1.2895652055740356, -1.245537519454956, -1.201509952545166, -1.1574822664260864, -1.1134545803070068, -1.0694270133972168, -1.0253993272781372, -0.9813716411590576, -0.937343955039978, -0.8933163285255432, -0.8492887020111084, -0.8052610158920288, -0.7612333297729492, -0.7172057032585144, -0.6731780767440796, -0.629150390625, -0.5851227045059204, -0.5410950779914856, -0.4970674216747284, -0.4530397653579712, -0.409012109041214, -0.3649844527244568, -0.3209567964076996, -0.27692925930023193, -0.23290160298347473, -0.18887394666671753, -0.14484629034996033, -0.10081863403320312, -0.05679097771644592, -0.01276332139968872, 0.03126433491706848, 0.07529199123382568, 0.11931964755058289, 0.1633473038673401, 0.2073749601840973, 0.2514026165008545, 0.2954302728176117, 0.3394579291343689, 0.3834855854511261, 0.4275132417678833, 0.4715408980846405, 0.5155685544013977, 0.5595961809158325, 0.6036238670349121, 0.6476515531539917, 0.6916791796684265, 0.7357068061828613, 0.7797344923019409, 0.8237621784210205, 0.8677898049354553, 0.9118174314498901, 0.9558451175689697, 0.9998728036880493, 1.043900489807129, 1.087928056716919, 1.1319557428359985]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 2.0, 3.0, 7.0, 10.0, 8.0, 15.0, 13.0, 18.0, 30.0, 27.0, 37.0, 47.0, 83.0, 129.0, 205.0, 312.0, 642.0, 1413.0, 4215.0, 21046.0, 220978.0, 703656.0, 80267.0, 10441.0, 2671.0, 990.0, 481.0, 298.0, 165.0, 88.0, 64.0, 42.0, 34.0, 23.0, 27.0, 15.0, 12.0, 9.0, 3.0, 8.0, 1.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 4.0], "bins": [-2.46875, -2.4025726318359375, -2.336395263671875, -2.2702178955078125, -2.20404052734375, -2.1378631591796875, -2.071685791015625, -2.0055084228515625, -1.9393310546875, -1.8731536865234375, -1.806976318359375, -1.7407989501953125, -1.67462158203125, -1.6084442138671875, -1.542266845703125, -1.4760894775390625, -1.409912109375, -1.3437347412109375, -1.277557373046875, -1.2113800048828125, -1.14520263671875, -1.0790252685546875, -1.012847900390625, -0.9466705322265625, -0.8804931640625, -0.8143157958984375, -0.748138427734375, -0.6819610595703125, -0.61578369140625, -0.5496063232421875, -0.483428955078125, -0.4172515869140625, -0.35107421875, -0.2848968505859375, -0.218719482421875, -0.1525421142578125, -0.08636474609375, -0.0201873779296875, 0.045989990234375, 0.1121673583984375, 0.1783447265625, 0.2445220947265625, 0.310699462890625, 0.3768768310546875, 0.44305419921875, 0.5092315673828125, 0.575408935546875, 0.6415863037109375, 0.707763671875, 0.7739410400390625, 0.840118408203125, 0.9062957763671875, 0.97247314453125, 1.0386505126953125, 1.104827880859375, 1.1710052490234375, 1.2371826171875, 1.3033599853515625, 1.369537353515625, 1.4357147216796875, 1.50189208984375, 1.5680694580078125, 1.634246826171875, 1.7004241943359375, 1.7666015625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 19.0, 10.0, 22.0, 24.0, 38.0, 37.0, 54.0, 51.0, 62.0, 59.0, 65.0, 80.0, 66.0, 66.0, 49.0, 58.0, 56.0, 44.0, 32.0, 27.0, 20.0, 12.0, 8.0, 11.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12237548828125, -0.1180868148803711, -0.11379814147949219, -0.10950946807861328, -0.10522079467773438, -0.10093212127685547, -0.09664344787597656, -0.09235477447509766, -0.08806610107421875, -0.08377742767333984, -0.07948875427246094, -0.07520008087158203, -0.07091140747070312, -0.06662273406982422, -0.06233406066894531, -0.058045387268066406, -0.0537567138671875, -0.049468040466308594, -0.04517936706542969, -0.04089069366455078, -0.036602020263671875, -0.03231334686279297, -0.028024673461914062, -0.023736000061035156, -0.01944732666015625, -0.015158653259277344, -0.010869979858398438, -0.006581306457519531, -0.002292633056640625, 0.0019960403442382812, 0.0062847137451171875, 0.010573387145996094, 0.014862060546875, 0.019150733947753906, 0.023439407348632812, 0.02772808074951172, 0.032016754150390625, 0.03630542755126953, 0.04059410095214844, 0.044882774353027344, 0.04917144775390625, 0.053460121154785156, 0.05774879455566406, 0.06203746795654297, 0.06632614135742188, 0.07061481475830078, 0.07490348815917969, 0.0791921615600586, 0.0834808349609375, 0.0877695083618164, 0.09205818176269531, 0.09634685516357422, 0.10063552856445312, 0.10492420196533203, 0.10921287536621094, 0.11350154876708984, 0.11779022216796875, 0.12207889556884766, 0.12636756896972656, 0.13065624237060547, 0.13494491577148438, 0.13923358917236328, 0.1435222625732422, 0.1478109359741211, 0.152099609375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 9.0, 5.0, 7.0, 4.0, 15.0, 19.0, 29.0, 47.0, 91.0, 152.0, 235.0, 432.0, 955.0, 2315.0, 6706.0, 28079.0, 237433.0, 653549.0, 95982.0, 14980.0, 4244.0, 1643.0, 727.0, 379.0, 197.0, 117.0, 58.0, 44.0, 35.0, 18.0, 10.0, 8.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.337890625, -1.2888946533203125, -1.239898681640625, -1.1909027099609375, -1.14190673828125, -1.0929107666015625, -1.043914794921875, -0.9949188232421875, -0.9459228515625, -0.8969268798828125, -0.847930908203125, -0.7989349365234375, -0.74993896484375, -0.7009429931640625, -0.651947021484375, -0.6029510498046875, -0.553955078125, -0.5049591064453125, -0.455963134765625, -0.4069671630859375, -0.35797119140625, -0.3089752197265625, -0.259979248046875, -0.2109832763671875, -0.1619873046875, -0.1129913330078125, -0.063995361328125, -0.0149993896484375, 0.03399658203125, 0.0829925537109375, 0.131988525390625, 0.1809844970703125, 0.22998046875, 0.2789764404296875, 0.327972412109375, 0.3769683837890625, 0.42596435546875, 0.4749603271484375, 0.523956298828125, 0.5729522705078125, 0.6219482421875, 0.6709442138671875, 0.719940185546875, 0.7689361572265625, 0.81793212890625, 0.8669281005859375, 0.915924072265625, 0.9649200439453125, 1.013916015625, 1.0629119873046875, 1.111907958984375, 1.1609039306640625, 1.20989990234375, 1.2588958740234375, 1.307891845703125, 1.3568878173828125, 1.4058837890625, 1.4548797607421875, 1.503875732421875, 1.5528717041015625, 1.60186767578125, 1.6508636474609375, 1.699859619140625, 1.7488555908203125, 1.7978515625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 6.0, 2.0, 7.0, 5.0, 7.0, 5.0, 7.0, 15.0, 19.0, 14.0, 24.0, 30.0, 36.0, 44.0, 36.0, 49.0, 46.0, 54.0, 44.0, 55.0, 64.0, 49.0, 38.0, 56.0, 34.0, 46.0, 39.0, 29.0, 27.0, 20.0, 22.0, 15.0, 16.0, 9.0, 7.0, 7.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.418212890625, -0.4025154113769531, -0.38681793212890625, -0.3711204528808594, -0.3554229736328125, -0.3397254943847656, -0.32402801513671875, -0.3083305358886719, -0.292633056640625, -0.2769355773925781, -0.26123809814453125, -0.24554061889648438, -0.2298431396484375, -0.21414566040039062, -0.19844818115234375, -0.18275070190429688, -0.16705322265625, -0.15135574340820312, -0.13565826416015625, -0.11996078491210938, -0.1042633056640625, -0.08856582641601562, -0.07286834716796875, -0.057170867919921875, -0.041473388671875, -0.025775909423828125, -0.01007843017578125, 0.005619049072265625, 0.0213165283203125, 0.037014007568359375, 0.05271148681640625, 0.06840896606445312, 0.0841064453125, 0.09980392456054688, 0.11550140380859375, 0.13119888305664062, 0.1468963623046875, 0.16259384155273438, 0.17829132080078125, 0.19398880004882812, 0.209686279296875, 0.22538375854492188, 0.24108123779296875, 0.2567787170410156, 0.2724761962890625, 0.2881736755371094, 0.30387115478515625, 0.3195686340332031, 0.33526611328125, 0.3509635925292969, 0.36666107177734375, 0.3823585510253906, 0.3980560302734375, 0.4137535095214844, 0.42945098876953125, 0.4451484680175781, 0.460845947265625, 0.4765434265136719, 0.49224090576171875, 0.5079383850097656, 0.5236358642578125, 0.5393333435058594, 0.5550308227539062, 0.5707283020019531, 0.58642578125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 3.0, 11.0, 11.0, 22.0, 32.0, 50.0, 78.0, 136.0, 250.0, 390.0, 862.0, 2150.0, 7145.0, 38538.0, 397778.0, 535842.0, 51817.0, 8930.0, 2481.0, 932.0, 453.0, 226.0, 138.0, 85.0, 53.0, 27.0, 22.0, 26.0, 15.0, 11.0, 8.0, 3.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.68212890625, -0.662109375, -0.64208984375, -0.6220703125, -0.60205078125, -0.58203125, -0.56201171875, -0.5419921875, -0.52197265625, -0.501953125, -0.48193359375, -0.4619140625, -0.44189453125, -0.421875, -0.40185546875, -0.3818359375, -0.36181640625, -0.341796875, -0.32177734375, -0.3017578125, -0.28173828125, -0.26171875, -0.24169921875, -0.2216796875, -0.20166015625, -0.181640625, -0.16162109375, -0.1416015625, -0.12158203125, -0.1015625, -0.08154296875, -0.0615234375, -0.04150390625, -0.021484375, -0.00146484375, 0.0185546875, 0.03857421875, 0.05859375, 0.07861328125, 0.0986328125, 0.11865234375, 0.138671875, 0.15869140625, 0.1787109375, 0.19873046875, 0.21875, 0.23876953125, 0.2587890625, 0.27880859375, 0.298828125, 0.31884765625, 0.3388671875, 0.35888671875, 0.37890625, 0.39892578125, 0.4189453125, 0.43896484375, 0.458984375, 0.47900390625, 0.4990234375, 0.51904296875, 0.5390625, 0.55908203125, 0.5791015625, 0.59912109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 10.0, 7.0, 15.0, 11.0, 19.0, 18.0, 54.0, 49.0, 82.0, 110.0, 126.0, 112.0, 106.0, 87.0, 50.0, 34.0, 25.0, 24.0, 17.0, 11.0, 8.0, 4.0, 1.0, 5.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.970499038696289e-05, -8.610356599092484e-05, -8.250214159488678e-05, -7.890071719884872e-05, -7.529929280281067e-05, -7.169786840677261e-05, -6.809644401073456e-05, -6.44950196146965e-05, -6.089359521865845e-05, -5.729217082262039e-05, -5.3690746426582336e-05, -5.008932203054428e-05, -4.6487897634506226e-05, -4.288647323846817e-05, -3.9285048842430115e-05, -3.568362444639206e-05, -3.2082200050354004e-05, -2.848077565431595e-05, -2.4879351258277893e-05, -2.1277926862239838e-05, -1.7676502466201782e-05, -1.4075078070163727e-05, -1.0473653674125671e-05, -6.872229278087616e-06, -3.2708048820495605e-06, 3.3061951398849487e-07, 3.93204391002655e-06, 7.533468306064606e-06, 1.1134892702102661e-05, 1.4736317098140717e-05, 1.8337741494178772e-05, 2.1939165890216827e-05, 2.5540590286254883e-05, 2.9142014682292938e-05, 3.2743439078330994e-05, 3.634486347436905e-05, 3.9946287870407104e-05, 4.354771226644516e-05, 4.7149136662483215e-05, 5.075056105852127e-05, 5.4351985454559326e-05, 5.795340985059738e-05, 6.155483424663544e-05, 6.515625864267349e-05, 6.875768303871155e-05, 7.23591074347496e-05, 7.596053183078766e-05, 7.956195622682571e-05, 8.316338062286377e-05, 8.676480501890182e-05, 9.036622941493988e-05, 9.396765381097794e-05, 9.756907820701599e-05, 0.00010117050260305405, 0.0001047719269990921, 0.00010837335139513016, 0.00011197477579116821, 0.00011557620018720627, 0.00011917762458324432, 0.00012277904897928238, 0.00012638047337532043, 0.0001299818977713585, 0.00013358332216739655, 0.0001371847465634346, 0.00014078617095947266]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 11.0, 17.0, 25.0, 25.0, 33.0, 64.0, 112.0, 168.0, 322.0, 567.0, 1201.0, 2762.0, 7178.0, 23697.0, 115303.0, 580359.0, 255268.0, 42346.0, 11530.0, 4090.0, 1732.0, 805.0, 366.0, 213.0, 122.0, 75.0, 50.0, 37.0, 19.0, 12.0, 10.0, 9.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.36376953125, -0.35109710693359375, -0.3384246826171875, -0.32575225830078125, -0.313079833984375, -0.30040740966796875, -0.2877349853515625, -0.27506256103515625, -0.26239013671875, -0.24971771240234375, -0.2370452880859375, -0.22437286376953125, -0.211700439453125, -0.19902801513671875, -0.1863555908203125, -0.17368316650390625, -0.1610107421875, -0.14833831787109375, -0.1356658935546875, -0.12299346923828125, -0.110321044921875, -0.09764862060546875, -0.0849761962890625, -0.07230377197265625, -0.05963134765625, -0.04695892333984375, -0.0342864990234375, -0.02161407470703125, -0.008941650390625, 0.00373077392578125, 0.0164031982421875, 0.02907562255859375, 0.041748046875, 0.05442047119140625, 0.0670928955078125, 0.07976531982421875, 0.092437744140625, 0.10511016845703125, 0.1177825927734375, 0.13045501708984375, 0.14312744140625, 0.15579986572265625, 0.1684722900390625, 0.18114471435546875, 0.193817138671875, 0.20648956298828125, 0.2191619873046875, 0.23183441162109375, 0.2445068359375, 0.25717926025390625, 0.2698516845703125, 0.28252410888671875, 0.295196533203125, 0.30786895751953125, 0.3205413818359375, 0.33321380615234375, 0.34588623046875, 0.35855865478515625, 0.3712310791015625, 0.38390350341796875, 0.396575927734375, 0.40924835205078125, 0.4219207763671875, 0.43459320068359375, 0.447265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 9.0, 8.0, 9.0, 14.0, 20.0, 25.0, 37.0, 27.0, 28.0, 62.0, 52.0, 73.0, 78.0, 80.0, 80.0, 61.0, 49.0, 52.0, 46.0, 20.0, 30.0, 33.0, 20.0, 19.0, 18.0, 10.0, 5.0, 3.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.2218017578125, -0.2152538299560547, -0.20870590209960938, -0.20215797424316406, -0.19561004638671875, -0.18906211853027344, -0.18251419067382812, -0.1759662628173828, -0.1694183349609375, -0.1628704071044922, -0.15632247924804688, -0.14977455139160156, -0.14322662353515625, -0.13667869567871094, -0.13013076782226562, -0.12358283996582031, -0.117034912109375, -0.11048698425292969, -0.10393905639648438, -0.09739112854003906, -0.09084320068359375, -0.08429527282714844, -0.07774734497070312, -0.07119941711425781, -0.0646514892578125, -0.05810356140136719, -0.051555633544921875, -0.04500770568847656, -0.03845977783203125, -0.03191184997558594, -0.025363922119140625, -0.018815994262695312, -0.01226806640625, -0.0057201385498046875, 0.000827789306640625, 0.0073757171630859375, 0.01392364501953125, 0.020471572875976562, 0.027019500732421875, 0.03356742858886719, 0.0401153564453125, 0.04666328430175781, 0.053211212158203125, 0.05975914001464844, 0.06630706787109375, 0.07285499572753906, 0.07940292358398438, 0.08595085144042969, 0.092498779296875, 0.09904670715332031, 0.10559463500976562, 0.11214256286621094, 0.11869049072265625, 0.12523841857910156, 0.13178634643554688, 0.1383342742919922, 0.1448822021484375, 0.1514301300048828, 0.15797805786132812, 0.16452598571777344, 0.17107391357421875, 0.17762184143066406, 0.18416976928710938, 0.1907176971435547, 0.197265625]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 7.0, 42.0, 71.0, 222.0, 307.0, 208.0, 88.0, 34.0, 12.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.069975852966309, -8.64826774597168, -8.226558685302734, -7.8048505783081055, -7.38314151763916, -6.961433410644531, -6.539724826812744, -6.118016242980957, -5.69630765914917, -5.274599075317383, -4.852890491485596, -4.431181907653809, -4.00947380065918, -3.5877649784088135, -3.1660566329956055, -2.7443480491638184, -2.3226394653320312, -1.9009308815002441, -1.4792224168777466, -1.057513952255249, -0.6358053684234619, -0.2140967845916748, 0.2076115608215332, 0.6293201446533203, 1.0510287284851074, 1.4727373123168945, 1.894445776939392, 2.3161542415618896, 2.7378628253936768, 3.159571409225464, 3.581279754638672, 4.002988338470459, 4.42469596862793, 4.846404552459717, 5.268113136291504, 5.689821243286133, 6.111530303955078, 6.533238410949707, 6.954946994781494, 7.376655578613281, 7.798364162445068, 8.220072746276855, 8.641780853271484, 9.06348991394043, 9.485198020935059, 9.906907081604004, 10.328615188598633, 10.750324249267578, 11.172032356262207, 11.593740463256836, 12.015449523925781, 12.43715763092041, 12.858866691589355, 13.280574798583984, 13.70228385925293, 14.123991966247559, 14.545700073242188, 14.967408180236816, 15.389117240905762, 15.81082534790039, 16.232534408569336, 16.65424346923828, 17.075950622558594, 17.49765968322754, 17.919368743896484]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 9.0, 6.0, 12.0, 11.0, 15.0, 26.0, 36.0, 46.0, 45.0, 32.0, 50.0, 58.0, 62.0, 67.0, 57.0, 70.0, 53.0, 69.0, 46.0, 40.0, 40.0, 27.0, 27.0, 26.0, 26.0, 11.0, 13.0, 12.0, 1.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.658356666564941, -4.537021160125732, -4.415685176849365, -4.294349670410156, -4.173013687133789, -4.05167818069458, -3.930342435836792, -3.809006690979004, -3.687670946121216, -3.5663352012634277, -3.4449994564056396, -3.3236637115478516, -3.2023282051086426, -3.0809924602508545, -2.9596567153930664, -2.8383209705352783, -2.7169852256774902, -2.595649480819702, -2.474313735961914, -2.352978229522705, -2.231642484664917, -2.110306739807129, -1.9889709949493408, -1.8676352500915527, -1.7462997436523438, -1.6249639987945557, -1.5036283731460571, -1.382292628288269, -1.260956883430481, -1.1396212577819824, -1.0182855129241943, -0.8969497680664062, -0.7756140232086182, -0.6542783379554749, -0.5329425930976868, -0.41160690784454346, -0.29027119278907776, -0.16893547773361206, -0.04759979248046875, 0.07373595237731934, 0.19507163763046265, 0.31640735268592834, 0.43774306774139404, 0.5590787529945374, 0.6804144382476807, 0.8017501831054688, 0.9230858683586121, 1.044421672821045, 1.1657572984695435, 1.2870930433273315, 1.40842866897583, 1.5297644138336182, 1.6511001586914062, 1.7724359035491943, 1.8937715291976929, 2.0151071548461914, 2.1364428997039795, 2.2577786445617676, 2.3791143894195557, 2.5004501342773438, 2.6217856407165527, 2.743121385574341, 2.864457130432129, 2.985792875289917, 3.107128620147705]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 7.0, 9.0, 2.0, 10.0, 10.0, 15.0, 17.0, 28.0, 34.0, 32.0, 40.0, 54.0, 83.0, 147.0, 244.0, 624.0, 1643.0, 7369.0, 67802.0, 3816608.0, 275915.0, 18254.0, 3367.0, 1021.0, 419.0, 212.0, 124.0, 68.0, 37.0, 25.0, 18.0, 13.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.27734375, -3.19482421875, -3.1123046875, -3.02978515625, -2.947265625, -2.86474609375, -2.7822265625, -2.69970703125, -2.6171875, -2.53466796875, -2.4521484375, -2.36962890625, -2.287109375, -2.20458984375, -2.1220703125, -2.03955078125, -1.95703125, -1.87451171875, -1.7919921875, -1.70947265625, -1.626953125, -1.54443359375, -1.4619140625, -1.37939453125, -1.296875, -1.21435546875, -1.1318359375, -1.04931640625, -0.966796875, -0.88427734375, -0.8017578125, -0.71923828125, -0.63671875, -0.55419921875, -0.4716796875, -0.38916015625, -0.306640625, -0.22412109375, -0.1416015625, -0.05908203125, 0.0234375, 0.10595703125, 0.1884765625, 0.27099609375, 0.353515625, 0.43603515625, 0.5185546875, 0.60107421875, 0.68359375, 0.76611328125, 0.8486328125, 0.93115234375, 1.013671875, 1.09619140625, 1.1787109375, 1.26123046875, 1.34375, 1.42626953125, 1.5087890625, 1.59130859375, 1.673828125, 1.75634765625, 1.8388671875, 1.92138671875, 2.00390625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 13.0, 7.0, 16.0, 16.0, 24.0, 19.0, 29.0, 40.0, 41.0, 49.0, 61.0, 61.0, 51.0, 58.0, 72.0, 62.0, 48.0, 56.0, 39.0, 46.0, 41.0, 34.0, 21.0, 19.0, 20.0, 12.0, 9.0, 7.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1290283203125, -0.12499237060546875, -0.1209564208984375, -0.11692047119140625, -0.112884521484375, -0.10884857177734375, -0.1048126220703125, -0.10077667236328125, -0.09674072265625, -0.09270477294921875, -0.0886688232421875, -0.08463287353515625, -0.080596923828125, -0.07656097412109375, -0.0725250244140625, -0.06848907470703125, -0.064453125, -0.06041717529296875, -0.0563812255859375, -0.05234527587890625, -0.048309326171875, -0.04427337646484375, -0.0402374267578125, -0.03620147705078125, -0.03216552734375, -0.02812957763671875, -0.0240936279296875, -0.02005767822265625, -0.016021728515625, -0.01198577880859375, -0.0079498291015625, -0.00391387939453125, 0.0001220703125, 0.00415802001953125, 0.0081939697265625, 0.01222991943359375, 0.016265869140625, 0.02030181884765625, 0.0243377685546875, 0.02837371826171875, 0.03240966796875, 0.03644561767578125, 0.0404815673828125, 0.04451751708984375, 0.048553466796875, 0.05258941650390625, 0.0566253662109375, 0.06066131591796875, 0.064697265625, 0.06873321533203125, 0.0727691650390625, 0.07680511474609375, 0.080841064453125, 0.08487701416015625, 0.0889129638671875, 0.09294891357421875, 0.09698486328125, 0.10102081298828125, 0.1050567626953125, 0.10909271240234375, 0.113128662109375, 0.11716461181640625, 0.1212005615234375, 0.12523651123046875, 0.1292724609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 9.0, 18.0, 24.0, 32.0, 77.0, 158.0, 411.0, 1338.0, 6758.0, 300493.0, 3872501.0, 9677.0, 1783.0, 551.0, 184.0, 97.0, 48.0, 38.0, 26.0, 21.0, 11.0, 16.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.72265625, -4.52679443359375, -4.3309326171875, -4.13507080078125, -3.939208984375, -3.74334716796875, -3.5474853515625, -3.35162353515625, -3.15576171875, -2.95989990234375, -2.7640380859375, -2.56817626953125, -2.372314453125, -2.17645263671875, -1.9805908203125, -1.78472900390625, -1.5888671875, -1.39300537109375, -1.1971435546875, -1.00128173828125, -0.805419921875, -0.60955810546875, -0.4136962890625, -0.21783447265625, -0.02197265625, 0.17388916015625, 0.3697509765625, 0.56561279296875, 0.761474609375, 0.95733642578125, 1.1531982421875, 1.34906005859375, 1.544921875, 1.74078369140625, 1.9366455078125, 2.13250732421875, 2.328369140625, 2.52423095703125, 2.7200927734375, 2.91595458984375, 3.11181640625, 3.30767822265625, 3.5035400390625, 3.69940185546875, 3.895263671875, 4.09112548828125, 4.2869873046875, 4.48284912109375, 4.6787109375, 4.87457275390625, 5.0704345703125, 5.26629638671875, 5.462158203125, 5.65802001953125, 5.8538818359375, 6.04974365234375, 6.24560546875, 6.44146728515625, 6.6373291015625, 6.83319091796875, 7.029052734375, 7.22491455078125, 7.4207763671875, 7.61663818359375, 7.8125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 7.0, 6.0, 5.0, 8.0, 6.0, 14.0, 21.0, 20.0, 41.0, 62.0, 112.0, 226.0, 504.0, 1623.0, 791.0, 313.0, 122.0, 85.0, 42.0, 19.0, 17.0, 10.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49951171875, -0.48211669921875, -0.4647216796875, -0.44732666015625, -0.429931640625, -0.41253662109375, -0.3951416015625, -0.37774658203125, -0.3603515625, -0.34295654296875, -0.3255615234375, -0.30816650390625, -0.290771484375, -0.27337646484375, -0.2559814453125, -0.23858642578125, -0.22119140625, -0.20379638671875, -0.1864013671875, -0.16900634765625, -0.151611328125, -0.13421630859375, -0.1168212890625, -0.09942626953125, -0.08203125, -0.06463623046875, -0.0472412109375, -0.02984619140625, -0.012451171875, 0.00494384765625, 0.0223388671875, 0.03973388671875, 0.05712890625, 0.07452392578125, 0.0919189453125, 0.10931396484375, 0.126708984375, 0.14410400390625, 0.1614990234375, 0.17889404296875, 0.1962890625, 0.21368408203125, 0.2310791015625, 0.24847412109375, 0.265869140625, 0.28326416015625, 0.3006591796875, 0.31805419921875, 0.33544921875, 0.35284423828125, 0.3702392578125, 0.38763427734375, 0.405029296875, 0.42242431640625, 0.4398193359375, 0.45721435546875, 0.474609375, 0.49200439453125, 0.5093994140625, 0.52679443359375, 0.544189453125, 0.56158447265625, 0.5789794921875, 0.59637451171875, 0.61376953125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 9.0, 5.0, 20.0, 44.0, 137.0, 304.0, 322.0, 97.0, 33.0, 18.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.602534294128418, -14.303973197937012, -14.005412101745605, -13.706851959228516, -13.40829086303711, -13.109729766845703, -12.811168670654297, -12.51260757446289, -12.214046478271484, -11.915485382080078, -11.616924285888672, -11.318364143371582, -11.019803047180176, -10.72124195098877, -10.422680854797363, -10.124119758605957, -9.825559616088867, -9.526998519897461, -9.228437423706055, -8.929877281188965, -8.631316184997559, -8.332755088806152, -8.034193992614746, -7.73563289642334, -7.437072277069092, -7.1385111808776855, -6.8399505615234375, -6.541389465332031, -6.242828369140625, -5.944267749786377, -5.645706653594971, -5.347146034240723, -5.048583984375, -4.750022888183594, -4.451462268829346, -4.1529011726379395, -3.8543403148651123, -3.555779457092285, -3.257218360900879, -2.9586575031280518, -2.6600966453552246, -2.3615357875823975, -2.0629749298095703, -1.764413833618164, -1.465852975845337, -1.1672921180725098, -0.8687311410903931, -0.5701701641082764, -0.2716093063354492, 0.026951611042022705, 0.32551252841949463, 0.6240734457969666, 0.9226343631744385, 1.2211952209472656, 1.5197561979293823, 1.818317174911499, 2.116878032684326, 2.4154388904571533, 2.7139997482299805, 3.0125608444213867, 3.311121702194214, 3.609682559967041, 3.9082436561584473, 4.206804275512695, 4.505365371704102]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 11.0, 21.0, 11.0, 24.0, 44.0, 49.0, 42.0, 65.0, 50.0, 77.0, 65.0, 62.0, 73.0, 64.0, 63.0, 54.0, 51.0, 50.0, 39.0, 26.0, 15.0, 10.0, 7.0, 9.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.830462694168091, -2.7550129890441895, -2.679563522338867, -2.604114055633545, -2.5286643505096436, -2.453214645385742, -2.37776517868042, -2.3023157119750977, -2.2268660068511963, -2.151416301727295, -2.0759668350219727, -2.0005173683166504, -1.925067663192749, -1.8496180772781372, -1.7741684913635254, -1.6987189054489136, -1.6232693195343018, -1.54781973361969, -1.4723701477050781, -1.3969205617904663, -1.3214709758758545, -1.2460213899612427, -1.1705718040466309, -1.095122218132019, -1.0196726322174072, -0.9442230463027954, -0.8687734603881836, -0.7933238744735718, -0.71787428855896, -0.6424247026443481, -0.5669751167297363, -0.4915255308151245, -0.4160761833190918, -0.34062659740448, -0.26517701148986816, -0.18972742557525635, -0.11427783966064453, -0.038828253746032715, 0.0366213321685791, 0.11207091808319092, 0.18752050399780273, 0.26297008991241455, 0.33841967582702637, 0.4138692617416382, 0.48931884765625, 0.5647684335708618, 0.6402180194854736, 0.7156676054000854, 0.7911171913146973, 0.8665667772293091, 0.9420163631439209, 1.0174659490585327, 1.0929155349731445, 1.1683651208877563, 1.2438147068023682, 1.31926429271698, 1.3947138786315918, 1.4701634645462036, 1.5456130504608154, 1.6210626363754272, 1.696512222290039, 1.7719618082046509, 1.8474113941192627, 1.9228609800338745, 1.9983105659484863]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 3.0, 7.0, 10.0, 10.0, 20.0, 17.0, 23.0, 34.0, 40.0, 64.0, 84.0, 137.0, 156.0, 254.0, 390.0, 759.0, 1761.0, 7435.0, 65520.0, 681039.0, 264118.0, 20496.0, 3435.0, 1140.0, 553.0, 324.0, 200.0, 138.0, 91.0, 86.0, 53.0, 46.0, 25.0, 18.0, 18.0, 14.0, 12.0, 9.0, 6.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.3203125, -2.249481201171875, -2.17864990234375, -2.107818603515625, -2.0369873046875, -1.966156005859375, -1.89532470703125, -1.824493408203125, -1.753662109375, -1.682830810546875, -1.61199951171875, -1.541168212890625, -1.4703369140625, -1.399505615234375, -1.32867431640625, -1.257843017578125, -1.18701171875, -1.116180419921875, -1.04534912109375, -0.974517822265625, -0.9036865234375, -0.832855224609375, -0.76202392578125, -0.691192626953125, -0.620361328125, -0.549530029296875, -0.47869873046875, -0.407867431640625, -0.3370361328125, -0.266204833984375, -0.19537353515625, -0.124542236328125, -0.0537109375, 0.017120361328125, 0.08795166015625, 0.158782958984375, 0.2296142578125, 0.300445556640625, 0.37127685546875, 0.442108154296875, 0.512939453125, 0.583770751953125, 0.65460205078125, 0.725433349609375, 0.7962646484375, 0.867095947265625, 0.93792724609375, 1.008758544921875, 1.07958984375, 1.150421142578125, 1.22125244140625, 1.292083740234375, 1.3629150390625, 1.433746337890625, 1.50457763671875, 1.575408935546875, 1.646240234375, 1.717071533203125, 1.78790283203125, 1.858734130859375, 1.9295654296875, 2.000396728515625, 2.07122802734375, 2.142059326171875, 2.212890625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 6.0, 6.0, 11.0, 21.0, 14.0, 27.0, 40.0, 65.0, 67.0, 95.0, 95.0, 88.0, 88.0, 97.0, 69.0, 57.0, 38.0, 32.0, 32.0, 20.0, 15.0, 10.0, 8.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.263671875, -0.257354736328125, -0.25103759765625, -0.244720458984375, -0.2384033203125, -0.232086181640625, -0.22576904296875, -0.219451904296875, -0.213134765625, -0.206817626953125, -0.20050048828125, -0.194183349609375, -0.1878662109375, -0.181549072265625, -0.17523193359375, -0.168914794921875, -0.16259765625, -0.156280517578125, -0.14996337890625, -0.143646240234375, -0.1373291015625, -0.131011962890625, -0.12469482421875, -0.118377685546875, -0.112060546875, -0.105743408203125, -0.09942626953125, -0.093109130859375, -0.0867919921875, -0.080474853515625, -0.07415771484375, -0.067840576171875, -0.0615234375, -0.055206298828125, -0.04888916015625, -0.042572021484375, -0.0362548828125, -0.029937744140625, -0.02362060546875, -0.017303466796875, -0.010986328125, -0.004669189453125, 0.00164794921875, 0.007965087890625, 0.0142822265625, 0.020599365234375, 0.02691650390625, 0.033233642578125, 0.03955078125, 0.045867919921875, 0.05218505859375, 0.058502197265625, 0.0648193359375, 0.071136474609375, 0.07745361328125, 0.083770751953125, 0.090087890625, 0.096405029296875, 0.10272216796875, 0.109039306640625, 0.1153564453125, 0.121673583984375, 0.12799072265625, 0.134307861328125, 0.140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 6.0, 10.0, 13.0, 22.0, 30.0, 48.0, 46.0, 66.0, 87.0, 127.0, 211.0, 338.0, 479.0, 847.0, 1450.0, 2730.0, 5642.0, 12416.0, 29143.0, 73498.0, 180339.0, 318532.0, 242172.0, 105528.0, 41886.0, 17153.0, 7565.0, 3535.0, 1914.0, 1012.0, 618.0, 367.0, 203.0, 152.0, 108.0, 71.0, 56.0, 38.0, 23.0, 23.0, 18.0, 7.0, 9.0, 4.0, 2.0, 5.0, 7.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5341796875, -0.5167770385742188, -0.4993743896484375, -0.48197174072265625, -0.464569091796875, -0.44716644287109375, -0.4297637939453125, -0.41236114501953125, -0.39495849609375, -0.37755584716796875, -0.3601531982421875, -0.34275054931640625, -0.325347900390625, -0.30794525146484375, -0.2905426025390625, -0.27313995361328125, -0.2557373046875, -0.23833465576171875, -0.2209320068359375, -0.20352935791015625, -0.186126708984375, -0.16872406005859375, -0.1513214111328125, -0.13391876220703125, -0.11651611328125, -0.09911346435546875, -0.0817108154296875, -0.06430816650390625, -0.046905517578125, -0.02950286865234375, -0.0121002197265625, 0.00530242919921875, 0.022705078125, 0.04010772705078125, 0.0575103759765625, 0.07491302490234375, 0.092315673828125, 0.10971832275390625, 0.1271209716796875, 0.14452362060546875, 0.16192626953125, 0.17932891845703125, 0.1967315673828125, 0.21413421630859375, 0.231536865234375, 0.24893951416015625, 0.2663421630859375, 0.28374481201171875, 0.3011474609375, 0.31855010986328125, 0.3359527587890625, 0.35335540771484375, 0.370758056640625, 0.38816070556640625, 0.4055633544921875, 0.42296600341796875, 0.44036865234375, 0.45777130126953125, 0.4751739501953125, 0.49257659912109375, 0.509979248046875, 0.5273818969726562, 0.5447845458984375, 0.5621871948242188, 0.57958984375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 6.0, 3.0, 4.0, 4.0, 14.0, 7.0, 7.0, 11.0, 17.0, 13.0, 16.0, 15.0, 10.0, 18.0, 30.0, 15.0, 32.0, 31.0, 31.0, 26.0, 31.0, 47.0, 33.0, 30.0, 41.0, 35.0, 47.0, 43.0, 40.0, 45.0, 30.0, 28.0, 30.0, 24.0, 28.0, 26.0, 17.0, 21.0, 14.0, 14.0, 12.0, 15.0, 9.0, 6.0, 9.0, 1.0, 3.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.3818359375, -0.3686256408691406, -0.35541534423828125, -0.3422050476074219, -0.3289947509765625, -0.3157844543457031, -0.30257415771484375, -0.2893638610839844, -0.276153564453125, -0.2629432678222656, -0.24973297119140625, -0.23652267456054688, -0.2233123779296875, -0.21010208129882812, -0.19689178466796875, -0.18368148803710938, -0.17047119140625, -0.15726089477539062, -0.14405059814453125, -0.13084030151367188, -0.1176300048828125, -0.10441970825195312, -0.09120941162109375, -0.07799911499023438, -0.064788818359375, -0.051578521728515625, -0.03836822509765625, -0.025157928466796875, -0.0119476318359375, 0.001262664794921875, 0.01447296142578125, 0.027683258056640625, 0.0408935546875, 0.054103851318359375, 0.06731414794921875, 0.08052444458007812, 0.0937347412109375, 0.10694503784179688, 0.12015533447265625, 0.13336563110351562, 0.146575927734375, 0.15978622436523438, 0.17299652099609375, 0.18620681762695312, 0.1994171142578125, 0.21262741088867188, 0.22583770751953125, 0.23904800415039062, 0.25225830078125, 0.2654685974121094, 0.27867889404296875, 0.2918891906738281, 0.3050994873046875, 0.3183097839355469, 0.33152008056640625, 0.3447303771972656, 0.357940673828125, 0.3711509704589844, 0.38436126708984375, 0.3975715637207031, 0.4107818603515625, 0.4239921569824219, 0.43720245361328125, 0.4504127502441406, 0.463623046875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 15.0, 16.0, 23.0, 34.0, 42.0, 71.0, 138.0, 295.0, 566.0, 1337.0, 3501.0, 12289.0, 67805.0, 414828.0, 450923.0, 76472.0, 13627.0, 3870.0, 1367.0, 654.0, 301.0, 168.0, 83.0, 42.0, 19.0, 21.0, 13.0, 3.0, 6.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.447998046875, -0.4325675964355469, -0.41713714599609375, -0.4017066955566406, -0.3862762451171875, -0.3708457946777344, -0.35541534423828125, -0.3399848937988281, -0.324554443359375, -0.3091239929199219, -0.29369354248046875, -0.2782630920410156, -0.2628326416015625, -0.24740219116210938, -0.23197174072265625, -0.21654129028320312, -0.20111083984375, -0.18568038940429688, -0.17024993896484375, -0.15481948852539062, -0.1393890380859375, -0.12395858764648438, -0.10852813720703125, -0.09309768676757812, -0.077667236328125, -0.062236785888671875, -0.04680633544921875, -0.031375885009765625, -0.0159454345703125, -0.000514984130859375, 0.01491546630859375, 0.030345916748046875, 0.0457763671875, 0.061206817626953125, 0.07663726806640625, 0.09206771850585938, 0.1074981689453125, 0.12292861938476562, 0.13835906982421875, 0.15378952026367188, 0.169219970703125, 0.18465042114257812, 0.20008087158203125, 0.21551132202148438, 0.2309417724609375, 0.24637222290039062, 0.26180267333984375, 0.2772331237792969, 0.29266357421875, 0.3080940246582031, 0.32352447509765625, 0.3389549255371094, 0.3543853759765625, 0.3698158264160156, 0.38524627685546875, 0.4006767272949219, 0.416107177734375, 0.4315376281738281, 0.44696807861328125, 0.4623985290527344, 0.4778289794921875, 0.4932594299316406, 0.5086898803710938, 0.5241203308105469, 0.53955078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 5.0, 6.0, 10.0, 11.0, 23.0, 32.0, 35.0, 59.0, 74.0, 83.0, 102.0, 91.0, 105.0, 84.0, 70.0, 56.0, 35.0, 27.0, 19.0, 11.0, 12.0, 14.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.876489639282227e-05, -9.57949087023735e-05, -9.282492101192474e-05, -8.985493332147598e-05, -8.688494563102722e-05, -8.391495794057846e-05, -8.09449702501297e-05, -7.797498255968094e-05, -7.500499486923218e-05, -7.203500717878342e-05, -6.906501948833466e-05, -6.60950317978859e-05, -6.312504410743713e-05, -6.015505641698837e-05, -5.718506872653961e-05, -5.421508103609085e-05, -5.124509334564209e-05, -4.827510565519333e-05, -4.530511796474457e-05, -4.233513027429581e-05, -3.9365142583847046e-05, -3.6395154893398285e-05, -3.3425167202949524e-05, -3.0455179512500763e-05, -2.7485191822052002e-05, -2.451520413160324e-05, -2.154521644115448e-05, -1.857522875070572e-05, -1.5605241060256958e-05, -1.2635253369808197e-05, -9.665265679359436e-06, -6.695277988910675e-06, -3.725290298461914e-06, -7.553026080131531e-07, 2.214685082435608e-06, 5.184672772884369e-06, 8.15466046333313e-06, 1.1124648153781891e-05, 1.4094635844230652e-05, 1.7064623534679413e-05, 2.0034611225128174e-05, 2.3004598915576935e-05, 2.5974586606025696e-05, 2.8944574296474457e-05, 3.191456198692322e-05, 3.488454967737198e-05, 3.785453736782074e-05, 4.08245250582695e-05, 4.379451274871826e-05, 4.676450043916702e-05, 4.9734488129615784e-05, 5.2704475820064545e-05, 5.5674463510513306e-05, 5.864445120096207e-05, 6.161443889141083e-05, 6.458442658185959e-05, 6.755441427230835e-05, 7.052440196275711e-05, 7.349438965320587e-05, 7.646437734365463e-05, 7.94343650341034e-05, 8.240435272455215e-05, 8.537434041500092e-05, 8.834432810544968e-05, 9.131431579589844e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 9.0, 11.0, 14.0, 10.0, 26.0, 35.0, 48.0, 67.0, 125.0, 171.0, 327.0, 503.0, 898.0, 1600.0, 3587.0, 8780.0, 25332.0, 88457.0, 295079.0, 401113.0, 155607.0, 42930.0, 13548.0, 5245.0, 2243.0, 1176.0, 626.0, 359.0, 190.0, 144.0, 94.0, 63.0, 43.0, 32.0, 15.0, 13.0, 10.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.323486328125, -0.31479454040527344, -0.3061027526855469, -0.2974109649658203, -0.28871917724609375, -0.2800273895263672, -0.2713356018066406, -0.26264381408691406, -0.2539520263671875, -0.24526023864746094, -0.23656845092773438, -0.2278766632080078, -0.21918487548828125, -0.2104930877685547, -0.20180130004882812, -0.19310951232910156, -0.184417724609375, -0.17572593688964844, -0.16703414916992188, -0.1583423614501953, -0.14965057373046875, -0.1409587860107422, -0.13226699829101562, -0.12357521057128906, -0.1148834228515625, -0.10619163513183594, -0.09749984741210938, -0.08880805969238281, -0.08011627197265625, -0.07142448425292969, -0.06273269653320312, -0.05404090881347656, -0.04534912109375, -0.03665733337402344, -0.027965545654296875, -0.019273757934570312, -0.01058197021484375, -0.0018901824951171875, 0.006801605224609375, 0.015493392944335938, 0.0241851806640625, 0.03287696838378906, 0.041568756103515625, 0.05026054382324219, 0.05895233154296875, 0.06764411926269531, 0.07633590698242188, 0.08502769470214844, 0.093719482421875, 0.10241127014160156, 0.11110305786132812, 0.11979484558105469, 0.12848663330078125, 0.1371784210205078, 0.14587020874023438, 0.15456199645996094, 0.1632537841796875, 0.17194557189941406, 0.18063735961914062, 0.1893291473388672, 0.19802093505859375, 0.2067127227783203, 0.21540451049804688, 0.22409629821777344, 0.2327880859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 1.0, 3.0, 5.0, 7.0, 9.0, 11.0, 12.0, 11.0, 14.0, 29.0, 34.0, 39.0, 55.0, 55.0, 80.0, 66.0, 46.0, 62.0, 76.0, 55.0, 57.0, 58.0, 48.0, 34.0, 32.0, 22.0, 14.0, 14.0, 10.0, 9.0, 9.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.219482421875, -0.2124652862548828, -0.20544815063476562, -0.19843101501464844, -0.19141387939453125, -0.18439674377441406, -0.17737960815429688, -0.1703624725341797, -0.1633453369140625, -0.1563282012939453, -0.14931106567382812, -0.14229393005371094, -0.13527679443359375, -0.12825965881347656, -0.12124252319335938, -0.11422538757324219, -0.107208251953125, -0.10019111633300781, -0.09317398071289062, -0.08615684509277344, -0.07913970947265625, -0.07212257385253906, -0.06510543823242188, -0.05808830261230469, -0.0510711669921875, -0.04405403137207031, -0.037036895751953125, -0.030019760131835938, -0.02300262451171875, -0.015985488891601562, -0.008968353271484375, -0.0019512176513671875, 0.00506591796875, 0.012083053588867188, 0.019100189208984375, 0.026117324829101562, 0.03313446044921875, 0.04015159606933594, 0.047168731689453125, 0.05418586730957031, 0.0612030029296875, 0.06822013854980469, 0.07523727416992188, 0.08225440979003906, 0.08927154541015625, 0.09628868103027344, 0.10330581665039062, 0.11032295227050781, 0.117340087890625, 0.12435722351074219, 0.13137435913085938, 0.13839149475097656, 0.14540863037109375, 0.15242576599121094, 0.15944290161132812, 0.1664600372314453, 0.1734771728515625, 0.1804943084716797, 0.18751144409179688, 0.19452857971191406, 0.20154571533203125, 0.20856285095214844, 0.21557998657226562, 0.2225971221923828, 0.2296142578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 11.0, 40.0, 150.0, 298.0, 309.0, 134.0, 41.0, 12.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.177391052246094, -9.752223014831543, -9.327054023742676, -8.901885986328125, -8.476716995239258, -8.051548957824707, -7.626380920410156, -7.201212406158447, -6.776043891906738, -6.350875377655029, -5.92570686340332, -5.5005388259887695, -5.0753703117370605, -4.650201797485352, -4.225033760070801, -3.799865245819092, -3.374696731567383, -2.949528217315674, -2.524359941482544, -2.099191665649414, -1.674023151397705, -1.248854637145996, -0.8236863613128662, -0.39851808547973633, 0.026650428771972656, 0.4518188238143921, 0.8769872188568115, 1.302155613899231, 1.7273240089416504, 2.1524925231933594, 2.5776607990264893, 3.002829074859619, 3.427997589111328, 3.853166103363037, 4.278334617614746, 4.703502655029297, 5.128671169281006, 5.553839683532715, 5.979007720947266, 6.404176235198975, 6.829344749450684, 7.254513263702393, 7.679681777954102, 8.104849815368652, 8.530017852783203, 8.95518684387207, 9.380354881286621, 9.805522918701172, 10.230691909790039, 10.65585994720459, 11.081028938293457, 11.506196975708008, 11.931365966796875, 12.356534004211426, 12.781702041625977, 13.206871032714844, 13.632039070129395, 14.057207107543945, 14.482376098632812, 14.907544136047363, 15.332712173461914, 15.757881164550781, 16.18305015563965, 16.608217239379883, 17.03338623046875]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 0.0, 6.0, 6.0, 4.0, 7.0, 10.0, 14.0, 16.0, 25.0, 17.0, 28.0, 31.0, 31.0, 37.0, 33.0, 36.0, 36.0, 47.0, 57.0, 48.0, 49.0, 54.0, 43.0, 42.0, 36.0, 27.0, 27.0, 36.0, 30.0, 34.0, 17.0, 31.0, 13.0, 18.0, 13.0, 12.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-3.4539852142333984, -3.3572051525115967, -3.260425090789795, -3.1636452674865723, -3.0668652057647705, -2.9700851440429688, -2.873305082321167, -2.7765250205993652, -2.6797451972961426, -2.582965135574341, -2.486185073852539, -2.3894052505493164, -2.2926251888275146, -2.195845127105713, -2.099065065383911, -2.0022850036621094, -1.9055050611495972, -1.8087249994277954, -1.7119450569152832, -1.6151649951934814, -1.5183850526809692, -1.4216049909591675, -1.3248250484466553, -1.2280449867248535, -1.1312649250030518, -1.03448486328125, -0.9377049207687378, -0.840924859046936, -0.7441449165344238, -0.6473648548126221, -0.5505848526954651, -0.4538048505783081, -0.3570249080657959, -0.2602449059486389, -0.16346488893032074, -0.06668487191200256, 0.03009513020515442, 0.1268751323223114, 0.22365516424179077, 0.32043516635894775, 0.41721516847610474, 0.5139951705932617, 0.6107751727104187, 0.7075551748275757, 0.8043352365493774, 0.9011151790618896, 0.9978952407836914, 1.0946753025054932, 1.1914552450180054, 1.2882353067398071, 1.3850152492523193, 1.481795310974121, 1.5785752534866333, 1.675355315208435, 1.7721352577209473, 1.868915319442749, 1.9656953811645508, 2.0624754428863525, 2.1592555046081543, 2.256035327911377, 2.3528153896331787, 2.4495954513549805, 2.5463755130767822, 2.643155574798584, 2.7399353981018066]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 3.0, 7.0, 8.0, 16.0, 11.0, 17.0, 13.0, 37.0, 27.0, 46.0, 55.0, 100.0, 141.0, 244.0, 517.0, 1334.0, 5396.0, 48937.0, 3988995.0, 134443.0, 10142.0, 2020.0, 762.0, 371.0, 204.0, 136.0, 88.0, 57.0, 44.0, 35.0, 19.0, 12.0, 7.0, 12.0, 7.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.181640625, -3.099334716796875, -3.01702880859375, -2.934722900390625, -2.8524169921875, -2.770111083984375, -2.68780517578125, -2.605499267578125, -2.523193359375, -2.440887451171875, -2.35858154296875, -2.276275634765625, -2.1939697265625, -2.111663818359375, -2.02935791015625, -1.947052001953125, -1.86474609375, -1.782440185546875, -1.70013427734375, -1.617828369140625, -1.5355224609375, -1.453216552734375, -1.37091064453125, -1.288604736328125, -1.206298828125, -1.123992919921875, -1.04168701171875, -0.959381103515625, -0.8770751953125, -0.794769287109375, -0.71246337890625, -0.630157470703125, -0.5478515625, -0.465545654296875, -0.38323974609375, -0.300933837890625, -0.2186279296875, -0.136322021484375, -0.05401611328125, 0.028289794921875, 0.110595703125, 0.192901611328125, 0.27520751953125, 0.357513427734375, 0.4398193359375, 0.522125244140625, 0.60443115234375, 0.686737060546875, 0.76904296875, 0.851348876953125, 0.93365478515625, 1.015960693359375, 1.0982666015625, 1.180572509765625, 1.26287841796875, 1.345184326171875, 1.427490234375, 1.509796142578125, 1.59210205078125, 1.674407958984375, 1.7567138671875, 1.839019775390625, 1.92132568359375, 2.003631591796875, 2.0859375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 13.0, 17.0, 25.0, 21.0, 49.0, 40.0, 64.0, 72.0, 80.0, 76.0, 84.0, 83.0, 64.0, 59.0, 56.0, 44.0, 35.0, 29.0, 30.0, 14.0, 11.0, 10.0, 3.0, 7.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2418212890625, -0.23584556579589844, -0.22986984252929688, -0.2238941192626953, -0.21791839599609375, -0.2119426727294922, -0.20596694946289062, -0.19999122619628906, -0.1940155029296875, -0.18803977966308594, -0.18206405639648438, -0.1760883331298828, -0.17011260986328125, -0.1641368865966797, -0.15816116333007812, -0.15218544006347656, -0.146209716796875, -0.14023399353027344, -0.13425827026367188, -0.1282825469970703, -0.12230682373046875, -0.11633110046386719, -0.11035537719726562, -0.10437965393066406, -0.0984039306640625, -0.09242820739746094, -0.08645248413085938, -0.08047676086425781, -0.07450103759765625, -0.06852531433105469, -0.06254959106445312, -0.05657386779785156, -0.05059814453125, -0.04462242126464844, -0.038646697998046875, -0.03267097473144531, -0.02669525146484375, -0.020719528198242188, -0.014743804931640625, -0.008768081665039062, -0.0027923583984375, 0.0031833648681640625, 0.009159088134765625, 0.015134811401367188, 0.02111053466796875, 0.027086257934570312, 0.033061981201171875, 0.03903770446777344, 0.045013427734375, 0.05098915100097656, 0.056964874267578125, 0.06294059753417969, 0.06891632080078125, 0.07489204406738281, 0.08086776733398438, 0.08684349060058594, 0.0928192138671875, 0.09879493713378906, 0.10477066040039062, 0.11074638366699219, 0.11672210693359375, 0.12269783020019531, 0.12867355346679688, 0.13464927673339844, 0.140625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 11.0, 7.0, 8.0, 16.0, 18.0, 20.0, 26.0, 39.0, 61.0, 53.0, 78.0, 190.0, 8687.0, 4182926.0, 1606.0, 135.0, 77.0, 68.0, 50.0, 42.0, 38.0, 27.0, 22.0, 12.0, 15.0, 16.0, 11.0, 6.0, 5.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -11.07080078125, -10.7822265625, -10.49365234375, -10.205078125, -9.91650390625, -9.6279296875, -9.33935546875, -9.05078125, -8.76220703125, -8.4736328125, -8.18505859375, -7.896484375, -7.60791015625, -7.3193359375, -7.03076171875, -6.7421875, -6.45361328125, -6.1650390625, -5.87646484375, -5.587890625, -5.29931640625, -5.0107421875, -4.72216796875, -4.43359375, -4.14501953125, -3.8564453125, -3.56787109375, -3.279296875, -2.99072265625, -2.7021484375, -2.41357421875, -2.125, -1.83642578125, -1.5478515625, -1.25927734375, -0.970703125, -0.68212890625, -0.3935546875, -0.10498046875, 0.18359375, 0.47216796875, 0.7607421875, 1.04931640625, 1.337890625, 1.62646484375, 1.9150390625, 2.20361328125, 2.4921875, 2.78076171875, 3.0693359375, 3.35791015625, 3.646484375, 3.93505859375, 4.2236328125, 4.51220703125, 4.80078125, 5.08935546875, 5.3779296875, 5.66650390625, 5.955078125, 6.24365234375, 6.5322265625, 6.82080078125, 7.109375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 6.0, 55.0, 413.0, 3344.0, 219.0, 39.0, 13.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.312744140625, -0.2545433044433594, -0.19634246826171875, -0.13814163208007812, -0.0799407958984375, -0.021739959716796875, 0.03646087646484375, 0.09466171264648438, 0.152862548828125, 0.21106338500976562, 0.26926422119140625, 0.3274650573730469, 0.3856658935546875, 0.4438667297363281, 0.5020675659179688, 0.5602684020996094, 0.61846923828125, 0.6766700744628906, 0.7348709106445312, 0.7930717468261719, 0.8512725830078125, 0.9094734191894531, 0.9676742553710938, 1.0258750915527344, 1.084075927734375, 1.1422767639160156, 1.2004776000976562, 1.2586784362792969, 1.3168792724609375, 1.3750801086425781, 1.4332809448242188, 1.4914817810058594, 1.5496826171875, 1.6078834533691406, 1.6660842895507812, 1.7242851257324219, 1.7824859619140625, 1.8406867980957031, 1.8988876342773438, 1.9570884704589844, 2.015289306640625, 2.0734901428222656, 2.1316909790039062, 2.189891815185547, 2.2480926513671875, 2.306293487548828, 2.3644943237304688, 2.4226951599121094, 2.48089599609375, 2.5390968322753906, 2.5972976684570312, 2.655498504638672, 2.7136993408203125, 2.771900177001953, 2.8301010131835938, 2.8883018493652344, 2.946502685546875, 3.0047035217285156, 3.0629043579101562, 3.121105194091797, 3.1793060302734375, 3.237506866455078, 3.2957077026367188, 3.3539085388183594, 3.412109375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 15.0, 418.0, 564.0, 14.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.514610290527344, -22.494400024414062, -21.47418785095215, -20.453975677490234, -19.433765411376953, -18.413555145263672, -17.393342971801758, -16.373130798339844, -15.352920532226562, -14.332709312438965, -13.312498092651367, -12.29228687286377, -11.272075653076172, -10.251864433288574, -9.231653213500977, -8.211441993713379, -7.191230773925781, -6.171019554138184, -5.150808334350586, -4.130597114562988, -3.1103858947753906, -2.090174674987793, -1.0699634552001953, -0.049752235412597656, 0.970458984375, 1.9906702041625977, 3.0108814239501953, 4.031092643737793, 5.051303863525391, 6.071515083312988, 7.091726303100586, 8.111937522888184, 9.132148742675781, 10.152359962463379, 11.172571182250977, 12.192782402038574, 13.212993621826172, 14.23320484161377, 15.253416061401367, 16.27362823486328, 17.293838500976562, 18.314048767089844, 19.334260940551758, 20.354473114013672, 21.374683380126953, 22.394893646240234, 23.41510581970215, 24.435317993164062, 25.455528259277344, 26.475738525390625, 27.49595069885254, 28.516162872314453, 29.536373138427734, 30.556583404541016, 31.57679557800293, 32.597007751464844, 33.617218017578125, 34.637428283691406, 35.65763854980469, 36.677852630615234, 37.698062896728516, 38.7182731628418, 39.738487243652344, 40.758697509765625, 41.778907775878906]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 28.0, 102.0, 163.0, 247.0, 222.0, 147.0, 56.0, 23.0, 8.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.795660972595215, -7.550102233886719, -7.304543972015381, -7.058985233306885, -6.813426494598389, -6.567868232727051, -6.322309494018555, -6.076750755310059, -5.8311920166015625, -5.585633277893066, -5.3400750160217285, -5.094516277313232, -4.848957538604736, -4.603399276733398, -4.357840538024902, -4.112281799316406, -3.8667232990264893, -3.6211647987365723, -3.375606060028076, -3.130047559738159, -2.884488821029663, -2.638930320739746, -2.39337158203125, -2.147813081741333, -1.9022544622421265, -1.65669584274292, -1.4111372232437134, -1.1655786037445068, -0.9200200438499451, -0.6744614839553833, -0.42890286445617676, -0.18334424495697021, 0.06221437454223633, 0.30777299404144287, 0.5533316135406494, 0.7988901734352112, 1.0444488525390625, 1.2900073528289795, 1.535565972328186, 1.7811245918273926, 2.0266833305358887, 2.2722418308258057, 2.5178005695343018, 2.7633590698242188, 3.008917808532715, 3.254476308822632, 3.500034809112549, 3.745593547821045, 3.991152048110962, 4.236710548400879, 4.482269287109375, 4.727828025817871, 4.973386287689209, 5.218945026397705, 5.464503765106201, 5.710062026977539, 5.955620765686035, 6.201179504394531, 6.446737766265869, 6.692296504974365, 6.937855243682861, 7.183413505554199, 7.428972244262695, 7.674530982971191, 7.9200897216796875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 3.0, 10.0, 5.0, 11.0, 11.0, 17.0, 22.0, 25.0, 30.0, 58.0, 52.0, 88.0, 114.0, 146.0, 193.0, 320.0, 437.0, 748.0, 1647.0, 4071.0, 14459.0, 71888.0, 383818.0, 452045.0, 91667.0, 17609.0, 4785.0, 1754.0, 868.0, 501.0, 295.0, 220.0, 161.0, 106.0, 86.0, 62.0, 55.0, 31.0, 32.0, 24.0, 18.0, 22.0, 11.0, 12.0, 5.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.369140625, -1.326446533203125, -1.28375244140625, -1.241058349609375, -1.1983642578125, -1.155670166015625, -1.11297607421875, -1.070281982421875, -1.027587890625, -0.984893798828125, -0.94219970703125, -0.899505615234375, -0.8568115234375, -0.814117431640625, -0.77142333984375, -0.728729248046875, -0.68603515625, -0.643341064453125, -0.60064697265625, -0.557952880859375, -0.5152587890625, -0.472564697265625, -0.42987060546875, -0.387176513671875, -0.344482421875, -0.301788330078125, -0.25909423828125, -0.216400146484375, -0.1737060546875, -0.131011962890625, -0.08831787109375, -0.045623779296875, -0.0029296875, 0.039764404296875, 0.08245849609375, 0.125152587890625, 0.1678466796875, 0.210540771484375, 0.25323486328125, 0.295928955078125, 0.338623046875, 0.381317138671875, 0.42401123046875, 0.466705322265625, 0.5093994140625, 0.552093505859375, 0.59478759765625, 0.637481689453125, 0.68017578125, 0.722869873046875, 0.76556396484375, 0.808258056640625, 0.8509521484375, 0.893646240234375, 0.93634033203125, 0.979034423828125, 1.021728515625, 1.064422607421875, 1.10711669921875, 1.149810791015625, 1.1925048828125, 1.235198974609375, 1.27789306640625, 1.320587158203125, 1.36328125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 9.0, 26.0, 33.0, 56.0, 74.0, 112.0, 127.0, 132.0, 99.0, 106.0, 70.0, 59.0, 31.0, 31.0, 13.0, 14.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23095703125, -0.22116851806640625, -0.2113800048828125, -0.20159149169921875, -0.191802978515625, -0.18201446533203125, -0.1722259521484375, -0.16243743896484375, -0.15264892578125, -0.14286041259765625, -0.1330718994140625, -0.12328338623046875, -0.113494873046875, -0.10370635986328125, -0.0939178466796875, -0.08412933349609375, -0.0743408203125, -0.06455230712890625, -0.0547637939453125, -0.04497528076171875, -0.035186767578125, -0.02539825439453125, -0.0156097412109375, -0.00582122802734375, 0.00396728515625, 0.01375579833984375, 0.0235443115234375, 0.03333282470703125, 0.043121337890625, 0.05290985107421875, 0.0626983642578125, 0.07248687744140625, 0.082275390625, 0.09206390380859375, 0.1018524169921875, 0.11164093017578125, 0.121429443359375, 0.13121795654296875, 0.1410064697265625, 0.15079498291015625, 0.16058349609375, 0.17037200927734375, 0.1801605224609375, 0.18994903564453125, 0.199737548828125, 0.20952606201171875, 0.2193145751953125, 0.22910308837890625, 0.2388916015625, 0.24868011474609375, 0.2584686279296875, 0.26825714111328125, 0.278045654296875, 0.28783416748046875, 0.2976226806640625, 0.30741119384765625, 0.31719970703125, 0.32698822021484375, 0.3367767333984375, 0.34656524658203125, 0.356353759765625, 0.36614227294921875, 0.3759307861328125, 0.38571929931640625, 0.3955078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 5.0, 5.0, 4.0, 8.0, 12.0, 16.0, 22.0, 38.0, 34.0, 63.0, 87.0, 121.0, 203.0, 331.0, 561.0, 1111.0, 2135.0, 4593.0, 10903.0, 27920.0, 76585.0, 200099.0, 350379.0, 227734.0, 89768.0, 32946.0, 12473.0, 5090.0, 2394.0, 1147.0, 640.0, 396.0, 253.0, 159.0, 94.0, 65.0, 58.0, 27.0, 21.0, 23.0, 7.0, 11.0, 4.0, 6.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.548828125, -0.5302734375, -0.51171875, -0.4931640625, -0.474609375, -0.4560546875, -0.4375, -0.4189453125, -0.400390625, -0.3818359375, -0.36328125, -0.3447265625, -0.326171875, -0.3076171875, -0.2890625, -0.2705078125, -0.251953125, -0.2333984375, -0.21484375, -0.1962890625, -0.177734375, -0.1591796875, -0.140625, -0.1220703125, -0.103515625, -0.0849609375, -0.06640625, -0.0478515625, -0.029296875, -0.0107421875, 0.0078125, 0.0263671875, 0.044921875, 0.0634765625, 0.08203125, 0.1005859375, 0.119140625, 0.1376953125, 0.15625, 0.1748046875, 0.193359375, 0.2119140625, 0.23046875, 0.2490234375, 0.267578125, 0.2861328125, 0.3046875, 0.3232421875, 0.341796875, 0.3603515625, 0.37890625, 0.3974609375, 0.416015625, 0.4345703125, 0.453125, 0.4716796875, 0.490234375, 0.5087890625, 0.52734375, 0.5458984375, 0.564453125, 0.5830078125, 0.6015625, 0.6201171875, 0.638671875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 5.0, 14.0, 10.0, 16.0, 9.0, 17.0, 19.0, 31.0, 20.0, 30.0, 33.0, 48.0, 45.0, 52.0, 41.0, 49.0, 47.0, 51.0, 60.0, 36.0, 46.0, 47.0, 41.0, 28.0, 32.0, 30.0, 32.0, 22.0, 13.0, 12.0, 15.0, 13.0, 6.0, 10.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.5058746337890625, -0.486358642578125, -0.4668426513671875, -0.44732666015625, -0.4278106689453125, -0.408294677734375, -0.3887786865234375, -0.3692626953125, -0.3497467041015625, -0.330230712890625, -0.3107147216796875, -0.29119873046875, -0.2716827392578125, -0.252166748046875, -0.2326507568359375, -0.213134765625, -0.1936187744140625, -0.174102783203125, -0.1545867919921875, -0.13507080078125, -0.1155548095703125, -0.096038818359375, -0.0765228271484375, -0.0570068359375, -0.0374908447265625, -0.017974853515625, 0.0015411376953125, 0.02105712890625, 0.0405731201171875, 0.060089111328125, 0.0796051025390625, 0.09912109375, 0.1186370849609375, 0.138153076171875, 0.1576690673828125, 0.17718505859375, 0.1967010498046875, 0.216217041015625, 0.2357330322265625, 0.2552490234375, 0.2747650146484375, 0.294281005859375, 0.3137969970703125, 0.33331298828125, 0.3528289794921875, 0.372344970703125, 0.3918609619140625, 0.411376953125, 0.4308929443359375, 0.450408935546875, 0.4699249267578125, 0.48944091796875, 0.5089569091796875, 0.528472900390625, 0.5479888916015625, 0.5675048828125, 0.5870208740234375, 0.606536865234375, 0.6260528564453125, 0.64556884765625, 0.6650848388671875, 0.684600830078125, 0.7041168212890625, 0.7236328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 7.0, 7.0, 6.0, 13.0, 31.0, 38.0, 62.0, 93.0, 137.0, 288.0, 431.0, 865.0, 1833.0, 4804.0, 22762.0, 284584.0, 654974.0, 63633.0, 8678.0, 2678.0, 1164.0, 598.0, 320.0, 205.0, 116.0, 78.0, 51.0, 27.0, 20.0, 14.0, 9.0, 10.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67236328125, -0.6527175903320312, -0.6330718994140625, -0.6134262084960938, -0.593780517578125, -0.5741348266601562, -0.5544891357421875, -0.5348434448242188, -0.51519775390625, -0.49555206298828125, -0.4759063720703125, -0.45626068115234375, -0.436614990234375, -0.41696929931640625, -0.3973236083984375, -0.37767791748046875, -0.3580322265625, -0.33838653564453125, -0.3187408447265625, -0.29909515380859375, -0.279449462890625, -0.25980377197265625, -0.2401580810546875, -0.22051239013671875, -0.20086669921875, -0.18122100830078125, -0.1615753173828125, -0.14192962646484375, -0.122283935546875, -0.10263824462890625, -0.0829925537109375, -0.06334686279296875, -0.043701171875, -0.02405548095703125, -0.0044097900390625, 0.01523590087890625, 0.034881591796875, 0.05452728271484375, 0.0741729736328125, 0.09381866455078125, 0.11346435546875, 0.13311004638671875, 0.1527557373046875, 0.17240142822265625, 0.192047119140625, 0.21169281005859375, 0.2313385009765625, 0.25098419189453125, 0.2706298828125, 0.29027557373046875, 0.3099212646484375, 0.32956695556640625, 0.349212646484375, 0.36885833740234375, 0.3885040283203125, 0.40814971923828125, 0.42779541015625, 0.44744110107421875, 0.4670867919921875, 0.48673248291015625, 0.506378173828125, 0.5260238647460938, 0.5456695556640625, 0.5653152465820312, 0.5849609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 7.0, 4.0, 7.0, 9.0, 12.0, 33.0, 54.0, 91.0, 126.0, 166.0, 166.0, 134.0, 74.0, 48.0, 26.0, 22.0, 9.0, 8.0, 3.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011342763900756836, -0.00010887999087572098, -0.0001043323427438736, -9.978469461202621e-05, -9.523704648017883e-05, -9.068939834833145e-05, -8.614175021648407e-05, -8.159410208463669e-05, -7.70464539527893e-05, -7.249880582094193e-05, -6.795115768909454e-05, -6.340350955724716e-05, -5.885586142539978e-05, -5.43082132935524e-05, -4.976056516170502e-05, -4.5212917029857635e-05, -4.0665268898010254e-05, -3.611762076616287e-05, -3.156997263431549e-05, -2.702232450246811e-05, -2.2474676370620728e-05, -1.7927028238773346e-05, -1.3379380106925964e-05, -8.831731975078583e-06, -4.284083843231201e-06, 2.635642886161804e-07, 4.811212420463562e-06, 9.358860552310944e-06, 1.3906508684158325e-05, 1.8454156816005707e-05, 2.300180494785309e-05, 2.754945307970047e-05, 3.209710121154785e-05, 3.664474934339523e-05, 4.1192397475242615e-05, 4.5740045607089996e-05, 5.028769373893738e-05, 5.483534187078476e-05, 5.938299000263214e-05, 6.393063813447952e-05, 6.84782862663269e-05, 7.302593439817429e-05, 7.757358253002167e-05, 8.212123066186905e-05, 8.666887879371643e-05, 9.121652692556381e-05, 9.57641750574112e-05, 0.00010031182318925858, 0.00010485947132110596, 0.00010940711945295334, 0.00011395476758480072, 0.0001185024157166481, 0.00012305006384849548, 0.00012759771198034286, 0.00013214536011219025, 0.00013669300824403763, 0.000141240656375885, 0.0001457883045077324, 0.00015033595263957977, 0.00015488360077142715, 0.00015943124890327454, 0.00016397889703512192, 0.0001685265451669693, 0.00017307419329881668, 0.00017762184143066406]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 8.0, 2.0, 12.0, 15.0, 18.0, 36.0, 50.0, 72.0, 127.0, 212.0, 367.0, 764.0, 1809.0, 4990.0, 19790.0, 138384.0, 632434.0, 211140.0, 27991.0, 6220.0, 2187.0, 881.0, 464.0, 207.0, 122.0, 84.0, 55.0, 35.0, 23.0, 10.0, 15.0, 12.0, 3.0, 5.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.48779296875, -0.47369384765625, -0.4595947265625, -0.44549560546875, -0.431396484375, -0.41729736328125, -0.4031982421875, -0.38909912109375, -0.375, -0.36090087890625, -0.3468017578125, -0.33270263671875, -0.318603515625, -0.30450439453125, -0.2904052734375, -0.27630615234375, -0.26220703125, -0.24810791015625, -0.2340087890625, -0.21990966796875, -0.205810546875, -0.19171142578125, -0.1776123046875, -0.16351318359375, -0.1494140625, -0.13531494140625, -0.1212158203125, -0.10711669921875, -0.093017578125, -0.07891845703125, -0.0648193359375, -0.05072021484375, -0.03662109375, -0.02252197265625, -0.0084228515625, 0.00567626953125, 0.019775390625, 0.03387451171875, 0.0479736328125, 0.06207275390625, 0.076171875, 0.09027099609375, 0.1043701171875, 0.11846923828125, 0.132568359375, 0.14666748046875, 0.1607666015625, 0.17486572265625, 0.18896484375, 0.20306396484375, 0.2171630859375, 0.23126220703125, 0.245361328125, 0.25946044921875, 0.2735595703125, 0.28765869140625, 0.3017578125, 0.31585693359375, 0.3299560546875, 0.34405517578125, 0.358154296875, 0.37225341796875, 0.3863525390625, 0.40045166015625, 0.41455078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 7.0, 13.0, 3.0, 11.0, 20.0, 35.0, 50.0, 59.0, 72.0, 76.0, 102.0, 91.0, 109.0, 82.0, 63.0, 50.0, 43.0, 41.0, 23.0, 14.0, 6.0, 8.0, 6.0, 4.0, 2.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3896484375, -0.3786659240722656, -0.36768341064453125, -0.3567008972167969, -0.3457183837890625, -0.3347358703613281, -0.32375335693359375, -0.3127708435058594, -0.301788330078125, -0.2908058166503906, -0.27982330322265625, -0.2688407897949219, -0.2578582763671875, -0.24687576293945312, -0.23589324951171875, -0.22491073608398438, -0.21392822265625, -0.20294570922851562, -0.19196319580078125, -0.18098068237304688, -0.1699981689453125, -0.15901565551757812, -0.14803314208984375, -0.13705062866210938, -0.126068115234375, -0.11508560180664062, -0.10410308837890625, -0.09312057495117188, -0.0821380615234375, -0.07115554809570312, -0.06017303466796875, -0.049190521240234375, -0.0382080078125, -0.027225494384765625, -0.01624298095703125, -0.005260467529296875, 0.0057220458984375, 0.016704559326171875, 0.02768707275390625, 0.038669586181640625, 0.049652099609375, 0.060634613037109375, 0.07161712646484375, 0.08259963989257812, 0.0935821533203125, 0.10456466674804688, 0.11554718017578125, 0.12652969360351562, 0.13751220703125, 0.14849472045898438, 0.15947723388671875, 0.17045974731445312, 0.1814422607421875, 0.19242477416992188, 0.20340728759765625, 0.21438980102539062, 0.225372314453125, 0.23635482788085938, 0.24733734130859375, 0.2583198547363281, 0.2693023681640625, 0.2802848815917969, 0.29126739501953125, 0.3022499084472656, 0.313232421875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 24.0, 29.0, 65.0, 132.0, 205.0, 231.0, 137.0, 80.0, 46.0, 25.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.12966537475586, -8.84589672088623, -8.562128067016602, -8.278360366821289, -7.99459171295166, -7.710823059082031, -7.4270548820495605, -7.14328670501709, -6.859518051147461, -6.575749397277832, -6.291981220245361, -6.008213043212891, -5.724444389343262, -5.440675735473633, -5.156907558441162, -4.873139381408691, -4.5893707275390625, -4.305602073669434, -4.021833896636963, -3.738065481185913, -3.4542970657348633, -3.1705286502838135, -2.8867602348327637, -2.602991819381714, -2.319223403930664, -2.0354549884796143, -1.7516865730285645, -1.4679181575775146, -1.1841497421264648, -0.900381326675415, -0.6166129112243652, -0.33284449577331543, -0.049076080322265625, 0.23469233512878418, 0.518460750579834, 0.8022291660308838, 1.0859975814819336, 1.3697659969329834, 1.6535344123840332, 1.937302827835083, 2.221071243286133, 2.5048396587371826, 2.7886080741882324, 3.0723764896392822, 3.356144905090332, 3.639913320541382, 3.9236817359924316, 4.207449913024902, 4.491218566894531, 4.77498722076416, 5.058755397796631, 5.342523574829102, 5.6262922286987305, 5.910060882568359, 6.19382905960083, 6.477597236633301, 6.76136589050293, 7.045134544372559, 7.328902721405029, 7.6126708984375, 7.896439552307129, 8.180208206176758, 8.46397590637207, 8.7477445602417, 9.031513214111328]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 9.0, 4.0, 5.0, 12.0, 8.0, 7.0, 8.0, 17.0, 14.0, 8.0, 27.0, 20.0, 23.0, 27.0, 21.0, 33.0, 29.0, 29.0, 43.0, 40.0, 45.0, 34.0, 43.0, 30.0, 61.0, 31.0, 40.0, 34.0, 39.0, 29.0, 21.0, 32.0, 24.0, 24.0, 22.0, 13.0, 14.0, 19.0, 18.0, 15.0, 7.0, 4.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.2159557342529297, -3.117790460586548, -3.019625186920166, -2.9214601516723633, -2.8232948780059814, -2.7251296043395996, -2.6269643306732178, -2.528799057006836, -2.430633783340454, -2.3324685096740723, -2.2343032360076904, -2.1361379623413086, -2.037972927093506, -1.939807653427124, -1.8416423797607422, -1.7434771060943604, -1.645311951637268, -1.5471466779708862, -1.448981523513794, -1.350816249847412, -1.2526509761810303, -1.1544857025146484, -1.0563205480575562, -0.9581552743911743, -0.8599900603294373, -0.7618248462677002, -0.6636595726013184, -0.5654943585395813, -0.46732911467552185, -0.3691638708114624, -0.27099865674972534, -0.1728333830833435, -0.07466816902160645, 0.023497067391872406, 0.12166230380535126, 0.2198275327682495, 0.31799277663230896, 0.4161580204963684, 0.5143232345581055, 0.6124885082244873, 0.7106537222862244, 0.8088189363479614, 0.9069842100143433, 1.0051493644714355, 1.1033146381378174, 1.2014799118041992, 1.299645185470581, 1.397810459136963, 1.4959756135940552, 1.594140887260437, 1.6923060417175293, 1.7904713153839111, 1.888636589050293, 1.9868018627166748, 2.0849671363830566, 2.1831321716308594, 2.281297445297241, 2.379462718963623, 2.477627992630005, 2.5757932662963867, 2.6739583015441895, 2.7721235752105713, 2.870288848876953, 2.968454122543335, 3.066619396209717]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 8.0, 17.0, 18.0, 19.0, 34.0, 58.0, 79.0, 126.0, 204.0, 313.0, 623.0, 1272.0, 3190.0, 12583.0, 84874.0, 3743744.0, 310437.0, 26970.0, 5492.0, 1867.0, 879.0, 464.0, 293.0, 197.0, 126.0, 104.0, 62.0, 49.0, 31.0, 31.0, 29.0, 23.0, 13.0, 12.0, 8.0, 6.0, 6.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3232421875, -1.2697296142578125, -1.216217041015625, -1.1627044677734375, -1.10919189453125, -1.0556793212890625, -1.002166748046875, -0.9486541748046875, -0.8951416015625, -0.8416290283203125, -0.788116455078125, -0.7346038818359375, -0.68109130859375, -0.6275787353515625, -0.574066162109375, -0.5205535888671875, -0.467041015625, -0.4135284423828125, -0.360015869140625, -0.3065032958984375, -0.25299072265625, -0.1994781494140625, -0.145965576171875, -0.0924530029296875, -0.0389404296875, 0.0145721435546875, 0.068084716796875, 0.1215972900390625, 0.17510986328125, 0.2286224365234375, 0.282135009765625, 0.3356475830078125, 0.38916015625, 0.4426727294921875, 0.496185302734375, 0.5496978759765625, 0.60321044921875, 0.6567230224609375, 0.710235595703125, 0.7637481689453125, 0.8172607421875, 0.8707733154296875, 0.924285888671875, 0.9777984619140625, 1.03131103515625, 1.0848236083984375, 1.138336181640625, 1.1918487548828125, 1.245361328125, 1.2988739013671875, 1.352386474609375, 1.4058990478515625, 1.45941162109375, 1.5129241943359375, 1.566436767578125, 1.6199493408203125, 1.6734619140625, 1.7269744873046875, 1.780487060546875, 1.8339996337890625, 1.88751220703125, 1.9410247802734375, 1.994537353515625, 2.0480499267578125, 2.1015625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 3.0, 6.0, 13.0, 12.0, 19.0, 26.0, 46.0, 78.0, 75.0, 85.0, 90.0, 96.0, 113.0, 82.0, 66.0, 46.0, 40.0, 49.0, 15.0, 15.0, 12.0, 8.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2257080078125, -0.21648597717285156, -0.20726394653320312, -0.1980419158935547, -0.18881988525390625, -0.1795978546142578, -0.17037582397460938, -0.16115379333496094, -0.1519317626953125, -0.14270973205566406, -0.13348770141601562, -0.12426567077636719, -0.11504364013671875, -0.10582160949707031, -0.09659957885742188, -0.08737754821777344, -0.078155517578125, -0.06893348693847656, -0.059711456298828125, -0.05048942565917969, -0.04126739501953125, -0.03204536437988281, -0.022823333740234375, -0.013601303100585938, -0.0043792724609375, 0.0048427581787109375, 0.014064788818359375, 0.023286819458007812, 0.03250885009765625, 0.04173088073730469, 0.050952911376953125, 0.06017494201660156, 0.06939697265625, 0.07861900329589844, 0.08784103393554688, 0.09706306457519531, 0.10628509521484375, 0.11550712585449219, 0.12472915649414062, 0.13395118713378906, 0.1431732177734375, 0.15239524841308594, 0.16161727905273438, 0.1708393096923828, 0.18006134033203125, 0.1892833709716797, 0.19850540161132812, 0.20772743225097656, 0.216949462890625, 0.22617149353027344, 0.23539352416992188, 0.2446155548095703, 0.25383758544921875, 0.2630596160888672, 0.2722816467285156, 0.28150367736816406, 0.2907257080078125, 0.29994773864746094, 0.3091697692871094, 0.3183917999267578, 0.32761383056640625, 0.3368358612060547, 0.3460578918457031, 0.35527992248535156, 0.364501953125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 9.0, 8.0, 15.0, 29.0, 31.0, 40.0, 50.0, 103.0, 185.0, 330.0, 898.0, 2385.0, 9872.0, 67014.0, 3482397.0, 588440.0, 33130.0, 6091.0, 1757.0, 714.0, 331.0, 153.0, 87.0, 57.0, 45.0, 19.0, 20.0, 17.0, 12.0, 14.0, 6.0, 8.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.9033203125, -1.8530120849609375, -1.802703857421875, -1.7523956298828125, -1.70208740234375, -1.6517791748046875, -1.601470947265625, -1.5511627197265625, -1.5008544921875, -1.4505462646484375, -1.400238037109375, -1.3499298095703125, -1.29962158203125, -1.2493133544921875, -1.199005126953125, -1.1486968994140625, -1.098388671875, -1.0480804443359375, -0.997772216796875, -0.9474639892578125, -0.89715576171875, -0.8468475341796875, -0.796539306640625, -0.7462310791015625, -0.6959228515625, -0.6456146240234375, -0.595306396484375, -0.5449981689453125, -0.49468994140625, -0.4443817138671875, -0.394073486328125, -0.3437652587890625, -0.29345703125, -0.2431488037109375, -0.192840576171875, -0.1425323486328125, -0.09222412109375, -0.0419158935546875, 0.008392333984375, 0.0587005615234375, 0.1090087890625, 0.1593170166015625, 0.209625244140625, 0.2599334716796875, 0.31024169921875, 0.3605499267578125, 0.410858154296875, 0.4611663818359375, 0.511474609375, 0.5617828369140625, 0.612091064453125, 0.6623992919921875, 0.71270751953125, 0.7630157470703125, 0.813323974609375, 0.8636322021484375, 0.9139404296875, 0.9642486572265625, 1.014556884765625, 1.0648651123046875, 1.11517333984375, 1.1654815673828125, 1.215789794921875, 1.2660980224609375, 1.31640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 1.0, 1.0, 4.0, 0.0, 3.0, 10.0, 8.0, 11.0, 27.0, 39.0, 62.0, 121.0, 187.0, 440.0, 1454.0, 894.0, 331.0, 183.0, 87.0, 62.0, 46.0, 26.0, 21.0, 10.0, 14.0, 7.0, 9.0, 0.0, 6.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302734375, -0.28823089599609375, -0.2737274169921875, -0.25922393798828125, -0.244720458984375, -0.23021697998046875, -0.2157135009765625, -0.20121002197265625, -0.18670654296875, -0.17220306396484375, -0.1576995849609375, -0.14319610595703125, -0.128692626953125, -0.11418914794921875, -0.0996856689453125, -0.08518218994140625, -0.0706787109375, -0.05617523193359375, -0.0416717529296875, -0.02716827392578125, -0.012664794921875, 0.00183868408203125, 0.0163421630859375, 0.03084564208984375, 0.04534912109375, 0.05985260009765625, 0.0743560791015625, 0.08885955810546875, 0.103363037109375, 0.11786651611328125, 0.1323699951171875, 0.14687347412109375, 0.161376953125, 0.17588043212890625, 0.1903839111328125, 0.20488739013671875, 0.219390869140625, 0.23389434814453125, 0.2483978271484375, 0.26290130615234375, 0.27740478515625, 0.29190826416015625, 0.3064117431640625, 0.32091522216796875, 0.335418701171875, 0.34992218017578125, 0.3644256591796875, 0.37892913818359375, 0.3934326171875, 0.40793609619140625, 0.4224395751953125, 0.43694305419921875, 0.451446533203125, 0.46595001220703125, 0.4804534912109375, 0.49495697021484375, 0.50946044921875, 0.5239639282226562, 0.5384674072265625, 0.5529708862304688, 0.567474365234375, 0.5819778442382812, 0.5964813232421875, 0.6109848022460938, 0.62548828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 4.0, 7.0, 6.0, 16.0, 20.0, 67.0, 114.0, 164.0, 188.0, 156.0, 96.0, 68.0, 44.0, 12.0, 10.0, 9.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.503411293029785, -3.3913064002990723, -3.2792015075683594, -3.1670966148376465, -3.0549917221069336, -2.9428868293762207, -2.830781936645508, -2.718677043914795, -2.606572151184082, -2.494467258453369, -2.3823623657226562, -2.2702574729919434, -2.1581525802612305, -2.0460476875305176, -1.9339427947998047, -1.8218379020690918, -1.709733009338379, -1.597628116607666, -1.4855232238769531, -1.3734183311462402, -1.2613134384155273, -1.1492085456848145, -1.0371036529541016, -0.9249987602233887, -0.8128938674926758, -0.7007889747619629, -0.58868408203125, -0.4765791893005371, -0.3644742965698242, -0.25236940383911133, -0.14026451110839844, -0.028159618377685547, 0.08394527435302734, 0.19605016708374023, 0.3081550598144531, 0.420259952545166, 0.5323648452758789, 0.6444697380065918, 0.7565746307373047, 0.8686795234680176, 0.9807844161987305, 1.0928893089294434, 1.2049942016601562, 1.3170990943908691, 1.429203987121582, 1.541308879852295, 1.6534137725830078, 1.7655186653137207, 1.8776235580444336, 1.9897284507751465, 2.1018333435058594, 2.2139382362365723, 2.326043128967285, 2.438148021697998, 2.550252914428711, 2.662357807159424, 2.7744626998901367, 2.8865675926208496, 2.9986724853515625, 3.1107773780822754, 3.2228822708129883, 3.334987163543701, 3.447092056274414, 3.559196949005127, 3.67130184173584]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 6.0, 10.0, 11.0, 10.0, 29.0, 25.0, 31.0, 50.0, 32.0, 34.0, 33.0, 49.0, 50.0, 56.0, 44.0, 47.0, 47.0, 50.0, 40.0, 43.0, 44.0, 46.0, 33.0, 33.0, 26.0, 13.0, 20.0, 20.0, 17.0, 6.0, 6.0, 6.0, 11.0, 4.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4813545942306519, -1.4335582256317139, -1.3857619762420654, -1.3379656076431274, -1.2901692390441895, -1.242372989654541, -1.194576621055603, -1.146780252456665, -1.0989840030670166, -1.0511876344680786, -1.0033913850784302, -0.9555950164794922, -0.907798707485199, -0.8600023984909058, -0.8122060298919678, -0.7644097208976746, -0.7166134119033813, -0.6688171029090881, -0.6210207939147949, -0.5732244253158569, -0.5254281163215637, -0.4776318073272705, -0.4298354685306549, -0.3820391297340393, -0.3342428207397461, -0.2864465117454529, -0.23865017294883728, -0.19085384905338287, -0.14305752515792847, -0.09526120126247406, -0.04746487736701965, 0.00033146142959594727, 0.04812788963317871, 0.09592421352863312, 0.14372053742408752, 0.19151686131954193, 0.23931318521499634, 0.28710949420928955, 0.33490583300590515, 0.38270217180252075, 0.43049848079681396, 0.4782947897911072, 0.5260910987854004, 0.5738874673843384, 0.6216837763786316, 0.6694800853729248, 0.7172764539718628, 0.765072762966156, 0.8128690719604492, 0.8606653809547424, 0.9084616899490356, 0.9562580585479736, 1.004054307937622, 1.05185067653656, 1.099647045135498, 1.1474432945251465, 1.1952396631240845, 1.2430360317230225, 1.290832281112671, 1.3386286497116089, 1.3864250183105469, 1.4342212677001953, 1.4820176362991333, 1.5298140048980713, 1.5776102542877197]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 10.0, 8.0, 13.0, 15.0, 24.0, 35.0, 84.0, 182.0, 337.0, 851.0, 2831.0, 19343.0, 380639.0, 608520.0, 29966.0, 3862.0, 1009.0, 399.0, 184.0, 98.0, 56.0, 35.0, 17.0, 9.0, 12.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.828125, -2.749755859375, -2.67138671875, -2.593017578125, -2.5146484375, -2.436279296875, -2.35791015625, -2.279541015625, -2.201171875, -2.122802734375, -2.04443359375, -1.966064453125, -1.8876953125, -1.809326171875, -1.73095703125, -1.652587890625, -1.57421875, -1.495849609375, -1.41748046875, -1.339111328125, -1.2607421875, -1.182373046875, -1.10400390625, -1.025634765625, -0.947265625, -0.868896484375, -0.79052734375, -0.712158203125, -0.6337890625, -0.555419921875, -0.47705078125, -0.398681640625, -0.3203125, -0.241943359375, -0.16357421875, -0.085205078125, -0.0068359375, 0.071533203125, 0.14990234375, 0.228271484375, 0.306640625, 0.385009765625, 0.46337890625, 0.541748046875, 0.6201171875, 0.698486328125, 0.77685546875, 0.855224609375, 0.93359375, 1.011962890625, 1.09033203125, 1.168701171875, 1.2470703125, 1.325439453125, 1.40380859375, 1.482177734375, 1.560546875, 1.638916015625, 1.71728515625, 1.795654296875, 1.8740234375, 1.952392578125, 2.03076171875, 2.109130859375, 2.1875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 11.0, 13.0, 29.0, 32.0, 55.0, 63.0, 94.0, 104.0, 96.0, 128.0, 84.0, 76.0, 71.0, 44.0, 37.0, 23.0, 13.0, 6.0, 4.0, 5.0, 9.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22119140625, -0.21104049682617188, -0.20088958740234375, -0.19073867797851562, -0.1805877685546875, -0.17043685913085938, -0.16028594970703125, -0.15013504028320312, -0.139984130859375, -0.12983322143554688, -0.11968231201171875, -0.10953140258789062, -0.0993804931640625, -0.08922958374023438, -0.07907867431640625, -0.06892776489257812, -0.05877685546875, -0.048625946044921875, -0.03847503662109375, -0.028324127197265625, -0.0181732177734375, -0.008022308349609375, 0.00212860107421875, 0.012279510498046875, 0.022430419921875, 0.032581329345703125, 0.04273223876953125, 0.052883148193359375, 0.0630340576171875, 0.07318496704101562, 0.08333587646484375, 0.09348678588867188, 0.1036376953125, 0.11378860473632812, 0.12393951416015625, 0.13409042358398438, 0.1442413330078125, 0.15439224243164062, 0.16454315185546875, 0.17469406127929688, 0.184844970703125, 0.19499588012695312, 0.20514678955078125, 0.21529769897460938, 0.2254486083984375, 0.23559951782226562, 0.24575042724609375, 0.2559013366699219, 0.26605224609375, 0.2762031555175781, 0.28635406494140625, 0.2965049743652344, 0.3066558837890625, 0.3168067932128906, 0.32695770263671875, 0.3371086120605469, 0.347259521484375, 0.3574104309082031, 0.36756134033203125, 0.3777122497558594, 0.3878631591796875, 0.3980140686035156, 0.40816497802734375, 0.4183158874511719, 0.428466796875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 9.0, 9.0, 13.0, 16.0, 20.0, 17.0, 30.0, 37.0, 75.0, 129.0, 242.0, 457.0, 1010.0, 2904.0, 9280.0, 39662.0, 208538.0, 564934.0, 174709.0, 33849.0, 8253.0, 2456.0, 939.0, 405.0, 214.0, 127.0, 64.0, 48.0, 35.0, 23.0, 19.0, 12.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.1171875, -1.0856704711914062, -1.0541534423828125, -1.0226364135742188, -0.991119384765625, -0.9596023559570312, -0.9280853271484375, -0.8965682983398438, -0.86505126953125, -0.8335342407226562, -0.8020172119140625, -0.7705001831054688, -0.738983154296875, -0.7074661254882812, -0.6759490966796875, -0.6444320678710938, -0.6129150390625, -0.5813980102539062, -0.5498809814453125, -0.5183639526367188, -0.486846923828125, -0.45532989501953125, -0.4238128662109375, -0.39229583740234375, -0.36077880859375, -0.32926177978515625, -0.2977447509765625, -0.26622772216796875, -0.234710693359375, -0.20319366455078125, -0.1716766357421875, -0.14015960693359375, -0.108642578125, -0.07712554931640625, -0.0456085205078125, -0.01409149169921875, 0.017425537109375, 0.04894256591796875, 0.0804595947265625, 0.11197662353515625, 0.14349365234375, 0.17501068115234375, 0.2065277099609375, 0.23804473876953125, 0.269561767578125, 0.30107879638671875, 0.3325958251953125, 0.36411285400390625, 0.3956298828125, 0.42714691162109375, 0.4586639404296875, 0.49018096923828125, 0.521697998046875, 0.5532150268554688, 0.5847320556640625, 0.6162490844726562, 0.64776611328125, 0.6792831420898438, 0.7108001708984375, 0.7423171997070312, 0.773834228515625, 0.8053512573242188, 0.8368682861328125, 0.8683853149414062, 0.89990234375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 6.0, 6.0, 5.0, 16.0, 5.0, 15.0, 14.0, 11.0, 19.0, 23.0, 41.0, 27.0, 31.0, 39.0, 38.0, 45.0, 40.0, 50.0, 48.0, 55.0, 58.0, 51.0, 41.0, 40.0, 46.0, 31.0, 29.0, 22.0, 21.0, 26.0, 19.0, 22.0, 8.0, 12.0, 7.0, 12.0, 4.0, 8.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5660629272460938, -0.5452117919921875, -0.5243606567382812, -0.503509521484375, -0.48265838623046875, -0.4618072509765625, -0.44095611572265625, -0.42010498046875, -0.39925384521484375, -0.3784027099609375, -0.35755157470703125, -0.336700439453125, -0.31584930419921875, -0.2949981689453125, -0.27414703369140625, -0.2532958984375, -0.23244476318359375, -0.2115936279296875, -0.19074249267578125, -0.169891357421875, -0.14904022216796875, -0.1281890869140625, -0.10733795166015625, -0.08648681640625, -0.06563568115234375, -0.0447845458984375, -0.02393341064453125, -0.003082275390625, 0.01776885986328125, 0.0386199951171875, 0.05947113037109375, 0.080322265625, 0.10117340087890625, 0.1220245361328125, 0.14287567138671875, 0.163726806640625, 0.18457794189453125, 0.2054290771484375, 0.22628021240234375, 0.24713134765625, 0.26798248291015625, 0.2888336181640625, 0.30968475341796875, 0.330535888671875, 0.35138702392578125, 0.3722381591796875, 0.39308929443359375, 0.4139404296875, 0.43479156494140625, 0.4556427001953125, 0.47649383544921875, 0.497344970703125, 0.5181961059570312, 0.5390472412109375, 0.5598983764648438, 0.58074951171875, 0.6016006469726562, 0.6224517822265625, 0.6433029174804688, 0.664154052734375, 0.6850051879882812, 0.7058563232421875, 0.7267074584960938, 0.74755859375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 11.0, 17.0, 53.0, 168.0, 415.0, 3352.0, 876505.0, 165968.0, 1585.0, 280.0, 124.0, 46.0, 13.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.888671875, -1.831207275390625, -1.77374267578125, -1.716278076171875, -1.6588134765625, -1.601348876953125, -1.54388427734375, -1.486419677734375, -1.428955078125, -1.371490478515625, -1.31402587890625, -1.256561279296875, -1.1990966796875, -1.141632080078125, -1.08416748046875, -1.026702880859375, -0.96923828125, -0.911773681640625, -0.85430908203125, -0.796844482421875, -0.7393798828125, -0.681915283203125, -0.62445068359375, -0.566986083984375, -0.509521484375, -0.452056884765625, -0.39459228515625, -0.337127685546875, -0.2796630859375, -0.222198486328125, -0.16473388671875, -0.107269287109375, -0.0498046875, 0.007659912109375, 0.06512451171875, 0.122589111328125, 0.1800537109375, 0.237518310546875, 0.29498291015625, 0.352447509765625, 0.409912109375, 0.467376708984375, 0.52484130859375, 0.582305908203125, 0.6397705078125, 0.697235107421875, 0.75469970703125, 0.812164306640625, 0.86962890625, 0.927093505859375, 0.98455810546875, 1.042022705078125, 1.0994873046875, 1.156951904296875, 1.21441650390625, 1.271881103515625, 1.329345703125, 1.386810302734375, 1.44427490234375, 1.501739501953125, 1.5592041015625, 1.616668701171875, 1.67413330078125, 1.731597900390625, 1.7890625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 4.0, 11.0, 11.0, 21.0, 26.0, 49.0, 75.0, 91.0, 137.0, 162.0, 126.0, 108.0, 66.0, 49.0, 27.0, 17.0, 7.0, 10.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.259845733642578e-05, -6.901286542415619e-05, -6.54272735118866e-05, -6.1841681599617e-05, -5.825608968734741e-05, -5.467049777507782e-05, -5.108490586280823e-05, -4.7499313950538635e-05, -4.391372203826904e-05, -4.032813012599945e-05, -3.674253821372986e-05, -3.3156946301460266e-05, -2.9571354389190674e-05, -2.598576247692108e-05, -2.240017056465149e-05, -1.8814578652381897e-05, -1.5228986740112305e-05, -1.1643394827842712e-05, -8.05780291557312e-06, -4.472211003303528e-06, -8.866190910339355e-07, 2.6989728212356567e-06, 6.284564733505249e-06, 9.870156645774841e-06, 1.3455748558044434e-05, 1.7041340470314026e-05, 2.0626932382583618e-05, 2.421252429485321e-05, 2.7798116207122803e-05, 3.1383708119392395e-05, 3.496930003166199e-05, 3.855489194393158e-05, 4.214048385620117e-05, 4.5726075768470764e-05, 4.9311667680740356e-05, 5.289725959300995e-05, 5.648285150527954e-05, 6.006844341754913e-05, 6.365403532981873e-05, 6.723962724208832e-05, 7.082521915435791e-05, 7.44108110666275e-05, 7.79964029788971e-05, 8.158199489116669e-05, 8.516758680343628e-05, 8.875317871570587e-05, 9.233877062797546e-05, 9.592436254024506e-05, 9.950995445251465e-05, 0.00010309554636478424, 0.00010668113827705383, 0.00011026673018932343, 0.00011385232210159302, 0.00011743791401386261, 0.0001210235059261322, 0.0001246090978384018, 0.0001281946897506714, 0.00013178028166294098, 0.00013536587357521057, 0.00013895146548748016, 0.00014253705739974976, 0.00014612264931201935, 0.00014970824122428894, 0.00015329383313655853, 0.00015687942504882812]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 19.0, 55.0, 119.0, 346.0, 3380.0, 1033962.0, 9997.0, 424.0, 165.0, 61.0, 19.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.345703125, -2.26904296875, -2.1923828125, -2.11572265625, -2.0390625, -1.96240234375, -1.8857421875, -1.80908203125, -1.732421875, -1.65576171875, -1.5791015625, -1.50244140625, -1.42578125, -1.34912109375, -1.2724609375, -1.19580078125, -1.119140625, -1.04248046875, -0.9658203125, -0.88916015625, -0.8125, -0.73583984375, -0.6591796875, -0.58251953125, -0.505859375, -0.42919921875, -0.3525390625, -0.27587890625, -0.19921875, -0.12255859375, -0.0458984375, 0.03076171875, 0.107421875, 0.18408203125, 0.2607421875, 0.33740234375, 0.4140625, 0.49072265625, 0.5673828125, 0.64404296875, 0.720703125, 0.79736328125, 0.8740234375, 0.95068359375, 1.02734375, 1.10400390625, 1.1806640625, 1.25732421875, 1.333984375, 1.41064453125, 1.4873046875, 1.56396484375, 1.640625, 1.71728515625, 1.7939453125, 1.87060546875, 1.947265625, 2.02392578125, 2.1005859375, 2.17724609375, 2.25390625, 2.33056640625, 2.4072265625, 2.48388671875, 2.560546875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 9.0, 12.0, 95.0, 331.0, 406.0, 127.0, 20.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.4935455322265625, -1.442169189453125, -1.3907928466796875, -1.33941650390625, -1.2880401611328125, -1.236663818359375, -1.1852874755859375, -1.1339111328125, -1.0825347900390625, -1.031158447265625, -0.9797821044921875, -0.92840576171875, -0.8770294189453125, -0.825653076171875, -0.7742767333984375, -0.722900390625, -0.6715240478515625, -0.620147705078125, -0.5687713623046875, -0.51739501953125, -0.4660186767578125, -0.414642333984375, -0.3632659912109375, -0.3118896484375, -0.2605133056640625, -0.209136962890625, -0.1577606201171875, -0.10638427734375, -0.0550079345703125, -0.003631591796875, 0.0477447509765625, 0.09912109375, 0.1504974365234375, 0.201873779296875, 0.2532501220703125, 0.30462646484375, 0.3560028076171875, 0.407379150390625, 0.4587554931640625, 0.5101318359375, 0.5615081787109375, 0.612884521484375, 0.6642608642578125, 0.71563720703125, 0.7670135498046875, 0.818389892578125, 0.8697662353515625, 0.921142578125, 0.9725189208984375, 1.023895263671875, 1.0752716064453125, 1.12664794921875, 1.1780242919921875, 1.229400634765625, 1.2807769775390625, 1.3321533203125, 1.3835296630859375, 1.434906005859375, 1.4862823486328125, 1.53765869140625, 1.5890350341796875, 1.640411376953125, 1.6917877197265625, 1.7431640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 8.0, 12.0, 25.0, 95.0, 213.0, 310.0, 208.0, 87.0, 26.0, 16.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.107353210449219, -7.7137064933776855, -7.3200602531433105, -6.926413536071777, -6.532767295837402, -6.139120578765869, -5.745473861694336, -5.351827621459961, -4.958180904388428, -4.5645341873168945, -4.1708879470825195, -3.7772412300109863, -3.3835947513580322, -2.989948272705078, -2.596301555633545, -2.202655076980591, -1.8090085983276367, -1.4153621196746826, -1.021715521812439, -0.6280689239501953, -0.2344224452972412, 0.1592240333557129, 0.5528707504272461, 0.9465172290802002, 1.3401637077331543, 1.7338101863861084, 2.1274566650390625, 2.5211033821105957, 2.91474986076355, 3.308396339416504, 3.702043056488037, 4.09568977355957, 4.489336013793945, 4.8829827308654785, 5.2766289710998535, 5.670275688171387, 6.063921928405762, 6.457568645477295, 6.851215362548828, 7.244861602783203, 7.638508319854736, 8.03215503692627, 8.425801277160645, 8.819448471069336, 9.213094711303711, 9.606740951538086, 10.000387191772461, 10.394034385681152, 10.787680625915527, 11.181326866149902, 11.574974060058594, 11.968620300292969, 12.362266540527344, 12.755912780761719, 13.14955997467041, 13.543206214904785, 13.936853408813477, 14.330499649047852, 14.724146842956543, 15.117793083190918, 15.511439323425293, 15.905086517333984, 16.29873275756836, 16.692378997802734, 17.08602523803711]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 8.0, 10.0, 5.0, 13.0, 15.0, 7.0, 14.0, 23.0, 24.0, 21.0, 28.0, 29.0, 23.0, 38.0, 40.0, 35.0, 43.0, 36.0, 50.0, 32.0, 40.0, 43.0, 39.0, 36.0, 54.0, 39.0, 31.0, 34.0, 23.0, 27.0, 24.0, 21.0, 24.0, 12.0, 11.0, 7.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 4.0, 1.0, 5.0], "bins": [-3.5458197593688965, -3.450713872909546, -3.3556082248687744, -3.260502338409424, -3.1653966903686523, -3.0702908039093018, -2.975184917449951, -2.8800792694091797, -2.784973621368408, -2.6898677349090576, -2.594762086868286, -2.4996562004089355, -2.404550552368164, -2.3094446659088135, -2.214338779449463, -2.1192331314086914, -2.024127244949341, -1.9290214776992798, -1.8339157104492188, -1.7388098239898682, -1.6437041759490967, -1.548598289489746, -1.453492522239685, -1.358386754989624, -1.263280987739563, -1.168175220489502, -1.073069453239441, -0.9779636263847351, -0.8828578591346741, -0.787752091884613, -0.6926462650299072, -0.5975404977798462, -0.502434492111206, -0.407328724861145, -0.3122229278087616, -0.21711713075637817, -0.12201136350631714, -0.026905596256256104, 0.06820023059844971, 0.16330599784851074, 0.2584117650985718, 0.3535175323486328, 0.44862332940101624, 0.5437291264533997, 0.6388348937034607, 0.7339406609535217, 0.8290464878082275, 0.9241522550582886, 1.0192580223083496, 1.1143637895584106, 1.2094695568084717, 1.3045754432678223, 1.3996810913085938, 1.4947869777679443, 1.5898927450180054, 1.6849985122680664, 1.7801042795181274, 1.8752100467681885, 1.9703158140182495, 2.0654215812683105, 2.160527467727661, 2.2556331157684326, 2.350739002227783, 2.4458446502685547, 2.5409505367279053]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 4.0, 2.0, 9.0, 3.0, 11.0, 26.0, 31.0, 36.0, 62.0, 131.0, 196.0, 404.0, 861.0, 2048.0, 7225.0, 37962.0, 1496392.0, 2598875.0, 38647.0, 7203.0, 2167.0, 832.0, 411.0, 216.0, 147.0, 97.0, 61.0, 61.0, 39.0, 28.0, 22.0, 18.0, 15.0, 7.0, 9.0, 4.0, 4.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.4150390625, -1.3645172119140625, -1.313995361328125, -1.2634735107421875, -1.21295166015625, -1.1624298095703125, -1.111907958984375, -1.0613861083984375, -1.0108642578125, -0.9603424072265625, -0.909820556640625, -0.8592987060546875, -0.80877685546875, -0.7582550048828125, -0.707733154296875, -0.6572113037109375, -0.606689453125, -0.5561676025390625, -0.505645751953125, -0.4551239013671875, -0.40460205078125, -0.3540802001953125, -0.303558349609375, -0.2530364990234375, -0.2025146484375, -0.1519927978515625, -0.101470947265625, -0.0509490966796875, -0.00042724609375, 0.0500946044921875, 0.100616455078125, 0.1511383056640625, 0.20166015625, 0.2521820068359375, 0.302703857421875, 0.3532257080078125, 0.40374755859375, 0.4542694091796875, 0.504791259765625, 0.5553131103515625, 0.6058349609375, 0.6563568115234375, 0.706878662109375, 0.7574005126953125, 0.80792236328125, 0.8584442138671875, 0.908966064453125, 0.9594879150390625, 1.010009765625, 1.0605316162109375, 1.111053466796875, 1.1615753173828125, 1.21209716796875, 1.2626190185546875, 1.313140869140625, 1.3636627197265625, 1.4141845703125, 1.4647064208984375, 1.515228271484375, 1.5657501220703125, 1.61627197265625, 1.6667938232421875, 1.717315673828125, 1.7678375244140625, 1.818359375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 17.0, 14.0, 31.0, 63.0, 94.0, 98.0, 94.0, 112.0, 110.0, 77.0, 74.0, 72.0, 41.0, 37.0, 26.0, 12.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2607421875, -0.2492218017578125, -0.237701416015625, -0.2261810302734375, -0.21466064453125, -0.2031402587890625, -0.191619873046875, -0.1800994873046875, -0.1685791015625, -0.1570587158203125, -0.145538330078125, -0.1340179443359375, -0.12249755859375, -0.1109771728515625, -0.099456787109375, -0.0879364013671875, -0.076416015625, -0.0648956298828125, -0.053375244140625, -0.0418548583984375, -0.03033447265625, -0.0188140869140625, -0.007293701171875, 0.0042266845703125, 0.0157470703125, 0.0272674560546875, 0.038787841796875, 0.0503082275390625, 0.06182861328125, 0.0733489990234375, 0.084869384765625, 0.0963897705078125, 0.10791015625, 0.1194305419921875, 0.130950927734375, 0.1424713134765625, 0.15399169921875, 0.1655120849609375, 0.177032470703125, 0.1885528564453125, 0.2000732421875, 0.2115936279296875, 0.223114013671875, 0.2346343994140625, 0.24615478515625, 0.2576751708984375, 0.269195556640625, 0.2807159423828125, 0.292236328125, 0.3037567138671875, 0.315277099609375, 0.3267974853515625, 0.33831787109375, 0.3498382568359375, 0.361358642578125, 0.3728790283203125, 0.3843994140625, 0.3959197998046875, 0.407440185546875, 0.4189605712890625, 0.43048095703125, 0.4420013427734375, 0.453521728515625, 0.4650421142578125, 0.4765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 9.0, 9.0, 22.0, 34.0, 63.0, 107.0, 184.0, 431.0, 876.0, 2335.0, 9067.0, 87146.0, 3931138.0, 145602.0, 12395.0, 2928.0, 1033.0, 448.0, 210.0, 108.0, 65.0, 35.0, 16.0, 10.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.5546875, -2.496063232421875, -2.43743896484375, -2.378814697265625, -2.3201904296875, -2.261566162109375, -2.20294189453125, -2.144317626953125, -2.085693359375, -2.027069091796875, -1.96844482421875, -1.909820556640625, -1.8511962890625, -1.792572021484375, -1.73394775390625, -1.675323486328125, -1.61669921875, -1.558074951171875, -1.49945068359375, -1.440826416015625, -1.3822021484375, -1.323577880859375, -1.26495361328125, -1.206329345703125, -1.147705078125, -1.089080810546875, -1.03045654296875, -0.971832275390625, -0.9132080078125, -0.854583740234375, -0.79595947265625, -0.737335205078125, -0.6787109375, -0.620086669921875, -0.56146240234375, -0.502838134765625, -0.4442138671875, -0.385589599609375, -0.32696533203125, -0.268341064453125, -0.209716796875, -0.151092529296875, -0.09246826171875, -0.033843994140625, 0.0247802734375, 0.083404541015625, 0.14202880859375, 0.200653076171875, 0.25927734375, 0.317901611328125, 0.37652587890625, 0.435150146484375, 0.4937744140625, 0.552398681640625, 0.61102294921875, 0.669647216796875, 0.728271484375, 0.786895751953125, 0.84552001953125, 0.904144287109375, 0.9627685546875, 1.021392822265625, 1.08001708984375, 1.138641357421875, 1.197265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 16.0, 15.0, 33.0, 51.0, 97.0, 272.0, 1411.0, 1590.0, 294.0, 106.0, 59.0, 53.0, 34.0, 10.0, 11.0, 4.0, 5.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64208984375, -0.623748779296875, -0.60540771484375, -0.587066650390625, -0.5687255859375, -0.550384521484375, -0.53204345703125, -0.513702392578125, -0.495361328125, -0.477020263671875, -0.45867919921875, -0.440338134765625, -0.4219970703125, -0.403656005859375, -0.38531494140625, -0.366973876953125, -0.3486328125, -0.330291748046875, -0.31195068359375, -0.293609619140625, -0.2752685546875, -0.256927490234375, -0.23858642578125, -0.220245361328125, -0.201904296875, -0.183563232421875, -0.16522216796875, -0.146881103515625, -0.1285400390625, -0.110198974609375, -0.09185791015625, -0.073516845703125, -0.05517578125, -0.036834716796875, -0.01849365234375, -0.000152587890625, 0.0181884765625, 0.036529541015625, 0.05487060546875, 0.073211669921875, 0.091552734375, 0.109893798828125, 0.12823486328125, 0.146575927734375, 0.1649169921875, 0.183258056640625, 0.20159912109375, 0.219940185546875, 0.23828125, 0.256622314453125, 0.27496337890625, 0.293304443359375, 0.3116455078125, 0.329986572265625, 0.34832763671875, 0.366668701171875, 0.385009765625, 0.403350830078125, 0.42169189453125, 0.440032958984375, 0.4583740234375, 0.476715087890625, 0.49505615234375, 0.513397216796875, 0.53173828125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 1.0, 7.0, 27.0, 105.0, 409.0, 342.0, 84.0, 18.0, 5.0, 7.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.522583961486816, -4.281192302703857, -4.039801120758057, -3.7984094619750977, -3.5570180416107178, -3.315626621246338, -3.074235200881958, -2.832843780517578, -2.591452121734619, -2.3500607013702393, -2.1086692810058594, -1.86727774143219, -1.6258862018585205, -1.3844947814941406, -1.1431033611297607, -0.9017118215560913, -0.660320520401001, -0.4189290404319763, -0.17753759026527405, 0.06385385990142822, 0.3052453398704529, 0.5466368198394775, 0.7880282402038574, 1.0294197797775269, 1.2708112001419067, 1.5122026205062866, 1.753594160079956, 1.994985580444336, 2.236377000808716, 2.4777684211730957, 2.7191600799560547, 2.9605515003204346, 3.2019429206848145, 3.4433343410491943, 3.684725761413574, 3.926117420196533, 4.167508602142334, 4.408900260925293, 4.650291442871094, 4.891683101654053, 5.133074760437012, 5.374466419219971, 5.6158576011657715, 5.8572492599487305, 6.098640441894531, 6.34003210067749, 6.581423759460449, 6.82281494140625, 7.064206123352051, 7.30559778213501, 7.5469889640808105, 7.7883806228637695, 8.02977180480957, 8.271163940429688, 8.512555122375488, 8.753946304321289, 8.995338439941406, 9.236729621887207, 9.478121757507324, 9.719512939453125, 9.960904121398926, 10.202295303344727, 10.443687438964844, 10.685078620910645, 10.926469802856445]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 9.0, 13.0, 17.0, 27.0, 39.0, 37.0, 57.0, 66.0, 74.0, 74.0, 84.0, 81.0, 89.0, 75.0, 56.0, 56.0, 30.0, 31.0, 31.0, 21.0, 12.0, 4.0, 4.0, 5.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9352753162384033, -1.8642559051513672, -1.7932363748550415, -1.7222169637680054, -1.6511974334716797, -1.5801780223846436, -1.5091586112976074, -1.4381392002105713, -1.3671196699142456, -1.2961002588272095, -1.2250807285308838, -1.1540613174438477, -1.0830419063568115, -1.0120223760604858, -0.9410029649734497, -0.8699834942817688, -0.7989640235900879, -0.727944552898407, -0.6569250822067261, -0.5859056711196899, -0.514886200428009, -0.4438667297363281, -0.3728472888469696, -0.3018278479576111, -0.23080837726593018, -0.15978892147541046, -0.08876946568489075, -0.017750009894371033, 0.05326944589614868, 0.12428891658782959, 0.1953083574771881, 0.26632779836654663, 0.33734703063964844, 0.40836650133132935, 0.47938594222068787, 0.5504053831100464, 0.6214248538017273, 0.6924443244934082, 0.7634637355804443, 0.8344832062721252, 0.9055026769638062, 0.9765221476554871, 1.047541618347168, 1.118561029434204, 1.1895804405212402, 1.260599970817566, 1.331619381904602, 1.4026389122009277, 1.4736583232879639, 1.544677734375, 1.6156972646713257, 1.6867166757583618, 1.7577362060546875, 1.8287556171417236, 1.8997750282287598, 1.970794439315796, 2.041813850402832, 2.112833261489868, 2.1838526725769043, 2.2548723220825195, 2.3258917331695557, 2.396911144256592, 2.467930555343628, 2.538949966430664, 2.6099696159362793]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 9.0, 5.0, 8.0, 12.0, 16.0, 24.0, 42.0, 69.0, 73.0, 136.0, 223.0, 394.0, 888.0, 2432.0, 10022.0, 64780.0, 515307.0, 394771.0, 47751.0, 7851.0, 2055.0, 787.0, 353.0, 197.0, 102.0, 88.0, 42.0, 40.0, 22.0, 14.0, 9.0, 10.0, 9.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1728515625, -1.1216888427734375, -1.070526123046875, -1.0193634033203125, -0.96820068359375, -0.9170379638671875, -0.865875244140625, -0.8147125244140625, -0.7635498046875, -0.7123870849609375, -0.661224365234375, -0.6100616455078125, -0.55889892578125, -0.5077362060546875, -0.456573486328125, -0.4054107666015625, -0.354248046875, -0.3030853271484375, -0.251922607421875, -0.2007598876953125, -0.14959716796875, -0.0984344482421875, -0.047271728515625, 0.0038909912109375, 0.0550537109375, 0.1062164306640625, 0.157379150390625, 0.2085418701171875, 0.25970458984375, 0.3108673095703125, 0.362030029296875, 0.4131927490234375, 0.46435546875, 0.5155181884765625, 0.566680908203125, 0.6178436279296875, 0.66900634765625, 0.7201690673828125, 0.771331787109375, 0.8224945068359375, 0.8736572265625, 0.9248199462890625, 0.975982666015625, 1.0271453857421875, 1.07830810546875, 1.1294708251953125, 1.180633544921875, 1.2317962646484375, 1.282958984375, 1.3341217041015625, 1.385284423828125, 1.4364471435546875, 1.48760986328125, 1.5387725830078125, 1.589935302734375, 1.6410980224609375, 1.6922607421875, 1.7434234619140625, 1.794586181640625, 1.8457489013671875, 1.89691162109375, 1.9480743408203125, 1.999237060546875, 2.0503997802734375, 2.1015625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 11.0, 21.0, 31.0, 56.0, 74.0, 100.0, 105.0, 120.0, 127.0, 76.0, 100.0, 67.0, 45.0, 29.0, 17.0, 9.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2683906555175781, -0.25479888916015625, -0.24120712280273438, -0.2276153564453125, -0.21402359008789062, -0.20043182373046875, -0.18684005737304688, -0.173248291015625, -0.15965652465820312, -0.14606475830078125, -0.13247299194335938, -0.1188812255859375, -0.10528945922851562, -0.09169769287109375, -0.07810592651367188, -0.06451416015625, -0.050922393798828125, -0.03733062744140625, -0.023738861083984375, -0.0101470947265625, 0.003444671630859375, 0.01703643798828125, 0.030628204345703125, 0.044219970703125, 0.057811737060546875, 0.07140350341796875, 0.08499526977539062, 0.0985870361328125, 0.11217880249023438, 0.12577056884765625, 0.13936233520507812, 0.1529541015625, 0.16654586791992188, 0.18013763427734375, 0.19372940063476562, 0.2073211669921875, 0.22091293334960938, 0.23450469970703125, 0.24809646606445312, 0.261688232421875, 0.2752799987792969, 0.28887176513671875, 0.3024635314941406, 0.3160552978515625, 0.3296470642089844, 0.34323883056640625, 0.3568305969238281, 0.37042236328125, 0.3840141296386719, 0.39760589599609375, 0.4111976623535156, 0.4247894287109375, 0.4383811950683594, 0.45197296142578125, 0.4655647277832031, 0.479156494140625, 0.4927482604980469, 0.5063400268554688, 0.5199317932128906, 0.5335235595703125, 0.5471153259277344, 0.5607070922851562, 0.5742988586425781, 0.587890625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 13.0, 10.0, 28.0, 29.0, 45.0, 63.0, 113.0, 172.0, 352.0, 674.0, 1676.0, 4958.0, 17921.0, 73710.0, 318234.0, 466619.0, 122869.0, 28864.0, 7829.0, 2429.0, 931.0, 423.0, 195.0, 126.0, 74.0, 47.0, 39.0, 30.0, 15.0, 9.0, 11.0, 7.0, 4.0, 3.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.9931640625, -0.9649276733398438, -0.9366912841796875, -0.9084548950195312, -0.880218505859375, -0.8519821166992188, -0.8237457275390625, -0.7955093383789062, -0.76727294921875, -0.7390365600585938, -0.7108001708984375, -0.6825637817382812, -0.654327392578125, -0.6260910034179688, -0.5978546142578125, -0.5696182250976562, -0.5413818359375, -0.5131454467773438, -0.4849090576171875, -0.45667266845703125, -0.428436279296875, -0.40019989013671875, -0.3719635009765625, -0.34372711181640625, -0.31549072265625, -0.28725433349609375, -0.2590179443359375, -0.23078155517578125, -0.202545166015625, -0.17430877685546875, -0.1460723876953125, -0.11783599853515625, -0.089599609375, -0.06136322021484375, -0.0331268310546875, -0.00489044189453125, 0.023345947265625, 0.05158233642578125, 0.0798187255859375, 0.10805511474609375, 0.13629150390625, 0.16452789306640625, 0.1927642822265625, 0.22100067138671875, 0.249237060546875, 0.27747344970703125, 0.3057098388671875, 0.33394622802734375, 0.3621826171875, 0.39041900634765625, 0.4186553955078125, 0.44689178466796875, 0.475128173828125, 0.5033645629882812, 0.5316009521484375, 0.5598373413085938, 0.58807373046875, 0.6163101196289062, 0.6445465087890625, 0.6727828979492188, 0.701019287109375, 0.7292556762695312, 0.7574920654296875, 0.7857284545898438, 0.81396484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 8.0, 4.0, 8.0, 6.0, 14.0, 14.0, 18.0, 18.0, 28.0, 25.0, 24.0, 30.0, 35.0, 46.0, 45.0, 54.0, 46.0, 45.0, 40.0, 39.0, 40.0, 41.0, 38.0, 47.0, 34.0, 30.0, 36.0, 18.0, 29.0, 25.0, 23.0, 16.0, 19.0, 13.0, 7.0, 5.0, 6.0, 5.0, 6.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6577529907226562, -0.6363067626953125, -0.6148605346679688, -0.593414306640625, -0.5719680786132812, -0.5505218505859375, -0.5290756225585938, -0.50762939453125, -0.48618316650390625, -0.4647369384765625, -0.44329071044921875, -0.421844482421875, -0.40039825439453125, -0.3789520263671875, -0.35750579833984375, -0.3360595703125, -0.31461334228515625, -0.2931671142578125, -0.27172088623046875, -0.250274658203125, -0.22882843017578125, -0.2073822021484375, -0.18593597412109375, -0.16448974609375, -0.14304351806640625, -0.1215972900390625, -0.10015106201171875, -0.078704833984375, -0.05725860595703125, -0.0358123779296875, -0.01436614990234375, 0.007080078125, 0.02852630615234375, 0.0499725341796875, 0.07141876220703125, 0.092864990234375, 0.11431121826171875, 0.1357574462890625, 0.15720367431640625, 0.17864990234375, 0.20009613037109375, 0.2215423583984375, 0.24298858642578125, 0.264434814453125, 0.28588104248046875, 0.3073272705078125, 0.32877349853515625, 0.3502197265625, 0.37166595458984375, 0.3931121826171875, 0.41455841064453125, 0.436004638671875, 0.45745086669921875, 0.4788970947265625, 0.5003433227539062, 0.52178955078125, 0.5432357788085938, 0.5646820068359375, 0.5861282348632812, 0.607574462890625, 0.6290206909179688, 0.6504669189453125, 0.6719131469726562, 0.693359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 10.0, 4.0, 10.0, 18.0, 18.0, 33.0, 58.0, 62.0, 113.0, 194.0, 427.0, 932.0, 3172.0, 19614.0, 243758.0, 692029.0, 76896.0, 8172.0, 1704.0, 592.0, 263.0, 159.0, 108.0, 67.0, 44.0, 38.0, 15.0, 16.0, 13.0, 3.0, 8.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.392578125, -0.3757171630859375, -0.358856201171875, -0.3419952392578125, -0.32513427734375, -0.3082733154296875, -0.291412353515625, -0.2745513916015625, -0.2576904296875, -0.2408294677734375, -0.223968505859375, -0.2071075439453125, -0.19024658203125, -0.1733856201171875, -0.156524658203125, -0.1396636962890625, -0.122802734375, -0.1059417724609375, -0.089080810546875, -0.0722198486328125, -0.05535888671875, -0.0384979248046875, -0.021636962890625, -0.0047760009765625, 0.0120849609375, 0.0289459228515625, 0.045806884765625, 0.0626678466796875, 0.07952880859375, 0.0963897705078125, 0.113250732421875, 0.1301116943359375, 0.14697265625, 0.1638336181640625, 0.180694580078125, 0.1975555419921875, 0.21441650390625, 0.2312774658203125, 0.248138427734375, 0.2649993896484375, 0.2818603515625, 0.2987213134765625, 0.315582275390625, 0.3324432373046875, 0.34930419921875, 0.3661651611328125, 0.383026123046875, 0.3998870849609375, 0.416748046875, 0.4336090087890625, 0.450469970703125, 0.4673309326171875, 0.48419189453125, 0.5010528564453125, 0.517913818359375, 0.5347747802734375, 0.5516357421875, 0.5684967041015625, 0.585357666015625, 0.6022186279296875, 0.61907958984375, 0.6359405517578125, 0.652801513671875, 0.6696624755859375, 0.6865234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 9.0, 19.0, 32.0, 49.0, 79.0, 144.0, 202.0, 182.0, 126.0, 71.0, 49.0, 15.0, 11.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.577108383178711e-05, -8.091423660516739e-05, -7.605738937854767e-05, -7.120054215192795e-05, -6.634369492530823e-05, -6.148684769868851e-05, -5.663000047206879e-05, -5.1773153245449066e-05, -4.6916306018829346e-05, -4.2059458792209625e-05, -3.7202611565589905e-05, -3.2345764338970184e-05, -2.7488917112350464e-05, -2.2632069885730743e-05, -1.7775222659111023e-05, -1.2918375432491302e-05, -8.061528205871582e-06, -3.2046809792518616e-06, 1.6521662473678589e-06, 6.509013473987579e-06, 1.13658607006073e-05, 1.622270792722702e-05, 2.107955515384674e-05, 2.593640238046646e-05, 3.079324960708618e-05, 3.56500968337059e-05, 4.050694406032562e-05, 4.536379128694534e-05, 5.0220638513565063e-05, 5.5077485740184784e-05, 5.9934332966804504e-05, 6.479118019342422e-05, 6.964802742004395e-05, 7.450487464666367e-05, 7.936172187328339e-05, 8.42185690999031e-05, 8.907541632652283e-05, 9.393226355314255e-05, 9.878911077976227e-05, 0.00010364595800638199, 0.00010850280523300171, 0.00011335965245962143, 0.00011821649968624115, 0.00012307334691286087, 0.0001279301941394806, 0.0001327870413661003, 0.00013764388859272003, 0.00014250073581933975, 0.00014735758304595947, 0.0001522144302725792, 0.00015707127749919891, 0.00016192812472581863, 0.00016678497195243835, 0.00017164181917905807, 0.0001764986664056778, 0.00018135551363229752, 0.00018621236085891724, 0.00019106920808553696, 0.00019592605531215668, 0.0002007829025387764, 0.00020563974976539612, 0.00021049659699201584, 0.00021535344421863556, 0.00022021029144525528, 0.000225067138671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 13.0, 18.0, 24.0, 69.0, 131.0, 320.0, 876.0, 4033.0, 59561.0, 861998.0, 113617.0, 6103.0, 1105.0, 368.0, 171.0, 74.0, 35.0, 16.0, 12.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85009765625, -0.827484130859375, -0.80487060546875, -0.782257080078125, -0.7596435546875, -0.737030029296875, -0.71441650390625, -0.691802978515625, -0.669189453125, -0.646575927734375, -0.62396240234375, -0.601348876953125, -0.5787353515625, -0.556121826171875, -0.53350830078125, -0.510894775390625, -0.48828125, -0.465667724609375, -0.44305419921875, -0.420440673828125, -0.3978271484375, -0.375213623046875, -0.35260009765625, -0.329986572265625, -0.307373046875, -0.284759521484375, -0.26214599609375, -0.239532470703125, -0.2169189453125, -0.194305419921875, -0.17169189453125, -0.149078369140625, -0.12646484375, -0.103851318359375, -0.08123779296875, -0.058624267578125, -0.0360107421875, -0.013397216796875, 0.00921630859375, 0.031829833984375, 0.054443359375, 0.077056884765625, 0.09967041015625, 0.122283935546875, 0.1448974609375, 0.167510986328125, 0.19012451171875, 0.212738037109375, 0.2353515625, 0.257965087890625, 0.28057861328125, 0.303192138671875, 0.3258056640625, 0.348419189453125, 0.37103271484375, 0.393646240234375, 0.416259765625, 0.438873291015625, 0.46148681640625, 0.484100341796875, 0.5067138671875, 0.529327392578125, 0.55194091796875, 0.574554443359375, 0.59716796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 12.0, 16.0, 31.0, 66.0, 121.0, 211.0, 217.0, 128.0, 95.0, 47.0, 25.0, 11.0, 9.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9072265625, -0.8871574401855469, -0.8670883178710938, -0.8470191955566406, -0.8269500732421875, -0.8068809509277344, -0.7868118286132812, -0.7667427062988281, -0.746673583984375, -0.7266044616699219, -0.7065353393554688, -0.6864662170410156, -0.6663970947265625, -0.6463279724121094, -0.6262588500976562, -0.6061897277832031, -0.58612060546875, -0.5660514831542969, -0.5459823608398438, -0.5259132385253906, -0.5058441162109375, -0.4857749938964844, -0.46570587158203125, -0.4456367492675781, -0.425567626953125, -0.4054985046386719, -0.38542938232421875, -0.3653602600097656, -0.3452911376953125, -0.3252220153808594, -0.30515289306640625, -0.2850837707519531, -0.2650146484375, -0.24494552612304688, -0.22487640380859375, -0.20480728149414062, -0.1847381591796875, -0.16466903686523438, -0.14459991455078125, -0.12453079223632812, -0.104461669921875, -0.08439254760742188, -0.06432342529296875, -0.044254302978515625, -0.0241851806640625, -0.004116058349609375, 0.01595306396484375, 0.036022186279296875, 0.05609130859375, 0.07616043090820312, 0.09622955322265625, 0.11629867553710938, 0.1363677978515625, 0.15643692016601562, 0.17650604248046875, 0.19657516479492188, 0.216644287109375, 0.23671340942382812, 0.25678253173828125, 0.2768516540527344, 0.2969207763671875, 0.3169898986816406, 0.33705902099609375, 0.3571281433105469, 0.377197265625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 4.0, 7.0, 10.0, 15.0, 23.0, 47.0, 53.0, 84.0, 100.0, 141.0, 133.0, 117.0, 108.0, 54.0, 34.0, 25.0, 22.0, 6.0, 10.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.417672157287598, -7.24643611907959, -7.075200080871582, -6.903964042663574, -6.732728004455566, -6.561491966247559, -6.390255928039551, -6.219019889831543, -6.047783851623535, -5.876547813415527, -5.7053117752075195, -5.534075736999512, -5.362839698791504, -5.191603660583496, -5.020367622375488, -4.8491315841674805, -4.677895545959473, -4.506659507751465, -4.335423469543457, -4.164187431335449, -3.9929513931274414, -3.8217153549194336, -3.650479316711426, -3.479243278503418, -3.308006763458252, -3.136770725250244, -2.9655346870422363, -2.7942986488342285, -2.6230626106262207, -2.451826572418213, -2.280590534210205, -2.1093544960021973, -1.9381182193756104, -1.7668821811676025, -1.5956461429595947, -1.424410104751587, -1.253174066543579, -1.0819380283355713, -0.9107018709182739, -0.7394658327102661, -0.5682297945022583, -0.3969937562942505, -0.2257576882839203, -0.05452162027359009, 0.11671441793441772, 0.28795045614242554, 0.4591865539550781, 0.6304225921630859, 0.8016586303710938, 0.9728946685791016, 1.1441307067871094, 1.3153667449951172, 1.486602783203125, 1.6578388214111328, 1.8290749788284302, 2.0003108978271484, 2.1715469360351562, 2.342782974243164, 2.514019012451172, 2.6852550506591797, 2.8564910888671875, 3.0277271270751953, 3.198963165283203, 3.370199203491211, 3.541435480117798]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 4.0, 3.0, 8.0, 5.0, 7.0, 4.0, 9.0, 10.0, 18.0, 16.0, 15.0, 19.0, 26.0, 35.0, 47.0, 43.0, 43.0, 54.0, 43.0, 63.0, 36.0, 44.0, 43.0, 46.0, 37.0, 37.0, 38.0, 45.0, 34.0, 31.0, 25.0, 14.0, 27.0, 15.0, 12.0, 12.0, 10.0, 6.0, 5.0, 4.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.011470794677734, -3.9004287719726562, -3.7893869876861572, -3.678344964981079, -3.56730318069458, -3.456261157989502, -3.345219135284424, -3.2341771125793457, -3.1231353282928467, -3.0120933055877686, -2.9010515213012695, -2.7900094985961914, -2.6789674758911133, -2.5679256916046143, -2.456883668899536, -2.345841884613037, -2.234799861907959, -2.123757839202881, -2.012716054916382, -1.9016740322113037, -1.7906321287155151, -1.6795902252197266, -1.5685482025146484, -1.4575062990188599, -1.3464643955230713, -1.2354224920272827, -1.1243805885314941, -1.013338565826416, -0.9022966623306274, -0.7912547588348389, -0.6802127957344055, -0.5691708326339722, -0.4581291675567627, -0.34708723425865173, -0.23604530096054077, -0.1250033676624298, -0.013961434364318848, 0.09708046913146973, 0.20812243223190308, 0.3191643953323364, 0.430206298828125, 0.5412482023239136, 0.6522901654243469, 0.7633321285247803, 0.8743740320205688, 0.9854159355163574, 1.0964579582214355, 1.2074998617172241, 1.3185417652130127, 1.4295836687088013, 1.5406255722045898, 1.651667594909668, 1.7627094984054565, 1.8737514019012451, 1.9847934246063232, 2.0958352088928223, 2.2068772315979004, 2.3179192543029785, 2.4289610385894775, 2.5400030612945557, 2.6510448455810547, 2.762086868286133, 2.873128890991211, 2.984170913696289, 3.095212697982788]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 13.0, 6.0, 13.0, 39.0, 63.0, 101.0, 196.0, 384.0, 731.0, 1827.0, 5312.0, 24543.0, 286135.0, 3809320.0, 51449.0, 9171.0, 2628.0, 1067.0, 479.0, 275.0, 138.0, 110.0, 66.0, 49.0, 49.0, 23.0, 23.0, 17.0, 16.0, 9.0, 8.0, 6.0, 5.0, 1.0, 6.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.396484375, -1.333587646484375, -1.27069091796875, -1.207794189453125, -1.1448974609375, -1.082000732421875, -1.01910400390625, -0.956207275390625, -0.893310546875, -0.830413818359375, -0.76751708984375, -0.704620361328125, -0.6417236328125, -0.578826904296875, -0.51593017578125, -0.453033447265625, -0.39013671875, -0.327239990234375, -0.26434326171875, -0.201446533203125, -0.1385498046875, -0.075653076171875, -0.01275634765625, 0.050140380859375, 0.113037109375, 0.175933837890625, 0.23883056640625, 0.301727294921875, 0.3646240234375, 0.427520751953125, 0.49041748046875, 0.553314208984375, 0.6162109375, 0.679107666015625, 0.74200439453125, 0.804901123046875, 0.8677978515625, 0.930694580078125, 0.99359130859375, 1.056488037109375, 1.119384765625, 1.182281494140625, 1.24517822265625, 1.308074951171875, 1.3709716796875, 1.433868408203125, 1.49676513671875, 1.559661865234375, 1.62255859375, 1.685455322265625, 1.74835205078125, 1.811248779296875, 1.8741455078125, 1.937042236328125, 1.99993896484375, 2.062835693359375, 2.125732421875, 2.188629150390625, 2.25152587890625, 2.314422607421875, 2.3773193359375, 2.440216064453125, 2.50311279296875, 2.566009521484375, 2.62890625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 13.0, 12.0, 25.0, 48.0, 52.0, 68.0, 80.0, 95.0, 94.0, 86.0, 94.0, 78.0, 72.0, 51.0, 40.0, 32.0, 23.0, 13.0, 13.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.255615234375, -0.24350357055664062, -0.23139190673828125, -0.21928024291992188, -0.2071685791015625, -0.19505691528320312, -0.18294525146484375, -0.17083358764648438, -0.158721923828125, -0.14661026000976562, -0.13449859619140625, -0.12238693237304688, -0.1102752685546875, -0.09816360473632812, -0.08605194091796875, -0.07394027709960938, -0.06182861328125, -0.049716949462890625, -0.03760528564453125, -0.025493621826171875, -0.0133819580078125, -0.001270294189453125, 0.01084136962890625, 0.022953033447265625, 0.035064697265625, 0.047176361083984375, 0.05928802490234375, 0.07139968872070312, 0.0835113525390625, 0.09562301635742188, 0.10773468017578125, 0.11984634399414062, 0.1319580078125, 0.14406967163085938, 0.15618133544921875, 0.16829299926757812, 0.1804046630859375, 0.19251632690429688, 0.20462799072265625, 0.21673965454101562, 0.228851318359375, 0.24096298217773438, 0.25307464599609375, 0.2651863098144531, 0.2772979736328125, 0.2894096374511719, 0.30152130126953125, 0.3136329650878906, 0.32574462890625, 0.3378562927246094, 0.34996795654296875, 0.3620796203613281, 0.3741912841796875, 0.3863029479980469, 0.39841461181640625, 0.4105262756347656, 0.422637939453125, 0.4347496032714844, 0.44686126708984375, 0.4589729309082031, 0.4710845947265625, 0.4831962585449219, 0.49530792236328125, 0.5074195861816406, 0.51953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 5.0, 8.0, 12.0, 24.0, 31.0, 39.0, 40.0, 91.0, 141.0, 251.0, 625.0, 2122.0, 9936.0, 79346.0, 3905699.0, 175619.0, 15778.0, 2922.0, 803.0, 327.0, 171.0, 87.0, 77.0, 36.0, 29.0, 22.0, 7.0, 13.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.623046875, -2.5600433349609375, -2.497039794921875, -2.4340362548828125, -2.37103271484375, -2.3080291748046875, -2.245025634765625, -2.1820220947265625, -2.1190185546875, -2.0560150146484375, -1.993011474609375, -1.9300079345703125, -1.86700439453125, -1.8040008544921875, -1.740997314453125, -1.6779937744140625, -1.614990234375, -1.5519866943359375, -1.488983154296875, -1.4259796142578125, -1.36297607421875, -1.2999725341796875, -1.236968994140625, -1.1739654541015625, -1.1109619140625, -1.0479583740234375, -0.984954833984375, -0.9219512939453125, -0.85894775390625, -0.7959442138671875, -0.732940673828125, -0.6699371337890625, -0.60693359375, -0.5439300537109375, -0.480926513671875, -0.4179229736328125, -0.35491943359375, -0.2919158935546875, -0.228912353515625, -0.1659088134765625, -0.1029052734375, -0.0399017333984375, 0.023101806640625, 0.0861053466796875, 0.14910888671875, 0.2121124267578125, 0.275115966796875, 0.3381195068359375, 0.401123046875, 0.4641265869140625, 0.527130126953125, 0.5901336669921875, 0.65313720703125, 0.7161407470703125, 0.779144287109375, 0.8421478271484375, 0.9051513671875, 0.9681549072265625, 1.031158447265625, 1.0941619873046875, 1.15716552734375, 1.2201690673828125, 1.283172607421875, 1.3461761474609375, 1.4091796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 9.0, 3.0, 5.0, 17.0, 14.0, 21.0, 23.0, 46.0, 47.0, 94.0, 188.0, 381.0, 2179.0, 534.0, 205.0, 100.0, 59.0, 42.0, 31.0, 16.0, 13.0, 10.0, 5.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.461669921875, -0.4483299255371094, -0.43498992919921875, -0.4216499328613281, -0.4083099365234375, -0.3949699401855469, -0.38162994384765625, -0.3682899475097656, -0.354949951171875, -0.3416099548339844, -0.32826995849609375, -0.3149299621582031, -0.3015899658203125, -0.2882499694824219, -0.27490997314453125, -0.2615699768066406, -0.24822998046875, -0.23488998413085938, -0.22154998779296875, -0.20820999145507812, -0.1948699951171875, -0.18152999877929688, -0.16819000244140625, -0.15485000610351562, -0.141510009765625, -0.12817001342773438, -0.11483001708984375, -0.10149002075195312, -0.0881500244140625, -0.07481002807617188, -0.06147003173828125, -0.048130035400390625, -0.0347900390625, -0.021450042724609375, -0.00811004638671875, 0.005229949951171875, 0.0185699462890625, 0.031909942626953125, 0.04524993896484375, 0.058589935302734375, 0.071929931640625, 0.08526992797851562, 0.09860992431640625, 0.11194992065429688, 0.1252899169921875, 0.13862991333007812, 0.15196990966796875, 0.16530990600585938, 0.17864990234375, 0.19198989868164062, 0.20532989501953125, 0.21866989135742188, 0.2320098876953125, 0.24534988403320312, 0.25868988037109375, 0.2720298767089844, 0.285369873046875, 0.2987098693847656, 0.31204986572265625, 0.3253898620605469, 0.3387298583984375, 0.3520698547363281, 0.36540985107421875, 0.3787498474121094, 0.39208984375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 9.0, 25.0, 100.0, 291.0, 348.0, 154.0, 38.0, 13.0, 3.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.679964065551758, -7.4977874755859375, -7.315610885620117, -7.133434295654297, -6.951257705688477, -6.769081115722656, -6.586904525756836, -6.404727458953857, -6.222550868988037, -6.040374279022217, -5.8581976890563965, -5.676021099090576, -5.493844509124756, -5.311667442321777, -5.129490852355957, -4.947314262390137, -4.765137672424316, -4.582961082458496, -4.400784492492676, -4.2186079025268555, -4.036431312561035, -3.8542544841766357, -3.6720778942108154, -3.489901065826416, -3.307724952697754, -3.1255483627319336, -2.9433717727661133, -2.761195182800293, -2.5790183544158936, -2.3968417644500732, -2.214665174484253, -2.0324883460998535, -1.8503117561340332, -1.668135166168213, -1.485958456993103, -1.3037818670272827, -1.1216051578521729, -0.9394285678863525, -0.7572519779205322, -0.5750752687454224, -0.39289867877960205, -0.21072204411029816, -0.028545409440994263, 0.15363121032714844, 0.3358078598976135, 0.5179845094680786, 0.7001610994338989, 0.8823378086090088, 1.064514398574829, 1.2466909885406494, 1.4288676977157593, 1.6110442876815796, 1.7932209968566895, 1.9753975868225098, 2.15757417678833, 2.3397507667541504, 2.5219273567199707, 2.704103946685791, 2.8862805366516113, 3.0684571266174316, 3.250633955001831, 3.4328105449676514, 3.6149871349334717, 3.797163963317871, 3.9793405532836914]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 9.0, 2.0, 1.0, 12.0, 7.0, 11.0, 11.0, 14.0, 19.0, 19.0, 27.0, 25.0, 39.0, 29.0, 38.0, 37.0, 41.0, 50.0, 57.0, 58.0, 49.0, 40.0, 38.0, 43.0, 37.0, 34.0, 31.0, 21.0, 18.0, 39.0, 27.0, 26.0, 14.0, 12.0, 14.0, 7.0, 8.0, 6.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.9652738571166992, -0.9320940971374512, -0.8989143371582031, -0.8657345771789551, -0.832554817199707, -0.799375057220459, -0.7661952376365662, -0.7330154776573181, -0.6998357176780701, -0.666655957698822, -0.633476197719574, -0.6002964377403259, -0.5671166181564331, -0.5339368581771851, -0.500757098197937, -0.46757733821868896, -0.4343975782394409, -0.40121781826019287, -0.3680380582809448, -0.3348582684993744, -0.30167850852012634, -0.2684987485408783, -0.23531897366046906, -0.20213919878005981, -0.16895943880081177, -0.13577967882156372, -0.10259990394115448, -0.06942013651132584, -0.03624036908149719, -0.0030606091022491455, 0.030119165778160095, 0.06329894065856934, 0.09647881984710693, 0.12965857982635498, 0.16283835470676422, 0.19601812958717346, 0.2291978895664215, 0.26237764954566956, 0.29555743932724, 0.32873719930648804, 0.3619169592857361, 0.39509671926498413, 0.4282764792442322, 0.4614562690258026, 0.49463602900505066, 0.5278158187866211, 0.5609955787658691, 0.5941753387451172, 0.6273550987243652, 0.6605348587036133, 0.6937146186828613, 0.7268943786621094, 0.7600741386413574, 0.7932538986206055, 0.8264337182044983, 0.8596134781837463, 0.8927932381629944, 0.9259729981422424, 0.9591527581214905, 0.9923325181007385, 1.0255123376846313, 1.0586920976638794, 1.0918718576431274, 1.1250516176223755, 1.1582313776016235]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 13.0, 26.0, 31.0, 39.0, 56.0, 70.0, 136.0, 229.0, 457.0, 922.0, 2628.0, 10068.0, 55531.0, 366282.0, 505056.0, 86754.0, 14443.0, 3468.0, 1138.0, 500.0, 248.0, 163.0, 109.0, 61.0, 35.0, 23.0, 16.0, 16.0, 9.0, 6.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7939453125, -1.74285888671875, -1.6917724609375, -1.64068603515625, -1.589599609375, -1.53851318359375, -1.4874267578125, -1.43634033203125, -1.38525390625, -1.33416748046875, -1.2830810546875, -1.23199462890625, -1.180908203125, -1.12982177734375, -1.0787353515625, -1.02764892578125, -0.9765625, -0.92547607421875, -0.8743896484375, -0.82330322265625, -0.772216796875, -0.72113037109375, -0.6700439453125, -0.61895751953125, -0.56787109375, -0.51678466796875, -0.4656982421875, -0.41461181640625, -0.363525390625, -0.31243896484375, -0.2613525390625, -0.21026611328125, -0.1591796875, -0.10809326171875, -0.0570068359375, -0.00592041015625, 0.045166015625, 0.09625244140625, 0.1473388671875, 0.19842529296875, 0.24951171875, 0.30059814453125, 0.3516845703125, 0.40277099609375, 0.453857421875, 0.50494384765625, 0.5560302734375, 0.60711669921875, 0.658203125, 0.70928955078125, 0.7603759765625, 0.81146240234375, 0.862548828125, 0.91363525390625, 0.9647216796875, 1.01580810546875, 1.06689453125, 1.11798095703125, 1.1690673828125, 1.22015380859375, 1.271240234375, 1.32232666015625, 1.3734130859375, 1.42449951171875, 1.4755859375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 4.0, 11.0, 18.0, 20.0, 27.0, 42.0, 71.0, 69.0, 83.0, 80.0, 82.0, 102.0, 88.0, 66.0, 51.0, 50.0, 49.0, 28.0, 21.0, 16.0, 15.0, 5.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2425537109375, -0.23035621643066406, -0.21815872192382812, -0.2059612274169922, -0.19376373291015625, -0.1815662384033203, -0.16936874389648438, -0.15717124938964844, -0.1449737548828125, -0.13277626037597656, -0.12057876586914062, -0.10838127136230469, -0.09618377685546875, -0.08398628234863281, -0.07178878784179688, -0.05959129333496094, -0.047393798828125, -0.03519630432128906, -0.022998809814453125, -0.010801315307617188, 0.00139617919921875, 0.013593673706054688, 0.025791168212890625, 0.03798866271972656, 0.0501861572265625, 0.06238365173339844, 0.07458114624023438, 0.08677864074707031, 0.09897613525390625, 0.11117362976074219, 0.12337112426757812, 0.13556861877441406, 0.14776611328125, 0.15996360778808594, 0.17216110229492188, 0.1843585968017578, 0.19655609130859375, 0.2087535858154297, 0.22095108032226562, 0.23314857482910156, 0.2453460693359375, 0.25754356384277344, 0.2697410583496094, 0.2819385528564453, 0.29413604736328125, 0.3063335418701172, 0.3185310363769531, 0.33072853088378906, 0.342926025390625, 0.35512351989746094, 0.3673210144042969, 0.3795185089111328, 0.39171600341796875, 0.4039134979248047, 0.4161109924316406, 0.42830848693847656, 0.4405059814453125, 0.45270347595214844, 0.4649009704589844, 0.4770984649658203, 0.48929595947265625, 0.5014934539794922, 0.5136909484863281, 0.5258884429931641, 0.5380859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 7.0, 5.0, 11.0, 20.0, 19.0, 50.0, 59.0, 58.0, 114.0, 139.0, 231.0, 368.0, 624.0, 1043.0, 2085.0, 4271.0, 10501.0, 27113.0, 76137.0, 203748.0, 355504.0, 227574.0, 86225.0, 30853.0, 11790.0, 4867.0, 2253.0, 1129.0, 619.0, 383.0, 222.0, 170.0, 120.0, 83.0, 45.0, 30.0, 18.0, 17.0, 19.0, 15.0, 8.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6474609375, -0.6269454956054688, -0.6064300537109375, -0.5859146118164062, -0.565399169921875, -0.5448837280273438, -0.5243682861328125, -0.5038528442382812, -0.48333740234375, -0.46282196044921875, -0.4423065185546875, -0.42179107666015625, -0.401275634765625, -0.38076019287109375, -0.3602447509765625, -0.33972930908203125, -0.3192138671875, -0.29869842529296875, -0.2781829833984375, -0.25766754150390625, -0.237152099609375, -0.21663665771484375, -0.1961212158203125, -0.17560577392578125, -0.15509033203125, -0.13457489013671875, -0.1140594482421875, -0.09354400634765625, -0.073028564453125, -0.05251312255859375, -0.0319976806640625, -0.01148223876953125, 0.009033203125, 0.02954864501953125, 0.0500640869140625, 0.07057952880859375, 0.091094970703125, 0.11161041259765625, 0.1321258544921875, 0.15264129638671875, 0.17315673828125, 0.19367218017578125, 0.2141876220703125, 0.23470306396484375, 0.255218505859375, 0.27573394775390625, 0.2962493896484375, 0.31676483154296875, 0.3372802734375, 0.35779571533203125, 0.3783111572265625, 0.39882659912109375, 0.419342041015625, 0.43985748291015625, 0.4603729248046875, 0.48088836669921875, 0.50140380859375, 0.5219192504882812, 0.5424346923828125, 0.5629501342773438, 0.583465576171875, 0.6039810180664062, 0.6244964599609375, 0.6450119018554688, 0.66552734375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 6.0, 3.0, 2.0, 6.0, 10.0, 9.0, 9.0, 16.0, 19.0, 14.0, 22.0, 28.0, 28.0, 37.0, 34.0, 38.0, 41.0, 35.0, 53.0, 41.0, 53.0, 50.0, 37.0, 44.0, 31.0, 52.0, 39.0, 33.0, 29.0, 32.0, 32.0, 24.0, 19.0, 14.0, 9.0, 14.0, 6.0, 6.0, 5.0, 10.0, 6.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.0204391479492188, -0.9900970458984375, -0.9597549438476562, -0.929412841796875, -0.8990707397460938, -0.8687286376953125, -0.8383865356445312, -0.80804443359375, -0.7777023315429688, -0.7473602294921875, -0.7170181274414062, -0.686676025390625, -0.6563339233398438, -0.6259918212890625, -0.5956497192382812, -0.5653076171875, -0.5349655151367188, -0.5046234130859375, -0.47428131103515625, -0.443939208984375, -0.41359710693359375, -0.3832550048828125, -0.35291290283203125, -0.32257080078125, -0.29222869873046875, -0.2618865966796875, -0.23154449462890625, -0.201202392578125, -0.17086029052734375, -0.1405181884765625, -0.11017608642578125, -0.079833984375, -0.04949188232421875, -0.0191497802734375, 0.01119232177734375, 0.041534423828125, 0.07187652587890625, 0.1022186279296875, 0.13256072998046875, 0.16290283203125, 0.19324493408203125, 0.2235870361328125, 0.25392913818359375, 0.284271240234375, 0.31461334228515625, 0.3449554443359375, 0.37529754638671875, 0.4056396484375, 0.43598175048828125, 0.4663238525390625, 0.49666595458984375, 0.527008056640625, 0.5573501586914062, 0.5876922607421875, 0.6180343627929688, 0.64837646484375, 0.6787185668945312, 0.7090606689453125, 0.7394027709960938, 0.769744873046875, 0.8000869750976562, 0.8304290771484375, 0.8607711791992188, 0.89111328125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 11.0, 11.0, 13.0, 35.0, 79.0, 113.0, 231.0, 521.0, 1242.0, 4732.0, 31110.0, 359428.0, 579385.0, 61319.0, 7338.0, 1726.0, 638.0, 307.0, 149.0, 68.0, 50.0, 19.0, 13.0, 9.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.626190185546875, -0.60784912109375, -0.589508056640625, -0.5711669921875, -0.552825927734375, -0.53448486328125, -0.516143798828125, -0.497802734375, -0.479461669921875, -0.46112060546875, -0.442779541015625, -0.4244384765625, -0.406097412109375, -0.38775634765625, -0.369415283203125, -0.35107421875, -0.332733154296875, -0.31439208984375, -0.296051025390625, -0.2777099609375, -0.259368896484375, -0.24102783203125, -0.222686767578125, -0.204345703125, -0.186004638671875, -0.16766357421875, -0.149322509765625, -0.1309814453125, -0.112640380859375, -0.09429931640625, -0.075958251953125, -0.0576171875, -0.039276123046875, -0.02093505859375, -0.002593994140625, 0.0157470703125, 0.034088134765625, 0.05242919921875, 0.070770263671875, 0.089111328125, 0.107452392578125, 0.12579345703125, 0.144134521484375, 0.1624755859375, 0.180816650390625, 0.19915771484375, 0.217498779296875, 0.23583984375, 0.254180908203125, 0.27252197265625, 0.290863037109375, 0.3092041015625, 0.327545166015625, 0.34588623046875, 0.364227294921875, 0.382568359375, 0.400909423828125, 0.41925048828125, 0.437591552734375, 0.4559326171875, 0.474273681640625, 0.49261474609375, 0.510955810546875, 0.529296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 17.0, 15.0, 14.0, 19.0, 20.0, 30.0, 35.0, 40.0, 53.0, 57.0, 41.0, 73.0, 65.0, 73.0, 50.0, 70.0, 56.0, 39.0, 46.0, 21.0, 23.0, 19.0, 20.0, 19.0, 7.0, 6.0, 9.0, 7.0, 7.0, 5.0, 7.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.079673767089844e-05, -5.902908742427826e-05, -5.726143717765808e-05, -5.54937869310379e-05, -5.3726136684417725e-05, -5.1958486437797546e-05, -5.019083619117737e-05, -4.842318594455719e-05, -4.665553569793701e-05, -4.4887885451316833e-05, -4.3120235204696655e-05, -4.135258495807648e-05, -3.95849347114563e-05, -3.781728446483612e-05, -3.604963421821594e-05, -3.4281983971595764e-05, -3.2514333724975586e-05, -3.074668347835541e-05, -2.897903323173523e-05, -2.721138298511505e-05, -2.5443732738494873e-05, -2.3676082491874695e-05, -2.1908432245254517e-05, -2.014078199863434e-05, -1.837313175201416e-05, -1.6605481505393982e-05, -1.4837831258773804e-05, -1.3070181012153625e-05, -1.1302530765533447e-05, -9.534880518913269e-06, -7.76723027229309e-06, -5.999580025672913e-06, -4.231929779052734e-06, -2.464279532432556e-06, -6.966292858123779e-07, 1.0710209608078003e-06, 2.8386712074279785e-06, 4.606321454048157e-06, 6.373971700668335e-06, 8.141621947288513e-06, 9.909272193908691e-06, 1.167692244052887e-05, 1.3444572687149048e-05, 1.5212222933769226e-05, 1.6979873180389404e-05, 1.8747523427009583e-05, 2.051517367362976e-05, 2.228282392024994e-05, 2.4050474166870117e-05, 2.5818124413490295e-05, 2.7585774660110474e-05, 2.9353424906730652e-05, 3.112107515335083e-05, 3.288872539997101e-05, 3.4656375646591187e-05, 3.6424025893211365e-05, 3.819167613983154e-05, 3.995932638645172e-05, 4.17269766330719e-05, 4.349462687969208e-05, 4.5262277126312256e-05, 4.7029927372932434e-05, 4.879757761955261e-05, 5.056522786617279e-05, 5.233287811279297e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 8.0, 13.0, 25.0, 33.0, 66.0, 110.0, 242.0, 428.0, 1153.0, 3507.0, 14737.0, 85230.0, 428693.0, 414948.0, 80004.0, 13810.0, 3457.0, 1117.0, 423.0, 229.0, 121.0, 79.0, 52.0, 21.0, 10.0, 18.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.56005859375, -0.5456924438476562, -0.5313262939453125, -0.5169601440429688, -0.502593994140625, -0.48822784423828125, -0.4738616943359375, -0.45949554443359375, -0.44512939453125, -0.43076324462890625, -0.4163970947265625, -0.40203094482421875, -0.387664794921875, -0.37329864501953125, -0.3589324951171875, -0.34456634521484375, -0.3302001953125, -0.31583404541015625, -0.3014678955078125, -0.28710174560546875, -0.272735595703125, -0.25836944580078125, -0.2440032958984375, -0.22963714599609375, -0.21527099609375, -0.20090484619140625, -0.1865386962890625, -0.17217254638671875, -0.157806396484375, -0.14344024658203125, -0.1290740966796875, -0.11470794677734375, -0.100341796875, -0.08597564697265625, -0.0716094970703125, -0.05724334716796875, -0.042877197265625, -0.02851104736328125, -0.0141448974609375, 0.00022125244140625, 0.01458740234375, 0.02895355224609375, 0.0433197021484375, 0.05768585205078125, 0.072052001953125, 0.08641815185546875, 0.1007843017578125, 0.11515045166015625, 0.1295166015625, 0.14388275146484375, 0.1582489013671875, 0.17261505126953125, 0.186981201171875, 0.20134735107421875, 0.2157135009765625, 0.23007965087890625, 0.24444580078125, 0.25881195068359375, 0.2731781005859375, 0.28754425048828125, 0.301910400390625, 0.31627655029296875, 0.3306427001953125, 0.34500885009765625, 0.359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 8.0, 3.0, 11.0, 13.0, 14.0, 23.0, 22.0, 26.0, 32.0, 43.0, 42.0, 69.0, 68.0, 62.0, 64.0, 69.0, 65.0, 59.0, 50.0, 47.0, 34.0, 44.0, 30.0, 21.0, 13.0, 18.0, 18.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.342529296875, -0.3314857482910156, -0.32044219970703125, -0.3093986511230469, -0.2983551025390625, -0.2873115539550781, -0.27626800537109375, -0.2652244567871094, -0.254180908203125, -0.24313735961914062, -0.23209381103515625, -0.22105026245117188, -0.2100067138671875, -0.19896316528320312, -0.18791961669921875, -0.17687606811523438, -0.16583251953125, -0.15478897094726562, -0.14374542236328125, -0.13270187377929688, -0.1216583251953125, -0.11061477661132812, -0.09957122802734375, -0.08852767944335938, -0.077484130859375, -0.06644058227539062, -0.05539703369140625, -0.044353485107421875, -0.0333099365234375, -0.022266387939453125, -0.01122283935546875, -0.000179290771484375, 0.0108642578125, 0.021907806396484375, 0.03295135498046875, 0.043994903564453125, 0.0550384521484375, 0.06608200073242188, 0.07712554931640625, 0.08816909790039062, 0.099212646484375, 0.11025619506835938, 0.12129974365234375, 0.13234329223632812, 0.1433868408203125, 0.15443038940429688, 0.16547393798828125, 0.17651748657226562, 0.18756103515625, 0.19860458374023438, 0.20964813232421875, 0.22069168090820312, 0.2317352294921875, 0.24277877807617188, 0.25382232666015625, 0.2648658752441406, 0.275909423828125, 0.2869529724121094, 0.29799652099609375, 0.3090400695800781, 0.3200836181640625, 0.3311271667480469, 0.34217071533203125, 0.3532142639160156, 0.3642578125]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 4.0, 12.0, 9.0, 18.0, 21.0, 37.0, 54.0, 70.0, 114.0, 119.0, 140.0, 125.0, 84.0, 69.0, 45.0, 22.0, 25.0, 9.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.03009033203125, -9.813689231872559, -9.597288131713867, -9.380887031555176, -9.164485931396484, -8.948084831237793, -8.731683731079102, -8.515283584594727, -8.298882484436035, -8.082481384277344, -7.866080284118652, -7.649679183959961, -7.433278560638428, -7.216877460479736, -7.000476360321045, -6.7840752601623535, -6.567673683166504, -6.3512725830078125, -6.134871482849121, -5.91847038269043, -5.7020697593688965, -5.485668659210205, -5.269267559051514, -5.052866458892822, -4.836465835571289, -4.620064735412598, -4.403663635253906, -4.187262535095215, -3.9708616733551025, -3.7544608116149902, -3.538059711456299, -3.3216586112976074, -3.105257272720337, -2.8888561725616455, -2.672455310821533, -2.456054210662842, -2.2396531105041504, -2.023252010345459, -1.8068511486053467, -1.5904500484466553, -1.3740490674972534, -1.1576480865478516, -0.9412469863891602, -0.7248460054397583, -0.5084449648857117, -0.29204392433166504, -0.07564294338226318, 0.14075815677642822, 0.3571591377258301, 0.5735601782798767, 0.7899612188339233, 1.0063621997833252, 1.2227632999420166, 1.4391642808914185, 1.6555652618408203, 1.8719663619995117, 2.088367462158203, 2.3047685623168945, 2.521169424057007, 2.7375705242156982, 2.9539716243743896, 3.170372486114502, 3.3867735862731934, 3.6031746864318848, 3.819575548171997]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 9.0, 13.0, 10.0, 9.0, 17.0, 22.0, 10.0, 26.0, 35.0, 28.0, 21.0, 28.0, 38.0, 35.0, 40.0, 34.0, 39.0, 50.0, 34.0, 37.0, 43.0, 39.0, 37.0, 38.0, 31.0, 31.0, 34.0, 29.0, 30.0, 19.0, 29.0, 13.0, 17.0, 15.0, 8.0, 12.0, 6.0, 12.0, 8.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.842136383056641, -4.691004753112793, -4.5398736000061035, -4.388741970062256, -4.237610816955566, -4.086479187011719, -3.935347557067871, -3.7842161655426025, -3.633084774017334, -3.4819533824920654, -3.330821990966797, -3.179690361022949, -3.0285589694976807, -2.877427577972412, -2.7262959480285645, -2.575164556503296, -2.4240331649780273, -2.272901773452759, -2.1217703819274902, -1.9706387519836426, -1.819507360458374, -1.6683759689331055, -1.5172444581985474, -1.3661129474639893, -1.2149815559387207, -1.0638501644134521, -0.912718653678894, -0.7615872025489807, -0.6104557514190674, -0.45932430028915405, -0.3081928491592407, -0.15706133842468262, -0.0059299468994140625, 0.14520150423049927, 0.2963329553604126, 0.4474644064903259, 0.5985958576202393, 0.7497273087501526, 0.9008587598800659, 1.051990270614624, 1.2031216621398926, 1.3542530536651611, 1.5053845643997192, 1.6565160751342773, 1.807647466659546, 1.9587788581848145, 2.109910488128662, 2.2610418796539307, 2.412173271179199, 2.5633046627044678, 2.7144360542297363, 2.865567684173584, 3.0166990756988525, 3.167830467224121, 3.3189620971679688, 3.4700934886932373, 3.621224880218506, 3.7723562717437744, 3.923487663269043, 4.074619293212891, 4.225750923156738, 4.376882076263428, 4.528013706207275, 4.679144859313965, 4.8302764892578125]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 8.0, 6.0, 7.0, 15.0, 16.0, 33.0, 82.0, 126.0, 293.0, 626.0, 1538.0, 4097.0, 14983.0, 91163.0, 3857692.0, 191567.0, 22471.0, 5678.0, 1926.0, 802.0, 440.0, 230.0, 138.0, 98.0, 68.0, 44.0, 35.0, 19.0, 26.0, 19.0, 9.0, 9.0, 8.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.8408203125, -1.7807464599609375, -1.720672607421875, -1.6605987548828125, -1.60052490234375, -1.5404510498046875, -1.480377197265625, -1.4203033447265625, -1.3602294921875, -1.3001556396484375, -1.240081787109375, -1.1800079345703125, -1.11993408203125, -1.0598602294921875, -0.999786376953125, -0.9397125244140625, -0.879638671875, -0.8195648193359375, -0.759490966796875, -0.6994171142578125, -0.63934326171875, -0.5792694091796875, -0.519195556640625, -0.4591217041015625, -0.3990478515625, -0.3389739990234375, -0.278900146484375, -0.2188262939453125, -0.15875244140625, -0.0986785888671875, -0.038604736328125, 0.0214691162109375, 0.08154296875, 0.1416168212890625, 0.201690673828125, 0.2617645263671875, 0.32183837890625, 0.3819122314453125, 0.441986083984375, 0.5020599365234375, 0.5621337890625, 0.6222076416015625, 0.682281494140625, 0.7423553466796875, 0.80242919921875, 0.8625030517578125, 0.922576904296875, 0.9826507568359375, 1.042724609375, 1.1027984619140625, 1.162872314453125, 1.2229461669921875, 1.28302001953125, 1.3430938720703125, 1.403167724609375, 1.4632415771484375, 1.5233154296875, 1.5833892822265625, 1.643463134765625, 1.7035369873046875, 1.76361083984375, 1.8236846923828125, 1.883758544921875, 1.9438323974609375, 2.00390625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 8.0, 8.0, 11.0, 14.0, 6.0, 18.0, 40.0, 39.0, 54.0, 63.0, 68.0, 71.0, 73.0, 63.0, 81.0, 71.0, 76.0, 54.0, 41.0, 39.0, 36.0, 27.0, 10.0, 12.0, 9.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26220703125, -0.2499847412109375, -0.237762451171875, -0.2255401611328125, -0.21331787109375, -0.2010955810546875, -0.188873291015625, -0.1766510009765625, -0.1644287109375, -0.1522064208984375, -0.139984130859375, -0.1277618408203125, -0.11553955078125, -0.1033172607421875, -0.091094970703125, -0.0788726806640625, -0.066650390625, -0.0544281005859375, -0.042205810546875, -0.0299835205078125, -0.01776123046875, -0.0055389404296875, 0.006683349609375, 0.0189056396484375, 0.0311279296875, 0.0433502197265625, 0.055572509765625, 0.0677947998046875, 0.08001708984375, 0.0922393798828125, 0.104461669921875, 0.1166839599609375, 0.12890625, 0.1411285400390625, 0.153350830078125, 0.1655731201171875, 0.17779541015625, 0.1900177001953125, 0.202239990234375, 0.2144622802734375, 0.2266845703125, 0.2389068603515625, 0.251129150390625, 0.2633514404296875, 0.27557373046875, 0.2877960205078125, 0.300018310546875, 0.3122406005859375, 0.324462890625, 0.3366851806640625, 0.348907470703125, 0.3611297607421875, 0.37335205078125, 0.3855743408203125, 0.397796630859375, 0.4100189208984375, 0.4222412109375, 0.4344635009765625, 0.446685791015625, 0.4589080810546875, 0.47113037109375, 0.4833526611328125, 0.495574951171875, 0.5077972412109375, 0.52001953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 6.0, 4.0, 12.0, 14.0, 14.0, 27.0, 43.0, 57.0, 84.0, 102.0, 148.0, 215.0, 304.0, 480.0, 833.0, 1623.0, 3656.0, 9095.0, 27929.0, 128337.0, 3483539.0, 456639.0, 54235.0, 15641.0, 5754.0, 2463.0, 1135.0, 637.0, 419.0, 244.0, 162.0, 135.0, 80.0, 65.0, 47.0, 25.0, 22.0, 20.0, 16.0, 6.0, 3.0, 4.0, 2.0, 4.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.3486328125, -1.3119354248046875, -1.275238037109375, -1.2385406494140625, -1.20184326171875, -1.1651458740234375, -1.128448486328125, -1.0917510986328125, -1.0550537109375, -1.0183563232421875, -0.981658935546875, -0.9449615478515625, -0.90826416015625, -0.8715667724609375, -0.834869384765625, -0.7981719970703125, -0.761474609375, -0.7247772216796875, -0.688079833984375, -0.6513824462890625, -0.61468505859375, -0.5779876708984375, -0.541290283203125, -0.5045928955078125, -0.4678955078125, -0.4311981201171875, -0.394500732421875, -0.3578033447265625, -0.32110595703125, -0.2844085693359375, -0.247711181640625, -0.2110137939453125, -0.17431640625, -0.1376190185546875, -0.100921630859375, -0.0642242431640625, -0.02752685546875, 0.0091705322265625, 0.045867919921875, 0.0825653076171875, 0.1192626953125, 0.1559600830078125, 0.192657470703125, 0.2293548583984375, 0.26605224609375, 0.3027496337890625, 0.339447021484375, 0.3761444091796875, 0.412841796875, 0.4495391845703125, 0.486236572265625, 0.5229339599609375, 0.55963134765625, 0.5963287353515625, 0.633026123046875, 0.6697235107421875, 0.7064208984375, 0.7431182861328125, 0.779815673828125, 0.8165130615234375, 0.85321044921875, 0.8899078369140625, 0.926605224609375, 0.9633026123046875, 1.0]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 13.0, 17.0, 35.0, 65.0, 110.0, 425.0, 2666.0, 473.0, 127.0, 51.0, 26.0, 22.0, 10.0, 6.0, 11.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7392578125, -0.7064208984375, -0.673583984375, -0.6407470703125, -0.60791015625, -0.5750732421875, -0.542236328125, -0.5093994140625, -0.4765625, -0.4437255859375, -0.410888671875, -0.3780517578125, -0.34521484375, -0.3123779296875, -0.279541015625, -0.2467041015625, -0.2138671875, -0.1810302734375, -0.148193359375, -0.1153564453125, -0.08251953125, -0.0496826171875, -0.016845703125, 0.0159912109375, 0.048828125, 0.0816650390625, 0.114501953125, 0.1473388671875, 0.18017578125, 0.2130126953125, 0.245849609375, 0.2786865234375, 0.3115234375, 0.3443603515625, 0.377197265625, 0.4100341796875, 0.44287109375, 0.4757080078125, 0.508544921875, 0.5413818359375, 0.57421875, 0.6070556640625, 0.639892578125, 0.6727294921875, 0.70556640625, 0.7384033203125, 0.771240234375, 0.8040771484375, 0.8369140625, 0.8697509765625, 0.902587890625, 0.9354248046875, 0.96826171875, 1.0010986328125, 1.033935546875, 1.0667724609375, 1.099609375, 1.1324462890625, 1.165283203125, 1.1981201171875, 1.23095703125, 1.2637939453125, 1.296630859375, 1.3294677734375, 1.3623046875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 6.0, 4.0, 4.0, 22.0, 42.0, 131.0, 204.0, 236.0, 174.0, 90.0, 51.0, 12.0, 8.0, 1.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.640812397003174, -5.475379943847656, -5.309947490692139, -5.144515037536621, -4.979082107543945, -4.813649654388428, -4.64821720123291, -4.482784748077393, -4.317352294921875, -4.151919841766357, -3.98648738861084, -3.821054697036743, -3.6556222438812256, -3.490189790725708, -3.3247570991516113, -3.1593246459960938, -2.993892192840576, -2.8284597396850586, -2.663027286529541, -2.4975945949554443, -2.3321621417999268, -2.166729688644409, -2.0012969970703125, -1.835864543914795, -1.6704320907592773, -1.5049996376037598, -1.3395670652389526, -1.1741344928741455, -1.008702039718628, -0.8432695269584656, -0.6778370141983032, -0.5124044418334961, -0.3469715118408203, -0.18153899908065796, -0.016106486320495605, 0.14932602643966675, 0.3147585391998291, 0.48019105195999146, 0.6456235647201538, 0.8110561370849609, 0.9764885902404785, 1.141921043395996, 1.3073536157608032, 1.4727861881256104, 1.638218641281128, 1.8036510944366455, 1.9690836668014526, 2.1345162391662598, 2.2999486923217773, 2.465381145477295, 2.6308135986328125, 2.796246290206909, 2.9616787433624268, 3.1271111965179443, 3.292543888092041, 3.4579763412475586, 3.623408794403076, 3.7888412475585938, 3.9542737007141113, 4.119706153869629, 4.285139083862305, 4.450571537017822, 4.61600399017334, 4.781436443328857, 4.946868896484375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 4.0, 2.0, 6.0, 6.0, 8.0, 12.0, 14.0, 19.0, 21.0, 22.0, 21.0, 32.0, 30.0, 31.0, 45.0, 35.0, 37.0, 53.0, 52.0, 50.0, 40.0, 34.0, 47.0, 45.0, 32.0, 46.0, 45.0, 38.0, 27.0, 28.0, 8.0, 13.0, 16.0, 19.0, 14.0, 10.0, 19.0, 6.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.945880651473999, -1.8837227821350098, -1.8215649127960205, -1.7594070434570312, -1.697249174118042, -1.6350913047790527, -1.5729334354400635, -1.5107754468917847, -1.4486175775527954, -1.3864597082138062, -1.324301838874817, -1.2621439695358276, -1.1999861001968384, -1.1378281116485596, -1.0756702423095703, -1.013512372970581, -0.9513545632362366, -0.8891966938972473, -0.8270388245582581, -0.764880895614624, -0.7027230262756348, -0.6405651569366455, -0.5784072875976562, -0.516249418258667, -0.45409151911735535, -0.3919336497783661, -0.32977575063705444, -0.2676178812980652, -0.20545999705791473, -0.14330211281776428, -0.08114424347877502, -0.01898634433746338, 0.04317152500152588, 0.10532940924167633, 0.16748729348182678, 0.22964516282081604, 0.2918030619621277, 0.35396093130111694, 0.4161188006401062, 0.47827669978141785, 0.5404345989227295, 0.6025924682617188, 0.664750337600708, 0.7269082069396973, 0.7890661358833313, 0.8512240052223206, 0.9133818745613098, 0.9755398035049438, 1.0376975536346436, 1.0998554229736328, 1.162013292312622, 1.2241711616516113, 1.2863290309906006, 1.3484869003295898, 1.410644769668579, 1.472802758216858, 1.5349606275558472, 1.5971184968948364, 1.6592763662338257, 1.721434235572815, 1.7835921049118042, 1.845750093460083, 1.9079079627990723, 1.9700658321380615, 2.032223701477051]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 2.0, 6.0, 6.0, 10.0, 6.0, 17.0, 14.0, 30.0, 44.0, 51.0, 90.0, 124.0, 211.0, 338.0, 650.0, 1336.0, 3216.0, 9036.0, 30256.0, 117819.0, 390587.0, 354929.0, 99997.0, 25977.0, 8103.0, 2935.0, 1288.0, 611.0, 327.0, 179.0, 122.0, 77.0, 50.0, 37.0, 22.0, 16.0, 11.0, 11.0, 4.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.345703125, -1.3035736083984375, -1.261444091796875, -1.2193145751953125, -1.17718505859375, -1.1350555419921875, -1.092926025390625, -1.0507965087890625, -1.0086669921875, -0.9665374755859375, -0.924407958984375, -0.8822784423828125, -0.84014892578125, -0.7980194091796875, -0.755889892578125, -0.7137603759765625, -0.671630859375, -0.6295013427734375, -0.587371826171875, -0.5452423095703125, -0.50311279296875, -0.4609832763671875, -0.418853759765625, -0.3767242431640625, -0.3345947265625, -0.2924652099609375, -0.250335693359375, -0.2082061767578125, -0.16607666015625, -0.1239471435546875, -0.081817626953125, -0.0396881103515625, 0.00244140625, 0.0445709228515625, 0.086700439453125, 0.1288299560546875, 0.17095947265625, 0.2130889892578125, 0.255218505859375, 0.2973480224609375, 0.3394775390625, 0.3816070556640625, 0.423736572265625, 0.4658660888671875, 0.50799560546875, 0.5501251220703125, 0.592254638671875, 0.6343841552734375, 0.676513671875, 0.7186431884765625, 0.760772705078125, 0.8029022216796875, 0.84503173828125, 0.8871612548828125, 0.929290771484375, 0.9714202880859375, 1.0135498046875, 1.0556793212890625, 1.097808837890625, 1.1399383544921875, 1.18206787109375, 1.2241973876953125, 1.266326904296875, 1.3084564208984375, 1.3505859375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 3.0, 4.0, 6.0, 9.0, 10.0, 11.0, 12.0, 21.0, 16.0, 28.0, 32.0, 50.0, 55.0, 67.0, 62.0, 62.0, 85.0, 73.0, 54.0, 62.0, 54.0, 52.0, 35.0, 41.0, 19.0, 25.0, 18.0, 9.0, 10.0, 10.0, 11.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2431640625, -0.2308502197265625, -0.218536376953125, -0.2062225341796875, -0.19390869140625, -0.1815948486328125, -0.169281005859375, -0.1569671630859375, -0.1446533203125, -0.1323394775390625, -0.120025634765625, -0.1077117919921875, -0.09539794921875, -0.0830841064453125, -0.070770263671875, -0.0584564208984375, -0.046142578125, -0.0338287353515625, -0.021514892578125, -0.0092010498046875, 0.00311279296875, 0.0154266357421875, 0.027740478515625, 0.0400543212890625, 0.0523681640625, 0.0646820068359375, 0.076995849609375, 0.0893096923828125, 0.10162353515625, 0.1139373779296875, 0.126251220703125, 0.1385650634765625, 0.15087890625, 0.1631927490234375, 0.175506591796875, 0.1878204345703125, 0.20013427734375, 0.2124481201171875, 0.224761962890625, 0.2370758056640625, 0.2493896484375, 0.2617034912109375, 0.274017333984375, 0.2863311767578125, 0.29864501953125, 0.3109588623046875, 0.323272705078125, 0.3355865478515625, 0.347900390625, 0.3602142333984375, 0.372528076171875, 0.3848419189453125, 0.39715576171875, 0.4094696044921875, 0.421783447265625, 0.4340972900390625, 0.4464111328125, 0.4587249755859375, 0.471038818359375, 0.4833526611328125, 0.49566650390625, 0.5079803466796875, 0.520294189453125, 0.5326080322265625, 0.544921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 8.0, 15.0, 18.0, 32.0, 55.0, 139.0, 340.0, 877.0, 3184.0, 14923.0, 97405.0, 598087.0, 286312.0, 37650.0, 6798.0, 1654.0, 567.0, 226.0, 100.0, 61.0, 34.0, 15.0, 14.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.09375, -2.0367889404296875, -1.979827880859375, -1.9228668212890625, -1.86590576171875, -1.8089447021484375, -1.751983642578125, -1.6950225830078125, -1.6380615234375, -1.5811004638671875, -1.524139404296875, -1.4671783447265625, -1.41021728515625, -1.3532562255859375, -1.296295166015625, -1.2393341064453125, -1.182373046875, -1.1254119873046875, -1.068450927734375, -1.0114898681640625, -0.95452880859375, -0.8975677490234375, -0.840606689453125, -0.7836456298828125, -0.7266845703125, -0.6697235107421875, -0.612762451171875, -0.5558013916015625, -0.49884033203125, -0.4418792724609375, -0.384918212890625, -0.3279571533203125, -0.27099609375, -0.2140350341796875, -0.157073974609375, -0.1001129150390625, -0.04315185546875, 0.0138092041015625, 0.070770263671875, 0.1277313232421875, 0.1846923828125, 0.2416534423828125, 0.298614501953125, 0.3555755615234375, 0.41253662109375, 0.4694976806640625, 0.526458740234375, 0.5834197998046875, 0.640380859375, 0.6973419189453125, 0.754302978515625, 0.8112640380859375, 0.86822509765625, 0.9251861572265625, 0.982147216796875, 1.0391082763671875, 1.0960693359375, 1.1530303955078125, 1.209991455078125, 1.2669525146484375, 1.32391357421875, 1.3808746337890625, 1.437835693359375, 1.4947967529296875, 1.5517578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 10.0, 6.0, 8.0, 9.0, 16.0, 14.0, 24.0, 18.0, 19.0, 35.0, 38.0, 48.0, 42.0, 36.0, 40.0, 44.0, 73.0, 56.0, 65.0, 47.0, 40.0, 44.0, 40.0, 39.0, 30.0, 37.0, 17.0, 23.0, 16.0, 17.0, 17.0, 10.0, 7.0, 3.0, 5.0, 3.0, 4.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6591796875, -1.6095428466796875, -1.559906005859375, -1.5102691650390625, -1.46063232421875, -1.4109954833984375, -1.361358642578125, -1.3117218017578125, -1.2620849609375, -1.2124481201171875, -1.162811279296875, -1.1131744384765625, -1.06353759765625, -1.0139007568359375, -0.964263916015625, -0.9146270751953125, -0.864990234375, -0.8153533935546875, -0.765716552734375, -0.7160797119140625, -0.66644287109375, -0.6168060302734375, -0.567169189453125, -0.5175323486328125, -0.4678955078125, -0.4182586669921875, -0.368621826171875, -0.3189849853515625, -0.26934814453125, -0.2197113037109375, -0.170074462890625, -0.1204376220703125, -0.07080078125, -0.0211639404296875, 0.028472900390625, 0.0781097412109375, 0.12774658203125, 0.1773834228515625, 0.227020263671875, 0.2766571044921875, 0.3262939453125, 0.3759307861328125, 0.425567626953125, 0.4752044677734375, 0.52484130859375, 0.5744781494140625, 0.624114990234375, 0.6737518310546875, 0.723388671875, 0.7730255126953125, 0.822662353515625, 0.8722991943359375, 0.92193603515625, 0.9715728759765625, 1.021209716796875, 1.0708465576171875, 1.1204833984375, 1.1701202392578125, 1.219757080078125, 1.2693939208984375, 1.31903076171875, 1.3686676025390625, 1.418304443359375, 1.4679412841796875, 1.517578125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 7.0, 10.0, 14.0, 20.0, 48.0, 83.0, 144.0, 282.0, 565.0, 1452.0, 5571.0, 42230.0, 560387.0, 401976.0, 29098.0, 4410.0, 1167.0, 495.0, 266.0, 126.0, 80.0, 46.0, 32.0, 16.0, 13.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90234375, -0.8731613159179688, -0.8439788818359375, -0.8147964477539062, -0.785614013671875, -0.7564315795898438, -0.7272491455078125, -0.6980667114257812, -0.66888427734375, -0.6397018432617188, -0.6105194091796875, -0.5813369750976562, -0.552154541015625, -0.5229721069335938, -0.4937896728515625, -0.46460723876953125, -0.4354248046875, -0.40624237060546875, -0.3770599365234375, -0.34787750244140625, -0.318695068359375, -0.28951263427734375, -0.2603302001953125, -0.23114776611328125, -0.20196533203125, -0.17278289794921875, -0.1436004638671875, -0.11441802978515625, -0.085235595703125, -0.05605316162109375, -0.0268707275390625, 0.00231170654296875, 0.031494140625, 0.06067657470703125, 0.0898590087890625, 0.11904144287109375, 0.148223876953125, 0.17740631103515625, 0.2065887451171875, 0.23577117919921875, 0.26495361328125, 0.29413604736328125, 0.3233184814453125, 0.35250091552734375, 0.381683349609375, 0.41086578369140625, 0.4400482177734375, 0.46923065185546875, 0.4984130859375, 0.5275955200195312, 0.5567779541015625, 0.5859603881835938, 0.615142822265625, 0.6443252563476562, 0.6735076904296875, 0.7026901245117188, 0.73187255859375, 0.7610549926757812, 0.7902374267578125, 0.8194198608398438, 0.848602294921875, 0.8777847290039062, 0.9069671630859375, 0.9361495971679688, 0.96533203125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 7.0, 2.0, 5.0, 4.0, 5.0, 11.0, 14.0, 16.0, 31.0, 33.0, 33.0, 51.0, 60.0, 83.0, 91.0, 91.0, 78.0, 95.0, 63.0, 59.0, 44.0, 38.0, 16.0, 22.0, 16.0, 10.0, 4.0, 5.0, 4.0, 7.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011032819747924805, -0.0001070583239197731, -0.00010378845036029816, -0.00010051857680082321, -9.724870324134827e-05, -9.397882968187332e-05, -9.070895612239838e-05, -8.743908256292343e-05, -8.416920900344849e-05, -8.089933544397354e-05, -7.76294618844986e-05, -7.435958832502365e-05, -7.10897147655487e-05, -6.781984120607376e-05, -6.454996764659882e-05, -6.128009408712387e-05, -5.8010220527648926e-05, -5.474034696817398e-05, -5.1470473408699036e-05, -4.820059984922409e-05, -4.4930726289749146e-05, -4.16608527302742e-05, -3.8390979170799255e-05, -3.512110561132431e-05, -3.1851232051849365e-05, -2.858135849237442e-05, -2.5311484932899475e-05, -2.204161137342453e-05, -1.8771737813949585e-05, -1.550186425447464e-05, -1.2231990694999695e-05, -8.96211713552475e-06, -5.692243576049805e-06, -2.4223700165748596e-06, 8.475035429000854e-07, 4.1173771023750305e-06, 7.387250661849976e-06, 1.065712422132492e-05, 1.3926997780799866e-05, 1.719687134027481e-05, 2.0466744899749756e-05, 2.37366184592247e-05, 2.7006492018699646e-05, 3.027636557817459e-05, 3.3546239137649536e-05, 3.681611269712448e-05, 4.0085986256599426e-05, 4.335585981607437e-05, 4.6625733375549316e-05, 4.989560693502426e-05, 5.3165480494499207e-05, 5.643535405397415e-05, 5.97052276134491e-05, 6.297510117292404e-05, 6.624497473239899e-05, 6.951484829187393e-05, 7.278472185134888e-05, 7.605459541082382e-05, 7.932446897029877e-05, 8.259434252977371e-05, 8.586421608924866e-05, 8.91340896487236e-05, 9.240396320819855e-05, 9.567383676767349e-05, 9.894371032714844e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 6.0, 12.0, 17.0, 24.0, 45.0, 64.0, 88.0, 165.0, 238.0, 449.0, 845.0, 1801.0, 4846.0, 17208.0, 82133.0, 407130.0, 420703.0, 86377.0, 17492.0, 4945.0, 1858.0, 911.0, 500.0, 272.0, 163.0, 81.0, 62.0, 37.0, 18.0, 16.0, 8.0, 10.0, 6.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4931640625, -0.476165771484375, -0.45916748046875, -0.442169189453125, -0.4251708984375, -0.408172607421875, -0.39117431640625, -0.374176025390625, -0.357177734375, -0.340179443359375, -0.32318115234375, -0.306182861328125, -0.2891845703125, -0.272186279296875, -0.25518798828125, -0.238189697265625, -0.22119140625, -0.204193115234375, -0.18719482421875, -0.170196533203125, -0.1531982421875, -0.136199951171875, -0.11920166015625, -0.102203369140625, -0.085205078125, -0.068206787109375, -0.05120849609375, -0.034210205078125, -0.0172119140625, -0.000213623046875, 0.01678466796875, 0.033782958984375, 0.05078125, 0.067779541015625, 0.08477783203125, 0.101776123046875, 0.1187744140625, 0.135772705078125, 0.15277099609375, 0.169769287109375, 0.186767578125, 0.203765869140625, 0.22076416015625, 0.237762451171875, 0.2547607421875, 0.271759033203125, 0.28875732421875, 0.305755615234375, 0.32275390625, 0.339752197265625, 0.35675048828125, 0.373748779296875, 0.3907470703125, 0.407745361328125, 0.42474365234375, 0.441741943359375, 0.458740234375, 0.475738525390625, 0.49273681640625, 0.509735107421875, 0.5267333984375, 0.543731689453125, 0.56072998046875, 0.577728271484375, 0.5947265625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 5.0, 6.0, 7.0, 13.0, 14.0, 18.0, 24.0, 30.0, 43.0, 71.0, 82.0, 127.0, 120.0, 121.0, 95.0, 64.0, 47.0, 40.0, 21.0, 18.0, 13.0, 8.0, 5.0, 2.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.88134765625, -0.8557205200195312, -0.8300933837890625, -0.8044662475585938, -0.778839111328125, -0.7532119750976562, -0.7275848388671875, -0.7019577026367188, -0.67633056640625, -0.6507034301757812, -0.6250762939453125, -0.5994491577148438, -0.573822021484375, -0.5481948852539062, -0.5225677490234375, -0.49694061279296875, -0.4713134765625, -0.44568634033203125, -0.4200592041015625, -0.39443206787109375, -0.368804931640625, -0.34317779541015625, -0.3175506591796875, -0.29192352294921875, -0.26629638671875, -0.24066925048828125, -0.2150421142578125, -0.18941497802734375, -0.163787841796875, -0.13816070556640625, -0.1125335693359375, -0.08690643310546875, -0.061279296875, -0.03565216064453125, -0.0100250244140625, 0.01560211181640625, 0.041229248046875, 0.06685638427734375, 0.0924835205078125, 0.11811065673828125, 0.14373779296875, 0.16936492919921875, 0.1949920654296875, 0.22061920166015625, 0.246246337890625, 0.27187347412109375, 0.2975006103515625, 0.32312774658203125, 0.3487548828125, 0.37438201904296875, 0.4000091552734375, 0.42563629150390625, 0.451263427734375, 0.47689056396484375, 0.5025177001953125, 0.5281448364257812, 0.55377197265625, 0.5793991088867188, 0.6050262451171875, 0.6306533813476562, 0.656280517578125, 0.6819076538085938, 0.7075347900390625, 0.7331619262695312, 0.7587890625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 14.0, 14.0, 37.0, 64.0, 84.0, 156.0, 148.0, 163.0, 115.0, 74.0, 52.0, 32.0, 26.0, 8.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.134284496307373, -5.749335289001465, -5.364386081695557, -4.979436874389648, -4.594487190246582, -4.209538459777832, -3.8245887756347656, -3.4396395683288574, -3.054690361022949, -2.669741153717041, -2.284791946411133, -1.8998425006866455, -1.5148932933807373, -1.129944086074829, -0.7449946403503418, -0.3600454330444336, 0.02490377426147461, 0.4098530411720276, 0.7948023080825806, 1.1797516345977783, 1.5647008419036865, 1.9496500492095947, 2.334599494934082, 2.7195487022399902, 3.1044979095458984, 3.4894471168518066, 3.874396324157715, 4.259346008300781, 4.644294738769531, 5.029244422912598, 5.414193630218506, 5.799142837524414, 6.184091567993164, 6.569040775299072, 6.9539899826049805, 7.338939666748047, 7.723888397216797, 8.108838081359863, 8.49378776550293, 8.87873649597168, 9.26368522644043, 9.648634910583496, 10.033583641052246, 10.418533325195312, 10.803482055664062, 11.188431739807129, 11.573381423950195, 11.958330154418945, 12.343279838562012, 12.728229522705078, 13.113178253173828, 13.498127937316895, 13.883076667785645, 14.268026351928711, 14.652975082397461, 15.037924766540527, 15.422874450683594, 15.80782413482666, 16.192773818969727, 16.577722549438477, 16.962671279907227, 17.347620010375977, 17.73257064819336, 18.11751937866211, 18.50246810913086]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 2.0, 3.0, 5.0, 9.0, 8.0, 10.0, 19.0, 14.0, 16.0, 24.0, 34.0, 22.0, 31.0, 32.0, 44.0, 37.0, 41.0, 48.0, 44.0, 41.0, 40.0, 57.0, 38.0, 45.0, 35.0, 42.0, 24.0, 32.0, 36.0, 21.0, 23.0, 18.0, 25.0, 14.0, 19.0, 10.0, 6.0, 8.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-8.193939208984375, -7.955328464508057, -7.7167181968688965, -7.478107452392578, -7.23949670791626, -7.0008864402771, -6.762275695800781, -6.523665428161621, -6.285054683685303, -6.046443939208984, -5.807833671569824, -5.569222927093506, -5.3306121826171875, -5.092001914978027, -4.853391170501709, -4.614780426025391, -4.3761701583862305, -4.137559413909912, -3.898948907852173, -3.6603384017944336, -3.4217278957366943, -3.183117389678955, -2.9445066452026367, -2.7058961391448975, -2.46728515625, -2.2286746501922607, -1.990064024925232, -1.7514533996582031, -1.5128428936004639, -1.274232268333435, -1.0356216430664062, -0.797011137008667, -0.5584006309509277, -0.3197900652885437, -0.08117946982383728, 0.15743112564086914, 0.3960416913032532, 0.6346522569656372, 0.873262882232666, 1.1118733882904053, 1.350484013557434, 1.589094638824463, 1.8277051448822021, 2.0663156509399414, 2.3049263954162598, 2.543536901473999, 2.7821474075317383, 3.0207581520080566, 3.259368658065796, 3.497979164123535, 3.7365899085998535, 3.9752004146575928, 4.213810920715332, 4.45242166519165, 4.691032409667969, 4.929642677307129, 5.168253421783447, 5.406864166259766, 5.645474433898926, 5.884085178375244, 6.1226959228515625, 6.361306190490723, 6.599916934967041, 6.838527679443359, 7.0771379470825195]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 7.0, 21.0, 40.0, 67.0, 195.0, 809.0, 7667.0, 4162969.0, 20573.0, 1454.0, 287.0, 93.0, 45.0, 20.0, 16.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84765625, -5.6568603515625, -5.466064453125, -5.2752685546875, -5.08447265625, -4.8936767578125, -4.702880859375, -4.5120849609375, -4.3212890625, -4.1304931640625, -3.939697265625, -3.7489013671875, -3.55810546875, -3.3673095703125, -3.176513671875, -2.9857177734375, -2.794921875, -2.6041259765625, -2.413330078125, -2.2225341796875, -2.03173828125, -1.8409423828125, -1.650146484375, -1.4593505859375, -1.2685546875, -1.0777587890625, -0.886962890625, -0.6961669921875, -0.50537109375, -0.3145751953125, -0.123779296875, 0.0670166015625, 0.2578125, 0.4486083984375, 0.639404296875, 0.8302001953125, 1.02099609375, 1.2117919921875, 1.402587890625, 1.5933837890625, 1.7841796875, 1.9749755859375, 2.165771484375, 2.3565673828125, 2.54736328125, 2.7381591796875, 2.928955078125, 3.1197509765625, 3.310546875, 3.5013427734375, 3.692138671875, 3.8829345703125, 4.07373046875, 4.2645263671875, 4.455322265625, 4.6461181640625, 4.8369140625, 5.0277099609375, 5.218505859375, 5.4093017578125, 5.60009765625, 5.7908935546875, 5.981689453125, 6.1724853515625, 6.36328125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 6.0, 14.0, 9.0, 14.0, 18.0, 26.0, 28.0, 34.0, 39.0, 42.0, 51.0, 65.0, 50.0, 61.0, 56.0, 48.0, 52.0, 68.0, 57.0, 59.0, 55.0, 35.0, 28.0, 16.0, 17.0, 10.0, 11.0, 10.0, 5.0, 4.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34716796875, -0.3330841064453125, -0.319000244140625, -0.3049163818359375, -0.29083251953125, -0.2767486572265625, -0.262664794921875, -0.2485809326171875, -0.2344970703125, -0.2204132080078125, -0.206329345703125, -0.1922454833984375, -0.17816162109375, -0.1640777587890625, -0.149993896484375, -0.1359100341796875, -0.121826171875, -0.1077423095703125, -0.093658447265625, -0.0795745849609375, -0.06549072265625, -0.0514068603515625, -0.037322998046875, -0.0232391357421875, -0.0091552734375, 0.0049285888671875, 0.019012451171875, 0.0330963134765625, 0.04718017578125, 0.0612640380859375, 0.075347900390625, 0.0894317626953125, 0.103515625, 0.1175994873046875, 0.131683349609375, 0.1457672119140625, 0.15985107421875, 0.1739349365234375, 0.188018798828125, 0.2021026611328125, 0.2161865234375, 0.2302703857421875, 0.244354248046875, 0.2584381103515625, 0.27252197265625, 0.2866058349609375, 0.300689697265625, 0.3147735595703125, 0.328857421875, 0.3429412841796875, 0.357025146484375, 0.3711090087890625, 0.38519287109375, 0.3992767333984375, 0.413360595703125, 0.4274444580078125, 0.4415283203125, 0.4556121826171875, 0.469696044921875, 0.4837799072265625, 0.49786376953125, 0.5119476318359375, 0.526031494140625, 0.5401153564453125, 0.55419921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 11.0, 11.0, 30.0, 30.0, 36.0, 56.0, 78.0, 91.0, 150.0, 207.0, 268.0, 426.0, 671.0, 962.0, 1570.0, 2718.0, 5222.0, 11551.0, 40564.0, 3924259.0, 164373.0, 22715.0, 8103.0, 4003.0, 2185.0, 1297.0, 832.0, 542.0, 400.0, 241.0, 194.0, 132.0, 105.0, 78.0, 43.0, 33.0, 21.0, 18.0, 10.0, 12.0, 6.0, 5.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.53125, -1.48724365234375, -1.4432373046875, -1.39923095703125, -1.355224609375, -1.31121826171875, -1.2672119140625, -1.22320556640625, -1.17919921875, -1.13519287109375, -1.0911865234375, -1.04718017578125, -1.003173828125, -0.95916748046875, -0.9151611328125, -0.87115478515625, -0.8271484375, -0.78314208984375, -0.7391357421875, -0.69512939453125, -0.651123046875, -0.60711669921875, -0.5631103515625, -0.51910400390625, -0.47509765625, -0.43109130859375, -0.3870849609375, -0.34307861328125, -0.299072265625, -0.25506591796875, -0.2110595703125, -0.16705322265625, -0.123046875, -0.07904052734375, -0.0350341796875, 0.00897216796875, 0.052978515625, 0.09698486328125, 0.1409912109375, 0.18499755859375, 0.22900390625, 0.27301025390625, 0.3170166015625, 0.36102294921875, 0.405029296875, 0.44903564453125, 0.4930419921875, 0.53704833984375, 0.5810546875, 0.62506103515625, 0.6690673828125, 0.71307373046875, 0.757080078125, 0.80108642578125, 0.8450927734375, 0.88909912109375, 0.93310546875, 0.97711181640625, 1.0211181640625, 1.06512451171875, 1.109130859375, 1.15313720703125, 1.1971435546875, 1.24114990234375, 1.28515625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 8.0, 4.0, 7.0, 11.0, 20.0, 52.0, 137.0, 3525.0, 159.0, 57.0, 31.0, 10.0, 10.0, 14.0, 2.0, 5.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.404052734375, -0.3926887512207031, -0.38132476806640625, -0.3699607849121094, -0.3585968017578125, -0.3472328186035156, -0.33586883544921875, -0.3245048522949219, -0.313140869140625, -0.3017768859863281, -0.29041290283203125, -0.2790489196777344, -0.2676849365234375, -0.2563209533691406, -0.24495697021484375, -0.23359298706054688, -0.22222900390625, -0.21086502075195312, -0.19950103759765625, -0.18813705444335938, -0.1767730712890625, -0.16540908813476562, -0.15404510498046875, -0.14268112182617188, -0.131317138671875, -0.11995315551757812, -0.10858917236328125, -0.09722518920898438, -0.0858612060546875, -0.07449722290039062, -0.06313323974609375, -0.051769256591796875, -0.0404052734375, -0.029041290283203125, -0.01767730712890625, -0.006313323974609375, 0.0050506591796875, 0.016414642333984375, 0.02777862548828125, 0.039142608642578125, 0.050506591796875, 0.061870574951171875, 0.07323455810546875, 0.08459854125976562, 0.0959625244140625, 0.10732650756835938, 0.11869049072265625, 0.13005447387695312, 0.14141845703125, 0.15278244018554688, 0.16414642333984375, 0.17551040649414062, 0.1868743896484375, 0.19823837280273438, 0.20960235595703125, 0.22096633911132812, 0.232330322265625, 0.24369430541992188, 0.25505828857421875, 0.2664222717285156, 0.2777862548828125, 0.2891502380371094, 0.30051422119140625, 0.3118782043457031, 0.3232421875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 10.0, 31.0, 92.0, 237.0, 289.0, 190.0, 99.0, 32.0, 16.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0462324619293213, -0.9535099267959595, -0.8607873916625977, -0.7680649161338806, -0.6753423810005188, -0.582619845867157, -0.48989737033843994, -0.3971748352050781, -0.3044523000717163, -0.21172977983951569, -0.11900725960731506, -0.026284754276275635, 0.06643778085708618, 0.159160315990448, 0.25188279151916504, 0.34460532665252686, 0.43732786178588867, 0.5300503969192505, 0.6227729320526123, 0.7154954075813293, 0.8082179427146912, 0.900940477848053, 0.99366295337677, 1.0863854885101318, 1.1791080236434937, 1.2718305587768555, 1.3645530939102173, 1.457275629043579, 1.5499980449676514, 1.6427206993103027, 1.735443115234375, 1.8281656503677368, 1.9208884239196777, 2.01361083984375, 2.1063334941864014, 2.1990559101104736, 2.291778564453125, 2.3845009803771973, 2.4772233963012695, 2.569946050643921, 2.6626687049865723, 2.7553911209106445, 2.848113775253296, 2.940836191177368, 3.0335588455200195, 3.126281261444092, 3.219003677368164, 3.3117263317108154, 3.4044487476348877, 3.49717116355896, 3.5898938179016113, 3.6826162338256836, 3.775338888168335, 3.8680613040924072, 3.9607839584350586, 4.053506374359131, 4.146228790283203, 4.238951206207275, 4.331673622131348, 4.424396514892578, 4.51711893081665, 4.609841346740723, 4.702563762664795, 4.795286178588867, 4.888009071350098]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 3.0, 5.0, 9.0, 11.0, 7.0, 13.0, 10.0, 11.0, 15.0, 12.0, 22.0, 34.0, 26.0, 31.0, 33.0, 43.0, 32.0, 52.0, 46.0, 66.0, 39.0, 38.0, 43.0, 37.0, 40.0, 36.0, 37.0, 33.0, 28.0, 24.0, 21.0, 28.0, 21.0, 22.0, 16.0, 14.0, 4.0, 11.0, 6.0, 2.0, 3.0, 7.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.7976868748664856, -0.7757668495178223, -0.7538468241691589, -0.7319267988204956, -0.7100067734718323, -0.688086748123169, -0.6661666631698608, -0.6442466974258423, -0.6223266124725342, -0.6004065871238708, -0.5784865617752075, -0.5565665364265442, -0.5346465110778809, -0.5127264857292175, -0.4908064305782318, -0.4688864052295685, -0.44696640968322754, -0.4250463843345642, -0.4031263589859009, -0.38120633363723755, -0.3592863082885742, -0.3373662829399109, -0.31544622778892517, -0.29352620244026184, -0.2716061770915985, -0.24968615174293518, -0.22776612639427185, -0.20584608614444733, -0.183926060795784, -0.16200603544712067, -0.14008599519729614, -0.11816596984863281, -0.09624588489532471, -0.07432585954666138, -0.05240582674741745, -0.030485793948173523, -0.008565768599510193, 0.013354256749153137, 0.03527429699897766, 0.05719432234764099, 0.07911434769630432, 0.10103437304496765, 0.12295440584421158, 0.1448744386434555, 0.16679446399211884, 0.18871448934078217, 0.2106345295906067, 0.23255455493927002, 0.25447458028793335, 0.2763946056365967, 0.29831463098526, 0.32023465633392334, 0.34215468168258667, 0.36407470703125, 0.3859947621822357, 0.40791478753089905, 0.4298348128795624, 0.4517548382282257, 0.47367486357688904, 0.49559491872787476, 0.5175149440765381, 0.5394349694252014, 0.5613549947738647, 0.5832750201225281, 0.6051950454711914]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 7.0, 11.0, 6.0, 10.0, 15.0, 22.0, 21.0, 34.0, 63.0, 86.0, 115.0, 178.0, 326.0, 562.0, 1114.0, 2232.0, 5050.0, 11364.0, 27631.0, 66528.0, 154987.0, 286040.0, 263722.0, 131824.0, 55557.0, 22732.0, 9754.0, 4228.0, 1966.0, 1009.0, 517.0, 280.0, 192.0, 111.0, 70.0, 51.0, 36.0, 28.0, 21.0, 18.0, 14.0, 6.0, 2.0, 1.0, 5.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96240234375, -0.9302139282226562, -0.8980255126953125, -0.8658370971679688, -0.833648681640625, -0.8014602661132812, -0.7692718505859375, -0.7370834350585938, -0.70489501953125, -0.6727066040039062, -0.6405181884765625, -0.6083297729492188, -0.576141357421875, -0.5439529418945312, -0.5117645263671875, -0.47957611083984375, -0.4473876953125, -0.41519927978515625, -0.3830108642578125, -0.35082244873046875, -0.318634033203125, -0.28644561767578125, -0.2542572021484375, -0.22206878662109375, -0.18988037109375, -0.15769195556640625, -0.1255035400390625, -0.09331512451171875, -0.061126708984375, -0.02893829345703125, 0.0032501220703125, 0.03543853759765625, 0.067626953125, 0.09981536865234375, 0.1320037841796875, 0.16419219970703125, 0.196380615234375, 0.22856903076171875, 0.2607574462890625, 0.29294586181640625, 0.32513427734375, 0.35732269287109375, 0.3895111083984375, 0.42169952392578125, 0.453887939453125, 0.48607635498046875, 0.5182647705078125, 0.5504531860351562, 0.5826416015625, 0.6148300170898438, 0.6470184326171875, 0.6792068481445312, 0.711395263671875, 0.7435836791992188, 0.7757720947265625, 0.8079605102539062, 0.84014892578125, 0.8723373413085938, 0.9045257568359375, 0.9367141723632812, 0.968902587890625, 1.0010910034179688, 1.0332794189453125, 1.0654678344726562, 1.09765625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 7.0, 13.0, 11.0, 11.0, 19.0, 24.0, 30.0, 36.0, 27.0, 40.0, 45.0, 51.0, 67.0, 70.0, 54.0, 40.0, 50.0, 63.0, 53.0, 60.0, 48.0, 34.0, 32.0, 27.0, 19.0, 8.0, 12.0, 13.0, 4.0, 2.0, 7.0, 12.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38720703125, -0.37223052978515625, -0.3572540283203125, -0.34227752685546875, -0.327301025390625, -0.31232452392578125, -0.2973480224609375, -0.28237152099609375, -0.26739501953125, -0.25241851806640625, -0.2374420166015625, -0.22246551513671875, -0.207489013671875, -0.19251251220703125, -0.1775360107421875, -0.16255950927734375, -0.1475830078125, -0.13260650634765625, -0.1176300048828125, -0.10265350341796875, -0.087677001953125, -0.07270050048828125, -0.0577239990234375, -0.04274749755859375, -0.02777099609375, -0.01279449462890625, 0.0021820068359375, 0.01715850830078125, 0.032135009765625, 0.04711151123046875, 0.0620880126953125, 0.07706451416015625, 0.092041015625, 0.10701751708984375, 0.1219940185546875, 0.13697052001953125, 0.151947021484375, 0.16692352294921875, 0.1819000244140625, 0.19687652587890625, 0.21185302734375, 0.22682952880859375, 0.2418060302734375, 0.25678253173828125, 0.271759033203125, 0.28673553466796875, 0.3017120361328125, 0.31668853759765625, 0.3316650390625, 0.34664154052734375, 0.3616180419921875, 0.37659454345703125, 0.391571044921875, 0.40654754638671875, 0.4215240478515625, 0.43650054931640625, 0.45147705078125, 0.46645355224609375, 0.4814300537109375, 0.49640655517578125, 0.511383056640625, 0.5263595581054688, 0.5413360595703125, 0.5563125610351562, 0.5712890625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 3.0, 4.0, 7.0, 9.0, 22.0, 34.0, 36.0, 64.0, 93.0, 181.0, 348.0, 685.0, 1655.0, 4231.0, 12371.0, 41516.0, 152567.0, 438159.0, 282486.0, 79953.0, 22241.0, 7146.0, 2598.0, 1071.0, 472.0, 225.0, 126.0, 85.0, 59.0, 38.0, 25.0, 5.0, 10.0, 6.0, 5.0, 2.0, 4.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.49609375, -1.4517669677734375, -1.407440185546875, -1.3631134033203125, -1.31878662109375, -1.2744598388671875, -1.230133056640625, -1.1858062744140625, -1.1414794921875, -1.0971527099609375, -1.052825927734375, -1.0084991455078125, -0.96417236328125, -0.9198455810546875, -0.875518798828125, -0.8311920166015625, -0.786865234375, -0.7425384521484375, -0.698211669921875, -0.6538848876953125, -0.60955810546875, -0.5652313232421875, -0.520904541015625, -0.4765777587890625, -0.4322509765625, -0.3879241943359375, -0.343597412109375, -0.2992706298828125, -0.25494384765625, -0.2106170654296875, -0.166290283203125, -0.1219635009765625, -0.07763671875, -0.0333099365234375, 0.011016845703125, 0.0553436279296875, 0.09967041015625, 0.1439971923828125, 0.188323974609375, 0.2326507568359375, 0.2769775390625, 0.3213043212890625, 0.365631103515625, 0.4099578857421875, 0.45428466796875, 0.4986114501953125, 0.542938232421875, 0.5872650146484375, 0.631591796875, 0.6759185791015625, 0.720245361328125, 0.7645721435546875, 0.80889892578125, 0.8532257080078125, 0.897552490234375, 0.9418792724609375, 0.9862060546875, 1.0305328369140625, 1.074859619140625, 1.1191864013671875, 1.16351318359375, 1.2078399658203125, 1.252166748046875, 1.2964935302734375, 1.3408203125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 6.0, 4.0, 11.0, 19.0, 12.0, 15.0, 22.0, 24.0, 28.0, 32.0, 39.0, 38.0, 46.0, 33.0, 46.0, 39.0, 55.0, 44.0, 50.0, 54.0, 55.0, 55.0, 35.0, 49.0, 26.0, 26.0, 19.0, 26.0, 23.0, 13.0, 9.0, 8.0, 10.0, 5.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8994140625, -1.8316192626953125, -1.763824462890625, -1.6960296630859375, -1.62823486328125, -1.5604400634765625, -1.492645263671875, -1.4248504638671875, -1.3570556640625, -1.2892608642578125, -1.221466064453125, -1.1536712646484375, -1.08587646484375, -1.0180816650390625, -0.950286865234375, -0.8824920654296875, -0.814697265625, -0.7469024658203125, -0.679107666015625, -0.6113128662109375, -0.54351806640625, -0.4757232666015625, -0.407928466796875, -0.3401336669921875, -0.2723388671875, -0.2045440673828125, -0.136749267578125, -0.0689544677734375, -0.00115966796875, 0.0666351318359375, 0.134429931640625, 0.2022247314453125, 0.27001953125, 0.3378143310546875, 0.405609130859375, 0.4734039306640625, 0.54119873046875, 0.6089935302734375, 0.676788330078125, 0.7445831298828125, 0.8123779296875, 0.8801727294921875, 0.947967529296875, 1.0157623291015625, 1.08355712890625, 1.1513519287109375, 1.219146728515625, 1.2869415283203125, 1.354736328125, 1.4225311279296875, 1.490325927734375, 1.5581207275390625, 1.62591552734375, 1.6937103271484375, 1.761505126953125, 1.8292999267578125, 1.8970947265625, 1.9648895263671875, 2.032684326171875, 2.1004791259765625, 2.16827392578125, 2.2360687255859375, 2.303863525390625, 2.3716583251953125, 2.439453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 5.0, 7.0, 8.0, 27.0, 48.0, 128.0, 316.0, 1101.0, 8330.0, 332230.0, 690169.0, 13981.0, 1547.0, 387.0, 156.0, 64.0, 22.0, 15.0, 8.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8671875, -1.8071441650390625, -1.747100830078125, -1.6870574951171875, -1.62701416015625, -1.5669708251953125, -1.506927490234375, -1.4468841552734375, -1.3868408203125, -1.3267974853515625, -1.266754150390625, -1.2067108154296875, -1.14666748046875, -1.0866241455078125, -1.026580810546875, -0.9665374755859375, -0.906494140625, -0.8464508056640625, -0.786407470703125, -0.7263641357421875, -0.66632080078125, -0.6062774658203125, -0.546234130859375, -0.4861907958984375, -0.4261474609375, -0.3661041259765625, -0.306060791015625, -0.2460174560546875, -0.18597412109375, -0.1259307861328125, -0.065887451171875, -0.0058441162109375, 0.05419921875, 0.1142425537109375, 0.174285888671875, 0.2343292236328125, 0.29437255859375, 0.3544158935546875, 0.414459228515625, 0.4745025634765625, 0.5345458984375, 0.5945892333984375, 0.654632568359375, 0.7146759033203125, 0.77471923828125, 0.8347625732421875, 0.894805908203125, 0.9548492431640625, 1.014892578125, 1.0749359130859375, 1.134979248046875, 1.1950225830078125, 1.25506591796875, 1.3151092529296875, 1.375152587890625, 1.4351959228515625, 1.4952392578125, 1.5552825927734375, 1.615325927734375, 1.6753692626953125, 1.73541259765625, 1.7954559326171875, 1.855499267578125, 1.9155426025390625, 1.9755859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 6.0, 9.0, 8.0, 10.0, 15.0, 29.0, 36.0, 38.0, 43.0, 65.0, 69.0, 70.0, 88.0, 86.0, 105.0, 86.0, 65.0, 53.0, 38.0, 17.0, 19.0, 10.0, 8.0, 11.0, 9.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010341405868530273, -9.95611771941185e-05, -9.570829570293427e-05, -9.185541421175003e-05, -8.80025327205658e-05, -8.414965122938156e-05, -8.029676973819733e-05, -7.644388824701309e-05, -7.259100675582886e-05, -6.873812526464462e-05, -6.488524377346039e-05, -6.1032362282276154e-05, -5.717948079109192e-05, -5.3326599299907684e-05, -4.947371780872345e-05, -4.5620836317539215e-05, -4.176795482635498e-05, -3.7915073335170746e-05, -3.406219184398651e-05, -3.0209310352802277e-05, -2.6356428861618042e-05, -2.2503547370433807e-05, -1.8650665879249573e-05, -1.4797784388065338e-05, -1.0944902896881104e-05, -7.092021405696869e-06, -3.2391399145126343e-06, 6.137415766716003e-07, 4.466623067855835e-06, 8.31950455904007e-06, 1.2172386050224304e-05, 1.602526754140854e-05, 1.9878149032592773e-05, 2.3731030523777008e-05, 2.7583912014961243e-05, 3.143679350614548e-05, 3.528967499732971e-05, 3.9142556488513947e-05, 4.299543797969818e-05, 4.6848319470882416e-05, 5.070120096206665e-05, 5.4554082453250885e-05, 5.840696394443512e-05, 6.225984543561935e-05, 6.611272692680359e-05, 6.996560841798782e-05, 7.381848990917206e-05, 7.767137140035629e-05, 8.152425289154053e-05, 8.537713438272476e-05, 8.9230015873909e-05, 9.308289736509323e-05, 9.693577885627747e-05, 0.0001007886603474617, 0.00010464154183864594, 0.00010849442332983017, 0.0001123473048210144, 0.00011620018631219864, 0.00012005306780338287, 0.0001239059492945671, 0.00012775883078575134, 0.00013161171227693558, 0.0001354645937681198, 0.00013931747525930405, 0.00014317035675048828]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 14.0, 24.0, 37.0, 80.0, 211.0, 484.0, 1405.0, 5472.0, 38059.0, 505359.0, 455582.0, 34629.0, 5050.0, 1314.0, 433.0, 190.0, 92.0, 45.0, 18.0, 14.0, 16.0, 4.0, 8.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2314453125, -1.1981430053710938, -1.1648406982421875, -1.1315383911132812, -1.098236083984375, -1.0649337768554688, -1.0316314697265625, -0.9983291625976562, -0.96502685546875, -0.9317245483398438, -0.8984222412109375, -0.8651199340820312, -0.831817626953125, -0.7985153198242188, -0.7652130126953125, -0.7319107055664062, -0.6986083984375, -0.6653060913085938, -0.6320037841796875, -0.5987014770507812, -0.565399169921875, -0.5320968627929688, -0.4987945556640625, -0.46549224853515625, -0.43218994140625, -0.39888763427734375, -0.3655853271484375, -0.33228302001953125, -0.298980712890625, -0.26567840576171875, -0.2323760986328125, -0.19907379150390625, -0.165771484375, -0.13246917724609375, -0.0991668701171875, -0.06586456298828125, -0.032562255859375, 0.00074005126953125, 0.0340423583984375, 0.06734466552734375, 0.10064697265625, 0.13394927978515625, 0.1672515869140625, 0.20055389404296875, 0.233856201171875, 0.26715850830078125, 0.3004608154296875, 0.33376312255859375, 0.3670654296875, 0.40036773681640625, 0.4336700439453125, 0.46697235107421875, 0.500274658203125, 0.5335769653320312, 0.5668792724609375, 0.6001815795898438, 0.63348388671875, 0.6667861938476562, 0.7000885009765625, 0.7333908081054688, 0.766693115234375, 0.7999954223632812, 0.8332977294921875, 0.8666000366210938, 0.89990234375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 4.0, 1.0, 8.0, 8.0, 9.0, 19.0, 28.0, 38.0, 58.0, 75.0, 98.0, 101.0, 107.0, 107.0, 76.0, 66.0, 49.0, 38.0, 32.0, 19.0, 16.0, 7.0, 7.0, 9.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1708984375, -1.138763427734375, -1.10662841796875, -1.074493408203125, -1.0423583984375, -1.010223388671875, -0.97808837890625, -0.945953369140625, -0.913818359375, -0.881683349609375, -0.84954833984375, -0.817413330078125, -0.7852783203125, -0.753143310546875, -0.72100830078125, -0.688873291015625, -0.65673828125, -0.624603271484375, -0.59246826171875, -0.560333251953125, -0.5281982421875, -0.496063232421875, -0.46392822265625, -0.431793212890625, -0.399658203125, -0.367523193359375, -0.33538818359375, -0.303253173828125, -0.2711181640625, -0.238983154296875, -0.20684814453125, -0.174713134765625, -0.142578125, -0.110443115234375, -0.07830810546875, -0.046173095703125, -0.0140380859375, 0.018096923828125, 0.05023193359375, 0.082366943359375, 0.114501953125, 0.146636962890625, 0.17877197265625, 0.210906982421875, 0.2430419921875, 0.275177001953125, 0.30731201171875, 0.339447021484375, 0.37158203125, 0.403717041015625, 0.43585205078125, 0.467987060546875, 0.5001220703125, 0.532257080078125, 0.56439208984375, 0.596527099609375, 0.628662109375, 0.660797119140625, 0.69293212890625, 0.725067138671875, 0.7572021484375, 0.789337158203125, 0.82147216796875, 0.853607177734375, 0.8857421875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 15.0, 34.0, 59.0, 71.0, 125.0, 130.0, 126.0, 144.0, 103.0, 63.0, 45.0, 22.0, 20.0, 8.0, 5.0, 11.0, 5.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.77946949005127, -10.329562187194824, -9.879655838012695, -9.42974853515625, -8.979841232299805, -8.52993392944336, -8.080026626586914, -7.630120277404785, -7.18021297454834, -6.7303056716918945, -6.280398845672607, -5.83049201965332, -5.380584716796875, -4.93067741394043, -4.480770587921143, -4.0308637619018555, -3.58095645904541, -3.131049394607544, -2.6811423301696777, -2.2312352657318115, -1.7813282012939453, -1.331421136856079, -0.8815140724182129, -0.4316070079803467, 0.01830005645751953, 0.46820712089538574, 0.918114185333252, 1.3680212497711182, 1.8179283142089844, 2.2678353786468506, 2.717742443084717, 3.167649507522583, 3.617555618286133, 4.067462921142578, 4.517369747161865, 4.967276573181152, 5.417183876037598, 5.867091178894043, 6.31699800491333, 6.766904830932617, 7.2168121337890625, 7.666719436645508, 8.116626739501953, 8.566533088684082, 9.016440391540527, 9.466347694396973, 9.916254043579102, 10.366161346435547, 10.816068649291992, 11.265975952148438, 11.715883255004883, 12.165789604187012, 12.615696907043457, 13.065604209899902, 13.515510559082031, 13.965417861938477, 14.415325164794922, 14.865232467651367, 15.315139770507812, 15.765046119689941, 16.214954376220703, 16.664859771728516, 17.11476707458496, 17.564674377441406, 18.01458168029785]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 9.0, 11.0, 13.0, 11.0, 2.0, 15.0, 13.0, 18.0, 28.0, 21.0, 29.0, 20.0, 42.0, 35.0, 45.0, 44.0, 42.0, 48.0, 46.0, 45.0, 52.0, 45.0, 41.0, 44.0, 40.0, 30.0, 34.0, 29.0, 24.0, 20.0, 16.0, 18.0, 12.0, 9.0, 10.0, 12.0, 7.0, 11.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.964408874511719, -9.643903732299805, -9.323399543762207, -9.002894401550293, -8.682389259338379, -8.361885070800781, -8.041379928588867, -7.720874786376953, -7.400370121002197, -7.079865455627441, -6.759360313415527, -6.4388556480407715, -6.118350982666016, -5.797845840454102, -5.477341175079346, -5.15683650970459, -4.836331367492676, -4.51582670211792, -4.195321559906006, -3.87481689453125, -3.554311990737915, -3.23380708694458, -2.913302421569824, -2.5927975177764893, -2.2722926139831543, -1.9517877101898193, -1.631282925605774, -1.3107781410217285, -0.9902732372283936, -0.6697683334350586, -0.3492635488510132, -0.028758764266967773, 0.2917461395263672, 0.6122509837150574, 0.9327558279037476, 1.253260612487793, 1.573765516281128, 1.894270420074463, 2.2147750854492188, 2.5352799892425537, 2.8557848930358887, 3.1762897968292236, 3.4967947006225586, 3.8172993659973145, 4.13780403137207, 4.458309173583984, 4.77881383895874, 5.099318504333496, 5.41982364654541, 5.740328311920166, 6.06083345413208, 6.381338119506836, 6.70184326171875, 7.022347927093506, 7.342852592468262, 7.663357734680176, 7.983862400054932, 8.304367065429688, 8.624872207641602, 8.945377349853516, 9.265881538391113, 9.586386680603027, 9.906891822814941, 10.227396011352539, 10.547901153564453]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 6.0, 10.0, 8.0, 16.0, 24.0, 31.0, 43.0, 66.0, 99.0, 192.0, 337.0, 602.0, 1214.0, 2793.0, 7386.0, 28560.0, 3951876.0, 171251.0, 19420.0, 5743.0, 2191.0, 1026.0, 510.0, 343.0, 197.0, 109.0, 61.0, 51.0, 37.0, 23.0, 15.0, 11.0, 10.0, 8.0, 6.0, 5.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4375, -1.3819580078125, -1.326416015625, -1.2708740234375, -1.21533203125, -1.1597900390625, -1.104248046875, -1.0487060546875, -0.9931640625, -0.9376220703125, -0.882080078125, -0.8265380859375, -0.77099609375, -0.7154541015625, -0.659912109375, -0.6043701171875, -0.548828125, -0.4932861328125, -0.437744140625, -0.3822021484375, -0.32666015625, -0.2711181640625, -0.215576171875, -0.1600341796875, -0.1044921875, -0.0489501953125, 0.006591796875, 0.0621337890625, 0.11767578125, 0.1732177734375, 0.228759765625, 0.2843017578125, 0.33984375, 0.3953857421875, 0.450927734375, 0.5064697265625, 0.56201171875, 0.6175537109375, 0.673095703125, 0.7286376953125, 0.7841796875, 0.8397216796875, 0.895263671875, 0.9508056640625, 1.00634765625, 1.0618896484375, 1.117431640625, 1.1729736328125, 1.228515625, 1.2840576171875, 1.339599609375, 1.3951416015625, 1.45068359375, 1.5062255859375, 1.561767578125, 1.6173095703125, 1.6728515625, 1.7283935546875, 1.783935546875, 1.8394775390625, 1.89501953125, 1.9505615234375, 2.006103515625, 2.0616455078125, 2.1171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 8.0, 11.0, 16.0, 19.0, 19.0, 31.0, 30.0, 43.0, 48.0, 41.0, 51.0, 69.0, 72.0, 72.0, 62.0, 49.0, 56.0, 45.0, 39.0, 45.0, 27.0, 32.0, 29.0, 19.0, 18.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6240234375, -0.605438232421875, -0.58685302734375, -0.568267822265625, -0.5496826171875, -0.531097412109375, -0.51251220703125, -0.493927001953125, -0.475341796875, -0.456756591796875, -0.43817138671875, -0.419586181640625, -0.4010009765625, -0.382415771484375, -0.36383056640625, -0.345245361328125, -0.32666015625, -0.308074951171875, -0.28948974609375, -0.270904541015625, -0.2523193359375, -0.233734130859375, -0.21514892578125, -0.196563720703125, -0.177978515625, -0.159393310546875, -0.14080810546875, -0.122222900390625, -0.1036376953125, -0.085052490234375, -0.06646728515625, -0.047882080078125, -0.029296875, -0.010711669921875, 0.00787353515625, 0.026458740234375, 0.0450439453125, 0.063629150390625, 0.08221435546875, 0.100799560546875, 0.119384765625, 0.137969970703125, 0.15655517578125, 0.175140380859375, 0.1937255859375, 0.212310791015625, 0.23089599609375, 0.249481201171875, 0.26806640625, 0.286651611328125, 0.30523681640625, 0.323822021484375, 0.3424072265625, 0.360992431640625, 0.37957763671875, 0.398162841796875, 0.416748046875, 0.435333251953125, 0.45391845703125, 0.472503662109375, 0.4910888671875, 0.509674072265625, 0.52825927734375, 0.546844482421875, 0.5654296875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 4.0, 5.0, 10.0, 15.0, 17.0, 20.0, 28.0, 41.0, 59.0, 98.0, 141.0, 195.0, 296.0, 432.0, 664.0, 1064.0, 1658.0, 2761.0, 5155.0, 10648.0, 24686.0, 76959.0, 3766543.0, 223620.0, 44716.0, 16841.0, 7564.0, 3871.0, 2226.0, 1411.0, 801.0, 549.0, 394.0, 255.0, 187.0, 104.0, 70.0, 45.0, 37.0, 26.0, 29.0, 8.0, 11.0, 7.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.1513671875, -1.115142822265625, -1.07891845703125, -1.042694091796875, -1.0064697265625, -0.970245361328125, -0.93402099609375, -0.897796630859375, -0.861572265625, -0.825347900390625, -0.78912353515625, -0.752899169921875, -0.7166748046875, -0.680450439453125, -0.64422607421875, -0.608001708984375, -0.57177734375, -0.535552978515625, -0.49932861328125, -0.463104248046875, -0.4268798828125, -0.390655517578125, -0.35443115234375, -0.318206787109375, -0.281982421875, -0.245758056640625, -0.20953369140625, -0.173309326171875, -0.1370849609375, -0.100860595703125, -0.06463623046875, -0.028411865234375, 0.0078125, 0.044036865234375, 0.08026123046875, 0.116485595703125, 0.1527099609375, 0.188934326171875, 0.22515869140625, 0.261383056640625, 0.297607421875, 0.333831787109375, 0.37005615234375, 0.406280517578125, 0.4425048828125, 0.478729248046875, 0.51495361328125, 0.551177978515625, 0.58740234375, 0.623626708984375, 0.65985107421875, 0.696075439453125, 0.7322998046875, 0.768524169921875, 0.80474853515625, 0.840972900390625, 0.877197265625, 0.913421630859375, 0.94964599609375, 0.985870361328125, 1.0220947265625, 1.058319091796875, 1.09454345703125, 1.130767822265625, 1.1669921875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 4.0, 16.0, 20.0, 25.0, 46.0, 77.0, 166.0, 3302.0, 173.0, 80.0, 32.0, 37.0, 19.0, 11.0, 14.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.494140625, -0.48131561279296875, -0.4684906005859375, -0.45566558837890625, -0.442840576171875, -0.43001556396484375, -0.4171905517578125, -0.40436553955078125, -0.39154052734375, -0.37871551513671875, -0.3658905029296875, -0.35306549072265625, -0.340240478515625, -0.32741546630859375, -0.3145904541015625, -0.30176544189453125, -0.2889404296875, -0.27611541748046875, -0.2632904052734375, -0.25046539306640625, -0.237640380859375, -0.22481536865234375, -0.2119903564453125, -0.19916534423828125, -0.18634033203125, -0.17351531982421875, -0.1606903076171875, -0.14786529541015625, -0.135040283203125, -0.12221527099609375, -0.1093902587890625, -0.09656524658203125, -0.083740234375, -0.07091522216796875, -0.0580902099609375, -0.04526519775390625, -0.032440185546875, -0.01961517333984375, -0.0067901611328125, 0.00603485107421875, 0.01885986328125, 0.03168487548828125, 0.0445098876953125, 0.05733489990234375, 0.070159912109375, 0.08298492431640625, 0.0958099365234375, 0.10863494873046875, 0.1214599609375, 0.13428497314453125, 0.1471099853515625, 0.15993499755859375, 0.172760009765625, 0.18558502197265625, 0.1984100341796875, 0.21123504638671875, 0.22406005859375, 0.23688507080078125, 0.2497100830078125, 0.26253509521484375, 0.275360107421875, 0.28818511962890625, 0.3010101318359375, 0.31383514404296875, 0.32666015625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 21.0, 90.0, 167.0, 231.0, 242.0, 137.0, 77.0, 29.0, 6.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.519367218017578, -5.406399250030518, -5.293430805206299, -5.180462837219238, -5.0674943923950195, -4.954526424407959, -4.84155797958374, -4.72859001159668, -4.615621566772461, -4.5026535987854, -4.389685153961182, -4.276717185974121, -4.163748741149902, -4.050780773162842, -3.937812328338623, -3.8248443603515625, -3.711876153945923, -3.598907947540283, -3.4859397411346436, -3.372971534729004, -3.2600033283233643, -3.1470351219177246, -3.034067153930664, -2.9210987091064453, -2.8081307411193848, -2.695162534713745, -2.5821943283081055, -2.469226121902466, -2.356257915496826, -2.2432897090911865, -2.130321502685547, -2.0173535346984863, -1.9043848514556885, -1.7914166450500488, -1.6784484386444092, -1.5654802322387695, -1.4525120258331299, -1.3395438194274902, -1.2265757322311401, -1.1136075258255005, -1.0006393194198608, -0.8876711130142212, -0.7747029066085815, -0.6617347598075867, -0.548766553401947, -0.4357983469963074, -0.3228302001953125, -0.20986199378967285, -0.0968937873840332, 0.01607440412044525, 0.1290425956249237, 0.24201077222824097, 0.3549789786338806, 0.46794718503952026, 0.5809153318405151, 0.6938835382461548, 0.8068517446517944, 0.9198199510574341, 1.0327881574630737, 1.1457562446594238, 1.2587244510650635, 1.3716926574707031, 1.4846608638763428, 1.5976290702819824, 1.710597276687622]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 2.0, 5.0, 6.0, 10.0, 10.0, 9.0, 8.0, 18.0, 12.0, 14.0, 15.0, 24.0, 26.0, 23.0, 23.0, 41.0, 33.0, 32.0, 36.0, 30.0, 44.0, 40.0, 51.0, 42.0, 41.0, 34.0, 40.0, 42.0, 33.0, 27.0, 22.0, 27.0, 29.0, 22.0, 28.0, 13.0, 16.0, 12.0, 11.0, 13.0, 10.0, 7.0, 8.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.7974575161933899, -0.7742125391960144, -0.7509675621986389, -0.7277225852012634, -0.7044776082038879, -0.6812326312065125, -0.657987654209137, -0.6347426772117615, -0.611497700214386, -0.5882527232170105, -0.565007746219635, -0.5417627692222595, -0.518517792224884, -0.49527281522750854, -0.47202783823013306, -0.44878286123275757, -0.42553791403770447, -0.402292937040329, -0.3790479600429535, -0.355802983045578, -0.3325580060482025, -0.309313029050827, -0.2860680818557739, -0.26282310485839844, -0.23957811295986176, -0.21633313596248627, -0.19308815896511078, -0.16984319686889648, -0.146598219871521, -0.12335323542356491, -0.10010826587677002, -0.07686328887939453, -0.05361831188201904, -0.030373336747288704, -0.007128361612558365, 0.016116611659526825, 0.03936158865690231, 0.0626065656542778, 0.08585153520107269, 0.10909651219844818, 0.13234148919582367, 0.15558646619319916, 0.17883144319057465, 0.20207640528678894, 0.22532138228416443, 0.24856635928153992, 0.2718113362789154, 0.2950563132762909, 0.3183012902736664, 0.34154626727104187, 0.36479124426841736, 0.38803622126579285, 0.41128119826316833, 0.4345261752605438, 0.4577711224555969, 0.4810160994529724, 0.5042610764503479, 0.5275060534477234, 0.5507510304450989, 0.5739960074424744, 0.5972409844398499, 0.6204859614372253, 0.6437309384346008, 0.6669759154319763, 0.6902208924293518]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 7.0, 9.0, 13.0, 14.0, 24.0, 28.0, 55.0, 77.0, 118.0, 177.0, 262.0, 448.0, 742.0, 1192.0, 2261.0, 3898.0, 7331.0, 14877.0, 31939.0, 71406.0, 157678.0, 270853.0, 246870.0, 128387.0, 57304.0, 26131.0, 12321.0, 6144.0, 3373.0, 1779.0, 1077.0, 634.0, 383.0, 253.0, 195.0, 77.0, 82.0, 46.0, 35.0, 22.0, 9.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.9306640625, -0.9005126953125, -0.870361328125, -0.8402099609375, -0.81005859375, -0.7799072265625, -0.749755859375, -0.7196044921875, -0.689453125, -0.6593017578125, -0.629150390625, -0.5989990234375, -0.56884765625, -0.5386962890625, -0.508544921875, -0.4783935546875, -0.4482421875, -0.4180908203125, -0.387939453125, -0.3577880859375, -0.32763671875, -0.2974853515625, -0.267333984375, -0.2371826171875, -0.20703125, -0.1768798828125, -0.146728515625, -0.1165771484375, -0.08642578125, -0.0562744140625, -0.026123046875, 0.0040283203125, 0.0341796875, 0.0643310546875, 0.094482421875, 0.1246337890625, 0.15478515625, 0.1849365234375, 0.215087890625, 0.2452392578125, 0.275390625, 0.3055419921875, 0.335693359375, 0.3658447265625, 0.39599609375, 0.4261474609375, 0.456298828125, 0.4864501953125, 0.5166015625, 0.5467529296875, 0.576904296875, 0.6070556640625, 0.63720703125, 0.6673583984375, 0.697509765625, 0.7276611328125, 0.7578125, 0.7879638671875, 0.818115234375, 0.8482666015625, 0.87841796875, 0.9085693359375, 0.938720703125, 0.9688720703125, 0.9990234375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 7.0, 8.0, 11.0, 18.0, 16.0, 10.0, 16.0, 31.0, 32.0, 37.0, 38.0, 41.0, 47.0, 52.0, 59.0, 59.0, 48.0, 62.0, 54.0, 57.0, 46.0, 34.0, 37.0, 28.0, 32.0, 26.0, 16.0, 11.0, 16.0, 12.0, 10.0, 9.0, 2.0, 7.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5341796875, -0.5171279907226562, -0.5000762939453125, -0.48302459716796875, -0.465972900390625, -0.44892120361328125, -0.4318695068359375, -0.41481781005859375, -0.39776611328125, -0.38071441650390625, -0.3636627197265625, -0.34661102294921875, -0.329559326171875, -0.31250762939453125, -0.2954559326171875, -0.27840423583984375, -0.2613525390625, -0.24430084228515625, -0.2272491455078125, -0.21019744873046875, -0.193145751953125, -0.17609405517578125, -0.1590423583984375, -0.14199066162109375, -0.12493896484375, -0.10788726806640625, -0.0908355712890625, -0.07378387451171875, -0.056732177734375, -0.03968048095703125, -0.0226287841796875, -0.00557708740234375, 0.011474609375, 0.02852630615234375, 0.0455780029296875, 0.06262969970703125, 0.079681396484375, 0.09673309326171875, 0.1137847900390625, 0.13083648681640625, 0.14788818359375, 0.16493988037109375, 0.1819915771484375, 0.19904327392578125, 0.216094970703125, 0.23314666748046875, 0.2501983642578125, 0.26725006103515625, 0.2843017578125, 0.30135345458984375, 0.3184051513671875, 0.33545684814453125, 0.352508544921875, 0.36956024169921875, 0.3866119384765625, 0.40366363525390625, 0.42071533203125, 0.43776702880859375, 0.4548187255859375, 0.47187042236328125, 0.488922119140625, 0.5059738159179688, 0.5230255126953125, 0.5400772094726562, 0.55712890625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 5.0, 10.0, 13.0, 24.0, 30.0, 29.0, 59.0, 72.0, 130.0, 214.0, 344.0, 677.0, 1508.0, 3974.0, 14159.0, 79042.0, 529606.0, 353847.0, 49202.0, 10021.0, 2994.0, 1216.0, 565.0, 312.0, 179.0, 99.0, 75.0, 50.0, 36.0, 16.0, 14.0, 8.0, 13.0, 2.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.478515625, -2.409423828125, -2.34033203125, -2.271240234375, -2.2021484375, -2.133056640625, -2.06396484375, -1.994873046875, -1.92578125, -1.856689453125, -1.78759765625, -1.718505859375, -1.6494140625, -1.580322265625, -1.51123046875, -1.442138671875, -1.373046875, -1.303955078125, -1.23486328125, -1.165771484375, -1.0966796875, -1.027587890625, -0.95849609375, -0.889404296875, -0.8203125, -0.751220703125, -0.68212890625, -0.613037109375, -0.5439453125, -0.474853515625, -0.40576171875, -0.336669921875, -0.267578125, -0.198486328125, -0.12939453125, -0.060302734375, 0.0087890625, 0.077880859375, 0.14697265625, 0.216064453125, 0.28515625, 0.354248046875, 0.42333984375, 0.492431640625, 0.5615234375, 0.630615234375, 0.69970703125, 0.768798828125, 0.837890625, 0.906982421875, 0.97607421875, 1.045166015625, 1.1142578125, 1.183349609375, 1.25244140625, 1.321533203125, 1.390625, 1.459716796875, 1.52880859375, 1.597900390625, 1.6669921875, 1.736083984375, 1.80517578125, 1.874267578125, 1.943359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 9.0, 5.0, 10.0, 9.0, 15.0, 18.0, 15.0, 23.0, 23.0, 32.0, 38.0, 38.0, 51.0, 41.0, 49.0, 60.0, 43.0, 58.0, 50.0, 48.0, 43.0, 58.0, 44.0, 39.0, 37.0, 25.0, 18.0, 18.0, 15.0, 11.0, 14.0, 15.0, 12.0, 6.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8671875, -2.789031982421875, -2.71087646484375, -2.632720947265625, -2.5545654296875, -2.476409912109375, -2.39825439453125, -2.320098876953125, -2.241943359375, -2.163787841796875, -2.08563232421875, -2.007476806640625, -1.9293212890625, -1.851165771484375, -1.77301025390625, -1.694854736328125, -1.61669921875, -1.538543701171875, -1.46038818359375, -1.382232666015625, -1.3040771484375, -1.225921630859375, -1.14776611328125, -1.069610595703125, -0.991455078125, -0.913299560546875, -0.83514404296875, -0.756988525390625, -0.6788330078125, -0.600677490234375, -0.52252197265625, -0.444366455078125, -0.3662109375, -0.288055419921875, -0.20989990234375, -0.131744384765625, -0.0535888671875, 0.024566650390625, 0.10272216796875, 0.180877685546875, 0.259033203125, 0.337188720703125, 0.41534423828125, 0.493499755859375, 0.5716552734375, 0.649810791015625, 0.72796630859375, 0.806121826171875, 0.88427734375, 0.962432861328125, 1.04058837890625, 1.118743896484375, 1.1968994140625, 1.275054931640625, 1.35321044921875, 1.431365966796875, 1.509521484375, 1.587677001953125, 1.66583251953125, 1.743988037109375, 1.8221435546875, 1.900299072265625, 1.97845458984375, 2.056610107421875, 2.134765625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 8.0, 13.0, 23.0, 35.0, 42.0, 85.0, 168.0, 373.0, 1198.0, 4844.0, 35516.0, 877468.0, 116884.0, 8941.0, 1988.0, 518.0, 192.0, 103.0, 54.0, 34.0, 24.0, 12.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8681640625, -1.8030242919921875, -1.737884521484375, -1.6727447509765625, -1.60760498046875, -1.5424652099609375, -1.477325439453125, -1.4121856689453125, -1.3470458984375, -1.2819061279296875, -1.216766357421875, -1.1516265869140625, -1.08648681640625, -1.0213470458984375, -0.956207275390625, -0.8910675048828125, -0.825927734375, -0.7607879638671875, -0.695648193359375, -0.6305084228515625, -0.56536865234375, -0.5002288818359375, -0.435089111328125, -0.3699493408203125, -0.3048095703125, -0.2396697998046875, -0.174530029296875, -0.1093902587890625, -0.04425048828125, 0.0208892822265625, 0.086029052734375, 0.1511688232421875, 0.21630859375, 0.2814483642578125, 0.346588134765625, 0.4117279052734375, 0.47686767578125, 0.5420074462890625, 0.607147216796875, 0.6722869873046875, 0.7374267578125, 0.8025665283203125, 0.867706298828125, 0.9328460693359375, 0.99798583984375, 1.0631256103515625, 1.128265380859375, 1.1934051513671875, 1.258544921875, 1.3236846923828125, 1.388824462890625, 1.4539642333984375, 1.51910400390625, 1.5842437744140625, 1.649383544921875, 1.7145233154296875, 1.7796630859375, 1.8448028564453125, 1.909942626953125, 1.9750823974609375, 2.04022216796875, 2.1053619384765625, 2.170501708984375, 2.2356414794921875, 2.30078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 4.0, 8.0, 10.0, 30.0, 24.0, 66.0, 107.0, 158.0, 182.0, 167.0, 110.0, 68.0, 26.0, 18.0, 10.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003380775451660156, -0.00033030658960342407, -0.0003225356340408325, -0.00031476467847824097, -0.0003069937229156494, -0.00029922276735305786, -0.0002914518117904663, -0.00028368085622787476, -0.0002759099006652832, -0.00026813894510269165, -0.0002603679895401001, -0.00025259703397750854, -0.000244826078414917, -0.00023705512285232544, -0.0002292841672897339, -0.00022151321172714233, -0.00021374225616455078, -0.00020597130060195923, -0.00019820034503936768, -0.00019042938947677612, -0.00018265843391418457, -0.00017488747835159302, -0.00016711652278900146, -0.0001593455672264099, -0.00015157461166381836, -0.0001438036561012268, -0.00013603270053863525, -0.0001282617449760437, -0.00012049078941345215, -0.0001127198338508606, -0.00010494887828826904, -9.717792272567749e-05, -8.940696716308594e-05, -8.163601160049438e-05, -7.386505603790283e-05, -6.609410047531128e-05, -5.8323144912719727e-05, -5.0552189350128174e-05, -4.278123378753662e-05, -3.501027822494507e-05, -2.7239322662353516e-05, -1.9468367099761963e-05, -1.169741153717041e-05, -3.926455974578857e-06, 3.844499588012695e-06, 1.1615455150604248e-05, 1.93864107131958e-05, 2.7157366275787354e-05, 3.4928321838378906e-05, 4.269927740097046e-05, 5.047023296356201e-05, 5.8241188526153564e-05, 6.601214408874512e-05, 7.378309965133667e-05, 8.155405521392822e-05, 8.932501077651978e-05, 9.709596633911133e-05, 0.00010486692190170288, 0.00011263787746429443, 0.00012040883302688599, 0.00012817978858947754, 0.0001359507441520691, 0.00014372169971466064, 0.0001514926552772522, 0.00015926361083984375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 10.0, 6.0, 12.0, 18.0, 20.0, 34.0, 57.0, 58.0, 117.0, 199.0, 447.0, 1229.0, 4327.0, 23546.0, 599909.0, 394944.0, 18061.0, 3575.0, 1099.0, 398.0, 161.0, 98.0, 90.0, 46.0, 23.0, 16.0, 13.0, 11.0, 10.0, 6.0, 4.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.15625, -2.10357666015625, -2.0509033203125, -1.99822998046875, -1.945556640625, -1.89288330078125, -1.8402099609375, -1.78753662109375, -1.73486328125, -1.68218994140625, -1.6295166015625, -1.57684326171875, -1.524169921875, -1.47149658203125, -1.4188232421875, -1.36614990234375, -1.3134765625, -1.26080322265625, -1.2081298828125, -1.15545654296875, -1.102783203125, -1.05010986328125, -0.9974365234375, -0.94476318359375, -0.89208984375, -0.83941650390625, -0.7867431640625, -0.73406982421875, -0.681396484375, -0.62872314453125, -0.5760498046875, -0.52337646484375, -0.470703125, -0.41802978515625, -0.3653564453125, -0.31268310546875, -0.260009765625, -0.20733642578125, -0.1546630859375, -0.10198974609375, -0.04931640625, 0.00335693359375, 0.0560302734375, 0.10870361328125, 0.161376953125, 0.21405029296875, 0.2667236328125, 0.31939697265625, 0.3720703125, 0.42474365234375, 0.4774169921875, 0.53009033203125, 0.582763671875, 0.63543701171875, 0.6881103515625, 0.74078369140625, 0.79345703125, 0.84613037109375, 0.8988037109375, 0.95147705078125, 1.004150390625, 1.05682373046875, 1.1094970703125, 1.16217041015625, 1.21484375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 8.0, 9.0, 6.0, 15.0, 27.0, 83.0, 142.0, 191.0, 177.0, 136.0, 89.0, 49.0, 30.0, 12.0, 10.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.337890625, -3.266998291015625, -3.19610595703125, -3.125213623046875, -3.0543212890625, -2.983428955078125, -2.91253662109375, -2.841644287109375, -2.770751953125, -2.699859619140625, -2.62896728515625, -2.558074951171875, -2.4871826171875, -2.416290283203125, -2.34539794921875, -2.274505615234375, -2.20361328125, -2.132720947265625, -2.06182861328125, -1.990936279296875, -1.9200439453125, -1.849151611328125, -1.77825927734375, -1.707366943359375, -1.636474609375, -1.565582275390625, -1.49468994140625, -1.423797607421875, -1.3529052734375, -1.282012939453125, -1.21112060546875, -1.140228271484375, -1.0693359375, -0.998443603515625, -0.92755126953125, -0.856658935546875, -0.7857666015625, -0.714874267578125, -0.64398193359375, -0.573089599609375, -0.502197265625, -0.431304931640625, -0.36041259765625, -0.289520263671875, -0.2186279296875, -0.147735595703125, -0.07684326171875, -0.005950927734375, 0.06494140625, 0.135833740234375, 0.20672607421875, 0.277618408203125, 0.3485107421875, 0.419403076171875, 0.49029541015625, 0.561187744140625, 0.632080078125, 0.702972412109375, 0.77386474609375, 0.844757080078125, 0.9156494140625, 0.986541748046875, 1.05743408203125, 1.128326416015625, 1.19921875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 9.0, 14.0, 38.0, 87.0, 169.0, 237.0, 192.0, 149.0, 55.0, 26.0, 16.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.055191040039062, -18.141637802124023, -17.228084564208984, -16.314531326293945, -15.400978088378906, -14.487424850463867, -13.573872566223145, -12.660319328308105, -11.746766090393066, -10.833212852478027, -9.919659614562988, -9.006107330322266, -8.092554092407227, -7.179000377655029, -6.265447616577148, -5.351894378662109, -4.43834114074707, -3.5247879028320312, -2.6112349033355713, -1.6976819038391113, -0.7841286659240723, 0.1294245719909668, 1.0429773330688477, 1.9565305709838867, 2.870083808898926, 3.783637046813965, 4.697190284729004, 5.610743045806885, 6.524296283721924, 7.437849521636963, 8.351402282714844, 9.264955520629883, 10.178508758544922, 11.092061996459961, 12.005615234375, 12.919168472290039, 13.832721710205078, 14.746274948120117, 15.65982723236084, 16.573379516601562, 17.486934661865234, 18.400487899780273, 19.314041137695312, 20.22759437561035, 21.14114761352539, 22.05470085144043, 22.96825408935547, 23.881805419921875, 24.795358657836914, 25.708911895751953, 26.622465133666992, 27.53601837158203, 28.44957160949707, 29.36312484741211, 30.276676177978516, 31.190231323242188, 32.103782653808594, 33.017333984375, 33.93088912963867, 34.84444046020508, 35.75799560546875, 36.671546936035156, 37.58510208129883, 38.498653411865234, 39.412208557128906]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 5.0, 2.0, 5.0, 14.0, 11.0, 11.0, 9.0, 21.0, 16.0, 30.0, 39.0, 30.0, 34.0, 38.0, 54.0, 59.0, 43.0, 51.0, 57.0, 50.0, 42.0, 53.0, 33.0, 41.0, 41.0, 23.0, 28.0, 24.0, 33.0, 24.0, 19.0, 14.0, 15.0, 5.0, 7.0, 6.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.899551391601562, -11.535235404968262, -11.170919418334961, -10.806602478027344, -10.442286491394043, -10.077970504760742, -9.713654518127441, -9.34933853149414, -8.985021591186523, -8.620705604553223, -8.256389617919922, -7.892073154449463, -7.527756690979004, -7.163440704345703, -6.799124717712402, -6.434808731079102, -6.070492744445801, -5.7061767578125, -5.341860294342041, -4.97754430770874, -4.613227844238281, -4.2489118576049805, -3.8845958709716797, -3.5202796459198, -3.15596342086792, -2.79164719581604, -2.42733097076416, -2.0630149841308594, -1.6986987590789795, -1.3343825340270996, -0.9700665473937988, -0.605750322341919, -0.24143505096435547, 0.12288111448287964, 0.48719727993011475, 0.8515133857727051, 1.215829610824585, 1.5801458358764648, 1.9444618225097656, 2.3087780475616455, 2.6730942726135254, 3.0374104976654053, 3.401726722717285, 3.766042709350586, 4.130358695983887, 4.494675159454346, 4.8589911460876465, 5.2233076095581055, 5.587623596191406, 5.951939582824707, 6.316256046295166, 6.680572032928467, 7.044888496398926, 7.409204483032227, 7.773520469665527, 8.137836456298828, 8.502153396606445, 8.866469383239746, 9.230785369873047, 9.595102310180664, 9.959418296813965, 10.323734283447266, 10.688050270080566, 11.052366256713867, 11.416682243347168]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 9.0, 11.0, 17.0, 25.0, 47.0, 43.0, 74.0, 142.0, 196.0, 400.0, 759.0, 1438.0, 3298.0, 9382.0, 54131.0, 4095279.0, 19096.0, 5416.0, 2199.0, 1022.0, 500.0, 298.0, 172.0, 114.0, 74.0, 45.0, 32.0, 16.0, 19.0, 14.0, 1.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.248046875, -2.168487548828125, -2.08892822265625, -2.009368896484375, -1.9298095703125, -1.850250244140625, -1.77069091796875, -1.691131591796875, -1.611572265625, -1.532012939453125, -1.45245361328125, -1.372894287109375, -1.2933349609375, -1.213775634765625, -1.13421630859375, -1.054656982421875, -0.97509765625, -0.895538330078125, -0.81597900390625, -0.736419677734375, -0.6568603515625, -0.577301025390625, -0.49774169921875, -0.418182373046875, -0.338623046875, -0.259063720703125, -0.17950439453125, -0.099945068359375, -0.0203857421875, 0.059173583984375, 0.13873291015625, 0.218292236328125, 0.2978515625, 0.377410888671875, 0.45697021484375, 0.536529541015625, 0.6160888671875, 0.695648193359375, 0.77520751953125, 0.854766845703125, 0.934326171875, 1.013885498046875, 1.09344482421875, 1.173004150390625, 1.2525634765625, 1.332122802734375, 1.41168212890625, 1.491241455078125, 1.57080078125, 1.650360107421875, 1.72991943359375, 1.809478759765625, 1.8890380859375, 1.968597412109375, 2.04815673828125, 2.127716064453125, 2.207275390625, 2.286834716796875, 2.36639404296875, 2.445953369140625, 2.5255126953125, 2.605072021484375, 2.68463134765625, 2.764190673828125, 2.84375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 7.0, 7.0, 10.0, 17.0, 24.0, 35.0, 34.0, 50.0, 80.0, 79.0, 108.0, 108.0, 98.0, 81.0, 73.0, 59.0, 45.0, 33.0, 22.0, 17.0, 5.0, 3.0, 3.0, 9.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0107421875, -0.9796981811523438, -0.9486541748046875, -0.9176101684570312, -0.886566162109375, -0.8555221557617188, -0.8244781494140625, -0.7934341430664062, -0.76239013671875, -0.7313461303710938, -0.7003021240234375, -0.6692581176757812, -0.638214111328125, -0.6071701049804688, -0.5761260986328125, -0.5450820922851562, -0.5140380859375, -0.48299407958984375, -0.4519500732421875, -0.42090606689453125, -0.389862060546875, -0.35881805419921875, -0.3277740478515625, -0.29673004150390625, -0.26568603515625, -0.23464202880859375, -0.2035980224609375, -0.17255401611328125, -0.141510009765625, -0.11046600341796875, -0.0794219970703125, -0.04837799072265625, -0.017333984375, 0.01371002197265625, 0.0447540283203125, 0.07579803466796875, 0.106842041015625, 0.13788604736328125, 0.1689300537109375, 0.19997406005859375, 0.23101806640625, 0.26206207275390625, 0.2931060791015625, 0.32415008544921875, 0.355194091796875, 0.38623809814453125, 0.4172821044921875, 0.44832611083984375, 0.4793701171875, 0.5104141235351562, 0.5414581298828125, 0.5725021362304688, 0.603546142578125, 0.6345901489257812, 0.6656341552734375, 0.6966781616210938, 0.72772216796875, 0.7587661743164062, 0.7898101806640625, 0.8208541870117188, 0.851898193359375, 0.8829421997070312, 0.9139862060546875, 0.9450302124023438, 0.97607421875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 7.0, 10.0, 9.0, 11.0, 33.0, 35.0, 71.0, 74.0, 104.0, 177.0, 252.0, 471.0, 1065.0, 2525.0, 7156.0, 29387.0, 4053305.0, 79791.0, 12600.0, 3941.0, 1520.0, 723.0, 340.0, 203.0, 133.0, 100.0, 68.0, 50.0, 42.0, 29.0, 17.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.984375, -2.9052734375, -2.826171875, -2.7470703125, -2.66796875, -2.5888671875, -2.509765625, -2.4306640625, -2.3515625, -2.2724609375, -2.193359375, -2.1142578125, -2.03515625, -1.9560546875, -1.876953125, -1.7978515625, -1.71875, -1.6396484375, -1.560546875, -1.4814453125, -1.40234375, -1.3232421875, -1.244140625, -1.1650390625, -1.0859375, -1.0068359375, -0.927734375, -0.8486328125, -0.76953125, -0.6904296875, -0.611328125, -0.5322265625, -0.453125, -0.3740234375, -0.294921875, -0.2158203125, -0.13671875, -0.0576171875, 0.021484375, 0.1005859375, 0.1796875, 0.2587890625, 0.337890625, 0.4169921875, 0.49609375, 0.5751953125, 0.654296875, 0.7333984375, 0.8125, 0.8916015625, 0.970703125, 1.0498046875, 1.12890625, 1.2080078125, 1.287109375, 1.3662109375, 1.4453125, 1.5244140625, 1.603515625, 1.6826171875, 1.76171875, 1.8408203125, 1.919921875, 1.9990234375, 2.078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 8.0, 13.0, 15.0, 30.0, 66.0, 3743.0, 104.0, 42.0, 22.0, 14.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.393310546875, -0.3697242736816406, -0.34613800048828125, -0.3225517272949219, -0.2989654541015625, -0.2753791809082031, -0.25179290771484375, -0.22820663452148438, -0.204620361328125, -0.18103408813476562, -0.15744781494140625, -0.13386154174804688, -0.1102752685546875, -0.08668899536132812, -0.06310272216796875, -0.039516448974609375, -0.01593017578125, 0.007656097412109375, 0.03124237060546875, 0.054828643798828125, 0.0784149169921875, 0.10200119018554688, 0.12558746337890625, 0.14917373657226562, 0.172760009765625, 0.19634628295898438, 0.21993255615234375, 0.24351882934570312, 0.2671051025390625, 0.2906913757324219, 0.31427764892578125, 0.3378639221191406, 0.3614501953125, 0.3850364685058594, 0.40862274169921875, 0.4322090148925781, 0.4557952880859375, 0.4793815612792969, 0.5029678344726562, 0.5265541076660156, 0.550140380859375, 0.5737266540527344, 0.5973129272460938, 0.6208992004394531, 0.6444854736328125, 0.6680717468261719, 0.6916580200195312, 0.7152442932128906, 0.73883056640625, 0.7624168395996094, 0.7860031127929688, 0.8095893859863281, 0.8331756591796875, 0.8567619323730469, 0.8803482055664062, 0.9039344787597656, 0.927520751953125, 0.9511070251464844, 0.9746932983398438, 0.9982795715332031, 1.0218658447265625, 1.0454521179199219, 1.0690383911132812, 1.0926246643066406, 1.1162109375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 13.0, 37.0, 140.0, 343.0, 275.0, 138.0, 43.0, 20.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.988763332366943, -5.83800745010376, -5.687251567840576, -5.536495685577393, -5.385740280151367, -5.234984397888184, -5.084228515625, -4.933472633361816, -4.782716751098633, -4.631960868835449, -4.481204986572266, -4.330449104309082, -4.179693222045898, -4.028937816619873, -3.8781819343566895, -3.727426052093506, -3.5766701698303223, -3.4259142875671387, -3.275158405303955, -3.1244027614593506, -2.973646879196167, -2.8228909969329834, -2.672135353088379, -2.5213794708251953, -2.3706235885620117, -2.219867706298828, -2.0691118240356445, -1.91835618019104, -1.7676002979278564, -1.6168444156646729, -1.4660886526107788, -1.3153328895568848, -1.164576530456543, -1.0138206481933594, -0.8630648851394653, -0.7123090624809265, -0.5615532398223877, -0.4107974171638489, -0.26004159450531006, -0.10928583145141602, 0.04147005081176758, 0.1922258734703064, 0.3429816961288452, 0.49373751878738403, 0.6444933414459229, 0.7952491641044617, 0.9460049867630005, 1.0967607498168945, 1.2475166320800781, 1.3982725143432617, 1.5490282773971558, 1.6997840404510498, 1.8505399227142334, 2.001295804977417, 2.1520514488220215, 2.302807331085205, 2.4535632133483887, 2.6043190956115723, 2.755074977874756, 2.9058306217193604, 3.056586503982544, 3.2073423862457275, 3.358098030090332, 3.5088539123535156, 3.659609794616699]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 4.0, 8.0, 6.0, 14.0, 6.0, 11.0, 23.0, 21.0, 27.0, 29.0, 17.0, 45.0, 43.0, 40.0, 39.0, 41.0, 38.0, 44.0, 42.0, 34.0, 39.0, 33.0, 46.0, 33.0, 41.0, 40.0, 27.0, 25.0, 27.0, 26.0, 20.0, 25.0, 17.0, 11.0, 12.0, 6.0, 11.0, 7.0, 8.0, 2.0, 2.0, 0.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.998574435710907, -0.9680328369140625, -0.9374912977218628, -0.9069497585296631, -0.8764081597328186, -0.8458665609359741, -0.8153250217437744, -0.7847834825515747, -0.7542418837547302, -0.7237002849578857, -0.693158745765686, -0.6626172065734863, -0.6320756077766418, -0.6015340089797974, -0.5709924697875977, -0.540450930595398, -0.5099093317985535, -0.47936776280403137, -0.4488261938095093, -0.4182846248149872, -0.3877430558204651, -0.357201486825943, -0.3266599178314209, -0.2961183488368988, -0.2655767798423767, -0.23503521084785461, -0.20449364185333252, -0.17395207285881042, -0.14341050386428833, -0.11286893486976624, -0.08232736587524414, -0.051785796880722046, -0.02124422788619995, 0.009297341108322144, 0.03983891010284424, 0.07038047909736633, 0.10092204809188843, 0.13146361708641052, 0.16200518608093262, 0.1925467550754547, 0.2230883240699768, 0.2536298930644989, 0.284171462059021, 0.3147130310535431, 0.3452546000480652, 0.3757961690425873, 0.4063377380371094, 0.43687930703163147, 0.46742087602615356, 0.49796244502067566, 0.5285040140151978, 0.5590455532073975, 0.5895871520042419, 0.6201287508010864, 0.6506702899932861, 0.6812118291854858, 0.7117534279823303, 0.7422950267791748, 0.7728365659713745, 0.8033781051635742, 0.8339197039604187, 0.8644613027572632, 0.8950028419494629, 0.9255443811416626, 0.9560859799385071]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 6.0, 11.0, 9.0, 33.0, 35.0, 53.0, 91.0, 193.0, 352.0, 746.0, 1516.0, 3649.0, 10522.0, 37583.0, 176774.0, 519201.0, 229328.0, 47665.0, 12790.0, 4449.0, 1823.0, 815.0, 410.0, 195.0, 132.0, 65.0, 36.0, 17.0, 22.0, 10.0, 10.0, 7.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.1640625, -2.0996246337890625, -2.035186767578125, -1.9707489013671875, -1.90631103515625, -1.8418731689453125, -1.777435302734375, -1.7129974365234375, -1.6485595703125, -1.5841217041015625, -1.519683837890625, -1.4552459716796875, -1.39080810546875, -1.3263702392578125, -1.261932373046875, -1.1974945068359375, -1.133056640625, -1.0686187744140625, -1.004180908203125, -0.9397430419921875, -0.87530517578125, -0.8108673095703125, -0.746429443359375, -0.6819915771484375, -0.6175537109375, -0.5531158447265625, -0.488677978515625, -0.4242401123046875, -0.35980224609375, -0.2953643798828125, -0.230926513671875, -0.1664886474609375, -0.10205078125, -0.0376129150390625, 0.026824951171875, 0.0912628173828125, 0.15570068359375, 0.2201385498046875, 0.284576416015625, 0.3490142822265625, 0.4134521484375, 0.4778900146484375, 0.542327880859375, 0.6067657470703125, 0.67120361328125, 0.7356414794921875, 0.800079345703125, 0.8645172119140625, 0.928955078125, 0.9933929443359375, 1.057830810546875, 1.1222686767578125, 1.18670654296875, 1.2511444091796875, 1.315582275390625, 1.3800201416015625, 1.4444580078125, 1.5088958740234375, 1.573333740234375, 1.6377716064453125, 1.70220947265625, 1.7666473388671875, 1.831085205078125, 1.8955230712890625, 1.9599609375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 11.0, 13.0, 6.0, 18.0, 25.0, 39.0, 45.0, 62.0, 75.0, 89.0, 92.0, 104.0, 94.0, 70.0, 69.0, 62.0, 37.0, 29.0, 25.0, 14.0, 10.0, 8.0, 5.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.0931854248046875, -1.060394287109375, -1.0276031494140625, -0.99481201171875, -0.9620208740234375, -0.929229736328125, -0.8964385986328125, -0.8636474609375, -0.8308563232421875, -0.798065185546875, -0.7652740478515625, -0.73248291015625, -0.6996917724609375, -0.666900634765625, -0.6341094970703125, -0.601318359375, -0.5685272216796875, -0.535736083984375, -0.5029449462890625, -0.47015380859375, -0.4373626708984375, -0.404571533203125, -0.3717803955078125, -0.3389892578125, -0.3061981201171875, -0.273406982421875, -0.2406158447265625, -0.20782470703125, -0.1750335693359375, -0.142242431640625, -0.1094512939453125, -0.07666015625, -0.0438690185546875, -0.011077880859375, 0.0217132568359375, 0.05450439453125, 0.0872955322265625, 0.120086669921875, 0.1528778076171875, 0.1856689453125, 0.2184600830078125, 0.251251220703125, 0.2840423583984375, 0.31683349609375, 0.3496246337890625, 0.382415771484375, 0.4152069091796875, 0.447998046875, 0.4807891845703125, 0.513580322265625, 0.5463714599609375, 0.57916259765625, 0.6119537353515625, 0.644744873046875, 0.6775360107421875, 0.7103271484375, 0.7431182861328125, 0.775909423828125, 0.8087005615234375, 0.84149169921875, 0.8742828369140625, 0.907073974609375, 0.9398651123046875, 0.97265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 11.0, 21.0, 23.0, 53.0, 85.0, 169.0, 262.0, 532.0, 1233.0, 3648.0, 18914.0, 259042.0, 701770.0, 52358.0, 6961.0, 1917.0, 739.0, 335.0, 214.0, 108.0, 54.0, 39.0, 27.0, 17.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.296875, -3.1976318359375, -3.098388671875, -2.9991455078125, -2.89990234375, -2.8006591796875, -2.701416015625, -2.6021728515625, -2.5029296875, -2.4036865234375, -2.304443359375, -2.2052001953125, -2.10595703125, -2.0067138671875, -1.907470703125, -1.8082275390625, -1.708984375, -1.6097412109375, -1.510498046875, -1.4112548828125, -1.31201171875, -1.2127685546875, -1.113525390625, -1.0142822265625, -0.9150390625, -0.8157958984375, -0.716552734375, -0.6173095703125, -0.51806640625, -0.4188232421875, -0.319580078125, -0.2203369140625, -0.12109375, -0.0218505859375, 0.077392578125, 0.1766357421875, 0.27587890625, 0.3751220703125, 0.474365234375, 0.5736083984375, 0.6728515625, 0.7720947265625, 0.871337890625, 0.9705810546875, 1.06982421875, 1.1690673828125, 1.268310546875, 1.3675537109375, 1.466796875, 1.5660400390625, 1.665283203125, 1.7645263671875, 1.86376953125, 1.9630126953125, 2.062255859375, 2.1614990234375, 2.2607421875, 2.3599853515625, 2.459228515625, 2.5584716796875, 2.65771484375, 2.7569580078125, 2.856201171875, 2.9554443359375, 3.0546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 8.0, 8.0, 3.0, 12.0, 13.0, 13.0, 21.0, 23.0, 26.0, 26.0, 44.0, 47.0, 51.0, 55.0, 56.0, 50.0, 44.0, 68.0, 63.0, 50.0, 55.0, 38.0, 46.0, 30.0, 35.0, 27.0, 15.0, 18.0, 10.0, 16.0, 11.0, 6.0, 6.0, 5.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.703125, -2.607452392578125, -2.51177978515625, -2.416107177734375, -2.3204345703125, -2.224761962890625, -2.12908935546875, -2.033416748046875, -1.937744140625, -1.842071533203125, -1.74639892578125, -1.650726318359375, -1.5550537109375, -1.459381103515625, -1.36370849609375, -1.268035888671875, -1.17236328125, -1.076690673828125, -0.98101806640625, -0.885345458984375, -0.7896728515625, -0.694000244140625, -0.59832763671875, -0.502655029296875, -0.406982421875, -0.311309814453125, -0.21563720703125, -0.119964599609375, -0.0242919921875, 0.071380615234375, 0.16705322265625, 0.262725830078125, 0.3583984375, 0.454071044921875, 0.54974365234375, 0.645416259765625, 0.7410888671875, 0.836761474609375, 0.93243408203125, 1.028106689453125, 1.123779296875, 1.219451904296875, 1.31512451171875, 1.410797119140625, 1.5064697265625, 1.602142333984375, 1.69781494140625, 1.793487548828125, 1.88916015625, 1.984832763671875, 2.08050537109375, 2.176177978515625, 2.2718505859375, 2.367523193359375, 2.46319580078125, 2.558868408203125, 2.654541015625, 2.750213623046875, 2.84588623046875, 2.941558837890625, 3.0372314453125, 3.132904052734375, 3.22857666015625, 3.324249267578125, 3.419921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 1.0, 4.0, 5.0, 10.0, 15.0, 21.0, 51.0, 82.0, 176.0, 428.0, 1141.0, 4139.0, 35126.0, 930754.0, 68601.0, 5718.0, 1398.0, 468.0, 193.0, 99.0, 50.0, 23.0, 15.0, 16.0, 5.0, 7.0, 2.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.255859375, -3.1756591796875, -3.095458984375, -3.0152587890625, -2.93505859375, -2.8548583984375, -2.774658203125, -2.6944580078125, -2.6142578125, -2.5340576171875, -2.453857421875, -2.3736572265625, -2.29345703125, -2.2132568359375, -2.133056640625, -2.0528564453125, -1.97265625, -1.8924560546875, -1.812255859375, -1.7320556640625, -1.65185546875, -1.5716552734375, -1.491455078125, -1.4112548828125, -1.3310546875, -1.2508544921875, -1.170654296875, -1.0904541015625, -1.01025390625, -0.9300537109375, -0.849853515625, -0.7696533203125, -0.689453125, -0.6092529296875, -0.529052734375, -0.4488525390625, -0.36865234375, -0.2884521484375, -0.208251953125, -0.1280517578125, -0.0478515625, 0.0323486328125, 0.112548828125, 0.1927490234375, 0.27294921875, 0.3531494140625, 0.433349609375, 0.5135498046875, 0.59375, 0.6739501953125, 0.754150390625, 0.8343505859375, 0.91455078125, 0.9947509765625, 1.074951171875, 1.1551513671875, 1.2353515625, 1.3155517578125, 1.395751953125, 1.4759521484375, 1.55615234375, 1.6363525390625, 1.716552734375, 1.7967529296875, 1.876953125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 8.0, 9.0, 7.0, 24.0, 43.0, 70.0, 137.0, 204.0, 207.0, 135.0, 84.0, 36.0, 16.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000324249267578125, -0.00031340867280960083, -0.00030256807804107666, -0.0002917274832725525, -0.0002808868885040283, -0.00027004629373550415, -0.00025920569896698, -0.0002483651041984558, -0.00023752450942993164, -0.00022668391466140747, -0.0002158433198928833, -0.00020500272512435913, -0.00019416213035583496, -0.0001833215355873108, -0.00017248094081878662, -0.00016164034605026245, -0.00015079975128173828, -0.0001399591565132141, -0.00012911856174468994, -0.00011827796697616577, -0.0001074373722076416, -9.659677743911743e-05, -8.575618267059326e-05, -7.491558790206909e-05, -6.407499313354492e-05, -5.323439836502075e-05, -4.239380359649658e-05, -3.155320882797241e-05, -2.0712614059448242e-05, -9.872019290924072e-06, 9.685754776000977e-07, 1.1809170246124268e-05, 2.2649765014648438e-05, 3.349035978317261e-05, 4.433095455169678e-05, 5.517154932022095e-05, 6.601214408874512e-05, 7.685273885726929e-05, 8.769333362579346e-05, 9.853392839431763e-05, 0.0001093745231628418, 0.00012021511793136597, 0.00013105571269989014, 0.0001418963074684143, 0.00015273690223693848, 0.00016357749700546265, 0.00017441809177398682, 0.00018525868654251099, 0.00019609928131103516, 0.00020693987607955933, 0.0002177804708480835, 0.00022862106561660767, 0.00023946166038513184, 0.000250302255153656, 0.0002611428499221802, 0.00027198344469070435, 0.0002828240394592285, 0.0002936646342277527, 0.00030450522899627686, 0.000315345823764801, 0.0003261864185333252, 0.00033702701330184937, 0.00034786760807037354, 0.0003587082028388977, 0.0003695487976074219]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 5.0, 5.0, 4.0, 11.0, 14.0, 18.0, 14.0, 30.0, 39.0, 83.0, 107.0, 176.0, 288.0, 488.0, 924.0, 1735.0, 3686.0, 9150.0, 35437.0, 422761.0, 515914.0, 39976.0, 9954.0, 3828.0, 1683.0, 935.0, 491.0, 269.0, 184.0, 113.0, 75.0, 42.0, 41.0, 25.0, 12.0, 8.0, 11.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-1.515625, -1.474700927734375, -1.43377685546875, -1.392852783203125, -1.3519287109375, -1.311004638671875, -1.27008056640625, -1.229156494140625, -1.188232421875, -1.147308349609375, -1.10638427734375, -1.065460205078125, -1.0245361328125, -0.983612060546875, -0.94268798828125, -0.901763916015625, -0.86083984375, -0.819915771484375, -0.77899169921875, -0.738067626953125, -0.6971435546875, -0.656219482421875, -0.61529541015625, -0.574371337890625, -0.533447265625, -0.492523193359375, -0.45159912109375, -0.410675048828125, -0.3697509765625, -0.328826904296875, -0.28790283203125, -0.246978759765625, -0.2060546875, -0.165130615234375, -0.12420654296875, -0.083282470703125, -0.0423583984375, -0.001434326171875, 0.03948974609375, 0.080413818359375, 0.121337890625, 0.162261962890625, 0.20318603515625, 0.244110107421875, 0.2850341796875, 0.325958251953125, 0.36688232421875, 0.407806396484375, 0.44873046875, 0.489654541015625, 0.53057861328125, 0.571502685546875, 0.6124267578125, 0.653350830078125, 0.69427490234375, 0.735198974609375, 0.776123046875, 0.817047119140625, 0.85797119140625, 0.898895263671875, 0.9398193359375, 0.980743408203125, 1.02166748046875, 1.062591552734375, 1.103515625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 7.0, 4.0, 4.0, 6.0, 11.0, 14.0, 36.0, 65.0, 137.0, 171.0, 203.0, 142.0, 77.0, 47.0, 15.0, 6.0, 14.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.37109375, -2.28717041015625, -2.2032470703125, -2.11932373046875, -2.035400390625, -1.95147705078125, -1.8675537109375, -1.78363037109375, -1.69970703125, -1.61578369140625, -1.5318603515625, -1.44793701171875, -1.364013671875, -1.28009033203125, -1.1961669921875, -1.11224365234375, -1.0283203125, -0.94439697265625, -0.8604736328125, -0.77655029296875, -0.692626953125, -0.60870361328125, -0.5247802734375, -0.44085693359375, -0.35693359375, -0.27301025390625, -0.1890869140625, -0.10516357421875, -0.021240234375, 0.06268310546875, 0.1466064453125, 0.23052978515625, 0.314453125, 0.39837646484375, 0.4822998046875, 0.56622314453125, 0.650146484375, 0.73406982421875, 0.8179931640625, 0.90191650390625, 0.98583984375, 1.06976318359375, 1.1536865234375, 1.23760986328125, 1.321533203125, 1.40545654296875, 1.4893798828125, 1.57330322265625, 1.6572265625, 1.74114990234375, 1.8250732421875, 1.90899658203125, 1.992919921875, 2.07684326171875, 2.1607666015625, 2.24468994140625, 2.32861328125, 2.41253662109375, 2.4964599609375, 2.58038330078125, 2.664306640625, 2.74822998046875, 2.8321533203125, 2.91607666015625, 3.0]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 11.0, 20.0, 28.0, 64.0, 106.0, 138.0, 144.0, 143.0, 118.0, 78.0, 63.0, 36.0, 32.0, 11.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.128128051757812, -23.487226486206055, -22.846324920654297, -22.20542335510254, -21.56452178955078, -20.923620223999023, -20.282718658447266, -19.641815185546875, -19.00091552734375, -18.360013961791992, -17.719112396240234, -17.078210830688477, -16.43730926513672, -15.796407699584961, -15.155505180358887, -14.514603614807129, -13.873701095581055, -13.232799530029297, -12.591897964477539, -11.950996398925781, -11.310094833374023, -10.669193267822266, -10.028290748596191, -9.387389183044434, -8.746487617492676, -8.105586051940918, -7.46468448638916, -6.823782444000244, -6.182880878448486, -5.5419793128967285, -4.9010772705078125, -4.260175704956055, -3.619274139404297, -2.978372573852539, -2.337470769882202, -1.6965690851211548, -1.0556674003601074, -0.4147658348083496, 0.2261359691619873, 0.8670377731323242, 1.507939338684082, 2.14884090423584, 2.7897427082061768, 3.4306445121765137, 4.0715460777282715, 4.712447643280029, 5.353349685668945, 5.994251251220703, 6.635152816772461, 7.276054382324219, 7.916955947875977, 8.557857513427734, 9.198759078979492, 9.83966064453125, 10.480563163757324, 11.121464729309082, 11.76236629486084, 12.403267860412598, 13.044169425964355, 13.685070991516113, 14.325973510742188, 14.966875076293945, 15.607776641845703, 16.24867820739746, 16.88957977294922]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 5.0, 1.0, 4.0, 5.0, 3.0, 7.0, 9.0, 10.0, 14.0, 13.0, 18.0, 15.0, 21.0, 32.0, 36.0, 31.0, 19.0, 34.0, 23.0, 53.0, 36.0, 43.0, 39.0, 51.0, 43.0, 31.0, 34.0, 37.0, 43.0, 31.0, 32.0, 29.0, 19.0, 16.0, 27.0, 27.0, 14.0, 13.0, 19.0, 12.0, 13.0, 14.0, 8.0, 4.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-12.500033378601074, -12.127107620239258, -11.754181861877441, -11.381256103515625, -11.008330345153809, -10.635404586791992, -10.26247787475586, -9.88955307006836, -9.516626358032227, -9.14370059967041, -8.770774841308594, -8.397849082946777, -8.024923324584961, -7.6519975662231445, -7.27907133102417, -6.9061455726623535, -6.533220291137695, -6.160294532775879, -5.7873687744140625, -5.414443016052246, -5.04151725769043, -4.668591499328613, -4.295665264129639, -3.9227395057678223, -3.549813747406006, -3.1768879890441895, -2.803962230682373, -2.4310362339019775, -2.058110475540161, -1.6851847171783447, -1.3122587203979492, -0.9393329620361328, -0.5664081573486328, -0.19348233938217163, 0.17944347858428955, 0.5523693561553955, 0.9252951145172119, 1.2982208728790283, 1.6711468696594238, 2.0440726280212402, 2.4169983863830566, 2.789924144744873, 3.1628499031066895, 3.535775899887085, 3.9087016582489014, 4.281627655029297, 4.654553413391113, 5.02747917175293, 5.400404930114746, 5.7733306884765625, 6.146256446838379, 6.519182205200195, 6.892107963562012, 7.265033721923828, 7.637959957122803, 8.010885238647461, 8.383811950683594, 8.75673770904541, 9.129663467407227, 9.502589225769043, 9.87551498413086, 10.248440742492676, 10.621366500854492, 10.994293212890625, 11.367218017578125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 9.0, 3.0, 3.0, 3.0, 8.0, 7.0, 17.0, 27.0, 24.0, 33.0, 53.0, 78.0, 130.0, 244.0, 352.0, 753.0, 1698.0, 4619.0, 16677.0, 115503.0, 3993591.0, 45691.0, 9351.0, 2974.0, 1166.0, 521.0, 252.0, 152.0, 101.0, 68.0, 43.0, 33.0, 27.0, 18.0, 12.0, 10.0, 3.0, 6.0, 5.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.68359375, -2.6053466796875, -2.527099609375, -2.4488525390625, -2.37060546875, -2.2923583984375, -2.214111328125, -2.1358642578125, -2.0576171875, -1.9793701171875, -1.901123046875, -1.8228759765625, -1.74462890625, -1.6663818359375, -1.588134765625, -1.5098876953125, -1.431640625, -1.3533935546875, -1.275146484375, -1.1968994140625, -1.11865234375, -1.0404052734375, -0.962158203125, -0.8839111328125, -0.8056640625, -0.7274169921875, -0.649169921875, -0.5709228515625, -0.49267578125, -0.4144287109375, -0.336181640625, -0.2579345703125, -0.1796875, -0.1014404296875, -0.023193359375, 0.0550537109375, 0.13330078125, 0.2115478515625, 0.289794921875, 0.3680419921875, 0.4462890625, 0.5245361328125, 0.602783203125, 0.6810302734375, 0.75927734375, 0.8375244140625, 0.915771484375, 0.9940185546875, 1.072265625, 1.1505126953125, 1.228759765625, 1.3070068359375, 1.38525390625, 1.4635009765625, 1.541748046875, 1.6199951171875, 1.6982421875, 1.7764892578125, 1.854736328125, 1.9329833984375, 2.01123046875, 2.0894775390625, 2.167724609375, 2.2459716796875, 2.32421875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 6.0, 17.0, 19.0, 25.0, 29.0, 35.0, 48.0, 48.0, 47.0, 47.0, 47.0, 65.0, 59.0, 49.0, 62.0, 53.0, 46.0, 45.0, 41.0, 24.0, 27.0, 22.0, 22.0, 20.0, 10.0, 11.0, 11.0, 6.0, 8.0, 8.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.701171875, -0.6803817749023438, -0.6595916748046875, -0.6388015747070312, -0.618011474609375, -0.5972213745117188, -0.5764312744140625, -0.5556411743164062, -0.53485107421875, -0.5140609741210938, -0.4932708740234375, -0.47248077392578125, -0.451690673828125, -0.43090057373046875, -0.4101104736328125, -0.38932037353515625, -0.3685302734375, -0.34774017333984375, -0.3269500732421875, -0.30615997314453125, -0.285369873046875, -0.26457977294921875, -0.2437896728515625, -0.22299957275390625, -0.20220947265625, -0.18141937255859375, -0.1606292724609375, -0.13983917236328125, -0.119049072265625, -0.09825897216796875, -0.0774688720703125, -0.05667877197265625, -0.035888671875, -0.01509857177734375, 0.0056915283203125, 0.02648162841796875, 0.047271728515625, 0.06806182861328125, 0.0888519287109375, 0.10964202880859375, 0.13043212890625, 0.15122222900390625, 0.1720123291015625, 0.19280242919921875, 0.213592529296875, 0.23438262939453125, 0.2551727294921875, 0.27596282958984375, 0.2967529296875, 0.31754302978515625, 0.3383331298828125, 0.35912322998046875, 0.379913330078125, 0.40070343017578125, 0.4214935302734375, 0.44228363037109375, 0.46307373046875, 0.48386383056640625, 0.5046539306640625, 0.5254440307617188, 0.546234130859375, 0.5670242309570312, 0.5878143310546875, 0.6086044311523438, 0.62939453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 4.0, 4.0, 7.0, 6.0, 9.0, 11.0, 19.0, 33.0, 32.0, 37.0, 42.0, 64.0, 86.0, 99.0, 156.0, 208.0, 271.0, 530.0, 2414.0, 56787.0, 4120617.0, 10352.0, 1153.0, 383.0, 226.0, 164.0, 133.0, 108.0, 86.0, 62.0, 36.0, 29.0, 26.0, 23.0, 19.0, 12.0, 14.0, 4.0, 6.0, 2.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.625, -8.3734130859375, -8.121826171875, -7.8702392578125, -7.61865234375, -7.3670654296875, -7.115478515625, -6.8638916015625, -6.6123046875, -6.3607177734375, -6.109130859375, -5.8575439453125, -5.60595703125, -5.3543701171875, -5.102783203125, -4.8511962890625, -4.599609375, -4.3480224609375, -4.096435546875, -3.8448486328125, -3.59326171875, -3.3416748046875, -3.090087890625, -2.8385009765625, -2.5869140625, -2.3353271484375, -2.083740234375, -1.8321533203125, -1.58056640625, -1.3289794921875, -1.077392578125, -0.8258056640625, -0.57421875, -0.3226318359375, -0.071044921875, 0.1805419921875, 0.43212890625, 0.6837158203125, 0.935302734375, 1.1868896484375, 1.4384765625, 1.6900634765625, 1.941650390625, 2.1932373046875, 2.44482421875, 2.6964111328125, 2.947998046875, 3.1995849609375, 3.451171875, 3.7027587890625, 3.954345703125, 4.2059326171875, 4.45751953125, 4.7091064453125, 4.960693359375, 5.2122802734375, 5.4638671875, 5.7154541015625, 5.967041015625, 6.2186279296875, 6.47021484375, 6.7218017578125, 6.973388671875, 7.2249755859375, 7.4765625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 18.0, 28.0, 114.0, 3492.0, 300.0, 81.0, 25.0, 8.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0], "bins": [-4.86328125, -4.7711181640625, -4.678955078125, -4.5867919921875, -4.49462890625, -4.4024658203125, -4.310302734375, -4.2181396484375, -4.1259765625, -4.0338134765625, -3.941650390625, -3.8494873046875, -3.75732421875, -3.6651611328125, -3.572998046875, -3.4808349609375, -3.388671875, -3.2965087890625, -3.204345703125, -3.1121826171875, -3.02001953125, -2.9278564453125, -2.835693359375, -2.7435302734375, -2.6513671875, -2.5592041015625, -2.467041015625, -2.3748779296875, -2.28271484375, -2.1905517578125, -2.098388671875, -2.0062255859375, -1.9140625, -1.8218994140625, -1.729736328125, -1.6375732421875, -1.54541015625, -1.4532470703125, -1.361083984375, -1.2689208984375, -1.1767578125, -1.0845947265625, -0.992431640625, -0.9002685546875, -0.80810546875, -0.7159423828125, -0.623779296875, -0.5316162109375, -0.439453125, -0.3472900390625, -0.255126953125, -0.1629638671875, -0.07080078125, 0.0213623046875, 0.113525390625, 0.2056884765625, 0.2978515625, 0.3900146484375, 0.482177734375, 0.5743408203125, 0.66650390625, 0.7586669921875, 0.850830078125, 0.9429931640625, 1.03515625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 5.0, 15.0, 20.0, 37.0, 42.0, 89.0, 138.0, 157.0, 159.0, 129.0, 82.0, 57.0, 22.0, 19.0, 8.0, 6.0, 6.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.920400619506836, -8.658134460449219, -8.395867347717285, -8.133601188659668, -7.871334552764893, -7.609067916870117, -7.3468017578125, -7.084535121917725, -6.822268486022949, -6.560001850128174, -6.297735214233398, -6.035469055175781, -5.773202419281006, -5.5109357833862305, -5.248669624328613, -4.986402988433838, -4.7241363525390625, -4.461869716644287, -4.199603080749512, -3.9373369216918945, -3.675070285797119, -3.4128036499023438, -3.1505372524261475, -2.888270854949951, -2.626004219055176, -2.3637375831604004, -2.101471185684204, -1.8392046689987183, -1.5769381523132324, -1.3146716356277466, -1.0524051189422607, -0.7901386022567749, -0.5278730392456055, -0.26560652256011963, -0.003340005874633789, 0.25892651081085205, 0.5211930274963379, 0.7834595441818237, 1.0457260608673096, 1.3079925775527954, 1.5702590942382812, 1.832525610923767, 2.094792127609253, 2.357058525085449, 2.6193251609802246, 2.881591796875, 3.1438581943511963, 3.4061245918273926, 3.668391227722168, 3.9306578636169434, 4.192924499511719, 4.455190658569336, 4.717457294464111, 4.979723930358887, 5.241990089416504, 5.504256725311279, 5.766523361206055, 6.02878999710083, 6.2910566329956055, 6.553322792053223, 6.815589427947998, 7.077856063842773, 7.340122222900391, 7.602388858795166, 7.864655494689941]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 11.0, 7.0, 22.0, 52.0, 46.0, 60.0, 84.0, 86.0, 99.0, 110.0, 107.0, 84.0, 58.0, 54.0, 35.0, 24.0, 16.0, 17.0, 12.0, 3.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.068631172180176, -6.798524856567383, -6.528418064117432, -6.2583112716674805, -5.9882049560546875, -5.7180986404418945, -5.447991847991943, -5.177885055541992, -4.907778739929199, -4.637672424316406, -4.367565631866455, -4.097458839416504, -3.827352523803711, -3.557245969772339, -3.287139415740967, -3.0170328617095947, -2.7469263076782227, -2.4768197536468506, -2.2067131996154785, -1.9366066455841064, -1.6665000915527344, -1.3963935375213623, -1.1262869834899902, -0.8561804294586182, -0.5860738754272461, -0.315967321395874, -0.04586076736450195, 0.22424578666687012, 0.4943523406982422, 0.7644588947296143, 1.0345654487609863, 1.3046720027923584, 1.574777603149414, 1.8448841571807861, 2.114990711212158, 2.3850972652435303, 2.6552038192749023, 2.9253103733062744, 3.1954169273376465, 3.4655234813690186, 3.7356300354003906, 4.005736351013184, 4.275843143463135, 4.545949935913086, 4.816056251525879, 5.086162567138672, 5.356269359588623, 5.626376152038574, 5.896482467651367, 6.16658878326416, 6.436695575714111, 6.7068023681640625, 6.9769086837768555, 7.247014999389648, 7.5171217918396, 7.787228584289551, 8.057334899902344, 8.327441215515137, 8.59754753112793, 8.867654800415039, 9.137761116027832, 9.407867431640625, 9.677974700927734, 9.948081016540527, 10.21818733215332]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 13.0, 7.0, 13.0, 28.0, 42.0, 36.0, 51.0, 106.0, 130.0, 201.0, 326.0, 531.0, 942.0, 1697.0, 3225.0, 6500.0, 14332.0, 34550.0, 88887.0, 224228.0, 344565.0, 196975.0, 76066.0, 29661.0, 12738.0, 5896.0, 2945.0, 1594.0, 904.0, 484.0, 315.0, 175.0, 125.0, 73.0, 63.0, 41.0, 24.0, 20.0, 11.0, 9.0, 8.0, 4.0, 7.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1494140625, -1.1074981689453125, -1.065582275390625, -1.0236663818359375, -0.98175048828125, -0.9398345947265625, -0.897918701171875, -0.8560028076171875, -0.8140869140625, -0.7721710205078125, -0.730255126953125, -0.6883392333984375, -0.64642333984375, -0.6045074462890625, -0.562591552734375, -0.5206756591796875, -0.478759765625, -0.4368438720703125, -0.394927978515625, -0.3530120849609375, -0.31109619140625, -0.2691802978515625, -0.227264404296875, -0.1853485107421875, -0.1434326171875, -0.1015167236328125, -0.059600830078125, -0.0176849365234375, 0.02423095703125, 0.0661468505859375, 0.108062744140625, 0.1499786376953125, 0.19189453125, 0.2338104248046875, 0.275726318359375, 0.3176422119140625, 0.35955810546875, 0.4014739990234375, 0.443389892578125, 0.4853057861328125, 0.5272216796875, 0.5691375732421875, 0.611053466796875, 0.6529693603515625, 0.69488525390625, 0.7368011474609375, 0.778717041015625, 0.8206329345703125, 0.862548828125, 0.9044647216796875, 0.946380615234375, 0.9882965087890625, 1.03021240234375, 1.0721282958984375, 1.114044189453125, 1.1559600830078125, 1.1978759765625, 1.2397918701171875, 1.281707763671875, 1.3236236572265625, 1.36553955078125, 1.4074554443359375, 1.449371337890625, 1.4912872314453125, 1.533203125]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 2.0, 6.0, 10.0, 12.0, 15.0, 13.0, 25.0, 25.0, 30.0, 37.0, 31.0, 45.0, 40.0, 50.0, 71.0, 56.0, 62.0, 71.0, 64.0, 60.0, 39.0, 51.0, 32.0, 31.0, 26.0, 20.0, 14.0, 12.0, 9.0, 7.0, 8.0, 4.0, 6.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.65673828125, -0.6317977905273438, -0.6068572998046875, -0.5819168090820312, -0.556976318359375, -0.5320358276367188, -0.5070953369140625, -0.48215484619140625, -0.45721435546875, -0.43227386474609375, -0.4073333740234375, -0.38239288330078125, -0.357452392578125, -0.33251190185546875, -0.3075714111328125, -0.28263092041015625, -0.2576904296875, -0.23274993896484375, -0.2078094482421875, -0.18286895751953125, -0.157928466796875, -0.13298797607421875, -0.1080474853515625, -0.08310699462890625, -0.05816650390625, -0.03322601318359375, -0.0082855224609375, 0.01665496826171875, 0.041595458984375, 0.06653594970703125, 0.0914764404296875, 0.11641693115234375, 0.141357421875, 0.16629791259765625, 0.1912384033203125, 0.21617889404296875, 0.241119384765625, 0.26605987548828125, 0.2910003662109375, 0.31594085693359375, 0.34088134765625, 0.36582183837890625, 0.3907623291015625, 0.41570281982421875, 0.440643310546875, 0.46558380126953125, 0.4905242919921875, 0.5154647827148438, 0.5404052734375, 0.5653457641601562, 0.5902862548828125, 0.6152267456054688, 0.640167236328125, 0.6651077270507812, 0.6900482177734375, 0.7149887084960938, 0.73992919921875, 0.7648696899414062, 0.7898101806640625, 0.8147506713867188, 0.839691162109375, 0.8646316528320312, 0.8895721435546875, 0.9145126342773438, 0.939453125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 9.0, 13.0, 38.0, 40.0, 87.0, 124.0, 183.0, 386.0, 911.0, 3824.0, 67998.0, 935323.0, 35122.0, 2889.0, 763.0, 338.0, 174.0, 119.0, 69.0, 49.0, 26.0, 20.0, 9.0, 9.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.8125, -5.61492919921875, -5.4173583984375, -5.21978759765625, -5.022216796875, -4.82464599609375, -4.6270751953125, -4.42950439453125, -4.23193359375, -4.03436279296875, -3.8367919921875, -3.63922119140625, -3.441650390625, -3.24407958984375, -3.0465087890625, -2.84893798828125, -2.6513671875, -2.45379638671875, -2.2562255859375, -2.05865478515625, -1.861083984375, -1.66351318359375, -1.4659423828125, -1.26837158203125, -1.07080078125, -0.87322998046875, -0.6756591796875, -0.47808837890625, -0.280517578125, -0.08294677734375, 0.1146240234375, 0.31219482421875, 0.509765625, 0.70733642578125, 0.9049072265625, 1.10247802734375, 1.300048828125, 1.49761962890625, 1.6951904296875, 1.89276123046875, 2.09033203125, 2.28790283203125, 2.4854736328125, 2.68304443359375, 2.880615234375, 3.07818603515625, 3.2757568359375, 3.47332763671875, 3.6708984375, 3.86846923828125, 4.0660400390625, 4.26361083984375, 4.461181640625, 4.65875244140625, 4.8563232421875, 5.05389404296875, 5.25146484375, 5.44903564453125, 5.6466064453125, 5.84417724609375, 6.041748046875, 6.23931884765625, 6.4368896484375, 6.63446044921875, 6.83203125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 9.0, 12.0, 12.0, 13.0, 27.0, 27.0, 40.0, 43.0, 58.0, 52.0, 71.0, 97.0, 74.0, 84.0, 61.0, 73.0, 63.0, 52.0, 36.0, 29.0, 21.0, 16.0, 13.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.015625, -4.86053466796875, -4.7054443359375, -4.55035400390625, -4.395263671875, -4.24017333984375, -4.0850830078125, -3.92999267578125, -3.77490234375, -3.61981201171875, -3.4647216796875, -3.30963134765625, -3.154541015625, -2.99945068359375, -2.8443603515625, -2.68927001953125, -2.5341796875, -2.37908935546875, -2.2239990234375, -2.06890869140625, -1.913818359375, -1.75872802734375, -1.6036376953125, -1.44854736328125, -1.29345703125, -1.13836669921875, -0.9832763671875, -0.82818603515625, -0.673095703125, -0.51800537109375, -0.3629150390625, -0.20782470703125, -0.052734375, 0.10235595703125, 0.2574462890625, 0.41253662109375, 0.567626953125, 0.72271728515625, 0.8778076171875, 1.03289794921875, 1.18798828125, 1.34307861328125, 1.4981689453125, 1.65325927734375, 1.808349609375, 1.96343994140625, 2.1185302734375, 2.27362060546875, 2.4287109375, 2.58380126953125, 2.7388916015625, 2.89398193359375, 3.049072265625, 3.20416259765625, 3.3592529296875, 3.51434326171875, 3.66943359375, 3.82452392578125, 3.9796142578125, 4.13470458984375, 4.289794921875, 4.44488525390625, 4.5999755859375, 4.75506591796875, 4.91015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 10.0, 9.0, 15.0, 17.0, 44.0, 77.0, 136.0, 344.0, 1018.0, 4556.0, 63919.0, 922021.0, 50840.0, 3932.0, 915.0, 352.0, 150.0, 86.0, 34.0, 16.0, 17.0, 15.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.0872955322265625, -2.030059814453125, -1.9728240966796875, -1.91558837890625, -1.8583526611328125, -1.801116943359375, -1.7438812255859375, -1.6866455078125, -1.6294097900390625, -1.572174072265625, -1.5149383544921875, -1.45770263671875, -1.4004669189453125, -1.343231201171875, -1.2859954833984375, -1.228759765625, -1.1715240478515625, -1.114288330078125, -1.0570526123046875, -0.99981689453125, -0.9425811767578125, -0.885345458984375, -0.8281097412109375, -0.7708740234375, -0.7136383056640625, -0.656402587890625, -0.5991668701171875, -0.54193115234375, -0.4846954345703125, -0.427459716796875, -0.3702239990234375, -0.31298828125, -0.2557525634765625, -0.198516845703125, -0.1412811279296875, -0.08404541015625, -0.0268096923828125, 0.030426025390625, 0.0876617431640625, 0.1448974609375, 0.2021331787109375, 0.259368896484375, 0.3166046142578125, 0.37384033203125, 0.4310760498046875, 0.488311767578125, 0.5455474853515625, 0.602783203125, 0.6600189208984375, 0.717254638671875, 0.7744903564453125, 0.83172607421875, 0.8889617919921875, 0.946197509765625, 1.0034332275390625, 1.0606689453125, 1.1179046630859375, 1.175140380859375, 1.2323760986328125, 1.28961181640625, 1.3468475341796875, 1.404083251953125, 1.4613189697265625, 1.5185546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0, 5.0, 4.0, 9.0, 10.0, 10.0, 19.0, 24.0, 34.0, 42.0, 71.0, 92.0, 119.0, 112.0, 109.0, 103.0, 77.0, 39.0, 32.0, 21.0, 22.0, 7.0, 6.0, 11.0, 10.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00023245811462402344, -0.00022589415311813354, -0.00021933019161224365, -0.00021276623010635376, -0.00020620226860046387, -0.00019963830709457397, -0.00019307434558868408, -0.0001865103840827942, -0.0001799464225769043, -0.0001733824610710144, -0.0001668184995651245, -0.00016025453805923462, -0.00015369057655334473, -0.00014712661504745483, -0.00014056265354156494, -0.00013399869203567505, -0.00012743473052978516, -0.00012087076902389526, -0.00011430680751800537, -0.00010774284601211548, -0.00010117888450622559, -9.46149230003357e-05, -8.80509614944458e-05, -8.148699998855591e-05, -7.492303848266602e-05, -6.835907697677612e-05, -6.179511547088623e-05, -5.523115396499634e-05, -4.8667192459106445e-05, -4.210323095321655e-05, -3.553926944732666e-05, -2.8975307941436768e-05, -2.2411346435546875e-05, -1.5847384929656982e-05, -9.28342342376709e-06, -2.7194619178771973e-06, 3.844499588012695e-06, 1.0408461093902588e-05, 1.697242259979248e-05, 2.3536384105682373e-05, 3.0100345611572266e-05, 3.666430711746216e-05, 4.322826862335205e-05, 4.979223012924194e-05, 5.6356191635131836e-05, 6.292015314102173e-05, 6.948411464691162e-05, 7.604807615280151e-05, 8.26120376586914e-05, 8.91759991645813e-05, 9.573996067047119e-05, 0.00010230392217636108, 0.00010886788368225098, 0.00011543184518814087, 0.00012199580669403076, 0.00012855976819992065, 0.00013512372970581055, 0.00014168769121170044, 0.00014825165271759033, 0.00015481561422348022, 0.00016137957572937012, 0.00016794353723526, 0.0001745074987411499, 0.0001810714602470398, 0.0001876354217529297]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 9.0, 7.0, 2.0, 9.0, 14.0, 29.0, 40.0, 58.0, 84.0, 182.0, 390.0, 820.0, 2496.0, 12710.0, 210623.0, 773386.0, 40026.0, 5149.0, 1377.0, 564.0, 247.0, 112.0, 82.0, 54.0, 29.0, 20.0, 13.0, 4.0, 5.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3692626953125, -1.325439453125, -1.2816162109375, -1.23779296875, -1.1939697265625, -1.150146484375, -1.1063232421875, -1.0625, -1.0186767578125, -0.974853515625, -0.9310302734375, -0.88720703125, -0.8433837890625, -0.799560546875, -0.7557373046875, -0.7119140625, -0.6680908203125, -0.624267578125, -0.5804443359375, -0.53662109375, -0.4927978515625, -0.448974609375, -0.4051513671875, -0.361328125, -0.3175048828125, -0.273681640625, -0.2298583984375, -0.18603515625, -0.1422119140625, -0.098388671875, -0.0545654296875, -0.0107421875, 0.0330810546875, 0.076904296875, 0.1207275390625, 0.16455078125, 0.2083740234375, 0.252197265625, 0.2960205078125, 0.33984375, 0.3836669921875, 0.427490234375, 0.4713134765625, 0.51513671875, 0.5589599609375, 0.602783203125, 0.6466064453125, 0.6904296875, 0.7342529296875, 0.778076171875, 0.8218994140625, 0.86572265625, 0.9095458984375, 0.953369140625, 0.9971923828125, 1.041015625, 1.0848388671875, 1.128662109375, 1.1724853515625, 1.21630859375, 1.2601318359375, 1.303955078125, 1.3477783203125, 1.3916015625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 3.0, 10.0, 9.0, 11.0, 17.0, 35.0, 24.0, 58.0, 70.0, 86.0, 110.0, 118.0, 113.0, 93.0, 72.0, 60.0, 40.0, 21.0, 17.0, 11.0, 3.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.990234375, -0.952606201171875, -0.91497802734375, -0.877349853515625, -0.8397216796875, -0.802093505859375, -0.76446533203125, -0.726837158203125, -0.689208984375, -0.651580810546875, -0.61395263671875, -0.576324462890625, -0.5386962890625, -0.501068115234375, -0.46343994140625, -0.425811767578125, -0.38818359375, -0.350555419921875, -0.31292724609375, -0.275299072265625, -0.2376708984375, -0.200042724609375, -0.16241455078125, -0.124786376953125, -0.087158203125, -0.049530029296875, -0.01190185546875, 0.025726318359375, 0.0633544921875, 0.100982666015625, 0.13861083984375, 0.176239013671875, 0.2138671875, 0.251495361328125, 0.28912353515625, 0.326751708984375, 0.3643798828125, 0.402008056640625, 0.43963623046875, 0.477264404296875, 0.514892578125, 0.552520751953125, 0.59014892578125, 0.627777099609375, 0.6654052734375, 0.703033447265625, 0.74066162109375, 0.778289794921875, 0.81591796875, 0.853546142578125, 0.89117431640625, 0.928802490234375, 0.9664306640625, 1.004058837890625, 1.04168701171875, 1.079315185546875, 1.116943359375, 1.154571533203125, 1.19219970703125, 1.229827880859375, 1.2674560546875, 1.305084228515625, 1.34271240234375, 1.380340576171875, 1.41796875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 15.0, 17.0, 48.0, 104.0, 207.0, 276.0, 188.0, 76.0, 42.0, 24.0, 6.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.46487808227539, -16.038665771484375, -14.612455368041992, -13.186243057250977, -11.760031700134277, -10.333820343017578, -8.907608032226562, -7.481396675109863, -6.055185317993164, -4.628973960876465, -3.2027621269226074, -1.77655029296875, -0.3503389358520508, 1.0758724212646484, 2.502084732055664, 3.9282960891723633, 5.3545074462890625, 6.780718803405762, 8.206930160522461, 9.633142471313477, 11.059353828430176, 12.485565185546875, 13.91177749633789, 15.33798885345459, 16.76420021057129, 18.190412521362305, 19.616622924804688, 21.042835235595703, 22.46904754638672, 23.8952579498291, 25.321470260620117, 26.7476806640625, 28.17389678955078, 29.600109100341797, 31.02631950378418, 32.45252990722656, 33.87874221801758, 35.304954528808594, 36.73116683959961, 38.157379150390625, 39.583587646484375, 41.00979995727539, 42.436012268066406, 43.862220764160156, 45.28843307495117, 46.71464538574219, 48.1408576965332, 49.56707000732422, 50.993282318115234, 52.41949462890625, 53.845706939697266, 55.27191925048828, 56.69812774658203, 58.12434005737305, 59.55055236816406, 60.97676467895508, 62.402976989746094, 63.82918930053711, 65.25540161132812, 66.68161010742188, 68.10782623291016, 69.5340347290039, 70.96025085449219, 72.38645935058594, 73.81266784667969]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 1.0, 4.0, 5.0, 8.0, 10.0, 16.0, 18.0, 21.0, 20.0, 30.0, 37.0, 42.0, 59.0, 63.0, 61.0, 61.0, 51.0, 75.0, 64.0, 47.0, 51.0, 48.0, 51.0, 36.0, 23.0, 26.0, 14.0, 15.0, 9.0, 9.0, 9.0, 4.0, 7.0, 5.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.036518096923828, -20.397083282470703, -19.757646560668945, -19.11821174621582, -18.478775024414062, -17.839340209960938, -17.199905395507812, -16.560470581054688, -15.92103385925293, -15.281598091125488, -14.642162322998047, -14.002727508544922, -13.36329174041748, -12.723855972290039, -12.084421157836914, -11.444985389709473, -10.805549621582031, -10.16611385345459, -9.526678085327148, -8.887243270874023, -8.247807502746582, -7.608371734619141, -6.968936443328857, -6.329501152038574, -5.690065383911133, -5.050629615783691, -4.411194324493408, -3.771758794784546, -3.1323232650756836, -2.4928877353668213, -1.853452205657959, -1.2140169143676758, -0.5745811462402344, 0.06485438346862793, 0.7042899131774902, 1.3437254428863525, 1.9831609725952148, 2.622596502304077, 3.2620320320129395, 3.9014673233032227, 4.540903091430664, 5.1803388595581055, 5.819774150848389, 6.459209442138672, 7.098645210266113, 7.738080978393555, 8.37751579284668, 9.016951560974121, 9.656387329101562, 10.295823097229004, 10.935258865356445, 11.57469367980957, 12.214129447937012, 12.853565216064453, 13.493000030517578, 14.13243579864502, 14.771871566772461, 15.411307334899902, 16.050743103027344, 16.69017791748047, 17.329612731933594, 17.96904945373535, 18.608484268188477, 19.247920989990234, 19.88735580444336]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 1.0, 2.0, 7.0, 6.0, 9.0, 9.0, 7.0, 11.0, 13.0, 19.0, 24.0, 33.0, 34.0, 41.0, 65.0, 110.0, 127.0, 223.0, 365.0, 682.0, 1260.0, 3059.0, 7999.0, 27231.0, 142278.0, 3218992.0, 697350.0, 66861.0, 17249.0, 5733.0, 2310.0, 1062.0, 495.0, 232.0, 144.0, 87.0, 53.0, 28.0, 20.0, 12.0, 12.0, 12.0, 4.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.08203125, -2.030975341796875, -1.97991943359375, -1.928863525390625, -1.8778076171875, -1.826751708984375, -1.77569580078125, -1.724639892578125, -1.673583984375, -1.622528076171875, -1.57147216796875, -1.520416259765625, -1.4693603515625, -1.418304443359375, -1.36724853515625, -1.316192626953125, -1.26513671875, -1.214080810546875, -1.16302490234375, -1.111968994140625, -1.0609130859375, -1.009857177734375, -0.95880126953125, -0.907745361328125, -0.856689453125, -0.805633544921875, -0.75457763671875, -0.703521728515625, -0.6524658203125, -0.601409912109375, -0.55035400390625, -0.499298095703125, -0.4482421875, -0.397186279296875, -0.34613037109375, -0.295074462890625, -0.2440185546875, -0.192962646484375, -0.14190673828125, -0.090850830078125, -0.039794921875, 0.011260986328125, 0.06231689453125, 0.113372802734375, 0.1644287109375, 0.215484619140625, 0.26654052734375, 0.317596435546875, 0.36865234375, 0.419708251953125, 0.47076416015625, 0.521820068359375, 0.5728759765625, 0.623931884765625, 0.67498779296875, 0.726043701171875, 0.777099609375, 0.828155517578125, 0.87921142578125, 0.930267333984375, 0.9813232421875, 1.032379150390625, 1.08343505859375, 1.134490966796875, 1.185546875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 20.0, 34.0, 61.0, 89.0, 103.0, 145.0, 142.0, 107.0, 115.0, 57.0, 53.0, 32.0, 11.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15625, -2.1038665771484375, -2.051483154296875, -1.9990997314453125, -1.94671630859375, -1.8943328857421875, -1.841949462890625, -1.7895660400390625, -1.7371826171875, -1.6847991943359375, -1.632415771484375, -1.5800323486328125, -1.52764892578125, -1.4752655029296875, -1.422882080078125, -1.3704986572265625, -1.318115234375, -1.2657318115234375, -1.213348388671875, -1.1609649658203125, -1.10858154296875, -1.0561981201171875, -1.003814697265625, -0.9514312744140625, -0.8990478515625, -0.8466644287109375, -0.794281005859375, -0.7418975830078125, -0.68951416015625, -0.6371307373046875, -0.584747314453125, -0.5323638916015625, -0.47998046875, -0.4275970458984375, -0.375213623046875, -0.3228302001953125, -0.27044677734375, -0.2180633544921875, -0.165679931640625, -0.1132965087890625, -0.0609130859375, -0.0085296630859375, 0.043853759765625, 0.0962371826171875, 0.14862060546875, 0.2010040283203125, 0.253387451171875, 0.3057708740234375, 0.358154296875, 0.4105377197265625, 0.462921142578125, 0.5153045654296875, 0.56768798828125, 0.6200714111328125, 0.672454833984375, 0.7248382568359375, 0.7772216796875, 0.8296051025390625, 0.881988525390625, 0.9343719482421875, 0.98675537109375, 1.0391387939453125, 1.091522216796875, 1.1439056396484375, 1.1962890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 7.0, 10.0, 14.0, 20.0, 23.0, 50.0, 73.0, 110.0, 232.0, 518.0, 1252.0, 3844.0, 15148.0, 104116.0, 3659443.0, 368966.0, 30547.0, 6449.0, 1981.0, 780.0, 301.0, 156.0, 85.0, 44.0, 21.0, 14.0, 13.0, 10.0, 6.0, 10.0, 6.0, 4.0, 5.0, 1.0, 1.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.833984375, -2.749908447265625, -2.66583251953125, -2.581756591796875, -2.4976806640625, -2.413604736328125, -2.32952880859375, -2.245452880859375, -2.161376953125, -2.077301025390625, -1.99322509765625, -1.909149169921875, -1.8250732421875, -1.740997314453125, -1.65692138671875, -1.572845458984375, -1.48876953125, -1.404693603515625, -1.32061767578125, -1.236541748046875, -1.1524658203125, -1.068389892578125, -0.98431396484375, -0.900238037109375, -0.816162109375, -0.732086181640625, -0.64801025390625, -0.563934326171875, -0.4798583984375, -0.395782470703125, -0.31170654296875, -0.227630615234375, -0.1435546875, -0.059478759765625, 0.02459716796875, 0.108673095703125, 0.1927490234375, 0.276824951171875, 0.36090087890625, 0.444976806640625, 0.529052734375, 0.613128662109375, 0.69720458984375, 0.781280517578125, 0.8653564453125, 0.949432373046875, 1.03350830078125, 1.117584228515625, 1.20166015625, 1.285736083984375, 1.36981201171875, 1.453887939453125, 1.5379638671875, 1.622039794921875, 1.70611572265625, 1.790191650390625, 1.874267578125, 1.958343505859375, 2.04241943359375, 2.126495361328125, 2.2105712890625, 2.294647216796875, 2.37872314453125, 2.462799072265625, 2.546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 2.0, 7.0, 8.0, 14.0, 15.0, 16.0, 20.0, 37.0, 63.0, 75.0, 147.0, 322.0, 856.0, 1215.0, 645.0, 257.0, 136.0, 66.0, 52.0, 29.0, 17.0, 21.0, 9.0, 7.0, 10.0, 4.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.41796875, -2.34332275390625, -2.2686767578125, -2.19403076171875, -2.119384765625, -2.04473876953125, -1.9700927734375, -1.89544677734375, -1.82080078125, -1.74615478515625, -1.6715087890625, -1.59686279296875, -1.522216796875, -1.44757080078125, -1.3729248046875, -1.29827880859375, -1.2236328125, -1.14898681640625, -1.0743408203125, -0.99969482421875, -0.925048828125, -0.85040283203125, -0.7757568359375, -0.70111083984375, -0.62646484375, -0.55181884765625, -0.4771728515625, -0.40252685546875, -0.327880859375, -0.25323486328125, -0.1785888671875, -0.10394287109375, -0.029296875, 0.04534912109375, 0.1199951171875, 0.19464111328125, 0.269287109375, 0.34393310546875, 0.4185791015625, 0.49322509765625, 0.56787109375, 0.64251708984375, 0.7171630859375, 0.79180908203125, 0.866455078125, 0.94110107421875, 1.0157470703125, 1.09039306640625, 1.1650390625, 1.23968505859375, 1.3143310546875, 1.38897705078125, 1.463623046875, 1.53826904296875, 1.6129150390625, 1.68756103515625, 1.76220703125, 1.83685302734375, 1.9114990234375, 1.98614501953125, 2.060791015625, 2.13543701171875, 2.2100830078125, 2.28472900390625, 2.359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 8.0, 14.0, 31.0, 94.0, 215.0, 285.0, 194.0, 99.0, 31.0, 9.0, 7.0, 6.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.81629180908203, -35.92899703979492, -35.04170227050781, -34.1544075012207, -33.267112731933594, -32.379817962646484, -31.492525100708008, -30.6052303314209, -29.71793556213379, -28.83064079284668, -27.94334602355957, -27.05605125427246, -26.168758392333984, -25.281463623046875, -24.394168853759766, -23.506874084472656, -22.619579315185547, -21.732284545898438, -20.844989776611328, -19.95769500732422, -19.07040023803711, -18.18310546875, -17.295812606811523, -16.408517837524414, -15.521223068237305, -14.633928298950195, -13.746633529663086, -12.859339714050293, -11.972044944763184, -11.084750175476074, -10.197456359863281, -9.310161590576172, -8.422868728637695, -7.535573959350586, -6.648279666900635, -5.760985374450684, -4.873690605163574, -3.986395835876465, -3.0991015434265137, -2.2118072509765625, -1.3245124816894531, -0.43721795082092285, 0.4500765800476074, 1.3373711109161377, 2.224665641784668, 3.1119604110717773, 3.9992547035217285, 4.88654899597168, 5.773843765258789, 6.661138534545898, 7.54843282699585, 8.4357271194458, 9.32302188873291, 10.21031665802002, 11.097610473632812, 11.984905242919922, 12.872200012207031, 13.75949478149414, 14.64678955078125, 15.534083366394043, 16.42137908935547, 17.308673858642578, 18.195966720581055, 19.083261489868164, 19.970556259155273]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 7.0, 7.0, 9.0, 13.0, 18.0, 21.0, 19.0, 22.0, 36.0, 28.0, 45.0, 43.0, 48.0, 66.0, 54.0, 60.0, 62.0, 56.0, 52.0, 52.0, 40.0, 40.0, 39.0, 42.0, 21.0, 23.0, 23.0, 13.0, 12.0, 8.0, 7.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.543047904968262, -9.176339149475098, -8.809630393981934, -8.44292163848877, -8.076212882995605, -7.709504127502441, -7.342795372009277, -6.976086616516113, -6.609377861022949, -6.242669105529785, -5.875960350036621, -5.509251594543457, -5.142542839050293, -4.775834083557129, -4.409125328063965, -4.042416572570801, -3.6757073402404785, -3.3089985847473145, -2.9422898292541504, -2.5755810737609863, -2.2088723182678223, -1.8421634435653687, -1.475454568862915, -1.108745813369751, -0.7420370578765869, -0.37532827258110046, -0.008619487285614014, 0.3580893278121948, 0.7247980833053589, 1.091506838798523, 1.4582157135009766, 1.8249244689941406, 2.1916332244873047, 2.5583419799804688, 2.925050735473633, 3.291759490966797, 3.658468246459961, 4.025177001953125, 4.391885757446289, 4.758594512939453, 5.125303268432617, 5.492012023925781, 5.858720779418945, 6.225429534912109, 6.592138290405273, 6.9588470458984375, 7.325555801391602, 7.692264556884766, 8.05897331237793, 8.425682067871094, 8.792390823364258, 9.159099578857422, 9.525808334350586, 9.89251708984375, 10.259225845336914, 10.625934600830078, 10.992644309997559, 11.359353065490723, 11.726061820983887, 12.09277057647705, 12.459479331970215, 12.826188087463379, 13.192896842956543, 13.559605598449707, 13.926314353942871]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 9.0, 5.0, 8.0, 8.0, 18.0, 35.0, 35.0, 70.0, 96.0, 178.0, 266.0, 411.0, 826.0, 1382.0, 2527.0, 5060.0, 10587.0, 23187.0, 53036.0, 118712.0, 230494.0, 278968.0, 173788.0, 81420.0, 35885.0, 16066.0, 7405.0, 3692.0, 1902.0, 989.0, 562.0, 343.0, 191.0, 141.0, 93.0, 48.0, 39.0, 29.0, 12.0, 9.0, 8.0, 6.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-1.09765625, -1.0656204223632812, -1.0335845947265625, -1.0015487670898438, -0.969512939453125, -0.9374771118164062, -0.9054412841796875, -0.8734054565429688, -0.84136962890625, -0.8093338012695312, -0.7772979736328125, -0.7452621459960938, -0.713226318359375, -0.6811904907226562, -0.6491546630859375, -0.6171188354492188, -0.5850830078125, -0.5530471801757812, -0.5210113525390625, -0.48897552490234375, -0.456939697265625, -0.42490386962890625, -0.3928680419921875, -0.36083221435546875, -0.32879638671875, -0.29676055908203125, -0.2647247314453125, -0.23268890380859375, -0.200653076171875, -0.16861724853515625, -0.1365814208984375, -0.10454559326171875, -0.072509765625, -0.04047393798828125, -0.0084381103515625, 0.02359771728515625, 0.055633544921875, 0.08766937255859375, 0.1197052001953125, 0.15174102783203125, 0.18377685546875, 0.21581268310546875, 0.2478485107421875, 0.27988433837890625, 0.311920166015625, 0.34395599365234375, 0.3759918212890625, 0.40802764892578125, 0.4400634765625, 0.47209930419921875, 0.5041351318359375, 0.5361709594726562, 0.568206787109375, 0.6002426147460938, 0.6322784423828125, 0.6643142700195312, 0.69635009765625, 0.7283859252929688, 0.7604217529296875, 0.7924575805664062, 0.824493408203125, 0.8565292358398438, 0.8885650634765625, 0.9206008911132812, 0.95263671875]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 12.0, 7.0, 15.0, 21.0, 18.0, 39.0, 61.0, 83.0, 81.0, 100.0, 115.0, 97.0, 86.0, 71.0, 65.0, 45.0, 29.0, 22.0, 13.0, 10.0, 10.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3935546875, -1.35540771484375, -1.3172607421875, -1.27911376953125, -1.240966796875, -1.20281982421875, -1.1646728515625, -1.12652587890625, -1.08837890625, -1.05023193359375, -1.0120849609375, -0.97393798828125, -0.935791015625, -0.89764404296875, -0.8594970703125, -0.82135009765625, -0.783203125, -0.74505615234375, -0.7069091796875, -0.66876220703125, -0.630615234375, -0.59246826171875, -0.5543212890625, -0.51617431640625, -0.47802734375, -0.43988037109375, -0.4017333984375, -0.36358642578125, -0.325439453125, -0.28729248046875, -0.2491455078125, -0.21099853515625, -0.1728515625, -0.13470458984375, -0.0965576171875, -0.05841064453125, -0.020263671875, 0.01788330078125, 0.0560302734375, 0.09417724609375, 0.13232421875, 0.17047119140625, 0.2086181640625, 0.24676513671875, 0.284912109375, 0.32305908203125, 0.3612060546875, 0.39935302734375, 0.4375, 0.47564697265625, 0.5137939453125, 0.55194091796875, 0.590087890625, 0.62823486328125, 0.6663818359375, 0.70452880859375, 0.74267578125, 0.78082275390625, 0.8189697265625, 0.85711669921875, 0.895263671875, 0.93341064453125, 0.9715576171875, 1.00970458984375, 1.0478515625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 4.0, 17.0, 14.0, 24.0, 40.0, 44.0, 80.0, 122.0, 171.0, 280.0, 453.0, 743.0, 1439.0, 3079.0, 8967.0, 35384.0, 203057.0, 603385.0, 151022.0, 27166.0, 7176.0, 2705.0, 1258.0, 681.0, 423.0, 267.0, 157.0, 118.0, 69.0, 45.0, 43.0, 34.0, 23.0, 14.0, 8.0, 6.0, 6.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.71875, -1.6536865234375, -1.588623046875, -1.5235595703125, -1.45849609375, -1.3934326171875, -1.328369140625, -1.2633056640625, -1.1982421875, -1.1331787109375, -1.068115234375, -1.0030517578125, -0.93798828125, -0.8729248046875, -0.807861328125, -0.7427978515625, -0.677734375, -0.6126708984375, -0.547607421875, -0.4825439453125, -0.41748046875, -0.3524169921875, -0.287353515625, -0.2222900390625, -0.1572265625, -0.0921630859375, -0.027099609375, 0.0379638671875, 0.10302734375, 0.1680908203125, 0.233154296875, 0.2982177734375, 0.36328125, 0.4283447265625, 0.493408203125, 0.5584716796875, 0.62353515625, 0.6885986328125, 0.753662109375, 0.8187255859375, 0.8837890625, 0.9488525390625, 1.013916015625, 1.0789794921875, 1.14404296875, 1.2091064453125, 1.274169921875, 1.3392333984375, 1.404296875, 1.4693603515625, 1.534423828125, 1.5994873046875, 1.66455078125, 1.7296142578125, 1.794677734375, 1.8597412109375, 1.9248046875, 1.9898681640625, 2.054931640625, 2.1199951171875, 2.18505859375, 2.2501220703125, 2.315185546875, 2.3802490234375, 2.4453125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0, 4.0, 7.0, 14.0, 12.0, 14.0, 17.0, 25.0, 17.0, 26.0, 28.0, 48.0, 46.0, 43.0, 46.0, 56.0, 52.0, 48.0, 42.0, 55.0, 42.0, 46.0, 43.0, 34.0, 43.0, 30.0, 27.0, 25.0, 13.0, 20.0, 18.0, 10.0, 12.0, 5.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9765625, -2.883453369140625, -2.79034423828125, -2.697235107421875, -2.6041259765625, -2.511016845703125, -2.41790771484375, -2.324798583984375, -2.231689453125, -2.138580322265625, -2.04547119140625, -1.952362060546875, -1.8592529296875, -1.766143798828125, -1.67303466796875, -1.579925537109375, -1.48681640625, -1.393707275390625, -1.30059814453125, -1.207489013671875, -1.1143798828125, -1.021270751953125, -0.92816162109375, -0.835052490234375, -0.741943359375, -0.648834228515625, -0.55572509765625, -0.462615966796875, -0.3695068359375, -0.276397705078125, -0.18328857421875, -0.090179443359375, 0.0029296875, 0.096038818359375, 0.18914794921875, 0.282257080078125, 0.3753662109375, 0.468475341796875, 0.56158447265625, 0.654693603515625, 0.747802734375, 0.840911865234375, 0.93402099609375, 1.027130126953125, 1.1202392578125, 1.213348388671875, 1.30645751953125, 1.399566650390625, 1.49267578125, 1.585784912109375, 1.67889404296875, 1.772003173828125, 1.8651123046875, 1.958221435546875, 2.05133056640625, 2.144439697265625, 2.237548828125, 2.330657958984375, 2.42376708984375, 2.516876220703125, 2.6099853515625, 2.703094482421875, 2.79620361328125, 2.889312744140625, 2.982421875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 1.0, 10.0, 24.0, 16.0, 25.0, 57.0, 61.0, 125.0, 234.0, 514.0, 1217.0, 4067.0, 21468.0, 300791.0, 670013.0, 40820.0, 6090.0, 1674.0, 624.0, 300.0, 169.0, 87.0, 54.0, 21.0, 28.0, 18.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2216796875, -1.1858978271484375, -1.150115966796875, -1.1143341064453125, -1.07855224609375, -1.0427703857421875, -1.006988525390625, -0.9712066650390625, -0.9354248046875, -0.8996429443359375, -0.863861083984375, -0.8280792236328125, -0.79229736328125, -0.7565155029296875, -0.720733642578125, -0.6849517822265625, -0.649169921875, -0.6133880615234375, -0.577606201171875, -0.5418243408203125, -0.50604248046875, -0.4702606201171875, -0.434478759765625, -0.3986968994140625, -0.3629150390625, -0.3271331787109375, -0.291351318359375, -0.2555694580078125, -0.21978759765625, -0.1840057373046875, -0.148223876953125, -0.1124420166015625, -0.07666015625, -0.0408782958984375, -0.005096435546875, 0.0306854248046875, 0.06646728515625, 0.1022491455078125, 0.138031005859375, 0.1738128662109375, 0.2095947265625, 0.2453765869140625, 0.281158447265625, 0.3169403076171875, 0.35272216796875, 0.3885040283203125, 0.424285888671875, 0.4600677490234375, 0.495849609375, 0.5316314697265625, 0.567413330078125, 0.6031951904296875, 0.63897705078125, 0.6747589111328125, 0.710540771484375, 0.7463226318359375, 0.7821044921875, 0.8178863525390625, 0.853668212890625, 0.8894500732421875, 0.92523193359375, 0.9610137939453125, 0.996795654296875, 1.0325775146484375, 1.068359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 0.0, 2.0, 4.0, 3.0, 3.0, 9.0, 7.0, 15.0, 20.0, 31.0, 40.0, 54.0, 74.0, 78.0, 126.0, 124.0, 109.0, 66.0, 63.0, 52.0, 28.0, 25.0, 19.0, 16.0, 9.0, 4.0, 4.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019669532775878906, -0.00019000470638275146, -0.00018331408500671387, -0.00017662346363067627, -0.00016993284225463867, -0.00016324222087860107, -0.00015655159950256348, -0.00014986097812652588, -0.00014317035675048828, -0.00013647973537445068, -0.00012978911399841309, -0.0001230984926223755, -0.00011640787124633789, -0.00010971724987030029, -0.0001030266284942627, -9.63360071182251e-05, -8.96453857421875e-05, -8.29547643661499e-05, -7.62641429901123e-05, -6.957352161407471e-05, -6.288290023803711e-05, -5.619227886199951e-05, -4.9501657485961914e-05, -4.2811036109924316e-05, -3.612041473388672e-05, -2.942979335784912e-05, -2.2739171981811523e-05, -1.6048550605773926e-05, -9.357929229736328e-06, -2.6673078536987305e-06, 4.023313522338867e-06, 1.0713934898376465e-05, 1.7404556274414062e-05, 2.409517765045166e-05, 3.078579902648926e-05, 3.7476420402526855e-05, 4.416704177856445e-05, 5.085766315460205e-05, 5.754828453063965e-05, 6.423890590667725e-05, 7.092952728271484e-05, 7.762014865875244e-05, 8.431077003479004e-05, 9.100139141082764e-05, 9.769201278686523e-05, 0.00010438263416290283, 0.00011107325553894043, 0.00011776387691497803, 0.00012445449829101562, 0.00013114511966705322, 0.00013783574104309082, 0.00014452636241912842, 0.00015121698379516602, 0.0001579076051712036, 0.0001645982265472412, 0.0001712888479232788, 0.0001779794692993164, 0.000184670090675354, 0.0001913607120513916, 0.0001980513334274292, 0.0002047419548034668, 0.0002114325761795044, 0.000218123197555542, 0.0002248138189315796, 0.0002315044403076172]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 7.0, 3.0, 4.0, 6.0, 12.0, 22.0, 24.0, 54.0, 86.0, 162.0, 279.0, 508.0, 1155.0, 3233.0, 11184.0, 80193.0, 722084.0, 200764.0, 20936.0, 4688.0, 1668.0, 705.0, 326.0, 163.0, 104.0, 68.0, 37.0, 25.0, 17.0, 14.0, 8.0, 2.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9033203125, -0.8738784790039062, -0.8444366455078125, -0.8149948120117188, -0.785552978515625, -0.7561111450195312, -0.7266693115234375, -0.6972274780273438, -0.66778564453125, -0.6383438110351562, -0.6089019775390625, -0.5794601440429688, -0.550018310546875, -0.5205764770507812, -0.4911346435546875, -0.46169281005859375, -0.4322509765625, -0.40280914306640625, -0.3733673095703125, -0.34392547607421875, -0.314483642578125, -0.28504180908203125, -0.2555999755859375, -0.22615814208984375, -0.19671630859375, -0.16727447509765625, -0.1378326416015625, -0.10839080810546875, -0.078948974609375, -0.04950714111328125, -0.0200653076171875, 0.00937652587890625, 0.038818359375, 0.06826019287109375, 0.0977020263671875, 0.12714385986328125, 0.156585693359375, 0.18602752685546875, 0.2154693603515625, 0.24491119384765625, 0.27435302734375, 0.30379486083984375, 0.3332366943359375, 0.36267852783203125, 0.392120361328125, 0.42156219482421875, 0.4510040283203125, 0.48044586181640625, 0.5098876953125, 0.5393295288085938, 0.5687713623046875, 0.5982131958007812, 0.627655029296875, 0.6570968627929688, 0.6865386962890625, 0.7159805297851562, 0.74542236328125, 0.7748641967773438, 0.8043060302734375, 0.8337478637695312, 0.863189697265625, 0.8926315307617188, 0.9220733642578125, 0.9515151977539062, 0.98095703125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 8.0, 5.0, 8.0, 6.0, 13.0, 15.0, 21.0, 23.0, 33.0, 35.0, 50.0, 53.0, 66.0, 86.0, 80.0, 82.0, 71.0, 69.0, 77.0, 59.0, 30.0, 26.0, 29.0, 14.0, 10.0, 13.0, 9.0, 7.0, 4.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.66455078125, -0.6380538940429688, -0.6115570068359375, -0.5850601196289062, -0.558563232421875, -0.5320663452148438, -0.5055694580078125, -0.47907257080078125, -0.45257568359375, -0.42607879638671875, -0.3995819091796875, -0.37308502197265625, -0.346588134765625, -0.32009124755859375, -0.2935943603515625, -0.26709747314453125, -0.2406005859375, -0.21410369873046875, -0.1876068115234375, -0.16110992431640625, -0.134613037109375, -0.10811614990234375, -0.0816192626953125, -0.05512237548828125, -0.02862548828125, -0.00212860107421875, 0.0243682861328125, 0.05086517333984375, 0.077362060546875, 0.10385894775390625, 0.1303558349609375, 0.15685272216796875, 0.183349609375, 0.20984649658203125, 0.2363433837890625, 0.26284027099609375, 0.289337158203125, 0.31583404541015625, 0.3423309326171875, 0.36882781982421875, 0.39532470703125, 0.42182159423828125, 0.4483184814453125, 0.47481536865234375, 0.501312255859375, 0.5278091430664062, 0.5543060302734375, 0.5808029174804688, 0.6072998046875, 0.6337966918945312, 0.6602935791015625, 0.6867904663085938, 0.713287353515625, 0.7397842407226562, 0.7662811279296875, 0.7927780151367188, 0.81927490234375, 0.8457717895507812, 0.8722686767578125, 0.8987655639648438, 0.925262451171875, 0.9517593383789062, 0.9782562255859375, 1.0047531127929688, 1.03125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 52.0, 240.0, 532.0, 164.0, 18.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.50355529785156, -74.56202697753906, -72.6205062866211, -70.6789779663086, -68.7374496459961, -66.79592895507812, -64.85440063476562, -62.91287612915039, -60.971351623535156, -59.02982711791992, -57.08829879760742, -55.14677429199219, -53.20524978637695, -51.26372528076172, -49.32219696044922, -47.380672454833984, -45.439144134521484, -43.49761962890625, -41.55609130859375, -39.614566802978516, -37.67304229736328, -35.73151397705078, -33.78998947143555, -31.848464965820312, -29.906938552856445, -27.965412139892578, -26.023887634277344, -24.082361221313477, -22.14083480834961, -20.199310302734375, -18.257783889770508, -16.31625747680664, -14.374736785888672, -12.433211326599121, -10.49168586730957, -8.550159454345703, -6.608633995056152, -4.667108535766602, -2.7255821228027344, -0.7840566635131836, 1.1574687957763672, 3.098994493484497, 5.040520191192627, 6.982046127319336, 8.923571586608887, 10.865097045898438, 12.806623458862305, 14.748148918151855, 16.689674377441406, 18.631200790405273, 20.572725296020508, 22.514251708984375, 24.45577621459961, 26.397302627563477, 28.338829040527344, 30.280353546142578, 32.22187805175781, 34.16340255737305, 36.10493087768555, 38.04645538330078, 39.987979888916016, 41.92950439453125, 43.87103271484375, 45.812557220458984, 47.754085540771484]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 11.0, 15.0, 25.0, 38.0, 40.0, 29.0, 57.0, 76.0, 74.0, 82.0, 96.0, 80.0, 75.0, 63.0, 53.0, 35.0, 27.0, 38.0, 27.0, 21.0, 10.0, 4.0, 8.0, 6.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.208656311035156, -11.64046573638916, -11.072275161743164, -10.504084587097168, -9.935894012451172, -9.36770248413086, -8.799511909484863, -8.231321334838867, -7.663130760192871, -7.094940185546875, -6.526749610900879, -5.958558559417725, -5.3903679847717285, -4.822177410125732, -4.253986358642578, -3.685795783996582, -3.117605209350586, -2.54941463470459, -1.9812238216400146, -1.413033127784729, -0.8448424339294434, -0.27665185928344727, 0.29153895378112793, 0.8597297668457031, 1.4279203414916992, 1.9961110353469849, 2.5643017292022705, 3.1324925422668457, 3.700683116912842, 4.268873691558838, 4.837064743041992, 5.405255317687988, 5.973445892333984, 6.5416364669799805, 7.109827041625977, 7.678018093109131, 8.246208190917969, 8.814399719238281, 9.382590293884277, 9.950780868530273, 10.51897144317627, 11.087162017822266, 11.655352592468262, 12.223543167114258, 12.79173469543457, 13.35992431640625, 13.928115844726562, 14.496306419372559, 15.064496994018555, 15.63268756866455, 16.200878143310547, 16.76906967163086, 17.33725929260254, 17.90545082092285, 18.47364044189453, 19.041831970214844, 19.610023498535156, 20.17821502685547, 20.74640464782715, 21.31459617614746, 21.88278579711914, 22.450977325439453, 23.019166946411133, 23.587358474731445, 24.155548095703125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 7.0, 2.0, 3.0, 5.0, 6.0, 13.0, 19.0, 28.0, 49.0, 86.0, 187.0, 374.0, 1018.0, 3378.0, 14450.0, 105262.0, 3593194.0, 439311.0, 27866.0, 5924.0, 1758.0, 675.0, 274.0, 155.0, 72.0, 55.0, 37.0, 26.0, 17.0, 10.0, 10.0, 6.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.033203125, -1.9746246337890625, -1.916046142578125, -1.8574676513671875, -1.79888916015625, -1.7403106689453125, -1.681732177734375, -1.6231536865234375, -1.5645751953125, -1.5059967041015625, -1.447418212890625, -1.3888397216796875, -1.33026123046875, -1.2716827392578125, -1.213104248046875, -1.1545257568359375, -1.095947265625, -1.0373687744140625, -0.978790283203125, -0.9202117919921875, -0.86163330078125, -0.8030548095703125, -0.744476318359375, -0.6858978271484375, -0.6273193359375, -0.5687408447265625, -0.510162353515625, -0.4515838623046875, -0.39300537109375, -0.3344268798828125, -0.275848388671875, -0.2172698974609375, -0.15869140625, -0.1001129150390625, -0.041534423828125, 0.0170440673828125, 0.07562255859375, 0.1342010498046875, 0.192779541015625, 0.2513580322265625, 0.3099365234375, 0.3685150146484375, 0.427093505859375, 0.4856719970703125, 0.54425048828125, 0.6028289794921875, 0.661407470703125, 0.7199859619140625, 0.778564453125, 0.8371429443359375, 0.895721435546875, 0.9542999267578125, 1.01287841796875, 1.0714569091796875, 1.130035400390625, 1.1886138916015625, 1.2471923828125, 1.3057708740234375, 1.364349365234375, 1.4229278564453125, 1.48150634765625, 1.5400848388671875, 1.598663330078125, 1.6572418212890625, 1.7158203125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 20.0, 21.0, 32.0, 44.0, 62.0, 94.0, 100.0, 118.0, 114.0, 93.0, 83.0, 68.0, 55.0, 30.0, 18.0, 21.0, 15.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6360549926757812, -0.5968170166015625, -0.5575790405273438, -0.518341064453125, -0.47910308837890625, -0.4398651123046875, -0.40062713623046875, -0.36138916015625, -0.32215118408203125, -0.2829132080078125, -0.24367523193359375, -0.204437255859375, -0.16519927978515625, -0.1259613037109375, -0.08672332763671875, -0.0474853515625, -0.00824737548828125, 0.0309906005859375, 0.07022857666015625, 0.109466552734375, 0.14870452880859375, 0.1879425048828125, 0.22718048095703125, 0.26641845703125, 0.30565643310546875, 0.3448944091796875, 0.38413238525390625, 0.423370361328125, 0.46260833740234375, 0.5018463134765625, 0.5410842895507812, 0.580322265625, 0.6195602416992188, 0.6587982177734375, 0.6980361938476562, 0.737274169921875, 0.7765121459960938, 0.8157501220703125, 0.8549880981445312, 0.89422607421875, 0.9334640502929688, 0.9727020263671875, 1.0119400024414062, 1.051177978515625, 1.0904159545898438, 1.1296539306640625, 1.1688919067382812, 1.2081298828125, 1.2473678588867188, 1.2866058349609375, 1.3258438110351562, 1.365081787109375, 1.4043197631835938, 1.4435577392578125, 1.4827957153320312, 1.52203369140625, 1.5612716674804688, 1.6005096435546875, 1.6397476196289062, 1.678985595703125, 1.7182235717773438, 1.7574615478515625, 1.7966995239257812, 1.8359375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 7.0, 2.0, 1.0, 1.0, 12.0, 7.0, 17.0, 31.0, 35.0, 55.0, 108.0, 178.0, 311.0, 703.0, 1453.0, 3292.0, 7941.0, 21684.0, 82117.0, 899304.0, 2946036.0, 175515.0, 36060.0, 11405.0, 4438.0, 1889.0, 810.0, 391.0, 203.0, 108.0, 69.0, 38.0, 19.0, 18.0, 6.0, 9.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5166015625, -1.472259521484375, -1.42791748046875, -1.383575439453125, -1.3392333984375, -1.294891357421875, -1.25054931640625, -1.206207275390625, -1.161865234375, -1.117523193359375, -1.07318115234375, -1.028839111328125, -0.9844970703125, -0.940155029296875, -0.89581298828125, -0.851470947265625, -0.80712890625, -0.762786865234375, -0.71844482421875, -0.674102783203125, -0.6297607421875, -0.585418701171875, -0.54107666015625, -0.496734619140625, -0.452392578125, -0.408050537109375, -0.36370849609375, -0.319366455078125, -0.2750244140625, -0.230682373046875, -0.18634033203125, -0.141998291015625, -0.09765625, -0.053314208984375, -0.00897216796875, 0.035369873046875, 0.0797119140625, 0.124053955078125, 0.16839599609375, 0.212738037109375, 0.257080078125, 0.301422119140625, 0.34576416015625, 0.390106201171875, 0.4344482421875, 0.478790283203125, 0.52313232421875, 0.567474365234375, 0.61181640625, 0.656158447265625, 0.70050048828125, 0.744842529296875, 0.7891845703125, 0.833526611328125, 0.87786865234375, 0.922210693359375, 0.966552734375, 1.010894775390625, 1.05523681640625, 1.099578857421875, 1.1439208984375, 1.188262939453125, 1.23260498046875, 1.276947021484375, 1.3212890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 5.0, 7.0, 5.0, 8.0, 8.0, 16.0, 19.0, 23.0, 43.0, 43.0, 84.0, 144.0, 289.0, 648.0, 1122.0, 743.0, 334.0, 172.0, 121.0, 75.0, 43.0, 30.0, 20.0, 21.0, 12.0, 11.0, 6.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.958984375, -1.9055633544921875, -1.852142333984375, -1.7987213134765625, -1.74530029296875, -1.6918792724609375, -1.638458251953125, -1.5850372314453125, -1.5316162109375, -1.4781951904296875, -1.424774169921875, -1.3713531494140625, -1.31793212890625, -1.2645111083984375, -1.211090087890625, -1.1576690673828125, -1.104248046875, -1.0508270263671875, -0.997406005859375, -0.9439849853515625, -0.89056396484375, -0.8371429443359375, -0.783721923828125, -0.7303009033203125, -0.6768798828125, -0.6234588623046875, -0.570037841796875, -0.5166168212890625, -0.46319580078125, -0.4097747802734375, -0.356353759765625, -0.3029327392578125, -0.24951171875, -0.1960906982421875, -0.142669677734375, -0.0892486572265625, -0.03582763671875, 0.0175933837890625, 0.071014404296875, 0.1244354248046875, 0.1778564453125, 0.2312774658203125, 0.284698486328125, 0.3381195068359375, 0.39154052734375, 0.4449615478515625, 0.498382568359375, 0.5518035888671875, 0.605224609375, 0.6586456298828125, 0.712066650390625, 0.7654876708984375, 0.81890869140625, 0.8723297119140625, 0.925750732421875, 0.9791717529296875, 1.0325927734375, 1.0860137939453125, 1.139434814453125, 1.1928558349609375, 1.24627685546875, 1.2996978759765625, 1.353118896484375, 1.4065399169921875, 1.4599609375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 8.0, 20.0, 33.0, 106.0, 206.0, 255.0, 187.0, 93.0, 37.0, 22.0, 5.0, 8.0, 4.0, 9.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.511463165283203, -19.945589065551758, -19.379714965820312, -18.8138427734375, -18.247968673706055, -17.68209457397461, -17.116220474243164, -16.55034637451172, -15.984474182128906, -15.418600082397461, -14.852726936340332, -14.286852836608887, -13.720979690551758, -13.155105590820312, -12.589231491088867, -12.023358345031738, -11.457484245300293, -10.891610145568848, -10.325736999511719, -9.759862899780273, -9.193989753723145, -8.6281156539917, -8.06224250793457, -7.496368408203125, -6.930494785308838, -6.364621162414551, -5.798747539520264, -5.232873916625977, -4.666999816894531, -4.101126670837402, -3.535252571105957, -2.96937894821167, -2.403505325317383, -1.8376317024230957, -1.271757960319519, -0.7058842182159424, -0.14001059532165527, 0.42586302757263184, 0.991736888885498, 1.5576105117797852, 2.1234841346740723, 2.6893577575683594, 3.2552313804626465, 3.8211052417755127, 4.386979103088379, 4.952852249145508, 5.518726348876953, 6.08459997177124, 6.650473594665527, 7.2163472175598145, 7.782220840454102, 8.348094940185547, 8.913968086242676, 9.479842185974121, 10.04571533203125, 10.611589431762695, 11.17746353149414, 11.743337631225586, 12.309210777282715, 12.87508487701416, 13.440958023071289, 14.006832122802734, 14.57270622253418, 15.138579368591309, 15.704452514648438]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 7.0, 7.0, 9.0, 13.0, 17.0, 25.0, 26.0, 29.0, 43.0, 49.0, 54.0, 58.0, 68.0, 73.0, 44.0, 65.0, 57.0, 61.0, 49.0, 55.0, 41.0, 33.0, 27.0, 33.0, 13.0, 16.0, 5.0, 9.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.97507095336914, -10.702346801757812, -10.4296236038208, -10.156900405883789, -9.884176254272461, -9.611452102661133, -9.338728904724121, -9.06600570678711, -8.793281555175781, -8.520557403564453, -8.247834205627441, -7.9751105308532715, -7.702386856079102, -7.429663181304932, -7.156939506530762, -6.884215831756592, -6.611492156982422, -6.338768482208252, -6.066044807434082, -5.793321132659912, -5.520597457885742, -5.247873783111572, -4.975150108337402, -4.702426433563232, -4.4297027587890625, -4.156979084014893, -3.8842554092407227, -3.6115317344665527, -3.338808059692383, -3.066084384918213, -2.793360710144043, -2.520637035369873, -2.2479124069213867, -1.9751887321472168, -1.7024650573730469, -1.429741382598877, -1.157017707824707, -0.8842940330505371, -0.6115703582763672, -0.33884668350219727, -0.06612300872802734, 0.20660066604614258, 0.4793243408203125, 0.7520480155944824, 1.0247716903686523, 1.2974953651428223, 1.5702190399169922, 1.842942714691162, 2.115666389465332, 2.388390064239502, 2.661113739013672, 2.933837413787842, 3.2065610885620117, 3.4792847633361816, 3.7520084381103516, 4.0247321128845215, 4.297455787658691, 4.570179462432861, 4.842903137207031, 5.115626811981201, 5.388350486755371, 5.661074161529541, 5.933797836303711, 6.206521511077881, 6.479245185852051]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 15.0, 10.0, 18.0, 16.0, 37.0, 72.0, 102.0, 179.0, 282.0, 548.0, 972.0, 1831.0, 3556.0, 7507.0, 16546.0, 39832.0, 97100.0, 224158.0, 319042.0, 194028.0, 81706.0, 33418.0, 14379.0, 6529.0, 3095.0, 1550.0, 895.0, 474.0, 277.0, 150.0, 91.0, 48.0, 26.0, 19.0, 15.0, 11.0, 4.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.0791015625, -1.04473876953125, -1.0103759765625, -0.97601318359375, -0.941650390625, -0.90728759765625, -0.8729248046875, -0.83856201171875, -0.80419921875, -0.76983642578125, -0.7354736328125, -0.70111083984375, -0.666748046875, -0.63238525390625, -0.5980224609375, -0.56365966796875, -0.529296875, -0.49493408203125, -0.4605712890625, -0.42620849609375, -0.391845703125, -0.35748291015625, -0.3231201171875, -0.28875732421875, -0.25439453125, -0.22003173828125, -0.1856689453125, -0.15130615234375, -0.116943359375, -0.08258056640625, -0.0482177734375, -0.01385498046875, 0.0205078125, 0.05487060546875, 0.0892333984375, 0.12359619140625, 0.157958984375, 0.19232177734375, 0.2266845703125, 0.26104736328125, 0.29541015625, 0.32977294921875, 0.3641357421875, 0.39849853515625, 0.432861328125, 0.46722412109375, 0.5015869140625, 0.53594970703125, 0.5703125, 0.60467529296875, 0.6390380859375, 0.67340087890625, 0.707763671875, 0.74212646484375, 0.7764892578125, 0.81085205078125, 0.84521484375, 0.87957763671875, 0.9139404296875, 0.94830322265625, 0.982666015625, 1.01702880859375, 1.0513916015625, 1.08575439453125, 1.1201171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 2.0, 9.0, 8.0, 10.0, 22.0, 19.0, 20.0, 23.0, 30.0, 31.0, 43.0, 45.0, 29.0, 41.0, 64.0, 44.0, 67.0, 46.0, 61.0, 43.0, 42.0, 37.0, 50.0, 43.0, 34.0, 20.0, 32.0, 15.0, 11.0, 12.0, 10.0, 13.0, 7.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5615234375, -0.5419845581054688, -0.5224456787109375, -0.5029067993164062, -0.483367919921875, -0.46382904052734375, -0.4442901611328125, -0.42475128173828125, -0.40521240234375, -0.38567352294921875, -0.3661346435546875, -0.34659576416015625, -0.327056884765625, -0.30751800537109375, -0.2879791259765625, -0.26844024658203125, -0.2489013671875, -0.22936248779296875, -0.2098236083984375, -0.19028472900390625, -0.170745849609375, -0.15120697021484375, -0.1316680908203125, -0.11212921142578125, -0.09259033203125, -0.07305145263671875, -0.0535125732421875, -0.03397369384765625, -0.014434814453125, 0.00510406494140625, 0.0246429443359375, 0.04418182373046875, 0.063720703125, 0.08325958251953125, 0.1027984619140625, 0.12233734130859375, 0.141876220703125, 0.16141510009765625, 0.1809539794921875, 0.20049285888671875, 0.22003173828125, 0.23957061767578125, 0.2591094970703125, 0.27864837646484375, 0.298187255859375, 0.31772613525390625, 0.3372650146484375, 0.35680389404296875, 0.3763427734375, 0.39588165283203125, 0.4154205322265625, 0.43495941162109375, 0.454498291015625, 0.47403717041015625, 0.4935760498046875, 0.5131149291992188, 0.53265380859375, 0.5521926879882812, 0.5717315673828125, 0.5912704467773438, 0.610809326171875, 0.6303482055664062, 0.6498870849609375, 0.6694259643554688, 0.68896484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 1.0, 0.0, 7.0, 6.0, 11.0, 11.0, 23.0, 25.0, 34.0, 47.0, 87.0, 130.0, 231.0, 330.0, 692.0, 1330.0, 3303.0, 11159.0, 56850.0, 386073.0, 500787.0, 67930.0, 12789.0, 3620.0, 1365.0, 713.0, 381.0, 224.0, 132.0, 70.0, 57.0, 30.0, 35.0, 25.0, 18.0, 9.0, 6.0, 2.0, 2.0, 5.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3125, -2.242523193359375, -2.17254638671875, -2.102569580078125, -2.0325927734375, -1.962615966796875, -1.89263916015625, -1.822662353515625, -1.752685546875, -1.682708740234375, -1.61273193359375, -1.542755126953125, -1.4727783203125, -1.402801513671875, -1.33282470703125, -1.262847900390625, -1.19287109375, -1.122894287109375, -1.05291748046875, -0.982940673828125, -0.9129638671875, -0.842987060546875, -0.77301025390625, -0.703033447265625, -0.633056640625, -0.563079833984375, -0.49310302734375, -0.423126220703125, -0.3531494140625, -0.283172607421875, -0.21319580078125, -0.143218994140625, -0.0732421875, -0.003265380859375, 0.06671142578125, 0.136688232421875, 0.2066650390625, 0.276641845703125, 0.34661865234375, 0.416595458984375, 0.486572265625, 0.556549072265625, 0.62652587890625, 0.696502685546875, 0.7664794921875, 0.836456298828125, 0.90643310546875, 0.976409912109375, 1.04638671875, 1.116363525390625, 1.18634033203125, 1.256317138671875, 1.3262939453125, 1.396270751953125, 1.46624755859375, 1.536224365234375, 1.606201171875, 1.676177978515625, 1.74615478515625, 1.816131591796875, 1.8861083984375, 1.956085205078125, 2.02606201171875, 2.096038818359375, 2.166015625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 2.0, 6.0, 5.0, 8.0, 11.0, 10.0, 15.0, 18.0, 14.0, 18.0, 30.0, 20.0, 36.0, 26.0, 34.0, 40.0, 49.0, 47.0, 59.0, 46.0, 57.0, 52.0, 52.0, 52.0, 49.0, 46.0, 29.0, 32.0, 24.0, 19.0, 23.0, 20.0, 10.0, 13.0, 7.0, 8.0, 9.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.162109375, -2.086944580078125, -2.01177978515625, -1.936614990234375, -1.8614501953125, -1.786285400390625, -1.71112060546875, -1.635955810546875, -1.560791015625, -1.485626220703125, -1.41046142578125, -1.335296630859375, -1.2601318359375, -1.184967041015625, -1.10980224609375, -1.034637451171875, -0.95947265625, -0.884307861328125, -0.80914306640625, -0.733978271484375, -0.6588134765625, -0.583648681640625, -0.50848388671875, -0.433319091796875, -0.358154296875, -0.282989501953125, -0.20782470703125, -0.132659912109375, -0.0574951171875, 0.017669677734375, 0.09283447265625, 0.167999267578125, 0.2431640625, 0.318328857421875, 0.39349365234375, 0.468658447265625, 0.5438232421875, 0.618988037109375, 0.69415283203125, 0.769317626953125, 0.844482421875, 0.919647216796875, 0.99481201171875, 1.069976806640625, 1.1451416015625, 1.220306396484375, 1.29547119140625, 1.370635986328125, 1.44580078125, 1.520965576171875, 1.59613037109375, 1.671295166015625, 1.7464599609375, 1.821624755859375, 1.89678955078125, 1.971954345703125, 2.047119140625, 2.122283935546875, 2.19744873046875, 2.272613525390625, 2.3477783203125, 2.422943115234375, 2.49810791015625, 2.573272705078125, 2.6484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 11.0, 6.0, 4.0, 9.0, 22.0, 33.0, 54.0, 84.0, 195.0, 392.0, 1119.0, 4001.0, 26140.0, 404726.0, 572790.0, 32325.0, 4476.0, 1196.0, 481.0, 206.0, 112.0, 60.0, 38.0, 27.0, 14.0, 14.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.423828125, -1.3853912353515625, -1.346954345703125, -1.3085174560546875, -1.27008056640625, -1.2316436767578125, -1.193206787109375, -1.1547698974609375, -1.1163330078125, -1.0778961181640625, -1.039459228515625, -1.0010223388671875, -0.96258544921875, -0.9241485595703125, -0.885711669921875, -0.8472747802734375, -0.808837890625, -0.7704010009765625, -0.731964111328125, -0.6935272216796875, -0.65509033203125, -0.6166534423828125, -0.578216552734375, -0.5397796630859375, -0.5013427734375, -0.4629058837890625, -0.424468994140625, -0.3860321044921875, -0.34759521484375, -0.3091583251953125, -0.270721435546875, -0.2322845458984375, -0.19384765625, -0.1554107666015625, -0.116973876953125, -0.0785369873046875, -0.04010009765625, -0.0016632080078125, 0.036773681640625, 0.0752105712890625, 0.1136474609375, 0.1520843505859375, 0.190521240234375, 0.2289581298828125, 0.26739501953125, 0.3058319091796875, 0.344268798828125, 0.3827056884765625, 0.421142578125, 0.4595794677734375, 0.498016357421875, 0.5364532470703125, 0.57489013671875, 0.6133270263671875, 0.651763916015625, 0.6902008056640625, 0.7286376953125, 0.7670745849609375, 0.805511474609375, 0.8439483642578125, 0.88238525390625, 0.9208221435546875, 0.959259033203125, 0.9976959228515625, 1.0361328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 3.0, 10.0, 11.0, 22.0, 20.0, 30.0, 38.0, 55.0, 74.0, 107.0, 147.0, 121.0, 99.0, 90.0, 49.0, 32.0, 23.0, 17.0, 11.0, 12.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00024509429931640625, -0.00023714080452919006, -0.00022918730974197388, -0.0002212338149547577, -0.0002132803201675415, -0.00020532682538032532, -0.00019737333059310913, -0.00018941983580589294, -0.00018146634101867676, -0.00017351284623146057, -0.00016555935144424438, -0.0001576058566570282, -0.000149652361869812, -0.00014169886708259583, -0.00013374537229537964, -0.00012579187750816345, -0.00011783838272094727, -0.00010988488793373108, -0.00010193139314651489, -9.39778983592987e-05, -8.602440357208252e-05, -7.807090878486633e-05, -7.011741399765015e-05, -6.216391921043396e-05, -5.4210424423217773e-05, -4.625692963600159e-05, -3.83034348487854e-05, -3.0349940061569214e-05, -2.2396445274353027e-05, -1.444295048713684e-05, -6.489455699920654e-06, 1.4640390872955322e-06, 9.417533874511719e-06, 1.7371028661727905e-05, 2.5324523448944092e-05, 3.327801823616028e-05, 4.1231513023376465e-05, 4.918500781059265e-05, 5.713850259780884e-05, 6.509199738502502e-05, 7.304549217224121e-05, 8.09989869594574e-05, 8.895248174667358e-05, 9.690597653388977e-05, 0.00010485947132110596, 0.00011281296610832214, 0.00012076646089553833, 0.00012871995568275452, 0.0001366734504699707, 0.0001446269452571869, 0.00015258044004440308, 0.00016053393483161926, 0.00016848742961883545, 0.00017644092440605164, 0.00018439441919326782, 0.000192347913980484, 0.0002003014087677002, 0.00020825490355491638, 0.00021620839834213257, 0.00022416189312934875, 0.00023211538791656494, 0.00024006888270378113, 0.0002480223774909973, 0.0002559758722782135, 0.0002639293670654297]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 8.0, 8.0, 10.0, 11.0, 11.0, 26.0, 26.0, 43.0, 56.0, 105.0, 145.0, 225.0, 362.0, 857.0, 1769.0, 4940.0, 17177.0, 89947.0, 563272.0, 304078.0, 48503.0, 10607.0, 3419.0, 1382.0, 615.0, 383.0, 223.0, 123.0, 63.0, 59.0, 28.0, 26.0, 17.0, 12.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.76513671875, -0.7418289184570312, -0.7185211181640625, -0.6952133178710938, -0.671905517578125, -0.6485977172851562, -0.6252899169921875, -0.6019821166992188, -0.57867431640625, -0.5553665161132812, -0.5320587158203125, -0.5087509155273438, -0.485443115234375, -0.46213531494140625, -0.4388275146484375, -0.41551971435546875, -0.3922119140625, -0.36890411376953125, -0.3455963134765625, -0.32228851318359375, -0.298980712890625, -0.27567291259765625, -0.2523651123046875, -0.22905731201171875, -0.20574951171875, -0.18244171142578125, -0.1591339111328125, -0.13582611083984375, -0.112518310546875, -0.08921051025390625, -0.0659027099609375, -0.04259490966796875, -0.019287109375, 0.00402069091796875, 0.0273284912109375, 0.05063629150390625, 0.073944091796875, 0.09725189208984375, 0.1205596923828125, 0.14386749267578125, 0.16717529296875, 0.19048309326171875, 0.2137908935546875, 0.23709869384765625, 0.260406494140625, 0.28371429443359375, 0.3070220947265625, 0.33032989501953125, 0.3536376953125, 0.37694549560546875, 0.4002532958984375, 0.42356109619140625, 0.446868896484375, 0.47017669677734375, 0.4934844970703125, 0.5167922973632812, 0.54010009765625, 0.5634078979492188, 0.5867156982421875, 0.6100234985351562, 0.633331298828125, 0.6566390991210938, 0.6799468994140625, 0.7032546997070312, 0.7265625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 8.0, 9.0, 8.0, 5.0, 10.0, 22.0, 20.0, 29.0, 33.0, 42.0, 42.0, 61.0, 63.0, 64.0, 81.0, 82.0, 75.0, 59.0, 62.0, 57.0, 51.0, 33.0, 18.0, 15.0, 14.0, 7.0, 11.0, 5.0, 2.0, 4.0, 3.0, 0.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.90380859375, -0.8791961669921875, -0.854583740234375, -0.8299713134765625, -0.80535888671875, -0.7807464599609375, -0.756134033203125, -0.7315216064453125, -0.7069091796875, -0.6822967529296875, -0.657684326171875, -0.6330718994140625, -0.60845947265625, -0.5838470458984375, -0.559234619140625, -0.5346221923828125, -0.510009765625, -0.4853973388671875, -0.460784912109375, -0.4361724853515625, -0.41156005859375, -0.3869476318359375, -0.362335205078125, -0.3377227783203125, -0.3131103515625, -0.2884979248046875, -0.263885498046875, -0.2392730712890625, -0.21466064453125, -0.1900482177734375, -0.165435791015625, -0.1408233642578125, -0.1162109375, -0.0915985107421875, -0.066986083984375, -0.0423736572265625, -0.01776123046875, 0.0068511962890625, 0.031463623046875, 0.0560760498046875, 0.0806884765625, 0.1053009033203125, 0.129913330078125, 0.1545257568359375, 0.17913818359375, 0.2037506103515625, 0.228363037109375, 0.2529754638671875, 0.277587890625, 0.3022003173828125, 0.326812744140625, 0.3514251708984375, 0.37603759765625, 0.4006500244140625, 0.425262451171875, 0.4498748779296875, 0.4744873046875, 0.4990997314453125, 0.523712158203125, 0.5483245849609375, 0.57293701171875, 0.5975494384765625, 0.622161865234375, 0.6467742919921875, 0.67138671875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 11.0, 20.0, 28.0, 68.0, 89.0, 136.0, 210.0, 173.0, 121.0, 70.0, 35.0, 19.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.06265640258789, -23.512418746948242, -22.962181091308594, -22.411943435668945, -21.861705780029297, -21.311466217041016, -20.76123046875, -20.21099090576172, -19.66075325012207, -19.110515594482422, -18.560277938842773, -18.010040283203125, -17.459802627563477, -16.909564971923828, -16.359325408935547, -15.809088706970215, -15.258851051330566, -14.708613395690918, -14.15837574005127, -13.608137130737305, -13.057899475097656, -12.507661819458008, -11.95742416381836, -11.407186508178711, -10.856948852539062, -10.306711196899414, -9.756473541259766, -9.206235885620117, -8.655997276306152, -8.105759620666504, -7.5555219650268555, -7.005284309387207, -6.455045700073242, -5.904808044433594, -5.354569911956787, -4.804332256317139, -4.254094123840332, -3.7038564682006836, -3.153618812561035, -2.6033809185028076, -2.05314302444458, -1.5029051303863525, -0.9526673555374146, -0.40242958068847656, 0.14780831336975098, 0.6980462074279785, 1.248283863067627, 1.7985217571258545, 2.348759651184082, 2.8989975452423096, 3.449235439300537, 3.9994730949401855, 4.549711227416992, 5.099948883056641, 5.650186538696289, 6.2004241943359375, 6.750662326812744, 7.300899982452393, 7.851138114929199, 8.401375770568848, 8.951613426208496, 9.501852035522461, 10.05208969116211, 10.602327346801758, 11.152565002441406]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 1.0, 5.0, 11.0, 8.0, 11.0, 9.0, 19.0, 18.0, 21.0, 20.0, 26.0, 33.0, 30.0, 28.0, 44.0, 49.0, 47.0, 60.0, 74.0, 71.0, 53.0, 49.0, 44.0, 31.0, 37.0, 29.0, 27.0, 24.0, 23.0, 18.0, 19.0, 16.0, 16.0, 3.0, 9.0, 9.0, 0.0, 5.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.196157455444336, -8.872919082641602, -8.549680709838867, -8.226442337036133, -7.90320348739624, -7.579965114593506, -7.256726264953613, -6.933487892150879, -6.6102495193481445, -6.28701114654541, -5.963772773742676, -5.640533924102783, -5.317295551300049, -4.9940571784973145, -4.670818328857422, -4.3475799560546875, -4.024341583251953, -3.7011032104492188, -3.3778645992279053, -3.054625988006592, -2.7313876152038574, -2.408149242401123, -2.0849106311798096, -1.761672019958496, -1.4384336471557617, -1.1151951551437378, -0.7919566631317139, -0.46871817111968994, -0.14547967910766602, 0.1777588129043579, 0.5009973049163818, 0.8242359161376953, 1.1474733352661133, 1.4707118272781372, 1.7939503192901611, 2.1171889305114746, 2.440427303314209, 2.7636656761169434, 3.086904287338257, 3.4101428985595703, 3.7333812713623047, 4.056619644165039, 4.379858016967773, 4.703096866607666, 5.0263352394104, 5.349573612213135, 5.672812461853027, 5.996050834655762, 6.319289207458496, 6.6425275802612305, 6.965765953063965, 7.289004802703857, 7.612243175506592, 7.935481548309326, 8.258720397949219, 8.581958770751953, 8.905197143554688, 9.228435516357422, 9.551673889160156, 9.87491226196289, 10.198150634765625, 10.521389961242676, 10.84462833404541, 11.167866706848145, 11.491105079650879]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 10.0, 5.0, 8.0, 26.0, 20.0, 55.0, 67.0, 118.0, 207.0, 378.0, 685.0, 1303.0, 2768.0, 6139.0, 15233.0, 44501.0, 174596.0, 1136800.0, 2258958.0, 428667.0, 81422.0, 24579.0, 9544.0, 3986.0, 1906.0, 963.0, 517.0, 291.0, 177.0, 100.0, 80.0, 55.0, 25.0, 23.0, 15.0, 15.0, 9.0, 8.0, 8.0, 4.0, 6.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64990234375, -0.6260528564453125, -0.602203369140625, -0.5783538818359375, -0.55450439453125, -0.5306549072265625, -0.506805419921875, -0.4829559326171875, -0.4591064453125, -0.4352569580078125, -0.411407470703125, -0.3875579833984375, -0.36370849609375, -0.3398590087890625, -0.316009521484375, -0.2921600341796875, -0.268310546875, -0.2444610595703125, -0.220611572265625, -0.1967620849609375, -0.17291259765625, -0.1490631103515625, -0.125213623046875, -0.1013641357421875, -0.0775146484375, -0.0536651611328125, -0.029815673828125, -0.0059661865234375, 0.01788330078125, 0.0417327880859375, 0.065582275390625, 0.0894317626953125, 0.11328125, 0.1371307373046875, 0.160980224609375, 0.1848297119140625, 0.20867919921875, 0.2325286865234375, 0.256378173828125, 0.2802276611328125, 0.3040771484375, 0.3279266357421875, 0.351776123046875, 0.3756256103515625, 0.39947509765625, 0.4233245849609375, 0.447174072265625, 0.4710235595703125, 0.494873046875, 0.5187225341796875, 0.542572021484375, 0.5664215087890625, 0.59027099609375, 0.6141204833984375, 0.637969970703125, 0.6618194580078125, 0.6856689453125, 0.7095184326171875, 0.733367919921875, 0.7572174072265625, 0.78106689453125, 0.8049163818359375, 0.828765869140625, 0.8526153564453125, 0.87646484375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 5.0, 7.0, 6.0, 10.0, 13.0, 9.0, 14.0, 15.0, 31.0, 21.0, 34.0, 51.0, 57.0, 40.0, 44.0, 48.0, 59.0, 53.0, 56.0, 44.0, 44.0, 43.0, 43.0, 46.0, 35.0, 32.0, 29.0, 22.0, 30.0, 17.0, 8.0, 12.0, 10.0, 7.0, 2.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45458984375, -0.43566131591796875, -0.4167327880859375, -0.39780426025390625, -0.378875732421875, -0.35994720458984375, -0.3410186767578125, -0.32209014892578125, -0.30316162109375, -0.28423309326171875, -0.2653045654296875, -0.24637603759765625, -0.227447509765625, -0.20851898193359375, -0.1895904541015625, -0.17066192626953125, -0.1517333984375, -0.13280487060546875, -0.1138763427734375, -0.09494781494140625, -0.076019287109375, -0.05709075927734375, -0.0381622314453125, -0.01923370361328125, -0.00030517578125, 0.01862335205078125, 0.0375518798828125, 0.05648040771484375, 0.075408935546875, 0.09433746337890625, 0.1132659912109375, 0.13219451904296875, 0.151123046875, 0.17005157470703125, 0.1889801025390625, 0.20790863037109375, 0.226837158203125, 0.24576568603515625, 0.2646942138671875, 0.28362274169921875, 0.30255126953125, 0.32147979736328125, 0.3404083251953125, 0.35933685302734375, 0.378265380859375, 0.39719390869140625, 0.4161224365234375, 0.43505096435546875, 0.4539794921875, 0.47290802001953125, 0.4918365478515625, 0.5107650756835938, 0.529693603515625, 0.5486221313476562, 0.5675506591796875, 0.5864791870117188, 0.60540771484375, 0.6243362426757812, 0.6432647705078125, 0.6621932983398438, 0.681121826171875, 0.7000503540039062, 0.7189788818359375, 0.7379074096679688, 0.7568359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 5.0, 9.0, 8.0, 16.0, 18.0, 27.0, 37.0, 47.0, 80.0, 80.0, 141.0, 227.0, 442.0, 815.0, 1861.0, 4743.0, 14322.0, 56069.0, 385028.0, 3277127.0, 375236.0, 55818.0, 14281.0, 4440.0, 1652.0, 722.0, 369.0, 217.0, 132.0, 87.0, 78.0, 39.0, 36.0, 19.0, 24.0, 9.0, 6.0, 3.0, 5.0, 8.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2880859375, -1.244415283203125, -1.20074462890625, -1.157073974609375, -1.1134033203125, -1.069732666015625, -1.02606201171875, -0.982391357421875, -0.938720703125, -0.895050048828125, -0.85137939453125, -0.807708740234375, -0.7640380859375, -0.720367431640625, -0.67669677734375, -0.633026123046875, -0.58935546875, -0.545684814453125, -0.50201416015625, -0.458343505859375, -0.4146728515625, -0.371002197265625, -0.32733154296875, -0.283660888671875, -0.239990234375, -0.196319580078125, -0.15264892578125, -0.108978271484375, -0.0653076171875, -0.021636962890625, 0.02203369140625, 0.065704345703125, 0.109375, 0.153045654296875, 0.19671630859375, 0.240386962890625, 0.2840576171875, 0.327728271484375, 0.37139892578125, 0.415069580078125, 0.458740234375, 0.502410888671875, 0.54608154296875, 0.589752197265625, 0.6334228515625, 0.677093505859375, 0.72076416015625, 0.764434814453125, 0.80810546875, 0.851776123046875, 0.89544677734375, 0.939117431640625, 0.9827880859375, 1.026458740234375, 1.07012939453125, 1.113800048828125, 1.157470703125, 1.201141357421875, 1.24481201171875, 1.288482666015625, 1.3321533203125, 1.375823974609375, 1.41949462890625, 1.463165283203125, 1.5068359375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 8.0, 3.0, 5.0, 4.0, 15.0, 12.0, 14.0, 24.0, 21.0, 29.0, 41.0, 68.0, 96.0, 155.0, 213.0, 409.0, 624.0, 750.0, 538.0, 377.0, 201.0, 119.0, 82.0, 58.0, 47.0, 43.0, 23.0, 16.0, 16.0, 11.0, 14.0, 7.0, 11.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-1.689453125, -1.64306640625, -1.5966796875, -1.55029296875, -1.50390625, -1.45751953125, -1.4111328125, -1.36474609375, -1.318359375, -1.27197265625, -1.2255859375, -1.17919921875, -1.1328125, -1.08642578125, -1.0400390625, -0.99365234375, -0.947265625, -0.90087890625, -0.8544921875, -0.80810546875, -0.76171875, -0.71533203125, -0.6689453125, -0.62255859375, -0.576171875, -0.52978515625, -0.4833984375, -0.43701171875, -0.390625, -0.34423828125, -0.2978515625, -0.25146484375, -0.205078125, -0.15869140625, -0.1123046875, -0.06591796875, -0.01953125, 0.02685546875, 0.0732421875, 0.11962890625, 0.166015625, 0.21240234375, 0.2587890625, 0.30517578125, 0.3515625, 0.39794921875, 0.4443359375, 0.49072265625, 0.537109375, 0.58349609375, 0.6298828125, 0.67626953125, 0.72265625, 0.76904296875, 0.8154296875, 0.86181640625, 0.908203125, 0.95458984375, 1.0009765625, 1.04736328125, 1.09375, 1.14013671875, 1.1865234375, 1.23291015625, 1.279296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 1.0, 5.0, 12.0, 21.0, 28.0, 54.0, 100.0, 130.0, 182.0, 158.0, 113.0, 84.0, 41.0, 19.0, 15.0, 8.0, 5.0, 5.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.191397666931152, -12.758180618286133, -12.324963569641113, -11.891746520996094, -11.458529472351074, -11.025312423706055, -10.592095375061035, -10.158878326416016, -9.725661277770996, -9.292444229125977, -8.859227180480957, -8.426010131835938, -7.992793083190918, -7.559576034545898, -7.126358985900879, -6.693141937255859, -6.25992488861084, -5.82670783996582, -5.393490791320801, -4.960273742675781, -4.527056694030762, -4.093839645385742, -3.6606225967407227, -3.227405548095703, -2.7941884994506836, -2.360971450805664, -1.9277544021606445, -1.494537353515625, -1.0613203048706055, -0.6281032562255859, -0.1948862075805664, 0.23833084106445312, 0.6715478897094727, 1.1047649383544922, 1.5379819869995117, 1.9711990356445312, 2.404416084289551, 2.8376331329345703, 3.27085018157959, 3.7040672302246094, 4.137284278869629, 4.570501327514648, 5.003718376159668, 5.4369354248046875, 5.870152473449707, 6.303369522094727, 6.736586570739746, 7.169803619384766, 7.603020668029785, 8.036237716674805, 8.469454765319824, 8.902671813964844, 9.335888862609863, 9.769105911254883, 10.202322959899902, 10.635540008544922, 11.068757057189941, 11.501974105834961, 11.93519115447998, 12.368408203125, 12.80162525177002, 13.234842300415039, 13.668059349060059, 14.101276397705078, 14.534493446350098]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 3.0, 6.0, 2.0, 13.0, 8.0, 7.0, 12.0, 10.0, 21.0, 17.0, 24.0, 28.0, 39.0, 38.0, 38.0, 38.0, 46.0, 38.0, 71.0, 58.0, 66.0, 47.0, 46.0, 44.0, 38.0, 35.0, 39.0, 30.0, 24.0, 24.0, 20.0, 15.0, 18.0, 15.0, 10.0, 3.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.024250030517578, -8.745893478393555, -8.467537879943848, -8.189181327819824, -7.910825252532959, -7.632469177246094, -7.3541131019592285, -7.075757026672363, -6.79740047454834, -6.519044399261475, -6.240688323974609, -5.962331771850586, -5.683975696563721, -5.4056196212768555, -5.12726354598999, -4.848907470703125, -4.57055139541626, -4.2921953201293945, -4.013839244842529, -3.735482931137085, -3.4571266174316406, -3.1787705421447754, -2.90041446685791, -2.622058391571045, -2.3437020778656006, -2.0653460025787354, -1.786989688873291, -1.5086336135864258, -1.230277419090271, -0.9519212245941162, -0.673565149307251, -0.3952089548110962, -0.1168527603149414, 0.161503404378891, 0.4398595690727234, 0.7182157039642334, 0.9965718984603882, 1.274928092956543, 1.5532841682434082, 1.831640362739563, 2.1099965572357178, 2.388352632522583, 2.6667089462280273, 2.9450650215148926, 3.223421096801758, 3.501777410507202, 3.7801334857940674, 4.058489799499512, 4.336845874786377, 4.615201950073242, 4.893558025360107, 5.171914100646973, 5.450270652770996, 5.728626728057861, 6.006982803344727, 6.285338878631592, 6.563694953918457, 6.842051029205322, 7.1204071044921875, 7.398763656616211, 7.677119731903076, 7.955475807189941, 8.233831405639648, 8.512187957763672, 8.790544509887695]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 4.0, 4.0, 11.0, 8.0, 25.0, 37.0, 44.0, 62.0, 100.0, 163.0, 267.0, 453.0, 824.0, 1639.0, 3148.0, 6639.0, 13501.0, 28535.0, 59200.0, 115867.0, 198792.0, 242167.0, 179416.0, 100163.0, 50216.0, 24290.0, 11616.0, 5507.0, 2657.0, 1410.0, 731.0, 422.0, 222.0, 131.0, 92.0, 55.0, 45.0, 32.0, 19.0, 12.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6698760986328125, -0.645416259765625, -0.6209564208984375, -0.59649658203125, -0.5720367431640625, -0.547576904296875, -0.5231170654296875, -0.4986572265625, -0.4741973876953125, -0.449737548828125, -0.4252777099609375, -0.40081787109375, -0.3763580322265625, -0.351898193359375, -0.3274383544921875, -0.302978515625, -0.2785186767578125, -0.254058837890625, -0.2295989990234375, -0.20513916015625, -0.1806793212890625, -0.156219482421875, -0.1317596435546875, -0.1072998046875, -0.0828399658203125, -0.058380126953125, -0.0339202880859375, -0.00946044921875, 0.0149993896484375, 0.039459228515625, 0.0639190673828125, 0.08837890625, 0.1128387451171875, 0.137298583984375, 0.1617584228515625, 0.18621826171875, 0.2106781005859375, 0.235137939453125, 0.2595977783203125, 0.2840576171875, 0.3085174560546875, 0.332977294921875, 0.3574371337890625, 0.38189697265625, 0.4063568115234375, 0.430816650390625, 0.4552764892578125, 0.479736328125, 0.5041961669921875, 0.528656005859375, 0.5531158447265625, 0.57757568359375, 0.6020355224609375, 0.626495361328125, 0.6509552001953125, 0.6754150390625, 0.6998748779296875, 0.724334716796875, 0.7487945556640625, 0.77325439453125, 0.7977142333984375, 0.822174072265625, 0.8466339111328125, 0.87109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 6.0, 7.0, 5.0, 15.0, 10.0, 19.0, 18.0, 27.0, 32.0, 19.0, 51.0, 49.0, 41.0, 50.0, 47.0, 51.0, 50.0, 63.0, 45.0, 38.0, 48.0, 43.0, 37.0, 26.0, 36.0, 39.0, 18.0, 28.0, 11.0, 12.0, 6.0, 15.0, 10.0, 8.0, 12.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5419921875, -0.524017333984375, -0.50604248046875, -0.488067626953125, -0.4700927734375, -0.452117919921875, -0.43414306640625, -0.416168212890625, -0.398193359375, -0.380218505859375, -0.36224365234375, -0.344268798828125, -0.3262939453125, -0.308319091796875, -0.29034423828125, -0.272369384765625, -0.25439453125, -0.236419677734375, -0.21844482421875, -0.200469970703125, -0.1824951171875, -0.164520263671875, -0.14654541015625, -0.128570556640625, -0.110595703125, -0.092620849609375, -0.07464599609375, -0.056671142578125, -0.0386962890625, -0.020721435546875, -0.00274658203125, 0.015228271484375, 0.033203125, 0.051177978515625, 0.06915283203125, 0.087127685546875, 0.1051025390625, 0.123077392578125, 0.14105224609375, 0.159027099609375, 0.177001953125, 0.194976806640625, 0.21295166015625, 0.230926513671875, 0.2489013671875, 0.266876220703125, 0.28485107421875, 0.302825927734375, 0.32080078125, 0.338775634765625, 0.35675048828125, 0.374725341796875, 0.3927001953125, 0.410675048828125, 0.42864990234375, 0.446624755859375, 0.464599609375, 0.482574462890625, 0.50054931640625, 0.518524169921875, 0.5364990234375, 0.554473876953125, 0.57244873046875, 0.590423583984375, 0.6083984375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 10.0, 7.0, 5.0, 12.0, 15.0, 22.0, 30.0, 42.0, 52.0, 71.0, 95.0, 160.0, 186.0, 280.0, 420.0, 653.0, 968.0, 1886.0, 4207.0, 13477.0, 69533.0, 512282.0, 364195.0, 59317.0, 12055.0, 3947.0, 1798.0, 955.0, 602.0, 353.0, 236.0, 223.0, 119.0, 100.0, 70.0, 38.0, 32.0, 24.0, 15.0, 13.0, 14.0, 12.0, 13.0, 4.0, 3.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.62890625, -1.5684814453125, -1.508056640625, -1.4476318359375, -1.38720703125, -1.3267822265625, -1.266357421875, -1.2059326171875, -1.1455078125, -1.0850830078125, -1.024658203125, -0.9642333984375, -0.90380859375, -0.8433837890625, -0.782958984375, -0.7225341796875, -0.662109375, -0.6016845703125, -0.541259765625, -0.4808349609375, -0.42041015625, -0.3599853515625, -0.299560546875, -0.2391357421875, -0.1787109375, -0.1182861328125, -0.057861328125, 0.0025634765625, 0.06298828125, 0.1234130859375, 0.183837890625, 0.2442626953125, 0.3046875, 0.3651123046875, 0.425537109375, 0.4859619140625, 0.54638671875, 0.6068115234375, 0.667236328125, 0.7276611328125, 0.7880859375, 0.8485107421875, 0.908935546875, 0.9693603515625, 1.02978515625, 1.0902099609375, 1.150634765625, 1.2110595703125, 1.271484375, 1.3319091796875, 1.392333984375, 1.4527587890625, 1.51318359375, 1.5736083984375, 1.634033203125, 1.6944580078125, 1.7548828125, 1.8153076171875, 1.875732421875, 1.9361572265625, 1.99658203125, 2.0570068359375, 2.117431640625, 2.1778564453125, 2.23828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 12.0, 11.0, 17.0, 14.0, 23.0, 26.0, 30.0, 29.0, 45.0, 58.0, 40.0, 57.0, 59.0, 51.0, 58.0, 51.0, 47.0, 64.0, 55.0, 47.0, 39.0, 33.0, 27.0, 21.0, 20.0, 18.0, 11.0, 8.0, 2.0, 6.0, 4.0, 4.0, 7.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.968658447265625, -1.87677001953125, -1.784881591796875, -1.6929931640625, -1.601104736328125, -1.50921630859375, -1.417327880859375, -1.325439453125, -1.233551025390625, -1.14166259765625, -1.049774169921875, -0.9578857421875, -0.865997314453125, -0.77410888671875, -0.682220458984375, -0.59033203125, -0.498443603515625, -0.40655517578125, -0.314666748046875, -0.2227783203125, -0.130889892578125, -0.03900146484375, 0.052886962890625, 0.144775390625, 0.236663818359375, 0.32855224609375, 0.420440673828125, 0.5123291015625, 0.604217529296875, 0.69610595703125, 0.787994384765625, 0.8798828125, 0.971771240234375, 1.06365966796875, 1.155548095703125, 1.2474365234375, 1.339324951171875, 1.43121337890625, 1.523101806640625, 1.614990234375, 1.706878662109375, 1.79876708984375, 1.890655517578125, 1.9825439453125, 2.074432373046875, 2.16632080078125, 2.258209228515625, 2.35009765625, 2.441986083984375, 2.53387451171875, 2.625762939453125, 2.7176513671875, 2.809539794921875, 2.90142822265625, 2.993316650390625, 3.085205078125, 3.177093505859375, 3.26898193359375, 3.360870361328125, 3.4527587890625, 3.544647216796875, 3.63653564453125, 3.728424072265625, 3.8203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 19.0, 35.0, 59.0, 83.0, 141.0, 293.0, 473.0, 1036.0, 2098.0, 4999.0, 15111.0, 139286.0, 840623.0, 30437.0, 7827.0, 3065.0, 1407.0, 717.0, 345.0, 215.0, 117.0, 72.0, 37.0, 24.0, 13.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.81640625, -1.756317138671875, -1.69622802734375, -1.636138916015625, -1.5760498046875, -1.515960693359375, -1.45587158203125, -1.395782470703125, -1.335693359375, -1.275604248046875, -1.21551513671875, -1.155426025390625, -1.0953369140625, -1.035247802734375, -0.97515869140625, -0.915069580078125, -0.85498046875, -0.794891357421875, -0.73480224609375, -0.674713134765625, -0.6146240234375, -0.554534912109375, -0.49444580078125, -0.434356689453125, -0.374267578125, -0.314178466796875, -0.25408935546875, -0.194000244140625, -0.1339111328125, -0.073822021484375, -0.01373291015625, 0.046356201171875, 0.1064453125, 0.166534423828125, 0.22662353515625, 0.286712646484375, 0.3468017578125, 0.406890869140625, 0.46697998046875, 0.527069091796875, 0.587158203125, 0.647247314453125, 0.70733642578125, 0.767425537109375, 0.8275146484375, 0.887603759765625, 0.94769287109375, 1.007781982421875, 1.06787109375, 1.127960205078125, 1.18804931640625, 1.248138427734375, 1.3082275390625, 1.368316650390625, 1.42840576171875, 1.488494873046875, 1.548583984375, 1.608673095703125, 1.66876220703125, 1.728851318359375, 1.7889404296875, 1.849029541015625, 1.90911865234375, 1.969207763671875, 2.029296875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 9.0, 14.0, 22.0, 94.0, 440.0, 325.0, 40.0, 21.0, 15.0, 8.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014066696166992188, -0.001362532377243042, -0.0013183951377868652, -0.0012742578983306885, -0.0012301206588745117, -0.001185983419418335, -0.0011418461799621582, -0.0010977089405059814, -0.0010535717010498047, -0.001009434461593628, -0.0009652972221374512, -0.0009211599826812744, -0.0008770227432250977, -0.0008328855037689209, -0.0007887482643127441, -0.0007446110248565674, -0.0007004737854003906, -0.0006563365459442139, -0.0006121993064880371, -0.0005680620670318604, -0.0005239248275756836, -0.00047978758811950684, -0.0004356503486633301, -0.0003915131092071533, -0.00034737586975097656, -0.0003032386302947998, -0.00025910139083862305, -0.0002149641513824463, -0.00017082691192626953, -0.00012668967247009277, -8.255243301391602e-05, -3.841519355773926e-05, 5.7220458984375e-06, 4.985928535461426e-05, 9.399652481079102e-05, 0.00013813376426696777, 0.00018227100372314453, 0.0002264082431793213, 0.00027054548263549805, 0.0003146827220916748, 0.00035881996154785156, 0.0004029572010040283, 0.0004470944404602051, 0.0004912316799163818, 0.0005353689193725586, 0.0005795061588287354, 0.0006236433982849121, 0.0006677806377410889, 0.0007119178771972656, 0.0007560551166534424, 0.0008001923561096191, 0.0008443295955657959, 0.0008884668350219727, 0.0009326040744781494, 0.0009767413139343262, 0.001020878553390503, 0.0010650157928466797, 0.0011091530323028564, 0.0011532902717590332, 0.00119742751121521, 0.0012415647506713867, 0.0012857019901275635, 0.0013298392295837402, 0.001373976469039917, 0.0014181137084960938]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 2.0, 11.0, 10.0, 13.0, 19.0, 23.0, 36.0, 82.0, 99.0, 166.0, 251.0, 465.0, 856.0, 1601.0, 3260.0, 7605.0, 21834.0, 235502.0, 726519.0, 31927.0, 9853.0, 4098.0, 1870.0, 1001.0, 565.0, 315.0, 177.0, 125.0, 70.0, 68.0, 36.0, 34.0, 13.0, 13.0, 9.0, 7.0, 4.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.529296875, -1.4844970703125, -1.439697265625, -1.3948974609375, -1.35009765625, -1.3052978515625, -1.260498046875, -1.2156982421875, -1.1708984375, -1.1260986328125, -1.081298828125, -1.0364990234375, -0.99169921875, -0.9468994140625, -0.902099609375, -0.8572998046875, -0.8125, -0.7677001953125, -0.722900390625, -0.6781005859375, -0.63330078125, -0.5885009765625, -0.543701171875, -0.4989013671875, -0.4541015625, -0.4093017578125, -0.364501953125, -0.3197021484375, -0.27490234375, -0.2301025390625, -0.185302734375, -0.1405029296875, -0.095703125, -0.0509033203125, -0.006103515625, 0.0386962890625, 0.08349609375, 0.1282958984375, 0.173095703125, 0.2178955078125, 0.2626953125, 0.3074951171875, 0.352294921875, 0.3970947265625, 0.44189453125, 0.4866943359375, 0.531494140625, 0.5762939453125, 0.62109375, 0.6658935546875, 0.710693359375, 0.7554931640625, 0.80029296875, 0.8450927734375, 0.889892578125, 0.9346923828125, 0.9794921875, 1.0242919921875, 1.069091796875, 1.1138916015625, 1.15869140625, 1.2034912109375, 1.248291015625, 1.2930908203125, 1.337890625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 1.0, 9.0, 6.0, 10.0, 14.0, 20.0, 25.0, 38.0, 35.0, 57.0, 85.0, 100.0, 117.0, 109.0, 101.0, 65.0, 41.0, 37.0, 32.0, 16.0, 17.0, 9.0, 12.0, 4.0, 4.0, 5.0, 7.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2783203125, -1.2392730712890625, -1.200225830078125, -1.1611785888671875, -1.12213134765625, -1.0830841064453125, -1.044036865234375, -1.0049896240234375, -0.9659423828125, -0.9268951416015625, -0.887847900390625, -0.8488006591796875, -0.80975341796875, -0.7707061767578125, -0.731658935546875, -0.6926116943359375, -0.653564453125, -0.6145172119140625, -0.575469970703125, -0.5364227294921875, -0.49737548828125, -0.4583282470703125, -0.419281005859375, -0.3802337646484375, -0.3411865234375, -0.3021392822265625, -0.263092041015625, -0.2240447998046875, -0.18499755859375, -0.1459503173828125, -0.106903076171875, -0.0678558349609375, -0.02880859375, 0.0102386474609375, 0.049285888671875, 0.0883331298828125, 0.12738037109375, 0.1664276123046875, 0.205474853515625, 0.2445220947265625, 0.2835693359375, 0.3226165771484375, 0.361663818359375, 0.4007110595703125, 0.43975830078125, 0.4788055419921875, 0.517852783203125, 0.5569000244140625, 0.595947265625, 0.6349945068359375, 0.674041748046875, 0.7130889892578125, 0.75213623046875, 0.7911834716796875, 0.830230712890625, 0.8692779541015625, 0.9083251953125, 0.9473724365234375, 0.986419677734375, 1.0254669189453125, 1.06451416015625, 1.1035614013671875, 1.142608642578125, 1.1816558837890625, 1.220703125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 6.0, 9.0, 6.0, 10.0, 19.0, 24.0, 37.0, 44.0, 71.0, 107.0, 223.0, 183.0, 107.0, 72.0, 35.0, 13.0, 14.0, 5.0, 7.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.703315734863281, -14.059226036071777, -13.41513729095459, -12.771047592163086, -12.126957893371582, -11.482868194580078, -10.83877944946289, -10.194689750671387, -9.550600051879883, -8.906510353088379, -8.262421607971191, -7.6183319091796875, -6.974242210388184, -6.330152988433838, -5.686063766479492, -5.041974067687988, -4.397885322570801, -3.753795862197876, -3.109706401824951, -2.4656171798706055, -1.8215277194976807, -1.1774382591247559, -0.5333490371704102, 0.11074066162109375, 0.7548298835754395, 1.3989193439483643, 2.043008804321289, 2.6870980262756348, 3.3311874866485596, 3.9752769470214844, 4.61936616897583, 5.263455867767334, 5.90754508972168, 6.551634311676025, 7.195724010467529, 7.839813232421875, 8.483902931213379, 9.127992630004883, 9.77208137512207, 10.416171073913574, 11.060260772705078, 11.704350471496582, 12.34843921661377, 12.992528915405273, 13.636618614196777, 14.280708312988281, 14.924797058105469, 15.568886756896973, 16.212974548339844, 16.85706329345703, 17.50115394592285, 18.14524269104004, 18.789331436157227, 19.433422088623047, 20.077510833740234, 20.721599578857422, 21.365690231323242, 22.00977897644043, 22.65386962890625, 23.297958374023438, 23.942047119140625, 24.586137771606445, 25.230226516723633, 25.874317169189453, 26.51840591430664]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 3.0, 4.0, 9.0, 17.0, 11.0, 23.0, 20.0, 27.0, 31.0, 35.0, 34.0, 37.0, 50.0, 56.0, 72.0, 79.0, 80.0, 48.0, 52.0, 39.0, 33.0, 33.0, 33.0, 28.0, 27.0, 20.0, 19.0, 9.0, 10.0, 11.0, 12.0, 7.0, 4.0, 3.0, 9.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-14.255025863647461, -13.868809700012207, -13.482592582702637, -13.096376419067383, -12.710159301757812, -12.323943138122559, -11.937726974487305, -11.551509857177734, -11.16529369354248, -10.779077529907227, -10.392860412597656, -10.006644248962402, -9.620427131652832, -9.234210968017578, -8.847993850708008, -8.461777687072754, -8.0755615234375, -7.689344882965088, -7.303128242492676, -6.916912078857422, -6.53069543838501, -6.144478797912598, -5.7582621574401855, -5.372045516967773, -4.985828399658203, -4.599611759185791, -4.213395118713379, -3.827178716659546, -3.440962314605713, -3.054745674133301, -2.6685290336608887, -2.2823126316070557, -1.8960962295532227, -1.5098797082901, -1.1236631870269775, -0.7374465465545654, -0.35123002529144287, 0.03498649597167969, 0.4212031364440918, 0.8074195384979248, 1.193636178970337, 1.5798527002334595, 1.966069221496582, 2.352285861968994, 2.7385025024414062, 3.1247189044952393, 3.5109355449676514, 3.8971519470214844, 4.2833685874938965, 4.669585227966309, 5.055801868438721, 5.442018508911133, 5.828234672546387, 6.214451313018799, 6.600667953491211, 6.986884117126465, 7.373101234436035, 7.759317874908447, 8.14553451538086, 8.531750679016113, 8.917967796325684, 9.304183959960938, 9.690401077270508, 10.076617240905762, 10.462833404541016]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 14.0, 11.0, 15.0, 27.0, 39.0, 35.0, 54.0, 86.0, 98.0, 189.0, 452.0, 1372.0, 7601.0, 72853.0, 2176094.0, 1859394.0, 64413.0, 8054.0, 2032.0, 745.0, 273.0, 131.0, 75.0, 56.0, 21.0, 27.0, 20.0, 29.0, 5.0, 11.0, 6.0, 11.0, 5.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.546875, -1.495269775390625, -1.44366455078125, -1.392059326171875, -1.3404541015625, -1.288848876953125, -1.23724365234375, -1.185638427734375, -1.134033203125, -1.082427978515625, -1.03082275390625, -0.979217529296875, -0.9276123046875, -0.876007080078125, -0.82440185546875, -0.772796630859375, -0.72119140625, -0.669586181640625, -0.61798095703125, -0.566375732421875, -0.5147705078125, -0.463165283203125, -0.41156005859375, -0.359954833984375, -0.308349609375, -0.256744384765625, -0.20513916015625, -0.153533935546875, -0.1019287109375, -0.050323486328125, 0.00128173828125, 0.052886962890625, 0.1044921875, 0.156097412109375, 0.20770263671875, 0.259307861328125, 0.3109130859375, 0.362518310546875, 0.41412353515625, 0.465728759765625, 0.517333984375, 0.568939208984375, 0.62054443359375, 0.672149658203125, 0.7237548828125, 0.775360107421875, 0.82696533203125, 0.878570556640625, 0.93017578125, 0.981781005859375, 1.03338623046875, 1.084991455078125, 1.1365966796875, 1.188201904296875, 1.23980712890625, 1.291412353515625, 1.343017578125, 1.394622802734375, 1.44622802734375, 1.497833251953125, 1.5494384765625, 1.601043701171875, 1.65264892578125, 1.704254150390625, 1.755859375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 12.0, 22.0, 37.0, 64.0, 74.0, 133.0, 120.0, 140.0, 121.0, 106.0, 63.0, 41.0, 35.0, 17.0, 8.0, 6.0, 4.0, 0.0, 1.0, 1.0], "bins": [-2.376953125, -2.3304977416992188, -2.2840423583984375, -2.2375869750976562, -2.191131591796875, -2.1446762084960938, -2.0982208251953125, -2.0517654418945312, -2.00531005859375, -1.9588546752929688, -1.9123992919921875, -1.8659439086914062, -1.819488525390625, -1.7730331420898438, -1.7265777587890625, -1.6801223754882812, -1.6336669921875, -1.5872116088867188, -1.5407562255859375, -1.4943008422851562, -1.447845458984375, -1.4013900756835938, -1.3549346923828125, -1.3084793090820312, -1.26202392578125, -1.2155685424804688, -1.1691131591796875, -1.1226577758789062, -1.076202392578125, -1.0297470092773438, -0.9832916259765625, -0.9368362426757812, -0.890380859375, -0.8439254760742188, -0.7974700927734375, -0.7510147094726562, -0.704559326171875, -0.6581039428710938, -0.6116485595703125, -0.5651931762695312, -0.51873779296875, -0.47228240966796875, -0.4258270263671875, -0.37937164306640625, -0.332916259765625, -0.28646087646484375, -0.2400054931640625, -0.19355010986328125, -0.1470947265625, -0.10063934326171875, -0.0541839599609375, -0.00772857666015625, 0.038726806640625, 0.08518218994140625, 0.1316375732421875, 0.17809295654296875, 0.22454833984375, 0.27100372314453125, 0.3174591064453125, 0.36391448974609375, 0.410369873046875, 0.45682525634765625, 0.5032806396484375, 0.5497360229492188, 0.59619140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 7.0, 16.0, 22.0, 33.0, 48.0, 80.0, 124.0, 177.0, 281.0, 636.0, 2786.0, 36136.0, 3736828.0, 403534.0, 11165.0, 1573.0, 450.0, 191.0, 90.0, 42.0, 27.0, 13.0, 6.0, 6.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.205078125, -3.097442626953125, -2.98980712890625, -2.882171630859375, -2.7745361328125, -2.666900634765625, -2.55926513671875, -2.451629638671875, -2.343994140625, -2.236358642578125, -2.12872314453125, -2.021087646484375, -1.9134521484375, -1.805816650390625, -1.69818115234375, -1.590545654296875, -1.48291015625, -1.375274658203125, -1.26763916015625, -1.160003662109375, -1.0523681640625, -0.944732666015625, -0.83709716796875, -0.729461669921875, -0.621826171875, -0.514190673828125, -0.40655517578125, -0.298919677734375, -0.1912841796875, -0.083648681640625, 0.02398681640625, 0.131622314453125, 0.2392578125, 0.346893310546875, 0.45452880859375, 0.562164306640625, 0.6697998046875, 0.777435302734375, 0.88507080078125, 0.992706298828125, 1.100341796875, 1.207977294921875, 1.31561279296875, 1.423248291015625, 1.5308837890625, 1.638519287109375, 1.74615478515625, 1.853790283203125, 1.96142578125, 2.069061279296875, 2.17669677734375, 2.284332275390625, 2.3919677734375, 2.499603271484375, 2.60723876953125, 2.714874267578125, 2.822509765625, 2.930145263671875, 3.03778076171875, 3.145416259765625, 3.2530517578125, 3.360687255859375, 3.46832275390625, 3.575958251953125, 3.68359375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 15.0, 12.0, 12.0, 29.0, 68.0, 134.0, 346.0, 932.0, 1314.0, 693.0, 243.0, 123.0, 74.0, 36.0, 16.0, 10.0, 8.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.39453125, -4.2976226806640625, -4.200714111328125, -4.1038055419921875, -4.00689697265625, -3.9099884033203125, -3.813079833984375, -3.7161712646484375, -3.6192626953125, -3.5223541259765625, -3.425445556640625, -3.3285369873046875, -3.23162841796875, -3.1347198486328125, -3.037811279296875, -2.9409027099609375, -2.843994140625, -2.7470855712890625, -2.650177001953125, -2.5532684326171875, -2.45635986328125, -2.3594512939453125, -2.262542724609375, -2.1656341552734375, -2.0687255859375, -1.9718170166015625, -1.874908447265625, -1.7779998779296875, -1.68109130859375, -1.5841827392578125, -1.487274169921875, -1.3903656005859375, -1.29345703125, -1.1965484619140625, -1.099639892578125, -1.0027313232421875, -0.90582275390625, -0.8089141845703125, -0.712005615234375, -0.6150970458984375, -0.5181884765625, -0.4212799072265625, -0.324371337890625, -0.2274627685546875, -0.13055419921875, -0.0336456298828125, 0.063262939453125, 0.1601715087890625, 0.257080078125, 0.3539886474609375, 0.450897216796875, 0.5478057861328125, 0.64471435546875, 0.7416229248046875, 0.838531494140625, 0.9354400634765625, 1.0323486328125, 1.1292572021484375, 1.226165771484375, 1.3230743408203125, 1.41998291015625, 1.5168914794921875, 1.613800048828125, 1.7107086181640625, 1.8076171875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 10.0, 13.0, 18.0, 49.0, 81.0, 131.0, 183.0, 198.0, 146.0, 93.0, 27.0, 15.0, 11.0, 5.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.392019271850586, -15.848381042480469, -15.304742813110352, -14.761104583740234, -14.217467308044434, -13.673829078674316, -13.1301908493042, -12.586552619934082, -12.042915344238281, -11.499277114868164, -10.955638885498047, -10.41200065612793, -9.868363380432129, -9.324725151062012, -8.781086921691895, -8.237448692321777, -7.69381046295166, -7.150172233581543, -6.606534481048584, -6.062896251678467, -5.519258499145508, -4.975620269775391, -4.431982040405273, -3.8883440494537354, -3.3447060585021973, -2.801068067550659, -2.257430076599121, -1.713791847229004, -1.1701538562774658, -0.6265158653259277, -0.08287763595581055, 0.46076035499572754, 1.0043983459472656, 1.5480363368988037, 2.091674327850342, 2.635312557220459, 3.178950548171997, 3.722588539123535, 4.266226768493652, 4.8098649978637695, 5.3535027503967285, 5.897140979766846, 6.440778732299805, 6.984416961669922, 7.528055191040039, 8.071693420410156, 8.615331649780273, 9.158968925476074, 9.702607154846191, 10.246245384216309, 10.789883613586426, 11.333520889282227, 11.877159118652344, 12.420797348022461, 12.964435577392578, 13.508073806762695, 14.051712036132812, 14.59535026550293, 15.138988494873047, 15.682626724243164, 16.22626495361328, 16.769901275634766, 17.313541412353516, 17.857177734375, 18.400815963745117]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 7.0, 3.0, 11.0, 15.0, 15.0, 20.0, 27.0, 30.0, 47.0, 52.0, 59.0, 67.0, 70.0, 73.0, 75.0, 72.0, 87.0, 66.0, 49.0, 38.0, 39.0, 27.0, 16.0, 14.0, 6.0, 8.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.370281219482422, -9.933174133300781, -9.496066093444824, -9.058959007263184, -8.621851921081543, -8.184743881225586, -7.747636795043945, -7.310529708862305, -6.873422145843506, -6.436314582824707, -5.999207496643066, -5.562099933624268, -5.124992370605469, -4.687885284423828, -4.250777721405029, -3.8136703968048096, -3.37656307220459, -2.93945574760437, -2.5023484230041504, -2.0652408599853516, -1.6281335353851318, -1.191026210784912, -0.7539186477661133, -0.31681132316589355, 0.12029600143432617, 0.5574033856391907, 0.9945107698440552, 1.4316182136535645, 1.8687255382537842, 2.305832862854004, 2.7429404258728027, 3.1800477504730225, 3.617155075073242, 4.054262638092041, 4.491369724273682, 4.9284772872924805, 5.365584373474121, 5.80269193649292, 6.239799499511719, 6.676906585693359, 7.114014148712158, 7.551121711730957, 7.988228797912598, 8.425336837768555, 8.862443923950195, 9.299551010131836, 9.736658096313477, 10.173766136169434, 10.610873222351074, 11.047980308532715, 11.485088348388672, 11.922195434570312, 12.359302520751953, 12.796409606933594, 13.23351764678955, 13.670624732971191, 14.107732772827148, 14.544839859008789, 14.981947898864746, 15.419054985046387, 15.856162071228027, 16.293270111083984, 16.730377197265625, 17.167484283447266, 17.604591369628906]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 7.0, 5.0, 13.0, 17.0, 31.0, 39.0, 73.0, 88.0, 123.0, 212.0, 294.0, 469.0, 761.0, 1185.0, 1915.0, 2948.0, 5029.0, 8687.0, 15109.0, 26355.0, 47191.0, 83182.0, 143071.0, 206311.0, 198500.0, 131061.0, 75399.0, 42442.0, 24242.0, 13709.0, 7799.0, 4687.0, 2801.0, 1755.0, 1121.0, 675.0, 423.0, 279.0, 181.0, 125.0, 76.0, 51.0, 46.0, 26.0, 7.0, 8.0, 8.0, 9.0, 4.0, 6.0, 1.0, 2.0], "bins": [-0.822265625, -0.7993698120117188, -0.7764739990234375, -0.7535781860351562, -0.730682373046875, -0.7077865600585938, -0.6848907470703125, -0.6619949340820312, -0.63909912109375, -0.6162033081054688, -0.5933074951171875, -0.5704116821289062, -0.547515869140625, -0.5246200561523438, -0.5017242431640625, -0.47882843017578125, -0.4559326171875, -0.43303680419921875, -0.4101409912109375, -0.38724517822265625, -0.364349365234375, -0.34145355224609375, -0.3185577392578125, -0.29566192626953125, -0.27276611328125, -0.24987030029296875, -0.2269744873046875, -0.20407867431640625, -0.181182861328125, -0.15828704833984375, -0.1353912353515625, -0.11249542236328125, -0.089599609375, -0.06670379638671875, -0.0438079833984375, -0.02091217041015625, 0.001983642578125, 0.02487945556640625, 0.0477752685546875, 0.07067108154296875, 0.09356689453125, 0.11646270751953125, 0.1393585205078125, 0.16225433349609375, 0.185150146484375, 0.20804595947265625, 0.2309417724609375, 0.25383758544921875, 0.2767333984375, 0.29962921142578125, 0.3225250244140625, 0.34542083740234375, 0.368316650390625, 0.39121246337890625, 0.4141082763671875, 0.43700408935546875, 0.45989990234375, 0.48279571533203125, 0.5056915283203125, 0.5285873413085938, 0.551483154296875, 0.5743789672851562, 0.5972747802734375, 0.6201705932617188, 0.64306640625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 5.0, 2.0, 4.0, 4.0, 6.0, 1.0, 5.0, 8.0, 8.0, 12.0, 12.0, 19.0, 16.0, 17.0, 16.0, 30.0, 26.0, 30.0, 30.0, 30.0, 51.0, 52.0, 56.0, 53.0, 32.0, 53.0, 46.0, 62.0, 36.0, 47.0, 25.0, 35.0, 21.0, 22.0, 25.0, 22.0, 13.0, 13.0, 9.0, 6.0, 9.0, 5.0, 9.0, 10.0, 4.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.6796875, -0.6604156494140625, -0.641143798828125, -0.6218719482421875, -0.60260009765625, -0.5833282470703125, -0.564056396484375, -0.5447845458984375, -0.5255126953125, -0.5062408447265625, -0.486968994140625, -0.4676971435546875, -0.44842529296875, -0.4291534423828125, -0.409881591796875, -0.3906097412109375, -0.371337890625, -0.3520660400390625, -0.332794189453125, -0.3135223388671875, -0.29425048828125, -0.2749786376953125, -0.255706787109375, -0.2364349365234375, -0.2171630859375, -0.1978912353515625, -0.178619384765625, -0.1593475341796875, -0.14007568359375, -0.1208038330078125, -0.101531982421875, -0.0822601318359375, -0.06298828125, -0.0437164306640625, -0.024444580078125, -0.0051727294921875, 0.01409912109375, 0.0333709716796875, 0.052642822265625, 0.0719146728515625, 0.0911865234375, 0.1104583740234375, 0.129730224609375, 0.1490020751953125, 0.16827392578125, 0.1875457763671875, 0.206817626953125, 0.2260894775390625, 0.245361328125, 0.2646331787109375, 0.283905029296875, 0.3031768798828125, 0.32244873046875, 0.3417205810546875, 0.360992431640625, 0.3802642822265625, 0.3995361328125, 0.4188079833984375, 0.438079833984375, 0.4573516845703125, 0.47662353515625, 0.4958953857421875, 0.515167236328125, 0.5344390869140625, 0.5537109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 8.0, 9.0, 22.0, 29.0, 36.0, 55.0, 89.0, 141.0, 207.0, 311.0, 541.0, 1067.0, 2110.0, 6461.0, 35481.0, 379485.0, 569003.0, 41540.0, 7012.0, 2282.0, 1072.0, 581.0, 379.0, 196.0, 136.0, 79.0, 65.0, 51.0, 26.0, 21.0, 19.0, 6.0, 9.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.670379638671875, -2.57513427734375, -2.479888916015625, -2.3846435546875, -2.289398193359375, -2.19415283203125, -2.098907470703125, -2.003662109375, -1.908416748046875, -1.81317138671875, -1.717926025390625, -1.6226806640625, -1.527435302734375, -1.43218994140625, -1.336944580078125, -1.24169921875, -1.146453857421875, -1.05120849609375, -0.955963134765625, -0.8607177734375, -0.765472412109375, -0.67022705078125, -0.574981689453125, -0.479736328125, -0.384490966796875, -0.28924560546875, -0.194000244140625, -0.0987548828125, -0.003509521484375, 0.09173583984375, 0.186981201171875, 0.2822265625, 0.377471923828125, 0.47271728515625, 0.567962646484375, 0.6632080078125, 0.758453369140625, 0.85369873046875, 0.948944091796875, 1.044189453125, 1.139434814453125, 1.23468017578125, 1.329925537109375, 1.4251708984375, 1.520416259765625, 1.61566162109375, 1.710906982421875, 1.80615234375, 1.901397705078125, 1.99664306640625, 2.091888427734375, 2.1871337890625, 2.282379150390625, 2.37762451171875, 2.472869873046875, 2.568115234375, 2.663360595703125, 2.75860595703125, 2.853851318359375, 2.9490966796875, 3.044342041015625, 3.13958740234375, 3.234832763671875, 3.330078125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 14.0, 13.0, 15.0, 7.0, 14.0, 22.0, 20.0, 28.0, 29.0, 28.0, 34.0, 39.0, 42.0, 60.0, 44.0, 56.0, 63.0, 43.0, 67.0, 57.0, 32.0, 30.0, 43.0, 32.0, 31.0, 22.0, 17.0, 22.0, 18.0, 7.0, 12.0, 9.0, 2.0, 4.0, 3.0, 3.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-3.673828125, -3.57470703125, -3.4755859375, -3.37646484375, -3.27734375, -3.17822265625, -3.0791015625, -2.97998046875, -2.880859375, -2.78173828125, -2.6826171875, -2.58349609375, -2.484375, -2.38525390625, -2.2861328125, -2.18701171875, -2.087890625, -1.98876953125, -1.8896484375, -1.79052734375, -1.69140625, -1.59228515625, -1.4931640625, -1.39404296875, -1.294921875, -1.19580078125, -1.0966796875, -0.99755859375, -0.8984375, -0.79931640625, -0.7001953125, -0.60107421875, -0.501953125, -0.40283203125, -0.3037109375, -0.20458984375, -0.10546875, -0.00634765625, 0.0927734375, 0.19189453125, 0.291015625, 0.39013671875, 0.4892578125, 0.58837890625, 0.6875, 0.78662109375, 0.8857421875, 0.98486328125, 1.083984375, 1.18310546875, 1.2822265625, 1.38134765625, 1.48046875, 1.57958984375, 1.6787109375, 1.77783203125, 1.876953125, 1.97607421875, 2.0751953125, 2.17431640625, 2.2734375, 2.37255859375, 2.4716796875, 2.57080078125, 2.669921875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 10.0, 12.0, 17.0, 44.0, 50.0, 99.0, 188.0, 440.0, 1219.0, 4560.0, 32037.0, 883045.0, 114669.0, 8966.0, 1982.0, 619.0, 274.0, 120.0, 74.0, 38.0, 29.0, 8.0, 16.0, 8.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5595703125, -1.4988861083984375, -1.438201904296875, -1.3775177001953125, -1.31683349609375, -1.2561492919921875, -1.195465087890625, -1.1347808837890625, -1.0740966796875, -1.0134124755859375, -0.952728271484375, -0.8920440673828125, -0.83135986328125, -0.7706756591796875, -0.709991455078125, -0.6493072509765625, -0.588623046875, -0.5279388427734375, -0.467254638671875, -0.4065704345703125, -0.34588623046875, -0.2852020263671875, -0.224517822265625, -0.1638336181640625, -0.1031494140625, -0.0424652099609375, 0.018218994140625, 0.0789031982421875, 0.13958740234375, 0.2002716064453125, 0.260955810546875, 0.3216400146484375, 0.38232421875, 0.4430084228515625, 0.503692626953125, 0.5643768310546875, 0.62506103515625, 0.6857452392578125, 0.746429443359375, 0.8071136474609375, 0.8677978515625, 0.9284820556640625, 0.989166259765625, 1.0498504638671875, 1.11053466796875, 1.1712188720703125, 1.231903076171875, 1.2925872802734375, 1.353271484375, 1.4139556884765625, 1.474639892578125, 1.5353240966796875, 1.59600830078125, 1.6566925048828125, 1.717376708984375, 1.7780609130859375, 1.8387451171875, 1.8994293212890625, 1.960113525390625, 2.0207977294921875, 2.08148193359375, 2.1421661376953125, 2.202850341796875, 2.2635345458984375, 2.32421875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 7.0, 11.0, 26.0, 41.0, 97.0, 170.0, 260.0, 166.0, 113.0, 47.0, 22.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005397796630859375, -0.0005214959383010864, -0.0005032122135162354, -0.0004849284887313843, -0.0004666447639465332, -0.00044836103916168213, -0.00043007731437683105, -0.00041179358959198, -0.0003935098648071289, -0.00037522614002227783, -0.00035694241523742676, -0.0003386586904525757, -0.0003203749656677246, -0.00030209124088287354, -0.00028380751609802246, -0.0002655237913131714, -0.0002472400665283203, -0.00022895634174346924, -0.00021067261695861816, -0.0001923888921737671, -0.00017410516738891602, -0.00015582144260406494, -0.00013753771781921387, -0.00011925399303436279, -0.00010097026824951172, -8.268654346466064e-05, -6.440281867980957e-05, -4.6119093894958496e-05, -2.7835369110107422e-05, -9.551644325256348e-06, 8.732080459594727e-06, 2.70158052444458e-05, 4.5299530029296875e-05, 6.358325481414795e-05, 8.186697959899902e-05, 0.0001001507043838501, 0.00011843442916870117, 0.00013671815395355225, 0.00015500187873840332, 0.0001732856035232544, 0.00019156932830810547, 0.00020985305309295654, 0.00022813677787780762, 0.0002464205026626587, 0.00026470422744750977, 0.00028298795223236084, 0.0003012716770172119, 0.000319555401802063, 0.00033783912658691406, 0.00035612285137176514, 0.0003744065761566162, 0.0003926903009414673, 0.00041097402572631836, 0.00042925775051116943, 0.0004475414752960205, 0.0004658252000808716, 0.00048410892486572266, 0.0005023926496505737, 0.0005206763744354248, 0.0005389600992202759, 0.000557243824005127, 0.000575527548789978, 0.0005938112735748291, 0.0006120949983596802, 0.0006303787231445312]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 20.0, 27.0, 43.0, 101.0, 152.0, 380.0, 924.0, 2763.0, 13791.0, 242430.0, 755837.0, 25741.0, 4199.0, 1205.0, 496.0, 201.0, 87.0, 61.0, 23.0, 22.0, 10.0, 10.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4609375, -1.4124755859375, -1.364013671875, -1.3155517578125, -1.26708984375, -1.2186279296875, -1.170166015625, -1.1217041015625, -1.0732421875, -1.0247802734375, -0.976318359375, -0.9278564453125, -0.87939453125, -0.8309326171875, -0.782470703125, -0.7340087890625, -0.685546875, -0.6370849609375, -0.588623046875, -0.5401611328125, -0.49169921875, -0.4432373046875, -0.394775390625, -0.3463134765625, -0.2978515625, -0.2493896484375, -0.200927734375, -0.1524658203125, -0.10400390625, -0.0555419921875, -0.007080078125, 0.0413818359375, 0.08984375, 0.1383056640625, 0.186767578125, 0.2352294921875, 0.28369140625, 0.3321533203125, 0.380615234375, 0.4290771484375, 0.4775390625, 0.5260009765625, 0.574462890625, 0.6229248046875, 0.67138671875, 0.7198486328125, 0.768310546875, 0.8167724609375, 0.865234375, 0.9136962890625, 0.962158203125, 1.0106201171875, 1.05908203125, 1.1075439453125, 1.156005859375, 1.2044677734375, 1.2529296875, 1.3013916015625, 1.349853515625, 1.3983154296875, 1.44677734375, 1.4952392578125, 1.543701171875, 1.5921630859375, 1.640625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 9.0, 10.0, 10.0, 10.0, 15.0, 19.0, 33.0, 50.0, 56.0, 85.0, 106.0, 121.0, 115.0, 89.0, 79.0, 47.0, 47.0, 24.0, 18.0, 16.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2119140625, -1.1768646240234375, -1.141815185546875, -1.1067657470703125, -1.07171630859375, -1.0366668701171875, -1.001617431640625, -0.9665679931640625, -0.9315185546875, -0.8964691162109375, -0.861419677734375, -0.8263702392578125, -0.79132080078125, -0.7562713623046875, -0.721221923828125, -0.6861724853515625, -0.651123046875, -0.6160736083984375, -0.581024169921875, -0.5459747314453125, -0.51092529296875, -0.4758758544921875, -0.440826416015625, -0.4057769775390625, -0.3707275390625, -0.3356781005859375, -0.300628662109375, -0.2655792236328125, -0.23052978515625, -0.1954803466796875, -0.160430908203125, -0.1253814697265625, -0.09033203125, -0.0552825927734375, -0.020233154296875, 0.0148162841796875, 0.04986572265625, 0.0849151611328125, 0.119964599609375, 0.1550140380859375, 0.1900634765625, 0.2251129150390625, 0.260162353515625, 0.2952117919921875, 0.33026123046875, 0.3653106689453125, 0.400360107421875, 0.4354095458984375, 0.470458984375, 0.5055084228515625, 0.540557861328125, 0.5756072998046875, 0.61065673828125, 0.6457061767578125, 0.680755615234375, 0.7158050537109375, 0.7508544921875, 0.7859039306640625, 0.820953369140625, 0.8560028076171875, 0.89105224609375, 0.9261016845703125, 0.961151123046875, 0.9962005615234375, 1.03125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 15.0, 16.0, 56.0, 146.0, 318.0, 195.0, 134.0, 53.0, 27.0, 16.0, 11.0, 5.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.215835571289062, -29.22852897644043, -28.241222381591797, -27.253915786743164, -26.26660919189453, -25.27930450439453, -24.2919979095459, -23.304691314697266, -22.317384719848633, -21.330078125, -20.342771530151367, -19.355464935302734, -18.368160247802734, -17.38085174560547, -16.39354705810547, -15.406240463256836, -14.418933868408203, -13.43162727355957, -12.444320678710938, -11.457015037536621, -10.469708442687988, -9.482401847839355, -8.495096206665039, -7.507789611816406, -6.520483016967773, -5.533176422119141, -4.545870304107666, -3.5585639476776123, -2.5712575912475586, -1.5839509963989258, -0.5966448783874512, 0.39066123962402344, 1.3779678344726562, 2.36527419090271, 3.3525805473327637, 4.339886665344238, 5.327193260192871, 6.314499855041504, 7.3018059730529785, 8.289112091064453, 9.276418685913086, 10.263725280761719, 11.251031875610352, 12.238337516784668, 13.2256441116333, 14.212950706481934, 15.20025634765625, 16.187562942504883, 17.174869537353516, 18.16217613220215, 19.14948272705078, 20.136789321899414, 21.124095916748047, 22.111400604248047, 23.09870719909668, 24.086013793945312, 25.073320388793945, 26.060626983642578, 27.04793357849121, 28.035240173339844, 29.022544860839844, 30.00985336303711, 30.99715805053711, 31.984464645385742, 32.971771240234375]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 7.0, 2.0, 8.0, 6.0, 7.0, 11.0, 17.0, 14.0, 19.0, 21.0, 32.0, 43.0, 38.0, 48.0, 43.0, 60.0, 117.0, 92.0, 78.0, 63.0, 45.0, 40.0, 29.0, 36.0, 22.0, 27.0, 16.0, 18.0, 12.0, 10.0, 4.0, 4.0, 6.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.239904403686523, -14.637977600097656, -14.036050796508789, -13.434123992919922, -12.832198143005371, -12.230271339416504, -11.628344535827637, -11.026418685913086, -10.424491882324219, -9.822565078735352, -9.220638275146484, -8.618711471557617, -8.016785621643066, -7.414858818054199, -6.812932014465332, -6.211005687713623, -5.609078407287598, -5.0071516036987305, -4.4052252769470215, -3.8032984733581543, -3.201371908187866, -2.599445343017578, -1.997518539428711, -1.395592212677002, -0.7936654090881348, -0.1917387843132019, 0.41018784046173096, 1.0121145248413086, 1.6140410900115967, 2.2159676551818848, 2.817894458770752, 3.419820785522461, 4.021747589111328, 4.623674392700195, 5.225600719451904, 5.8275275230407715, 6.4294538497924805, 7.031380653381348, 7.633307456970215, 8.235233306884766, 8.837160110473633, 9.4390869140625, 10.041013717651367, 10.642940521240234, 11.244866371154785, 11.846793174743652, 12.44871997833252, 13.05064582824707, 13.652573585510254, 14.254500389099121, 14.856427192687988, 15.458353042602539, 16.060279846191406, 16.662206649780273, 17.26413345336914, 17.866060256958008, 18.467987060546875, 19.069913864135742, 19.67184066772461, 20.273767471313477, 20.875694274902344, 21.477619171142578, 22.079547882080078, 22.681472778320312, 23.28339958190918]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 11.0, 24.0, 30.0, 43.0, 80.0, 103.0, 165.0, 271.0, 575.0, 1392.0, 3839.0, 15375.0, 113253.0, 1639912.0, 2225719.0, 165510.0, 20355.0, 4649.0, 1492.0, 630.0, 310.0, 166.0, 138.0, 67.0, 46.0, 34.0, 22.0, 17.0, 6.0, 9.0, 8.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.09326171875, -1.0556640625, -1.01806640625, -0.98046875, -0.94287109375, -0.9052734375, -0.86767578125, -0.830078125, -0.79248046875, -0.7548828125, -0.71728515625, -0.6796875, -0.64208984375, -0.6044921875, -0.56689453125, -0.529296875, -0.49169921875, -0.4541015625, -0.41650390625, -0.37890625, -0.34130859375, -0.3037109375, -0.26611328125, -0.228515625, -0.19091796875, -0.1533203125, -0.11572265625, -0.078125, -0.04052734375, -0.0029296875, 0.03466796875, 0.072265625, 0.10986328125, 0.1474609375, 0.18505859375, 0.22265625, 0.26025390625, 0.2978515625, 0.33544921875, 0.373046875, 0.41064453125, 0.4482421875, 0.48583984375, 0.5234375, 0.56103515625, 0.5986328125, 0.63623046875, 0.673828125, 0.71142578125, 0.7490234375, 0.78662109375, 0.82421875, 0.86181640625, 0.8994140625, 0.93701171875, 0.974609375, 1.01220703125, 1.0498046875, 1.08740234375, 1.125, 1.16259765625, 1.2001953125, 1.23779296875, 1.275390625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 10.0, 13.0, 16.0, 15.0, 31.0, 23.0, 44.0, 37.0, 29.0, 49.0, 50.0, 51.0, 56.0, 73.0, 45.0, 43.0, 59.0, 50.0, 42.0, 42.0, 51.0, 32.0, 23.0, 23.0, 26.0, 13.0, 10.0, 7.0, 7.0, 10.0, 3.0, 1.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.759765625, -0.7361373901367188, -0.7125091552734375, -0.6888809204101562, -0.665252685546875, -0.6416244506835938, -0.6179962158203125, -0.5943679809570312, -0.57073974609375, -0.5471115112304688, -0.5234832763671875, -0.49985504150390625, -0.476226806640625, -0.45259857177734375, -0.4289703369140625, -0.40534210205078125, -0.3817138671875, -0.35808563232421875, -0.3344573974609375, -0.31082916259765625, -0.287200927734375, -0.26357269287109375, -0.2399444580078125, -0.21631622314453125, -0.19268798828125, -0.16905975341796875, -0.1454315185546875, -0.12180328369140625, -0.098175048828125, -0.07454681396484375, -0.0509185791015625, -0.02729034423828125, -0.003662109375, 0.01996612548828125, 0.0435943603515625, 0.06722259521484375, 0.090850830078125, 0.11447906494140625, 0.1381072998046875, 0.16173553466796875, 0.18536376953125, 0.20899200439453125, 0.2326202392578125, 0.25624847412109375, 0.279876708984375, 0.30350494384765625, 0.3271331787109375, 0.35076141357421875, 0.3743896484375, 0.39801788330078125, 0.4216461181640625, 0.44527435302734375, 0.468902587890625, 0.49253082275390625, 0.5161590576171875, 0.5397872924804688, 0.56341552734375, 0.5870437622070312, 0.6106719970703125, 0.6343002319335938, 0.657928466796875, 0.6815567016601562, 0.7051849365234375, 0.7288131713867188, 0.75244140625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 7.0, 7.0, 15.0, 25.0, 43.0, 81.0, 123.0, 203.0, 357.0, 694.0, 2163.0, 22211.0, 3815071.0, 343682.0, 6976.0, 1379.0, 501.0, 304.0, 143.0, 96.0, 61.0, 37.0, 25.0, 15.0, 17.0, 8.0, 7.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.603515625, -3.482574462890625, -3.36163330078125, -3.240692138671875, -3.1197509765625, -2.998809814453125, -2.87786865234375, -2.756927490234375, -2.635986328125, -2.515045166015625, -2.39410400390625, -2.273162841796875, -2.1522216796875, -2.031280517578125, -1.91033935546875, -1.789398193359375, -1.66845703125, -1.547515869140625, -1.42657470703125, -1.305633544921875, -1.1846923828125, -1.063751220703125, -0.94281005859375, -0.821868896484375, -0.700927734375, -0.579986572265625, -0.45904541015625, -0.338104248046875, -0.2171630859375, -0.096221923828125, 0.02471923828125, 0.145660400390625, 0.2666015625, 0.387542724609375, 0.50848388671875, 0.629425048828125, 0.7503662109375, 0.871307373046875, 0.99224853515625, 1.113189697265625, 1.234130859375, 1.355072021484375, 1.47601318359375, 1.596954345703125, 1.7178955078125, 1.838836669921875, 1.95977783203125, 2.080718994140625, 2.20166015625, 2.322601318359375, 2.44354248046875, 2.564483642578125, 2.6854248046875, 2.806365966796875, 2.92730712890625, 3.048248291015625, 3.169189453125, 3.290130615234375, 3.41107177734375, 3.532012939453125, 3.6529541015625, 3.773895263671875, 3.89483642578125, 4.015777587890625, 4.13671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 14.0, 30.0, 69.0, 154.0, 534.0, 1596.0, 1183.0, 316.0, 97.0, 52.0, 20.0, 4.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.95703125, -3.832794189453125, -3.70855712890625, -3.584320068359375, -3.4600830078125, -3.335845947265625, -3.21160888671875, -3.087371826171875, -2.963134765625, -2.838897705078125, -2.71466064453125, -2.590423583984375, -2.4661865234375, -2.341949462890625, -2.21771240234375, -2.093475341796875, -1.96923828125, -1.845001220703125, -1.72076416015625, -1.596527099609375, -1.4722900390625, -1.348052978515625, -1.22381591796875, -1.099578857421875, -0.975341796875, -0.851104736328125, -0.72686767578125, -0.602630615234375, -0.4783935546875, -0.354156494140625, -0.22991943359375, -0.105682373046875, 0.0185546875, 0.142791748046875, 0.26702880859375, 0.391265869140625, 0.5155029296875, 0.639739990234375, 0.76397705078125, 0.888214111328125, 1.012451171875, 1.136688232421875, 1.26092529296875, 1.385162353515625, 1.5093994140625, 1.633636474609375, 1.75787353515625, 1.882110595703125, 2.00634765625, 2.130584716796875, 2.25482177734375, 2.379058837890625, 2.5032958984375, 2.627532958984375, 2.75177001953125, 2.876007080078125, 3.000244140625, 3.124481201171875, 3.24871826171875, 3.372955322265625, 3.4971923828125, 3.621429443359375, 3.74566650390625, 3.869903564453125, 3.994140625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 8.0, 10.0, 22.0, 60.0, 186.0, 276.0, 224.0, 119.0, 53.0, 19.0, 8.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.307045936584473, -12.55985164642334, -11.812658309936523, -11.06546401977539, -10.318269729614258, -9.571075439453125, -8.823881149291992, -8.076687812805176, -7.329493522644043, -6.58229923248291, -5.8351054191589355, -5.087911605834961, -4.340717315673828, -3.5935232639312744, -2.8463292121887207, -2.099135398864746, -1.3519411087036133, -0.6047470569610596, 0.14244699478149414, 0.8896410465240479, 1.6368350982666016, 2.3840291500091553, 3.131223201751709, 3.8784170150756836, 4.625611305236816, 5.372805595397949, 6.119999408721924, 6.867193222045898, 7.614387512207031, 8.361581802368164, 9.108776092529297, 9.855969429016113, 10.603164672851562, 11.350358963012695, 12.097553253173828, 12.844746589660645, 13.591940879821777, 14.33913516998291, 15.086328506469727, 15.83352279663086, 16.580717086791992, 17.327911376953125, 18.075105667114258, 18.82229995727539, 19.56949234008789, 20.316686630249023, 21.063880920410156, 21.81107521057129, 22.558269500732422, 23.305463790893555, 24.052658081054688, 24.79985237121582, 25.547046661376953, 26.294239044189453, 27.041433334350586, 27.78862762451172, 28.53582191467285, 29.283016204833984, 30.030210494995117, 30.77740478515625, 31.52459716796875, 32.271793365478516, 33.018985748291016, 33.76618194580078, 34.51337432861328]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 4.0, 6.0, 5.0, 11.0, 9.0, 6.0, 15.0, 17.0, 24.0, 18.0, 29.0, 28.0, 34.0, 54.0, 48.0, 57.0, 43.0, 49.0, 38.0, 49.0, 60.0, 51.0, 53.0, 58.0, 28.0, 34.0, 41.0, 32.0, 22.0, 23.0, 12.0, 12.0, 9.0, 9.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-10.2860746383667, -10.0123872756958, -9.738698959350586, -9.465011596679688, -9.191324234008789, -8.91763687133789, -8.643948554992676, -8.370261192321777, -8.096573829650879, -7.822885990142822, -7.549198627471924, -7.275510787963867, -7.001823425292969, -6.728135585784912, -6.4544477462768555, -6.180760383605957, -5.9070725440979, -5.633384704589844, -5.359697341918945, -5.086009502410889, -4.81232213973999, -4.538634300231934, -4.264946937561035, -3.9912590980529785, -3.717571496963501, -3.4438838958740234, -3.170196294784546, -2.8965086936950684, -2.6228208541870117, -2.3491334915161133, -2.0754456520080566, -1.801758050918579, -1.5280704498291016, -1.254382848739624, -0.9806951880455017, -0.7070075273513794, -0.43331992626190186, -0.15963232517242432, 0.11405539512634277, 0.3877429962158203, 0.6614305973052979, 0.9351181983947754, 1.208805799484253, 1.48249351978302, 1.7561811208724976, 2.0298686027526855, 2.303556442260742, 2.5772440433502197, 2.8509316444396973, 3.124619245529175, 3.3983068466186523, 3.671994686126709, 3.9456820487976074, 4.219369888305664, 4.4930572509765625, 4.766745090484619, 5.040432929992676, 5.314120769500732, 5.587808132171631, 5.8614959716796875, 6.135183334350586, 6.408871173858643, 6.682559013366699, 6.956246376037598, 7.229933738708496]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 8.0, 20.0, 20.0, 30.0, 40.0, 77.0, 130.0, 182.0, 297.0, 473.0, 794.0, 1454.0, 2482.0, 4490.0, 8647.0, 16863.0, 34537.0, 68646.0, 129081.0, 203231.0, 224588.0, 163753.0, 92608.0, 47174.0, 23429.0, 11892.0, 5846.0, 3316.0, 1769.0, 1007.0, 636.0, 372.0, 248.0, 137.0, 85.0, 64.0, 44.0, 26.0, 14.0, 10.0, 12.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7451171875, -0.7204666137695312, -0.6958160400390625, -0.6711654663085938, -0.646514892578125, -0.6218643188476562, -0.5972137451171875, -0.5725631713867188, -0.54791259765625, -0.5232620239257812, -0.4986114501953125, -0.47396087646484375, -0.449310302734375, -0.42465972900390625, -0.4000091552734375, -0.37535858154296875, -0.3507080078125, -0.32605743408203125, -0.3014068603515625, -0.27675628662109375, -0.252105712890625, -0.22745513916015625, -0.2028045654296875, -0.17815399169921875, -0.15350341796875, -0.12885284423828125, -0.1042022705078125, -0.07955169677734375, -0.054901123046875, -0.03025054931640625, -0.0055999755859375, 0.01905059814453125, 0.043701171875, 0.06835174560546875, 0.0930023193359375, 0.11765289306640625, 0.142303466796875, 0.16695404052734375, 0.1916046142578125, 0.21625518798828125, 0.24090576171875, 0.26555633544921875, 0.2902069091796875, 0.31485748291015625, 0.339508056640625, 0.36415863037109375, 0.3888092041015625, 0.41345977783203125, 0.4381103515625, 0.46276092529296875, 0.4874114990234375, 0.5120620727539062, 0.536712646484375, 0.5613632202148438, 0.5860137939453125, 0.6106643676757812, 0.63531494140625, 0.6599655151367188, 0.6846160888671875, 0.7092666625976562, 0.733917236328125, 0.7585678100585938, 0.7832183837890625, 0.8078689575195312, 0.83251953125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 10.0, 13.0, 11.0, 18.0, 10.0, 18.0, 21.0, 33.0, 27.0, 33.0, 29.0, 41.0, 38.0, 45.0, 35.0, 47.0, 48.0, 41.0, 58.0, 43.0, 35.0, 38.0, 42.0, 38.0, 34.0, 38.0, 30.0, 23.0, 19.0, 15.0, 23.0, 8.0, 10.0, 11.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71337890625, -0.691925048828125, -0.67047119140625, -0.649017333984375, -0.6275634765625, -0.606109619140625, -0.58465576171875, -0.563201904296875, -0.541748046875, -0.520294189453125, -0.49884033203125, -0.477386474609375, -0.4559326171875, -0.434478759765625, -0.41302490234375, -0.391571044921875, -0.3701171875, -0.348663330078125, -0.32720947265625, -0.305755615234375, -0.2843017578125, -0.262847900390625, -0.24139404296875, -0.219940185546875, -0.198486328125, -0.177032470703125, -0.15557861328125, -0.134124755859375, -0.1126708984375, -0.091217041015625, -0.06976318359375, -0.048309326171875, -0.02685546875, -0.005401611328125, 0.01605224609375, 0.037506103515625, 0.0589599609375, 0.080413818359375, 0.10186767578125, 0.123321533203125, 0.144775390625, 0.166229248046875, 0.18768310546875, 0.209136962890625, 0.2305908203125, 0.252044677734375, 0.27349853515625, 0.294952392578125, 0.31640625, 0.337860107421875, 0.35931396484375, 0.380767822265625, 0.4022216796875, 0.423675537109375, 0.44512939453125, 0.466583251953125, 0.488037109375, 0.509490966796875, 0.53094482421875, 0.552398681640625, 0.5738525390625, 0.595306396484375, 0.61676025390625, 0.638214111328125, 0.65966796875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 11.0, 13.0, 31.0, 36.0, 46.0, 103.0, 189.0, 401.0, 1028.0, 3925.0, 24854.0, 263316.0, 685095.0, 58954.0, 7819.0, 1643.0, 532.0, 240.0, 121.0, 74.0, 44.0, 22.0, 13.0, 12.0, 13.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.861328125, -3.7652587890625, -3.669189453125, -3.5731201171875, -3.47705078125, -3.3809814453125, -3.284912109375, -3.1888427734375, -3.0927734375, -2.9967041015625, -2.900634765625, -2.8045654296875, -2.70849609375, -2.6124267578125, -2.516357421875, -2.4202880859375, -2.32421875, -2.2281494140625, -2.132080078125, -2.0360107421875, -1.93994140625, -1.8438720703125, -1.747802734375, -1.6517333984375, -1.5556640625, -1.4595947265625, -1.363525390625, -1.2674560546875, -1.17138671875, -1.0753173828125, -0.979248046875, -0.8831787109375, -0.787109375, -0.6910400390625, -0.594970703125, -0.4989013671875, -0.40283203125, -0.3067626953125, -0.210693359375, -0.1146240234375, -0.0185546875, 0.0775146484375, 0.173583984375, 0.2696533203125, 0.36572265625, 0.4617919921875, 0.557861328125, 0.6539306640625, 0.75, 0.8460693359375, 0.942138671875, 1.0382080078125, 1.13427734375, 1.2303466796875, 1.326416015625, 1.4224853515625, 1.5185546875, 1.6146240234375, 1.710693359375, 1.8067626953125, 1.90283203125, 1.9989013671875, 2.094970703125, 2.1910400390625, 2.287109375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 5.0, 4.0, 8.0, 5.0, 16.0, 14.0, 19.0, 13.0, 24.0, 23.0, 28.0, 36.0, 38.0, 36.0, 26.0, 53.0, 42.0, 54.0, 34.0, 59.0, 63.0, 34.0, 48.0, 35.0, 35.0, 40.0, 32.0, 25.0, 23.0, 29.0, 18.0, 16.0, 7.0, 4.0, 6.0, 5.0, 8.0, 3.0, 5.0, 6.0, 1.0, 6.0, 2.0, 2.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.318359375, -2.241180419921875, -2.16400146484375, -2.086822509765625, -2.0096435546875, -1.932464599609375, -1.85528564453125, -1.778106689453125, -1.700927734375, -1.623748779296875, -1.54656982421875, -1.469390869140625, -1.3922119140625, -1.315032958984375, -1.23785400390625, -1.160675048828125, -1.08349609375, -1.006317138671875, -0.92913818359375, -0.851959228515625, -0.7747802734375, -0.697601318359375, -0.62042236328125, -0.543243408203125, -0.466064453125, -0.388885498046875, -0.31170654296875, -0.234527587890625, -0.1573486328125, -0.080169677734375, -0.00299072265625, 0.074188232421875, 0.1513671875, 0.228546142578125, 0.30572509765625, 0.382904052734375, 0.4600830078125, 0.537261962890625, 0.61444091796875, 0.691619873046875, 0.768798828125, 0.845977783203125, 0.92315673828125, 1.000335693359375, 1.0775146484375, 1.154693603515625, 1.23187255859375, 1.309051513671875, 1.38623046875, 1.463409423828125, 1.54058837890625, 1.617767333984375, 1.6949462890625, 1.772125244140625, 1.84930419921875, 1.926483154296875, 2.003662109375, 2.080841064453125, 2.15802001953125, 2.235198974609375, 2.3123779296875, 2.389556884765625, 2.46673583984375, 2.543914794921875, 2.62109375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 10.0, 20.0, 17.0, 31.0, 57.0, 99.0, 176.0, 290.0, 518.0, 1058.0, 2246.0, 5096.0, 13239.0, 37278.0, 126909.0, 552656.0, 214808.0, 60576.0, 19974.0, 7337.0, 3089.0, 1434.0, 693.0, 386.0, 217.0, 109.0, 76.0, 40.0, 39.0, 16.0, 19.0, 6.0, 6.0, 2.0, 2.0, 2.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4990234375, -0.4822235107421875, -0.465423583984375, -0.4486236572265625, -0.43182373046875, -0.4150238037109375, -0.398223876953125, -0.3814239501953125, -0.3646240234375, -0.3478240966796875, -0.331024169921875, -0.3142242431640625, -0.29742431640625, -0.2806243896484375, -0.263824462890625, -0.2470245361328125, -0.230224609375, -0.2134246826171875, -0.196624755859375, -0.1798248291015625, -0.16302490234375, -0.1462249755859375, -0.129425048828125, -0.1126251220703125, -0.0958251953125, -0.0790252685546875, -0.062225341796875, -0.0454254150390625, -0.02862548828125, -0.0118255615234375, 0.004974365234375, 0.0217742919921875, 0.03857421875, 0.0553741455078125, 0.072174072265625, 0.0889739990234375, 0.10577392578125, 0.1225738525390625, 0.139373779296875, 0.1561737060546875, 0.1729736328125, 0.1897735595703125, 0.206573486328125, 0.2233734130859375, 0.24017333984375, 0.2569732666015625, 0.273773193359375, 0.2905731201171875, 0.307373046875, 0.3241729736328125, 0.340972900390625, 0.3577728271484375, 0.37457275390625, 0.3913726806640625, 0.408172607421875, 0.4249725341796875, 0.4417724609375, 0.4585723876953125, 0.475372314453125, 0.4921722412109375, 0.50897216796875, 0.5257720947265625, 0.542572021484375, 0.5593719482421875, 0.576171875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 11.0, 17.0, 19.0, 39.0, 56.0, 109.0, 147.0, 154.0, 145.0, 101.0, 64.0, 43.0, 30.0, 16.0, 16.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003688335418701172, -0.0003575049340724945, -0.0003461763262748718, -0.00033484771847724915, -0.00032351911067962646, -0.0003121905028820038, -0.0003008618950843811, -0.0002895332872867584, -0.00027820467948913574, -0.00026687607169151306, -0.0002555474638938904, -0.0002442188560962677, -0.00023289024829864502, -0.00022156164050102234, -0.00021023303270339966, -0.00019890442490577698, -0.0001875758171081543, -0.00017624720931053162, -0.00016491860151290894, -0.00015358999371528625, -0.00014226138591766357, -0.0001309327781200409, -0.00011960417032241821, -0.00010827556252479553, -9.694695472717285e-05, -8.561834692955017e-05, -7.428973913192749e-05, -6.296113133430481e-05, -5.163252353668213e-05, -4.030391573905945e-05, -2.8975307941436768e-05, -1.7646700143814087e-05, -6.318092346191406e-06, 5.010515451431274e-06, 1.6339123249053955e-05, 2.7667731046676636e-05, 3.8996338844299316e-05, 5.0324946641922e-05, 6.165355443954468e-05, 7.298216223716736e-05, 8.431077003479004e-05, 9.563937783241272e-05, 0.0001069679856300354, 0.00011829659342765808, 0.00012962520122528076, 0.00014095380902290344, 0.00015228241682052612, 0.0001636110246181488, 0.00017493963241577148, 0.00018626824021339417, 0.00019759684801101685, 0.00020892545580863953, 0.0002202540636062622, 0.0002315826714038849, 0.00024291127920150757, 0.00025423988699913025, 0.00026556849479675293, 0.0002768971025943756, 0.0002882257103919983, 0.00029955431818962097, 0.00031088292598724365, 0.00032221153378486633, 0.000333540141582489, 0.0003448687493801117, 0.0003561973571777344]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 9.0, 12.0, 25.0, 33.0, 74.0, 137.0, 292.0, 722.0, 2157.0, 8946.0, 52022.0, 392390.0, 524518.0, 54376.0, 9289.0, 2265.0, 688.0, 284.0, 138.0, 57.0, 42.0, 15.0, 16.0, 16.0, 5.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0283203125, -1.0019607543945312, -0.9756011962890625, -0.9492416381835938, -0.922882080078125, -0.8965225219726562, -0.8701629638671875, -0.8438034057617188, -0.81744384765625, -0.7910842895507812, -0.7647247314453125, -0.7383651733398438, -0.712005615234375, -0.6856460571289062, -0.6592864990234375, -0.6329269409179688, -0.6065673828125, -0.5802078247070312, -0.5538482666015625, -0.5274887084960938, -0.501129150390625, -0.47476959228515625, -0.4484100341796875, -0.42205047607421875, -0.39569091796875, -0.36933135986328125, -0.3429718017578125, -0.31661224365234375, -0.290252685546875, -0.26389312744140625, -0.2375335693359375, -0.21117401123046875, -0.184814453125, -0.15845489501953125, -0.1320953369140625, -0.10573577880859375, -0.079376220703125, -0.05301666259765625, -0.0266571044921875, -0.00029754638671875, 0.02606201171875, 0.05242156982421875, 0.0787811279296875, 0.10514068603515625, 0.131500244140625, 0.15785980224609375, 0.1842193603515625, 0.21057891845703125, 0.2369384765625, 0.26329803466796875, 0.2896575927734375, 0.31601715087890625, 0.342376708984375, 0.36873626708984375, 0.3950958251953125, 0.42145538330078125, 0.44781494140625, 0.47417449951171875, 0.5005340576171875, 0.5268936157226562, 0.553253173828125, 0.5796127319335938, 0.6059722900390625, 0.6323318481445312, 0.65869140625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 10.0, 6.0, 13.0, 17.0, 18.0, 23.0, 33.0, 43.0, 41.0, 73.0, 75.0, 89.0, 93.0, 71.0, 74.0, 69.0, 53.0, 46.0, 39.0, 33.0, 22.0, 18.0, 15.0, 15.0, 4.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.578125, -0.5546722412109375, -0.531219482421875, -0.5077667236328125, -0.48431396484375, -0.4608612060546875, -0.437408447265625, -0.4139556884765625, -0.3905029296875, -0.3670501708984375, -0.343597412109375, -0.3201446533203125, -0.29669189453125, -0.2732391357421875, -0.249786376953125, -0.2263336181640625, -0.202880859375, -0.1794281005859375, -0.155975341796875, -0.1325225830078125, -0.10906982421875, -0.0856170654296875, -0.062164306640625, -0.0387115478515625, -0.0152587890625, 0.0081939697265625, 0.031646728515625, 0.0550994873046875, 0.07855224609375, 0.1020050048828125, 0.125457763671875, 0.1489105224609375, 0.17236328125, 0.1958160400390625, 0.219268798828125, 0.2427215576171875, 0.26617431640625, 0.2896270751953125, 0.313079833984375, 0.3365325927734375, 0.3599853515625, 0.3834381103515625, 0.406890869140625, 0.4303436279296875, 0.45379638671875, 0.4772491455078125, 0.500701904296875, 0.5241546630859375, 0.547607421875, 0.5710601806640625, 0.594512939453125, 0.6179656982421875, 0.64141845703125, 0.6648712158203125, 0.688323974609375, 0.7117767333984375, 0.7352294921875, 0.7586822509765625, 0.782135009765625, 0.8055877685546875, 0.82904052734375, 0.8524932861328125, 0.875946044921875, 0.8993988037109375, 0.9228515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 14.0, 21.0, 40.0, 99.0, 166.0, 329.0, 192.0, 81.0, 29.0, 14.0, 6.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.855045318603516, -34.05562210083008, -33.256202697753906, -32.45677947998047, -31.657358169555664, -30.85793685913086, -30.058513641357422, -29.259092330932617, -28.459671020507812, -27.660249710083008, -26.860828399658203, -26.061405181884766, -25.26198387145996, -24.462562561035156, -23.66313934326172, -22.863718032836914, -22.06429672241211, -21.264875411987305, -20.4654541015625, -19.666030883789062, -18.866609573364258, -18.067188262939453, -17.267765045166016, -16.46834373474121, -15.668922424316406, -14.869501113891602, -14.07007884979248, -13.27065658569336, -12.471235275268555, -11.67181396484375, -10.872391700744629, -10.072969436645508, -9.273548126220703, -8.474126815795898, -7.674704551696777, -6.8752827644348145, -6.075860977172852, -5.276439189910889, -4.477017402648926, -3.677595615386963, -2.878173828125, -2.078752040863037, -1.2793302536010742, -0.47990846633911133, 0.31951332092285156, 1.1189351081848145, 1.9183568954467773, 2.7177786827087402, 3.517200469970703, 4.316622257232666, 5.116044044494629, 5.915465831756592, 6.714887619018555, 7.514309406280518, 8.31373119354248, 9.113153457641602, 9.912574768066406, 10.711996078491211, 11.511418342590332, 12.310840606689453, 13.110261917114258, 13.909683227539062, 14.709105491638184, 15.508527755737305, 16.30794906616211]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 9.0, 7.0, 6.0, 9.0, 12.0, 7.0, 11.0, 18.0, 17.0, 15.0, 29.0, 33.0, 33.0, 24.0, 33.0, 38.0, 44.0, 44.0, 77.0, 73.0, 75.0, 50.0, 39.0, 44.0, 30.0, 22.0, 31.0, 27.0, 17.0, 22.0, 14.0, 16.0, 11.0, 10.0, 15.0, 7.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-11.15542221069336, -10.822574615478516, -10.489727020263672, -10.156880378723145, -9.8240327835083, -9.491185188293457, -9.158337593078613, -8.825490951538086, -8.492643356323242, -8.159795761108398, -7.826948642730713, -7.494101047515869, -7.161253929138184, -6.82840633392334, -6.495558738708496, -6.1627116203308105, -5.829864025115967, -5.497016429901123, -5.1641693115234375, -4.831321716308594, -4.498474597930908, -4.1656270027160645, -3.8327796459198, -3.499932289123535, -3.1670849323272705, -2.834237575531006, -2.501390218734741, -2.1685428619384766, -1.8356953859329224, -1.5028480291366577, -1.1700005531311035, -0.8371531963348389, -0.5043058395385742, -0.17145845293998718, 0.16138893365859985, 0.4942363500595093, 0.8270837068557739, 1.1599310636520386, 1.4927785396575928, 1.8256258964538574, 2.158473253250122, 2.4913206100463867, 2.8241679668426514, 3.157015323638916, 3.4898629188537598, 3.8227100372314453, 4.155557632446289, 4.488405227661133, 4.821252346038818, 5.154099941253662, 5.486947059631348, 5.819794654846191, 6.152641773223877, 6.485489368438721, 6.818336486816406, 7.15118408203125, 7.484031677246094, 7.8168792724609375, 8.149726867675781, 8.482573509216309, 8.815421104431152, 9.148268699645996, 9.48111629486084, 9.813962936401367, 10.146810531616211]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 19.0, 19.0, 22.0, 33.0, 68.0, 99.0, 158.0, 250.0, 389.0, 620.0, 1185.0, 2440.0, 5490.0, 15645.0, 57658.0, 274725.0, 1244048.0, 1866085.0, 566245.0, 115034.0, 27873.0, 8877.0, 3519.0, 1668.0, 897.0, 459.0, 284.0, 172.0, 88.0, 68.0, 47.0, 24.0, 22.0, 15.0, 6.0, 16.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.75439453125, -0.7329788208007812, -0.7115631103515625, -0.6901473999023438, -0.668731689453125, -0.6473159790039062, -0.6259002685546875, -0.6044845581054688, -0.58306884765625, -0.5616531372070312, -0.5402374267578125, -0.5188217163085938, -0.497406005859375, -0.47599029541015625, -0.4545745849609375, -0.43315887451171875, -0.4117431640625, -0.39032745361328125, -0.3689117431640625, -0.34749603271484375, -0.326080322265625, -0.30466461181640625, -0.2832489013671875, -0.26183319091796875, -0.24041748046875, -0.21900177001953125, -0.1975860595703125, -0.17617034912109375, -0.154754638671875, -0.13333892822265625, -0.1119232177734375, -0.09050750732421875, -0.069091796875, -0.04767608642578125, -0.0262603759765625, -0.00484466552734375, 0.016571044921875, 0.03798675537109375, 0.0594024658203125, 0.08081817626953125, 0.10223388671875, 0.12364959716796875, 0.1450653076171875, 0.16648101806640625, 0.187896728515625, 0.20931243896484375, 0.2307281494140625, 0.25214385986328125, 0.2735595703125, 0.29497528076171875, 0.3163909912109375, 0.33780670166015625, 0.359222412109375, 0.38063812255859375, 0.4020538330078125, 0.42346954345703125, 0.44488525390625, 0.46630096435546875, 0.4877166748046875, 0.5091323852539062, 0.530548095703125, 0.5519638061523438, 0.5733795166015625, 0.5947952270507812, 0.6162109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 4.0, 3.0, 1.0, 9.0, 6.0, 14.0, 10.0, 9.0, 23.0, 23.0, 22.0, 21.0, 35.0, 29.0, 48.0, 28.0, 42.0, 43.0, 47.0, 55.0, 37.0, 49.0, 55.0, 45.0, 35.0, 40.0, 48.0, 31.0, 31.0, 32.0, 18.0, 20.0, 21.0, 11.0, 14.0, 8.0, 7.0, 8.0, 7.0, 6.0, 2.0, 2.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6595535278320312, -0.6399078369140625, -0.6202621459960938, -0.600616455078125, -0.5809707641601562, -0.5613250732421875, -0.5416793823242188, -0.52203369140625, -0.5023880004882812, -0.4827423095703125, -0.46309661865234375, -0.443450927734375, -0.42380523681640625, -0.4041595458984375, -0.38451385498046875, -0.3648681640625, -0.34522247314453125, -0.3255767822265625, -0.30593109130859375, -0.286285400390625, -0.26663970947265625, -0.2469940185546875, -0.22734832763671875, -0.20770263671875, -0.18805694580078125, -0.1684112548828125, -0.14876556396484375, -0.129119873046875, -0.10947418212890625, -0.0898284912109375, -0.07018280029296875, -0.050537109375, -0.03089141845703125, -0.0112457275390625, 0.00839996337890625, 0.028045654296875, 0.04769134521484375, 0.0673370361328125, 0.08698272705078125, 0.10662841796875, 0.12627410888671875, 0.1459197998046875, 0.16556549072265625, 0.185211181640625, 0.20485687255859375, 0.2245025634765625, 0.24414825439453125, 0.2637939453125, 0.28343963623046875, 0.3030853271484375, 0.32273101806640625, 0.342376708984375, 0.36202239990234375, 0.3816680908203125, 0.40131378173828125, 0.42095947265625, 0.44060516357421875, 0.4602508544921875, 0.47989654541015625, 0.499542236328125, 0.5191879272460938, 0.5388336181640625, 0.5584793090820312, 0.578125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 9.0, 15.0, 16.0, 20.0, 46.0, 73.0, 117.0, 220.0, 516.0, 1163.0, 3633.0, 26255.0, 1113403.0, 2991733.0, 49127.0, 5288.0, 1451.0, 578.0, 288.0, 159.0, 74.0, 36.0, 15.0, 17.0, 5.0, 9.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.240234375, -2.168243408203125, -2.09625244140625, -2.024261474609375, -1.9522705078125, -1.880279541015625, -1.80828857421875, -1.736297607421875, -1.664306640625, -1.592315673828125, -1.52032470703125, -1.448333740234375, -1.3763427734375, -1.304351806640625, -1.23236083984375, -1.160369873046875, -1.08837890625, -1.016387939453125, -0.94439697265625, -0.872406005859375, -0.8004150390625, -0.728424072265625, -0.65643310546875, -0.584442138671875, -0.512451171875, -0.440460205078125, -0.36846923828125, -0.296478271484375, -0.2244873046875, -0.152496337890625, -0.08050537109375, -0.008514404296875, 0.0634765625, 0.135467529296875, 0.20745849609375, 0.279449462890625, 0.3514404296875, 0.423431396484375, 0.49542236328125, 0.567413330078125, 0.639404296875, 0.711395263671875, 0.78338623046875, 0.855377197265625, 0.9273681640625, 0.999359130859375, 1.07135009765625, 1.143341064453125, 1.21533203125, 1.287322998046875, 1.35931396484375, 1.431304931640625, 1.5032958984375, 1.575286865234375, 1.64727783203125, 1.719268798828125, 1.791259765625, 1.863250732421875, 1.93524169921875, 2.007232666015625, 2.0792236328125, 2.151214599609375, 2.22320556640625, 2.295196533203125, 2.3671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 14.0, 11.0, 20.0, 31.0, 44.0, 60.0, 118.0, 217.0, 355.0, 607.0, 800.0, 698.0, 455.0, 250.0, 134.0, 83.0, 48.0, 42.0, 32.0, 15.0, 6.0, 9.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802734375, -1.7476654052734375, -1.692596435546875, -1.6375274658203125, -1.58245849609375, -1.5273895263671875, -1.472320556640625, -1.4172515869140625, -1.3621826171875, -1.3071136474609375, -1.252044677734375, -1.1969757080078125, -1.14190673828125, -1.0868377685546875, -1.031768798828125, -0.9766998291015625, -0.921630859375, -0.8665618896484375, -0.811492919921875, -0.7564239501953125, -0.70135498046875, -0.6462860107421875, -0.591217041015625, -0.5361480712890625, -0.4810791015625, -0.4260101318359375, -0.370941162109375, -0.3158721923828125, -0.26080322265625, -0.2057342529296875, -0.150665283203125, -0.0955963134765625, -0.04052734375, 0.0145416259765625, 0.069610595703125, 0.1246795654296875, 0.17974853515625, 0.2348175048828125, 0.289886474609375, 0.3449554443359375, 0.4000244140625, 0.4550933837890625, 0.510162353515625, 0.5652313232421875, 0.62030029296875, 0.6753692626953125, 0.730438232421875, 0.7855072021484375, 0.840576171875, 0.8956451416015625, 0.950714111328125, 1.0057830810546875, 1.06085205078125, 1.1159210205078125, 1.170989990234375, 1.2260589599609375, 1.2811279296875, 1.3361968994140625, 1.391265869140625, 1.4463348388671875, 1.50140380859375, 1.5564727783203125, 1.611541748046875, 1.6666107177734375, 1.7216796875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 4.0, 8.0, 19.0, 26.0, 48.0, 79.0, 151.0, 143.0, 159.0, 133.0, 108.0, 61.0, 25.0, 13.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.149273872375488, -7.768694877624512, -7.388116359710693, -7.007537364959717, -6.626958847045898, -6.246379852294922, -5.865800857543945, -5.485221862792969, -5.10464334487915, -4.724064350128174, -4.3434858322143555, -3.962906837463379, -3.5823280811309814, -3.201749324798584, -2.8211703300476074, -2.44059157371521, -2.0600128173828125, -1.679434061050415, -1.298855185508728, -0.918276309967041, -0.5376975536346436, -0.1571187973022461, 0.22346019744873047, 0.6040389537811279, 0.9846177101135254, 1.3651964664459229, 1.7457753419876099, 2.126354217529297, 2.5069329738616943, 2.887511730194092, 3.2680907249450684, 3.648669481277466, 4.02924919128418, 4.409828186035156, 4.790406703948975, 5.170985698699951, 5.5515642166137695, 5.932143211364746, 6.312722206115723, 6.693301200866699, 7.073879718780518, 7.454458713531494, 7.8350372314453125, 8.215616226196289, 8.596195220947266, 8.976774215698242, 9.357353210449219, 9.737931251525879, 10.118510246276855, 10.499089241027832, 10.879668235778809, 11.260246276855469, 11.640825271606445, 12.021404266357422, 12.401983261108398, 12.782562255859375, 13.163141250610352, 13.543720245361328, 13.924299240112305, 14.304878234863281, 14.685456275939941, 15.066035270690918, 15.446614265441895, 15.827193260192871, 16.20777130126953]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 7.0, 15.0, 17.0, 16.0, 21.0, 27.0, 32.0, 30.0, 49.0, 50.0, 38.0, 56.0, 73.0, 60.0, 72.0, 53.0, 59.0, 49.0, 46.0, 32.0, 32.0, 33.0, 30.0, 17.0, 16.0, 19.0, 11.0, 7.0, 12.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.081058502197266, -6.836199760437012, -6.591341495513916, -6.346482753753662, -6.101624488830566, -5.8567657470703125, -5.611907005310059, -5.367048740386963, -5.122190475463867, -4.877331733703613, -4.632473468780518, -4.387614727020264, -4.142756462097168, -3.897897720336914, -3.6530392169952393, -3.4081807136535645, -3.1633219718933105, -2.9184634685516357, -2.673604965209961, -2.428746223449707, -2.1838879585266113, -1.939029335975647, -1.6941707134246826, -1.4493122100830078, -1.204453706741333, -0.9595952033996582, -0.7147366404533386, -0.46987807750701904, -0.22501957416534424, 0.019838929176330566, 0.2646975517272949, 0.5095560550689697, 0.7544145584106445, 0.9992730617523193, 1.2441315650939941, 1.4889901876449585, 1.7338486909866333, 1.978707194328308, 2.2235658168792725, 2.4684243202209473, 2.713282823562622, 2.958141326904297, 3.2029998302459717, 3.4478583335876465, 3.6927170753479004, 3.937575340270996, 4.18243408203125, 4.427292823791504, 4.6721510887146, 4.9170098304748535, 5.161868095397949, 5.406726837158203, 5.651585102081299, 5.896443843841553, 6.141302108764648, 6.386160850524902, 6.631019592285156, 6.87587833404541, 7.120736598968506, 7.36559534072876, 7.6104536056518555, 7.855312347412109, 8.100171089172363, 8.345029830932617, 8.589887619018555]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 13.0, 22.0, 16.0, 30.0, 57.0, 62.0, 113.0, 152.0, 266.0, 410.0, 635.0, 1103.0, 1959.0, 3326.0, 6205.0, 11379.0, 21732.0, 41598.0, 79800.0, 146213.0, 223435.0, 215456.0, 137174.0, 74127.0, 38934.0, 20326.0, 10693.0, 5625.0, 3067.0, 1754.0, 1114.0, 629.0, 376.0, 255.0, 151.0, 106.0, 67.0, 45.0, 36.0, 22.0, 13.0, 15.0, 11.0, 5.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.7548828125, -0.7326431274414062, -0.7104034423828125, -0.6881637573242188, -0.665924072265625, -0.6436843872070312, -0.6214447021484375, -0.5992050170898438, -0.57696533203125, -0.5547256469726562, -0.5324859619140625, -0.5102462768554688, -0.488006591796875, -0.46576690673828125, -0.4435272216796875, -0.42128753662109375, -0.3990478515625, -0.37680816650390625, -0.3545684814453125, -0.33232879638671875, -0.310089111328125, -0.28784942626953125, -0.2656097412109375, -0.24337005615234375, -0.22113037109375, -0.19889068603515625, -0.1766510009765625, -0.15441131591796875, -0.132171630859375, -0.10993194580078125, -0.0876922607421875, -0.06545257568359375, -0.043212890625, -0.02097320556640625, 0.0012664794921875, 0.02350616455078125, 0.045745849609375, 0.06798553466796875, 0.0902252197265625, 0.11246490478515625, 0.13470458984375, 0.15694427490234375, 0.1791839599609375, 0.20142364501953125, 0.223663330078125, 0.24590301513671875, 0.2681427001953125, 0.29038238525390625, 0.3126220703125, 0.33486175537109375, 0.3571014404296875, 0.37934112548828125, 0.401580810546875, 0.42382049560546875, 0.4460601806640625, 0.46829986572265625, 0.49053955078125, 0.5127792358398438, 0.5350189208984375, 0.5572586059570312, 0.579498291015625, 0.6017379760742188, 0.6239776611328125, 0.6462173461914062, 0.66845703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 7.0, 7.0, 3.0, 6.0, 14.0, 18.0, 22.0, 20.0, 24.0, 36.0, 29.0, 44.0, 53.0, 48.0, 68.0, 48.0, 61.0, 57.0, 51.0, 60.0, 48.0, 36.0, 55.0, 34.0, 43.0, 17.0, 15.0, 25.0, 13.0, 11.0, 9.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8759765625, -0.8508224487304688, -0.8256683349609375, -0.8005142211914062, -0.775360107421875, -0.7502059936523438, -0.7250518798828125, -0.6998977661132812, -0.67474365234375, -0.6495895385742188, -0.6244354248046875, -0.5992813110351562, -0.574127197265625, -0.5489730834960938, -0.5238189697265625, -0.49866485595703125, -0.4735107421875, -0.44835662841796875, -0.4232025146484375, -0.39804840087890625, -0.372894287109375, -0.34774017333984375, -0.3225860595703125, -0.29743194580078125, -0.27227783203125, -0.24712371826171875, -0.2219696044921875, -0.19681549072265625, -0.171661376953125, -0.14650726318359375, -0.1213531494140625, -0.09619903564453125, -0.071044921875, -0.04589080810546875, -0.0207366943359375, 0.00441741943359375, 0.029571533203125, 0.05472564697265625, 0.0798797607421875, 0.10503387451171875, 0.13018798828125, 0.15534210205078125, 0.1804962158203125, 0.20565032958984375, 0.230804443359375, 0.25595855712890625, 0.2811126708984375, 0.30626678466796875, 0.3314208984375, 0.35657501220703125, 0.3817291259765625, 0.40688323974609375, 0.432037353515625, 0.45719146728515625, 0.4823455810546875, 0.5074996948242188, 0.53265380859375, 0.5578079223632812, 0.5829620361328125, 0.6081161499023438, 0.633270263671875, 0.6584243774414062, 0.6835784912109375, 0.7087326049804688, 0.73388671875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 4.0, 5.0, 11.0, 14.0, 16.0, 19.0, 33.0, 40.0, 62.0, 111.0, 180.0, 274.0, 465.0, 850.0, 2159.0, 6746.0, 35104.0, 281289.0, 646502.0, 59388.0, 10001.0, 2802.0, 1067.0, 576.0, 288.0, 185.0, 126.0, 75.0, 44.0, 37.0, 24.0, 19.0, 8.0, 6.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.56640625, -2.48895263671875, -2.4114990234375, -2.33404541015625, -2.256591796875, -2.17913818359375, -2.1016845703125, -2.02423095703125, -1.94677734375, -1.86932373046875, -1.7918701171875, -1.71441650390625, -1.636962890625, -1.55950927734375, -1.4820556640625, -1.40460205078125, -1.3271484375, -1.24969482421875, -1.1722412109375, -1.09478759765625, -1.017333984375, -0.93988037109375, -0.8624267578125, -0.78497314453125, -0.70751953125, -0.63006591796875, -0.5526123046875, -0.47515869140625, -0.397705078125, -0.32025146484375, -0.2427978515625, -0.16534423828125, -0.087890625, -0.01043701171875, 0.0670166015625, 0.14447021484375, 0.221923828125, 0.29937744140625, 0.3768310546875, 0.45428466796875, 0.53173828125, 0.60919189453125, 0.6866455078125, 0.76409912109375, 0.841552734375, 0.91900634765625, 0.9964599609375, 1.07391357421875, 1.1513671875, 1.22882080078125, 1.3062744140625, 1.38372802734375, 1.461181640625, 1.53863525390625, 1.6160888671875, 1.69354248046875, 1.77099609375, 1.84844970703125, 1.9259033203125, 2.00335693359375, 2.080810546875, 2.15826416015625, 2.2357177734375, 2.31317138671875, 2.390625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 9.0, 10.0, 10.0, 9.0, 19.0, 23.0, 14.0, 30.0, 36.0, 39.0, 43.0, 51.0, 75.0, 57.0, 80.0, 60.0, 56.0, 62.0, 60.0, 45.0, 37.0, 34.0, 38.0, 24.0, 15.0, 16.0, 9.0, 8.0, 6.0, 0.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.73828125, -2.633453369140625, -2.52862548828125, -2.423797607421875, -2.3189697265625, -2.214141845703125, -2.10931396484375, -2.004486083984375, -1.899658203125, -1.794830322265625, -1.69000244140625, -1.585174560546875, -1.4803466796875, -1.375518798828125, -1.27069091796875, -1.165863037109375, -1.06103515625, -0.956207275390625, -0.85137939453125, -0.746551513671875, -0.6417236328125, -0.536895751953125, -0.43206787109375, -0.327239990234375, -0.222412109375, -0.117584228515625, -0.01275634765625, 0.092071533203125, 0.1968994140625, 0.301727294921875, 0.40655517578125, 0.511383056640625, 0.6162109375, 0.721038818359375, 0.82586669921875, 0.930694580078125, 1.0355224609375, 1.140350341796875, 1.24517822265625, 1.350006103515625, 1.454833984375, 1.559661865234375, 1.66448974609375, 1.769317626953125, 1.8741455078125, 1.978973388671875, 2.08380126953125, 2.188629150390625, 2.29345703125, 2.398284912109375, 2.50311279296875, 2.607940673828125, 2.7127685546875, 2.817596435546875, 2.92242431640625, 3.027252197265625, 3.132080078125, 3.236907958984375, 3.34173583984375, 3.446563720703125, 3.5513916015625, 3.656219482421875, 3.76104736328125, 3.865875244140625, 3.970703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 7.0, 7.0, 8.0, 3.0, 14.0, 19.0, 17.0, 24.0, 37.0, 61.0, 98.0, 125.0, 234.0, 386.0, 786.0, 1553.0, 3600.0, 9300.0, 27990.0, 100194.0, 610582.0, 213967.0, 52849.0, 16244.0, 5755.0, 2314.0, 1040.0, 500.0, 300.0, 186.0, 111.0, 73.0, 41.0, 33.0, 28.0, 20.0, 17.0, 11.0, 7.0, 2.0, 8.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.5517578125, -0.5363273620605469, -0.5208969116210938, -0.5054664611816406, -0.4900360107421875, -0.4746055603027344, -0.45917510986328125, -0.4437446594238281, -0.428314208984375, -0.4128837585449219, -0.39745330810546875, -0.3820228576660156, -0.3665924072265625, -0.3511619567871094, -0.33573150634765625, -0.3203010559082031, -0.30487060546875, -0.2894401550292969, -0.27400970458984375, -0.2585792541503906, -0.2431488037109375, -0.22771835327148438, -0.21228790283203125, -0.19685745239257812, -0.181427001953125, -0.16599655151367188, -0.15056610107421875, -0.13513565063476562, -0.1197052001953125, -0.10427474975585938, -0.08884429931640625, -0.07341384887695312, -0.0579833984375, -0.042552947998046875, -0.02712249755859375, -0.011692047119140625, 0.0037384033203125, 0.019168853759765625, 0.03459930419921875, 0.050029754638671875, 0.065460205078125, 0.08089065551757812, 0.09632110595703125, 0.11175155639648438, 0.1271820068359375, 0.14261245727539062, 0.15804290771484375, 0.17347335815429688, 0.18890380859375, 0.20433425903320312, 0.21976470947265625, 0.23519515991210938, 0.2506256103515625, 0.2660560607910156, 0.28148651123046875, 0.2969169616699219, 0.312347412109375, 0.3277778625488281, 0.34320831298828125, 0.3586387634277344, 0.3740692138671875, 0.3894996643066406, 0.40493011474609375, 0.4203605651855469, 0.435791015625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 4.0, 4.0, 3.0, 8.0, 6.0, 14.0, 6.0, 15.0, 17.0, 20.0, 35.0, 50.0, 61.0, 86.0, 103.0, 93.0, 115.0, 78.0, 55.0, 45.0, 47.0, 31.0, 28.0, 25.0, 18.0, 8.0, 7.0, 4.0, 5.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0001710653305053711, -0.00016509182751178741, -0.00015911832451820374, -0.00015314482152462006, -0.00014717131853103638, -0.0001411978155374527, -0.00013522431254386902, -0.00012925080955028534, -0.00012327730655670166, -0.00011730380356311798, -0.0001113303005695343, -0.00010535679757595062, -9.938329458236694e-05, -9.340979158878326e-05, -8.743628859519958e-05, -8.14627856016159e-05, -7.548928260803223e-05, -6.951577961444855e-05, -6.354227662086487e-05, -5.756877362728119e-05, -5.159527063369751e-05, -4.562176764011383e-05, -3.964826464653015e-05, -3.367476165294647e-05, -2.7701258659362793e-05, -2.1727755665779114e-05, -1.5754252672195435e-05, -9.780749678611755e-06, -3.807246685028076e-06, 2.166256308555603e-06, 8.139759302139282e-06, 1.4113262295722961e-05, 2.008676528930664e-05, 2.606026828289032e-05, 3.2033771276474e-05, 3.800727427005768e-05, 4.398077726364136e-05, 4.995428025722504e-05, 5.5927783250808716e-05, 6.19012862443924e-05, 6.787478923797607e-05, 7.384829223155975e-05, 7.982179522514343e-05, 8.579529821872711e-05, 9.176880121231079e-05, 9.774230420589447e-05, 0.00010371580719947815, 0.00010968931019306183, 0.00011566281318664551, 0.00012163631618022919, 0.00012760981917381287, 0.00013358332216739655, 0.00013955682516098022, 0.0001455303281545639, 0.00015150383114814758, 0.00015747733414173126, 0.00016345083713531494, 0.00016942434012889862, 0.0001753978431224823, 0.00018137134611606598, 0.00018734484910964966, 0.00019331835210323334, 0.00019929185509681702, 0.0002052653580904007, 0.00021123886108398438]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 8.0, 3.0, 9.0, 23.0, 19.0, 25.0, 34.0, 58.0, 115.0, 220.0, 329.0, 569.0, 1303.0, 3572.0, 12524.0, 61871.0, 630410.0, 280794.0, 42019.0, 9425.0, 2808.0, 1139.0, 582.0, 282.0, 140.0, 90.0, 71.0, 41.0, 15.0, 12.0, 7.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.66943359375, -0.649078369140625, -0.62872314453125, -0.608367919921875, -0.5880126953125, -0.567657470703125, -0.54730224609375, -0.526947021484375, -0.506591796875, -0.486236572265625, -0.46588134765625, -0.445526123046875, -0.4251708984375, -0.404815673828125, -0.38446044921875, -0.364105224609375, -0.34375, -0.323394775390625, -0.30303955078125, -0.282684326171875, -0.2623291015625, -0.241973876953125, -0.22161865234375, -0.201263427734375, -0.180908203125, -0.160552978515625, -0.14019775390625, -0.119842529296875, -0.0994873046875, -0.079132080078125, -0.05877685546875, -0.038421630859375, -0.01806640625, 0.002288818359375, 0.02264404296875, 0.042999267578125, 0.0633544921875, 0.083709716796875, 0.10406494140625, 0.124420166015625, 0.144775390625, 0.165130615234375, 0.18548583984375, 0.205841064453125, 0.2261962890625, 0.246551513671875, 0.26690673828125, 0.287261962890625, 0.3076171875, 0.327972412109375, 0.34832763671875, 0.368682861328125, 0.3890380859375, 0.409393310546875, 0.42974853515625, 0.450103759765625, 0.470458984375, 0.490814208984375, 0.51116943359375, 0.531524658203125, 0.5518798828125, 0.572235107421875, 0.59259033203125, 0.612945556640625, 0.63330078125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 9.0, 5.0, 10.0, 8.0, 11.0, 10.0, 13.0, 22.0, 20.0, 20.0, 40.0, 43.0, 48.0, 76.0, 80.0, 86.0, 66.0, 72.0, 66.0, 59.0, 42.0, 38.0, 32.0, 23.0, 12.0, 22.0, 10.0, 6.0, 6.0, 7.0, 9.0, 5.0, 3.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.5023002624511719, -0.48653411865234375, -0.4707679748535156, -0.4550018310546875, -0.4392356872558594, -0.42346954345703125, -0.4077033996582031, -0.391937255859375, -0.3761711120605469, -0.36040496826171875, -0.3446388244628906, -0.3288726806640625, -0.3131065368652344, -0.29734039306640625, -0.2815742492675781, -0.26580810546875, -0.2500419616699219, -0.23427581787109375, -0.21850967407226562, -0.2027435302734375, -0.18697738647460938, -0.17121124267578125, -0.15544509887695312, -0.139678955078125, -0.12391281127929688, -0.10814666748046875, -0.09238052368164062, -0.0766143798828125, -0.060848236083984375, -0.04508209228515625, -0.029315948486328125, -0.0135498046875, 0.002216339111328125, 0.01798248291015625, 0.033748626708984375, 0.0495147705078125, 0.06528091430664062, 0.08104705810546875, 0.09681320190429688, 0.112579345703125, 0.12834548950195312, 0.14411163330078125, 0.15987777709960938, 0.1756439208984375, 0.19141006469726562, 0.20717620849609375, 0.22294235229492188, 0.23870849609375, 0.2544746398925781, 0.27024078369140625, 0.2860069274902344, 0.3017730712890625, 0.3175392150878906, 0.33330535888671875, 0.3490715026855469, 0.364837646484375, 0.3806037902832031, 0.39636993408203125, 0.4121360778808594, 0.4279022216796875, 0.4436683654785156, 0.45943450927734375, 0.4752006530761719, 0.490966796875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 18.0, 10.0, 29.0, 51.0, 102.0, 170.0, 298.0, 132.0, 79.0, 58.0, 23.0, 11.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.802608489990234, -20.228418350219727, -19.65422821044922, -19.08003807067871, -18.505847930908203, -17.931657791137695, -17.357467651367188, -16.783279418945312, -16.209087371826172, -15.634897232055664, -15.060707092285156, -14.486516952514648, -13.91232681274414, -13.338136672973633, -12.763947486877441, -12.189757347106934, -11.615568161010742, -11.041378021240234, -10.467187881469727, -9.892997741699219, -9.318807601928711, -8.744617462158203, -8.170428276062012, -7.596238136291504, -7.022047996520996, -6.447857856750488, -5.8736677169799805, -5.299478054046631, -4.725287914276123, -4.151097774505615, -3.5769078731536865, -3.002717971801758, -2.428529739379883, -1.8543397188186646, -1.2801496982574463, -0.705959677696228, -0.13176965713500977, 0.44242048263549805, 1.0166103839874268, 1.5908002853393555, 2.1649904251098633, 2.739180564880371, 3.3133704662323, 3.8875603675842285, 4.461750507354736, 5.035940647125244, 5.610130310058594, 6.184320449829102, 6.758510589599609, 7.332700729370117, 7.906890869140625, 8.481081008911133, 9.05527114868164, 9.629461288452148, 10.20365047454834, 10.777840614318848, 11.352030754089355, 11.926220893859863, 12.500411033630371, 13.074601173400879, 13.64879035949707, 14.222980499267578, 14.797170639038086, 15.371360778808594, 15.945550918579102]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 0.0, 2.0, 1.0, 6.0, 5.0, 4.0, 8.0, 12.0, 12.0, 16.0, 22.0, 27.0, 30.0, 22.0, 29.0, 22.0, 32.0, 41.0, 50.0, 81.0, 116.0, 99.0, 57.0, 44.0, 38.0, 32.0, 34.0, 25.0, 31.0, 19.0, 14.0, 9.0, 8.0, 8.0, 11.0, 8.0, 2.0, 7.0, 10.0, 1.0, 4.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.73277759552002, -12.387369155883789, -12.041961669921875, -11.696554183959961, -11.35114574432373, -11.0057373046875, -10.660329818725586, -10.314922332763672, -9.969513893127441, -9.624105453491211, -9.278697967529297, -8.933290481567383, -8.587882041931152, -8.242473602294922, -7.897066116333008, -7.5516581535339355, -7.206250190734863, -6.860842227935791, -6.515434265136719, -6.1700263023376465, -5.824618339538574, -5.479210376739502, -5.13380241394043, -4.788394451141357, -4.442986488342285, -4.097578525543213, -3.7521705627441406, -3.4067625999450684, -3.061354637145996, -2.715946674346924, -2.3705387115478516, -2.0251307487487793, -1.679722785949707, -1.3343148231506348, -0.9889068603515625, -0.6434988975524902, -0.29809093475341797, 0.0473170280456543, 0.39272499084472656, 0.7381329536437988, 1.083540916442871, 1.4289488792419434, 1.7743568420410156, 2.119764804840088, 2.46517276763916, 2.8105807304382324, 3.1559886932373047, 3.501396656036377, 3.846804618835449, 4.1922125816345215, 4.537620544433594, 4.883028507232666, 5.228436470031738, 5.5738444328308105, 5.919252395629883, 6.264660358428955, 6.610068321228027, 6.9554762840271, 7.300884246826172, 7.646292209625244, 7.991700172424316, 8.337108612060547, 8.682516098022461, 9.027923583984375, 9.373332023620605]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 11.0, 21.0, 15.0, 26.0, 58.0, 59.0, 93.0, 165.0, 260.0, 455.0, 853.0, 1549.0, 3761.0, 10311.0, 36010.0, 164310.0, 869684.0, 2086854.0, 810885.0, 157041.0, 34599.0, 10060.0, 3675.0, 1571.0, 784.0, 436.0, 288.0, 156.0, 81.0, 75.0, 44.0, 29.0, 21.0, 9.0, 8.0, 6.0, 7.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.6380157470703125, -0.613922119140625, -0.5898284912109375, -0.56573486328125, -0.5416412353515625, -0.517547607421875, -0.4934539794921875, -0.4693603515625, -0.4452667236328125, -0.421173095703125, -0.3970794677734375, -0.37298583984375, -0.3488922119140625, -0.324798583984375, -0.3007049560546875, -0.276611328125, -0.2525177001953125, -0.228424072265625, -0.2043304443359375, -0.18023681640625, -0.1561431884765625, -0.132049560546875, -0.1079559326171875, -0.0838623046875, -0.0597686767578125, -0.035675048828125, -0.0115814208984375, 0.01251220703125, 0.0366058349609375, 0.060699462890625, 0.0847930908203125, 0.10888671875, 0.1329803466796875, 0.157073974609375, 0.1811676025390625, 0.20526123046875, 0.2293548583984375, 0.253448486328125, 0.2775421142578125, 0.3016357421875, 0.3257293701171875, 0.349822998046875, 0.3739166259765625, 0.39801025390625, 0.4221038818359375, 0.446197509765625, 0.4702911376953125, 0.494384765625, 0.5184783935546875, 0.542572021484375, 0.5666656494140625, 0.59075927734375, 0.6148529052734375, 0.638946533203125, 0.6630401611328125, 0.6871337890625, 0.7112274169921875, 0.735321044921875, 0.7594146728515625, 0.78350830078125, 0.8076019287109375, 0.831695556640625, 0.8557891845703125, 0.8798828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 10.0, 6.0, 9.0, 10.0, 17.0, 19.0, 19.0, 24.0, 32.0, 37.0, 37.0, 32.0, 64.0, 44.0, 57.0, 53.0, 57.0, 61.0, 55.0, 48.0, 41.0, 44.0, 48.0, 29.0, 29.0, 27.0, 20.0, 12.0, 18.0, 7.0, 9.0, 11.0, 5.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76513671875, -0.7414627075195312, -0.7177886962890625, -0.6941146850585938, -0.670440673828125, -0.6467666625976562, -0.6230926513671875, -0.5994186401367188, -0.57574462890625, -0.5520706176757812, -0.5283966064453125, -0.5047225952148438, -0.481048583984375, -0.45737457275390625, -0.4337005615234375, -0.41002655029296875, -0.3863525390625, -0.36267852783203125, -0.3390045166015625, -0.31533050537109375, -0.291656494140625, -0.26798248291015625, -0.2443084716796875, -0.22063446044921875, -0.19696044921875, -0.17328643798828125, -0.1496124267578125, -0.12593841552734375, -0.102264404296875, -0.07859039306640625, -0.0549163818359375, -0.03124237060546875, -0.007568359375, 0.01610565185546875, 0.0397796630859375, 0.06345367431640625, 0.087127685546875, 0.11080169677734375, 0.1344757080078125, 0.15814971923828125, 0.18182373046875, 0.20549774169921875, 0.2291717529296875, 0.25284576416015625, 0.276519775390625, 0.30019378662109375, 0.3238677978515625, 0.34754180908203125, 0.3712158203125, 0.39488983154296875, 0.4185638427734375, 0.44223785400390625, 0.465911865234375, 0.48958587646484375, 0.5132598876953125, 0.5369338989257812, 0.56060791015625, 0.5842819213867188, 0.6079559326171875, 0.6316299438476562, 0.655303955078125, 0.6789779663085938, 0.7026519775390625, 0.7263259887695312, 0.75]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 4.0, 12.0, 10.0, 36.0, 83.0, 181.0, 338.0, 912.0, 11294.0, 4045942.0, 132319.0, 2155.0, 510.0, 266.0, 120.0, 56.0, 26.0, 12.0, 13.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.25, -3.08526611328125, -2.9205322265625, -2.75579833984375, -2.591064453125, -2.42633056640625, -2.2615966796875, -2.09686279296875, -1.93212890625, -1.76739501953125, -1.6026611328125, -1.43792724609375, -1.273193359375, -1.10845947265625, -0.9437255859375, -0.77899169921875, -0.6142578125, -0.44952392578125, -0.2847900390625, -0.12005615234375, 0.044677734375, 0.20941162109375, 0.3741455078125, 0.53887939453125, 0.70361328125, 0.86834716796875, 1.0330810546875, 1.19781494140625, 1.362548828125, 1.52728271484375, 1.6920166015625, 1.85675048828125, 2.021484375, 2.18621826171875, 2.3509521484375, 2.51568603515625, 2.680419921875, 2.84515380859375, 3.0098876953125, 3.17462158203125, 3.33935546875, 3.50408935546875, 3.6688232421875, 3.83355712890625, 3.998291015625, 4.16302490234375, 4.3277587890625, 4.49249267578125, 4.6572265625, 4.82196044921875, 4.9866943359375, 5.15142822265625, 5.316162109375, 5.48089599609375, 5.6456298828125, 5.81036376953125, 5.97509765625, 6.13983154296875, 6.3045654296875, 6.46929931640625, 6.634033203125, 6.79876708984375, 6.9635009765625, 7.12823486328125, 7.29296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 10.0, 13.0, 21.0, 61.0, 133.0, 280.0, 686.0, 1243.0, 869.0, 420.0, 156.0, 81.0, 30.0, 29.0, 8.0, 16.0, 6.0, 2.0, 7.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.869140625, -1.773895263671875, -1.67864990234375, -1.583404541015625, -1.4881591796875, -1.392913818359375, -1.29766845703125, -1.202423095703125, -1.107177734375, -1.011932373046875, -0.91668701171875, -0.821441650390625, -0.7261962890625, -0.630950927734375, -0.53570556640625, -0.440460205078125, -0.34521484375, -0.249969482421875, -0.15472412109375, -0.059478759765625, 0.0357666015625, 0.131011962890625, 0.22625732421875, 0.321502685546875, 0.416748046875, 0.511993408203125, 0.60723876953125, 0.702484130859375, 0.7977294921875, 0.892974853515625, 0.98822021484375, 1.083465576171875, 1.1787109375, 1.273956298828125, 1.36920166015625, 1.464447021484375, 1.5596923828125, 1.654937744140625, 1.75018310546875, 1.845428466796875, 1.940673828125, 2.035919189453125, 2.13116455078125, 2.226409912109375, 2.3216552734375, 2.416900634765625, 2.51214599609375, 2.607391357421875, 2.70263671875, 2.797882080078125, 2.89312744140625, 2.988372802734375, 3.0836181640625, 3.178863525390625, 3.27410888671875, 3.369354248046875, 3.464599609375, 3.559844970703125, 3.65509033203125, 3.750335693359375, 3.8455810546875, 3.940826416015625, 4.03607177734375, 4.131317138671875, 4.2265625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 23.0, 60.0, 237.0, 376.0, 198.0, 47.0, 29.0, 10.0, 9.0, 7.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.704120635986328, -22.638961791992188, -21.573802947998047, -20.508642196655273, -19.443483352661133, -18.378324508666992, -17.31316375732422, -16.248004913330078, -15.182846069335938, -14.117687225341797, -13.05252742767334, -11.987367630004883, -10.922208786010742, -9.857049942016602, -8.791890144348145, -7.726730823516846, -6.661571502685547, -5.596412181854248, -4.531252861022949, -3.4660935401916504, -2.4009342193603516, -1.3357748985290527, -0.2706155776977539, 0.7945437431335449, 1.8597030639648438, 2.9248623847961426, 3.9900217056274414, 5.05518102645874, 6.120340347290039, 7.185499668121338, 8.250658988952637, 9.315818786621094, 10.380973815917969, 11.44613265991211, 12.511292457580566, 13.576452255249023, 14.641611099243164, 15.706769943237305, 16.771930694580078, 17.83708953857422, 18.90224838256836, 19.9674072265625, 21.03256607055664, 22.097726821899414, 23.162885665893555, 24.228044509887695, 25.29320526123047, 26.35836410522461, 27.42352294921875, 28.48868179321289, 29.55384063720703, 30.619001388549805, 31.684160232543945, 32.74932098388672, 33.81447982788086, 34.879638671875, 35.94479751586914, 37.00995635986328, 38.07511520385742, 39.14027404785156, 40.20543670654297, 41.27059555053711, 42.33575439453125, 43.40091323852539, 44.46607208251953]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 7.0, 8.0, 8.0, 17.0, 18.0, 17.0, 14.0, 34.0, 30.0, 38.0, 21.0, 27.0, 33.0, 39.0, 49.0, 56.0, 44.0, 47.0, 59.0, 46.0, 53.0, 44.0, 32.0, 35.0, 22.0, 33.0, 35.0, 22.0, 21.0, 16.0, 12.0, 12.0, 10.0, 7.0, 6.0, 10.0, 8.0, 0.0, 3.0, 2.0, 6.0, 2.0, 0.0, 2.0], "bins": [-9.743474960327148, -9.488177299499512, -9.232880592346191, -8.977582931518555, -8.722286224365234, -8.466988563537598, -8.211691856384277, -7.956394195556641, -7.701097011566162, -7.445799827575684, -7.190502643585205, -6.935205459594727, -6.67990779876709, -6.4246110916137695, -6.169313430786133, -5.914016246795654, -5.658719062805176, -5.403421878814697, -5.148124694824219, -4.89282751083374, -4.637530326843262, -4.382232666015625, -4.1269354820251465, -3.871638298034668, -3.6163411140441895, -3.361043930053711, -3.1057467460632324, -2.850449323654175, -2.5951521396636963, -2.3398549556732178, -2.08455753326416, -1.8292603492736816, -1.5739641189575195, -1.318666934967041, -1.063369631767273, -0.8080723881721497, -0.5527751445770264, -0.29747796058654785, -0.042180657386779785, 0.21311664581298828, 0.4684138298034668, 0.7237110733985901, 0.9790083169937134, 1.2343056201934814, 1.48960280418396, 1.7448999881744385, 2.000197410583496, 2.2554945945739746, 2.510791778564453, 2.7660889625549316, 3.02138614654541, 3.2766835689544678, 3.5319807529449463, 3.787277936935425, 4.042575359344482, 4.297872543334961, 4.5531697273254395, 4.808466911315918, 5.0637640953063965, 5.319061279296875, 5.574358940124512, 5.829655647277832, 6.084953308105469, 6.340250492095947, 6.595547676086426]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 9.0, 13.0, 17.0, 39.0, 41.0, 71.0, 83.0, 164.0, 259.0, 401.0, 648.0, 1150.0, 1962.0, 3512.0, 6453.0, 12196.0, 24648.0, 53073.0, 124137.0, 276367.0, 292264.0, 136779.0, 58551.0, 26963.0, 13142.0, 6809.0, 3757.0, 2046.0, 1200.0, 646.0, 404.0, 255.0, 172.0, 104.0, 62.0, 42.0, 33.0, 22.0, 18.0, 10.0, 6.0, 4.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1015625, -1.064910888671875, -1.02825927734375, -0.991607666015625, -0.9549560546875, -0.918304443359375, -0.88165283203125, -0.845001220703125, -0.808349609375, -0.771697998046875, -0.73504638671875, -0.698394775390625, -0.6617431640625, -0.625091552734375, -0.58843994140625, -0.551788330078125, -0.51513671875, -0.478485107421875, -0.44183349609375, -0.405181884765625, -0.3685302734375, -0.331878662109375, -0.29522705078125, -0.258575439453125, -0.221923828125, -0.185272216796875, -0.14862060546875, -0.111968994140625, -0.0753173828125, -0.038665771484375, -0.00201416015625, 0.034637451171875, 0.0712890625, 0.107940673828125, 0.14459228515625, 0.181243896484375, 0.2178955078125, 0.254547119140625, 0.29119873046875, 0.327850341796875, 0.364501953125, 0.401153564453125, 0.43780517578125, 0.474456787109375, 0.5111083984375, 0.547760009765625, 0.58441162109375, 0.621063232421875, 0.65771484375, 0.694366455078125, 0.73101806640625, 0.767669677734375, 0.8043212890625, 0.840972900390625, 0.87762451171875, 0.914276123046875, 0.950927734375, 0.987579345703125, 1.02423095703125, 1.060882568359375, 1.0975341796875, 1.134185791015625, 1.17083740234375, 1.207489013671875, 1.244140625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 8.0, 2.0, 2.0, 7.0, 7.0, 8.0, 12.0, 14.0, 10.0, 11.0, 10.0, 12.0, 23.0, 31.0, 33.0, 24.0, 26.0, 30.0, 63.0, 42.0, 58.0, 43.0, 57.0, 52.0, 37.0, 42.0, 44.0, 46.0, 24.0, 38.0, 27.0, 23.0, 29.0, 16.0, 20.0, 17.0, 17.0, 8.0, 9.0, 9.0, 3.0, 6.0, 1.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.69580078125, -0.6737747192382812, -0.6517486572265625, -0.6297225952148438, -0.607696533203125, -0.5856704711914062, -0.5636444091796875, -0.5416183471679688, -0.51959228515625, -0.49756622314453125, -0.4755401611328125, -0.45351409912109375, -0.431488037109375, -0.40946197509765625, -0.3874359130859375, -0.36540985107421875, -0.3433837890625, -0.32135772705078125, -0.2993316650390625, -0.27730560302734375, -0.255279541015625, -0.23325347900390625, -0.2112274169921875, -0.18920135498046875, -0.16717529296875, -0.14514923095703125, -0.1231231689453125, -0.10109710693359375, -0.079071044921875, -0.05704498291015625, -0.0350189208984375, -0.01299285888671875, 0.009033203125, 0.03105926513671875, 0.0530853271484375, 0.07511138916015625, 0.097137451171875, 0.11916351318359375, 0.1411895751953125, 0.16321563720703125, 0.18524169921875, 0.20726776123046875, 0.2292938232421875, 0.25131988525390625, 0.273345947265625, 0.29537200927734375, 0.3173980712890625, 0.33942413330078125, 0.3614501953125, 0.38347625732421875, 0.4055023193359375, 0.42752838134765625, 0.449554443359375, 0.47158050537109375, 0.4936065673828125, 0.5156326293945312, 0.53765869140625, 0.5596847534179688, 0.5817108154296875, 0.6037368774414062, 0.625762939453125, 0.6477890014648438, 0.6698150634765625, 0.6918411254882812, 0.7138671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 11.0, 9.0, 12.0, 28.0, 41.0, 72.0, 134.0, 221.0, 465.0, 981.0, 2311.0, 9354.0, 111561.0, 863263.0, 50755.0, 5923.0, 1764.0, 777.0, 392.0, 213.0, 110.0, 62.0, 39.0, 22.0, 12.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.544921875, -3.419952392578125, -3.29498291015625, -3.170013427734375, -3.0450439453125, -2.920074462890625, -2.79510498046875, -2.670135498046875, -2.545166015625, -2.420196533203125, -2.29522705078125, -2.170257568359375, -2.0452880859375, -1.920318603515625, -1.79534912109375, -1.670379638671875, -1.54541015625, -1.420440673828125, -1.29547119140625, -1.170501708984375, -1.0455322265625, -0.920562744140625, -0.79559326171875, -0.670623779296875, -0.545654296875, -0.420684814453125, -0.29571533203125, -0.170745849609375, -0.0457763671875, 0.079193115234375, 0.20416259765625, 0.329132080078125, 0.4541015625, 0.579071044921875, 0.70404052734375, 0.829010009765625, 0.9539794921875, 1.078948974609375, 1.20391845703125, 1.328887939453125, 1.453857421875, 1.578826904296875, 1.70379638671875, 1.828765869140625, 1.9537353515625, 2.078704833984375, 2.20367431640625, 2.328643798828125, 2.45361328125, 2.578582763671875, 2.70355224609375, 2.828521728515625, 2.9534912109375, 3.078460693359375, 3.20343017578125, 3.328399658203125, 3.453369140625, 3.578338623046875, 3.70330810546875, 3.828277587890625, 3.9532470703125, 4.078216552734375, 4.20318603515625, 4.328155517578125, 4.453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 8.0, 16.0, 14.0, 30.0, 38.0, 56.0, 66.0, 61.0, 74.0, 89.0, 98.0, 99.0, 85.0, 71.0, 52.0, 32.0, 28.0, 22.0, 14.0, 12.0, 13.0, 8.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.302734375, -3.153839111328125, -3.00494384765625, -2.856048583984375, -2.7071533203125, -2.558258056640625, -2.40936279296875, -2.260467529296875, -2.111572265625, -1.962677001953125, -1.81378173828125, -1.664886474609375, -1.5159912109375, -1.367095947265625, -1.21820068359375, -1.069305419921875, -0.92041015625, -0.771514892578125, -0.62261962890625, -0.473724365234375, -0.3248291015625, -0.175933837890625, -0.02703857421875, 0.121856689453125, 0.270751953125, 0.419647216796875, 0.56854248046875, 0.717437744140625, 0.8663330078125, 1.015228271484375, 1.16412353515625, 1.313018798828125, 1.4619140625, 1.610809326171875, 1.75970458984375, 1.908599853515625, 2.0574951171875, 2.206390380859375, 2.35528564453125, 2.504180908203125, 2.653076171875, 2.801971435546875, 2.95086669921875, 3.099761962890625, 3.2486572265625, 3.397552490234375, 3.54644775390625, 3.695343017578125, 3.84423828125, 3.993133544921875, 4.14202880859375, 4.290924072265625, 4.4398193359375, 4.588714599609375, 4.73760986328125, 4.886505126953125, 5.035400390625, 5.184295654296875, 5.33319091796875, 5.482086181640625, 5.6309814453125, 5.779876708984375, 5.92877197265625, 6.077667236328125, 6.2265625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 6.0, 5.0, 7.0, 23.0, 27.0, 40.0, 51.0, 114.0, 234.0, 469.0, 1113.0, 3112.0, 11848.0, 72676.0, 792554.0, 140268.0, 18943.0, 4427.0, 1424.0, 613.0, 251.0, 140.0, 63.0, 55.0, 28.0, 24.0, 12.0, 6.0, 8.0, 11.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6572265625, -0.6315994262695312, -0.6059722900390625, -0.5803451538085938, -0.554718017578125, -0.5290908813476562, -0.5034637451171875, -0.47783660888671875, -0.45220947265625, -0.42658233642578125, -0.4009552001953125, -0.37532806396484375, -0.349700927734375, -0.32407379150390625, -0.2984466552734375, -0.27281951904296875, -0.2471923828125, -0.22156524658203125, -0.1959381103515625, -0.17031097412109375, -0.144683837890625, -0.11905670166015625, -0.0934295654296875, -0.06780242919921875, -0.04217529296875, -0.01654815673828125, 0.0090789794921875, 0.03470611572265625, 0.060333251953125, 0.08596038818359375, 0.1115875244140625, 0.13721466064453125, 0.162841796875, 0.18846893310546875, 0.2140960693359375, 0.23972320556640625, 0.265350341796875, 0.29097747802734375, 0.3166046142578125, 0.34223175048828125, 0.36785888671875, 0.39348602294921875, 0.4191131591796875, 0.44474029541015625, 0.470367431640625, 0.49599456787109375, 0.5216217041015625, 0.5472488403320312, 0.5728759765625, 0.5985031127929688, 0.6241302490234375, 0.6497573852539062, 0.675384521484375, 0.7010116577148438, 0.7266387939453125, 0.7522659301757812, 0.77789306640625, 0.8035202026367188, 0.8291473388671875, 0.8547744750976562, 0.880401611328125, 0.9060287475585938, 0.9316558837890625, 0.9572830200195312, 0.98291015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 1.0, 4.0, 2.0, 2.0, 3.0, 11.0, 11.0, 11.0, 31.0, 35.0, 42.0, 77.0, 112.0, 173.0, 166.0, 115.0, 58.0, 37.0, 36.0, 19.0, 12.0, 16.0, 14.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038623809814453125, -0.00037449970841407776, -0.00036276131868362427, -0.0003510229289531708, -0.0003392845392227173, -0.0003275461494922638, -0.0003158077597618103, -0.0003040693700313568, -0.0002923309803009033, -0.00028059259057044983, -0.00026885420083999634, -0.00025711581110954285, -0.00024537742137908936, -0.00023363903164863586, -0.00022190064191818237, -0.00021016225218772888, -0.0001984238624572754, -0.0001866854727268219, -0.0001749470829963684, -0.00016320869326591492, -0.00015147030353546143, -0.00013973191380500793, -0.00012799352407455444, -0.00011625513434410095, -0.00010451674461364746, -9.277835488319397e-05, -8.103996515274048e-05, -6.930157542228699e-05, -5.7563185691833496e-05, -4.5824795961380005e-05, -3.4086406230926514e-05, -2.2348016500473022e-05, -1.0609626770019531e-05, 1.12876296043396e-06, 1.2867152690887451e-05, 2.4605542421340942e-05, 3.6343932151794434e-05, 4.8082321882247925e-05, 5.9820711612701416e-05, 7.155910134315491e-05, 8.32974910736084e-05, 9.503588080406189e-05, 0.00010677427053451538, 0.00011851266026496887, 0.00013025104999542236, 0.00014198943972587585, 0.00015372782945632935, 0.00016546621918678284, 0.00017720460891723633, 0.00018894299864768982, 0.0002006813883781433, 0.0002124197781085968, 0.0002241581678390503, 0.00023589655756950378, 0.0002476349472999573, 0.00025937333703041077, 0.00027111172676086426, 0.00028285011649131775, 0.00029458850622177124, 0.00030632689595222473, 0.0003180652856826782, 0.0003298036754131317, 0.0003415420651435852, 0.0003532804548740387, 0.0003650188446044922]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 4.0, 3.0, 6.0, 7.0, 17.0, 22.0, 29.0, 38.0, 58.0, 79.0, 178.0, 290.0, 448.0, 920.0, 2232.0, 6509.0, 28665.0, 224388.0, 709796.0, 58325.0, 10637.0, 3198.0, 1277.0, 584.0, 315.0, 187.0, 109.0, 82.0, 46.0, 32.0, 28.0, 10.0, 7.0, 9.0, 3.0, 1.0, 4.0, 4.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63671875, -0.616302490234375, -0.59588623046875, -0.575469970703125, -0.5550537109375, -0.534637451171875, -0.51422119140625, -0.493804931640625, -0.473388671875, -0.452972412109375, -0.43255615234375, -0.412139892578125, -0.3917236328125, -0.371307373046875, -0.35089111328125, -0.330474853515625, -0.31005859375, -0.289642333984375, -0.26922607421875, -0.248809814453125, -0.2283935546875, -0.207977294921875, -0.18756103515625, -0.167144775390625, -0.146728515625, -0.126312255859375, -0.10589599609375, -0.085479736328125, -0.0650634765625, -0.044647216796875, -0.02423095703125, -0.003814697265625, 0.0166015625, 0.037017822265625, 0.05743408203125, 0.077850341796875, 0.0982666015625, 0.118682861328125, 0.13909912109375, 0.159515380859375, 0.179931640625, 0.200347900390625, 0.22076416015625, 0.241180419921875, 0.2615966796875, 0.282012939453125, 0.30242919921875, 0.322845458984375, 0.34326171875, 0.363677978515625, 0.38409423828125, 0.404510498046875, 0.4249267578125, 0.445343017578125, 0.46575927734375, 0.486175537109375, 0.506591796875, 0.527008056640625, 0.54742431640625, 0.567840576171875, 0.5882568359375, 0.608673095703125, 0.62908935546875, 0.649505615234375, 0.669921875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 5.0, 8.0, 3.0, 3.0, 10.0, 11.0, 21.0, 23.0, 27.0, 26.0, 37.0, 44.0, 52.0, 62.0, 76.0, 79.0, 81.0, 88.0, 64.0, 49.0, 48.0, 40.0, 30.0, 30.0, 19.0, 15.0, 9.0, 9.0, 6.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.58056640625, -0.5638885498046875, -0.547210693359375, -0.5305328369140625, -0.51385498046875, -0.4971771240234375, -0.480499267578125, -0.4638214111328125, -0.4471435546875, -0.4304656982421875, -0.413787841796875, -0.3971099853515625, -0.38043212890625, -0.3637542724609375, -0.347076416015625, -0.3303985595703125, -0.313720703125, -0.2970428466796875, -0.280364990234375, -0.2636871337890625, -0.24700927734375, -0.2303314208984375, -0.213653564453125, -0.1969757080078125, -0.1802978515625, -0.1636199951171875, -0.146942138671875, -0.1302642822265625, -0.11358642578125, -0.0969085693359375, -0.080230712890625, -0.0635528564453125, -0.046875, -0.0301971435546875, -0.013519287109375, 0.0031585693359375, 0.01983642578125, 0.0365142822265625, 0.053192138671875, 0.0698699951171875, 0.0865478515625, 0.1032257080078125, 0.119903564453125, 0.1365814208984375, 0.15325927734375, 0.1699371337890625, 0.186614990234375, 0.2032928466796875, 0.219970703125, 0.2366485595703125, 0.253326416015625, 0.2700042724609375, 0.28668212890625, 0.3033599853515625, 0.320037841796875, 0.3367156982421875, 0.3533935546875, 0.3700714111328125, 0.386749267578125, 0.4034271240234375, 0.42010498046875, 0.4367828369140625, 0.453460693359375, 0.4701385498046875, 0.48681640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 9.0, 11.0, 42.0, 60.0, 126.0, 382.0, 180.0, 96.0, 47.0, 21.0, 9.0, 7.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.90968132019043, -23.1590576171875, -22.40843391418457, -21.65781021118164, -20.907188415527344, -20.156564712524414, -19.405941009521484, -18.655317306518555, -17.904693603515625, -17.154069900512695, -16.403446197509766, -15.652823448181152, -14.902199745178223, -14.151576042175293, -13.40095329284668, -12.65032958984375, -11.89970588684082, -11.14908218383789, -10.398458480834961, -9.647835731506348, -8.897212028503418, -8.146588325500488, -7.395965099334717, -6.645341873168945, -5.894718170166016, -5.144094467163086, -4.3934712409973145, -3.642847776412964, -2.8922243118286133, -2.1416008472442627, -1.390977382659912, -0.6403541564941406, 0.11027145385742188, 0.8608949184417725, 1.611518383026123, 2.3621418476104736, 3.112765312194824, 3.863388776779175, 4.614012241363525, 5.364635467529297, 6.115259170532227, 6.865882873535156, 7.616506099700928, 8.3671293258667, 9.117753028869629, 9.868376731872559, 10.618999481201172, 11.369623184204102, 12.120246887207031, 12.870870590209961, 13.62149429321289, 14.372117042541504, 15.122740745544434, 15.873364448547363, 16.623987197875977, 17.374610900878906, 18.125234603881836, 18.875858306884766, 19.626482009887695, 20.377105712890625, 21.127727508544922, 21.87835121154785, 22.62897491455078, 23.37959861755371, 24.13022232055664]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 10.0, 15.0, 13.0, 15.0, 17.0, 27.0, 28.0, 29.0, 31.0, 44.0, 36.0, 48.0, 161.0, 167.0, 59.0, 41.0, 37.0, 27.0, 24.0, 36.0, 15.0, 24.0, 19.0, 15.0, 12.0, 10.0, 12.0, 4.0, 3.0, 7.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.678079605102539, -15.230937004089355, -14.783794403076172, -14.336651802062988, -13.889509201049805, -13.442366600036621, -12.995223999023438, -12.548081398010254, -12.10093879699707, -11.653796195983887, -11.206653594970703, -10.75951099395752, -10.312368392944336, -9.865225791931152, -9.418083190917969, -8.970940589904785, -8.523797988891602, -8.076655387878418, -7.629512786865234, -7.182370185852051, -6.735227584838867, -6.288084983825684, -5.8409423828125, -5.393799781799316, -4.946658134460449, -4.499515533447266, -4.052372932434082, -3.6052303314208984, -3.158087730407715, -2.7109453678131104, -2.2638027667999268, -1.8166601657867432, -1.3695173263549805, -0.9223747253417969, -0.47523218393325806, -0.02808964252471924, 0.41905295848846436, 0.8661954402923584, 1.313338041305542, 1.7604806423187256, 2.207623243331909, 2.6547658443450928, 3.1019084453582764, 3.549050807952881, 3.9961934089660645, 4.443336009979248, 4.890478610992432, 5.337621212005615, 5.784763813018799, 6.231906414031982, 6.679049015045166, 7.12619161605835, 7.573334217071533, 8.020476341247559, 8.467618942260742, 8.914761543273926, 9.36190414428711, 9.809046745300293, 10.256189346313477, 10.70333194732666, 11.150474548339844, 11.597617149353027, 12.044759750366211, 12.491902351379395, 12.939044952392578]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 4.0, 5.0, 6.0, 10.0, 13.0, 18.0, 35.0, 43.0, 57.0, 77.0, 113.0, 156.0, 227.0, 334.0, 507.0, 770.0, 1087.0, 1849.0, 3190.0, 5680.0, 11227.0, 24845.0, 62065.0, 173317.0, 488745.0, 1094812.0, 1272543.0, 646446.0, 253231.0, 88605.0, 32848.0, 14271.0, 7064.0, 3948.0, 2168.0, 1299.0, 849.0, 552.0, 376.0, 243.0, 176.0, 128.0, 97.0, 66.0, 45.0, 40.0, 27.0, 18.0, 17.0, 9.0, 16.0, 7.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.62744140625, -0.605926513671875, -0.58441162109375, -0.562896728515625, -0.5413818359375, -0.519866943359375, -0.49835205078125, -0.476837158203125, -0.455322265625, -0.433807373046875, -0.41229248046875, -0.390777587890625, -0.3692626953125, -0.347747802734375, -0.32623291015625, -0.304718017578125, -0.283203125, -0.261688232421875, -0.24017333984375, -0.218658447265625, -0.1971435546875, -0.175628662109375, -0.15411376953125, -0.132598876953125, -0.111083984375, -0.089569091796875, -0.06805419921875, -0.046539306640625, -0.0250244140625, -0.003509521484375, 0.01800537109375, 0.039520263671875, 0.06103515625, 0.082550048828125, 0.10406494140625, 0.125579833984375, 0.1470947265625, 0.168609619140625, 0.19012451171875, 0.211639404296875, 0.233154296875, 0.254669189453125, 0.27618408203125, 0.297698974609375, 0.3192138671875, 0.340728759765625, 0.36224365234375, 0.383758544921875, 0.4052734375, 0.426788330078125, 0.44830322265625, 0.469818115234375, 0.4913330078125, 0.512847900390625, 0.53436279296875, 0.555877685546875, 0.577392578125, 0.598907470703125, 0.62042236328125, 0.641937255859375, 0.6634521484375, 0.684967041015625, 0.70648193359375, 0.727996826171875, 0.74951171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 14.0, 14.0, 10.0, 11.0, 23.0, 15.0, 20.0, 27.0, 18.0, 28.0, 25.0, 22.0, 48.0, 39.0, 39.0, 41.0, 44.0, 47.0, 45.0, 45.0, 43.0, 44.0, 49.0, 34.0, 34.0, 32.0, 30.0, 28.0, 22.0, 13.0, 18.0, 8.0, 17.0, 7.0, 4.0, 6.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.59228515625, -0.5721893310546875, -0.552093505859375, -0.5319976806640625, -0.51190185546875, -0.4918060302734375, -0.471710205078125, -0.4516143798828125, -0.4315185546875, -0.4114227294921875, -0.391326904296875, -0.3712310791015625, -0.35113525390625, -0.3310394287109375, -0.310943603515625, -0.2908477783203125, -0.270751953125, -0.2506561279296875, -0.230560302734375, -0.2104644775390625, -0.19036865234375, -0.1702728271484375, -0.150177001953125, -0.1300811767578125, -0.1099853515625, -0.0898895263671875, -0.069793701171875, -0.0496978759765625, -0.02960205078125, -0.0095062255859375, 0.010589599609375, 0.0306854248046875, 0.05078125, 0.0708770751953125, 0.090972900390625, 0.1110687255859375, 0.13116455078125, 0.1512603759765625, 0.171356201171875, 0.1914520263671875, 0.2115478515625, 0.2316436767578125, 0.251739501953125, 0.2718353271484375, 0.29193115234375, 0.3120269775390625, 0.332122802734375, 0.3522186279296875, 0.372314453125, 0.3924102783203125, 0.412506103515625, 0.4326019287109375, 0.45269775390625, 0.4727935791015625, 0.492889404296875, 0.5129852294921875, 0.5330810546875, 0.5531768798828125, 0.573272705078125, 0.5933685302734375, 0.61346435546875, 0.6335601806640625, 0.653656005859375, 0.6737518310546875, 0.69384765625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 6.0, 19.0, 26.0, 42.0, 61.0, 101.0, 173.0, 344.0, 654.0, 1270.0, 3741.0, 28064.0, 3798826.0, 347729.0, 8903.0, 2278.0, 941.0, 483.0, 259.0, 159.0, 74.0, 47.0, 21.0, 17.0, 12.0, 6.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.09765625, -4.9510498046875, -4.804443359375, -4.6578369140625, -4.51123046875, -4.3646240234375, -4.218017578125, -4.0714111328125, -3.9248046875, -3.7781982421875, -3.631591796875, -3.4849853515625, -3.33837890625, -3.1917724609375, -3.045166015625, -2.8985595703125, -2.751953125, -2.6053466796875, -2.458740234375, -2.3121337890625, -2.16552734375, -2.0189208984375, -1.872314453125, -1.7257080078125, -1.5791015625, -1.4324951171875, -1.285888671875, -1.1392822265625, -0.99267578125, -0.8460693359375, -0.699462890625, -0.5528564453125, -0.40625, -0.2596435546875, -0.113037109375, 0.0335693359375, 0.18017578125, 0.3267822265625, 0.473388671875, 0.6199951171875, 0.7666015625, 0.9132080078125, 1.059814453125, 1.2064208984375, 1.35302734375, 1.4996337890625, 1.646240234375, 1.7928466796875, 1.939453125, 2.0860595703125, 2.232666015625, 2.3792724609375, 2.52587890625, 2.6724853515625, 2.819091796875, 2.9656982421875, 3.1123046875, 3.2589111328125, 3.405517578125, 3.5521240234375, 3.69873046875, 3.8453369140625, 3.991943359375, 4.1385498046875, 4.28515625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 12.0, 9.0, 15.0, 24.0, 36.0, 48.0, 73.0, 120.0, 197.0, 255.0, 403.0, 587.0, 679.0, 554.0, 368.0, 222.0, 135.0, 117.0, 65.0, 58.0, 31.0, 19.0, 16.0, 10.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.07421875, -1.989105224609375, -1.90399169921875, -1.818878173828125, -1.7337646484375, -1.648651123046875, -1.56353759765625, -1.478424072265625, -1.393310546875, -1.308197021484375, -1.22308349609375, -1.137969970703125, -1.0528564453125, -0.967742919921875, -0.88262939453125, -0.797515869140625, -0.71240234375, -0.627288818359375, -0.54217529296875, -0.457061767578125, -0.3719482421875, -0.286834716796875, -0.20172119140625, -0.116607666015625, -0.031494140625, 0.053619384765625, 0.13873291015625, 0.223846435546875, 0.3089599609375, 0.394073486328125, 0.47918701171875, 0.564300537109375, 0.6494140625, 0.734527587890625, 0.81964111328125, 0.904754638671875, 0.9898681640625, 1.074981689453125, 1.16009521484375, 1.245208740234375, 1.330322265625, 1.415435791015625, 1.50054931640625, 1.585662841796875, 1.6707763671875, 1.755889892578125, 1.84100341796875, 1.926116943359375, 2.01123046875, 2.096343994140625, 2.18145751953125, 2.266571044921875, 2.3516845703125, 2.436798095703125, 2.52191162109375, 2.607025146484375, 2.692138671875, 2.777252197265625, 2.86236572265625, 2.947479248046875, 3.0325927734375, 3.117706298828125, 3.20281982421875, 3.287933349609375, 3.373046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 12.0, 28.0, 70.0, 215.0, 372.0, 201.0, 66.0, 22.0, 9.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.13917541503906, -50.42607879638672, -48.71297836303711, -46.999881744384766, -45.286781311035156, -43.57368469238281, -41.86058807373047, -40.14748764038086, -38.434391021728516, -36.72129440307617, -35.00819396972656, -33.29509735107422, -31.581998825073242, -29.868900299072266, -28.15580177307129, -26.442703247070312, -24.729604721069336, -23.01650619506836, -21.303407669067383, -19.590309143066406, -17.877212524414062, -16.164113998413086, -14.45101547241211, -12.73791790008545, -11.024819374084473, -9.311720848083496, -7.598623275756836, -5.885524749755859, -4.172426700592041, -2.4593286514282227, -0.7462301254272461, 0.9668674468994141, 2.6799659729003906, 4.393064022064209, 6.106162071228027, 7.819260597229004, 9.532358169555664, 11.24545669555664, 12.958555221557617, 14.671652793884277, 16.384750366210938, 18.097848892211914, 19.81094741821289, 21.524044036865234, 23.23714256286621, 24.950241088867188, 26.663339614868164, 28.37643814086914, 30.089536666870117, 31.802635192871094, 33.51573181152344, 35.22883224487305, 36.94192886352539, 38.655029296875, 40.368125915527344, 42.08122253417969, 43.7943229675293, 45.50741958618164, 47.22052001953125, 48.933616638183594, 50.6467170715332, 52.35981369018555, 54.072914123535156, 55.7860107421875, 57.499107360839844]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 11.0, 8.0, 14.0, 17.0, 22.0, 16.0, 28.0, 30.0, 32.0, 50.0, 40.0, 52.0, 45.0, 66.0, 68.0, 60.0, 52.0, 39.0, 58.0, 36.0, 44.0, 49.0, 23.0, 28.0, 25.0, 18.0, 15.0, 8.0, 15.0, 6.0, 11.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.97799301147461, -15.527382850646973, -15.076772689819336, -14.626163482666016, -14.175553321838379, -13.724943161010742, -13.274333953857422, -12.823723793029785, -12.373113632202148, -11.922503471374512, -11.471893310546875, -11.021284103393555, -10.570673942565918, -10.120063781738281, -9.669454574584961, -9.218844413757324, -8.768234252929688, -8.31762409210205, -7.867014408111572, -7.416404724121094, -6.965794563293457, -6.51518440246582, -6.064574718475342, -5.613965034484863, -5.163354873657227, -4.71274471282959, -4.262135028839111, -3.8115251064300537, -3.360915184020996, -2.9103052616119385, -2.459695339202881, -2.0090854167938232, -1.558476448059082, -1.1078665256500244, -0.6572566032409668, -0.20664668083190918, 0.24396324157714844, 0.694573163986206, 1.1451830863952637, 1.5957930088043213, 2.046402931213379, 2.4970128536224365, 2.947622776031494, 3.3982326984405518, 3.8488426208496094, 4.299452781677246, 4.750062465667725, 5.200672149658203, 5.65128231048584, 6.101892471313477, 6.552502155303955, 7.003111839294434, 7.45372200012207, 7.904332160949707, 8.354942321777344, 8.805551528930664, 9.2561616897583, 9.706771850585938, 10.157381057739258, 10.607991218566895, 11.058601379394531, 11.509211540222168, 11.959821701049805, 12.410430908203125, 12.861041069030762]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 11.0, 19.0, 22.0, 26.0, 46.0, 83.0, 123.0, 226.0, 385.0, 703.0, 1305.0, 2775.0, 5966.0, 14075.0, 36857.0, 109745.0, 470004.0, 284189.0, 75438.0, 26602.0, 10569.0, 4651.0, 2230.0, 1048.0, 587.0, 353.0, 177.0, 108.0, 72.0, 49.0, 28.0, 16.0, 11.0, 14.0, 14.0, 7.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4453125, -1.3999176025390625, -1.354522705078125, -1.3091278076171875, -1.26373291015625, -1.2183380126953125, -1.172943115234375, -1.1275482177734375, -1.0821533203125, -1.0367584228515625, -0.991363525390625, -0.9459686279296875, -0.90057373046875, -0.8551788330078125, -0.809783935546875, -0.7643890380859375, -0.718994140625, -0.6735992431640625, -0.628204345703125, -0.5828094482421875, -0.53741455078125, -0.4920196533203125, -0.446624755859375, -0.4012298583984375, -0.3558349609375, -0.3104400634765625, -0.265045166015625, -0.2196502685546875, -0.17425537109375, -0.1288604736328125, -0.083465576171875, -0.0380706787109375, 0.00732421875, 0.0527191162109375, 0.098114013671875, 0.1435089111328125, 0.18890380859375, 0.2342987060546875, 0.279693603515625, 0.3250885009765625, 0.3704833984375, 0.4158782958984375, 0.461273193359375, 0.5066680908203125, 0.55206298828125, 0.5974578857421875, 0.642852783203125, 0.6882476806640625, 0.733642578125, 0.7790374755859375, 0.824432373046875, 0.8698272705078125, 0.91522216796875, 0.9606170654296875, 1.006011962890625, 1.0514068603515625, 1.0968017578125, 1.1421966552734375, 1.187591552734375, 1.2329864501953125, 1.27838134765625, 1.3237762451171875, 1.369171142578125, 1.4145660400390625, 1.4599609375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 5.0, 5.0, 16.0, 15.0, 11.0, 17.0, 26.0, 25.0, 33.0, 39.0, 44.0, 49.0, 62.0, 67.0, 63.0, 57.0, 59.0, 55.0, 54.0, 51.0, 45.0, 44.0, 37.0, 32.0, 19.0, 23.0, 10.0, 11.0, 11.0, 8.0, 8.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.2626953125, -1.2306671142578125, -1.198638916015625, -1.1666107177734375, -1.13458251953125, -1.1025543212890625, -1.070526123046875, -1.0384979248046875, -1.0064697265625, -0.9744415283203125, -0.942413330078125, -0.9103851318359375, -0.87835693359375, -0.8463287353515625, -0.814300537109375, -0.7822723388671875, -0.750244140625, -0.7182159423828125, -0.686187744140625, -0.6541595458984375, -0.62213134765625, -0.5901031494140625, -0.558074951171875, -0.5260467529296875, -0.4940185546875, -0.4619903564453125, -0.429962158203125, -0.3979339599609375, -0.36590576171875, -0.3338775634765625, -0.301849365234375, -0.2698211669921875, -0.23779296875, -0.2057647705078125, -0.173736572265625, -0.1417083740234375, -0.10968017578125, -0.0776519775390625, -0.045623779296875, -0.0135955810546875, 0.0184326171875, 0.0504608154296875, 0.082489013671875, 0.1145172119140625, 0.14654541015625, 0.1785736083984375, 0.210601806640625, 0.2426300048828125, 0.274658203125, 0.3066864013671875, 0.338714599609375, 0.3707427978515625, 0.40277099609375, 0.4347991943359375, 0.466827392578125, 0.4988555908203125, 0.5308837890625, 0.5629119873046875, 0.594940185546875, 0.6269683837890625, 0.65899658203125, 0.6910247802734375, 0.723052978515625, 0.7550811767578125, 0.787109375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 14.0, 14.0, 11.0, 9.0, 29.0, 31.0, 48.0, 86.0, 104.0, 193.0, 240.0, 417.0, 767.0, 1629.0, 4390.0, 17265.0, 108547.0, 838035.0, 59868.0, 10805.0, 3122.0, 1250.0, 635.0, 360.0, 223.0, 143.0, 74.0, 66.0, 44.0, 36.0, 30.0, 26.0, 11.0, 7.0, 5.0, 3.0, 3.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9521484375, -1.8878326416015625, -1.823516845703125, -1.7592010498046875, -1.69488525390625, -1.6305694580078125, -1.566253662109375, -1.5019378662109375, -1.4376220703125, -1.3733062744140625, -1.308990478515625, -1.2446746826171875, -1.18035888671875, -1.1160430908203125, -1.051727294921875, -0.9874114990234375, -0.923095703125, -0.8587799072265625, -0.794464111328125, -0.7301483154296875, -0.66583251953125, -0.6015167236328125, -0.537200927734375, -0.4728851318359375, -0.4085693359375, -0.3442535400390625, -0.279937744140625, -0.2156219482421875, -0.15130615234375, -0.0869903564453125, -0.022674560546875, 0.0416412353515625, 0.10595703125, 0.1702728271484375, 0.234588623046875, 0.2989044189453125, 0.36322021484375, 0.4275360107421875, 0.491851806640625, 0.5561676025390625, 0.6204833984375, 0.6847991943359375, 0.749114990234375, 0.8134307861328125, 0.87774658203125, 0.9420623779296875, 1.006378173828125, 1.0706939697265625, 1.135009765625, 1.1993255615234375, 1.263641357421875, 1.3279571533203125, 1.39227294921875, 1.4565887451171875, 1.520904541015625, 1.5852203369140625, 1.6495361328125, 1.7138519287109375, 1.778167724609375, 1.8424835205078125, 1.90679931640625, 1.9711151123046875, 2.035430908203125, 2.0997467041015625, 2.1640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 8.0, 6.0, 14.0, 6.0, 7.0, 9.0, 19.0, 16.0, 18.0, 19.0, 18.0, 28.0, 24.0, 22.0, 34.0, 40.0, 46.0, 52.0, 78.0, 67.0, 71.0, 58.0, 57.0, 32.0, 40.0, 29.0, 19.0, 27.0, 10.0, 20.0, 13.0, 9.0, 12.0, 10.0, 12.0, 9.0, 11.0, 7.0, 3.0, 7.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-3.1796875, -3.087432861328125, -2.99517822265625, -2.902923583984375, -2.8106689453125, -2.718414306640625, -2.62615966796875, -2.533905029296875, -2.441650390625, -2.349395751953125, -2.25714111328125, -2.164886474609375, -2.0726318359375, -1.980377197265625, -1.88812255859375, -1.795867919921875, -1.70361328125, -1.611358642578125, -1.51910400390625, -1.426849365234375, -1.3345947265625, -1.242340087890625, -1.15008544921875, -1.057830810546875, -0.965576171875, -0.873321533203125, -0.78106689453125, -0.688812255859375, -0.5965576171875, -0.504302978515625, -0.41204833984375, -0.319793701171875, -0.2275390625, -0.135284423828125, -0.04302978515625, 0.049224853515625, 0.1414794921875, 0.233734130859375, 0.32598876953125, 0.418243408203125, 0.510498046875, 0.602752685546875, 0.69500732421875, 0.787261962890625, 0.8795166015625, 0.971771240234375, 1.06402587890625, 1.156280517578125, 1.24853515625, 1.340789794921875, 1.43304443359375, 1.525299072265625, 1.6175537109375, 1.709808349609375, 1.80206298828125, 1.894317626953125, 1.986572265625, 2.078826904296875, 2.17108154296875, 2.263336181640625, 2.3555908203125, 2.447845458984375, 2.54010009765625, 2.632354736328125, 2.724609375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 8.0, 11.0, 12.0, 12.0, 18.0, 22.0, 24.0, 35.0, 43.0, 54.0, 108.0, 156.0, 266.0, 523.0, 1078.0, 2669.0, 7526.0, 29994.0, 719766.0, 247471.0, 27092.0, 7039.0, 2428.0, 955.0, 481.0, 274.0, 135.0, 97.0, 60.0, 46.0, 34.0, 31.0, 15.0, 17.0, 9.0, 9.0, 10.0, 7.0, 3.0, 2.0, 4.0, 1.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.47802734375, -0.4635276794433594, -0.44902801513671875, -0.4345283508300781, -0.4200286865234375, -0.4055290222167969, -0.39102935791015625, -0.3765296936035156, -0.362030029296875, -0.3475303649902344, -0.33303070068359375, -0.3185310363769531, -0.3040313720703125, -0.2895317077636719, -0.27503204345703125, -0.2605323791503906, -0.24603271484375, -0.23153305053710938, -0.21703338623046875, -0.20253372192382812, -0.1880340576171875, -0.17353439331054688, -0.15903472900390625, -0.14453506469726562, -0.130035400390625, -0.11553573608398438, -0.10103607177734375, -0.08653640747070312, -0.0720367431640625, -0.057537078857421875, -0.04303741455078125, -0.028537750244140625, -0.0140380859375, 0.000461578369140625, 0.01496124267578125, 0.029460906982421875, 0.0439605712890625, 0.058460235595703125, 0.07295989990234375, 0.08745956420898438, 0.101959228515625, 0.11645889282226562, 0.13095855712890625, 0.14545822143554688, 0.1599578857421875, 0.17445755004882812, 0.18895721435546875, 0.20345687866210938, 0.21795654296875, 0.23245620727539062, 0.24695587158203125, 0.2614555358886719, 0.2759552001953125, 0.2904548645019531, 0.30495452880859375, 0.3194541931152344, 0.333953857421875, 0.3484535217285156, 0.36295318603515625, 0.3774528503417969, 0.3919525146484375, 0.4064521789550781, 0.42095184326171875, 0.4354515075683594, 0.449951171875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 7.0, 12.0, 10.0, 14.0, 20.0, 18.0, 22.0, 59.0, 100.0, 149.0, 186.0, 145.0, 77.0, 43.0, 30.0, 24.0, 16.0, 12.0, 4.0, 11.0, 8.0, 1.0, 6.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00027751922607421875, -0.00026943907141685486, -0.00026135891675949097, -0.0002532787621021271, -0.0002451986074447632, -0.0002371184527873993, -0.0002290382981300354, -0.0002209581434726715, -0.00021287798881530762, -0.00020479783415794373, -0.00019671767950057983, -0.00018863752484321594, -0.00018055737018585205, -0.00017247721552848816, -0.00016439706087112427, -0.00015631690621376038, -0.00014823675155639648, -0.0001401565968990326, -0.0001320764422416687, -0.0001239962875843048, -0.00011591613292694092, -0.00010783597826957703, -9.975582361221313e-05, -9.167566895484924e-05, -8.359551429748535e-05, -7.551535964012146e-05, -6.743520498275757e-05, -5.935505032539368e-05, -5.1274895668029785e-05, -4.3194741010665894e-05, -3.5114586353302e-05, -2.703443169593811e-05, -1.895427703857422e-05, -1.0874122381210327e-05, -2.7939677238464355e-06, 5.286186933517456e-06, 1.3366341590881348e-05, 2.144649624824524e-05, 2.952665090560913e-05, 3.760680556297302e-05, 4.5686960220336914e-05, 5.3767114877700806e-05, 6.18472695350647e-05, 6.992742419242859e-05, 7.800757884979248e-05, 8.608773350715637e-05, 9.416788816452026e-05, 0.00010224804282188416, 0.00011032819747924805, 0.00011840835213661194, 0.00012648850679397583, 0.00013456866145133972, 0.0001426488161087036, 0.0001507289707660675, 0.0001588091254234314, 0.0001668892800807953, 0.00017496943473815918, 0.00018304958939552307, 0.00019112974405288696, 0.00019920989871025085, 0.00020729005336761475, 0.00021537020802497864, 0.00022345036268234253, 0.00023153051733970642, 0.0002396106719970703]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 3.0, 16.0, 25.0, 23.0, 41.0, 36.0, 42.0, 79.0, 119.0, 210.0, 291.0, 497.0, 755.0, 1265.0, 2390.0, 4719.0, 9941.0, 24780.0, 83697.0, 757233.0, 109867.0, 29464.0, 11438.0, 5209.0, 2671.0, 1458.0, 815.0, 545.0, 312.0, 198.0, 131.0, 87.0, 59.0, 35.0, 25.0, 21.0, 16.0, 10.0, 11.0, 8.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.2587890625, -0.2510833740234375, -0.243377685546875, -0.2356719970703125, -0.22796630859375, -0.2202606201171875, -0.212554931640625, -0.2048492431640625, -0.1971435546875, -0.1894378662109375, -0.181732177734375, -0.1740264892578125, -0.16632080078125, -0.1586151123046875, -0.150909423828125, -0.1432037353515625, -0.135498046875, -0.1277923583984375, -0.120086669921875, -0.1123809814453125, -0.10467529296875, -0.0969696044921875, -0.089263916015625, -0.0815582275390625, -0.0738525390625, -0.0661468505859375, -0.058441162109375, -0.0507354736328125, -0.04302978515625, -0.0353240966796875, -0.027618408203125, -0.0199127197265625, -0.01220703125, -0.0045013427734375, 0.003204345703125, 0.0109100341796875, 0.01861572265625, 0.0263214111328125, 0.034027099609375, 0.0417327880859375, 0.0494384765625, 0.0571441650390625, 0.064849853515625, 0.0725555419921875, 0.08026123046875, 0.0879669189453125, 0.095672607421875, 0.1033782958984375, 0.111083984375, 0.1187896728515625, 0.126495361328125, 0.1342010498046875, 0.14190673828125, 0.1496124267578125, 0.157318115234375, 0.1650238037109375, 0.1727294921875, 0.1804351806640625, 0.188140869140625, 0.1958465576171875, 0.20355224609375, 0.2112579345703125, 0.218963623046875, 0.2266693115234375, 0.234375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 5.0, 6.0, 3.0, 6.0, 6.0, 4.0, 10.0, 10.0, 21.0, 17.0, 40.0, 34.0, 58.0, 67.0, 106.0, 110.0, 109.0, 87.0, 87.0, 52.0, 42.0, 29.0, 18.0, 15.0, 12.0, 7.0, 6.0, 1.0, 7.0, 6.0, 7.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5185546875, -0.5045013427734375, -0.490447998046875, -0.4763946533203125, -0.46234130859375, -0.4482879638671875, -0.434234619140625, -0.4201812744140625, -0.4061279296875, -0.3920745849609375, -0.378021240234375, -0.3639678955078125, -0.34991455078125, -0.3358612060546875, -0.321807861328125, -0.3077545166015625, -0.293701171875, -0.2796478271484375, -0.265594482421875, -0.2515411376953125, -0.23748779296875, -0.2234344482421875, -0.209381103515625, -0.1953277587890625, -0.1812744140625, -0.1672210693359375, -0.153167724609375, -0.1391143798828125, -0.12506103515625, -0.1110076904296875, -0.096954345703125, -0.0829010009765625, -0.06884765625, -0.0547943115234375, -0.040740966796875, -0.0266876220703125, -0.01263427734375, 0.0014190673828125, 0.015472412109375, 0.0295257568359375, 0.0435791015625, 0.0576324462890625, 0.071685791015625, 0.0857391357421875, 0.09979248046875, 0.1138458251953125, 0.127899169921875, 0.1419525146484375, 0.156005859375, 0.1700592041015625, 0.184112548828125, 0.1981658935546875, 0.21221923828125, 0.2262725830078125, 0.240325927734375, 0.2543792724609375, 0.2684326171875, 0.2824859619140625, 0.296539306640625, 0.3105926513671875, 0.32464599609375, 0.3386993408203125, 0.352752685546875, 0.3668060302734375, 0.380859375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 12.0, 20.0, 60.0, 128.0, 627.0, 98.0, 36.0, 17.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.526641845703125, -32.52521896362305, -31.523794174194336, -30.522369384765625, -29.520946502685547, -28.519521713256836, -27.518096923828125, -26.516674041748047, -25.51525115966797, -24.513826370239258, -23.51240348815918, -22.51097869873047, -21.50955581665039, -20.50813102722168, -19.50670623779297, -18.50528335571289, -17.50385856628418, -16.50243377685547, -15.50101089477539, -14.49958610534668, -13.498163223266602, -12.49673843383789, -11.495314598083496, -10.493890762329102, -9.492466926574707, -8.491043090820312, -7.489619255065918, -6.488194942474365, -5.486771106719971, -4.485347270965576, -3.4839229583740234, -2.482499122619629, -1.4810733795166016, -0.4796494245529175, 0.5217745304107666, 1.5231986045837402, 2.5246224403381348, 3.5260462760925293, 4.527470588684082, 5.528894424438477, 6.530318260192871, 7.531742095947266, 8.53316593170166, 9.534589767456055, 10.536014556884766, 11.537437438964844, 12.538862228393555, 13.54028606414795, 14.541709899902344, 15.543133735656738, 16.544557571411133, 17.545982360839844, 18.547405242919922, 19.548830032348633, 20.550254821777344, 21.551677703857422, 22.5531005859375, 23.55452537536621, 24.55594825744629, 25.557373046875, 26.558795928955078, 27.56022071838379, 28.5616455078125, 29.563068389892578, 30.56449317932129]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 10.0, 4.0, 6.0, 9.0, 12.0, 8.0, 11.0, 22.0, 15.0, 23.0, 25.0, 27.0, 31.0, 27.0, 43.0, 238.0, 230.0, 49.0, 32.0, 24.0, 28.0, 23.0, 17.0, 16.0, 8.0, 15.0, 11.0, 2.0, 4.0, 9.0, 5.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.442407608032227, -8.129712104797363, -7.8170166015625, -7.504321098327637, -7.191625595092773, -6.87893009185791, -6.566235065460205, -6.253539562225342, -5.9408440589904785, -5.628148555755615, -5.315453052520752, -5.002757549285889, -4.690062522888184, -4.37736701965332, -4.064671516418457, -3.7519760131835938, -3.4392805099487305, -3.126585006713867, -2.813889503479004, -2.5011942386627197, -2.1884987354278564, -1.8758032321929932, -1.5631078481674194, -1.2504124641418457, -0.9377169609069824, -0.6250215172767639, -0.3123260736465454, 0.0003693699836730957, 0.3130648136138916, 0.6257603168487549, 0.9384557008743286, 1.2511510848999023, 1.563847541809082, 1.8765430450439453, 2.1892385482788086, 2.5019338130950928, 2.814629316329956, 3.1273248195648193, 3.4400200843811035, 3.752715587615967, 4.06541109085083, 4.378106594085693, 4.690802097320557, 5.00349760055542, 5.316192626953125, 5.628888130187988, 5.941583633422852, 6.254279136657715, 6.566974639892578, 6.879670143127441, 7.192365646362305, 7.505061149597168, 7.817756652832031, 8.130452156066895, 8.443147659301758, 8.755842208862305, 9.068538665771484, 9.381234169006348, 9.693929672241211, 10.006625175476074, 10.319320678710938, 10.6320161819458, 10.944711685180664, 11.257406234741211, 11.570101737976074]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 9.0, 5.0, 6.0, 10.0, 13.0, 11.0, 27.0, 28.0, 46.0, 40.0, 63.0, 126.0, 287.0, 93.0, 57.0, 51.0, 27.0, 30.0, 21.0, 18.0, 6.0, 11.0, 6.0, 5.0, 0.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1708984375, -1.133514404296875, -1.09613037109375, -1.058746337890625, -1.0213623046875, -0.983978271484375, -0.94659423828125, -0.909210205078125, -0.871826171875, -0.834442138671875, -0.79705810546875, -0.759674072265625, -0.7222900390625, -0.684906005859375, -0.64752197265625, -0.610137939453125, -0.57275390625, -0.535369873046875, -0.49798583984375, -0.460601806640625, -0.4232177734375, -0.385833740234375, -0.34844970703125, -0.311065673828125, -0.273681640625, -0.236297607421875, -0.19891357421875, -0.161529541015625, -0.1241455078125, -0.086761474609375, -0.04937744140625, -0.011993408203125, 0.025390625, 0.062774658203125, 0.10015869140625, 0.137542724609375, 0.1749267578125, 0.212310791015625, 0.24969482421875, 0.287078857421875, 0.324462890625, 0.361846923828125, 0.39923095703125, 0.436614990234375, 0.4739990234375, 0.511383056640625, 0.54876708984375, 0.586151123046875, 0.62353515625, 0.660919189453125, 0.69830322265625, 0.735687255859375, 0.7730712890625, 0.810455322265625, 0.84783935546875, 0.885223388671875, 0.922607421875, 0.959991455078125, 0.99737548828125, 1.034759521484375, 1.0721435546875, 1.109527587890625, 1.14691162109375, 1.184295654296875, 1.2216796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 3.0, 5.0, 4.0, 8.0, 11.0, 13.0, 12.0, 28.0, 31.0, 61.0, 102.0, 156.0, 349.0, 989.0, 3840.0, 36363.0, 8334536.0, 9000.0, 1898.0, 605.0, 215.0, 126.0, 84.0, 61.0, 22.0, 15.0, 6.0, 8.0, 4.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 3.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.785748481750488, -9.500036239624023, -9.214324951171875, -8.92861270904541, -8.642901420593262, -8.357189178466797, -8.071477890014648, -7.785765647888184, -7.500053882598877, -7.21434211730957, -6.928630352020264, -6.642918586730957, -6.357206344604492, -6.071495056152344, -5.785782814025879, -5.500071048736572, -5.214359283447266, -4.928647518157959, -4.642935752868652, -4.357223987579346, -4.071512222290039, -3.7858002185821533, -3.5000882148742676, -3.214376449584961, -2.9286646842956543, -2.6429529190063477, -2.357241153717041, -2.0715291500091553, -1.7858173847198486, -1.500105619430542, -1.2143937349319458, -0.9286818504333496, -0.642970085144043, -0.35725826025009155, -0.07154643535614014, 0.21416538953781128, 0.4998772144317627, 0.7855889797210693, 1.0713008642196655, 1.3570127487182617, 1.6427245140075684, 1.928436279296875, 2.2141480445861816, 2.4998600482940674, 2.785571813583374, 3.0712835788726807, 3.3569955825805664, 3.642707347869873, 3.9284191131591797, 4.214130878448486, 4.499842643737793, 4.7855544090271, 5.071266174316406, 5.356978416442871, 5.642690181732178, 5.928401947021484, 6.214113712310791, 6.499825477600098, 6.785537242889404, 7.071249008178711, 7.356961250305176, 7.642672538757324, 7.928384780883789, 8.214096069335938, 8.499808311462402]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 6.0, 6.0, 2.0, 4.0, 8.0, 8.0, 2.0, 4.0, 4.0, 5.0, 9.0, 5.0, 3.0, 6.0, 2.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.060517311096191, -8.824185371398926, -8.58785343170166, -8.351521492004395, -8.115188598632812, -7.878857135772705, -7.642524719238281, -7.406192779541016, -7.16986083984375, -6.933528900146484, -6.697196960449219, -6.460864543914795, -6.224532604217529, -5.988200664520264, -5.75186824798584, -5.515536308288574, -5.279204368591309, -5.042872428894043, -4.806540489196777, -4.5702080726623535, -4.333876132965088, -4.097544193267822, -3.8612120151519775, -3.624879837036133, -3.388547897338867, -3.1522159576416016, -2.915883779525757, -2.679551601409912, -2.4432196617126465, -2.206887722015381, -1.9705555438995361, -1.734223484992981, -1.497891902923584, -1.2615598440170288, -1.0252277851104736, -0.7888957262039185, -0.5525636672973633, -0.3162316083908081, -0.07989954948425293, 0.15643250942230225, 0.3927645683288574, 0.6290966272354126, 0.8654286861419678, 1.101760745048523, 1.3380928039550781, 1.5744248628616333, 1.8107569217681885, 2.047089099884033, 2.283421039581299, 2.5197529792785645, 2.756085157394409, 2.992417335510254, 3.2287492752075195, 3.465081214904785, 3.70141339302063, 3.9377455711364746, 4.17407751083374, 4.410409450531006, 4.64674186706543, 4.883073806762695, 5.119405746459961, 5.355737686157227, 5.592069625854492, 5.828402042388916, 6.064733982086182]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 8.0, 11.0, 14.0, 11.0, 21.0, 41.0, 46.0, 64.0, 106.0, 153.0, 289.0, 652.0, 1545.0, 4948.0, 18767.0, 85491.0, 268832.0, 109989.0, 23745.0, 6111.0, 1860.0, 733.0, 352.0, 185.0, 117.0, 68.0, 39.0, 28.0, 15.0, 5.0, 7.0, 4.0, 9.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.0859375, -10.7828369140625, -10.479736328125, -10.1766357421875, -9.87353515625, -9.5704345703125, -9.267333984375, -8.9642333984375, -8.6611328125, -8.3580322265625, -8.054931640625, -7.7518310546875, -7.44873046875, -7.1456298828125, -6.842529296875, -6.5394287109375, -6.236328125, -5.9332275390625, -5.630126953125, -5.3270263671875, -5.02392578125, -4.7208251953125, -4.417724609375, -4.1146240234375, -3.8115234375, -3.5084228515625, -3.205322265625, -2.9022216796875, -2.59912109375, -2.2960205078125, -1.992919921875, -1.6898193359375, -1.38671875, -1.0836181640625, -0.780517578125, -0.4774169921875, -0.17431640625, 0.1287841796875, 0.431884765625, 0.7349853515625, 1.0380859375, 1.3411865234375, 1.644287109375, 1.9473876953125, 2.25048828125, 2.5535888671875, 2.856689453125, 3.1597900390625, 3.462890625, 3.7659912109375, 4.069091796875, 4.3721923828125, 4.67529296875, 4.9783935546875, 5.281494140625, 5.5845947265625, 5.8876953125, 6.1907958984375, 6.493896484375, 6.7969970703125, 7.10009765625, 7.4031982421875, 7.706298828125, 8.0093994140625, 8.3125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 5.0, 11.0, 13.0, 24.0, 24.0, 25.0, 32.0, 57.0, 47.0, 69.0, 68.0, 75.0, 80.0, 74.0, 79.0, 67.0, 46.0, 51.0, 31.0, 24.0, 23.0, 21.0, 14.0, 8.0, 8.0, 6.0, 7.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3447265625, -1.3103790283203125, -1.276031494140625, -1.2416839599609375, -1.20733642578125, -1.1729888916015625, -1.138641357421875, -1.1042938232421875, -1.0699462890625, -1.0355987548828125, -1.001251220703125, -0.9669036865234375, -0.93255615234375, -0.8982086181640625, -0.863861083984375, -0.8295135498046875, -0.795166015625, -0.7608184814453125, -0.726470947265625, -0.6921234130859375, -0.65777587890625, -0.6234283447265625, -0.589080810546875, -0.5547332763671875, -0.5203857421875, -0.4860382080078125, -0.451690673828125, -0.4173431396484375, -0.38299560546875, -0.3486480712890625, -0.314300537109375, -0.2799530029296875, -0.24560546875, -0.2112579345703125, -0.176910400390625, -0.1425628662109375, -0.10821533203125, -0.0738677978515625, -0.039520263671875, -0.0051727294921875, 0.0291748046875, 0.0635223388671875, 0.097869873046875, 0.1322174072265625, 0.16656494140625, 0.2009124755859375, 0.235260009765625, 0.2696075439453125, 0.303955078125, 0.3383026123046875, 0.372650146484375, 0.4069976806640625, 0.44134521484375, 0.4756927490234375, 0.510040283203125, 0.5443878173828125, 0.5787353515625, 0.6130828857421875, 0.647430419921875, 0.6817779541015625, 0.71612548828125, 0.7504730224609375, 0.784820556640625, 0.8191680908203125, 0.853515625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 5.0, 10.0, 11.0, 19.0, 29.0, 55.0, 82.0, 105.0, 71.0, 43.0, 16.0, 11.0, 10.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.611623764038086, -11.331544876098633, -11.051466941833496, -10.771388053894043, -10.491310119628906, -10.211231231689453, -9.931153297424316, -9.651074409484863, -9.370996475219727, -9.090917587280273, -8.810839653015137, -8.530760765075684, -8.250682830810547, -7.970603942871094, -7.690525531768799, -7.410447120666504, -7.130368232727051, -6.850289821624756, -6.570211410522461, -6.290132999420166, -6.010054588317871, -5.729975700378418, -5.449897289276123, -5.169818878173828, -4.889740467071533, -4.609662055969238, -4.329583644866943, -4.049505233764648, -3.7694265842437744, -3.4893481731414795, -3.2092695236206055, -2.9291911125183105, -2.649113655090332, -2.369035243988037, -2.088956832885742, -1.8088781833648682, -1.5287997722625732, -1.2487213611602783, -0.9686428308486938, -0.6885643005371094, -0.40848588943481445, -0.12840741872787476, 0.15167105197906494, 0.43174952268600464, 0.7118279933929443, 0.9919064044952393, 1.2719849348068237, 1.5520634651184082, 1.8321418762207031, 2.112220287322998, 2.392298698425293, 2.672377347946167, 2.952455759048462, 3.232534170150757, 3.512612819671631, 3.792691230773926, 4.072769641876221, 4.352848052978516, 4.6329264640808105, 4.9130048751831055, 5.193083763122559, 5.473161697387695, 5.753240585327148, 6.033318996429443, 6.313397407531738]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 7.0, 16.0, 13.0, 29.0, 53.0, 92.0, 93.0, 70.0, 34.0, 20.0, 10.0, 10.0, 4.0, 5.0, 2.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.147286891937256, -4.965672969818115, -4.784059047698975, -4.602445125579834, -4.420830726623535, -4.2392168045043945, -4.057602882385254, -3.8759889602661133, -3.6943750381469727, -3.512761116027832, -3.3311471939086914, -3.1495330333709717, -2.967919111251831, -2.7863051891326904, -2.6046910285949707, -2.42307710647583, -2.2414631843566895, -2.059849262237549, -1.8782352209091187, -1.6966211795806885, -1.5150072574615479, -1.3333933353424072, -1.151779294013977, -0.9701652526855469, -0.7885513305664062, -0.6069373488426208, -0.42532336711883545, -0.24370938539505005, -0.06209540367126465, 0.11951857805252075, 0.30113255977630615, 0.48274660110473633, 0.6643600463867188, 0.8459740281105042, 1.0275880098342896, 1.2092020511627197, 1.3908159732818604, 1.572429895401001, 1.7540439367294312, 1.9356579780578613, 2.117271900177002, 2.2988858222961426, 2.480499744415283, 2.662113904953003, 2.8437278270721436, 3.025341749191284, 3.206955909729004, 3.3885698318481445, 3.570183753967285, 3.751797676086426, 3.9334115982055664, 4.115025520324707, 4.296639442443848, 4.4782538414001465, 4.659867763519287, 4.841481685638428, 5.023095607757568, 5.204709529876709, 5.38632345199585, 5.56793737411499, 5.749551773071289, 5.93116569519043, 6.11277961730957, 6.294393539428711, 6.476007461547852]}, "eval/loss": 4.160531044006348, "eval/wer": 2.4565450218167393, "eval/runtime": 1155.2061, "eval/samples_per_second": 2.287, "eval/steps_per_second": 0.287, "train/train_runtime": 8769.6328, "train/train_samples_per_second": 3.254, "train/train_steps_per_second": 0.203, "train/total_flos": 0.0, "train/train_loss": 4.241978131735806, "_wandb": {"runtime": 10188}} \ No newline at end of file